diff --git "a/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" "b/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" --- "a/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" +++ "b/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.4211, "train/learning_rate": 5.805515239477504e-08, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 6756, "_timestamp": 1646072785, "_step": 1191, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 199.0, 773.0, 38.0, 3.0], "bins": [-638.4752197265625, -628.0576171875, -617.6399536132812, -607.2223510742188, -596.8046875, -586.3870849609375, -575.969482421875, -565.5518188476562, -555.1342163085938, -544.7166137695312, -534.2989501953125, -523.88134765625, -513.4636840820312, -503.04608154296875, -492.6284484863281, -482.2108154296875, -471.7931823730469, -461.37554931640625, -450.9579162597656, -440.5403137207031, -430.1226806640625, -419.7050476074219, -409.28741455078125, -398.8697814941406, -388.4521484375, -378.0345153808594, -367.61688232421875, -357.19927978515625, -346.7816467285156, -336.364013671875, -325.9463806152344, -315.52874755859375, -305.1111145019531, -294.6934814453125, -284.2758483886719, -273.8582458496094, -263.44061279296875, -253.02297973632812, -242.6053466796875, -232.18771362304688, -221.77011108398438, -211.35247802734375, -200.9348602294922, -190.51722717285156, -180.099609375, -169.68197631835938, -159.26434326171875, -148.84671020507812, -138.42909240722656, -128.01145935058594, -117.59384155273438, -107.17620849609375, -96.75858306884766, -86.34095764160156, -75.92332458496094, -65.50569915771484, -55.08807373046875, -44.670448303222656, -34.2528190612793, -23.83519172668457, -13.417564392089844, -2.99993896484375, 7.417690277099609, 17.83531951904297, 28.252946853637695]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 7.0, 4.0, 3.0, 2.0, 12.0, 7.0, 9.0, 10.0, 13.0, 26.0, 23.0, 22.0, 24.0, 29.0, 36.0, 37.0, 45.0, 33.0, 39.0, 37.0, 61.0, 51.0, 50.0, 48.0, 51.0, 46.0, 37.0, 24.0, 35.0, 21.0, 27.0, 20.0, 19.0, 14.0, 16.0, 12.0, 13.0, 11.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.6351318359375, -54.82221984863281, -53.009307861328125, -51.19639587402344, -49.383480072021484, -47.5705680847168, -45.75765609741211, -43.94474411010742, -42.13182830810547, -40.31891632080078, -38.506004333496094, -36.693092346191406, -34.88017654418945, -33.067264556884766, -31.254352569580078, -29.44144058227539, -27.628528594970703, -25.815616607666016, -24.002702713012695, -22.189790725708008, -20.376876831054688, -18.56396484375, -16.751052856445312, -14.938139915466309, -13.125226974487305, -11.3123140335083, -9.499401092529297, -7.686489105224609, -5.8735761642456055, -4.060663223266602, -2.247751235961914, -0.43483829498291016, 1.3780746459960938, 3.1909873485565186, 5.003900051116943, 6.816812515258789, 8.629725456237793, 10.442638397216797, 12.255550384521484, 14.068463325500488, 15.881376266479492, 17.69428825378418, 19.5072021484375, 21.320114135742188, 23.133026123046875, 24.945940017700195, 26.758852005004883, 28.571765899658203, 30.38467788696289, 32.19758987426758, 34.010501861572266, 35.82341766357422, 37.636329650878906, 39.449241638183594, 41.26215362548828, 43.07506561279297, 44.887977600097656, 46.700889587402344, 48.51380157470703, 50.32671356201172, 52.13962936401367, 53.95254135131836, 55.76545333862305, 57.578365325927734, 59.39128112792969]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 10.0, 12.0, 20.0, 15.0, 32.0, 45.0, 51.0, 46.0, 68.0, 78.0, 72.0, 86.0, 83.0, 89.0, 75.0, 51.0, 40.0, 31.0, 32.0, 19.0, 12.0, 10.0, 11.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.62652587890625, -9.3936767578125, -9.16082763671875, -8.927978515625, -8.69512939453125, -8.4622802734375, -8.22943115234375, -7.99658203125, -7.76373291015625, -7.5308837890625, -7.29803466796875, -7.065185546875, -6.83233642578125, -6.5994873046875, -6.36663818359375, -6.1337890625, -5.90093994140625, -5.6680908203125, -5.43524169921875, -5.202392578125, -4.96954345703125, -4.7366943359375, -4.50384521484375, -4.27099609375, -4.03814697265625, -3.8052978515625, -3.57244873046875, -3.339599609375, -3.10675048828125, -2.8739013671875, -2.64105224609375, -2.408203125, -2.17535400390625, -1.9425048828125, -1.70965576171875, -1.476806640625, -1.24395751953125, -1.0111083984375, -0.77825927734375, -0.54541015625, -0.31256103515625, -0.0797119140625, 0.15313720703125, 0.385986328125, 0.61883544921875, 0.8516845703125, 1.08453369140625, 1.3173828125, 1.55023193359375, 1.7830810546875, 2.01593017578125, 2.248779296875, 2.48162841796875, 2.7144775390625, 2.94732666015625, 3.18017578125, 3.41302490234375, 3.6458740234375, 3.87872314453125, 4.111572265625, 4.34442138671875, 4.5772705078125, 4.81011962890625, 5.04296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4.0, 8.0, 11.0, 13.0, 29.0, 34.0, 72.0, 89.0, 139.0, 212.0, 396.0, 735.0, 1454.0, 3154.0, 9650.0, 51280.0, 1266920.0, 2726149.0, 110410.0, 15390.0, 4333.0, 1812.0, 835.0, 446.0, 255.0, 145.0, 110.0, 66.0, 56.0, 31.0, 17.0, 14.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.0, -21.4381103515625, -20.876220703125, -20.3143310546875, -19.75244140625, -19.1905517578125, -18.628662109375, -18.0667724609375, -17.5048828125, -16.9429931640625, -16.381103515625, -15.8192138671875, -15.25732421875, -14.6954345703125, -14.133544921875, -13.5716552734375, -13.009765625, -12.4478759765625, -11.885986328125, -11.3240966796875, -10.76220703125, -10.2003173828125, -9.638427734375, -9.0765380859375, -8.5146484375, -7.9527587890625, -7.390869140625, -6.8289794921875, -6.26708984375, -5.7052001953125, -5.143310546875, -4.5814208984375, -4.01953125, -3.4576416015625, -2.895751953125, -2.3338623046875, -1.77197265625, -1.2100830078125, -0.648193359375, -0.0863037109375, 0.4755859375, 1.0374755859375, 1.599365234375, 2.1612548828125, 2.72314453125, 3.2850341796875, 3.846923828125, 4.4088134765625, 4.970703125, 5.5325927734375, 6.094482421875, 6.6563720703125, 7.21826171875, 7.7801513671875, 8.342041015625, 8.9039306640625, 9.4658203125, 10.0277099609375, 10.589599609375, 11.1514892578125, 11.71337890625, 12.2752685546875, 12.837158203125, 13.3990478515625, 13.9609375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 10.0, 13.0, 11.0, 32.0, 53.0, 49.0, 112.0, 172.0, 272.0, 472.0, 830.0, 815.0, 513.0, 268.0, 172.0, 85.0, 60.0, 42.0, 24.0, 20.0, 11.0, 11.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.671875, -27.97314453125, -27.2744140625, -26.57568359375, -25.876953125, -25.17822265625, -24.4794921875, -23.78076171875, -23.08203125, -22.38330078125, -21.6845703125, -20.98583984375, -20.287109375, -19.58837890625, -18.8896484375, -18.19091796875, -17.4921875, -16.79345703125, -16.0947265625, -15.39599609375, -14.697265625, -13.99853515625, -13.2998046875, -12.60107421875, -11.90234375, -11.20361328125, -10.5048828125, -9.80615234375, -9.107421875, -8.40869140625, -7.7099609375, -7.01123046875, -6.3125, -5.61376953125, -4.9150390625, -4.21630859375, -3.517578125, -2.81884765625, -2.1201171875, -1.42138671875, -0.72265625, -0.02392578125, 0.6748046875, 1.37353515625, 2.072265625, 2.77099609375, 3.4697265625, 4.16845703125, 4.8671875, 5.56591796875, 6.2646484375, 6.96337890625, 7.662109375, 8.36083984375, 9.0595703125, 9.75830078125, 10.45703125, 11.15576171875, 11.8544921875, 12.55322265625, 13.251953125, 13.95068359375, 14.6494140625, 15.34814453125, 16.046875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 13.0, 24.0, 31.0, 84.0, 145.0, 272.0, 602.0, 1688.0, 19694.0, 4153828.0, 15221.0, 1551.0, 584.0, 232.0, 132.0, 58.0, 40.0, 22.0, 19.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -84.2548828125, -81.072265625, -77.8896484375, -74.70703125, -71.5244140625, -68.341796875, -65.1591796875, -61.9765625, -58.7939453125, -55.611328125, -52.4287109375, -49.24609375, -46.0634765625, -42.880859375, -39.6982421875, -36.515625, -33.3330078125, -30.150390625, -26.9677734375, -23.78515625, -20.6025390625, -17.419921875, -14.2373046875, -11.0546875, -7.8720703125, -4.689453125, -1.5068359375, 1.67578125, 4.8583984375, 8.041015625, 11.2236328125, 14.40625, 17.5888671875, 20.771484375, 23.9541015625, 27.13671875, 30.3193359375, 33.501953125, 36.6845703125, 39.8671875, 43.0498046875, 46.232421875, 49.4150390625, 52.59765625, 55.7802734375, 58.962890625, 62.1455078125, 65.328125, 68.5107421875, 71.693359375, 74.8759765625, 78.05859375, 81.2412109375, 84.423828125, 87.6064453125, 90.7890625, 93.9716796875, 97.154296875, 100.3369140625, 103.51953125, 106.7021484375, 109.884765625, 113.0673828125, 116.25]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 106.0, 600.0, 285.0, 12.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.01038360595703, -31.39297103881836, -24.775558471679688, -18.15814781188965, -11.540735244750977, -4.9233245849609375, 1.6940879821777344, 8.311500549316406, 14.928913116455078, 21.54632568359375, 28.163738250732422, 34.781150817871094, 41.3985595703125, 48.01597213745117, 54.633384704589844, 61.250797271728516, 67.86820983886719, 74.4856185913086, 81.10303497314453, 87.72044372558594, 94.33786010742188, 100.95526885986328, 107.57267761230469, 114.19009399414062, 120.80751037597656, 127.42491912841797, 134.04232788085938, 140.6597442626953, 147.27716064453125, 153.89456176757812, 160.51197814941406, 167.12939453125, 173.74681091308594, 180.36422729492188, 186.98162841796875, 193.5990447998047, 200.21646118164062, 206.8338623046875, 213.45127868652344, 220.06869506835938, 226.6861114501953, 233.30352783203125, 239.92092895507812, 246.53834533691406, 253.15576171875, 259.7731628417969, 266.3905944824219, 273.00799560546875, 279.6253967285156, 286.2427978515625, 292.8602294921875, 299.4776306152344, 306.09503173828125, 312.71246337890625, 319.3298645019531, 325.947265625, 332.564697265625, 339.1820983886719, 345.7995300292969, 352.41693115234375, 359.0343322753906, 365.6517639160156, 372.2691650390625, 378.8865966796875, 385.5039978027344]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 2.0, 14.0, 16.0, 19.0, 20.0, 30.0, 27.0, 46.0, 38.0, 48.0, 50.0, 57.0, 59.0, 63.0, 59.0, 51.0, 66.0, 49.0, 45.0, 47.0, 40.0, 28.0, 24.0, 19.0, 17.0, 19.0, 6.0, 7.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.2113037109375, -70.05340576171875, -67.8955078125, -65.73760986328125, -63.579708099365234, -61.421810150146484, -59.26390838623047, -57.10601043701172, -54.94811248779297, -52.79021453857422, -50.63231658935547, -48.47441482543945, -46.3165168762207, -44.15861892700195, -42.00071716308594, -39.84281921386719, -37.68492126464844, -35.52702331542969, -33.36912536621094, -31.211223602294922, -29.053325653076172, -26.895427703857422, -24.73752784729004, -22.579627990722656, -20.421730041503906, -18.263832092285156, -16.105932235717773, -13.948033332824707, -11.79013442993164, -9.632235527038574, -7.474336624145508, -5.316437721252441, -3.158538818359375, -1.0006399154663086, 1.1572589874267578, 3.315157890319824, 5.473056793212891, 7.630955696105957, 9.788854598999023, 11.94675350189209, 14.104652404785156, 16.262550354003906, 18.42045021057129, 20.578350067138672, 22.736248016357422, 24.894145965576172, 27.052045822143555, 29.209945678710938, 31.367843627929688, 33.52574157714844, 35.68363952636719, 37.8415412902832, 39.99943923950195, 42.1573371887207, 44.31523895263672, 46.47313690185547, 48.63103485107422, 50.78893280029297, 52.94683074951172, 55.104732513427734, 57.262630462646484, 59.420528411865234, 61.57843017578125, 63.736328125, 65.89422607421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 16.0, 18.0, 17.0, 15.0, 31.0, 17.0, 24.0, 36.0, 34.0, 33.0, 48.0, 50.0, 50.0, 55.0, 52.0, 62.0, 58.0, 47.0, 54.0, 30.0, 44.0, 33.0, 31.0, 20.0, 15.0, 13.0, 17.0, 11.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.29296875, -6.13153076171875, -5.9700927734375, -5.80865478515625, -5.647216796875, -5.48577880859375, -5.3243408203125, -5.16290283203125, -5.00146484375, -4.84002685546875, -4.6785888671875, -4.51715087890625, -4.355712890625, -4.19427490234375, -4.0328369140625, -3.87139892578125, -3.7099609375, -3.54852294921875, -3.3870849609375, -3.22564697265625, -3.064208984375, -2.90277099609375, -2.7413330078125, -2.57989501953125, -2.41845703125, -2.25701904296875, -2.0955810546875, -1.93414306640625, -1.772705078125, -1.61126708984375, -1.4498291015625, -1.28839111328125, -1.126953125, -0.96551513671875, -0.8040771484375, -0.64263916015625, -0.481201171875, -0.31976318359375, -0.1583251953125, 0.00311279296875, 0.16455078125, 0.32598876953125, 0.4874267578125, 0.64886474609375, 0.810302734375, 0.97174072265625, 1.1331787109375, 1.29461669921875, 1.4560546875, 1.61749267578125, 1.7789306640625, 1.94036865234375, 2.101806640625, 2.26324462890625, 2.4246826171875, 2.58612060546875, 2.74755859375, 2.90899658203125, 3.0704345703125, 3.23187255859375, 3.393310546875, 3.55474853515625, 3.7161865234375, 3.87762451171875, 4.0390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 8.0, 13.0, 17.0, 22.0, 35.0, 42.0, 89.0, 102.0, 183.0, 302.0, 449.0, 704.0, 1127.0, 1783.0, 2727.0, 4546.0, 7419.0, 11690.0, 19468.0, 33639.0, 58963.0, 111802.0, 223293.0, 266057.0, 135739.0, 70513.0, 39252.0, 22660.0, 13811.0, 8325.0, 5118.0, 3155.0, 2007.0, 1254.0, 777.0, 550.0, 304.0, 215.0, 133.0, 87.0, 52.0, 37.0, 28.0, 10.0, 7.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 4.0], "bins": [-0.7763671875, -0.7522125244140625, -0.728057861328125, -0.7039031982421875, -0.67974853515625, -0.6555938720703125, -0.631439208984375, -0.6072845458984375, -0.5831298828125, -0.5589752197265625, -0.534820556640625, -0.5106658935546875, -0.48651123046875, -0.4623565673828125, -0.438201904296875, -0.4140472412109375, -0.389892578125, -0.3657379150390625, -0.341583251953125, -0.3174285888671875, -0.29327392578125, -0.2691192626953125, -0.244964599609375, -0.2208099365234375, -0.1966552734375, -0.1725006103515625, -0.148345947265625, -0.1241912841796875, -0.10003662109375, -0.0758819580078125, -0.051727294921875, -0.0275726318359375, -0.00341796875, 0.0207366943359375, 0.044891357421875, 0.0690460205078125, 0.09320068359375, 0.1173553466796875, 0.141510009765625, 0.1656646728515625, 0.1898193359375, 0.2139739990234375, 0.238128662109375, 0.2622833251953125, 0.28643798828125, 0.3105926513671875, 0.334747314453125, 0.3589019775390625, 0.383056640625, 0.4072113037109375, 0.431365966796875, 0.4555206298828125, 0.47967529296875, 0.5038299560546875, 0.527984619140625, 0.5521392822265625, 0.5762939453125, 0.6004486083984375, 0.624603271484375, 0.6487579345703125, 0.67291259765625, 0.6970672607421875, 0.721221923828125, 0.7453765869140625, 0.76953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 9.0, 10.0, 16.0, 18.0, 27.0, 23.0, 26.0, 26.0, 26.0, 27.0, 32.0, 36.0, 51.0, 36.0, 42.0, 42.0, 1063.0, 38.0, 38.0, 47.0, 41.0, 31.0, 43.0, 26.0, 35.0, 32.0, 23.0, 20.0, 14.0, 17.0, 12.0, 12.0, 15.0, 9.0, 11.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.446624755859375, -2.36199951171875, -2.277374267578125, -2.1927490234375, -2.108123779296875, -2.02349853515625, -1.938873291015625, -1.854248046875, -1.769622802734375, -1.68499755859375, -1.600372314453125, -1.5157470703125, -1.431121826171875, -1.34649658203125, -1.261871337890625, -1.17724609375, -1.092620849609375, -1.00799560546875, -0.923370361328125, -0.8387451171875, -0.754119873046875, -0.66949462890625, -0.584869384765625, -0.500244140625, -0.415618896484375, -0.33099365234375, -0.246368408203125, -0.1617431640625, -0.077117919921875, 0.00750732421875, 0.092132568359375, 0.1767578125, 0.261383056640625, 0.34600830078125, 0.430633544921875, 0.5152587890625, 0.599884033203125, 0.68450927734375, 0.769134521484375, 0.853759765625, 0.938385009765625, 1.02301025390625, 1.107635498046875, 1.1922607421875, 1.276885986328125, 1.36151123046875, 1.446136474609375, 1.53076171875, 1.615386962890625, 1.70001220703125, 1.784637451171875, 1.8692626953125, 1.953887939453125, 2.03851318359375, 2.123138427734375, 2.207763671875, 2.292388916015625, 2.37701416015625, 2.461639404296875, 2.5462646484375, 2.630889892578125, 2.71551513671875, 2.800140380859375, 2.884765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 14.0, 19.0, 26.0, 45.0, 60.0, 67.0, 143.0, 166.0, 315.0, 353.0, 595.0, 886.0, 1324.0, 1876.0, 2637.0, 3929.0, 5793.0, 8424.0, 12820.0, 18899.0, 28910.0, 44685.0, 71852.0, 116453.0, 200355.0, 1249274.0, 119444.0, 73563.0, 45799.0, 29574.0, 19114.0, 12771.0, 8515.0, 5815.0, 3943.0, 2773.0, 1862.0, 1309.0, 882.0, 584.0, 413.0, 287.0, 181.0, 118.0, 74.0, 65.0, 29.0, 32.0, 22.0, 11.0, 13.0, 8.0, 1.0, 4.0, 3.0, 2.0], "bins": [-0.56787109375, -0.5506744384765625, -0.533477783203125, -0.5162811279296875, -0.49908447265625, -0.4818878173828125, -0.464691162109375, -0.4474945068359375, -0.4302978515625, -0.4131011962890625, -0.395904541015625, -0.3787078857421875, -0.36151123046875, -0.3443145751953125, -0.327117919921875, -0.3099212646484375, -0.292724609375, -0.2755279541015625, -0.258331298828125, -0.2411346435546875, -0.22393798828125, -0.2067413330078125, -0.189544677734375, -0.1723480224609375, -0.1551513671875, -0.1379547119140625, -0.120758056640625, -0.1035614013671875, -0.08636474609375, -0.0691680908203125, -0.051971435546875, -0.0347747802734375, -0.017578125, -0.0003814697265625, 0.016815185546875, 0.0340118408203125, 0.05120849609375, 0.0684051513671875, 0.085601806640625, 0.1027984619140625, 0.1199951171875, 0.1371917724609375, 0.154388427734375, 0.1715850830078125, 0.18878173828125, 0.2059783935546875, 0.223175048828125, 0.2403717041015625, 0.257568359375, 0.2747650146484375, 0.291961669921875, 0.3091583251953125, 0.32635498046875, 0.3435516357421875, 0.360748291015625, 0.3779449462890625, 0.3951416015625, 0.4123382568359375, 0.429534912109375, 0.4467315673828125, 0.46392822265625, 0.4811248779296875, 0.498321533203125, 0.5155181884765625, 0.53271484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 2.0, 7.0, 9.0, 17.0, 16.0, 19.0, 22.0, 30.0, 41.0, 45.0, 47.0, 55.0, 71.0, 59.0, 62.0, 59.0, 76.0, 51.0, 52.0, 43.0, 27.0, 47.0, 26.0, 22.0, 16.0, 11.0, 14.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002894401550292969, -0.0002780109643936157, -0.00026658177375793457, -0.0002551525831222534, -0.00024372339248657227, -0.0002322942018508911, -0.00022086501121520996, -0.0002094358205795288, -0.00019800662994384766, -0.0001865774393081665, -0.00017514824867248535, -0.0001637190580368042, -0.00015228986740112305, -0.0001408606767654419, -0.00012943148612976074, -0.00011800229549407959, -0.00010657310485839844, -9.514391422271729e-05, -8.371472358703613e-05, -7.228553295135498e-05, -6.085634231567383e-05, -4.9427151679992676e-05, -3.7997961044311523e-05, -2.656877040863037e-05, -1.5139579772949219e-05, -3.7103891372680664e-06, 7.718801498413086e-06, 1.9147992134094238e-05, 3.057718276977539e-05, 4.200637340545654e-05, 5.3435564041137695e-05, 6.486475467681885e-05, 7.62939453125e-05, 8.772313594818115e-05, 9.91523265838623e-05, 0.00011058151721954346, 0.00012201070785522461, 0.00013343989849090576, 0.00014486908912658691, 0.00015629827976226807, 0.00016772747039794922, 0.00017915666103363037, 0.00019058585166931152, 0.00020201504230499268, 0.00021344423294067383, 0.00022487342357635498, 0.00023630261421203613, 0.0002477318048477173, 0.00025916099548339844, 0.0002705901861190796, 0.00028201937675476074, 0.0002934485673904419, 0.00030487775802612305, 0.0003163069486618042, 0.00032773613929748535, 0.0003391653299331665, 0.00035059452056884766, 0.0003620237112045288, 0.00037345290184020996, 0.0003848820924758911, 0.00039631128311157227, 0.0004077404737472534, 0.00041916966438293457, 0.0004305988550186157, 0.0004420280456542969]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 7.0, 6.0, 7.0, 12.0, 11.0, 23.0, 38.0, 45.0, 41.0, 73.0, 98.0, 144.0, 191.0, 244.0, 378.0, 696.0, 3017.0, 1039662.0, 1912.0, 616.0, 389.0, 241.0, 184.0, 125.0, 92.0, 75.0, 43.0, 57.0, 29.0, 18.0, 22.0, 8.0, 5.0, 10.0, 5.0, 10.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.00812530517578125, -0.00788944959640503, -0.007653594017028809, -0.007417738437652588, -0.007181882858276367, -0.0069460272789001465, -0.006710171699523926, -0.006474316120147705, -0.006238460540771484, -0.006002604961395264, -0.005766749382019043, -0.005530893802642822, -0.0052950382232666016, -0.005059182643890381, -0.00482332706451416, -0.0045874714851379395, -0.004351615905761719, -0.004115760326385498, -0.0038799047470092773, -0.0036440491676330566, -0.003408193588256836, -0.0031723380088806152, -0.0029364824295043945, -0.002700626850128174, -0.002464771270751953, -0.0022289156913757324, -0.0019930601119995117, -0.001757204532623291, -0.0015213489532470703, -0.0012854933738708496, -0.001049637794494629, -0.0008137822151184082, -0.0005779266357421875, -0.0003420710563659668, -0.0001062154769897461, 0.0001296401023864746, 0.0003654956817626953, 0.000601351261138916, 0.0008372068405151367, 0.0010730624198913574, 0.0013089179992675781, 0.0015447735786437988, 0.0017806291580200195, 0.0020164847373962402, 0.002252340316772461, 0.0024881958961486816, 0.0027240514755249023, 0.002959907054901123, 0.0031957626342773438, 0.0034316182136535645, 0.003667473793029785, 0.003903329372406006, 0.0041391849517822266, 0.004375040531158447, 0.004610896110534668, 0.004846751689910889, 0.005082607269287109, 0.00531846284866333, 0.005554318428039551, 0.0057901740074157715, 0.006026029586791992, 0.006261885166168213, 0.006497740745544434, 0.006733596324920654, 0.006969451904296875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 374.0, 640.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027660042978823185, -0.0027096248231828213, -0.002653245348483324, -0.002596865873783827, -0.002540486166253686, -0.0024841066915541887, -0.0024277272168546915, -0.0023713477421551943, -0.002314968267455697, -0.0022585887927562, -0.0022022093180567026, -0.0021458298433572054, -0.0020894501358270645, -0.0020330706611275673, -0.00197669118642807, -0.0019203117117285728, -0.0018639322370290756, -0.0018075527623295784, -0.0017511731712147593, -0.0016947936965152621, -0.001638414221815765, -0.0015820346307009459, -0.0015256551560014486, -0.0014692756813019514, -0.0014128960901871324, -0.0013565166154876351, -0.001300137024372816, -0.0012437575496733189, -0.0011873780749738216, -0.0011309986002743244, -0.0010746190091595054, -0.0010182395344600081, -0.0009618600597605109, -0.0009054805268533528, -0.0008491010521538556, -0.0007927215192466974, -0.0007363420445472002, -0.0006799625116400421, -0.0006235829787328839, -0.0005672035040333867, -0.0005108240293338895, -0.0004544445255305618, -0.0003980650217272341, -0.000341685488820076, -0.00028530601412057877, -0.00022892648121342063, -0.00017254697741009295, -0.00011616747360676527, -5.9787940699607134e-05, -3.408433258300647e-06, 5.297107418300584e-05, 0.00010935058526229113, 0.0001657300890656188, 0.00022210960742086172, 0.0002784891112241894, 0.0003348686150275171, 0.00039124811883084476, 0.00044762762263417244, 0.0005040071555413306, 0.0005603866302408278, 0.0006167661631479859, 0.0006731456378474832, 0.0007295251707546413, 0.0007859047036617994, 0.0008422841783612967]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 4.0, 8.0, 10.0, 7.0, 10.0, 11.0, 12.0, 10.0, 23.0, 9.0, 33.0, 21.0, 21.0, 39.0, 20.0, 48.0, 28.0, 32.0, 35.0, 42.0, 37.0, 52.0, 41.0, 32.0, 34.0, 35.0, 36.0, 28.0, 31.0, 28.0, 24.0, 30.0, 24.0, 24.0, 13.0, 21.0, 21.0, 13.0, 15.0, 6.0, 9.0, 4.0, 5.0, 5.0, 3.0, 7.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018829107284545898, -0.00018277112394571304, -0.0001772511750459671, -0.00017173122614622116, -0.00016621127724647522, -0.00016069132834672928, -0.00015517137944698334, -0.0001496514305472374, -0.00014413148164749146, -0.00013861153274774551, -0.00013309158384799957, -0.00012757163494825363, -0.00012205168604850769, -0.00011653173714876175, -0.00011101178824901581, -0.00010549183934926987, -9.997189044952393e-05, -9.445194154977798e-05, -8.893199265003204e-05, -8.34120437502861e-05, -7.789209485054016e-05, -7.237214595079422e-05, -6.685219705104828e-05, -6.133224815130234e-05, -5.5812299251556396e-05, -5.0292350351810455e-05, -4.4772401452064514e-05, -3.925245255231857e-05, -3.373250365257263e-05, -2.821255475282669e-05, -2.269260585308075e-05, -1.717265695333481e-05, -1.1652708053588867e-05, -6.132759153842926e-06, -6.128102540969849e-07, 4.907138645648956e-06, 1.0427087545394897e-05, 1.594703644514084e-05, 2.146698534488678e-05, 2.698693424463272e-05, 3.250688314437866e-05, 3.80268320441246e-05, 4.3546780943870544e-05, 4.9066729843616486e-05, 5.458667874336243e-05, 6.010662764310837e-05, 6.562657654285431e-05, 7.114652544260025e-05, 7.666647434234619e-05, 8.218642324209213e-05, 8.770637214183807e-05, 9.322632104158401e-05, 9.874626994132996e-05, 0.0001042662188410759, 0.00010978616774082184, 0.00011530611664056778, 0.00012082606554031372, 0.00012634601444005966, 0.0001318659633398056, 0.00013738591223955154, 0.00014290586113929749, 0.00014842581003904343, 0.00015394575893878937, 0.0001594657078385353, 0.00016498565673828125]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 16.0, 18.0, 17.0, 15.0, 31.0, 17.0, 24.0, 36.0, 34.0, 33.0, 48.0, 50.0, 50.0, 55.0, 52.0, 62.0, 58.0, 47.0, 54.0, 30.0, 44.0, 33.0, 31.0, 20.0, 15.0, 13.0, 17.0, 11.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.29296875, -6.13153076171875, -5.9700927734375, -5.80865478515625, -5.647216796875, -5.48577880859375, -5.3243408203125, -5.16290283203125, -5.00146484375, -4.84002685546875, -4.6785888671875, -4.51715087890625, -4.355712890625, -4.19427490234375, -4.0328369140625, -3.87139892578125, -3.7099609375, -3.54852294921875, -3.3870849609375, -3.22564697265625, -3.064208984375, -2.90277099609375, -2.7413330078125, -2.57989501953125, -2.41845703125, -2.25701904296875, -2.0955810546875, -1.93414306640625, -1.772705078125, -1.61126708984375, -1.4498291015625, -1.28839111328125, -1.126953125, -0.96551513671875, -0.8040771484375, -0.64263916015625, -0.481201171875, -0.31976318359375, -0.1583251953125, 0.00311279296875, 0.16455078125, 0.32598876953125, 0.4874267578125, 0.64886474609375, 0.810302734375, 0.97174072265625, 1.1331787109375, 1.29461669921875, 1.4560546875, 1.61749267578125, 1.7789306640625, 1.94036865234375, 2.101806640625, 2.26324462890625, 2.4246826171875, 2.58612060546875, 2.74755859375, 2.90899658203125, 3.0704345703125, 3.23187255859375, 3.393310546875, 3.55474853515625, 3.7161865234375, 3.87762451171875, 4.0390625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 9.0, 9.0, 19.0, 23.0, 20.0, 42.0, 44.0, 69.0, 103.0, 126.0, 182.0, 231.0, 321.0, 491.0, 635.0, 933.0, 1326.0, 1971.0, 3080.0, 5351.0, 10535.0, 30146.0, 756300.0, 195459.0, 19870.0, 8296.0, 4420.0, 2745.0, 1694.0, 1169.0, 828.0, 574.0, 425.0, 297.0, 223.0, 169.0, 111.0, 79.0, 67.0, 40.0, 35.0, 24.0, 19.0, 18.0, 11.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.515625, -29.58642578125, -28.6572265625, -27.72802734375, -26.798828125, -25.86962890625, -24.9404296875, -24.01123046875, -23.08203125, -22.15283203125, -21.2236328125, -20.29443359375, -19.365234375, -18.43603515625, -17.5068359375, -16.57763671875, -15.6484375, -14.71923828125, -13.7900390625, -12.86083984375, -11.931640625, -11.00244140625, -10.0732421875, -9.14404296875, -8.21484375, -7.28564453125, -6.3564453125, -5.42724609375, -4.498046875, -3.56884765625, -2.6396484375, -1.71044921875, -0.78125, 0.14794921875, 1.0771484375, 2.00634765625, 2.935546875, 3.86474609375, 4.7939453125, 5.72314453125, 6.65234375, 7.58154296875, 8.5107421875, 9.43994140625, 10.369140625, 11.29833984375, 12.2275390625, 13.15673828125, 14.0859375, 15.01513671875, 15.9443359375, 16.87353515625, 17.802734375, 18.73193359375, 19.6611328125, 20.59033203125, 21.51953125, 22.44873046875, 23.3779296875, 24.30712890625, 25.236328125, 26.16552734375, 27.0947265625, 28.02392578125, 28.953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 7.0, 8.0, 11.0, 12.0, 11.0, 14.0, 10.0, 19.0, 15.0, 22.0, 27.0, 22.0, 39.0, 30.0, 32.0, 43.0, 40.0, 55.0, 79.0, 204.0, 1642.0, 216.0, 84.0, 52.0, 37.0, 36.0, 35.0, 37.0, 29.0, 33.0, 25.0, 20.0, 19.0, 18.0, 14.0, 7.0, 10.0, 9.0, 1.0, 10.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.4609375, -12.0777587890625, -11.694580078125, -11.3114013671875, -10.92822265625, -10.5450439453125, -10.161865234375, -9.7786865234375, -9.3955078125, -9.0123291015625, -8.629150390625, -8.2459716796875, -7.86279296875, -7.4796142578125, -7.096435546875, -6.7132568359375, -6.330078125, -5.9468994140625, -5.563720703125, -5.1805419921875, -4.79736328125, -4.4141845703125, -4.031005859375, -3.6478271484375, -3.2646484375, -2.8814697265625, -2.498291015625, -2.1151123046875, -1.73193359375, -1.3487548828125, -0.965576171875, -0.5823974609375, -0.19921875, 0.1839599609375, 0.567138671875, 0.9503173828125, 1.33349609375, 1.7166748046875, 2.099853515625, 2.4830322265625, 2.8662109375, 3.2493896484375, 3.632568359375, 4.0157470703125, 4.39892578125, 4.7821044921875, 5.165283203125, 5.5484619140625, 5.931640625, 6.3148193359375, 6.697998046875, 7.0811767578125, 7.46435546875, 7.8475341796875, 8.230712890625, 8.6138916015625, 8.9970703125, 9.3802490234375, 9.763427734375, 10.1466064453125, 10.52978515625, 10.9129638671875, 11.296142578125, 11.6793212890625, 12.0625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 8.0, 13.0, 17.0, 15.0, 24.0, 21.0, 28.0, 37.0, 37.0, 38.0, 56.0, 69.0, 172.0, 551.0, 3187.0, 3109555.0, 30118.0, 925.0, 302.0, 127.0, 72.0, 35.0, 39.0, 31.0, 29.0, 22.0, 20.0, 30.0, 19.0, 7.0, 15.0, 10.0, 12.0, 11.0, 4.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-55.0625, -53.32568359375, -51.5888671875, -49.85205078125, -48.115234375, -46.37841796875, -44.6416015625, -42.90478515625, -41.16796875, -39.43115234375, -37.6943359375, -35.95751953125, -34.220703125, -32.48388671875, -30.7470703125, -29.01025390625, -27.2734375, -25.53662109375, -23.7998046875, -22.06298828125, -20.326171875, -18.58935546875, -16.8525390625, -15.11572265625, -13.37890625, -11.64208984375, -9.9052734375, -8.16845703125, -6.431640625, -4.69482421875, -2.9580078125, -1.22119140625, 0.515625, 2.25244140625, 3.9892578125, 5.72607421875, 7.462890625, 9.19970703125, 10.9365234375, 12.67333984375, 14.41015625, 16.14697265625, 17.8837890625, 19.62060546875, 21.357421875, 23.09423828125, 24.8310546875, 26.56787109375, 28.3046875, 30.04150390625, 31.7783203125, 33.51513671875, 35.251953125, 36.98876953125, 38.7255859375, 40.46240234375, 42.19921875, 43.93603515625, 45.6728515625, 47.40966796875, 49.146484375, 50.88330078125, 52.6201171875, 54.35693359375, 56.09375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 755.0, 243.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.55690002441406, -167.24212646484375, -162.92735290527344, -158.61257934570312, -154.2978057861328, -149.9830322265625, -145.6682586669922, -141.35348510742188, -137.0386962890625, -132.7239227294922, -128.40914916992188, -124.09437561035156, -119.77960205078125, -115.46482849121094, -111.1500473022461, -106.83527374267578, -102.5205078125, -98.20573425292969, -93.89096069335938, -89.57618713378906, -85.26141357421875, -80.94664001464844, -76.6318588256836, -72.31708526611328, -68.00231170654297, -63.687538146972656, -59.372764587402344, -55.057987213134766, -50.74321365356445, -46.42844009399414, -42.11366271972656, -37.79888916015625, -33.48411560058594, -29.169342041015625, -24.85456657409668, -20.539791107177734, -16.225017547607422, -11.91024398803711, -7.595468521118164, -3.2806930541992188, 1.0340805053710938, 5.348855018615723, 9.663629531860352, 13.97840404510498, 18.29317855834961, 22.607952117919922, 26.922727584838867, 31.237503051757812, 35.552276611328125, 39.86705017089844, 44.18182373046875, 48.49660110473633, 52.81137466430664, 57.12614822387695, 61.44092559814453, 65.75569915771484, 70.07047271728516, 74.38524627685547, 78.70001983642578, 83.0147933959961, 87.32957458496094, 91.64434814453125, 95.95912170410156, 100.27389526367188, 104.58866882324219]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 0.0, 3.0, 9.0, 5.0, 6.0, 19.0, 8.0, 7.0, 14.0, 20.0, 23.0, 27.0, 26.0, 23.0, 30.0, 32.0, 42.0, 28.0, 48.0, 43.0, 48.0, 45.0, 47.0, 38.0, 45.0, 46.0, 39.0, 35.0, 25.0, 42.0, 25.0, 28.0, 20.0, 21.0, 17.0, 11.0, 8.0, 16.0, 5.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.96411895751953, -35.4940071105957, -34.02389907836914, -32.55378723144531, -31.083677291870117, -29.613567352294922, -28.143457412719727, -26.67334747314453, -25.203235626220703, -23.733125686645508, -22.263015747070312, -20.792903900146484, -19.32279396057129, -17.852684020996094, -16.3825740814209, -14.912463188171387, -13.442354202270508, -11.972244262695312, -10.5021333694458, -9.032023429870605, -7.561913013458252, -6.091802597045898, -4.621692657470703, -3.1515817642211914, -1.681471824645996, -0.21136152744293213, 1.2587487697601318, 2.7288589477539062, 4.19896936416626, 5.669079780578613, 7.139189720153809, 8.60930061340332, 10.079410552978516, 11.549520492553711, 13.019631385803223, 14.489741325378418, 15.95985221862793, 17.429962158203125, 18.90007209777832, 20.370182037353516, 21.840293884277344, 23.31040382385254, 24.780513763427734, 26.250625610351562, 27.720735549926758, 29.190845489501953, 30.66095542907715, 32.131065368652344, 33.601173400878906, 35.071285247802734, 36.5413932800293, 38.011505126953125, 39.48161315917969, 40.951725006103516, 42.421836853027344, 43.891944885253906, 45.362056732177734, 46.83216857910156, 48.302276611328125, 49.77238845825195, 51.242496490478516, 52.712608337402344, 54.182716369628906, 55.652828216552734, 57.12294006347656]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 7.0, 11.0, 10.0, 14.0, 19.0, 20.0, 17.0, 25.0, 22.0, 28.0, 25.0, 39.0, 30.0, 45.0, 51.0, 54.0, 47.0, 58.0, 54.0, 61.0, 55.0, 38.0, 35.0, 39.0, 34.0, 29.0, 19.0, 23.0, 19.0, 15.0, 11.0, 7.0, 14.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1875, -6.020263671875, -5.85302734375, -5.685791015625, -5.5185546875, -5.351318359375, -5.18408203125, -5.016845703125, -4.849609375, -4.682373046875, -4.51513671875, -4.347900390625, -4.1806640625, -4.013427734375, -3.84619140625, -3.678955078125, -3.51171875, -3.344482421875, -3.17724609375, -3.010009765625, -2.8427734375, -2.675537109375, -2.50830078125, -2.341064453125, -2.173828125, -2.006591796875, -1.83935546875, -1.672119140625, -1.5048828125, -1.337646484375, -1.17041015625, -1.003173828125, -0.8359375, -0.668701171875, -0.50146484375, -0.334228515625, -0.1669921875, 0.000244140625, 0.16748046875, 0.334716796875, 0.501953125, 0.669189453125, 0.83642578125, 1.003662109375, 1.1708984375, 1.338134765625, 1.50537109375, 1.672607421875, 1.83984375, 2.007080078125, 2.17431640625, 2.341552734375, 2.5087890625, 2.676025390625, 2.84326171875, 3.010498046875, 3.177734375, 3.344970703125, 3.51220703125, 3.679443359375, 3.8466796875, 4.013916015625, 4.18115234375, 4.348388671875, 4.515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 8.0, 5.0, 7.0, 11.0, 21.0, 18.0, 26.0, 32.0, 53.0, 77.0, 111.0, 200.0, 319.0, 551.0, 1045.0, 2162.0, 4484.0, 10499.0, 30649.0, 201788.0, 3619767.0, 268429.0, 33329.0, 10871.0, 4800.0, 2275.0, 1155.0, 622.0, 325.0, 209.0, 129.0, 95.0, 58.0, 43.0, 24.0, 16.0, 16.0, 15.0, 7.0, 9.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.5087890625, -25.611328125, -24.7138671875, -23.81640625, -22.9189453125, -22.021484375, -21.1240234375, -20.2265625, -19.3291015625, -18.431640625, -17.5341796875, -16.63671875, -15.7392578125, -14.841796875, -13.9443359375, -13.046875, -12.1494140625, -11.251953125, -10.3544921875, -9.45703125, -8.5595703125, -7.662109375, -6.7646484375, -5.8671875, -4.9697265625, -4.072265625, -3.1748046875, -2.27734375, -1.3798828125, -0.482421875, 0.4150390625, 1.3125, 2.2099609375, 3.107421875, 4.0048828125, 4.90234375, 5.7998046875, 6.697265625, 7.5947265625, 8.4921875, 9.3896484375, 10.287109375, 11.1845703125, 12.08203125, 12.9794921875, 13.876953125, 14.7744140625, 15.671875, 16.5693359375, 17.466796875, 18.3642578125, 19.26171875, 20.1591796875, 21.056640625, 21.9541015625, 22.8515625, 23.7490234375, 24.646484375, 25.5439453125, 26.44140625, 27.3388671875, 28.236328125, 29.1337890625, 30.03125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 9.0, 16.0, 25.0, 40.0, 48.0, 56.0, 99.0, 129.0, 214.0, 346.0, 618.0, 771.0, 606.0, 346.0, 242.0, 148.0, 92.0, 73.0, 49.0, 29.0, 25.0, 33.0, 14.0, 11.0, 7.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.5703125, -26.75, -25.9296875, -25.109375, -24.2890625, -23.46875, -22.6484375, -21.828125, -21.0078125, -20.1875, -19.3671875, -18.546875, -17.7265625, -16.90625, -16.0859375, -15.265625, -14.4453125, -13.625, -12.8046875, -11.984375, -11.1640625, -10.34375, -9.5234375, -8.703125, -7.8828125, -7.0625, -6.2421875, -5.421875, -4.6015625, -3.78125, -2.9609375, -2.140625, -1.3203125, -0.5, 0.3203125, 1.140625, 1.9609375, 2.78125, 3.6015625, 4.421875, 5.2421875, 6.0625, 6.8828125, 7.703125, 8.5234375, 9.34375, 10.1640625, 10.984375, 11.8046875, 12.625, 13.4453125, 14.265625, 15.0859375, 15.90625, 16.7265625, 17.546875, 18.3671875, 19.1875, 20.0078125, 20.828125, 21.6484375, 22.46875, 23.2890625, 24.109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 7.0, 6.0, 11.0, 7.0, 21.0, 27.0, 36.0, 38.0, 54.0, 87.0, 123.0, 168.0, 334.0, 838.0, 13162.0, 4170489.0, 7280.0, 710.0, 339.0, 173.0, 118.0, 84.0, 49.0, 32.0, 30.0, 21.0, 16.0, 6.0, 2.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.25, -80.49609375, -76.7421875, -72.98828125, -69.234375, -65.48046875, -61.7265625, -57.97265625, -54.21875, -50.46484375, -46.7109375, -42.95703125, -39.203125, -35.44921875, -31.6953125, -27.94140625, -24.1875, -20.43359375, -16.6796875, -12.92578125, -9.171875, -5.41796875, -1.6640625, 2.08984375, 5.84375, 9.59765625, 13.3515625, 17.10546875, 20.859375, 24.61328125, 28.3671875, 32.12109375, 35.875, 39.62890625, 43.3828125, 47.13671875, 50.890625, 54.64453125, 58.3984375, 62.15234375, 65.90625, 69.66015625, 73.4140625, 77.16796875, 80.921875, 84.67578125, 88.4296875, 92.18359375, 95.9375, 99.69140625, 103.4453125, 107.19921875, 110.953125, 114.70703125, 118.4609375, 122.21484375, 125.96875, 129.72265625, 133.4765625, 137.23046875, 140.984375, 144.73828125, 148.4921875, 152.24609375, 156.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [4.0, 2.0, 134.0, 771.0, 107.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.26115798950195, -23.710105895996094, -14.159051895141602, -4.607997894287109, 4.94305419921875, 14.49410629272461, 24.045162200927734, 33.59621047973633, 43.14726638793945, 52.69831848144531, 62.24937438964844, 71.80043029785156, 81.35147857666016, 90.90252685546875, 100.45358276367188, 110.004638671875, 119.55569458007812, 129.10675048828125, 138.65780639648438, 148.2088623046875, 157.75990295410156, 167.3109588623047, 176.8620147705078, 186.41305541992188, 195.964111328125, 205.51516723632812, 215.06622314453125, 224.61727905273438, 234.16831970214844, 243.71937561035156, 253.2704315185547, 262.82147216796875, 272.3725280761719, 281.923583984375, 291.4746398925781, 301.02569580078125, 310.5767517089844, 320.1278076171875, 329.6788330078125, 339.2298889160156, 348.78094482421875, 358.3320007324219, 367.883056640625, 377.4341125488281, 386.98516845703125, 396.53619384765625, 406.0872802734375, 415.6383056640625, 425.18939208984375, 434.7404479980469, 444.29150390625, 453.8425598144531, 463.39361572265625, 472.94464111328125, 482.4957275390625, 492.0467529296875, 501.5978088378906, 511.14886474609375, 520.6998901367188, 530.2509765625, 539.802001953125, 549.3530883789062, 558.9041137695312, 568.4552001953125, 578.0062255859375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 9.0, 12.0, 9.0, 16.0, 16.0, 19.0, 17.0, 31.0, 25.0, 26.0, 40.0, 43.0, 33.0, 34.0, 38.0, 38.0, 52.0, 44.0, 50.0, 47.0, 35.0, 47.0, 26.0, 38.0, 34.0, 19.0, 27.0, 24.0, 23.0, 21.0, 20.0, 16.0, 15.0, 8.0, 10.0, 8.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-69.60829162597656, -67.6014404296875, -65.59459686279297, -63.587745666503906, -61.580894470214844, -59.57404708862305, -57.56719970703125, -55.56034851074219, -53.553497314453125, -51.54664993286133, -49.539798736572266, -47.53295135498047, -45.526100158691406, -43.51925277709961, -41.51240539550781, -39.50555419921875, -37.49870681762695, -35.491859436035156, -33.485008239746094, -31.478160858154297, -29.471309661865234, -27.464462280273438, -25.457612991333008, -23.450763702392578, -21.44391441345215, -19.43706512451172, -17.43021583557129, -15.423367500305176, -13.416518211364746, -11.409668922424316, -9.402820587158203, -7.395971298217773, -5.389122009277344, -3.382272958755493, -1.3754239082336426, 0.6314249038696289, 2.6382741928100586, 4.645123481750488, 6.651971817016602, 8.658821105957031, 10.665670394897461, 12.67251968383789, 14.67936897277832, 16.68621826171875, 18.693065643310547, 20.69991683959961, 22.706764221191406, 24.713613510131836, 26.720462799072266, 28.727312088012695, 30.734161376953125, 32.74100875854492, 34.747859954833984, 36.75470733642578, 38.761558532714844, 40.76840591430664, 42.77525329589844, 44.782100677490234, 46.7889518737793, 48.795799255371094, 50.802650451660156, 52.80949783325195, 54.81634521484375, 56.82319641113281, 58.830047607421875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 9.0, 13.0, 7.0, 14.0, 17.0, 22.0, 23.0, 35.0, 23.0, 35.0, 29.0, 33.0, 43.0, 40.0, 42.0, 50.0, 45.0, 59.0, 53.0, 40.0, 45.0, 43.0, 32.0, 40.0, 29.0, 27.0, 23.0, 19.0, 17.0, 14.0, 12.0, 7.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.7109375, -5.55352783203125, -5.3961181640625, -5.23870849609375, -5.081298828125, -4.92388916015625, -4.7664794921875, -4.60906982421875, -4.45166015625, -4.29425048828125, -4.1368408203125, -3.97943115234375, -3.822021484375, -3.66461181640625, -3.5072021484375, -3.34979248046875, -3.1923828125, -3.03497314453125, -2.8775634765625, -2.72015380859375, -2.562744140625, -2.40533447265625, -2.2479248046875, -2.09051513671875, -1.93310546875, -1.77569580078125, -1.6182861328125, -1.46087646484375, -1.303466796875, -1.14605712890625, -0.9886474609375, -0.83123779296875, -0.673828125, -0.51641845703125, -0.3590087890625, -0.20159912109375, -0.044189453125, 0.11322021484375, 0.2706298828125, 0.42803955078125, 0.58544921875, 0.74285888671875, 0.9002685546875, 1.05767822265625, 1.215087890625, 1.37249755859375, 1.5299072265625, 1.68731689453125, 1.8447265625, 2.00213623046875, 2.1595458984375, 2.31695556640625, 2.474365234375, 2.63177490234375, 2.7891845703125, 2.94659423828125, 3.10400390625, 3.26141357421875, 3.4188232421875, 3.57623291015625, 3.733642578125, 3.89105224609375, 4.0484619140625, 4.20587158203125, 4.36328125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 15.0, 19.0, 37.0, 54.0, 79.0, 118.0, 192.0, 310.0, 453.0, 686.0, 1059.0, 1833.0, 2942.0, 4715.0, 7616.0, 12326.0, 20740.0, 34448.0, 58052.0, 101939.0, 192597.0, 265304.0, 145790.0, 79400.0, 46776.0, 27820.0, 16736.0, 9980.0, 6300.0, 3768.0, 2378.0, 1466.0, 940.0, 607.0, 356.0, 216.0, 162.0, 100.0, 80.0, 54.0, 31.0, 17.0, 11.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.87060546875, -0.844451904296875, -0.81829833984375, -0.792144775390625, -0.7659912109375, -0.739837646484375, -0.71368408203125, -0.687530517578125, -0.661376953125, -0.635223388671875, -0.60906982421875, -0.582916259765625, -0.5567626953125, -0.530609130859375, -0.50445556640625, -0.478302001953125, -0.4521484375, -0.425994873046875, -0.39984130859375, -0.373687744140625, -0.3475341796875, -0.321380615234375, -0.29522705078125, -0.269073486328125, -0.242919921875, -0.216766357421875, -0.19061279296875, -0.164459228515625, -0.1383056640625, -0.112152099609375, -0.08599853515625, -0.059844970703125, -0.03369140625, -0.007537841796875, 0.01861572265625, 0.044769287109375, 0.0709228515625, 0.097076416015625, 0.12322998046875, 0.149383544921875, 0.175537109375, 0.201690673828125, 0.22784423828125, 0.253997802734375, 0.2801513671875, 0.306304931640625, 0.33245849609375, 0.358612060546875, 0.384765625, 0.410919189453125, 0.43707275390625, 0.463226318359375, 0.4893798828125, 0.515533447265625, 0.54168701171875, 0.567840576171875, 0.593994140625, 0.620147705078125, 0.64630126953125, 0.672454833984375, 0.6986083984375, 0.724761962890625, 0.75091552734375, 0.777069091796875, 0.80322265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 4.0, 2.0, 11.0, 14.0, 9.0, 12.0, 17.0, 11.0, 26.0, 29.0, 24.0, 22.0, 20.0, 30.0, 43.0, 33.0, 32.0, 41.0, 35.0, 45.0, 1059.0, 40.0, 44.0, 39.0, 34.0, 45.0, 34.0, 31.0, 29.0, 34.0, 30.0, 20.0, 26.0, 17.0, 9.0, 14.0, 11.0, 7.0, 12.0, 5.0, 5.0, 7.0, 0.0, 9.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.734375, -2.64202880859375, -2.5496826171875, -2.45733642578125, -2.364990234375, -2.27264404296875, -2.1802978515625, -2.08795166015625, -1.99560546875, -1.90325927734375, -1.8109130859375, -1.71856689453125, -1.626220703125, -1.53387451171875, -1.4415283203125, -1.34918212890625, -1.2568359375, -1.16448974609375, -1.0721435546875, -0.97979736328125, -0.887451171875, -0.79510498046875, -0.7027587890625, -0.61041259765625, -0.51806640625, -0.42572021484375, -0.3333740234375, -0.24102783203125, -0.148681640625, -0.05633544921875, 0.0360107421875, 0.12835693359375, 0.220703125, 0.31304931640625, 0.4053955078125, 0.49774169921875, 0.590087890625, 0.68243408203125, 0.7747802734375, 0.86712646484375, 0.95947265625, 1.05181884765625, 1.1441650390625, 1.23651123046875, 1.328857421875, 1.42120361328125, 1.5135498046875, 1.60589599609375, 1.6982421875, 1.79058837890625, 1.8829345703125, 1.97528076171875, 2.067626953125, 2.15997314453125, 2.2523193359375, 2.34466552734375, 2.43701171875, 2.52935791015625, 2.6217041015625, 2.71405029296875, 2.806396484375, 2.89874267578125, 2.9910888671875, 3.08343505859375, 3.17578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 7.0, 15.0, 18.0, 30.0, 45.0, 61.0, 101.0, 140.0, 202.0, 320.0, 486.0, 761.0, 1079.0, 1647.0, 2387.0, 3792.0, 5561.0, 8600.0, 13120.0, 20200.0, 31747.0, 52094.0, 85638.0, 150482.0, 1299043.0, 168678.0, 95309.0, 56819.0, 35211.0, 22080.0, 14080.0, 9200.0, 6152.0, 4050.0, 2662.0, 1785.0, 1138.0, 794.0, 530.0, 349.0, 258.0, 144.0, 98.0, 78.0, 45.0, 36.0, 21.0, 10.0, 10.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.69873046875, -0.6779327392578125, -0.657135009765625, -0.6363372802734375, -0.61553955078125, -0.5947418212890625, -0.573944091796875, -0.5531463623046875, -0.5323486328125, -0.5115509033203125, -0.490753173828125, -0.4699554443359375, -0.44915771484375, -0.4283599853515625, -0.407562255859375, -0.3867645263671875, -0.365966796875, -0.3451690673828125, -0.324371337890625, -0.3035736083984375, -0.28277587890625, -0.2619781494140625, -0.241180419921875, -0.2203826904296875, -0.1995849609375, -0.1787872314453125, -0.157989501953125, -0.1371917724609375, -0.11639404296875, -0.0955963134765625, -0.074798583984375, -0.0540008544921875, -0.033203125, -0.0124053955078125, 0.008392333984375, 0.0291900634765625, 0.04998779296875, 0.0707855224609375, 0.091583251953125, 0.1123809814453125, 0.1331787109375, 0.1539764404296875, 0.174774169921875, 0.1955718994140625, 0.21636962890625, 0.2371673583984375, 0.257965087890625, 0.2787628173828125, 0.299560546875, 0.3203582763671875, 0.341156005859375, 0.3619537353515625, 0.38275146484375, 0.4035491943359375, 0.424346923828125, 0.4451446533203125, 0.4659423828125, 0.4867401123046875, 0.507537841796875, 0.5283355712890625, 0.54913330078125, 0.5699310302734375, 0.590728759765625, 0.6115264892578125, 0.63232421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 9.0, 16.0, 8.0, 14.0, 21.0, 24.0, 35.0, 31.0, 32.0, 28.0, 41.0, 50.0, 54.0, 55.0, 66.0, 75.0, 42.0, 45.0, 49.0, 51.0, 38.0, 46.0, 18.0, 17.0, 18.0, 14.0, 15.0, 19.0, 12.0, 5.0, 9.0, 8.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.0005235671997070312, -0.00051068514585495, -0.0004978030920028687, -0.00048492103815078735, -0.00047203898429870605, -0.00045915693044662476, -0.00044627487659454346, -0.00043339282274246216, -0.00042051076889038086, -0.00040762871503829956, -0.00039474666118621826, -0.00038186460733413696, -0.00036898255348205566, -0.00035610049962997437, -0.00034321844577789307, -0.00033033639192581177, -0.00031745433807373047, -0.00030457228422164917, -0.00029169023036956787, -0.00027880817651748657, -0.0002659261226654053, -0.000253044068813324, -0.00024016201496124268, -0.00022727996110916138, -0.00021439790725708008, -0.00020151585340499878, -0.00018863379955291748, -0.00017575174570083618, -0.00016286969184875488, -0.00014998763799667358, -0.00013710558414459229, -0.00012422353029251099, -0.00011134147644042969, -9.845942258834839e-05, -8.557736873626709e-05, -7.269531488418579e-05, -5.981326103210449e-05, -4.693120718002319e-05, -3.4049153327941895e-05, -2.1167099475860596e-05, -8.285045623779297e-06, 4.597008228302002e-06, 1.74790620803833e-05, 3.03611159324646e-05, 4.32431697845459e-05, 5.61252236366272e-05, 6.90072774887085e-05, 8.18893313407898e-05, 9.47713851928711e-05, 0.00010765343904495239, 0.00012053549289703369, 0.000133417546749115, 0.0001462996006011963, 0.0001591816544532776, 0.0001720637083053589, 0.00018494576215744019, 0.00019782781600952148, 0.00021070986986160278, 0.00022359192371368408, 0.00023647397756576538, 0.0002493560314178467, 0.000262238085269928, 0.0002751201391220093, 0.0002880021929740906, 0.0003008842468261719]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 16.0, 11.0, 22.0, 21.0, 30.0, 39.0, 66.0, 66.0, 101.0, 144.0, 317.0, 602.0, 4301.0, 1040318.0, 1268.0, 426.0, 242.0, 148.0, 102.0, 70.0, 53.0, 32.0, 32.0, 18.0, 14.0, 20.0, 13.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00841522216796875, -0.008054494857788086, -0.007693767547607422, -0.007333040237426758, -0.006972312927246094, -0.00661158561706543, -0.006250858306884766, -0.0058901309967041016, -0.0055294036865234375, -0.0051686763763427734, -0.004807949066162109, -0.004447221755981445, -0.004086494445800781, -0.003725767135620117, -0.003365039825439453, -0.003004312515258789, -0.002643585205078125, -0.002282857894897461, -0.0019221305847167969, -0.0015614032745361328, -0.0012006759643554688, -0.0008399486541748047, -0.0004792213439941406, -0.00011849403381347656, 0.0002422332763671875, 0.0006029605865478516, 0.0009636878967285156, 0.0013244152069091797, 0.0016851425170898438, 0.002045869827270508, 0.002406597137451172, 0.002767324447631836, 0.0031280517578125, 0.003488779067993164, 0.003849506378173828, 0.004210233688354492, 0.004570960998535156, 0.00493168830871582, 0.005292415618896484, 0.0056531429290771484, 0.0060138702392578125, 0.0063745975494384766, 0.006735324859619141, 0.007096052169799805, 0.007456779479980469, 0.007817506790161133, 0.008178234100341797, 0.008538961410522461, 0.008899688720703125, 0.009260416030883789, 0.009621143341064453, 0.009981870651245117, 0.010342597961425781, 0.010703325271606445, 0.01106405258178711, 0.011424779891967773, 0.011785507202148438, 0.012146234512329102, 0.012506961822509766, 0.01286768913269043, 0.013228416442871094, 0.013589143753051758, 0.013949871063232422, 0.014310598373413086, 0.01467132568359375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 14.0, 57.0, 248.0, 461.0, 195.0, 31.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003618910850491375, -0.00034320427221246064, -0.00032451743027195334, -0.0003058306174352765, -0.0002871437754947692, -0.0002684569626580924, -0.0002497701207175851, -0.00023108330788090825, -0.00021239648049231619, -0.00019370965310372412, -0.00017502282571513206, -0.00015633599832654, -0.00013764918548986316, -0.00011896235082531348, -0.00010027553071267903, -8.158870332408696e-05, -6.29018759354949e-05, -4.4215048546902835e-05, -2.5528224796289578e-05, -6.841401045676321e-06, 1.1845426342915744e-05, 3.053225373150781e-05, 4.921907384414226e-05, 6.790590123273432e-05, 8.659272862132639e-05, 0.00010527955600991845, 0.00012396638339851052, 0.00014265321078710258, 0.00016134002362377942, 0.0001800268655642867, 0.00019871367840096354, 0.0002174005057895556, 0.00023608730407431722, 0.00025477411691099405, 0.00027346095885150135, 0.0002921477716881782, 0.0003108346136286855, 0.0003295214264653623, 0.00034820823930203915, 0.00036689508124254644, 0.00038558192318305373, 0.00040426873601973057, 0.00042295557796023786, 0.0004416423907969147, 0.000460329232737422, 0.0004790160455740988, 0.0004977028584107757, 0.0005163897294551134, 0.0005350764840841293, 0.0005537632969208062, 0.000572450109757483, 0.0005911369808018208, 0.0006098237936384976, 0.0006285106064751744, 0.0006471974193118513, 0.0006658842321485281, 0.0006845711031928658, 0.0007032579160295427, 0.0007219447288662195, 0.0007406315999105573, 0.0007593184127472341, 0.0007780052255839109, 0.0007966920384205878, 0.0008153788512572646, 0.0008340657223016024]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 8.0, 12.0, 21.0, 16.0, 25.0, 19.0, 28.0, 16.0, 24.0, 37.0, 27.0, 36.0, 27.0, 29.0, 37.0, 49.0, 42.0, 39.0, 49.0, 37.0, 37.0, 35.0, 36.0, 30.0, 33.0, 31.0, 26.0, 20.0, 19.0, 25.0, 19.0, 15.0, 9.0, 17.0, 7.0, 5.0, 7.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002194046974182129, -0.00021274667233228683, -0.00020608864724636078, -0.00019943062216043472, -0.00019277259707450867, -0.0001861145719885826, -0.00017945654690265656, -0.0001727985218167305, -0.00016614049673080444, -0.0001594824716448784, -0.00015282444655895233, -0.00014616642147302628, -0.00013950839638710022, -0.00013285037130117416, -0.0001261923462152481, -0.00011953432112932205, -0.000112876296043396, -0.00010621827095746994, -9.956024587154388e-05, -9.290222078561783e-05, -8.624419569969177e-05, -7.958617061376572e-05, -7.292814552783966e-05, -6.62701204419136e-05, -5.961209535598755e-05, -5.295407027006149e-05, -4.629604518413544e-05, -3.963802009820938e-05, -3.2979995012283325e-05, -2.632196992635727e-05, -1.9663944840431213e-05, -1.3005919754505157e-05, -6.3478946685791016e-06, 3.1013041734695435e-07, 6.96815550327301e-06, 1.3626180589199066e-05, 2.0284205675125122e-05, 2.6942230761051178e-05, 3.3600255846977234e-05, 4.025828093290329e-05, 4.6916306018829346e-05, 5.35743311047554e-05, 6.023235619068146e-05, 6.689038127660751e-05, 7.354840636253357e-05, 8.020643144845963e-05, 8.686445653438568e-05, 9.352248162031174e-05, 0.00010018050670623779, 0.00010683853179216385, 0.0001134965568780899, 0.00012015458196401596, 0.00012681260704994202, 0.00013347063213586807, 0.00014012865722179413, 0.00014678668230772018, 0.00015344470739364624, 0.0001601027324795723, 0.00016676075756549835, 0.0001734187826514244, 0.00018007680773735046, 0.00018673483282327652, 0.00019339285790920258, 0.00020005088299512863, 0.0002067089080810547]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 9.0, 13.0, 7.0, 14.0, 17.0, 22.0, 23.0, 35.0, 23.0, 35.0, 29.0, 33.0, 43.0, 40.0, 42.0, 50.0, 45.0, 59.0, 53.0, 40.0, 45.0, 43.0, 32.0, 40.0, 29.0, 27.0, 23.0, 19.0, 17.0, 14.0, 12.0, 7.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.7109375, -5.55352783203125, -5.3961181640625, -5.23870849609375, -5.081298828125, -4.92388916015625, -4.7664794921875, -4.60906982421875, -4.45166015625, -4.29425048828125, -4.1368408203125, -3.97943115234375, -3.822021484375, -3.66461181640625, -3.5072021484375, -3.34979248046875, -3.1923828125, -3.03497314453125, -2.8775634765625, -2.72015380859375, -2.562744140625, -2.40533447265625, -2.2479248046875, -2.09051513671875, -1.93310546875, -1.77569580078125, -1.6182861328125, -1.46087646484375, -1.303466796875, -1.14605712890625, -0.9886474609375, -0.83123779296875, -0.673828125, -0.51641845703125, -0.3590087890625, -0.20159912109375, -0.044189453125, 0.11322021484375, 0.2706298828125, 0.42803955078125, 0.58544921875, 0.74285888671875, 0.9002685546875, 1.05767822265625, 1.215087890625, 1.37249755859375, 1.5299072265625, 1.68731689453125, 1.8447265625, 2.00213623046875, 2.1595458984375, 2.31695556640625, 2.474365234375, 2.63177490234375, 2.7891845703125, 2.94659423828125, 3.10400390625, 3.26141357421875, 3.4188232421875, 3.57623291015625, 3.733642578125, 3.89105224609375, 4.0484619140625, 4.20587158203125, 4.36328125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 21.0, 23.0, 46.0, 48.0, 78.0, 91.0, 131.0, 225.0, 299.0, 563.0, 958.0, 1930.0, 4603.0, 13680.0, 46226.0, 193152.0, 543248.0, 178341.0, 43035.0, 12883.0, 4531.0, 1970.0, 919.0, 539.0, 304.0, 225.0, 130.0, 81.0, 70.0, 59.0, 31.0, 27.0, 15.0, 14.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.796875, -5.62872314453125, -5.4605712890625, -5.29241943359375, -5.124267578125, -4.95611572265625, -4.7879638671875, -4.61981201171875, -4.45166015625, -4.28350830078125, -4.1153564453125, -3.94720458984375, -3.779052734375, -3.61090087890625, -3.4427490234375, -3.27459716796875, -3.1064453125, -2.93829345703125, -2.7701416015625, -2.60198974609375, -2.433837890625, -2.26568603515625, -2.0975341796875, -1.92938232421875, -1.76123046875, -1.59307861328125, -1.4249267578125, -1.25677490234375, -1.088623046875, -0.92047119140625, -0.7523193359375, -0.58416748046875, -0.416015625, -0.24786376953125, -0.0797119140625, 0.08843994140625, 0.256591796875, 0.42474365234375, 0.5928955078125, 0.76104736328125, 0.92919921875, 1.09735107421875, 1.2655029296875, 1.43365478515625, 1.601806640625, 1.76995849609375, 1.9381103515625, 2.10626220703125, 2.2744140625, 2.44256591796875, 2.6107177734375, 2.77886962890625, 2.947021484375, 3.11517333984375, 3.2833251953125, 3.45147705078125, 3.61962890625, 3.78778076171875, 3.9559326171875, 4.12408447265625, 4.292236328125, 4.46038818359375, 4.6285400390625, 4.79669189453125, 4.96484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 9.0, 8.0, 16.0, 15.0, 17.0, 23.0, 26.0, 30.0, 25.0, 25.0, 30.0, 30.0, 40.0, 54.0, 40.0, 83.0, 437.0, 1607.0, 81.0, 38.0, 53.0, 42.0, 43.0, 42.0, 24.0, 28.0, 27.0, 17.0, 23.0, 21.0, 15.0, 19.0, 11.0, 7.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.53125, -16.0313720703125, -15.531494140625, -15.0316162109375, -14.53173828125, -14.0318603515625, -13.531982421875, -13.0321044921875, -12.5322265625, -12.0323486328125, -11.532470703125, -11.0325927734375, -10.53271484375, -10.0328369140625, -9.532958984375, -9.0330810546875, -8.533203125, -8.0333251953125, -7.533447265625, -7.0335693359375, -6.53369140625, -6.0338134765625, -5.533935546875, -5.0340576171875, -4.5341796875, -4.0343017578125, -3.534423828125, -3.0345458984375, -2.53466796875, -2.0347900390625, -1.534912109375, -1.0350341796875, -0.53515625, -0.0352783203125, 0.464599609375, 0.9644775390625, 1.46435546875, 1.9642333984375, 2.464111328125, 2.9639892578125, 3.4638671875, 3.9637451171875, 4.463623046875, 4.9635009765625, 5.46337890625, 5.9632568359375, 6.463134765625, 6.9630126953125, 7.462890625, 7.9627685546875, 8.462646484375, 8.9625244140625, 9.46240234375, 9.9622802734375, 10.462158203125, 10.9620361328125, 11.4619140625, 11.9617919921875, 12.461669921875, 12.9615478515625, 13.46142578125, 13.9613037109375, 14.461181640625, 14.9610595703125, 15.4609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 9.0, 7.0, 9.0, 15.0, 17.0, 28.0, 22.0, 18.0, 23.0, 38.0, 31.0, 61.0, 77.0, 139.0, 191.0, 545.0, 2388.0, 2961827.0, 178001.0, 1239.0, 395.0, 174.0, 97.0, 75.0, 42.0, 37.0, 30.0, 30.0, 29.0, 21.0, 16.0, 20.0, 10.0, 6.0, 11.0, 6.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.21875, -35.044921875, -33.87109375, -32.697265625, -31.5234375, -30.349609375, -29.17578125, -28.001953125, -26.828125, -25.654296875, -24.48046875, -23.306640625, -22.1328125, -20.958984375, -19.78515625, -18.611328125, -17.4375, -16.263671875, -15.08984375, -13.916015625, -12.7421875, -11.568359375, -10.39453125, -9.220703125, -8.046875, -6.873046875, -5.69921875, -4.525390625, -3.3515625, -2.177734375, -1.00390625, 0.169921875, 1.34375, 2.517578125, 3.69140625, 4.865234375, 6.0390625, 7.212890625, 8.38671875, 9.560546875, 10.734375, 11.908203125, 13.08203125, 14.255859375, 15.4296875, 16.603515625, 17.77734375, 18.951171875, 20.125, 21.298828125, 22.47265625, 23.646484375, 24.8203125, 25.994140625, 27.16796875, 28.341796875, 29.515625, 30.689453125, 31.86328125, 33.037109375, 34.2109375, 35.384765625, 36.55859375, 37.732421875, 38.90625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 8.0, 19.0, 75.0, 173.0, 236.0, 254.0, 154.0, 59.0, 29.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.962770938873291, -5.297201633453369, -4.631632328033447, -3.9660627841949463, -3.3004934787750244, -2.6349241733551025, -1.9693546295166016, -1.3037853240966797, -0.6382160186767578, 0.027353346347808838, 0.6929227113723755, 1.358492136001587, 2.024061441421509, 2.6896307468414307, 3.3552002906799316, 4.0207695960998535, 4.686338901519775, 5.351908206939697, 6.017477512359619, 6.683047294616699, 7.348616600036621, 8.014185905456543, 8.679755210876465, 9.345324516296387, 10.010893821716309, 10.67646312713623, 11.342032432556152, 12.007601737976074, 12.673171043395996, 13.338740348815918, 14.004310607910156, 14.669879913330078, 15.335447311401367, 16.00101661682129, 16.66658592224121, 17.332155227661133, 17.997724533081055, 18.663293838500977, 19.3288631439209, 19.99443244934082, 20.660001754760742, 21.325571060180664, 21.991140365600586, 22.656709671020508, 23.32227897644043, 23.98784828186035, 24.653417587280273, 25.318986892700195, 25.98455810546875, 26.650127410888672, 27.315696716308594, 27.981266021728516, 28.646835327148438, 29.31240463256836, 29.97797393798828, 30.643543243408203, 31.309112548828125, 31.974681854248047, 32.64025115966797, 33.30582046508789, 33.97138977050781, 34.636959075927734, 35.302528381347656, 35.96809768676758, 36.6336669921875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 12.0, 16.0, 10.0, 16.0, 11.0, 22.0, 22.0, 36.0, 37.0, 31.0, 47.0, 29.0, 32.0, 39.0, 44.0, 44.0, 43.0, 44.0, 56.0, 49.0, 50.0, 38.0, 27.0, 36.0, 26.0, 25.0, 22.0, 15.0, 29.0, 17.0, 8.0, 13.0, 6.0, 14.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.35805130004883, -52.647804260253906, -50.937557220458984, -49.22731018066406, -47.517066955566406, -45.806819915771484, -44.09657287597656, -42.38632583618164, -40.67607879638672, -38.9658317565918, -37.255584716796875, -35.54534149169922, -33.8350944519043, -32.124847412109375, -30.414600372314453, -28.70435333251953, -26.994110107421875, -25.283863067626953, -23.573617935180664, -21.863370895385742, -20.153125762939453, -18.44287872314453, -16.73263168334961, -15.022385597229004, -13.312139511108398, -11.601893424987793, -9.891647338867188, -8.181400299072266, -6.47115421295166, -4.760908126831055, -3.050661087036133, -1.3404150009155273, 0.36983489990234375, 2.0800812244415283, 3.790327548980713, 5.500574111938477, 7.210820198059082, 8.921066284179688, 10.63131332397461, 12.341559410095215, 14.05180549621582, 15.762051582336426, 17.47229766845703, 19.182544708251953, 20.892791748046875, 22.603036880493164, 24.313283920288086, 26.023529052734375, 27.733776092529297, 29.44402313232422, 31.154268264770508, 32.86451721191406, 34.57476043701172, 36.28500747680664, 37.99525451660156, 39.705501556396484, 41.415748596191406, 43.12599563598633, 44.83624267578125, 46.546485900878906, 48.25673294067383, 49.96697998046875, 51.67722702026367, 53.387474060058594, 55.09771728515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 3.0, 7.0, 9.0, 11.0, 11.0, 10.0, 18.0, 9.0, 23.0, 22.0, 28.0, 27.0, 26.0, 35.0, 36.0, 44.0, 35.0, 37.0, 46.0, 50.0, 50.0, 57.0, 55.0, 35.0, 50.0, 37.0, 38.0, 28.0, 25.0, 27.0, 21.0, 10.0, 20.0, 11.0, 12.0, 6.0, 9.0, 12.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.73046875, -5.56939697265625, -5.4083251953125, -5.24725341796875, -5.086181640625, -4.92510986328125, -4.7640380859375, -4.60296630859375, -4.44189453125, -4.28082275390625, -4.1197509765625, -3.95867919921875, -3.797607421875, -3.63653564453125, -3.4754638671875, -3.31439208984375, -3.1533203125, -2.99224853515625, -2.8311767578125, -2.67010498046875, -2.509033203125, -2.34796142578125, -2.1868896484375, -2.02581787109375, -1.86474609375, -1.70367431640625, -1.5426025390625, -1.38153076171875, -1.220458984375, -1.05938720703125, -0.8983154296875, -0.73724365234375, -0.576171875, -0.41510009765625, -0.2540283203125, -0.09295654296875, 0.068115234375, 0.22918701171875, 0.3902587890625, 0.55133056640625, 0.71240234375, 0.87347412109375, 1.0345458984375, 1.19561767578125, 1.356689453125, 1.51776123046875, 1.6788330078125, 1.83990478515625, 2.0009765625, 2.16204833984375, 2.3231201171875, 2.48419189453125, 2.645263671875, 2.80633544921875, 2.9674072265625, 3.12847900390625, 3.28955078125, 3.45062255859375, 3.6116943359375, 3.77276611328125, 3.933837890625, 4.09490966796875, 4.2559814453125, 4.41705322265625, 4.578125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 12.0, 10.0, 6.0, 18.0, 14.0, 15.0, 33.0, 35.0, 56.0, 74.0, 119.0, 176.0, 343.0, 772.0, 3004.0, 24010.0, 597422.0, 3239332.0, 310238.0, 14954.0, 2170.0, 671.0, 300.0, 162.0, 97.0, 61.0, 49.0, 32.0, 28.0, 14.0, 17.0, 12.0, 5.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.46875, -19.9215087890625, -19.374267578125, -18.8270263671875, -18.27978515625, -17.7325439453125, -17.185302734375, -16.6380615234375, -16.0908203125, -15.5435791015625, -14.996337890625, -14.4490966796875, -13.90185546875, -13.3546142578125, -12.807373046875, -12.2601318359375, -11.712890625, -11.1656494140625, -10.618408203125, -10.0711669921875, -9.52392578125, -8.9766845703125, -8.429443359375, -7.8822021484375, -7.3349609375, -6.7877197265625, -6.240478515625, -5.6932373046875, -5.14599609375, -4.5987548828125, -4.051513671875, -3.5042724609375, -2.95703125, -2.4097900390625, -1.862548828125, -1.3153076171875, -0.76806640625, -0.2208251953125, 0.326416015625, 0.8736572265625, 1.4208984375, 1.9681396484375, 2.515380859375, 3.0626220703125, 3.60986328125, 4.1571044921875, 4.704345703125, 5.2515869140625, 5.798828125, 6.3460693359375, 6.893310546875, 7.4405517578125, 7.98779296875, 8.5350341796875, 9.082275390625, 9.6295166015625, 10.1767578125, 10.7239990234375, 11.271240234375, 11.8184814453125, 12.36572265625, 12.9129638671875, 13.460205078125, 14.0074462890625, 14.5546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 16.0, 10.0, 29.0, 40.0, 58.0, 79.0, 116.0, 171.0, 280.0, 432.0, 653.0, 719.0, 492.0, 316.0, 200.0, 151.0, 94.0, 64.0, 47.0, 38.0, 17.0, 13.0, 14.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.078125, -28.335693359375, -27.59326171875, -26.850830078125, -26.1083984375, -25.365966796875, -24.62353515625, -23.881103515625, -23.138671875, -22.396240234375, -21.65380859375, -20.911376953125, -20.1689453125, -19.426513671875, -18.68408203125, -17.941650390625, -17.19921875, -16.456787109375, -15.71435546875, -14.971923828125, -14.2294921875, -13.487060546875, -12.74462890625, -12.002197265625, -11.259765625, -10.517333984375, -9.77490234375, -9.032470703125, -8.2900390625, -7.547607421875, -6.80517578125, -6.062744140625, -5.3203125, -4.577880859375, -3.83544921875, -3.093017578125, -2.3505859375, -1.608154296875, -0.86572265625, -0.123291015625, 0.619140625, 1.361572265625, 2.10400390625, 2.846435546875, 3.5888671875, 4.331298828125, 5.07373046875, 5.816162109375, 6.55859375, 7.301025390625, 8.04345703125, 8.785888671875, 9.5283203125, 10.270751953125, 11.01318359375, 11.755615234375, 12.498046875, 13.240478515625, 13.98291015625, 14.725341796875, 15.4677734375, 16.210205078125, 16.95263671875, 17.695068359375, 18.4375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 9.0, 18.0, 29.0, 28.0, 60.0, 76.0, 113.0, 180.0, 260.0, 464.0, 1192.0, 26659.0, 4112762.0, 49792.0, 1364.0, 474.0, 257.0, 162.0, 101.0, 82.0, 48.0, 43.0, 25.0, 22.0, 10.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.0625, -50.8095703125, -48.556640625, -46.3037109375, -44.05078125, -41.7978515625, -39.544921875, -37.2919921875, -35.0390625, -32.7861328125, -30.533203125, -28.2802734375, -26.02734375, -23.7744140625, -21.521484375, -19.2685546875, -17.015625, -14.7626953125, -12.509765625, -10.2568359375, -8.00390625, -5.7509765625, -3.498046875, -1.2451171875, 1.0078125, 3.2607421875, 5.513671875, 7.7666015625, 10.01953125, 12.2724609375, 14.525390625, 16.7783203125, 19.03125, 21.2841796875, 23.537109375, 25.7900390625, 28.04296875, 30.2958984375, 32.548828125, 34.8017578125, 37.0546875, 39.3076171875, 41.560546875, 43.8134765625, 46.06640625, 48.3193359375, 50.572265625, 52.8251953125, 55.078125, 57.3310546875, 59.583984375, 61.8369140625, 64.08984375, 66.3427734375, 68.595703125, 70.8486328125, 73.1015625, 75.3544921875, 77.607421875, 79.8603515625, 82.11328125, 84.3662109375, 86.619140625, 88.8720703125, 91.125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 92.0, 707.0, 211.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-588.1069946289062, -577.901123046875, -567.6953125, -557.4894409179688, -547.2836303710938, -537.0777587890625, -526.8719482421875, -516.6660766601562, -506.46026611328125, -496.2544250488281, -486.048583984375, -475.8427429199219, -465.63690185546875, -455.4310607910156, -445.2252197265625, -435.01934814453125, -424.8135070800781, -414.607666015625, -404.4018249511719, -394.19598388671875, -383.9901428222656, -373.7843017578125, -363.5784606933594, -353.37261962890625, -343.166748046875, -332.9609069824219, -322.75506591796875, -312.5492248535156, -302.3433837890625, -292.1375427246094, -281.93170166015625, -271.725830078125, -261.52001953125, -251.31417846679688, -241.10833740234375, -230.90249633789062, -220.6966552734375, -210.49081420898438, -200.2849578857422, -190.07911682128906, -179.873291015625, -169.66744995117188, -159.46160888671875, -149.25576782226562, -139.0499267578125, -128.84408569335938, -118.63822937011719, -108.43238830566406, -98.2265396118164, -88.02069854736328, -77.81484985351562, -67.6090087890625, -57.403167724609375, -47.19732666015625, -36.99148178100586, -26.78563690185547, -16.579795837402344, -6.373952865600586, 3.831890106201172, 14.03773307800293, 24.243576049804688, 34.44941711425781, 44.6552619934082, 54.861106872558594, 65.06694793701172]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 10.0, 3.0, 11.0, 8.0, 18.0, 12.0, 17.0, 26.0, 25.0, 21.0, 21.0, 30.0, 23.0, 40.0, 31.0, 27.0, 39.0, 46.0, 38.0, 45.0, 23.0, 46.0, 40.0, 34.0, 38.0, 27.0, 29.0, 35.0, 29.0, 24.0, 30.0, 26.0, 24.0, 23.0, 16.0, 8.0, 9.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.29388427734375, -52.568817138671875, -50.84375, -49.118682861328125, -47.39361572265625, -45.668548583984375, -43.9434814453125, -42.218414306640625, -40.49334716796875, -38.768280029296875, -37.043212890625, -35.318145751953125, -33.59307861328125, -31.868011474609375, -30.1429443359375, -28.417877197265625, -26.692811965942383, -24.967744827270508, -23.242677688598633, -21.517610549926758, -19.792543411254883, -18.06747817993164, -16.342411041259766, -14.617342948913574, -12.8922758102417, -11.167208671569824, -9.44214153289795, -7.717074871063232, -5.992007732391357, -4.266941070556641, -2.5418739318847656, -0.8168067932128906, 0.9082603454589844, 2.6333274841308594, 4.358394622802734, 6.083461284637451, 7.808528423309326, 9.533595085144043, 11.258662223815918, 12.983729362487793, 14.708796501159668, 16.433862686157227, 18.1589298248291, 19.883996963500977, 21.60906410217285, 23.334131240844727, 25.0591983795166, 26.784265518188477, 28.50933265686035, 30.234399795532227, 31.9594669342041, 33.684532165527344, 35.40959930419922, 37.134666442871094, 38.85973358154297, 40.584800720214844, 42.30986785888672, 44.034934997558594, 45.76000213623047, 47.485069274902344, 49.21013641357422, 50.935203552246094, 52.66027069091797, 54.385337829589844, 56.11040496826172]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 12.0, 8.0, 8.0, 14.0, 14.0, 10.0, 18.0, 21.0, 32.0, 27.0, 32.0, 32.0, 24.0, 36.0, 51.0, 29.0, 48.0, 37.0, 51.0, 43.0, 51.0, 49.0, 44.0, 49.0, 36.0, 34.0, 21.0, 31.0, 31.0, 20.0, 15.0, 11.0, 9.0, 8.0, 9.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2265625, -5.06439208984375, -4.9022216796875, -4.74005126953125, -4.577880859375, -4.41571044921875, -4.2535400390625, -4.09136962890625, -3.92919921875, -3.76702880859375, -3.6048583984375, -3.44268798828125, -3.280517578125, -3.11834716796875, -2.9561767578125, -2.79400634765625, -2.6318359375, -2.46966552734375, -2.3074951171875, -2.14532470703125, -1.983154296875, -1.82098388671875, -1.6588134765625, -1.49664306640625, -1.33447265625, -1.17230224609375, -1.0101318359375, -0.84796142578125, -0.685791015625, -0.52362060546875, -0.3614501953125, -0.19927978515625, -0.037109375, 0.12506103515625, 0.2872314453125, 0.44940185546875, 0.611572265625, 0.77374267578125, 0.9359130859375, 1.09808349609375, 1.26025390625, 1.42242431640625, 1.5845947265625, 1.74676513671875, 1.908935546875, 2.07110595703125, 2.2332763671875, 2.39544677734375, 2.5576171875, 2.71978759765625, 2.8819580078125, 3.04412841796875, 3.206298828125, 3.36846923828125, 3.5306396484375, 3.69281005859375, 3.85498046875, 4.01715087890625, 4.1793212890625, 4.34149169921875, 4.503662109375, 4.66583251953125, 4.8280029296875, 4.99017333984375, 5.15234375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 6.0, 10.0, 9.0, 18.0, 23.0, 32.0, 37.0, 52.0, 71.0, 101.0, 157.0, 256.0, 374.0, 472.0, 721.0, 1083.0, 1570.0, 2366.0, 3531.0, 5383.0, 8465.0, 13279.0, 21158.0, 33813.0, 57093.0, 98510.0, 172252.0, 244687.0, 156638.0, 88838.0, 51828.0, 31164.0, 19382.0, 12223.0, 7711.0, 4995.0, 3338.0, 2260.0, 1439.0, 1019.0, 713.0, 431.0, 324.0, 216.0, 150.0, 118.0, 73.0, 57.0, 40.0, 23.0, 15.0, 15.0, 10.0, 8.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.76806640625, -0.7436141967773438, -0.7191619873046875, -0.6947097778320312, -0.670257568359375, -0.6458053588867188, -0.6213531494140625, -0.5969009399414062, -0.57244873046875, -0.5479965209960938, -0.5235443115234375, -0.49909210205078125, -0.474639892578125, -0.45018768310546875, -0.4257354736328125, -0.40128326416015625, -0.3768310546875, -0.35237884521484375, -0.3279266357421875, -0.30347442626953125, -0.279022216796875, -0.25457000732421875, -0.2301177978515625, -0.20566558837890625, -0.18121337890625, -0.15676116943359375, -0.1323089599609375, -0.10785675048828125, -0.083404541015625, -0.05895233154296875, -0.0345001220703125, -0.01004791259765625, 0.014404296875, 0.03885650634765625, 0.0633087158203125, 0.08776092529296875, 0.112213134765625, 0.13666534423828125, 0.1611175537109375, 0.18556976318359375, 0.21002197265625, 0.23447418212890625, 0.2589263916015625, 0.28337860107421875, 0.307830810546875, 0.33228302001953125, 0.3567352294921875, 0.38118743896484375, 0.4056396484375, 0.43009185791015625, 0.4545440673828125, 0.47899627685546875, 0.503448486328125, 0.5279006958007812, 0.5523529052734375, 0.5768051147460938, 0.60125732421875, 0.6257095336914062, 0.6501617431640625, 0.6746139526367188, 0.699066162109375, 0.7235183715820312, 0.7479705810546875, 0.7724227905273438, 0.796875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 4.0, 5.0, 7.0, 11.0, 8.0, 12.0, 9.0, 16.0, 14.0, 23.0, 16.0, 21.0, 19.0, 28.0, 39.0, 21.0, 43.0, 45.0, 35.0, 42.0, 45.0, 1061.0, 42.0, 40.0, 37.0, 43.0, 37.0, 26.0, 32.0, 37.0, 23.0, 25.0, 22.0, 18.0, 15.0, 15.0, 13.0, 12.0, 13.0, 8.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.84765625, -2.75567626953125, -2.6636962890625, -2.57171630859375, -2.479736328125, -2.38775634765625, -2.2957763671875, -2.20379638671875, -2.11181640625, -2.01983642578125, -1.9278564453125, -1.83587646484375, -1.743896484375, -1.65191650390625, -1.5599365234375, -1.46795654296875, -1.3759765625, -1.28399658203125, -1.1920166015625, -1.10003662109375, -1.008056640625, -0.91607666015625, -0.8240966796875, -0.73211669921875, -0.64013671875, -0.54815673828125, -0.4561767578125, -0.36419677734375, -0.272216796875, -0.18023681640625, -0.0882568359375, 0.00372314453125, 0.095703125, 0.18768310546875, 0.2796630859375, 0.37164306640625, 0.463623046875, 0.55560302734375, 0.6475830078125, 0.73956298828125, 0.83154296875, 0.92352294921875, 1.0155029296875, 1.10748291015625, 1.199462890625, 1.29144287109375, 1.3834228515625, 1.47540283203125, 1.5673828125, 1.65936279296875, 1.7513427734375, 1.84332275390625, 1.935302734375, 2.02728271484375, 2.1192626953125, 2.21124267578125, 2.30322265625, 2.39520263671875, 2.4871826171875, 2.57916259765625, 2.671142578125, 2.76312255859375, 2.8551025390625, 2.94708251953125, 3.0390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 14.0, 15.0, 27.0, 47.0, 51.0, 112.0, 159.0, 238.0, 316.0, 522.0, 685.0, 997.0, 1476.0, 2131.0, 3245.0, 4675.0, 6797.0, 10387.0, 15530.0, 24333.0, 38678.0, 63029.0, 107734.0, 196292.0, 1284523.0, 131346.0, 75151.0, 45761.0, 28333.0, 18164.0, 11986.0, 7670.0, 5207.0, 3625.0, 2516.0, 1689.0, 1136.0, 815.0, 550.0, 364.0, 267.0, 161.0, 123.0, 84.0, 53.0, 38.0, 25.0, 18.0, 11.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6675491333007812, -0.6461334228515625, -0.6247177124023438, -0.603302001953125, -0.5818862915039062, -0.5604705810546875, -0.5390548706054688, -0.51763916015625, -0.49622344970703125, -0.4748077392578125, -0.45339202880859375, -0.431976318359375, -0.41056060791015625, -0.3891448974609375, -0.36772918701171875, -0.3463134765625, -0.32489776611328125, -0.3034820556640625, -0.28206634521484375, -0.260650634765625, -0.23923492431640625, -0.2178192138671875, -0.19640350341796875, -0.17498779296875, -0.15357208251953125, -0.1321563720703125, -0.11074066162109375, -0.089324951171875, -0.06790924072265625, -0.0464935302734375, -0.02507781982421875, -0.003662109375, 0.01775360107421875, 0.0391693115234375, 0.06058502197265625, 0.082000732421875, 0.10341644287109375, 0.1248321533203125, 0.14624786376953125, 0.16766357421875, 0.18907928466796875, 0.2104949951171875, 0.23191070556640625, 0.253326416015625, 0.27474212646484375, 0.2961578369140625, 0.31757354736328125, 0.3389892578125, 0.36040496826171875, 0.3818206787109375, 0.40323638916015625, 0.424652099609375, 0.44606781005859375, 0.4674835205078125, 0.48889923095703125, 0.51031494140625, 0.5317306518554688, 0.5531463623046875, 0.5745620727539062, 0.595977783203125, 0.6173934936523438, 0.6388092041015625, 0.6602249145507812, 0.681640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 14.0, 19.0, 16.0, 15.0, 20.0, 19.0, 31.0, 36.0, 54.0, 44.0, 66.0, 67.0, 69.0, 74.0, 60.0, 64.0, 60.0, 45.0, 40.0, 39.0, 21.0, 22.0, 20.0, 15.0, 8.0, 9.0, 10.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005450248718261719, -0.0005289986729621887, -0.0005129724740982056, -0.0004969462752342224, -0.00048092007637023926, -0.0004648938775062561, -0.00044886767864227295, -0.0004328414797782898, -0.00041681528091430664, -0.0004007890820503235, -0.00038476288318634033, -0.0003687366843223572, -0.000352710485458374, -0.00033668428659439087, -0.0003206580877304077, -0.00030463188886642456, -0.0002886056900024414, -0.00027257949113845825, -0.0002565532922744751, -0.00024052709341049194, -0.0002245008945465088, -0.00020847469568252563, -0.00019244849681854248, -0.00017642229795455933, -0.00016039609909057617, -0.00014436990022659302, -0.00012834370136260986, -0.00011231750249862671, -9.629130363464355e-05, -8.02651047706604e-05, -6.423890590667725e-05, -4.821270704269409e-05, -3.218650817871094e-05, -1.6160309314727783e-05, -1.341104507446289e-07, 1.5892088413238525e-05, 3.191828727722168e-05, 4.7944486141204834e-05, 6.397068500518799e-05, 7.999688386917114e-05, 9.60230827331543e-05, 0.00011204928159713745, 0.0001280754804611206, 0.00014410167932510376, 0.00016012787818908691, 0.00017615407705307007, 0.00019218027591705322, 0.00020820647478103638, 0.00022423267364501953, 0.00024025887250900269, 0.00025628507137298584, 0.000272311270236969, 0.00028833746910095215, 0.0003043636679649353, 0.00032038986682891846, 0.0003364160656929016, 0.00035244226455688477, 0.0003684684634208679, 0.0003844946622848511, 0.00040052086114883423, 0.0004165470600128174, 0.00043257325887680054, 0.0004485994577407837, 0.00046462565660476685, 0.00048065185546875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 4.0, 6.0, 7.0, 8.0, 13.0, 7.0, 17.0, 17.0, 21.0, 27.0, 30.0, 65.0, 88.0, 146.0, 205.0, 363.0, 1037.0, 1037134.0, 8085.0, 515.0, 269.0, 138.0, 94.0, 69.0, 45.0, 31.0, 20.0, 21.0, 11.0, 18.0, 9.0, 12.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0130615234375, -0.012662410736083984, -0.012263298034667969, -0.011864185333251953, -0.011465072631835938, -0.011065959930419922, -0.010666847229003906, -0.01026773452758789, -0.009868621826171875, -0.00946950912475586, -0.009070396423339844, -0.008671283721923828, -0.008272171020507812, -0.007873058319091797, -0.007473945617675781, -0.007074832916259766, -0.00667572021484375, -0.006276607513427734, -0.005877494812011719, -0.005478382110595703, -0.0050792694091796875, -0.004680156707763672, -0.004281044006347656, -0.0038819313049316406, -0.003482818603515625, -0.0030837059020996094, -0.0026845932006835938, -0.002285480499267578, -0.0018863677978515625, -0.0014872550964355469, -0.0010881423950195312, -0.0006890296936035156, -0.0002899169921875, 0.00010919570922851562, 0.0005083084106445312, 0.0009074211120605469, 0.0013065338134765625, 0.0017056465148925781, 0.0021047592163085938, 0.0025038719177246094, 0.002902984619140625, 0.0033020973205566406, 0.0037012100219726562, 0.004100322723388672, 0.0044994354248046875, 0.004898548126220703, 0.005297660827636719, 0.005696773529052734, 0.00609588623046875, 0.006494998931884766, 0.006894111633300781, 0.007293224334716797, 0.0076923370361328125, 0.008091449737548828, 0.008490562438964844, 0.00888967514038086, 0.009288787841796875, 0.00968790054321289, 0.010087013244628906, 0.010486125946044922, 0.010885238647460938, 0.011284351348876953, 0.011683464050292969, 0.012082576751708984, 0.012481689453125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 116.0, 707.0, 182.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023232121020555496, -0.002281415509060025, -0.0022396191488951445, -0.00219782255589962, -0.0021560261957347393, -0.002114229602739215, -0.0020724330097436905, -0.0020306366495788097, -0.0019888400565832853, -0.0019470435800030828, -0.0019052471034228802, -0.0018634505104273558, -0.0018216540338471532, -0.0017798575572669506, -0.0017380609642714262, -0.0016962644876912236, -0.001654468011111021, -0.0016126715345308185, -0.0015708750579506159, -0.0015290784649550915, -0.001487281988374889, -0.0014454855117946863, -0.001403688918799162, -0.0013618924422189593, -0.0013200959656387568, -0.0012782994890585542, -0.0012365030124783516, -0.0011947064194828272, -0.0011529099429026246, -0.001111113466322422, -0.0010693168733268976, -0.001027520396746695, -0.0009857239201664925, -0.0009439274435862899, -0.0009021309087984264, -0.0008603343740105629, -0.0008185378974303603, -0.0007767414208501577, -0.0007349448860622942, -0.0006931483512744308, -0.0006513518746942282, -0.0006095553981140256, -0.0005677588633261621, -0.0005259623285382986, -0.00048416585195809603, -0.000442369346274063, -0.00040057284059002995, -0.0003587763349059969, -0.0003169798292219639, -0.00027518332353793085, -0.0002333868178538978, -0.00019159031216986477, -0.00014979380648583174, -0.0001079973008017987, -6.620079511776567e-05, -2.440428943373263e-05, 1.7392216250300407e-05, 5.9188721934333444e-05, 0.00010098522761836648, 0.00014278173330239952, 0.00018457823898643255, 0.0002263747446704656, 0.0002681712503544986, 0.00030996775603853166, 0.0003517642617225647]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 8.0, 3.0, 6.0, 13.0, 12.0, 19.0, 19.0, 23.0, 19.0, 25.0, 34.0, 32.0, 33.0, 34.0, 31.0, 47.0, 50.0, 40.0, 36.0, 47.0, 47.0, 46.0, 28.0, 35.0, 34.0, 29.0, 32.0, 40.0, 23.0, 18.0, 16.0, 23.0, 17.0, 14.0, 11.0, 16.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00025641918182373047, -0.00024845823645591736, -0.00024049729108810425, -0.00023253634572029114, -0.00022457540035247803, -0.00021661445498466492, -0.0002086535096168518, -0.0002006925642490387, -0.00019273161888122559, -0.00018477067351341248, -0.00017680972814559937, -0.00016884878277778625, -0.00016088783740997314, -0.00015292689204216003, -0.00014496594667434692, -0.0001370050013065338, -0.0001290440559387207, -0.00012108311057090759, -0.00011312216520309448, -0.00010516121983528137, -9.720027446746826e-05, -8.923932909965515e-05, -8.127838373184204e-05, -7.331743836402893e-05, -6.535649299621582e-05, -5.739554762840271e-05, -4.94346022605896e-05, -4.147365689277649e-05, -3.351271152496338e-05, -2.555176615715027e-05, -1.7590820789337158e-05, -9.629875421524048e-06, -1.6689300537109375e-06, 6.292015314102173e-06, 1.4252960681915283e-05, 2.2213906049728394e-05, 3.0174851417541504e-05, 3.8135796785354614e-05, 4.6096742153167725e-05, 5.4057687520980835e-05, 6.201863288879395e-05, 6.997957825660706e-05, 7.794052362442017e-05, 8.590146899223328e-05, 9.386241436004639e-05, 0.0001018233597278595, 0.00010978430509567261, 0.00011774525046348572, 0.00012570619583129883, 0.00013366714119911194, 0.00014162808656692505, 0.00014958903193473816, 0.00015754997730255127, 0.00016551092267036438, 0.0001734718680381775, 0.0001814328134059906, 0.0001893937587738037, 0.00019735470414161682, 0.00020531564950942993, 0.00021327659487724304, 0.00022123754024505615, 0.00022919848561286926, 0.00023715943098068237, 0.0002451203763484955, 0.0002530813217163086]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 12.0, 8.0, 8.0, 14.0, 14.0, 10.0, 18.0, 21.0, 32.0, 27.0, 32.0, 32.0, 24.0, 36.0, 51.0, 29.0, 48.0, 37.0, 51.0, 43.0, 51.0, 49.0, 44.0, 49.0, 36.0, 34.0, 21.0, 31.0, 31.0, 20.0, 15.0, 11.0, 9.0, 8.0, 9.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2265625, -5.06439208984375, -4.9022216796875, -4.74005126953125, -4.577880859375, -4.41571044921875, -4.2535400390625, -4.09136962890625, -3.92919921875, -3.76702880859375, -3.6048583984375, -3.44268798828125, -3.280517578125, -3.11834716796875, -2.9561767578125, -2.79400634765625, -2.6318359375, -2.46966552734375, -2.3074951171875, -2.14532470703125, -1.983154296875, -1.82098388671875, -1.6588134765625, -1.49664306640625, -1.33447265625, -1.17230224609375, -1.0101318359375, -0.84796142578125, -0.685791015625, -0.52362060546875, -0.3614501953125, -0.19927978515625, -0.037109375, 0.12506103515625, 0.2872314453125, 0.44940185546875, 0.611572265625, 0.77374267578125, 0.9359130859375, 1.09808349609375, 1.26025390625, 1.42242431640625, 1.5845947265625, 1.74676513671875, 1.908935546875, 2.07110595703125, 2.2332763671875, 2.39544677734375, 2.5576171875, 2.71978759765625, 2.8819580078125, 3.04412841796875, 3.206298828125, 3.36846923828125, 3.5306396484375, 3.69281005859375, 3.85498046875, 4.01715087890625, 4.1793212890625, 4.34149169921875, 4.503662109375, 4.66583251953125, 4.8280029296875, 4.99017333984375, 5.15234375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 11.0, 14.0, 11.0, 10.0, 17.0, 28.0, 36.0, 59.0, 78.0, 91.0, 143.0, 215.0, 318.0, 503.0, 735.0, 1192.0, 2123.0, 3845.0, 7421.0, 15796.0, 37459.0, 99707.0, 328021.0, 364664.0, 110647.0, 40395.0, 17154.0, 8054.0, 4065.0, 2126.0, 1272.0, 815.0, 472.0, 328.0, 219.0, 161.0, 112.0, 64.0, 40.0, 37.0, 26.0, 21.0, 16.0, 11.0, 9.0, 5.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.48828125, -3.379425048828125, -3.27056884765625, -3.161712646484375, -3.0528564453125, -2.944000244140625, -2.83514404296875, -2.726287841796875, -2.617431640625, -2.508575439453125, -2.39971923828125, -2.290863037109375, -2.1820068359375, -2.073150634765625, -1.96429443359375, -1.855438232421875, -1.74658203125, -1.637725830078125, -1.52886962890625, -1.420013427734375, -1.3111572265625, -1.202301025390625, -1.09344482421875, -0.984588623046875, -0.875732421875, -0.766876220703125, -0.65802001953125, -0.549163818359375, -0.4403076171875, -0.331451416015625, -0.22259521484375, -0.113739013671875, -0.0048828125, 0.103973388671875, 0.21282958984375, 0.321685791015625, 0.4305419921875, 0.539398193359375, 0.64825439453125, 0.757110595703125, 0.865966796875, 0.974822998046875, 1.08367919921875, 1.192535400390625, 1.3013916015625, 1.410247802734375, 1.51910400390625, 1.627960205078125, 1.73681640625, 1.845672607421875, 1.95452880859375, 2.063385009765625, 2.1722412109375, 2.281097412109375, 2.38995361328125, 2.498809814453125, 2.607666015625, 2.716522216796875, 2.82537841796875, 2.934234619140625, 3.0430908203125, 3.151947021484375, 3.26080322265625, 3.369659423828125, 3.478515625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 4.0, 12.0, 11.0, 10.0, 17.0, 19.0, 16.0, 31.0, 36.0, 32.0, 32.0, 39.0, 42.0, 46.0, 57.0, 61.0, 223.0, 1786.0, 103.0, 57.0, 64.0, 44.0, 41.0, 47.0, 35.0, 30.0, 16.0, 28.0, 15.0, 16.0, 16.0, 9.0, 13.0, 9.0, 3.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -16.998291015625, -16.41845703125, -15.838623046875, -15.2587890625, -14.678955078125, -14.09912109375, -13.519287109375, -12.939453125, -12.359619140625, -11.77978515625, -11.199951171875, -10.6201171875, -10.040283203125, -9.46044921875, -8.880615234375, -8.30078125, -7.720947265625, -7.14111328125, -6.561279296875, -5.9814453125, -5.401611328125, -4.82177734375, -4.241943359375, -3.662109375, -3.082275390625, -2.50244140625, -1.922607421875, -1.3427734375, -0.762939453125, -0.18310546875, 0.396728515625, 0.9765625, 1.556396484375, 2.13623046875, 2.716064453125, 3.2958984375, 3.875732421875, 4.45556640625, 5.035400390625, 5.615234375, 6.195068359375, 6.77490234375, 7.354736328125, 7.9345703125, 8.514404296875, 9.09423828125, 9.674072265625, 10.25390625, 10.833740234375, 11.41357421875, 11.993408203125, 12.5732421875, 13.153076171875, 13.73291015625, 14.312744140625, 14.892578125, 15.472412109375, 16.05224609375, 16.632080078125, 17.2119140625, 17.791748046875, 18.37158203125, 18.951416015625, 19.53125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 10.0, 5.0, 15.0, 11.0, 11.0, 21.0, 21.0, 32.0, 30.0, 31.0, 64.0, 77.0, 109.0, 202.0, 386.0, 1099.0, 12272.0, 3060969.0, 67103.0, 1903.0, 560.0, 223.0, 145.0, 97.0, 61.0, 57.0, 39.0, 28.0, 24.0, 21.0, 18.0, 11.0, 10.0, 9.0, 5.0, 9.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.4375, -32.444580078125, -31.45166015625, -30.458740234375, -29.4658203125, -28.472900390625, -27.47998046875, -26.487060546875, -25.494140625, -24.501220703125, -23.50830078125, -22.515380859375, -21.5224609375, -20.529541015625, -19.53662109375, -18.543701171875, -17.55078125, -16.557861328125, -15.56494140625, -14.572021484375, -13.5791015625, -12.586181640625, -11.59326171875, -10.600341796875, -9.607421875, -8.614501953125, -7.62158203125, -6.628662109375, -5.6357421875, -4.642822265625, -3.64990234375, -2.656982421875, -1.6640625, -0.671142578125, 0.32177734375, 1.314697265625, 2.3076171875, 3.300537109375, 4.29345703125, 5.286376953125, 6.279296875, 7.272216796875, 8.26513671875, 9.258056640625, 10.2509765625, 11.243896484375, 12.23681640625, 13.229736328125, 14.22265625, 15.215576171875, 16.20849609375, 17.201416015625, 18.1943359375, 19.187255859375, 20.18017578125, 21.173095703125, 22.166015625, 23.158935546875, 24.15185546875, 25.144775390625, 26.1376953125, 27.130615234375, 28.12353515625, 29.116455078125, 30.109375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 14.0, 45.0, 127.0, 252.0, 296.0, 175.0, 63.0, 25.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61174201965332, -8.57434368133545, -7.536944389343262, -6.499546051025391, -5.462147235870361, -4.424748420715332, -3.387350082397461, -2.3499512672424316, -1.3125524520874023, -0.2751537561416626, 0.7622449398040771, 1.7996435165405273, 2.8370423316955566, 3.874441146850586, 4.911839485168457, 5.949238300323486, 6.986637115478516, 8.024035453796387, 9.061434745788574, 10.098833084106445, 11.136232376098633, 12.173630714416504, 13.211029052734375, 14.248428344726562, 15.285826683044434, 16.323225021362305, 17.360624313354492, 18.398021697998047, 19.435420989990234, 20.472820281982422, 21.51021957397461, 22.547616958618164, 23.58501434326172, 24.622413635253906, 25.65981101989746, 26.69721031188965, 27.734609603881836, 28.77200698852539, 29.809406280517578, 30.846805572509766, 31.884204864501953, 32.92160415649414, 33.95900344848633, 34.99639892578125, 36.03379821777344, 37.071197509765625, 38.10859680175781, 39.14599609375, 40.18339538574219, 41.220794677734375, 42.25819396972656, 43.29559326171875, 44.33298873901367, 45.37038803100586, 46.40778732299805, 47.445186614990234, 48.482582092285156, 49.519981384277344, 50.55738067626953, 51.59477996826172, 52.63217544555664, 53.66957473754883, 54.706974029541016, 55.7443733215332, 56.78177261352539]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 8.0, 5.0, 7.0, 6.0, 7.0, 3.0, 11.0, 8.0, 14.0, 14.0, 16.0, 25.0, 33.0, 28.0, 42.0, 40.0, 46.0, 44.0, 57.0, 44.0, 52.0, 38.0, 55.0, 36.0, 47.0, 33.0, 28.0, 36.0, 28.0, 35.0, 20.0, 24.0, 17.0, 17.0, 16.0, 15.0, 15.0, 9.0, 11.0, 6.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.94017028808594, -54.101715087890625, -52.26325988769531, -50.4248046875, -48.58634948730469, -46.747894287109375, -44.90943908691406, -43.07098388671875, -41.23252868652344, -39.394073486328125, -37.55561828613281, -35.7171630859375, -33.87870788574219, -32.040252685546875, -30.201799392700195, -28.363344192504883, -26.524890899658203, -24.68643569946289, -22.847980499267578, -21.009525299072266, -19.171070098876953, -17.33261489868164, -15.494161605834961, -13.655706405639648, -11.817251205444336, -9.978796005249023, -8.140340805053711, -6.301886558532715, -4.463431358337402, -2.62497615814209, -0.7865219116210938, 1.0519332885742188, 2.8903884887695312, 4.728843688964844, 6.567298412322998, 8.405753135681152, 10.244208335876465, 12.082663536071777, 13.921117782592773, 15.759572982788086, 17.5980281829834, 19.43648338317871, 21.274938583374023, 23.113391876220703, 24.951847076416016, 26.790302276611328, 28.62875747680664, 30.467212677001953, 32.305667877197266, 34.14412307739258, 35.98257827758789, 37.8210334777832, 39.659488677978516, 41.49794387817383, 43.336395263671875, 45.17485046386719, 47.0133056640625, 48.85176086425781, 50.690216064453125, 52.52867126464844, 54.36712646484375, 56.20558166503906, 58.044036865234375, 59.88249206542969, 61.720947265625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 8.0, 4.0, 11.0, 5.0, 10.0, 14.0, 12.0, 13.0, 12.0, 30.0, 22.0, 29.0, 29.0, 28.0, 32.0, 36.0, 43.0, 45.0, 30.0, 47.0, 45.0, 46.0, 49.0, 55.0, 45.0, 44.0, 35.0, 32.0, 27.0, 30.0, 26.0, 19.0, 28.0, 6.0, 10.0, 10.0, 6.0, 11.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.22265625, -5.05645751953125, -4.8902587890625, -4.72406005859375, -4.557861328125, -4.39166259765625, -4.2254638671875, -4.05926513671875, -3.89306640625, -3.72686767578125, -3.5606689453125, -3.39447021484375, -3.228271484375, -3.06207275390625, -2.8958740234375, -2.72967529296875, -2.5634765625, -2.39727783203125, -2.2310791015625, -2.06488037109375, -1.898681640625, -1.73248291015625, -1.5662841796875, -1.40008544921875, -1.23388671875, -1.06768798828125, -0.9014892578125, -0.73529052734375, -0.569091796875, -0.40289306640625, -0.2366943359375, -0.07049560546875, 0.095703125, 0.26190185546875, 0.4281005859375, 0.59429931640625, 0.760498046875, 0.92669677734375, 1.0928955078125, 1.25909423828125, 1.42529296875, 1.59149169921875, 1.7576904296875, 1.92388916015625, 2.090087890625, 2.25628662109375, 2.4224853515625, 2.58868408203125, 2.7548828125, 2.92108154296875, 3.0872802734375, 3.25347900390625, 3.419677734375, 3.58587646484375, 3.7520751953125, 3.91827392578125, 4.08447265625, 4.25067138671875, 4.4168701171875, 4.58306884765625, 4.749267578125, 4.91546630859375, 5.0816650390625, 5.24786376953125, 5.4140625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 10.0, 11.0, 9.0, 14.0, 14.0, 20.0, 19.0, 22.0, 18.0, 30.0, 24.0, 23.0, 31.0, 28.0, 58.0, 116.0, 824.0, 17305.0, 3149680.0, 1019371.0, 5782.0, 439.0, 90.0, 49.0, 39.0, 29.0, 28.0, 30.0, 19.0, 27.0, 23.0, 18.0, 13.0, 8.0, 15.0, 12.0, 11.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.953125, -28.949951171875, -27.94677734375, -26.943603515625, -25.9404296875, -24.937255859375, -23.93408203125, -22.930908203125, -21.927734375, -20.924560546875, -19.92138671875, -18.918212890625, -17.9150390625, -16.911865234375, -15.90869140625, -14.905517578125, -13.90234375, -12.899169921875, -11.89599609375, -10.892822265625, -9.8896484375, -8.886474609375, -7.88330078125, -6.880126953125, -5.876953125, -4.873779296875, -3.87060546875, -2.867431640625, -1.8642578125, -0.861083984375, 0.14208984375, 1.145263671875, 2.1484375, 3.151611328125, 4.15478515625, 5.157958984375, 6.1611328125, 7.164306640625, 8.16748046875, 9.170654296875, 10.173828125, 11.177001953125, 12.18017578125, 13.183349609375, 14.1865234375, 15.189697265625, 16.19287109375, 17.196044921875, 18.19921875, 19.202392578125, 20.20556640625, 21.208740234375, 22.2119140625, 23.215087890625, 24.21826171875, 25.221435546875, 26.224609375, 27.227783203125, 28.23095703125, 29.234130859375, 30.2373046875, 31.240478515625, 32.24365234375, 33.246826171875, 34.25]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 8.0, 17.0, 16.0, 37.0, 41.0, 79.0, 83.0, 151.0, 234.0, 338.0, 570.0, 741.0, 611.0, 402.0, 249.0, 159.0, 114.0, 79.0, 46.0, 28.0, 24.0, 13.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.546875, -26.8680419921875, -26.189208984375, -25.5103759765625, -24.83154296875, -24.1527099609375, -23.473876953125, -22.7950439453125, -22.1162109375, -21.4373779296875, -20.758544921875, -20.0797119140625, -19.40087890625, -18.7220458984375, -18.043212890625, -17.3643798828125, -16.685546875, -16.0067138671875, -15.327880859375, -14.6490478515625, -13.97021484375, -13.2913818359375, -12.612548828125, -11.9337158203125, -11.2548828125, -10.5760498046875, -9.897216796875, -9.2183837890625, -8.53955078125, -7.8607177734375, -7.181884765625, -6.5030517578125, -5.82421875, -5.1453857421875, -4.466552734375, -3.7877197265625, -3.10888671875, -2.4300537109375, -1.751220703125, -1.0723876953125, -0.3935546875, 0.2852783203125, 0.964111328125, 1.6429443359375, 2.32177734375, 3.0006103515625, 3.679443359375, 4.3582763671875, 5.037109375, 5.7159423828125, 6.394775390625, 7.0736083984375, 7.75244140625, 8.4312744140625, 9.110107421875, 9.7889404296875, 10.4677734375, 11.1466064453125, 11.825439453125, 12.5042724609375, 13.18310546875, 13.8619384765625, 14.540771484375, 15.2196044921875, 15.8984375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 13.0, 19.0, 33.0, 43.0, 77.0, 123.0, 213.0, 334.0, 795.0, 11502.0, 4165605.0, 13949.0, 714.0, 350.0, 193.0, 121.0, 69.0, 49.0, 27.0, 9.0, 12.0, 5.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.1875, -68.9814453125, -65.775390625, -62.5693359375, -59.36328125, -56.1572265625, -52.951171875, -49.7451171875, -46.5390625, -43.3330078125, -40.126953125, -36.9208984375, -33.71484375, -30.5087890625, -27.302734375, -24.0966796875, -20.890625, -17.6845703125, -14.478515625, -11.2724609375, -8.06640625, -4.8603515625, -1.654296875, 1.5517578125, 4.7578125, 7.9638671875, 11.169921875, 14.3759765625, 17.58203125, 20.7880859375, 23.994140625, 27.2001953125, 30.40625, 33.6123046875, 36.818359375, 40.0244140625, 43.23046875, 46.4365234375, 49.642578125, 52.8486328125, 56.0546875, 59.2607421875, 62.466796875, 65.6728515625, 68.87890625, 72.0849609375, 75.291015625, 78.4970703125, 81.703125, 84.9091796875, 88.115234375, 91.3212890625, 94.52734375, 97.7333984375, 100.939453125, 104.1455078125, 107.3515625, 110.5576171875, 113.763671875, 116.9697265625, 120.17578125, 123.3818359375, 126.587890625, 129.7939453125, 133.0]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 62.0, 208.0, 377.0, 253.0, 84.0, 14.0, 6.0, 0.0, 2.0, 2.0], "bins": [-271.8650207519531, -267.0650634765625, -262.26507568359375, -257.4651184082031, -252.6651611328125, -247.86520385742188, -243.0652313232422, -238.2652587890625, -233.46530151367188, -228.66534423828125, -223.86537170410156, -219.06539916992188, -214.26544189453125, -209.46548461914062, -204.66551208496094, -199.86553955078125, -195.06558227539062, -190.265625, -185.4656524658203, -180.66567993164062, -175.86572265625, -171.06576538085938, -166.2657928466797, -161.4658203125, -156.66586303710938, -151.86590576171875, -147.06593322753906, -142.26596069335938, -137.46600341796875, -132.66604614257812, -127.86607360839844, -123.06610870361328, -118.26615905761719, -113.46619415283203, -108.66622924804688, -103.86626434326172, -99.06629943847656, -94.2663345336914, -89.46636962890625, -84.6664047241211, -79.86643981933594, -75.06647491455078, -70.26651000976562, -65.46654510498047, -60.66658020019531, -55.866615295410156, -51.066650390625, -46.266685485839844, -41.46672058105469, -36.66675567626953, -31.866790771484375, -27.06682586669922, -22.266860961914062, -17.466896057128906, -12.66693115234375, -7.866966247558594, -3.0670013427734375, 1.7329635620117188, 6.532928466796875, 11.332893371582031, 16.132858276367188, 20.932823181152344, 25.7327880859375, 30.532752990722656, 35.33271789550781]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 7.0, 2.0, 2.0, 8.0, 4.0, 8.0, 11.0, 5.0, 11.0, 10.0, 11.0, 21.0, 20.0, 19.0, 22.0, 26.0, 32.0, 25.0, 38.0, 48.0, 45.0, 51.0, 33.0, 48.0, 47.0, 39.0, 45.0, 40.0, 40.0, 39.0, 34.0, 35.0, 27.0, 25.0, 24.0, 13.0, 16.0, 15.0, 14.0, 9.0, 11.0, 13.0, 10.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.365203857421875, -43.54517364501953, -41.72513961791992, -39.90510940551758, -38.085079193115234, -36.265045166015625, -34.44501495361328, -32.62498474121094, -30.804954528808594, -28.984922409057617, -27.164892196655273, -25.344860076904297, -23.524829864501953, -21.704797744750977, -19.884765625, -18.064735412597656, -16.24470329284668, -14.42467212677002, -12.60464096069336, -10.784608840942383, -8.964578628540039, -7.1445465087890625, -5.324515342712402, -3.504484176635742, -1.684453010559082, 0.13557827472686768, 1.9556095600128174, 3.7756409645080566, 5.595672130584717, 7.415703773498535, 9.235734939575195, 11.055766105651855, 12.875797271728516, 14.695828437805176, 16.515859603881836, 18.335891723632812, 20.155921936035156, 21.975954055786133, 23.79598617553711, 25.616016387939453, 27.436046600341797, 29.256078720092773, 31.076108932495117, 32.896141052246094, 34.71617126464844, 36.53620147705078, 38.35623550415039, 40.176265716552734, 41.996299743652344, 43.81632995605469, 45.6363639831543, 47.45639419555664, 49.276424407958984, 51.096458435058594, 52.91648864746094, 54.73651885986328, 56.556549072265625, 58.37657928466797, 60.19661331176758, 62.01664352416992, 63.836673736572266, 65.65670776367188, 67.47673797607422, 69.29676818847656, 71.1167984008789]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 7.0, 9.0, 15.0, 7.0, 13.0, 18.0, 14.0, 22.0, 27.0, 28.0, 21.0, 27.0, 28.0, 33.0, 46.0, 42.0, 37.0, 51.0, 50.0, 41.0, 50.0, 44.0, 49.0, 45.0, 37.0, 29.0, 29.0, 30.0, 23.0, 12.0, 18.0, 18.0, 17.0, 9.0, 17.0, 10.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.12890625, -4.96002197265625, -4.7911376953125, -4.62225341796875, -4.453369140625, -4.28448486328125, -4.1156005859375, -3.94671630859375, -3.77783203125, -3.60894775390625, -3.4400634765625, -3.27117919921875, -3.102294921875, -2.93341064453125, -2.7645263671875, -2.59564208984375, -2.4267578125, -2.25787353515625, -2.0889892578125, -1.92010498046875, -1.751220703125, -1.58233642578125, -1.4134521484375, -1.24456787109375, -1.07568359375, -0.90679931640625, -0.7379150390625, -0.56903076171875, -0.400146484375, -0.23126220703125, -0.0623779296875, 0.10650634765625, 0.275390625, 0.44427490234375, 0.6131591796875, 0.78204345703125, 0.950927734375, 1.11981201171875, 1.2886962890625, 1.45758056640625, 1.62646484375, 1.79534912109375, 1.9642333984375, 2.13311767578125, 2.302001953125, 2.47088623046875, 2.6397705078125, 2.80865478515625, 2.9775390625, 3.14642333984375, 3.3153076171875, 3.48419189453125, 3.653076171875, 3.82196044921875, 3.9908447265625, 4.15972900390625, 4.32861328125, 4.49749755859375, 4.6663818359375, 4.83526611328125, 5.004150390625, 5.17303466796875, 5.3419189453125, 5.51080322265625, 5.6796875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 10.0, 24.0, 25.0, 53.0, 63.0, 90.0, 126.0, 195.0, 275.0, 451.0, 725.0, 1186.0, 1822.0, 2953.0, 4668.0, 7752.0, 12854.0, 20597.0, 34828.0, 60651.0, 110730.0, 211067.0, 261287.0, 137905.0, 72931.0, 41731.0, 24748.0, 14848.0, 9035.0, 5655.0, 3444.0, 2189.0, 1291.0, 860.0, 544.0, 290.0, 221.0, 130.0, 81.0, 85.0, 40.0, 29.0, 20.0, 15.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.85107421875, -0.8228607177734375, -0.794647216796875, -0.7664337158203125, -0.73822021484375, -0.7100067138671875, -0.681793212890625, -0.6535797119140625, -0.6253662109375, -0.5971527099609375, -0.568939208984375, -0.5407257080078125, -0.51251220703125, -0.4842987060546875, -0.456085205078125, -0.4278717041015625, -0.399658203125, -0.3714447021484375, -0.343231201171875, -0.3150177001953125, -0.28680419921875, -0.2585906982421875, -0.230377197265625, -0.2021636962890625, -0.1739501953125, -0.1457366943359375, -0.117523193359375, -0.0893096923828125, -0.06109619140625, -0.0328826904296875, -0.004669189453125, 0.0235443115234375, 0.0517578125, 0.0799713134765625, 0.108184814453125, 0.1363983154296875, 0.16461181640625, 0.1928253173828125, 0.221038818359375, 0.2492523193359375, 0.2774658203125, 0.3056793212890625, 0.333892822265625, 0.3621063232421875, 0.39031982421875, 0.4185333251953125, 0.446746826171875, 0.4749603271484375, 0.503173828125, 0.5313873291015625, 0.559600830078125, 0.5878143310546875, 0.61602783203125, 0.6442413330078125, 0.672454833984375, 0.7006683349609375, 0.7288818359375, 0.7570953369140625, 0.785308837890625, 0.8135223388671875, 0.84173583984375, 0.8699493408203125, 0.898162841796875, 0.9263763427734375, 0.95458984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 1.0, 3.0, 5.0, 9.0, 9.0, 14.0, 12.0, 16.0, 23.0, 21.0, 22.0, 28.0, 30.0, 20.0, 32.0, 41.0, 21.0, 37.0, 41.0, 33.0, 36.0, 1051.0, 41.0, 38.0, 43.0, 44.0, 37.0, 33.0, 32.0, 31.0, 32.0, 21.0, 26.0, 22.0, 19.0, 17.0, 14.0, 10.0, 7.0, 14.0, 10.0, 7.0, 2.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.375, -3.274688720703125, -3.17437744140625, -3.074066162109375, -2.9737548828125, -2.873443603515625, -2.77313232421875, -2.672821044921875, -2.572509765625, -2.472198486328125, -2.37188720703125, -2.271575927734375, -2.1712646484375, -2.070953369140625, -1.97064208984375, -1.870330810546875, -1.77001953125, -1.669708251953125, -1.56939697265625, -1.469085693359375, -1.3687744140625, -1.268463134765625, -1.16815185546875, -1.067840576171875, -0.967529296875, -0.867218017578125, -0.76690673828125, -0.666595458984375, -0.5662841796875, -0.465972900390625, -0.36566162109375, -0.265350341796875, -0.1650390625, -0.064727783203125, 0.03558349609375, 0.135894775390625, 0.2362060546875, 0.336517333984375, 0.43682861328125, 0.537139892578125, 0.637451171875, 0.737762451171875, 0.83807373046875, 0.938385009765625, 1.0386962890625, 1.139007568359375, 1.23931884765625, 1.339630126953125, 1.43994140625, 1.540252685546875, 1.64056396484375, 1.740875244140625, 1.8411865234375, 1.941497802734375, 2.04180908203125, 2.142120361328125, 2.242431640625, 2.342742919921875, 2.44305419921875, 2.543365478515625, 2.6436767578125, 2.743988037109375, 2.84429931640625, 2.944610595703125, 3.044921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 17.0, 17.0, 21.0, 38.0, 57.0, 81.0, 105.0, 150.0, 246.0, 332.0, 478.0, 641.0, 929.0, 1311.0, 1725.0, 2507.0, 3548.0, 5109.0, 7005.0, 10326.0, 14945.0, 21992.0, 32681.0, 49468.0, 77491.0, 125528.0, 1253785.0, 175974.0, 106980.0, 67359.0, 43701.0, 28777.0, 19481.0, 13311.0, 8981.0, 6556.0, 4511.0, 3133.0, 2279.0, 1594.0, 1176.0, 807.0, 605.0, 419.0, 283.0, 182.0, 148.0, 101.0, 70.0, 49.0, 34.0, 29.0, 20.0, 15.0, 5.0, 6.0, 4.0, 3.0], "bins": [-0.65673828125, -0.6367416381835938, -0.6167449951171875, -0.5967483520507812, -0.576751708984375, -0.5567550659179688, -0.5367584228515625, -0.5167617797851562, -0.49676513671875, -0.47676849365234375, -0.4567718505859375, -0.43677520751953125, -0.416778564453125, -0.39678192138671875, -0.3767852783203125, -0.35678863525390625, -0.3367919921875, -0.31679534912109375, -0.2967987060546875, -0.27680206298828125, -0.256805419921875, -0.23680877685546875, -0.2168121337890625, -0.19681549072265625, -0.17681884765625, -0.15682220458984375, -0.1368255615234375, -0.11682891845703125, -0.096832275390625, -0.07683563232421875, -0.0568389892578125, -0.03684234619140625, -0.016845703125, 0.00315093994140625, 0.0231475830078125, 0.04314422607421875, 0.063140869140625, 0.08313751220703125, 0.1031341552734375, 0.12313079833984375, 0.14312744140625, 0.16312408447265625, 0.1831207275390625, 0.20311737060546875, 0.223114013671875, 0.24311065673828125, 0.2631072998046875, 0.28310394287109375, 0.3031005859375, 0.32309722900390625, 0.3430938720703125, 0.36309051513671875, 0.383087158203125, 0.40308380126953125, 0.4230804443359375, 0.44307708740234375, 0.46307373046875, 0.48307037353515625, 0.5030670166015625, 0.5230636596679688, 0.543060302734375, 0.5630569458007812, 0.5830535888671875, 0.6030502319335938, 0.623046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 5.0, 10.0, 14.0, 17.0, 28.0, 24.0, 27.0, 37.0, 58.0, 58.0, 75.0, 70.0, 75.0, 75.0, 78.0, 52.0, 61.0, 46.0, 32.0, 35.0, 24.0, 9.0, 8.0, 11.0, 9.0, 11.0, 8.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005273818969726562, -0.0005113109946250916, -0.0004952400922775269, -0.00047916918992996216, -0.00046309828758239746, -0.00044702738523483276, -0.00043095648288726807, -0.00041488558053970337, -0.00039881467819213867, -0.000382743775844574, -0.0003666728734970093, -0.0003506019711494446, -0.0003345310688018799, -0.0003184601664543152, -0.0003023892641067505, -0.0002863183617591858, -0.0002702474594116211, -0.0002541765570640564, -0.0002381056547164917, -0.000222034752368927, -0.0002059638500213623, -0.0001898929476737976, -0.0001738220453262329, -0.0001577511429786682, -0.00014168024063110352, -0.00012560933828353882, -0.00010953843593597412, -9.346753358840942e-05, -7.739663124084473e-05, -6.132572889328003e-05, -4.525482654571533e-05, -2.9183924198150635e-05, -1.3113021850585938e-05, 2.9578804969787598e-06, 1.9028782844543457e-05, 3.5099685192108154e-05, 5.117058753967285e-05, 6.724148988723755e-05, 8.331239223480225e-05, 9.938329458236694e-05, 0.00011545419692993164, 0.00013152509927749634, 0.00014759600162506104, 0.00016366690397262573, 0.00017973780632019043, 0.00019580870866775513, 0.00021187961101531982, 0.00022795051336288452, 0.00024402141571044922, 0.0002600923180580139, 0.0002761632204055786, 0.0002922341227531433, 0.000308305025100708, 0.0003243759274482727, 0.0003404468297958374, 0.0003565177321434021, 0.0003725886344909668, 0.0003886595368385315, 0.0004047304391860962, 0.0004208013415336609, 0.0004368722438812256, 0.0004529431462287903, 0.000469014048576355, 0.0004850849509239197, 0.0005011558532714844]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 8.0, 9.0, 12.0, 23.0, 24.0, 45.0, 69.0, 120.0, 163.0, 288.0, 509.0, 4461.0, 1039695.0, 1910.0, 485.0, 224.0, 146.0, 120.0, 67.0, 51.0, 38.0, 21.0, 24.0, 2.0, 8.0, 5.0, 3.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01320648193359375, -0.012786149978637695, -0.01236581802368164, -0.011945486068725586, -0.011525154113769531, -0.011104822158813477, -0.010684490203857422, -0.010264158248901367, -0.009843826293945312, -0.009423494338989258, -0.009003162384033203, -0.008582830429077148, -0.008162498474121094, -0.007742166519165039, -0.007321834564208984, -0.00690150260925293, -0.006481170654296875, -0.00606083869934082, -0.005640506744384766, -0.005220174789428711, -0.004799842834472656, -0.0043795108795166016, -0.003959178924560547, -0.003538846969604492, -0.0031185150146484375, -0.002698183059692383, -0.002277851104736328, -0.0018575191497802734, -0.0014371871948242188, -0.001016855239868164, -0.0005965232849121094, -0.0001761913299560547, 0.000244140625, 0.0006644725799560547, 0.0010848045349121094, 0.001505136489868164, 0.0019254684448242188, 0.0023458003997802734, 0.002766132354736328, 0.003186464309692383, 0.0036067962646484375, 0.004027128219604492, 0.004447460174560547, 0.0048677921295166016, 0.005288124084472656, 0.005708456039428711, 0.006128787994384766, 0.00654911994934082, 0.006969451904296875, 0.00738978385925293, 0.007810115814208984, 0.008230447769165039, 0.008650779724121094, 0.009071111679077148, 0.009491443634033203, 0.009911775588989258, 0.010332107543945312, 0.010752439498901367, 0.011172771453857422, 0.011593103408813477, 0.012013435363769531, 0.012433767318725586, 0.01285409927368164, 0.013274431228637695, 0.01369476318359375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 498.0, 463.0, 32.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.003202585969120264, -0.003145412774756551, -0.003088239813223481, -0.003031066618859768, -0.0029738936573266983, -0.002916720462962985, -0.0028595475014299154, -0.002802374307066202, -0.0027452013455331326, -0.0026880281511694193, -0.0026308551896363497, -0.0025736819952726364, -0.002516509033739567, -0.0024593358393758535, -0.002402162877842784, -0.0023449896834790707, -0.0022878164891153574, -0.002230643294751644, -0.0021734703332185745, -0.0021162971388548613, -0.0020591241773217916, -0.0020019509829580784, -0.0019447780214250088, -0.0018876048270612955, -0.001830431865528226, -0.0017732587875798345, -0.001716085709631443, -0.0016589126316830516, -0.0016017395537346601, -0.0015445663593709469, -0.0014873933978378773, -0.001430220203474164, -0.0013730472419410944, -0.001315874163992703, -0.0012587010860443115, -0.00120152800809592, -0.0011443549301475286, -0.0010871817357838154, -0.0010300087742507458, -0.0009728355798870325, -0.0009156625019386411, -0.0008584894239902496, -0.0008013163460418582, -0.0007441432680934668, -0.0006869701319374144, -0.000629797053989023, -0.0005726239760406315, -0.0005154508398845792, -0.0004582777910400182, -0.00040110471309162676, -0.00034393160603940487, -0.00028675852809101343, -0.00022958543559070677, -0.0001724123430904001, -0.00011523926514200866, -5.806615808978677e-05, -8.930801413953304e-07, 5.628000872093253e-05, 0.00011345309758326039, 0.00017062618280760944, 0.0002277992753079161, 0.00028497236780822277, 0.0003421454457566142, 0.0003993185528088361, 0.00045649163075722754]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 7.0, 14.0, 16.0, 5.0, 19.0, 21.0, 27.0, 17.0, 14.0, 35.0, 32.0, 37.0, 38.0, 40.0, 39.0, 36.0, 50.0, 50.0, 33.0, 47.0, 48.0, 38.0, 42.0, 42.0, 30.0, 28.0, 30.0, 23.0, 18.0, 15.0, 12.0, 17.0, 13.0, 15.0, 9.0, 11.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002529025077819824, -0.0002455078065395355, -0.00023811310529708862, -0.00023071840405464172, -0.00022332370281219482, -0.00021592900156974792, -0.00020853430032730103, -0.00020113959908485413, -0.00019374489784240723, -0.00018635019659996033, -0.00017895549535751343, -0.00017156079411506653, -0.00016416609287261963, -0.00015677139163017273, -0.00014937669038772583, -0.00014198198914527893, -0.00013458728790283203, -0.00012719258666038513, -0.00011979788541793823, -0.00011240318417549133, -0.00010500848293304443, -9.761378169059753e-05, -9.021908044815063e-05, -8.282437920570374e-05, -7.542967796325684e-05, -6.803497672080994e-05, -6.064027547836304e-05, -5.324557423591614e-05, -4.585087299346924e-05, -3.845617175102234e-05, -3.106147050857544e-05, -2.366676926612854e-05, -1.627206802368164e-05, -8.877366781234741e-06, -1.4826655387878418e-06, 5.912035703659058e-06, 1.3306736946105957e-05, 2.0701438188552856e-05, 2.8096139430999756e-05, 3.5490840673446655e-05, 4.2885541915893555e-05, 5.0280243158340454e-05, 5.7674944400787354e-05, 6.506964564323425e-05, 7.246434688568115e-05, 7.985904812812805e-05, 8.725374937057495e-05, 9.464845061302185e-05, 0.00010204315185546875, 0.00010943785309791565, 0.00011683255434036255, 0.00012422725558280945, 0.00013162195682525635, 0.00013901665806770325, 0.00014641135931015015, 0.00015380606055259705, 0.00016120076179504395, 0.00016859546303749084, 0.00017599016427993774, 0.00018338486552238464, 0.00019077956676483154, 0.00019817426800727844, 0.00020556896924972534, 0.00021296367049217224, 0.00022035837173461914]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 7.0, 9.0, 15.0, 7.0, 13.0, 18.0, 14.0, 22.0, 27.0, 28.0, 21.0, 27.0, 28.0, 33.0, 46.0, 42.0, 37.0, 51.0, 50.0, 41.0, 50.0, 44.0, 49.0, 45.0, 37.0, 29.0, 29.0, 30.0, 23.0, 12.0, 18.0, 18.0, 17.0, 9.0, 17.0, 10.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.12890625, -4.96002197265625, -4.7911376953125, -4.62225341796875, -4.453369140625, -4.28448486328125, -4.1156005859375, -3.94671630859375, -3.77783203125, -3.60894775390625, -3.4400634765625, -3.27117919921875, -3.102294921875, -2.93341064453125, -2.7645263671875, -2.59564208984375, -2.4267578125, -2.25787353515625, -2.0889892578125, -1.92010498046875, -1.751220703125, -1.58233642578125, -1.4134521484375, -1.24456787109375, -1.07568359375, -0.90679931640625, -0.7379150390625, -0.56903076171875, -0.400146484375, -0.23126220703125, -0.0623779296875, 0.10650634765625, 0.275390625, 0.44427490234375, 0.6131591796875, 0.78204345703125, 0.950927734375, 1.11981201171875, 1.2886962890625, 1.45758056640625, 1.62646484375, 1.79534912109375, 1.9642333984375, 2.13311767578125, 2.302001953125, 2.47088623046875, 2.6397705078125, 2.80865478515625, 2.9775390625, 3.14642333984375, 3.3153076171875, 3.48419189453125, 3.653076171875, 3.82196044921875, 3.9908447265625, 4.15972900390625, 4.32861328125, 4.49749755859375, 4.6663818359375, 4.83526611328125, 5.004150390625, 5.17303466796875, 5.3419189453125, 5.51080322265625, 5.6796875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 5.0, 10.0, 13.0, 11.0, 23.0, 44.0, 51.0, 54.0, 78.0, 112.0, 172.0, 215.0, 344.0, 566.0, 796.0, 1415.0, 2421.0, 5063.0, 11027.0, 30647.0, 106062.0, 481712.0, 300480.0, 67911.0, 21299.0, 8435.0, 4002.0, 2128.0, 1251.0, 738.0, 485.0, 289.0, 177.0, 153.0, 97.0, 85.0, 45.0, 39.0, 26.0, 20.0, 12.0, 6.0, 8.0, 5.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.140625, -4.0145263671875, -3.888427734375, -3.7623291015625, -3.63623046875, -3.5101318359375, -3.384033203125, -3.2579345703125, -3.1318359375, -3.0057373046875, -2.879638671875, -2.7535400390625, -2.62744140625, -2.5013427734375, -2.375244140625, -2.2491455078125, -2.123046875, -1.9969482421875, -1.870849609375, -1.7447509765625, -1.61865234375, -1.4925537109375, -1.366455078125, -1.2403564453125, -1.1142578125, -0.9881591796875, -0.862060546875, -0.7359619140625, -0.60986328125, -0.4837646484375, -0.357666015625, -0.2315673828125, -0.10546875, 0.0206298828125, 0.146728515625, 0.2728271484375, 0.39892578125, 0.5250244140625, 0.651123046875, 0.7772216796875, 0.9033203125, 1.0294189453125, 1.155517578125, 1.2816162109375, 1.40771484375, 1.5338134765625, 1.659912109375, 1.7860107421875, 1.912109375, 2.0382080078125, 2.164306640625, 2.2904052734375, 2.41650390625, 2.5426025390625, 2.668701171875, 2.7947998046875, 2.9208984375, 3.0469970703125, 3.173095703125, 3.2991943359375, 3.42529296875, 3.5513916015625, 3.677490234375, 3.8035888671875, 3.9296875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 6.0, 9.0, 20.0, 13.0, 20.0, 26.0, 18.0, 34.0, 40.0, 55.0, 46.0, 53.0, 61.0, 111.0, 1926.0, 173.0, 65.0, 39.0, 50.0, 56.0, 38.0, 39.0, 34.0, 24.0, 16.0, 15.0, 15.0, 6.0, 14.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-27.484375, -26.753173828125, -26.02197265625, -25.290771484375, -24.5595703125, -23.828369140625, -23.09716796875, -22.365966796875, -21.634765625, -20.903564453125, -20.17236328125, -19.441162109375, -18.7099609375, -17.978759765625, -17.24755859375, -16.516357421875, -15.78515625, -15.053955078125, -14.32275390625, -13.591552734375, -12.8603515625, -12.129150390625, -11.39794921875, -10.666748046875, -9.935546875, -9.204345703125, -8.47314453125, -7.741943359375, -7.0107421875, -6.279541015625, -5.54833984375, -4.817138671875, -4.0859375, -3.354736328125, -2.62353515625, -1.892333984375, -1.1611328125, -0.429931640625, 0.30126953125, 1.032470703125, 1.763671875, 2.494873046875, 3.22607421875, 3.957275390625, 4.6884765625, 5.419677734375, 6.15087890625, 6.882080078125, 7.61328125, 8.344482421875, 9.07568359375, 9.806884765625, 10.5380859375, 11.269287109375, 12.00048828125, 12.731689453125, 13.462890625, 14.194091796875, 14.92529296875, 15.656494140625, 16.3876953125, 17.118896484375, 17.85009765625, 18.581298828125, 19.3125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 9.0, 12.0, 5.0, 17.0, 18.0, 15.0, 25.0, 41.0, 46.0, 68.0, 104.0, 143.0, 245.0, 590.0, 3471.0, 3014078.0, 124255.0, 1494.0, 445.0, 202.0, 118.0, 71.0, 60.0, 39.0, 14.0, 31.0, 21.0, 11.0, 18.0, 9.0, 8.0, 2.0, 2.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.65625, -29.513671875, -28.37109375, -27.228515625, -26.0859375, -24.943359375, -23.80078125, -22.658203125, -21.515625, -20.373046875, -19.23046875, -18.087890625, -16.9453125, -15.802734375, -14.66015625, -13.517578125, -12.375, -11.232421875, -10.08984375, -8.947265625, -7.8046875, -6.662109375, -5.51953125, -4.376953125, -3.234375, -2.091796875, -0.94921875, 0.193359375, 1.3359375, 2.478515625, 3.62109375, 4.763671875, 5.90625, 7.048828125, 8.19140625, 9.333984375, 10.4765625, 11.619140625, 12.76171875, 13.904296875, 15.046875, 16.189453125, 17.33203125, 18.474609375, 19.6171875, 20.759765625, 21.90234375, 23.044921875, 24.1875, 25.330078125, 26.47265625, 27.615234375, 28.7578125, 29.900390625, 31.04296875, 32.185546875, 33.328125, 34.470703125, 35.61328125, 36.755859375, 37.8984375, 39.041015625, 40.18359375, 41.326171875, 42.46875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 171.0, 739.0, 103.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.85891723632812, -143.07476806640625, -140.2906036376953, -137.50645446777344, -134.7222900390625, -131.93814086914062, -129.15399169921875, -126.36983489990234, -123.58567810058594, -120.80152130126953, -118.01736450195312, -115.23321533203125, -112.44905853271484, -109.66490173339844, -106.88075256347656, -104.09659576416016, -101.31243896484375, -98.52828216552734, -95.74412536621094, -92.95997619628906, -90.17581939697266, -87.39166259765625, -84.60751342773438, -81.82335662841797, -79.03919982910156, -76.25504302978516, -73.47088623046875, -70.68673706054688, -67.90258026123047, -65.11842346191406, -62.33427047729492, -59.55011749267578, -56.76596450805664, -53.9818115234375, -51.197654724121094, -48.41349792480469, -45.62934494018555, -42.845191955566406, -40.06103515625, -37.276878356933594, -34.49272537231445, -31.70857048034668, -28.924415588378906, -26.140260696411133, -23.35610580444336, -20.571950912475586, -17.787796020507812, -15.003641128540039, -12.219486236572266, -9.435331344604492, -6.651176452636719, -3.8670215606689453, -1.0828666687011719, 1.7012882232666016, 4.485443115234375, 7.269598007202148, 10.053752899169922, 12.837907791137695, 15.622062683105469, 18.406217575073242, 21.190372467041016, 23.97452735900879, 26.758682250976562, 29.542837142944336, 32.32699203491211]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 7.0, 8.0, 7.0, 14.0, 13.0, 13.0, 21.0, 16.0, 25.0, 31.0, 28.0, 34.0, 33.0, 28.0, 46.0, 36.0, 34.0, 41.0, 45.0, 36.0, 34.0, 37.0, 30.0, 38.0, 30.0, 32.0, 25.0, 36.0, 18.0, 20.0, 27.0, 25.0, 16.0, 20.0, 16.0, 14.0, 10.0, 5.0, 10.0, 10.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.84174346923828, -51.20581817626953, -49.56989669799805, -47.93397521972656, -46.29804992675781, -44.66212463378906, -43.02620315551758, -41.390281677246094, -39.754356384277344, -38.118431091308594, -36.48250961303711, -34.846588134765625, -33.210662841796875, -31.574739456176758, -29.93881607055664, -28.302892684936523, -26.666969299316406, -25.03104591369629, -23.395122528076172, -21.759199142456055, -20.123275756835938, -18.48735237121582, -16.851428985595703, -15.215505599975586, -13.579582214355469, -11.943658828735352, -10.307735443115234, -8.671812057495117, -7.035888671875, -5.399965286254883, -3.7640419006347656, -2.1281185150146484, -0.49219512939453125, 1.143728256225586, 2.779651641845703, 4.41557502746582, 6.0514984130859375, 7.687421798706055, 9.323345184326172, 10.959268569946289, 12.595191955566406, 14.231115341186523, 15.86703872680664, 17.502962112426758, 19.138885498046875, 20.774808883666992, 22.41073226928711, 24.046655654907227, 25.682579040527344, 27.31850242614746, 28.954425811767578, 30.590349197387695, 32.22627258300781, 33.86219787597656, 35.49811935424805, 37.13404083251953, 38.76996612548828, 40.40589141845703, 42.041812896728516, 43.677734375, 45.31365966796875, 46.9495849609375, 48.585506439208984, 50.22142791748047, 51.85735321044922]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 8.0, 11.0, 6.0, 10.0, 9.0, 15.0, 10.0, 14.0, 18.0, 20.0, 25.0, 29.0, 23.0, 23.0, 35.0, 37.0, 41.0, 34.0, 40.0, 53.0, 43.0, 57.0, 35.0, 50.0, 44.0, 48.0, 32.0, 41.0, 29.0, 25.0, 22.0, 15.0, 19.0, 22.0, 6.0, 20.0, 15.0, 6.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.28515625, -5.1119384765625, -4.938720703125, -4.7655029296875, -4.59228515625, -4.4190673828125, -4.245849609375, -4.0726318359375, -3.8994140625, -3.7261962890625, -3.552978515625, -3.3797607421875, -3.20654296875, -3.0333251953125, -2.860107421875, -2.6868896484375, -2.513671875, -2.3404541015625, -2.167236328125, -1.9940185546875, -1.82080078125, -1.6475830078125, -1.474365234375, -1.3011474609375, -1.1279296875, -0.9547119140625, -0.781494140625, -0.6082763671875, -0.43505859375, -0.2618408203125, -0.088623046875, 0.0845947265625, 0.2578125, 0.4310302734375, 0.604248046875, 0.7774658203125, 0.95068359375, 1.1239013671875, 1.297119140625, 1.4703369140625, 1.6435546875, 1.8167724609375, 1.989990234375, 2.1632080078125, 2.33642578125, 2.5096435546875, 2.682861328125, 2.8560791015625, 3.029296875, 3.2025146484375, 3.375732421875, 3.5489501953125, 3.72216796875, 3.8953857421875, 4.068603515625, 4.2418212890625, 4.4150390625, 4.5882568359375, 4.761474609375, 4.9346923828125, 5.10791015625, 5.2811279296875, 5.454345703125, 5.6275634765625, 5.80078125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 9.0, 3.0, 10.0, 8.0, 18.0, 19.0, 26.0, 24.0, 30.0, 44.0, 71.0, 102.0, 195.0, 379.0, 1087.0, 3539.0, 14292.0, 80068.0, 662130.0, 2335069.0, 946128.0, 124343.0, 19600.0, 4553.0, 1378.0, 488.0, 230.0, 119.0, 86.0, 62.0, 31.0, 35.0, 18.0, 19.0, 14.0, 9.0, 11.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7890625, -9.4691162109375, -9.149169921875, -8.8292236328125, -8.50927734375, -8.1893310546875, -7.869384765625, -7.5494384765625, -7.2294921875, -6.9095458984375, -6.589599609375, -6.2696533203125, -5.94970703125, -5.6297607421875, -5.309814453125, -4.9898681640625, -4.669921875, -4.3499755859375, -4.030029296875, -3.7100830078125, -3.39013671875, -3.0701904296875, -2.750244140625, -2.4302978515625, -2.1103515625, -1.7904052734375, -1.470458984375, -1.1505126953125, -0.83056640625, -0.5106201171875, -0.190673828125, 0.1292724609375, 0.44921875, 0.7691650390625, 1.089111328125, 1.4090576171875, 1.72900390625, 2.0489501953125, 2.368896484375, 2.6888427734375, 3.0087890625, 3.3287353515625, 3.648681640625, 3.9686279296875, 4.28857421875, 4.6085205078125, 4.928466796875, 5.2484130859375, 5.568359375, 5.8883056640625, 6.208251953125, 6.5281982421875, 6.84814453125, 7.1680908203125, 7.488037109375, 7.8079833984375, 8.1279296875, 8.4478759765625, 8.767822265625, 9.0877685546875, 9.40771484375, 9.7276611328125, 10.047607421875, 10.3675537109375, 10.6875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 28.0, 25.0, 52.0, 65.0, 98.0, 144.0, 260.0, 413.0, 640.0, 723.0, 598.0, 374.0, 229.0, 143.0, 88.0, 53.0, 38.0, 27.0, 14.0, 21.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.966064453125, -26.24462890625, -25.523193359375, -24.8017578125, -24.080322265625, -23.35888671875, -22.637451171875, -21.916015625, -21.194580078125, -20.47314453125, -19.751708984375, -19.0302734375, -18.308837890625, -17.58740234375, -16.865966796875, -16.14453125, -15.423095703125, -14.70166015625, -13.980224609375, -13.2587890625, -12.537353515625, -11.81591796875, -11.094482421875, -10.373046875, -9.651611328125, -8.93017578125, -8.208740234375, -7.4873046875, -6.765869140625, -6.04443359375, -5.322998046875, -4.6015625, -3.880126953125, -3.15869140625, -2.437255859375, -1.7158203125, -0.994384765625, -0.27294921875, 0.448486328125, 1.169921875, 1.891357421875, 2.61279296875, 3.334228515625, 4.0556640625, 4.777099609375, 5.49853515625, 6.219970703125, 6.94140625, 7.662841796875, 8.38427734375, 9.105712890625, 9.8271484375, 10.548583984375, 11.27001953125, 11.991455078125, 12.712890625, 13.434326171875, 14.15576171875, 14.877197265625, 15.5986328125, 16.320068359375, 17.04150390625, 17.762939453125, 18.484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 6.0, 11.0, 10.0, 12.0, 19.0, 21.0, 38.0, 56.0, 93.0, 109.0, 168.0, 334.0, 988.0, 47984.0, 4132958.0, 10022.0, 659.0, 254.0, 177.0, 118.0, 85.0, 39.0, 35.0, 23.0, 19.0, 16.0, 8.0, 4.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.8125, -71.1162109375, -68.419921875, -65.7236328125, -63.02734375, -60.3310546875, -57.634765625, -54.9384765625, -52.2421875, -49.5458984375, -46.849609375, -44.1533203125, -41.45703125, -38.7607421875, -36.064453125, -33.3681640625, -30.671875, -27.9755859375, -25.279296875, -22.5830078125, -19.88671875, -17.1904296875, -14.494140625, -11.7978515625, -9.1015625, -6.4052734375, -3.708984375, -1.0126953125, 1.68359375, 4.3798828125, 7.076171875, 9.7724609375, 12.46875, 15.1650390625, 17.861328125, 20.5576171875, 23.25390625, 25.9501953125, 28.646484375, 31.3427734375, 34.0390625, 36.7353515625, 39.431640625, 42.1279296875, 44.82421875, 47.5205078125, 50.216796875, 52.9130859375, 55.609375, 58.3056640625, 61.001953125, 63.6982421875, 66.39453125, 69.0908203125, 71.787109375, 74.4833984375, 77.1796875, 79.8759765625, 82.572265625, 85.2685546875, 87.96484375, 90.6611328125, 93.357421875, 96.0537109375, 98.75]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 18.0, 73.0, 308.0, 369.0, 199.0, 36.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-124.89875030517578, -119.7562484741211, -114.61375427246094, -109.47125244140625, -104.32875061035156, -99.18624877929688, -94.04375457763672, -88.90125274658203, -83.75875854492188, -78.61625671386719, -73.47376251220703, -68.33126068115234, -63.188758850097656, -58.046260833740234, -52.90376281738281, -47.761260986328125, -42.61875915527344, -37.476261138916016, -32.33375930786133, -27.191261291503906, -22.04876136779785, -16.906261444091797, -11.763763427734375, -6.6212615966796875, -1.4787635803222656, 3.663735866546631, 8.806235313415527, 13.948734283447266, 19.09123420715332, 24.233734130859375, 29.376232147216797, 34.518733978271484, 39.66123962402344, 44.80373764038086, 49.94623947143555, 55.08873748779297, 60.231239318847656, 65.37373352050781, 70.5162353515625, 75.65873718261719, 80.80123901367188, 85.94374084472656, 91.08623504638672, 96.2287368774414, 101.3712387084961, 106.51373291015625, 111.65623474121094, 116.79873657226562, 121.94123077392578, 127.08373260498047, 132.22622680664062, 137.3687286376953, 142.51123046875, 147.6537322998047, 152.79623413085938, 157.938720703125, 163.0812225341797, 168.22372436523438, 173.36622619628906, 178.50872802734375, 183.65121459960938, 188.79371643066406, 193.93621826171875, 199.07872009277344, 204.22122192382812]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 9.0, 15.0, 15.0, 6.0, 15.0, 15.0, 23.0, 27.0, 27.0, 35.0, 38.0, 30.0, 38.0, 29.0, 42.0, 35.0, 43.0, 35.0, 51.0, 30.0, 42.0, 30.0, 29.0, 38.0, 39.0, 30.0, 40.0, 25.0, 22.0, 20.0, 19.0, 15.0, 9.0, 11.0, 14.0, 7.0, 8.0, 6.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.622406005859375, -50.974788665771484, -49.32716751098633, -47.67955017089844, -46.03193283081055, -44.384315490722656, -42.7366943359375, -41.08907699584961, -39.44145965576172, -37.79384231567383, -36.14622116088867, -34.49860382080078, -32.85098648071289, -31.203367233276367, -29.555747985839844, -27.908130645751953, -26.260509490966797, -24.612890243530273, -22.965272903442383, -21.31765365600586, -19.67003631591797, -18.022417068481445, -16.374797821044922, -14.727179527282715, -13.079561233520508, -11.4319429397583, -9.784324645996094, -8.13670539855957, -6.489087104797363, -4.841468811035156, -3.193849563598633, -1.5462312698364258, 0.10138702392578125, 1.7490055561065674, 3.3966240882873535, 5.044242858886719, 6.691861152648926, 8.339479446411133, 9.987098693847656, 11.634716987609863, 13.28233528137207, 14.929953575134277, 16.577571868896484, 18.225191116333008, 19.87281036376953, 21.520427703857422, 23.168046951293945, 24.81566619873047, 26.46328353881836, 28.110902786254883, 29.758520126342773, 31.406139373779297, 33.05375671386719, 34.701377868652344, 36.348995208740234, 37.996612548828125, 39.64423370361328, 41.29185104370117, 42.93947219848633, 44.58708953857422, 46.23470687866211, 47.88232421875, 49.529945373535156, 51.17756271362305, 52.82518005371094]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 11.0, 2.0, 5.0, 9.0, 5.0, 9.0, 13.0, 15.0, 16.0, 21.0, 23.0, 29.0, 35.0, 18.0, 26.0, 28.0, 49.0, 45.0, 31.0, 49.0, 43.0, 45.0, 50.0, 45.0, 38.0, 48.0, 38.0, 34.0, 34.0, 25.0, 25.0, 27.0, 21.0, 12.0, 15.0, 12.0, 13.0, 13.0, 9.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.00384521484375, -4.8319091796875, -4.65997314453125, -4.488037109375, -4.31610107421875, -4.1441650390625, -3.97222900390625, -3.80029296875, -3.62835693359375, -3.4564208984375, -3.28448486328125, -3.112548828125, -2.94061279296875, -2.7686767578125, -2.59674072265625, -2.4248046875, -2.25286865234375, -2.0809326171875, -1.90899658203125, -1.737060546875, -1.56512451171875, -1.3931884765625, -1.22125244140625, -1.04931640625, -0.87738037109375, -0.7054443359375, -0.53350830078125, -0.361572265625, -0.18963623046875, -0.0177001953125, 0.15423583984375, 0.326171875, 0.49810791015625, 0.6700439453125, 0.84197998046875, 1.013916015625, 1.18585205078125, 1.3577880859375, 1.52972412109375, 1.70166015625, 1.87359619140625, 2.0455322265625, 2.21746826171875, 2.389404296875, 2.56134033203125, 2.7332763671875, 2.90521240234375, 3.0771484375, 3.24908447265625, 3.4210205078125, 3.59295654296875, 3.764892578125, 3.93682861328125, 4.1087646484375, 4.28070068359375, 4.45263671875, 4.62457275390625, 4.7965087890625, 4.96844482421875, 5.140380859375, 5.31231689453125, 5.4842529296875, 5.65618896484375, 5.828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 11.0, 24.0, 27.0, 42.0, 66.0, 92.0, 113.0, 169.0, 271.0, 399.0, 625.0, 916.0, 1444.0, 2082.0, 3367.0, 5320.0, 8425.0, 13224.0, 21561.0, 35665.0, 61286.0, 111960.0, 218869.0, 256923.0, 130108.0, 70410.0, 40259.0, 24170.0, 14928.0, 9190.0, 5783.0, 3756.0, 2501.0, 1583.0, 1018.0, 644.0, 418.0, 311.0, 176.0, 153.0, 81.0, 55.0, 39.0, 39.0, 10.0, 9.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.86865234375, -0.8407363891601562, -0.8128204345703125, -0.7849044799804688, -0.756988525390625, -0.7290725708007812, -0.7011566162109375, -0.6732406616210938, -0.64532470703125, -0.6174087524414062, -0.5894927978515625, -0.5615768432617188, -0.533660888671875, -0.5057449340820312, -0.4778289794921875, -0.44991302490234375, -0.4219970703125, -0.39408111572265625, -0.3661651611328125, -0.33824920654296875, -0.310333251953125, -0.28241729736328125, -0.2545013427734375, -0.22658538818359375, -0.19866943359375, -0.17075347900390625, -0.1428375244140625, -0.11492156982421875, -0.087005615234375, -0.05908966064453125, -0.0311737060546875, -0.00325775146484375, 0.024658203125, 0.05257415771484375, 0.0804901123046875, 0.10840606689453125, 0.136322021484375, 0.16423797607421875, 0.1921539306640625, 0.22006988525390625, 0.24798583984375, 0.27590179443359375, 0.3038177490234375, 0.33173370361328125, 0.359649658203125, 0.38756561279296875, 0.4154815673828125, 0.44339752197265625, 0.4713134765625, 0.49922943115234375, 0.5271453857421875, 0.5550613403320312, 0.582977294921875, 0.6108932495117188, 0.6388092041015625, 0.6667251586914062, 0.69464111328125, 0.7225570678710938, 0.7504730224609375, 0.7783889770507812, 0.806304931640625, 0.8342208862304688, 0.8621368408203125, 0.8900527954101562, 0.91796875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 2.0, 6.0, 9.0, 7.0, 7.0, 15.0, 14.0, 11.0, 20.0, 13.0, 19.0, 24.0, 47.0, 31.0, 29.0, 30.0, 50.0, 51.0, 40.0, 49.0, 31.0, 1063.0, 36.0, 38.0, 41.0, 34.0, 39.0, 34.0, 23.0, 28.0, 18.0, 24.0, 18.0, 19.0, 16.0, 16.0, 15.0, 6.0, 9.0, 7.0, 10.0, 8.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.728302001953125, -2.62847900390625, -2.528656005859375, -2.4288330078125, -2.329010009765625, -2.22918701171875, -2.129364013671875, -2.029541015625, -1.929718017578125, -1.82989501953125, -1.730072021484375, -1.6302490234375, -1.530426025390625, -1.43060302734375, -1.330780029296875, -1.23095703125, -1.131134033203125, -1.03131103515625, -0.931488037109375, -0.8316650390625, -0.731842041015625, -0.63201904296875, -0.532196044921875, -0.432373046875, -0.332550048828125, -0.23272705078125, -0.132904052734375, -0.0330810546875, 0.066741943359375, 0.16656494140625, 0.266387939453125, 0.3662109375, 0.466033935546875, 0.56585693359375, 0.665679931640625, 0.7655029296875, 0.865325927734375, 0.96514892578125, 1.064971923828125, 1.164794921875, 1.264617919921875, 1.36444091796875, 1.464263916015625, 1.5640869140625, 1.663909912109375, 1.76373291015625, 1.863555908203125, 1.96337890625, 2.063201904296875, 2.16302490234375, 2.262847900390625, 2.3626708984375, 2.462493896484375, 2.56231689453125, 2.662139892578125, 2.761962890625, 2.861785888671875, 2.96160888671875, 3.061431884765625, 3.1612548828125, 3.261077880859375, 3.36090087890625, 3.460723876953125, 3.560546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 15.0, 13.0, 22.0, 32.0, 47.0, 67.0, 110.0, 176.0, 248.0, 352.0, 514.0, 729.0, 1040.0, 1557.0, 2174.0, 3126.0, 4583.0, 6768.0, 9845.0, 15197.0, 23305.0, 36507.0, 58957.0, 97970.0, 171060.0, 1290048.0, 144192.0, 84142.0, 50819.0, 31761.0, 20265.0, 13211.0, 9017.0, 6006.0, 3924.0, 2851.0, 2081.0, 1361.0, 924.0, 666.0, 479.0, 331.0, 200.0, 128.0, 105.0, 71.0, 49.0, 30.0, 12.0, 19.0, 7.0, 8.0, 2.0, 6.0, 0.0, 3.0], "bins": [-0.7353515625, -0.7133026123046875, -0.691253662109375, -0.6692047119140625, -0.64715576171875, -0.6251068115234375, -0.603057861328125, -0.5810089111328125, -0.5589599609375, -0.5369110107421875, -0.514862060546875, -0.4928131103515625, -0.47076416015625, -0.4487152099609375, -0.426666259765625, -0.4046173095703125, -0.382568359375, -0.3605194091796875, -0.338470458984375, -0.3164215087890625, -0.29437255859375, -0.2723236083984375, -0.250274658203125, -0.2282257080078125, -0.2061767578125, -0.1841278076171875, -0.162078857421875, -0.1400299072265625, -0.11798095703125, -0.0959320068359375, -0.073883056640625, -0.0518341064453125, -0.02978515625, -0.0077362060546875, 0.014312744140625, 0.0363616943359375, 0.05841064453125, 0.0804595947265625, 0.102508544921875, 0.1245574951171875, 0.1466064453125, 0.1686553955078125, 0.190704345703125, 0.2127532958984375, 0.23480224609375, 0.2568511962890625, 0.278900146484375, 0.3009490966796875, 0.322998046875, 0.3450469970703125, 0.367095947265625, 0.3891448974609375, 0.41119384765625, 0.4332427978515625, 0.455291748046875, 0.4773406982421875, 0.4993896484375, 0.5214385986328125, 0.543487548828125, 0.5655364990234375, 0.58758544921875, 0.6096343994140625, 0.631683349609375, 0.6537322998046875, 0.67578125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 10.0, 9.0, 11.0, 6.0, 7.0, 15.0, 16.0, 20.0, 16.0, 23.0, 20.0, 34.0, 43.0, 56.0, 49.0, 52.0, 58.0, 52.0, 69.0, 61.0, 55.0, 55.0, 37.0, 43.0, 35.0, 36.0, 25.0, 16.0, 15.0, 5.0, 8.0, 9.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.000400543212890625, -0.0003871545195579529, -0.00037376582622528076, -0.00036037713289260864, -0.0003469884395599365, -0.0003335997462272644, -0.0003202110528945923, -0.00030682235956192017, -0.00029343366622924805, -0.00028004497289657593, -0.0002666562795639038, -0.0002532675862312317, -0.00023987889289855957, -0.00022649019956588745, -0.00021310150623321533, -0.0001997128129005432, -0.0001863241195678711, -0.00017293542623519897, -0.00015954673290252686, -0.00014615803956985474, -0.00013276934623718262, -0.0001193806529045105, -0.00010599195957183838, -9.260326623916626e-05, -7.921457290649414e-05, -6.582587957382202e-05, -5.24371862411499e-05, -3.904849290847778e-05, -2.5659799575805664e-05, -1.2271106243133545e-05, 1.1175870895385742e-06, 1.4506280422210693e-05, 2.7894973754882812e-05, 4.128366708755493e-05, 5.467236042022705e-05, 6.806105375289917e-05, 8.144974708557129e-05, 9.483844041824341e-05, 0.00010822713375091553, 0.00012161582708358765, 0.00013500452041625977, 0.00014839321374893188, 0.000161781907081604, 0.00017517060041427612, 0.00018855929374694824, 0.00020194798707962036, 0.00021533668041229248, 0.0002287253737449646, 0.00024211406707763672, 0.00025550276041030884, 0.00026889145374298096, 0.0002822801470756531, 0.0002956688404083252, 0.0003090575337409973, 0.00032244622707366943, 0.00033583492040634155, 0.00034922361373901367, 0.0003626123070716858, 0.0003760010004043579, 0.00038938969373703003, 0.00040277838706970215, 0.00041616708040237427, 0.0004295557737350464, 0.0004429444670677185, 0.0004563331604003906]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 6.0, 5.0, 8.0, 16.0, 19.0, 35.0, 49.0, 65.0, 82.0, 165.0, 303.0, 532.0, 3075.0, 1039797.0, 3084.0, 553.0, 240.0, 143.0, 107.0, 68.0, 44.0, 38.0, 18.0, 12.0, 9.0, 13.0, 15.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0155487060546875, -0.015144824981689453, -0.014740943908691406, -0.01433706283569336, -0.013933181762695312, -0.013529300689697266, -0.013125419616699219, -0.012721538543701172, -0.012317657470703125, -0.011913776397705078, -0.011509895324707031, -0.011106014251708984, -0.010702133178710938, -0.01029825210571289, -0.009894371032714844, -0.009490489959716797, -0.00908660888671875, -0.008682727813720703, -0.008278846740722656, -0.00787496566772461, -0.0074710845947265625, -0.007067203521728516, -0.006663322448730469, -0.006259441375732422, -0.005855560302734375, -0.005451679229736328, -0.005047798156738281, -0.004643917083740234, -0.0042400360107421875, -0.0038361549377441406, -0.0034322738647460938, -0.003028392791748047, -0.00262451171875, -0.002220630645751953, -0.0018167495727539062, -0.0014128684997558594, -0.0010089874267578125, -0.0006051063537597656, -0.00020122528076171875, 0.00020265579223632812, 0.000606536865234375, 0.0010104179382324219, 0.0014142990112304688, 0.0018181800842285156, 0.0022220611572265625, 0.0026259422302246094, 0.0030298233032226562, 0.003433704376220703, 0.00383758544921875, 0.004241466522216797, 0.004645347595214844, 0.005049228668212891, 0.0054531097412109375, 0.005856990814208984, 0.006260871887207031, 0.006664752960205078, 0.007068634033203125, 0.007472515106201172, 0.007876396179199219, 0.008280277252197266, 0.008684158325195312, 0.00908803939819336, 0.009491920471191406, 0.009895801544189453, 0.0102996826171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 91.0, 730.0, 189.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023884994443506002, -0.002328182104974985, -0.0022678645327687263, -0.0022075471933931112, -0.002147229854017496, -0.002086912514641881, -0.002026595175266266, -0.001966277603060007, -0.001905960263684392, -0.0018456429243087769, -0.00178532546851784, -0.001725008012726903, -0.0016646906733512878, -0.0016043733339756727, -0.0015440558781847358, -0.0014837384223937988, -0.0014234210830181837, -0.0013631037436425686, -0.0013027862878516316, -0.0012424688320606947, -0.0011821514926850796, -0.0011218341533094645, -0.0010615166975185275, -0.0010011992417275906, -0.0009408819023519754, -0.0008805645047686994, -0.0008202471071854234, -0.0007599297096021473, -0.0006996123120188713, -0.0006392949144355953, -0.0005789775168523192, -0.0005186601192690432, -0.000458342838101089, -0.00039802544051781297, -0.00033770804293453693, -0.0002773906453512609, -0.00021707324776798487, -0.00015675585018470883, -9.64384526014328e-05, -3.612105501815677e-05, 2.4196342565119267e-05, 8.45137401483953e-05, 0.00014483113773167133, 0.00020514853531494737, 0.0002654659328982234, 0.00032578333048149943, 0.00038610072806477547, 0.0004464181256480515, 0.0005067355232313275, 0.0005670529208146036, 0.0006273703183978796, 0.0006876877159811556, 0.0007480051135644317, 0.0008083225111477077, 0.0008686399087309837, 0.0009289573063142598, 0.0009892747038975358, 0.0010495921596884727, 0.0011099094990640879, 0.001170226838439703, 0.00123054429423064, 0.0012908617500215769, 0.001351179089397192, 0.0014114964287728071, 0.001471813884563744]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 2.0, 6.0, 5.0, 8.0, 11.0, 8.0, 21.0, 17.0, 11.0, 10.0, 22.0, 25.0, 39.0, 40.0, 37.0, 26.0, 39.0, 32.0, 43.0, 40.0, 37.0, 31.0, 44.0, 37.0, 38.0, 31.0, 24.0, 23.0, 34.0, 33.0, 33.0, 22.0, 21.0, 26.0, 16.0, 20.0, 18.0, 9.0, 15.0, 8.0, 7.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00021779537200927734, -0.00021124351769685745, -0.00020469166338443756, -0.00019813980907201767, -0.00019158795475959778, -0.0001850361004471779, -0.000178484246134758, -0.0001719323918223381, -0.0001653805375099182, -0.00015882868319749832, -0.00015227682888507843, -0.00014572497457265854, -0.00013917312026023865, -0.00013262126594781876, -0.00012606941163539886, -0.00011951755732297897, -0.00011296570301055908, -0.00010641384869813919, -9.98619943857193e-05, -9.331014007329941e-05, -8.675828576087952e-05, -8.020643144845963e-05, -7.365457713603973e-05, -6.710272282361984e-05, -6.055086851119995e-05, -5.399901419878006e-05, -4.744715988636017e-05, -4.089530557394028e-05, -3.4343451261520386e-05, -2.7791596949100494e-05, -2.1239742636680603e-05, -1.4687888324260712e-05, -8.13603401184082e-06, -1.584179699420929e-06, 4.967674612998962e-06, 1.1519528925418854e-05, 1.8071383237838745e-05, 2.4623237550258636e-05, 3.117509186267853e-05, 3.772694617509842e-05, 4.427880048751831e-05, 5.08306547999382e-05, 5.738250911235809e-05, 6.393436342477798e-05, 7.048621773719788e-05, 7.703807204961777e-05, 8.358992636203766e-05, 9.014178067445755e-05, 9.669363498687744e-05, 0.00010324548929929733, 0.00010979734361171722, 0.00011634919792413712, 0.000122901052236557, 0.0001294529065489769, 0.0001360047608613968, 0.00014255661517381668, 0.00014910846948623657, 0.00015566032379865646, 0.00016221217811107635, 0.00016876403242349625, 0.00017531588673591614, 0.00018186774104833603, 0.00018841959536075592, 0.0001949714496731758, 0.0002015233039855957]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 11.0, 2.0, 5.0, 9.0, 5.0, 9.0, 13.0, 15.0, 16.0, 21.0, 23.0, 29.0, 35.0, 18.0, 26.0, 28.0, 49.0, 45.0, 31.0, 49.0, 43.0, 45.0, 50.0, 45.0, 38.0, 48.0, 38.0, 34.0, 34.0, 25.0, 25.0, 27.0, 21.0, 12.0, 15.0, 12.0, 13.0, 13.0, 9.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.00384521484375, -4.8319091796875, -4.65997314453125, -4.488037109375, -4.31610107421875, -4.1441650390625, -3.97222900390625, -3.80029296875, -3.62835693359375, -3.4564208984375, -3.28448486328125, -3.112548828125, -2.94061279296875, -2.7686767578125, -2.59674072265625, -2.4248046875, -2.25286865234375, -2.0809326171875, -1.90899658203125, -1.737060546875, -1.56512451171875, -1.3931884765625, -1.22125244140625, -1.04931640625, -0.87738037109375, -0.7054443359375, -0.53350830078125, -0.361572265625, -0.18963623046875, -0.0177001953125, 0.15423583984375, 0.326171875, 0.49810791015625, 0.6700439453125, 0.84197998046875, 1.013916015625, 1.18585205078125, 1.3577880859375, 1.52972412109375, 1.70166015625, 1.87359619140625, 2.0455322265625, 2.21746826171875, 2.389404296875, 2.56134033203125, 2.7332763671875, 2.90521240234375, 3.0771484375, 3.24908447265625, 3.4210205078125, 3.59295654296875, 3.764892578125, 3.93682861328125, 4.1087646484375, 4.28070068359375, 4.45263671875, 4.62457275390625, 4.7965087890625, 4.96844482421875, 5.140380859375, 5.31231689453125, 5.4842529296875, 5.65618896484375, 5.828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 10.0, 3.0, 8.0, 10.0, 7.0, 18.0, 18.0, 28.0, 40.0, 69.0, 101.0, 191.0, 335.0, 626.0, 1269.0, 2618.0, 5253.0, 11807.0, 28155.0, 79228.0, 252014.0, 419149.0, 158916.0, 52188.0, 19926.0, 8633.0, 3864.0, 1971.0, 922.0, 483.0, 268.0, 151.0, 83.0, 65.0, 28.0, 23.0, 23.0, 11.0, 14.0, 11.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.24609375, -3.13897705078125, -3.0318603515625, -2.92474365234375, -2.817626953125, -2.71051025390625, -2.6033935546875, -2.49627685546875, -2.38916015625, -2.28204345703125, -2.1749267578125, -2.06781005859375, -1.960693359375, -1.85357666015625, -1.7464599609375, -1.63934326171875, -1.5322265625, -1.42510986328125, -1.3179931640625, -1.21087646484375, -1.103759765625, -0.99664306640625, -0.8895263671875, -0.78240966796875, -0.67529296875, -0.56817626953125, -0.4610595703125, -0.35394287109375, -0.246826171875, -0.13970947265625, -0.0325927734375, 0.07452392578125, 0.181640625, 0.28875732421875, 0.3958740234375, 0.50299072265625, 0.610107421875, 0.71722412109375, 0.8243408203125, 0.93145751953125, 1.03857421875, 1.14569091796875, 1.2528076171875, 1.35992431640625, 1.467041015625, 1.57415771484375, 1.6812744140625, 1.78839111328125, 1.8955078125, 2.00262451171875, 2.1097412109375, 2.21685791015625, 2.323974609375, 2.43109130859375, 2.5382080078125, 2.64532470703125, 2.75244140625, 2.85955810546875, 2.9666748046875, 3.07379150390625, 3.180908203125, 3.28802490234375, 3.3951416015625, 3.50225830078125, 3.609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 6.0, 8.0, 10.0, 14.0, 17.0, 21.0, 27.0, 17.0, 28.0, 34.0, 30.0, 45.0, 33.0, 47.0, 52.0, 56.0, 86.0, 1532.0, 462.0, 83.0, 63.0, 51.0, 42.0, 38.0, 29.0, 27.0, 18.0, 19.0, 27.0, 8.0, 24.0, 22.0, 17.0, 9.0, 9.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.999755859375, -18.40576171875, -17.811767578125, -17.2177734375, -16.623779296875, -16.02978515625, -15.435791015625, -14.841796875, -14.247802734375, -13.65380859375, -13.059814453125, -12.4658203125, -11.871826171875, -11.27783203125, -10.683837890625, -10.08984375, -9.495849609375, -8.90185546875, -8.307861328125, -7.7138671875, -7.119873046875, -6.52587890625, -5.931884765625, -5.337890625, -4.743896484375, -4.14990234375, -3.555908203125, -2.9619140625, -2.367919921875, -1.77392578125, -1.179931640625, -0.5859375, 0.008056640625, 0.60205078125, 1.196044921875, 1.7900390625, 2.384033203125, 2.97802734375, 3.572021484375, 4.166015625, 4.760009765625, 5.35400390625, 5.947998046875, 6.5419921875, 7.135986328125, 7.72998046875, 8.323974609375, 8.91796875, 9.511962890625, 10.10595703125, 10.699951171875, 11.2939453125, 11.887939453125, 12.48193359375, 13.075927734375, 13.669921875, 14.263916015625, 14.85791015625, 15.451904296875, 16.0458984375, 16.639892578125, 17.23388671875, 17.827880859375, 18.421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 1.0, 10.0, 3.0, 8.0, 14.0, 15.0, 24.0, 20.0, 15.0, 30.0, 31.0, 47.0, 55.0, 98.0, 148.0, 215.0, 349.0, 1009.0, 12165.0, 3080595.0, 47790.0, 1687.0, 493.0, 275.0, 160.0, 98.0, 81.0, 40.0, 46.0, 31.0, 26.0, 29.0, 25.0, 10.0, 18.0, 7.0, 7.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.68603515625, -28.6845703125, -27.68310546875, -26.681640625, -25.68017578125, -24.6787109375, -23.67724609375, -22.67578125, -21.67431640625, -20.6728515625, -19.67138671875, -18.669921875, -17.66845703125, -16.6669921875, -15.66552734375, -14.6640625, -13.66259765625, -12.6611328125, -11.65966796875, -10.658203125, -9.65673828125, -8.6552734375, -7.65380859375, -6.65234375, -5.65087890625, -4.6494140625, -3.64794921875, -2.646484375, -1.64501953125, -0.6435546875, 0.35791015625, 1.359375, 2.36083984375, 3.3623046875, 4.36376953125, 5.365234375, 6.36669921875, 7.3681640625, 8.36962890625, 9.37109375, 10.37255859375, 11.3740234375, 12.37548828125, 13.376953125, 14.37841796875, 15.3798828125, 16.38134765625, 17.3828125, 18.38427734375, 19.3857421875, 20.38720703125, 21.388671875, 22.39013671875, 23.3916015625, 24.39306640625, 25.39453125, 26.39599609375, 27.3974609375, 28.39892578125, 29.400390625, 30.40185546875, 31.4033203125, 32.40478515625, 33.40625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [3.0, 48.0, 802.0, 160.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.05388069152832, -6.874826431274414, -2.695772171020508, 1.4832820892333984, 5.662336349487305, 9.841390609741211, 14.020444869995117, 18.199499130249023, 22.37855339050293, 26.557607650756836, 30.736661911010742, 34.91571807861328, 39.09477233886719, 43.273826599121094, 47.452880859375, 51.631935119628906, 55.81098937988281, 59.99004364013672, 64.16909790039062, 68.34815216064453, 72.52720642089844, 76.70626068115234, 80.88531494140625, 85.06436920166016, 89.24342346191406, 93.42247772216797, 97.60153198242188, 101.78058624267578, 105.95964050292969, 110.1386947631836, 114.3177490234375, 118.4968032836914, 122.67584228515625, 126.85489654541016, 131.03395080566406, 135.2130126953125, 139.39205932617188, 143.57110595703125, 147.7501678466797, 151.92922973632812, 156.1082763671875, 160.28732299804688, 164.4663848876953, 168.64544677734375, 172.82449340820312, 177.0035400390625, 181.18260192871094, 185.36166381835938, 189.54071044921875, 193.71975708007812, 197.89881896972656, 202.077880859375, 206.25692749023438, 210.43597412109375, 214.6150360107422, 218.79409790039062, 222.97314453125, 227.15219116210938, 231.3312530517578, 235.51031494140625, 239.68936157226562, 243.868408203125, 248.04747009277344, 252.22653198242188, 256.40557861328125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 10.0, 8.0, 12.0, 15.0, 6.0, 4.0, 18.0, 18.0, 17.0, 30.0, 28.0, 21.0, 19.0, 35.0, 35.0, 48.0, 38.0, 39.0, 34.0, 29.0, 42.0, 53.0, 37.0, 32.0, 38.0, 44.0, 36.0, 25.0, 28.0, 22.0, 23.0, 28.0, 14.0, 17.0, 15.0, 13.0, 10.0, 10.0, 14.0, 9.0, 9.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-63.37583923339844, -61.554351806640625, -59.73286437988281, -57.911380767822266, -56.08989334106445, -54.26840591430664, -52.446922302246094, -50.62543487548828, -48.80394744873047, -46.982460021972656, -45.160972595214844, -43.3394889831543, -41.518001556396484, -39.69651412963867, -37.875030517578125, -36.05354309082031, -34.2320556640625, -32.41056823730469, -30.589082717895508, -28.767597198486328, -26.946109771728516, -25.124622344970703, -23.303136825561523, -21.481651306152344, -19.66016387939453, -17.83867645263672, -16.01719093322754, -14.195704460144043, -12.374217987060547, -10.55273151397705, -8.731245040893555, -6.909758567810059, -5.0882720947265625, -3.2667856216430664, -1.4452991485595703, 0.3761873245239258, 2.197673797607422, 4.019160270690918, 5.840646743774414, 7.66213321685791, 9.483619689941406, 11.305106163024902, 13.126592636108398, 14.948079109191895, 16.76956558227539, 18.591053009033203, 20.412538528442383, 22.234024047851562, 24.055511474609375, 25.876998901367188, 27.698484420776367, 29.519969940185547, 31.34145736694336, 33.16294479370117, 34.98442840576172, 36.80591583251953, 38.627403259277344, 40.448890686035156, 42.27037811279297, 44.091861724853516, 45.91334915161133, 47.73483657836914, 49.55632019042969, 51.3778076171875, 53.19929504394531]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 5.0, 3.0, 7.0, 9.0, 4.0, 8.0, 9.0, 18.0, 13.0, 19.0, 22.0, 32.0, 17.0, 24.0, 36.0, 25.0, 43.0, 38.0, 40.0, 29.0, 41.0, 39.0, 47.0, 52.0, 37.0, 42.0, 37.0, 42.0, 37.0, 27.0, 22.0, 35.0, 24.0, 20.0, 17.0, 12.0, 13.0, 12.0, 9.0, 11.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.07421875, -4.904296875, -4.734375, -4.564453125, -4.39453125, -4.224609375, -4.0546875, -3.884765625, -3.71484375, -3.544921875, -3.375, -3.205078125, -3.03515625, -2.865234375, -2.6953125, -2.525390625, -2.35546875, -2.185546875, -2.015625, -1.845703125, -1.67578125, -1.505859375, -1.3359375, -1.166015625, -0.99609375, -0.826171875, -0.65625, -0.486328125, -0.31640625, -0.146484375, 0.0234375, 0.193359375, 0.36328125, 0.533203125, 0.703125, 0.873046875, 1.04296875, 1.212890625, 1.3828125, 1.552734375, 1.72265625, 1.892578125, 2.0625, 2.232421875, 2.40234375, 2.572265625, 2.7421875, 2.912109375, 3.08203125, 3.251953125, 3.421875, 3.591796875, 3.76171875, 3.931640625, 4.1015625, 4.271484375, 4.44140625, 4.611328125, 4.78125, 4.951171875, 5.12109375, 5.291015625, 5.4609375, 5.630859375, 5.80078125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 8.0, 7.0, 6.0, 10.0, 4.0, 13.0, 17.0, 22.0, 26.0, 31.0, 33.0, 38.0, 57.0, 96.0, 156.0, 331.0, 1098.0, 6321.0, 67677.0, 1612939.0, 2372440.0, 121022.0, 9339.0, 1561.0, 427.0, 201.0, 103.0, 53.0, 50.0, 45.0, 24.0, 27.0, 20.0, 14.0, 18.0, 10.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.9765625, -15.4456787109375, -14.914794921875, -14.3839111328125, -13.85302734375, -13.3221435546875, -12.791259765625, -12.2603759765625, -11.7294921875, -11.1986083984375, -10.667724609375, -10.1368408203125, -9.60595703125, -9.0750732421875, -8.544189453125, -8.0133056640625, -7.482421875, -6.9515380859375, -6.420654296875, -5.8897705078125, -5.35888671875, -4.8280029296875, -4.297119140625, -3.7662353515625, -3.2353515625, -2.7044677734375, -2.173583984375, -1.6427001953125, -1.11181640625, -0.5809326171875, -0.050048828125, 0.4808349609375, 1.01171875, 1.5426025390625, 2.073486328125, 2.6043701171875, 3.13525390625, 3.6661376953125, 4.197021484375, 4.7279052734375, 5.2587890625, 5.7896728515625, 6.320556640625, 6.8514404296875, 7.38232421875, 7.9132080078125, 8.444091796875, 8.9749755859375, 9.505859375, 10.0367431640625, 10.567626953125, 11.0985107421875, 11.62939453125, 12.1602783203125, 12.691162109375, 13.2220458984375, 13.7529296875, 14.2838134765625, 14.814697265625, 15.3455810546875, 15.87646484375, 16.4073486328125, 16.938232421875, 17.4691162109375, 18.0]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 3.0, 19.0, 16.0, 31.0, 34.0, 48.0, 88.0, 122.0, 192.0, 230.0, 360.0, 516.0, 609.0, 555.0, 402.0, 263.0, 195.0, 117.0, 74.0, 62.0, 40.0, 27.0, 27.0, 12.0, 8.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.25, -19.646240234375, -19.04248046875, -18.438720703125, -17.8349609375, -17.231201171875, -16.62744140625, -16.023681640625, -15.419921875, -14.816162109375, -14.21240234375, -13.608642578125, -13.0048828125, -12.401123046875, -11.79736328125, -11.193603515625, -10.58984375, -9.986083984375, -9.38232421875, -8.778564453125, -8.1748046875, -7.571044921875, -6.96728515625, -6.363525390625, -5.759765625, -5.156005859375, -4.55224609375, -3.948486328125, -3.3447265625, -2.740966796875, -2.13720703125, -1.533447265625, -0.9296875, -0.325927734375, 0.27783203125, 0.881591796875, 1.4853515625, 2.089111328125, 2.69287109375, 3.296630859375, 3.900390625, 4.504150390625, 5.10791015625, 5.711669921875, 6.3154296875, 6.919189453125, 7.52294921875, 8.126708984375, 8.73046875, 9.334228515625, 9.93798828125, 10.541748046875, 11.1455078125, 11.749267578125, 12.35302734375, 12.956787109375, 13.560546875, 14.164306640625, 14.76806640625, 15.371826171875, 15.9755859375, 16.579345703125, 17.18310546875, 17.786865234375, 18.390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 2.0, 7.0, 4.0, 11.0, 12.0, 18.0, 21.0, 28.0, 40.0, 49.0, 58.0, 93.0, 103.0, 157.0, 215.0, 330.0, 835.0, 7116.0, 3160006.0, 1019411.0, 3970.0, 681.0, 319.0, 208.0, 146.0, 116.0, 78.0, 65.0, 40.0, 37.0, 23.0, 27.0, 12.0, 13.0, 8.0, 4.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.59375, -56.63525390625, -54.6767578125, -52.71826171875, -50.759765625, -48.80126953125, -46.8427734375, -44.88427734375, -42.92578125, -40.96728515625, -39.0087890625, -37.05029296875, -35.091796875, -33.13330078125, -31.1748046875, -29.21630859375, -27.2578125, -25.29931640625, -23.3408203125, -21.38232421875, -19.423828125, -17.46533203125, -15.5068359375, -13.54833984375, -11.58984375, -9.63134765625, -7.6728515625, -5.71435546875, -3.755859375, -1.79736328125, 0.1611328125, 2.11962890625, 4.078125, 6.03662109375, 7.9951171875, 9.95361328125, 11.912109375, 13.87060546875, 15.8291015625, 17.78759765625, 19.74609375, 21.70458984375, 23.6630859375, 25.62158203125, 27.580078125, 29.53857421875, 31.4970703125, 33.45556640625, 35.4140625, 37.37255859375, 39.3310546875, 41.28955078125, 43.248046875, 45.20654296875, 47.1650390625, 49.12353515625, 51.08203125, 53.04052734375, 54.9990234375, 56.95751953125, 58.916015625, 60.87451171875, 62.8330078125, 64.79150390625, 66.75]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 15.0, 24.0, 68.0, 123.0, 210.0, 178.0, 146.0, 118.0, 61.0, 38.0, 16.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.94272232055664, -50.34061050415039, -47.73849868774414, -45.13638687133789, -42.534278869628906, -39.932167053222656, -37.330055236816406, -34.727943420410156, -32.125831604003906, -29.523719787597656, -26.921607971191406, -24.31949806213379, -21.71738624572754, -19.11527442932129, -16.513164520263672, -13.911052703857422, -11.308940887451172, -8.706829071044922, -6.104718208312988, -3.5026068687438965, -0.9004955291748047, 1.7016162872314453, 4.303727149963379, 6.9058380126953125, 9.507949829101562, 12.110061645507812, 14.712172508239746, 17.31428337097168, 19.91639518737793, 22.51850700378418, 25.120616912841797, 27.722728729248047, 30.32483673095703, 32.92694854736328, 35.52906036376953, 38.13117218017578, 40.73328399658203, 43.33539581298828, 45.937503814697266, 48.539615631103516, 51.141727447509766, 53.743839263916016, 56.345951080322266, 58.948062896728516, 61.5501708984375, 64.15228271484375, 66.75439453125, 69.35650634765625, 71.9586181640625, 74.56072998046875, 77.162841796875, 79.76495361328125, 82.3670654296875, 84.96917724609375, 87.5712890625, 90.17340087890625, 92.7755126953125, 95.37762451171875, 97.979736328125, 100.58184814453125, 103.1839599609375, 105.78607177734375, 108.38818359375, 110.99029541015625, 113.59239959716797]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 7.0, 8.0, 9.0, 8.0, 8.0, 12.0, 10.0, 14.0, 14.0, 25.0, 18.0, 34.0, 21.0, 38.0, 33.0, 38.0, 43.0, 43.0, 44.0, 40.0, 43.0, 48.0, 46.0, 38.0, 36.0, 35.0, 31.0, 35.0, 37.0, 21.0, 34.0, 21.0, 13.0, 16.0, 12.0, 18.0, 14.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.909263610839844, -48.3282585144043, -46.74725341796875, -45.16624450683594, -43.58523941040039, -42.004234313964844, -40.4232292175293, -38.84222412109375, -37.2612190246582, -35.680213928222656, -34.09920883178711, -32.51820373535156, -30.937196731567383, -29.356189727783203, -27.775184631347656, -26.19417953491211, -24.61317253112793, -23.032167434692383, -21.451160430908203, -19.870155334472656, -18.28915023803711, -16.708145141601562, -15.127138137817383, -13.546133041381836, -11.965126991271973, -10.38412094116211, -8.803115844726562, -7.222109794616699, -5.641104221343994, -4.060098648071289, -2.479092597961426, -0.8980875015258789, 0.6829185485839844, 2.2639241218566895, 3.8449299335479736, 5.425935745239258, 7.006941318511963, 8.587946891784668, 10.168952941894531, 11.749958038330078, 13.330964088439941, 14.911970138549805, 16.49297523498535, 18.07398223876953, 19.654987335205078, 21.235992431640625, 22.816997528076172, 24.39800262451172, 25.9790096282959, 27.560014724731445, 29.141021728515625, 30.722026824951172, 32.30303192138672, 33.884037017822266, 35.46504211425781, 37.046051025390625, 38.62705612182617, 40.20806121826172, 41.789066314697266, 43.37007141113281, 44.951080322265625, 46.53208541870117, 48.11309051513672, 49.694095611572266, 51.27510070800781]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 12.0, 11.0, 10.0, 8.0, 17.0, 22.0, 23.0, 27.0, 26.0, 29.0, 45.0, 36.0, 37.0, 39.0, 32.0, 51.0, 38.0, 44.0, 46.0, 43.0, 37.0, 39.0, 41.0, 37.0, 35.0, 31.0, 25.0, 22.0, 17.0, 18.0, 21.0, 14.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5546875, -5.3758544921875, -5.197021484375, -5.0181884765625, -4.83935546875, -4.6605224609375, -4.481689453125, -4.3028564453125, -4.1240234375, -3.9451904296875, -3.766357421875, -3.5875244140625, -3.40869140625, -3.2298583984375, -3.051025390625, -2.8721923828125, -2.693359375, -2.5145263671875, -2.335693359375, -2.1568603515625, -1.97802734375, -1.7991943359375, -1.620361328125, -1.4415283203125, -1.2626953125, -1.0838623046875, -0.905029296875, -0.7261962890625, -0.54736328125, -0.3685302734375, -0.189697265625, -0.0108642578125, 0.16796875, 0.3468017578125, 0.525634765625, 0.7044677734375, 0.88330078125, 1.0621337890625, 1.240966796875, 1.4197998046875, 1.5986328125, 1.7774658203125, 1.956298828125, 2.1351318359375, 2.31396484375, 2.4927978515625, 2.671630859375, 2.8504638671875, 3.029296875, 3.2081298828125, 3.386962890625, 3.5657958984375, 3.74462890625, 3.9234619140625, 4.102294921875, 4.2811279296875, 4.4599609375, 4.6387939453125, 4.817626953125, 4.9964599609375, 5.17529296875, 5.3541259765625, 5.532958984375, 5.7117919921875, 5.890625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 11.0, 19.0, 27.0, 52.0, 54.0, 94.0, 138.0, 217.0, 294.0, 463.0, 721.0, 1118.0, 1805.0, 2591.0, 4134.0, 6490.0, 10333.0, 17389.0, 29919.0, 53212.0, 97122.0, 184213.0, 270767.0, 163479.0, 87091.0, 47589.0, 26958.0, 15897.0, 9661.0, 5912.0, 3794.0, 2482.0, 1520.0, 967.0, 689.0, 449.0, 305.0, 189.0, 136.0, 79.0, 49.0, 42.0, 27.0, 19.0, 11.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9563674926757812, -0.9259185791015625, -0.8954696655273438, -0.865020751953125, -0.8345718383789062, -0.8041229248046875, -0.7736740112304688, -0.74322509765625, -0.7127761840820312, -0.6823272705078125, -0.6518783569335938, -0.621429443359375, -0.5909805297851562, -0.5605316162109375, -0.5300827026367188, -0.4996337890625, -0.46918487548828125, -0.4387359619140625, -0.40828704833984375, -0.377838134765625, -0.34738922119140625, -0.3169403076171875, -0.28649139404296875, -0.25604248046875, -0.22559356689453125, -0.1951446533203125, -0.16469573974609375, -0.134246826171875, -0.10379791259765625, -0.0733489990234375, -0.04290008544921875, -0.012451171875, 0.01799774169921875, 0.0484466552734375, 0.07889556884765625, 0.109344482421875, 0.13979339599609375, 0.1702423095703125, 0.20069122314453125, 0.23114013671875, 0.26158905029296875, 0.2920379638671875, 0.32248687744140625, 0.352935791015625, 0.38338470458984375, 0.4138336181640625, 0.44428253173828125, 0.4747314453125, 0.5051803588867188, 0.5356292724609375, 0.5660781860351562, 0.596527099609375, 0.6269760131835938, 0.6574249267578125, 0.6878738403320312, 0.71832275390625, 0.7487716674804688, 0.7792205810546875, 0.8096694946289062, 0.840118408203125, 0.8705673217773438, 0.9010162353515625, 0.9314651489257812, 0.9619140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 9.0, 6.0, 10.0, 10.0, 19.0, 18.0, 14.0, 26.0, 28.0, 45.0, 30.0, 46.0, 33.0, 37.0, 36.0, 28.0, 49.0, 1065.0, 43.0, 46.0, 38.0, 47.0, 39.0, 40.0, 26.0, 26.0, 30.0, 25.0, 30.0, 24.0, 14.0, 20.0, 14.0, 10.0, 4.0, 8.0, 6.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0], "bins": [-4.18359375, -4.06707763671875, -3.9505615234375, -3.83404541015625, -3.717529296875, -3.60101318359375, -3.4844970703125, -3.36798095703125, -3.25146484375, -3.13494873046875, -3.0184326171875, -2.90191650390625, -2.785400390625, -2.66888427734375, -2.5523681640625, -2.43585205078125, -2.3193359375, -2.20281982421875, -2.0863037109375, -1.96978759765625, -1.853271484375, -1.73675537109375, -1.6202392578125, -1.50372314453125, -1.38720703125, -1.27069091796875, -1.1541748046875, -1.03765869140625, -0.921142578125, -0.80462646484375, -0.6881103515625, -0.57159423828125, -0.455078125, -0.33856201171875, -0.2220458984375, -0.10552978515625, 0.010986328125, 0.12750244140625, 0.2440185546875, 0.36053466796875, 0.47705078125, 0.59356689453125, 0.7100830078125, 0.82659912109375, 0.943115234375, 1.05963134765625, 1.1761474609375, 1.29266357421875, 1.4091796875, 1.52569580078125, 1.6422119140625, 1.75872802734375, 1.875244140625, 1.99176025390625, 2.1082763671875, 2.22479248046875, 2.34130859375, 2.45782470703125, 2.5743408203125, 2.69085693359375, 2.807373046875, 2.92388916015625, 3.0404052734375, 3.15692138671875, 3.2734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 12.0, 23.0, 31.0, 24.0, 72.0, 81.0, 133.0, 193.0, 325.0, 476.0, 836.0, 1276.0, 1985.0, 3081.0, 5152.0, 8236.0, 13357.0, 22130.0, 37946.0, 65216.0, 117977.0, 225570.0, 1294953.0, 127456.0, 69846.0, 39582.0, 23720.0, 14155.0, 8701.0, 5368.0, 3379.0, 2170.0, 1346.0, 821.0, 560.0, 327.0, 218.0, 142.0, 83.0, 59.0, 55.0, 16.0, 12.0, 8.0, 10.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8340911865234375, -0.805389404296875, -0.7766876220703125, -0.74798583984375, -0.7192840576171875, -0.690582275390625, -0.6618804931640625, -0.6331787109375, -0.6044769287109375, -0.575775146484375, -0.5470733642578125, -0.51837158203125, -0.4896697998046875, -0.460968017578125, -0.4322662353515625, -0.403564453125, -0.3748626708984375, -0.346160888671875, -0.3174591064453125, -0.28875732421875, -0.2600555419921875, -0.231353759765625, -0.2026519775390625, -0.1739501953125, -0.1452484130859375, -0.116546630859375, -0.0878448486328125, -0.05914306640625, -0.0304412841796875, -0.001739501953125, 0.0269622802734375, 0.0556640625, 0.0843658447265625, 0.113067626953125, 0.1417694091796875, 0.17047119140625, 0.1991729736328125, 0.227874755859375, 0.2565765380859375, 0.2852783203125, 0.3139801025390625, 0.342681884765625, 0.3713836669921875, 0.40008544921875, 0.4287872314453125, 0.457489013671875, 0.4861907958984375, 0.514892578125, 0.5435943603515625, 0.572296142578125, 0.6009979248046875, 0.62969970703125, 0.6584014892578125, 0.687103271484375, 0.7158050537109375, 0.7445068359375, 0.7732086181640625, 0.801910400390625, 0.8306121826171875, 0.85931396484375, 0.8880157470703125, 0.916717529296875, 0.9454193115234375, 0.97412109375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 5.0, 6.0, 8.0, 3.0, 8.0, 12.0, 15.0, 6.0, 21.0, 25.0, 24.0, 32.0, 41.0, 57.0, 51.0, 60.0, 62.0, 71.0, 68.0, 58.0, 38.0, 60.0, 49.0, 43.0, 32.0, 33.0, 23.0, 10.0, 14.0, 11.0, 9.0, 15.0, 6.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004563331604003906, -0.00044209882616996765, -0.0004278644919395447, -0.0004136301577091217, -0.00039939582347869873, -0.00038516148924827576, -0.0003709271550178528, -0.0003566928207874298, -0.00034245848655700684, -0.00032822415232658386, -0.0003139898180961609, -0.0002997554838657379, -0.00028552114963531494, -0.00027128681540489197, -0.000257052481174469, -0.00024281814694404602, -0.00022858381271362305, -0.00021434947848320007, -0.0002001151442527771, -0.00018588081002235413, -0.00017164647579193115, -0.00015741214156150818, -0.0001431778073310852, -0.00012894347310066223, -0.00011470913887023926, -0.00010047480463981628, -8.624047040939331e-05, -7.200613617897034e-05, -5.777180194854736e-05, -4.353746771812439e-05, -2.9303133487701416e-05, -1.5068799257278442e-05, -8.344650268554688e-07, 1.3399869203567505e-05, 2.763420343399048e-05, 4.186853766441345e-05, 5.6102871894836426e-05, 7.03372061252594e-05, 8.457154035568237e-05, 9.880587458610535e-05, 0.00011304020881652832, 0.0001272745430469513, 0.00014150887727737427, 0.00015574321150779724, 0.00016997754573822021, 0.0001842118799686432, 0.00019844621419906616, 0.00021268054842948914, 0.0002269148826599121, 0.00024114921689033508, 0.00025538355112075806, 0.00026961788535118103, 0.000283852219581604, 0.000298086553812027, 0.00031232088804244995, 0.0003265552222728729, 0.0003407895565032959, 0.00035502389073371887, 0.00036925822496414185, 0.0003834925591945648, 0.0003977268934249878, 0.00041196122765541077, 0.00042619556188583374, 0.0004404298961162567, 0.0004546642303466797]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 8.0, 9.0, 13.0, 18.0, 33.0, 34.0, 53.0, 71.0, 118.0, 213.0, 330.0, 821.0, 244133.0, 800553.0, 1071.0, 421.0, 211.0, 136.0, 72.0, 46.0, 32.0, 25.0, 18.0, 18.0, 16.0, 12.0, 10.0, 8.0, 3.0, 4.0, 5.0, 3.0, 9.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01161956787109375, -0.01124560832977295, -0.010871648788452148, -0.010497689247131348, -0.010123729705810547, -0.009749770164489746, -0.009375810623168945, -0.009001851081848145, -0.008627891540527344, -0.008253931999206543, -0.007879972457885742, -0.007506012916564941, -0.007132053375244141, -0.00675809383392334, -0.006384134292602539, -0.006010174751281738, -0.0056362152099609375, -0.005262255668640137, -0.004888296127319336, -0.004514336585998535, -0.004140377044677734, -0.0037664175033569336, -0.003392457962036133, -0.003018498420715332, -0.0026445388793945312, -0.0022705793380737305, -0.0018966197967529297, -0.001522660255432129, -0.0011487007141113281, -0.0007747411727905273, -0.00040078163146972656, -2.682209014892578e-05, 0.000347137451171875, 0.0007210969924926758, 0.0010950565338134766, 0.0014690160751342773, 0.0018429756164550781, 0.002216935157775879, 0.0025908946990966797, 0.0029648542404174805, 0.0033388137817382812, 0.003712773323059082, 0.004086732864379883, 0.004460692405700684, 0.004834651947021484, 0.005208611488342285, 0.005582571029663086, 0.005956530570983887, 0.0063304901123046875, 0.006704449653625488, 0.007078409194946289, 0.00745236873626709, 0.00782632827758789, 0.008200287818908691, 0.008574247360229492, 0.008948206901550293, 0.009322166442871094, 0.009696125984191895, 0.010070085525512695, 0.010444045066833496, 0.010818004608154297, 0.011191964149475098, 0.011565923690795898, 0.0119398832321167, 0.0123138427734375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 76.0, 348.0, 413.0, 146.0, 23.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006749026360921562, -0.0006397803663276136, -0.0006046581547707319, -0.0005695358850061893, -0.0005344136152416468, -0.0004992913454771042, -0.00046416910481639206, -0.00042904686415567994, -0.00039392459439113736, -0.0003588023246265948, -0.00032368008396588266, -0.00028855784330517054, -0.00025343557354062796, -0.0002183133183280006, -0.00018319106311537325, -0.00014806882245466113, -0.00011294655269011855, -7.78242974774912e-05, -4.270204226486385e-05, -7.579787052236497e-06, 2.7542468160390854e-05, 6.26647233730182e-05, 9.778697858564556e-05, 0.00013290921924635768, 0.00016803148901090026, 0.0002031537442235276, 0.00023827599943615496, 0.0002733982400968671, 0.00030852050986140966, 0.00034364277962595224, 0.00037876502028666437, 0.0004138872609473765, 0.00044900947250425816, 0.00048413174226880074, 0.0005192540120333433, 0.000554376223590225, 0.0005894984933547676, 0.0006246207631193101, 0.0006597429746761918, 0.0006948652444407344, 0.000729987514205277, 0.0007651097839698195, 0.0008002320537343621, 0.0008353542652912438, 0.0008704765350557864, 0.000905598804820329, 0.0009407210163772106, 0.0009758432861417532, 0.0010109655559062958, 0.0010460878256708384, 0.001081210095435381, 0.0011163323651999235, 0.001151454634964466, 0.0011865767883136868, 0.0012216990580782294, 0.001256821327842772, 0.0012919435976073146, 0.0013270658673718572, 0.0013621881371363997, 0.0013973104069009423, 0.001432432560250163, 0.0014675548300147057, 0.0015026770997792482, 0.0015377993695437908, 0.0015729216393083334]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 3.0, 7.0, 4.0, 15.0, 13.0, 16.0, 16.0, 23.0, 21.0, 23.0, 34.0, 23.0, 33.0, 36.0, 37.0, 40.0, 38.0, 30.0, 35.0, 45.0, 53.0, 23.0, 45.0, 45.0, 34.0, 26.0, 33.0, 30.0, 37.0, 19.0, 28.0, 17.0, 16.0, 13.0, 11.0, 6.0, 18.0, 10.0, 4.0, 5.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00021910667419433594, -0.00021243561059236526, -0.0002057645469903946, -0.00019909348338842392, -0.00019242241978645325, -0.00018575135618448257, -0.0001790802925825119, -0.00017240922898054123, -0.00016573816537857056, -0.00015906710177659988, -0.0001523960381746292, -0.00014572497457265854, -0.00013905391097068787, -0.0001323828473687172, -0.00012571178376674652, -0.00011904072016477585, -0.00011236965656280518, -0.0001056985929608345, -9.902752935886383e-05, -9.235646575689316e-05, -8.568540215492249e-05, -7.901433855295181e-05, -7.234327495098114e-05, -6.567221134901047e-05, -5.9001147747039795e-05, -5.233008414506912e-05, -4.565902054309845e-05, -3.898795694112778e-05, -3.2316893339157104e-05, -2.5645829737186432e-05, -1.897476613521576e-05, -1.2303702533245087e-05, -5.632638931274414e-06, 1.0384246706962585e-06, 7.709488272666931e-06, 1.4380551874637604e-05, 2.1051615476608276e-05, 2.772267907857895e-05, 3.439374268054962e-05, 4.1064806282520294e-05, 4.773586988449097e-05, 5.440693348646164e-05, 6.107799708843231e-05, 6.774906069040298e-05, 7.442012429237366e-05, 8.109118789434433e-05, 8.7762251496315e-05, 9.443331509828568e-05, 0.00010110437870025635, 0.00010777544230222702, 0.00011444650590419769, 0.00012111756950616837, 0.00012778863310813904, 0.0001344596967101097, 0.00014113076031208038, 0.00014780182391405106, 0.00015447288751602173, 0.0001611439511179924, 0.00016781501471996307, 0.00017448607832193375, 0.00018115714192390442, 0.0001878282055258751, 0.00019449926912784576, 0.00020117033272981644, 0.0002078413963317871]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 12.0, 11.0, 10.0, 8.0, 17.0, 22.0, 23.0, 27.0, 26.0, 29.0, 45.0, 36.0, 37.0, 39.0, 32.0, 51.0, 38.0, 44.0, 46.0, 43.0, 37.0, 39.0, 41.0, 37.0, 35.0, 31.0, 25.0, 22.0, 17.0, 18.0, 21.0, 14.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5546875, -5.3758544921875, -5.197021484375, -5.0181884765625, -4.83935546875, -4.6605224609375, -4.481689453125, -4.3028564453125, -4.1240234375, -3.9451904296875, -3.766357421875, -3.5875244140625, -3.40869140625, -3.2298583984375, -3.051025390625, -2.8721923828125, -2.693359375, -2.5145263671875, -2.335693359375, -2.1568603515625, -1.97802734375, -1.7991943359375, -1.620361328125, -1.4415283203125, -1.2626953125, -1.0838623046875, -0.905029296875, -0.7261962890625, -0.54736328125, -0.3685302734375, -0.189697265625, -0.0108642578125, 0.16796875, 0.3468017578125, 0.525634765625, 0.7044677734375, 0.88330078125, 1.0621337890625, 1.240966796875, 1.4197998046875, 1.5986328125, 1.7774658203125, 1.956298828125, 2.1351318359375, 2.31396484375, 2.4927978515625, 2.671630859375, 2.8504638671875, 3.029296875, 3.2081298828125, 3.386962890625, 3.5657958984375, 3.74462890625, 3.9234619140625, 4.102294921875, 4.2811279296875, 4.4599609375, 4.6387939453125, 4.817626953125, 4.9964599609375, 5.17529296875, 5.3541259765625, 5.532958984375, 5.7117919921875, 5.890625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 34.0, 33.0, 53.0, 69.0, 108.0, 136.0, 194.0, 282.0, 391.0, 579.0, 907.0, 1337.0, 2202.0, 3598.0, 6162.0, 11728.0, 24533.0, 60251.0, 194739.0, 504320.0, 143932.0, 47955.0, 20478.0, 10027.0, 5499.0, 3094.0, 1955.0, 1216.0, 809.0, 546.0, 399.0, 291.0, 199.0, 116.0, 90.0, 77.0, 37.0, 37.0, 33.0, 21.0, 19.0, 11.0, 6.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.65234375, -4.51300048828125, -4.3736572265625, -4.23431396484375, -4.094970703125, -3.95562744140625, -3.8162841796875, -3.67694091796875, -3.53759765625, -3.39825439453125, -3.2589111328125, -3.11956787109375, -2.980224609375, -2.84088134765625, -2.7015380859375, -2.56219482421875, -2.4228515625, -2.28350830078125, -2.1441650390625, -2.00482177734375, -1.865478515625, -1.72613525390625, -1.5867919921875, -1.44744873046875, -1.30810546875, -1.16876220703125, -1.0294189453125, -0.89007568359375, -0.750732421875, -0.61138916015625, -0.4720458984375, -0.33270263671875, -0.193359375, -0.05401611328125, 0.0853271484375, 0.22467041015625, 0.364013671875, 0.50335693359375, 0.6427001953125, 0.78204345703125, 0.92138671875, 1.06072998046875, 1.2000732421875, 1.33941650390625, 1.478759765625, 1.61810302734375, 1.7574462890625, 1.89678955078125, 2.0361328125, 2.17547607421875, 2.3148193359375, 2.45416259765625, 2.593505859375, 2.73284912109375, 2.8721923828125, 3.01153564453125, 3.15087890625, 3.29022216796875, 3.4295654296875, 3.56890869140625, 3.708251953125, 3.84759521484375, 3.9869384765625, 4.12628173828125, 4.265625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 5.0, 7.0, 3.0, 8.0, 9.0, 11.0, 12.0, 14.0, 21.0, 27.0, 24.0, 25.0, 21.0, 32.0, 26.0, 29.0, 33.0, 29.0, 56.0, 83.0, 271.0, 1680.0, 123.0, 61.0, 55.0, 44.0, 31.0, 28.0, 32.0, 34.0, 27.0, 29.0, 16.0, 18.0, 20.0, 16.0, 8.0, 10.0, 10.0, 13.0, 8.0, 9.0, 8.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.533447265625, -16.00439453125, -15.475341796875, -14.9462890625, -14.417236328125, -13.88818359375, -13.359130859375, -12.830078125, -12.301025390625, -11.77197265625, -11.242919921875, -10.7138671875, -10.184814453125, -9.65576171875, -9.126708984375, -8.59765625, -8.068603515625, -7.53955078125, -7.010498046875, -6.4814453125, -5.952392578125, -5.42333984375, -4.894287109375, -4.365234375, -3.836181640625, -3.30712890625, -2.778076171875, -2.2490234375, -1.719970703125, -1.19091796875, -0.661865234375, -0.1328125, 0.396240234375, 0.92529296875, 1.454345703125, 1.9833984375, 2.512451171875, 3.04150390625, 3.570556640625, 4.099609375, 4.628662109375, 5.15771484375, 5.686767578125, 6.2158203125, 6.744873046875, 7.27392578125, 7.802978515625, 8.33203125, 8.861083984375, 9.39013671875, 9.919189453125, 10.4482421875, 10.977294921875, 11.50634765625, 12.035400390625, 12.564453125, 13.093505859375, 13.62255859375, 14.151611328125, 14.6806640625, 15.209716796875, 15.73876953125, 16.267822265625, 16.796875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 11.0, 16.0, 17.0, 23.0, 23.0, 25.0, 43.0, 41.0, 82.0, 132.0, 167.0, 283.0, 646.0, 3322.0, 609572.0, 2525340.0, 4324.0, 710.0, 313.0, 163.0, 113.0, 81.0, 62.0, 57.0, 28.0, 22.0, 14.0, 14.0, 9.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.15625, -35.78271484375, -34.4091796875, -33.03564453125, -31.662109375, -30.28857421875, -28.9150390625, -27.54150390625, -26.16796875, -24.79443359375, -23.4208984375, -22.04736328125, -20.673828125, -19.30029296875, -17.9267578125, -16.55322265625, -15.1796875, -13.80615234375, -12.4326171875, -11.05908203125, -9.685546875, -8.31201171875, -6.9384765625, -5.56494140625, -4.19140625, -2.81787109375, -1.4443359375, -0.07080078125, 1.302734375, 2.67626953125, 4.0498046875, 5.42333984375, 6.796875, 8.17041015625, 9.5439453125, 10.91748046875, 12.291015625, 13.66455078125, 15.0380859375, 16.41162109375, 17.78515625, 19.15869140625, 20.5322265625, 21.90576171875, 23.279296875, 24.65283203125, 26.0263671875, 27.39990234375, 28.7734375, 30.14697265625, 31.5205078125, 32.89404296875, 34.267578125, 35.64111328125, 37.0146484375, 38.38818359375, 39.76171875, 41.13525390625, 42.5087890625, 43.88232421875, 45.255859375, 46.62939453125, 48.0029296875, 49.37646484375, 50.75]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 10.0, 22.0, 55.0, 58.0, 100.0, 113.0, 176.0, 137.0, 101.0, 97.0, 55.0, 39.0, 13.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.346296310424805, -28.64324188232422, -27.940187454223633, -27.237133026123047, -26.534076690673828, -25.831022262573242, -25.127967834472656, -24.42491340637207, -23.721858978271484, -23.0188045501709, -22.315750122070312, -21.612693786621094, -20.909639358520508, -20.206584930419922, -19.503530502319336, -18.80047607421875, -18.09741973876953, -17.394365310668945, -16.69131088256836, -15.988255500793457, -15.285201072692871, -14.582145690917969, -13.879091262817383, -13.176036834716797, -12.472982406616211, -11.769927978515625, -11.066872596740723, -10.363818168640137, -9.66076374053955, -8.957708358764648, -8.254653930664062, -7.551599502563477, -6.848544120788574, -6.14548921585083, -5.442434787750244, -4.7393798828125, -4.036325454711914, -3.33327054977417, -2.630215644836426, -1.9271612167358398, -1.2241063117980957, -0.5210515856742859, 0.18200314044952393, 0.8850579261779785, 1.5881125926971436, 2.2911672592163086, 2.9942221641540527, 3.6972765922546387, 4.400331497192383, 5.103386402130127, 5.806440830230713, 6.509495735168457, 7.212550163269043, 7.915605068206787, 8.618659973144531, 9.321714401245117, 10.024768829345703, 10.727823257446289, 11.430878639221191, 12.133933067321777, 12.836987495422363, 13.540042877197266, 14.243097305297852, 14.946151733398438, 15.64920711517334]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 10.0, 7.0, 9.0, 16.0, 12.0, 14.0, 7.0, 13.0, 22.0, 15.0, 20.0, 38.0, 30.0, 28.0, 28.0, 37.0, 34.0, 40.0, 41.0, 40.0, 35.0, 54.0, 32.0, 37.0, 36.0, 33.0, 35.0, 27.0, 29.0, 25.0, 22.0, 28.0, 29.0, 14.0, 18.0, 19.0, 12.0, 6.0, 9.0, 7.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-57.35395812988281, -55.69116973876953, -54.028385162353516, -52.3656005859375, -50.70281219482422, -49.04002380371094, -47.37723922729492, -45.714454650878906, -44.051666259765625, -42.388877868652344, -40.72609329223633, -39.06330871582031, -37.40052032470703, -35.73773193359375, -34.074947357177734, -32.41216278076172, -30.749374389648438, -29.08658790588379, -27.42380142211914, -25.761014938354492, -24.098228454589844, -22.435441970825195, -20.772655487060547, -19.1098690032959, -17.44708251953125, -15.784296035766602, -14.121509552001953, -12.458723068237305, -10.795936584472656, -9.133150100708008, -7.470363616943359, -5.807577133178711, -4.1447906494140625, -2.482004165649414, -0.8192176818847656, 0.8435688018798828, 2.5063552856445312, 4.16914176940918, 5.831928253173828, 7.494714736938477, 9.157501220703125, 10.820287704467773, 12.483074188232422, 14.14586067199707, 15.808647155761719, 17.471433639526367, 19.134220123291016, 20.797006607055664, 22.459793090820312, 24.12257957458496, 25.78536605834961, 27.448152542114258, 29.110939025878906, 30.773725509643555, 32.4365119934082, 34.09929656982422, 35.7620849609375, 37.42487335205078, 39.0876579284668, 40.75044250488281, 42.413230895996094, 44.076019287109375, 45.73880386352539, 47.401588439941406, 49.06437683105469]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 6.0, 14.0, 11.0, 16.0, 15.0, 27.0, 19.0, 32.0, 25.0, 30.0, 43.0, 41.0, 31.0, 40.0, 49.0, 33.0, 43.0, 44.0, 46.0, 41.0, 35.0, 49.0, 42.0, 34.0, 37.0, 25.0, 16.0, 24.0, 18.0, 21.0, 18.0, 7.0, 10.0, 9.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.66796875, -5.4833984375, -5.298828125, -5.1142578125, -4.9296875, -4.7451171875, -4.560546875, -4.3759765625, -4.19140625, -4.0068359375, -3.822265625, -3.6376953125, -3.453125, -3.2685546875, -3.083984375, -2.8994140625, -2.71484375, -2.5302734375, -2.345703125, -2.1611328125, -1.9765625, -1.7919921875, -1.607421875, -1.4228515625, -1.23828125, -1.0537109375, -0.869140625, -0.6845703125, -0.5, -0.3154296875, -0.130859375, 0.0537109375, 0.23828125, 0.4228515625, 0.607421875, 0.7919921875, 0.9765625, 1.1611328125, 1.345703125, 1.5302734375, 1.71484375, 1.8994140625, 2.083984375, 2.2685546875, 2.453125, 2.6376953125, 2.822265625, 3.0068359375, 3.19140625, 3.3759765625, 3.560546875, 3.7451171875, 3.9296875, 4.1142578125, 4.298828125, 4.4833984375, 4.66796875, 4.8525390625, 5.037109375, 5.2216796875, 5.40625, 5.5908203125, 5.775390625, 5.9599609375, 6.14453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 8.0, 16.0, 22.0, 33.0, 62.0, 74.0, 120.0, 180.0, 310.0, 584.0, 1073.0, 2127.0, 4443.0, 10263.0, 27643.0, 88036.0, 324207.0, 1008811.0, 1525975.0, 835750.0, 254567.0, 70797.0, 22539.0, 8820.0, 3717.0, 1833.0, 930.0, 481.0, 310.0, 176.0, 111.0, 71.0, 46.0, 33.0, 25.0, 19.0, 11.0, 10.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.6412353515625, -5.442626953125, -5.2440185546875, -5.04541015625, -4.8468017578125, -4.648193359375, -4.4495849609375, -4.2509765625, -4.0523681640625, -3.853759765625, -3.6551513671875, -3.45654296875, -3.2579345703125, -3.059326171875, -2.8607177734375, -2.662109375, -2.4635009765625, -2.264892578125, -2.0662841796875, -1.86767578125, -1.6690673828125, -1.470458984375, -1.2718505859375, -1.0732421875, -0.8746337890625, -0.676025390625, -0.4774169921875, -0.27880859375, -0.0802001953125, 0.118408203125, 0.3170166015625, 0.515625, 0.7142333984375, 0.912841796875, 1.1114501953125, 1.31005859375, 1.5086669921875, 1.707275390625, 1.9058837890625, 2.1044921875, 2.3031005859375, 2.501708984375, 2.7003173828125, 2.89892578125, 3.0975341796875, 3.296142578125, 3.4947509765625, 3.693359375, 3.8919677734375, 4.090576171875, 4.2891845703125, 4.48779296875, 4.6864013671875, 4.885009765625, 5.0836181640625, 5.2822265625, 5.4808349609375, 5.679443359375, 5.8780517578125, 6.07666015625, 6.2752685546875, 6.473876953125, 6.6724853515625, 6.87109375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 12.0, 12.0, 10.0, 15.0, 28.0, 45.0, 61.0, 72.0, 101.0, 133.0, 168.0, 256.0, 316.0, 433.0, 507.0, 481.0, 396.0, 280.0, 209.0, 122.0, 133.0, 79.0, 54.0, 46.0, 34.0, 21.0, 17.0, 10.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.078125, -20.57275390625, -20.0673828125, -19.56201171875, -19.056640625, -18.55126953125, -18.0458984375, -17.54052734375, -17.03515625, -16.52978515625, -16.0244140625, -15.51904296875, -15.013671875, -14.50830078125, -14.0029296875, -13.49755859375, -12.9921875, -12.48681640625, -11.9814453125, -11.47607421875, -10.970703125, -10.46533203125, -9.9599609375, -9.45458984375, -8.94921875, -8.44384765625, -7.9384765625, -7.43310546875, -6.927734375, -6.42236328125, -5.9169921875, -5.41162109375, -4.90625, -4.40087890625, -3.8955078125, -3.39013671875, -2.884765625, -2.37939453125, -1.8740234375, -1.36865234375, -0.86328125, -0.35791015625, 0.1474609375, 0.65283203125, 1.158203125, 1.66357421875, 2.1689453125, 2.67431640625, 3.1796875, 3.68505859375, 4.1904296875, 4.69580078125, 5.201171875, 5.70654296875, 6.2119140625, 6.71728515625, 7.22265625, 7.72802734375, 8.2333984375, 8.73876953125, 9.244140625, 9.74951171875, 10.2548828125, 10.76025390625, 11.265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 5.0, 8.0, 8.0, 10.0, 15.0, 18.0, 30.0, 30.0, 54.0, 75.0, 86.0, 116.0, 154.0, 266.0, 477.0, 2098.0, 224599.0, 3953174.0, 11097.0, 861.0, 352.0, 218.0, 146.0, 77.0, 70.0, 59.0, 36.0, 43.0, 19.0, 14.0, 20.0, 13.0, 11.0, 9.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.1875, -48.1181640625, -46.048828125, -43.9794921875, -41.91015625, -39.8408203125, -37.771484375, -35.7021484375, -33.6328125, -31.5634765625, -29.494140625, -27.4248046875, -25.35546875, -23.2861328125, -21.216796875, -19.1474609375, -17.078125, -15.0087890625, -12.939453125, -10.8701171875, -8.80078125, -6.7314453125, -4.662109375, -2.5927734375, -0.5234375, 1.5458984375, 3.615234375, 5.6845703125, 7.75390625, 9.8232421875, 11.892578125, 13.9619140625, 16.03125, 18.1005859375, 20.169921875, 22.2392578125, 24.30859375, 26.3779296875, 28.447265625, 30.5166015625, 32.5859375, 34.6552734375, 36.724609375, 38.7939453125, 40.86328125, 42.9326171875, 45.001953125, 47.0712890625, 49.140625, 51.2099609375, 53.279296875, 55.3486328125, 57.41796875, 59.4873046875, 61.556640625, 63.6259765625, 65.6953125, 67.7646484375, 69.833984375, 71.9033203125, 73.97265625, 76.0419921875, 78.111328125, 80.1806640625, 82.25]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 10.0, 63.0, 173.0, 275.0, 268.0, 159.0, 45.0, 13.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-199.8118133544922, -195.46070861816406, -191.10958862304688, -186.75848388671875, -182.40737915039062, -178.0562744140625, -173.7051544189453, -169.3540496826172, -165.00294494628906, -160.65184020996094, -156.30072021484375, -151.94961547851562, -147.5985107421875, -143.24740600585938, -138.8962860107422, -134.54518127441406, -130.19406127929688, -125.84294891357422, -121.4918441772461, -117.14073181152344, -112.78962707519531, -108.43851470947266, -104.08740234375, -99.73629760742188, -95.38519287109375, -91.0340805053711, -86.68297576904297, -82.33186340332031, -77.98075866699219, -73.62964630126953, -69.27853393554688, -64.92742919921875, -60.576324462890625, -56.225215911865234, -51.874107360839844, -47.52299499511719, -43.17189025878906, -38.820777893066406, -34.469669342041016, -30.118560791015625, -25.767452239990234, -21.416343688964844, -17.065235137939453, -12.71412467956543, -8.363016128540039, -4.011907577514648, 0.339202880859375, 4.690311431884766, 9.041419982910156, 13.392528533935547, 17.743637084960938, 22.09474754333496, 26.44585609436035, 30.796964645385742, 35.148075103759766, 39.499183654785156, 43.85029220581055, 48.20140075683594, 52.55250930786133, 56.90361785888672, 61.254730224609375, 65.6058349609375, 69.95694732666016, 74.30805969238281, 78.65916442871094]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 3.0, 11.0, 7.0, 9.0, 7.0, 16.0, 18.0, 16.0, 22.0, 18.0, 20.0, 28.0, 28.0, 36.0, 36.0, 52.0, 49.0, 53.0, 38.0, 46.0, 36.0, 43.0, 33.0, 36.0, 40.0, 39.0, 34.0, 27.0, 33.0, 30.0, 19.0, 20.0, 14.0, 12.0, 13.0, 10.0, 13.0, 9.0, 6.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.4869384765625, -49.87363052368164, -48.260318756103516, -46.647010803222656, -45.03369903564453, -43.42039108276367, -41.80708312988281, -40.19377136230469, -38.58046340942383, -36.96715545654297, -35.353843688964844, -33.740535736083984, -32.12722396850586, -30.513916015625, -28.900606155395508, -27.287296295166016, -25.673986434936523, -24.06067657470703, -22.44736671447754, -20.834056854248047, -19.220748901367188, -17.607439041137695, -15.994129180908203, -14.380820274353027, -12.767510414123535, -11.154200553894043, -9.540891647338867, -7.927581787109375, -6.314272403717041, -4.700963020324707, -3.087653160095215, -1.474344253540039, 0.13896560668945312, 1.7522751092910767, 3.3655846118927, 4.978894233703613, 6.592203617095947, 8.205513000488281, 9.818822860717773, 11.43213176727295, 13.045441627502441, 14.658751487731934, 16.27206039428711, 17.8853702545166, 19.498680114746094, 21.111988067626953, 22.725299835205078, 24.338607788085938, 25.95191764831543, 27.565227508544922, 29.178537368774414, 30.791847229003906, 32.405155181884766, 34.018463134765625, 35.63177490234375, 37.24508285522461, 38.858394622802734, 40.471702575683594, 42.08501434326172, 43.69832229614258, 45.3116340637207, 46.92494201660156, 48.53825378417969, 50.15156173706055, 51.764869689941406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 6.0, 22.0, 22.0, 25.0, 17.0, 35.0, 36.0, 30.0, 36.0, 37.0, 50.0, 34.0, 48.0, 44.0, 42.0, 46.0, 53.0, 45.0, 36.0, 40.0, 32.0, 29.0, 23.0, 31.0, 29.0, 17.0, 14.0, 13.0, 20.0, 7.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.55078125, -6.3590087890625, -6.167236328125, -5.9754638671875, -5.78369140625, -5.5919189453125, -5.400146484375, -5.2083740234375, -5.0166015625, -4.8248291015625, -4.633056640625, -4.4412841796875, -4.24951171875, -4.0577392578125, -3.865966796875, -3.6741943359375, -3.482421875, -3.2906494140625, -3.098876953125, -2.9071044921875, -2.71533203125, -2.5235595703125, -2.331787109375, -2.1400146484375, -1.9482421875, -1.7564697265625, -1.564697265625, -1.3729248046875, -1.18115234375, -0.9893798828125, -0.797607421875, -0.6058349609375, -0.4140625, -0.2222900390625, -0.030517578125, 0.1612548828125, 0.35302734375, 0.5447998046875, 0.736572265625, 0.9283447265625, 1.1201171875, 1.3118896484375, 1.503662109375, 1.6954345703125, 1.88720703125, 2.0789794921875, 2.270751953125, 2.4625244140625, 2.654296875, 2.8460693359375, 3.037841796875, 3.2296142578125, 3.42138671875, 3.6131591796875, 3.804931640625, 3.9967041015625, 4.1884765625, 4.3802490234375, 4.572021484375, 4.7637939453125, 4.95556640625, 5.1473388671875, 5.339111328125, 5.5308837890625, 5.72265625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 9.0, 6.0, 6.0, 17.0, 22.0, 33.0, 43.0, 51.0, 95.0, 150.0, 201.0, 323.0, 468.0, 736.0, 1060.0, 1597.0, 2532.0, 3924.0, 6090.0, 9483.0, 15250.0, 24923.0, 40460.0, 69007.0, 119891.0, 215314.0, 225635.0, 126166.0, 72457.0, 43064.0, 25618.0, 15892.0, 9843.0, 6407.0, 4040.0, 2665.0, 1722.0, 1114.0, 765.0, 473.0, 331.0, 237.0, 139.0, 90.0, 76.0, 43.0, 32.0, 21.0, 17.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.86572265625, -0.8378372192382812, -0.8099517822265625, -0.7820663452148438, -0.754180908203125, -0.7262954711914062, -0.6984100341796875, -0.6705245971679688, -0.64263916015625, -0.6147537231445312, -0.5868682861328125, -0.5589828491210938, -0.531097412109375, -0.5032119750976562, -0.4753265380859375, -0.44744110107421875, -0.4195556640625, -0.39167022705078125, -0.3637847900390625, -0.33589935302734375, -0.308013916015625, -0.28012847900390625, -0.2522430419921875, -0.22435760498046875, -0.19647216796875, -0.16858673095703125, -0.1407012939453125, -0.11281585693359375, -0.084930419921875, -0.05704498291015625, -0.0291595458984375, -0.00127410888671875, 0.026611328125, 0.05449676513671875, 0.0823822021484375, 0.11026763916015625, 0.138153076171875, 0.16603851318359375, 0.1939239501953125, 0.22180938720703125, 0.24969482421875, 0.27758026123046875, 0.3054656982421875, 0.33335113525390625, 0.361236572265625, 0.38912200927734375, 0.4170074462890625, 0.44489288330078125, 0.4727783203125, 0.5006637573242188, 0.5285491943359375, 0.5564346313476562, 0.584320068359375, 0.6122055053710938, 0.6400909423828125, 0.6679763793945312, 0.69586181640625, 0.7237472534179688, 0.7516326904296875, 0.7795181274414062, 0.807403564453125, 0.8352890014648438, 0.8631744384765625, 0.8910598754882812, 0.9189453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 7.0, 2.0, 2.0, 3.0, 8.0, 10.0, 9.0, 10.0, 9.0, 18.0, 8.0, 11.0, 21.0, 25.0, 30.0, 26.0, 28.0, 33.0, 29.0, 33.0, 41.0, 39.0, 34.0, 27.0, 38.0, 1056.0, 27.0, 32.0, 43.0, 33.0, 33.0, 35.0, 36.0, 32.0, 19.0, 20.0, 20.0, 24.0, 17.0, 16.0, 19.0, 11.0, 12.0, 10.0, 8.0, 14.0, 9.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.55078125, -3.448150634765625, -3.34552001953125, -3.242889404296875, -3.1402587890625, -3.037628173828125, -2.93499755859375, -2.832366943359375, -2.729736328125, -2.627105712890625, -2.52447509765625, -2.421844482421875, -2.3192138671875, -2.216583251953125, -2.11395263671875, -2.011322021484375, -1.90869140625, -1.806060791015625, -1.70343017578125, -1.600799560546875, -1.4981689453125, -1.395538330078125, -1.29290771484375, -1.190277099609375, -1.087646484375, -0.985015869140625, -0.88238525390625, -0.779754638671875, -0.6771240234375, -0.574493408203125, -0.47186279296875, -0.369232177734375, -0.2666015625, -0.163970947265625, -0.06134033203125, 0.041290283203125, 0.1439208984375, 0.246551513671875, 0.34918212890625, 0.451812744140625, 0.554443359375, 0.657073974609375, 0.75970458984375, 0.862335205078125, 0.9649658203125, 1.067596435546875, 1.17022705078125, 1.272857666015625, 1.37548828125, 1.478118896484375, 1.58074951171875, 1.683380126953125, 1.7860107421875, 1.888641357421875, 1.99127197265625, 2.093902587890625, 2.196533203125, 2.299163818359375, 2.40179443359375, 2.504425048828125, 2.6070556640625, 2.709686279296875, 2.81231689453125, 2.914947509765625, 3.017578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 8.0, 14.0, 23.0, 25.0, 38.0, 48.0, 73.0, 126.0, 177.0, 260.0, 375.0, 544.0, 819.0, 1209.0, 1762.0, 2443.0, 3634.0, 5305.0, 7798.0, 11428.0, 17042.0, 26258.0, 39833.0, 62694.0, 100271.0, 174079.0, 1278231.0, 132673.0, 80289.0, 51215.0, 32617.0, 21592.0, 14070.0, 9557.0, 6579.0, 4383.0, 3038.0, 2099.0, 1363.0, 994.0, 697.0, 493.0, 327.0, 199.0, 161.0, 90.0, 66.0, 41.0, 24.0, 14.0, 15.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.71240234375, -0.6888656616210938, -0.6653289794921875, -0.6417922973632812, -0.618255615234375, -0.5947189331054688, -0.5711822509765625, -0.5476455688476562, -0.52410888671875, -0.5005722045898438, -0.4770355224609375, -0.45349884033203125, -0.429962158203125, -0.40642547607421875, -0.3828887939453125, -0.35935211181640625, -0.3358154296875, -0.31227874755859375, -0.2887420654296875, -0.26520538330078125, -0.241668701171875, -0.21813201904296875, -0.1945953369140625, -0.17105865478515625, -0.14752197265625, -0.12398529052734375, -0.1004486083984375, -0.07691192626953125, -0.053375244140625, -0.02983856201171875, -0.0063018798828125, 0.01723480224609375, 0.040771484375, 0.06430816650390625, 0.0878448486328125, 0.11138153076171875, 0.134918212890625, 0.15845489501953125, 0.1819915771484375, 0.20552825927734375, 0.22906494140625, 0.25260162353515625, 0.2761383056640625, 0.29967498779296875, 0.323211669921875, 0.34674835205078125, 0.3702850341796875, 0.39382171630859375, 0.4173583984375, 0.44089508056640625, 0.4644317626953125, 0.48796844482421875, 0.511505126953125, 0.5350418090820312, 0.5585784912109375, 0.5821151733398438, 0.60565185546875, 0.6291885375976562, 0.6527252197265625, 0.6762619018554688, 0.699798583984375, 0.7233352661132812, 0.7468719482421875, 0.7704086303710938, 0.7939453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 10.0, 8.0, 10.0, 13.0, 17.0, 14.0, 17.0, 19.0, 24.0, 30.0, 32.0, 36.0, 48.0, 42.0, 53.0, 60.0, 47.0, 53.0, 52.0, 50.0, 55.0, 49.0, 33.0, 38.0, 24.0, 21.0, 15.0, 11.0, 20.0, 15.0, 12.0, 13.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004000663757324219, -0.0003859996795654297, -0.0003719329833984375, -0.0003578662872314453, -0.0003437995910644531, -0.00032973289489746094, -0.00031566619873046875, -0.00030159950256347656, -0.0002875328063964844, -0.0002734661102294922, -0.0002593994140625, -0.0002453327178955078, -0.00023126602172851562, -0.00021719932556152344, -0.00020313262939453125, -0.00018906593322753906, -0.00017499923706054688, -0.0001609325408935547, -0.0001468658447265625, -0.0001327991485595703, -0.00011873245239257812, -0.00010466575622558594, -9.059906005859375e-05, -7.653236389160156e-05, -6.246566772460938e-05, -4.839897155761719e-05, -3.4332275390625e-05, -2.0265579223632812e-05, -6.198883056640625e-06, 7.867813110351562e-06, 2.193450927734375e-05, 3.600120544433594e-05, 5.0067901611328125e-05, 6.413459777832031e-05, 7.82012939453125e-05, 9.226799011230469e-05, 0.00010633468627929688, 0.00012040138244628906, 0.00013446807861328125, 0.00014853477478027344, 0.00016260147094726562, 0.0001766681671142578, 0.00019073486328125, 0.0002048015594482422, 0.00021886825561523438, 0.00023293495178222656, 0.00024700164794921875, 0.00026106834411621094, 0.0002751350402832031, 0.0002892017364501953, 0.0003032684326171875, 0.0003173351287841797, 0.0003314018249511719, 0.00034546852111816406, 0.00035953521728515625, 0.00037360191345214844, 0.0003876686096191406, 0.0004017353057861328, 0.000415802001953125, 0.0004298686981201172, 0.0004439353942871094, 0.00045800209045410156, 0.00047206878662109375, 0.00048613548278808594, 0.0005002021789550781]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 9.0, 13.0, 15.0, 14.0, 15.0, 20.0, 43.0, 45.0, 64.0, 107.0, 143.0, 267.0, 495.0, 1038.0, 107731.0, 935202.0, 1854.0, 543.0, 284.0, 201.0, 112.0, 71.0, 64.0, 30.0, 32.0, 23.0, 23.0, 15.0, 11.0, 7.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.012176513671875, -0.01179802417755127, -0.011419534683227539, -0.011041045188903809, -0.010662555694580078, -0.010284066200256348, -0.009905576705932617, -0.009527087211608887, -0.009148597717285156, -0.008770108222961426, -0.008391618728637695, -0.008013129234313965, -0.007634639739990234, -0.007256150245666504, -0.0068776607513427734, -0.006499171257019043, -0.0061206817626953125, -0.005742192268371582, -0.0053637027740478516, -0.004985213279724121, -0.004606723785400391, -0.00422823429107666, -0.0038497447967529297, -0.0034712553024291992, -0.0030927658081054688, -0.0027142763137817383, -0.002335786819458008, -0.0019572973251342773, -0.0015788078308105469, -0.0012003183364868164, -0.0008218288421630859, -0.00044333934783935547, -6.4849853515625e-05, 0.00031363964080810547, 0.0006921291351318359, 0.0010706186294555664, 0.0014491081237792969, 0.0018275976181030273, 0.002206087112426758, 0.0025845766067504883, 0.0029630661010742188, 0.0033415555953979492, 0.0037200450897216797, 0.00409853458404541, 0.004477024078369141, 0.004855513572692871, 0.0052340030670166016, 0.005612492561340332, 0.0059909820556640625, 0.006369471549987793, 0.0067479610443115234, 0.007126450538635254, 0.007504940032958984, 0.007883429527282715, 0.008261919021606445, 0.008640408515930176, 0.009018898010253906, 0.009397387504577637, 0.009775876998901367, 0.010154366493225098, 0.010532855987548828, 0.010911345481872559, 0.011289834976196289, 0.01166832447052002, 0.01204681396484375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 34.0, 180.0, 417.0, 275.0, 79.0, 19.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006863728631287813, -0.0006496244459412992, -0.0006128760287538171, -0.000576127611566335, -0.0005393791943788528, -0.0005026307189837098, -0.0004658823017962277, -0.0004291338846087456, -0.00039238546742126346, -0.00035563705023378134, -0.0003188886330462992, -0.00028214018675498664, -0.0002453917695675045, -0.0002086433523800224, -0.00017189492064062506, -0.0001351464889012277, -9.83980717137456e-05, -6.164964725030586e-05, -2.490122278686613e-05, 1.1847201676573604e-05, 4.859562614001334e-05, 8.534404332749546e-05, 0.0001220924750668928, 0.00015884090680629015, 0.00019558932399377227, 0.0002323377411812544, 0.0002690861583687365, 0.0003058346046600491, 0.0003425830218475312, 0.0003793314390350133, 0.0004160798853263259, 0.000452828302513808, 0.0004895767197012901, 0.0005263251368887722, 0.0005630735540762544, 0.0005998219712637365, 0.0006365703884512186, 0.0006733188638463616, 0.0007100672810338438, 0.0007468156982213259, 0.000783564115408808, 0.0008203125325962901, 0.0008570609497837722, 0.0008938093669712543, 0.0009305578423663974, 0.0009673062013462186, 0.0010040546767413616, 0.0010408030357211828, 0.0010775515111163259, 0.0011142999865114689, 0.00115104834549129, 0.0011877968208864331, 0.0012245451798662543, 0.0012612936552613974, 0.0012980420142412186, 0.0013347904896363616, 0.0013715389650315046, 0.0014082874404266477, 0.0014450357994064689, 0.001481784274801612, 0.001518532633781433, 0.0015552811091765761, 0.0015920294681563973, 0.0016287779435515404, 0.0016655263025313616]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 10.0, 9.0, 5.0, 3.0, 4.0, 9.0, 11.0, 14.0, 20.0, 15.0, 12.0, 18.0, 21.0, 23.0, 23.0, 32.0, 26.0, 36.0, 28.0, 29.0, 35.0, 27.0, 37.0, 35.0, 47.0, 36.0, 35.0, 30.0, 25.0, 30.0, 31.0, 34.0, 32.0, 29.0, 19.0, 29.0, 17.0, 18.0, 16.0, 12.0, 15.0, 5.0, 10.0, 7.0, 9.0, 5.0, 9.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0], "bins": [-0.0002532005310058594, -0.0002459865063428879, -0.00023877248167991638, -0.00023155845701694489, -0.0002243444323539734, -0.0002171304076910019, -0.0002099163830280304, -0.0002027023583650589, -0.0001954883337020874, -0.0001882743090391159, -0.0001810602843761444, -0.0001738462597131729, -0.00016663223505020142, -0.00015941821038722992, -0.00015220418572425842, -0.00014499016106128693, -0.00013777613639831543, -0.00013056211173534393, -0.00012334808707237244, -0.00011613406240940094, -0.00010892003774642944, -0.00010170601308345795, -9.449198842048645e-05, -8.727796375751495e-05, -8.006393909454346e-05, -7.284991443157196e-05, -6.563588976860046e-05, -5.842186510562897e-05, -5.120784044265747e-05, -4.3993815779685974e-05, -3.677979111671448e-05, -2.956576645374298e-05, -2.2351741790771484e-05, -1.5137717127799988e-05, -7.923692464828491e-06, -7.096678018569946e-07, 6.504356861114502e-06, 1.3718381524085999e-05, 2.0932406187057495e-05, 2.8146430850028992e-05, 3.536045551300049e-05, 4.2574480175971985e-05, 4.978850483894348e-05, 5.700252950191498e-05, 6.421655416488647e-05, 7.143057882785797e-05, 7.864460349082947e-05, 8.585862815380096e-05, 9.307265281677246e-05, 0.00010028667747974396, 0.00010750070214271545, 0.00011471472680568695, 0.00012192875146865845, 0.00012914277613162994, 0.00013635680079460144, 0.00014357082545757294, 0.00015078485012054443, 0.00015799887478351593, 0.00016521289944648743, 0.00017242692410945892, 0.00017964094877243042, 0.00018685497343540192, 0.0001940689980983734, 0.0002012830227613449, 0.0002084970474243164]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 6.0, 22.0, 22.0, 25.0, 17.0, 35.0, 36.0, 30.0, 36.0, 37.0, 50.0, 34.0, 48.0, 44.0, 42.0, 46.0, 53.0, 45.0, 36.0, 40.0, 32.0, 29.0, 23.0, 31.0, 29.0, 17.0, 14.0, 13.0, 20.0, 7.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.55078125, -6.3590087890625, -6.167236328125, -5.9754638671875, -5.78369140625, -5.5919189453125, -5.400146484375, -5.2083740234375, -5.0166015625, -4.8248291015625, -4.633056640625, -4.4412841796875, -4.24951171875, -4.0577392578125, -3.865966796875, -3.6741943359375, -3.482421875, -3.2906494140625, -3.098876953125, -2.9071044921875, -2.71533203125, -2.5235595703125, -2.331787109375, -2.1400146484375, -1.9482421875, -1.7564697265625, -1.564697265625, -1.3729248046875, -1.18115234375, -0.9893798828125, -0.797607421875, -0.6058349609375, -0.4140625, -0.2222900390625, -0.030517578125, 0.1612548828125, 0.35302734375, 0.5447998046875, 0.736572265625, 0.9283447265625, 1.1201171875, 1.3118896484375, 1.503662109375, 1.6954345703125, 1.88720703125, 2.0789794921875, 2.270751953125, 2.4625244140625, 2.654296875, 2.8460693359375, 3.037841796875, 3.2296142578125, 3.42138671875, 3.6131591796875, 3.804931640625, 3.9967041015625, 4.1884765625, 4.3802490234375, 4.572021484375, 4.7637939453125, 4.95556640625, 5.1473388671875, 5.339111328125, 5.5308837890625, 5.72265625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 11.0, 15.0, 22.0, 28.0, 33.0, 63.0, 88.0, 132.0, 234.0, 400.0, 616.0, 1197.0, 2148.0, 4364.0, 9285.0, 23070.0, 69216.0, 271163.0, 470391.0, 130645.0, 38222.0, 14247.0, 6268.0, 2936.0, 1565.0, 838.0, 503.0, 314.0, 170.0, 112.0, 76.0, 57.0, 41.0, 17.0, 15.0, 14.0, 5.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.2734375, -5.11944580078125, -4.9654541015625, -4.81146240234375, -4.657470703125, -4.50347900390625, -4.3494873046875, -4.19549560546875, -4.04150390625, -3.88751220703125, -3.7335205078125, -3.57952880859375, -3.425537109375, -3.27154541015625, -3.1175537109375, -2.96356201171875, -2.8095703125, -2.65557861328125, -2.5015869140625, -2.34759521484375, -2.193603515625, -2.03961181640625, -1.8856201171875, -1.73162841796875, -1.57763671875, -1.42364501953125, -1.2696533203125, -1.11566162109375, -0.961669921875, -0.80767822265625, -0.6536865234375, -0.49969482421875, -0.345703125, -0.19171142578125, -0.0377197265625, 0.11627197265625, 0.270263671875, 0.42425537109375, 0.5782470703125, 0.73223876953125, 0.88623046875, 1.04022216796875, 1.1942138671875, 1.34820556640625, 1.502197265625, 1.65618896484375, 1.8101806640625, 1.96417236328125, 2.1181640625, 2.27215576171875, 2.4261474609375, 2.58013916015625, 2.734130859375, 2.88812255859375, 3.0421142578125, 3.19610595703125, 3.35009765625, 3.50408935546875, 3.6580810546875, 3.81207275390625, 3.966064453125, 4.12005615234375, 4.2740478515625, 4.42803955078125, 4.58203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 8.0, 5.0, 9.0, 14.0, 6.0, 19.0, 15.0, 31.0, 21.0, 26.0, 24.0, 27.0, 40.0, 43.0, 43.0, 39.0, 62.0, 112.0, 444.0, 1519.0, 111.0, 60.0, 44.0, 34.0, 31.0, 43.0, 38.0, 27.0, 21.0, 22.0, 23.0, 12.0, 10.0, 15.0, 12.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.796875, -22.146484375, -21.49609375, -20.845703125, -20.1953125, -19.544921875, -18.89453125, -18.244140625, -17.59375, -16.943359375, -16.29296875, -15.642578125, -14.9921875, -14.341796875, -13.69140625, -13.041015625, -12.390625, -11.740234375, -11.08984375, -10.439453125, -9.7890625, -9.138671875, -8.48828125, -7.837890625, -7.1875, -6.537109375, -5.88671875, -5.236328125, -4.5859375, -3.935546875, -3.28515625, -2.634765625, -1.984375, -1.333984375, -0.68359375, -0.033203125, 0.6171875, 1.267578125, 1.91796875, 2.568359375, 3.21875, 3.869140625, 4.51953125, 5.169921875, 5.8203125, 6.470703125, 7.12109375, 7.771484375, 8.421875, 9.072265625, 9.72265625, 10.373046875, 11.0234375, 11.673828125, 12.32421875, 12.974609375, 13.625, 14.275390625, 14.92578125, 15.576171875, 16.2265625, 16.876953125, 17.52734375, 18.177734375, 18.828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 4.0, 5.0, 9.0, 9.0, 12.0, 16.0, 16.0, 18.0, 24.0, 34.0, 33.0, 45.0, 69.0, 120.0, 116.0, 187.0, 300.0, 520.0, 2440.0, 644345.0, 2492429.0, 3273.0, 572.0, 321.0, 207.0, 132.0, 96.0, 70.0, 66.0, 46.0, 31.0, 38.0, 16.0, 22.0, 10.0, 14.0, 8.0, 11.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-38.65625, -37.32568359375, -35.9951171875, -34.66455078125, -33.333984375, -32.00341796875, -30.6728515625, -29.34228515625, -28.01171875, -26.68115234375, -25.3505859375, -24.02001953125, -22.689453125, -21.35888671875, -20.0283203125, -18.69775390625, -17.3671875, -16.03662109375, -14.7060546875, -13.37548828125, -12.044921875, -10.71435546875, -9.3837890625, -8.05322265625, -6.72265625, -5.39208984375, -4.0615234375, -2.73095703125, -1.400390625, -0.06982421875, 1.2607421875, 2.59130859375, 3.921875, 5.25244140625, 6.5830078125, 7.91357421875, 9.244140625, 10.57470703125, 11.9052734375, 13.23583984375, 14.56640625, 15.89697265625, 17.2275390625, 18.55810546875, 19.888671875, 21.21923828125, 22.5498046875, 23.88037109375, 25.2109375, 26.54150390625, 27.8720703125, 29.20263671875, 30.533203125, 31.86376953125, 33.1943359375, 34.52490234375, 35.85546875, 37.18603515625, 38.5166015625, 39.84716796875, 41.177734375, 42.50830078125, 43.8388671875, 45.16943359375, 46.5]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 41.0, 225.0, 452.0, 246.0, 35.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.57462310791016, -66.5911865234375, -64.60775756835938, -62.62432098388672, -60.64088439941406, -58.657447814941406, -56.674015045166016, -54.690582275390625, -52.70714569091797, -50.72370910644531, -48.74027633666992, -46.75684356689453, -44.773406982421875, -42.78997039794922, -40.80653762817383, -38.82310485839844, -36.83966827392578, -34.856231689453125, -32.872798919677734, -30.88936424255371, -28.905929565429688, -26.922494888305664, -24.93906021118164, -22.955625534057617, -20.972190856933594, -18.98875617980957, -17.005321502685547, -15.021886825561523, -13.0384521484375, -11.055017471313477, -9.071582794189453, -7.08814811706543, -5.104709625244141, -3.121274948120117, -1.1378402709960938, 0.8455944061279297, 2.829029083251953, 4.812463760375977, 6.7958984375, 8.779333114624023, 10.762767791748047, 12.74620246887207, 14.729637145996094, 16.713071823120117, 18.69650650024414, 20.679941177368164, 22.663375854492188, 24.64681053161621, 26.630245208740234, 28.613679885864258, 30.59711456298828, 32.58055114746094, 34.56398391723633, 36.54741668701172, 38.530853271484375, 40.51428985595703, 42.49772262573242, 44.48115539550781, 46.46459197998047, 48.448028564453125, 50.431461334228516, 52.414894104003906, 54.39833068847656, 56.38176727294922, 58.36520004272461]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 8.0, 8.0, 9.0, 13.0, 22.0, 17.0, 17.0, 18.0, 18.0, 26.0, 30.0, 33.0, 31.0, 40.0, 52.0, 54.0, 37.0, 51.0, 51.0, 66.0, 52.0, 39.0, 33.0, 34.0, 36.0, 26.0, 29.0, 28.0, 19.0, 14.0, 21.0, 6.0, 8.0, 15.0, 9.0, 5.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.504302978515625, -58.72920227050781, -56.954105377197266, -55.17900466918945, -53.403907775878906, -51.628807067871094, -49.85370635986328, -48.078609466552734, -46.30350875854492, -44.52840805053711, -42.75331115722656, -40.97821044921875, -39.2031135559082, -37.42801284790039, -35.652915954589844, -33.87781524658203, -32.10271453857422, -30.32761573791504, -28.55251693725586, -26.777416229248047, -25.002317428588867, -23.227218627929688, -21.452119827270508, -19.677021026611328, -17.90192413330078, -16.1268253326416, -14.351725578308105, -12.576626777648926, -10.80152702331543, -9.02642822265625, -7.25132942199707, -5.476229667663574, -3.701129913330078, -1.9260307550430298, -0.15093159675598145, 1.6241674423217773, 3.3992667198181152, 5.174365997314453, 6.949464797973633, 8.724564552307129, 10.499663352966309, 12.274762153625488, 14.049861907958984, 15.824960708618164, 17.600059509277344, 19.375160217285156, 21.150257110595703, 22.925357818603516, 24.700456619262695, 26.475555419921875, 28.250654220581055, 30.025753021240234, 31.800853729248047, 33.575950622558594, 35.351051330566406, 37.12615203857422, 38.901248931884766, 40.67634963989258, 42.451446533203125, 44.22654724121094, 46.001644134521484, 47.7767448425293, 49.551841735839844, 51.326942443847656, 53.10204315185547]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 10.0, 13.0, 9.0, 21.0, 19.0, 27.0, 19.0, 29.0, 30.0, 35.0, 39.0, 35.0, 27.0, 51.0, 52.0, 36.0, 43.0, 42.0, 41.0, 49.0, 57.0, 31.0, 24.0, 38.0, 28.0, 23.0, 26.0, 20.0, 22.0, 20.0, 19.0, 9.0, 9.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.6640625, -6.47216796875, -6.2802734375, -6.08837890625, -5.896484375, -5.70458984375, -5.5126953125, -5.32080078125, -5.12890625, -4.93701171875, -4.7451171875, -4.55322265625, -4.361328125, -4.16943359375, -3.9775390625, -3.78564453125, -3.59375, -3.40185546875, -3.2099609375, -3.01806640625, -2.826171875, -2.63427734375, -2.4423828125, -2.25048828125, -2.05859375, -1.86669921875, -1.6748046875, -1.48291015625, -1.291015625, -1.09912109375, -0.9072265625, -0.71533203125, -0.5234375, -0.33154296875, -0.1396484375, 0.05224609375, 0.244140625, 0.43603515625, 0.6279296875, 0.81982421875, 1.01171875, 1.20361328125, 1.3955078125, 1.58740234375, 1.779296875, 1.97119140625, 2.1630859375, 2.35498046875, 2.546875, 2.73876953125, 2.9306640625, 3.12255859375, 3.314453125, 3.50634765625, 3.6982421875, 3.89013671875, 4.08203125, 4.27392578125, 4.4658203125, 4.65771484375, 4.849609375, 5.04150390625, 5.2333984375, 5.42529296875, 5.6171875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 6.0, 9.0, 10.0, 12.0, 14.0, 19.0, 26.0, 27.0, 31.0, 30.0, 45.0, 62.0, 60.0, 120.0, 232.0, 862.0, 17477.0, 3487930.0, 682171.0, 4040.0, 480.0, 166.0, 98.0, 62.0, 52.0, 42.0, 41.0, 27.0, 21.0, 15.0, 18.0, 16.0, 12.0, 13.0, 8.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.8125, -37.697265625, -36.58203125, -35.466796875, -34.3515625, -33.236328125, -32.12109375, -31.005859375, -29.890625, -28.775390625, -27.66015625, -26.544921875, -25.4296875, -24.314453125, -23.19921875, -22.083984375, -20.96875, -19.853515625, -18.73828125, -17.623046875, -16.5078125, -15.392578125, -14.27734375, -13.162109375, -12.046875, -10.931640625, -9.81640625, -8.701171875, -7.5859375, -6.470703125, -5.35546875, -4.240234375, -3.125, -2.009765625, -0.89453125, 0.220703125, 1.3359375, 2.451171875, 3.56640625, 4.681640625, 5.796875, 6.912109375, 8.02734375, 9.142578125, 10.2578125, 11.373046875, 12.48828125, 13.603515625, 14.71875, 15.833984375, 16.94921875, 18.064453125, 19.1796875, 20.294921875, 21.41015625, 22.525390625, 23.640625, 24.755859375, 25.87109375, 26.986328125, 28.1015625, 29.216796875, 30.33203125, 31.447265625, 32.5625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 9.0, 17.0, 17.0, 23.0, 24.0, 35.0, 42.0, 47.0, 73.0, 84.0, 125.0, 175.0, 214.0, 287.0, 310.0, 342.0, 392.0, 405.0, 321.0, 255.0, 201.0, 137.0, 103.0, 83.0, 70.0, 52.0, 48.0, 42.0, 39.0, 20.0, 21.0, 13.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-11.6640625, -11.3040771484375, -10.944091796875, -10.5841064453125, -10.22412109375, -9.8641357421875, -9.504150390625, -9.1441650390625, -8.7841796875, -8.4241943359375, -8.064208984375, -7.7042236328125, -7.34423828125, -6.9842529296875, -6.624267578125, -6.2642822265625, -5.904296875, -5.5443115234375, -5.184326171875, -4.8243408203125, -4.46435546875, -4.1043701171875, -3.744384765625, -3.3843994140625, -3.0244140625, -2.6644287109375, -2.304443359375, -1.9444580078125, -1.58447265625, -1.2244873046875, -0.864501953125, -0.5045166015625, -0.14453125, 0.2154541015625, 0.575439453125, 0.9354248046875, 1.29541015625, 1.6553955078125, 2.015380859375, 2.3753662109375, 2.7353515625, 3.0953369140625, 3.455322265625, 3.8153076171875, 4.17529296875, 4.5352783203125, 4.895263671875, 5.2552490234375, 5.615234375, 5.9752197265625, 6.335205078125, 6.6951904296875, 7.05517578125, 7.4151611328125, 7.775146484375, 8.1351318359375, 8.4951171875, 8.8551025390625, 9.215087890625, 9.5750732421875, 9.93505859375, 10.2950439453125, 10.655029296875, 11.0150146484375, 11.375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 4.0, 1.0, 13.0, 7.0, 10.0, 11.0, 16.0, 30.0, 32.0, 30.0, 54.0, 48.0, 75.0, 80.0, 103.0, 146.0, 173.0, 267.0, 399.0, 869.0, 6599.0, 2688803.0, 1489234.0, 5082.0, 800.0, 418.0, 249.0, 165.0, 117.0, 103.0, 76.0, 70.0, 36.0, 40.0, 27.0, 27.0, 12.0, 18.0, 11.0, 12.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.625, -41.876953125, -40.12890625, -38.380859375, -36.6328125, -34.884765625, -33.13671875, -31.388671875, -29.640625, -27.892578125, -26.14453125, -24.396484375, -22.6484375, -20.900390625, -19.15234375, -17.404296875, -15.65625, -13.908203125, -12.16015625, -10.412109375, -8.6640625, -6.916015625, -5.16796875, -3.419921875, -1.671875, 0.076171875, 1.82421875, 3.572265625, 5.3203125, 7.068359375, 8.81640625, 10.564453125, 12.3125, 14.060546875, 15.80859375, 17.556640625, 19.3046875, 21.052734375, 22.80078125, 24.548828125, 26.296875, 28.044921875, 29.79296875, 31.541015625, 33.2890625, 35.037109375, 36.78515625, 38.533203125, 40.28125, 42.029296875, 43.77734375, 45.525390625, 47.2734375, 49.021484375, 50.76953125, 52.517578125, 54.265625, 56.013671875, 57.76171875, 59.509765625, 61.2578125, 63.005859375, 64.75390625, 66.501953125, 68.25]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 14.0, 41.0, 103.0, 176.0, 238.0, 231.0, 116.0, 63.0, 16.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.58984375, -22.22252082824707, -18.85519790649414, -15.487876892089844, -12.120553970336914, -8.753231048583984, -5.3859100341796875, -2.018587112426758, 1.3487358093261719, 4.716058254241943, 8.083380699157715, 11.450702667236328, 14.818025588989258, 18.185348510742188, 21.552669525146484, 24.919992446899414, 28.287315368652344, 31.654638290405273, 35.0219612121582, 38.3892822265625, 41.75660705566406, 45.12392807006836, 48.491249084472656, 51.85857391357422, 55.225894927978516, 58.59321594238281, 61.960540771484375, 65.32786560058594, 68.69518280029297, 72.06250762939453, 75.42982482910156, 78.79714965820312, 82.16447448730469, 85.53179931640625, 88.89911651611328, 92.26644134521484, 95.6337661743164, 99.00108337402344, 102.368408203125, 105.73573303222656, 109.10305786132812, 112.47038269042969, 115.83769989013672, 119.20502471923828, 122.57234954833984, 125.93966674804688, 129.30699157714844, 132.67431640625, 136.0416259765625, 139.40895080566406, 142.77627563476562, 146.14358520507812, 149.5109100341797, 152.87823486328125, 156.2455596923828, 159.61288452148438, 162.98020935058594, 166.3475341796875, 169.71485900878906, 173.08218383789062, 176.44949340820312, 179.8168182373047, 183.18414306640625, 186.5514678955078, 189.91879272460938]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 7.0, 10.0, 12.0, 12.0, 3.0, 17.0, 16.0, 15.0, 19.0, 19.0, 23.0, 22.0, 21.0, 26.0, 41.0, 34.0, 41.0, 36.0, 44.0, 38.0, 44.0, 38.0, 47.0, 43.0, 31.0, 41.0, 31.0, 30.0, 23.0, 22.0, 27.0, 20.0, 30.0, 16.0, 12.0, 8.0, 19.0, 9.0, 10.0, 12.0, 5.0, 2.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.049949645996094, -34.77021789550781, -33.49048614501953, -32.21075439453125, -30.93102264404297, -29.651290893554688, -28.371559143066406, -27.091827392578125, -25.812095642089844, -24.532363891601562, -23.25263214111328, -21.972900390625, -20.69316864013672, -19.413436889648438, -18.133705139160156, -16.853973388671875, -15.574239730834961, -14.29450798034668, -13.014776229858398, -11.735044479370117, -10.455312728881836, -9.175580978393555, -7.895848274230957, -6.616116523742676, -5.3363847732543945, -4.056653022766113, -2.776921033859253, -1.4971890449523926, -0.21745729446411133, 1.06227445602417, 2.3420066833496094, 3.6217384338378906, 4.901470184326172, 6.181201934814453, 7.460933685302734, 8.740665435791016, 10.020397186279297, 11.300128936767578, 12.579861640930176, 13.859593391418457, 15.139325141906738, 16.419057846069336, 17.698789596557617, 18.9785213470459, 20.25825309753418, 21.53798484802246, 22.817716598510742, 24.097448348999023, 25.377180099487305, 26.656911849975586, 27.936643600463867, 29.21637535095215, 30.49610710144043, 31.77583885192871, 33.055572509765625, 34.335304260253906, 35.61503601074219, 36.89476776123047, 38.17449951171875, 39.45423126220703, 40.73396301269531, 42.013694763183594, 43.293426513671875, 44.573158264160156, 45.85289001464844]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 13.0, 7.0, 8.0, 15.0, 13.0, 16.0, 21.0, 17.0, 25.0, 30.0, 33.0, 33.0, 36.0, 30.0, 46.0, 31.0, 35.0, 41.0, 26.0, 48.0, 40.0, 39.0, 44.0, 41.0, 27.0, 39.0, 26.0, 28.0, 29.0, 28.0, 16.0, 20.0, 20.0, 15.0, 12.0, 7.0, 14.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.1514892578125, -5.970947265625, -5.7904052734375, -5.60986328125, -5.4293212890625, -5.248779296875, -5.0682373046875, -4.8876953125, -4.7071533203125, -4.526611328125, -4.3460693359375, -4.16552734375, -3.9849853515625, -3.804443359375, -3.6239013671875, -3.443359375, -3.2628173828125, -3.082275390625, -2.9017333984375, -2.72119140625, -2.5406494140625, -2.360107421875, -2.1795654296875, -1.9990234375, -1.8184814453125, -1.637939453125, -1.4573974609375, -1.27685546875, -1.0963134765625, -0.915771484375, -0.7352294921875, -0.5546875, -0.3741455078125, -0.193603515625, -0.0130615234375, 0.16748046875, 0.3480224609375, 0.528564453125, 0.7091064453125, 0.8896484375, 1.0701904296875, 1.250732421875, 1.4312744140625, 1.61181640625, 1.7923583984375, 1.972900390625, 2.1534423828125, 2.333984375, 2.5145263671875, 2.695068359375, 2.8756103515625, 3.05615234375, 3.2366943359375, 3.417236328125, 3.5977783203125, 3.7783203125, 3.9588623046875, 4.139404296875, 4.3199462890625, 4.50048828125, 4.6810302734375, 4.861572265625, 5.0421142578125, 5.22265625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 9.0, 18.0, 26.0, 41.0, 45.0, 75.0, 118.0, 158.0, 195.0, 315.0, 476.0, 664.0, 916.0, 1365.0, 1929.0, 2785.0, 4232.0, 6430.0, 9579.0, 14449.0, 22414.0, 35127.0, 55854.0, 89463.0, 146149.0, 227960.0, 159915.0, 97740.0, 60889.0, 37760.0, 24092.0, 15798.0, 10257.0, 6864.0, 4595.0, 3073.0, 2098.0, 1467.0, 964.0, 667.0, 513.0, 286.0, 243.0, 147.0, 123.0, 82.0, 60.0, 32.0, 37.0, 16.0, 11.0, 11.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.84423828125, -0.8175125122070312, -0.7907867431640625, -0.7640609741210938, -0.737335205078125, -0.7106094360351562, -0.6838836669921875, -0.6571578979492188, -0.63043212890625, -0.6037063598632812, -0.5769805908203125, -0.5502548217773438, -0.523529052734375, -0.49680328369140625, -0.4700775146484375, -0.44335174560546875, -0.4166259765625, -0.38990020751953125, -0.3631744384765625, -0.33644866943359375, -0.309722900390625, -0.28299713134765625, -0.2562713623046875, -0.22954559326171875, -0.20281982421875, -0.17609405517578125, -0.1493682861328125, -0.12264251708984375, -0.095916748046875, -0.06919097900390625, -0.0424652099609375, -0.01573944091796875, 0.010986328125, 0.03771209716796875, 0.0644378662109375, 0.09116363525390625, 0.117889404296875, 0.14461517333984375, 0.1713409423828125, 0.19806671142578125, 0.22479248046875, 0.25151824951171875, 0.2782440185546875, 0.30496978759765625, 0.331695556640625, 0.35842132568359375, 0.3851470947265625, 0.41187286376953125, 0.4385986328125, 0.46532440185546875, 0.4920501708984375, 0.5187759399414062, 0.545501708984375, 0.5722274780273438, 0.5989532470703125, 0.6256790161132812, 0.65240478515625, 0.6791305541992188, 0.7058563232421875, 0.7325820922851562, 0.759307861328125, 0.7860336303710938, 0.8127593994140625, 0.8394851684570312, 0.8662109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 3.0, 6.0, 7.0, 16.0, 18.0, 21.0, 23.0, 31.0, 22.0, 32.0, 48.0, 38.0, 39.0, 31.0, 36.0, 45.0, 44.0, 1077.0, 41.0, 45.0, 48.0, 39.0, 29.0, 41.0, 22.0, 29.0, 27.0, 24.0, 22.0, 21.0, 16.0, 15.0, 11.0, 7.0, 8.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.390625, -4.267822265625, -4.14501953125, -4.022216796875, -3.8994140625, -3.776611328125, -3.65380859375, -3.531005859375, -3.408203125, -3.285400390625, -3.16259765625, -3.039794921875, -2.9169921875, -2.794189453125, -2.67138671875, -2.548583984375, -2.42578125, -2.302978515625, -2.18017578125, -2.057373046875, -1.9345703125, -1.811767578125, -1.68896484375, -1.566162109375, -1.443359375, -1.320556640625, -1.19775390625, -1.074951171875, -0.9521484375, -0.829345703125, -0.70654296875, -0.583740234375, -0.4609375, -0.338134765625, -0.21533203125, -0.092529296875, 0.0302734375, 0.153076171875, 0.27587890625, 0.398681640625, 0.521484375, 0.644287109375, 0.76708984375, 0.889892578125, 1.0126953125, 1.135498046875, 1.25830078125, 1.381103515625, 1.50390625, 1.626708984375, 1.74951171875, 1.872314453125, 1.9951171875, 2.117919921875, 2.24072265625, 2.363525390625, 2.486328125, 2.609130859375, 2.73193359375, 2.854736328125, 2.9775390625, 3.100341796875, 3.22314453125, 3.345947265625, 3.46875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 9.0, 9.0, 15.0, 23.0, 33.0, 67.0, 95.0, 124.0, 186.0, 286.0, 452.0, 626.0, 967.0, 1513.0, 2239.0, 3438.0, 5013.0, 7713.0, 12092.0, 18818.0, 30214.0, 49345.0, 83538.0, 149650.0, 1311109.0, 174373.0, 96039.0, 55742.0, 33704.0, 21266.0, 13136.0, 8562.0, 5725.0, 3724.0, 2449.0, 1653.0, 1100.0, 722.0, 446.0, 298.0, 213.0, 134.0, 88.0, 69.0, 33.0, 26.0, 17.0, 13.0, 9.0, 6.0, 2.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.833984375, -0.8067474365234375, -0.779510498046875, -0.7522735595703125, -0.72503662109375, -0.6977996826171875, -0.670562744140625, -0.6433258056640625, -0.6160888671875, -0.5888519287109375, -0.561614990234375, -0.5343780517578125, -0.50714111328125, -0.4799041748046875, -0.452667236328125, -0.4254302978515625, -0.398193359375, -0.3709564208984375, -0.343719482421875, -0.3164825439453125, -0.28924560546875, -0.2620086669921875, -0.234771728515625, -0.2075347900390625, -0.1802978515625, -0.1530609130859375, -0.125823974609375, -0.0985870361328125, -0.07135009765625, -0.0441131591796875, -0.016876220703125, 0.0103607177734375, 0.03759765625, 0.0648345947265625, 0.092071533203125, 0.1193084716796875, 0.14654541015625, 0.1737823486328125, 0.201019287109375, 0.2282562255859375, 0.2554931640625, 0.2827301025390625, 0.309967041015625, 0.3372039794921875, 0.36444091796875, 0.3916778564453125, 0.418914794921875, 0.4461517333984375, 0.473388671875, 0.5006256103515625, 0.527862548828125, 0.5550994873046875, 0.58233642578125, 0.6095733642578125, 0.636810302734375, 0.6640472412109375, 0.6912841796875, 0.7185211181640625, 0.745758056640625, 0.7729949951171875, 0.80023193359375, 0.8274688720703125, 0.854705810546875, 0.8819427490234375, 0.9091796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 6.0, 6.0, 9.0, 14.0, 8.0, 13.0, 11.0, 17.0, 22.0, 26.0, 44.0, 39.0, 45.0, 45.0, 57.0, 69.0, 71.0, 54.0, 71.0, 57.0, 49.0, 45.0, 40.0, 30.0, 23.0, 26.0, 15.0, 15.0, 11.0, 9.0, 15.0, 6.0, 5.0, 5.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005655288696289062, -0.0005484223365783691, -0.000531315803527832, -0.0005142092704772949, -0.0004971027374267578, -0.0004799962043762207, -0.0004628896713256836, -0.0004457831382751465, -0.0004286766052246094, -0.00041157007217407227, -0.00039446353912353516, -0.00037735700607299805, -0.00036025047302246094, -0.00034314393997192383, -0.0003260374069213867, -0.0003089308738708496, -0.0002918243408203125, -0.0002747178077697754, -0.0002576112747192383, -0.00024050474166870117, -0.00022339820861816406, -0.00020629167556762695, -0.00018918514251708984, -0.00017207860946655273, -0.00015497207641601562, -0.00013786554336547852, -0.0001207590103149414, -0.0001036524772644043, -8.654594421386719e-05, -6.943941116333008e-05, -5.233287811279297e-05, -3.522634506225586e-05, -1.811981201171875e-05, -1.0132789611816406e-06, 1.609325408935547e-05, 3.319978713989258e-05, 5.030632019042969e-05, 6.74128532409668e-05, 8.45193862915039e-05, 0.00010162591934204102, 0.00011873245239257812, 0.00013583898544311523, 0.00015294551849365234, 0.00017005205154418945, 0.00018715858459472656, 0.00020426511764526367, 0.00022137165069580078, 0.0002384781837463379, 0.000255584716796875, 0.0002726912498474121, 0.0002897977828979492, 0.00030690431594848633, 0.00032401084899902344, 0.00034111738204956055, 0.00035822391510009766, 0.00037533044815063477, 0.0003924369812011719, 0.000409543514251709, 0.0004266500473022461, 0.0004437565803527832, 0.0004608631134033203, 0.0004779696464538574, 0.0004950761795043945, 0.0005121827125549316, 0.0005292892456054688]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 12.0, 12.0, 25.0, 20.0, 28.0, 53.0, 77.0, 126.0, 210.0, 491.0, 1654.0, 1016260.0, 27997.0, 780.0, 296.0, 164.0, 102.0, 80.0, 41.0, 38.0, 12.0, 14.0, 15.0, 9.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157012939453125, -0.015190839767456055, -0.01468038558959961, -0.014169931411743164, -0.013659477233886719, -0.013149023056030273, -0.012638568878173828, -0.012128114700317383, -0.011617660522460938, -0.011107206344604492, -0.010596752166748047, -0.010086297988891602, -0.009575843811035156, -0.009065389633178711, -0.008554935455322266, -0.00804448127746582, -0.007534027099609375, -0.00702357292175293, -0.006513118743896484, -0.006002664566040039, -0.005492210388183594, -0.0049817562103271484, -0.004471302032470703, -0.003960847854614258, -0.0034503936767578125, -0.002939939498901367, -0.002429485321044922, -0.0019190311431884766, -0.0014085769653320312, -0.0008981227874755859, -0.0003876686096191406, 0.0001227855682373047, 0.00063323974609375, 0.0011436939239501953, 0.0016541481018066406, 0.002164602279663086, 0.0026750564575195312, 0.0031855106353759766, 0.003695964813232422, 0.004206418991088867, 0.0047168731689453125, 0.005227327346801758, 0.005737781524658203, 0.0062482357025146484, 0.006758689880371094, 0.007269144058227539, 0.007779598236083984, 0.00829005241394043, 0.008800506591796875, 0.00931096076965332, 0.009821414947509766, 0.010331869125366211, 0.010842323303222656, 0.011352777481079102, 0.011863231658935547, 0.012373685836791992, 0.012884140014648438, 0.013394594192504883, 0.013905048370361328, 0.014415502548217773, 0.014925956726074219, 0.015436410903930664, 0.01594686508178711, 0.016457319259643555, 0.0169677734375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 105.0, 682.0, 215.0, 9.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009810629999265075, -0.00091396807692945, -0.0008468731539323926, -0.0007797781727276742, -0.0007126832497306168, -0.0006455883267335594, -0.000578493345528841, -0.0005113984225317836, -0.00044430349953472614, -0.0003772085765376687, -0.0003101136244367808, -0.00024301868688780814, -0.00017592374933883548, -0.00010882882634177804, -4.1733874240890145e-05, 2.536107785999775e-05, 9.245600085705519e-05, 0.00015955093840602785, 0.00022664587595500052, 0.0002937408280558884, 0.00036083575105294585, 0.0004279306740500033, 0.0004950256552547216, 0.0005621205782517791, 0.0006292155012488365, 0.000696310424245894, 0.0007634053472429514, 0.0008305003284476697, 0.0008975952514447272, 0.0009646901744417846, 0.001031785155646503, 0.0010988800786435604, 0.0011659751180559397, 0.0012330700410529971, 0.0013001649640500546, 0.001367259887047112, 0.0014343548100441694, 0.0015014498494565487, 0.0015685447724536061, 0.0016356396954506636, 0.001702734618447721, 0.0017698295414447784, 0.0018369244644418359, 0.0019040193874388933, 0.0019711144268512726, 0.002038209233433008, 0.0021053042728453875, 0.0021723993122577667, 0.0022394941188395023, 0.0023065891582518816, 0.002373683964833617, 0.0024407790042459965, 0.002507873810827732, 0.0025749688502401114, 0.002642063656821847, 0.0027091586962342262, 0.002776253502815962, 0.002843348542228341, 0.0029104433488100767, 0.002977538388222456, 0.0030446331948041916, 0.003111728234216571, 0.0031788230407983065, 0.0032459180802106857, 0.003313013119623065]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 3.0, 1.0, 6.0, 11.0, 3.0, 5.0, 8.0, 10.0, 15.0, 5.0, 12.0, 29.0, 13.0, 25.0, 31.0, 33.0, 37.0, 43.0, 40.0, 34.0, 38.0, 32.0, 36.0, 36.0, 37.0, 33.0, 30.0, 32.0, 47.0, 33.0, 35.0, 28.0, 24.0, 23.0, 35.0, 16.0, 17.0, 11.0, 13.0, 12.0, 14.0, 9.0, 11.0, 11.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0002714991569519043, -0.0002638213336467743, -0.0002561435103416443, -0.0002484656870365143, -0.00024078786373138428, -0.00023311004042625427, -0.00022543221712112427, -0.00021775439381599426, -0.00021007657051086426, -0.00020239874720573425, -0.00019472092390060425, -0.00018704310059547424, -0.00017936527729034424, -0.00017168745398521423, -0.00016400963068008423, -0.00015633180737495422, -0.00014865398406982422, -0.00014097616076469421, -0.0001332983374595642, -0.0001256205141544342, -0.0001179426908493042, -0.0001102648675441742, -0.00010258704423904419, -9.490922093391418e-05, -8.723139762878418e-05, -7.955357432365417e-05, -7.187575101852417e-05, -6.419792771339417e-05, -5.652010440826416e-05, -4.8842281103134155e-05, -4.116445779800415e-05, -3.3486634492874146e-05, -2.580881118774414e-05, -1.8130987882614136e-05, -1.0453164577484131e-05, -2.775341272354126e-06, 4.902482032775879e-06, 1.2580305337905884e-05, 2.025812864303589e-05, 2.7935951948165894e-05, 3.56137752532959e-05, 4.32915985584259e-05, 5.096942186355591e-05, 5.864724516868591e-05, 6.632506847381592e-05, 7.400289177894592e-05, 8.168071508407593e-05, 8.935853838920593e-05, 9.703636169433594e-05, 0.00010471418499946594, 0.00011239200830459595, 0.00012006983160972595, 0.00012774765491485596, 0.00013542547821998596, 0.00014310330152511597, 0.00015078112483024597, 0.00015845894813537598, 0.00016613677144050598, 0.00017381459474563599, 0.000181492418050766, 0.000189170241355896, 0.000196848064661026, 0.000204525887966156, 0.000212203711271286, 0.00021988153457641602]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 13.0, 7.0, 8.0, 15.0, 13.0, 16.0, 21.0, 17.0, 25.0, 30.0, 33.0, 33.0, 36.0, 30.0, 46.0, 31.0, 35.0, 41.0, 26.0, 48.0, 40.0, 39.0, 44.0, 41.0, 27.0, 39.0, 26.0, 28.0, 29.0, 28.0, 16.0, 21.0, 19.0, 15.0, 12.0, 7.0, 14.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.1514892578125, -5.970947265625, -5.7904052734375, -5.60986328125, -5.4293212890625, -5.248779296875, -5.0682373046875, -4.8876953125, -4.7071533203125, -4.526611328125, -4.3460693359375, -4.16552734375, -3.9849853515625, -3.804443359375, -3.6239013671875, -3.443359375, -3.2628173828125, -3.082275390625, -2.9017333984375, -2.72119140625, -2.5406494140625, -2.360107421875, -2.1795654296875, -1.9990234375, -1.8184814453125, -1.637939453125, -1.4573974609375, -1.27685546875, -1.0963134765625, -0.915771484375, -0.7352294921875, -0.5546875, -0.3741455078125, -0.193603515625, -0.0130615234375, 0.16748046875, 0.3480224609375, 0.528564453125, 0.7091064453125, 0.8896484375, 1.0701904296875, 1.250732421875, 1.4312744140625, 1.61181640625, 1.7923583984375, 1.972900390625, 2.1534423828125, 2.333984375, 2.5145263671875, 2.695068359375, 2.8756103515625, 3.05615234375, 3.2366943359375, 3.417236328125, 3.5977783203125, 3.7783203125, 3.9588623046875, 4.139404296875, 4.3199462890625, 4.50048828125, 4.6810302734375, 4.861572265625, 5.0421142578125, 5.22265625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 9.0, 10.0, 11.0, 13.0, 25.0, 39.0, 49.0, 80.0, 113.0, 144.0, 227.0, 372.0, 593.0, 969.0, 1526.0, 2629.0, 4192.0, 7286.0, 12230.0, 22611.0, 43806.0, 92643.0, 232976.0, 354338.0, 139737.0, 61580.0, 30810.0, 16265.0, 9209.0, 5593.0, 3174.0, 1956.0, 1249.0, 747.0, 447.0, 283.0, 203.0, 128.0, 85.0, 61.0, 47.0, 30.0, 18.0, 14.0, 11.0, 7.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.00390625, -2.907745361328125, -2.81158447265625, -2.715423583984375, -2.6192626953125, -2.523101806640625, -2.42694091796875, -2.330780029296875, -2.234619140625, -2.138458251953125, -2.04229736328125, -1.946136474609375, -1.8499755859375, -1.753814697265625, -1.65765380859375, -1.561492919921875, -1.46533203125, -1.369171142578125, -1.27301025390625, -1.176849365234375, -1.0806884765625, -0.984527587890625, -0.88836669921875, -0.792205810546875, -0.696044921875, -0.599884033203125, -0.50372314453125, -0.407562255859375, -0.3114013671875, -0.215240478515625, -0.11907958984375, -0.022918701171875, 0.0732421875, 0.169403076171875, 0.26556396484375, 0.361724853515625, 0.4578857421875, 0.554046630859375, 0.65020751953125, 0.746368408203125, 0.842529296875, 0.938690185546875, 1.03485107421875, 1.131011962890625, 1.2271728515625, 1.323333740234375, 1.41949462890625, 1.515655517578125, 1.61181640625, 1.707977294921875, 1.80413818359375, 1.900299072265625, 1.9964599609375, 2.092620849609375, 2.18878173828125, 2.284942626953125, 2.381103515625, 2.477264404296875, 2.57342529296875, 2.669586181640625, 2.7657470703125, 2.861907958984375, 2.95806884765625, 3.054229736328125, 3.150390625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 4.0, 6.0, 7.0, 4.0, 7.0, 16.0, 12.0, 18.0, 23.0, 17.0, 27.0, 31.0, 33.0, 47.0, 52.0, 57.0, 102.0, 1565.0, 449.0, 105.0, 56.0, 53.0, 58.0, 47.0, 40.0, 31.0, 25.0, 32.0, 21.0, 22.0, 20.0, 10.0, 13.0, 6.0, 6.0, 4.0, 8.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.781982421875, -19.04833984375, -18.314697265625, -17.5810546875, -16.847412109375, -16.11376953125, -15.380126953125, -14.646484375, -13.912841796875, -13.17919921875, -12.445556640625, -11.7119140625, -10.978271484375, -10.24462890625, -9.510986328125, -8.77734375, -8.043701171875, -7.31005859375, -6.576416015625, -5.8427734375, -5.109130859375, -4.37548828125, -3.641845703125, -2.908203125, -2.174560546875, -1.44091796875, -0.707275390625, 0.0263671875, 0.760009765625, 1.49365234375, 2.227294921875, 2.9609375, 3.694580078125, 4.42822265625, 5.161865234375, 5.8955078125, 6.629150390625, 7.36279296875, 8.096435546875, 8.830078125, 9.563720703125, 10.29736328125, 11.031005859375, 11.7646484375, 12.498291015625, 13.23193359375, 13.965576171875, 14.69921875, 15.432861328125, 16.16650390625, 16.900146484375, 17.6337890625, 18.367431640625, 19.10107421875, 19.834716796875, 20.568359375, 21.302001953125, 22.03564453125, 22.769287109375, 23.5029296875, 24.236572265625, 24.97021484375, 25.703857421875, 26.4375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 12.0, 15.0, 11.0, 19.0, 26.0, 35.0, 39.0, 49.0, 55.0, 82.0, 125.0, 170.0, 249.0, 349.0, 744.0, 7047.0, 3009985.0, 123302.0, 1951.0, 480.0, 280.0, 172.0, 123.0, 82.0, 69.0, 51.0, 29.0, 29.0, 19.0, 11.0, 11.0, 10.0, 11.0, 13.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.6875, -44.2939453125, -42.900390625, -41.5068359375, -40.11328125, -38.7197265625, -37.326171875, -35.9326171875, -34.5390625, -33.1455078125, -31.751953125, -30.3583984375, -28.96484375, -27.5712890625, -26.177734375, -24.7841796875, -23.390625, -21.9970703125, -20.603515625, -19.2099609375, -17.81640625, -16.4228515625, -15.029296875, -13.6357421875, -12.2421875, -10.8486328125, -9.455078125, -8.0615234375, -6.66796875, -5.2744140625, -3.880859375, -2.4873046875, -1.09375, 0.2998046875, 1.693359375, 3.0869140625, 4.48046875, 5.8740234375, 7.267578125, 8.6611328125, 10.0546875, 11.4482421875, 12.841796875, 14.2353515625, 15.62890625, 17.0224609375, 18.416015625, 19.8095703125, 21.203125, 22.5966796875, 23.990234375, 25.3837890625, 26.77734375, 28.1708984375, 29.564453125, 30.9580078125, 32.3515625, 33.7451171875, 35.138671875, 36.5322265625, 37.92578125, 39.3193359375, 40.712890625, 42.1064453125, 43.5]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 51.0, 151.0, 372.0, 297.0, 112.0, 20.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.156606674194336, -27.310348510742188, -25.464088439941406, -23.617830276489258, -21.77157211303711, -19.925312042236328, -18.07905387878418, -16.23279571533203, -14.386536598205566, -12.540277481079102, -10.694019317626953, -8.847760200500488, -7.001501560211182, -5.155242919921875, -3.30898380279541, -1.4627256393432617, 0.3835334777832031, 2.2297921180725098, 4.076050758361816, 5.922309875488281, 7.768568515777588, 9.614827156066895, 11.46108627319336, 13.307344436645508, 15.153603553771973, 16.999862670898438, 18.846120834350586, 20.692378997802734, 22.538639068603516, 24.384897232055664, 26.231155395507812, 28.077415466308594, 29.92367172241211, 31.769929885864258, 33.616188049316406, 35.46244812011719, 37.30870819091797, 39.154964447021484, 41.001224517822266, 42.84748077392578, 44.69374084472656, 46.540000915527344, 48.38625717163086, 50.23251724243164, 52.07877731323242, 53.92503356933594, 55.77129364013672, 57.6175537109375, 59.46381378173828, 61.31007385253906, 63.15633010864258, 65.00259399414062, 66.84884643554688, 68.69510650634766, 70.54136657714844, 72.38762664794922, 74.23387908935547, 76.08013916015625, 77.92639923095703, 79.77265930175781, 81.61891174316406, 83.46517181396484, 85.31143188476562, 87.1576919555664, 89.00395202636719]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 10.0, 7.0, 6.0, 18.0, 17.0, 24.0, 14.0, 11.0, 27.0, 26.0, 30.0, 45.0, 29.0, 34.0, 32.0, 29.0, 43.0, 45.0, 59.0, 33.0, 33.0, 38.0, 38.0, 35.0, 46.0, 25.0, 30.0, 24.0, 33.0, 22.0, 21.0, 19.0, 19.0, 8.0, 16.0, 11.0, 7.0, 5.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.529762268066406, -49.7943115234375, -48.058860778808594, -46.32341384887695, -44.58796310424805, -42.85251235961914, -41.117061614990234, -39.381614685058594, -37.64616394042969, -35.91071319580078, -34.175262451171875, -32.439815521240234, -30.704364776611328, -28.968914031982422, -27.233463287353516, -25.498014450073242, -23.762563705444336, -22.02711296081543, -20.291664123535156, -18.55621337890625, -16.820764541625977, -15.08531379699707, -13.34986400604248, -11.61441421508789, -9.8789644241333, -8.143514633178711, -6.408064842224121, -4.672614574432373, -2.937164783477783, -1.2017145156860352, 0.5337352752685547, 2.2691850662231445, 4.004634857177734, 5.740084648132324, 7.475534439086914, 9.21098518371582, 10.946434020996094, 12.681884765625, 14.41733455657959, 16.15278434753418, 17.888233184814453, 19.62368392944336, 21.359132766723633, 23.09458351135254, 24.830032348632812, 26.56548309326172, 28.300933837890625, 30.0363826751709, 31.771833419799805, 33.50728225708008, 35.242733001708984, 36.97818374633789, 38.7136344909668, 40.44908142089844, 42.184532165527344, 43.91998291015625, 45.655433654785156, 47.39088439941406, 49.12633514404297, 50.86178207397461, 52.597232818603516, 54.33268356323242, 56.06813430786133, 57.80358123779297, 59.539031982421875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 10.0, 9.0, 8.0, 16.0, 11.0, 12.0, 16.0, 24.0, 28.0, 32.0, 30.0, 32.0, 41.0, 30.0, 42.0, 39.0, 37.0, 41.0, 40.0, 39.0, 40.0, 42.0, 52.0, 33.0, 29.0, 31.0, 34.0, 31.0, 24.0, 21.0, 18.0, 20.0, 19.0, 11.0, 16.0, 10.0, 7.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.75, -6.55615234375, -6.3623046875, -6.16845703125, -5.974609375, -5.78076171875, -5.5869140625, -5.39306640625, -5.19921875, -5.00537109375, -4.8115234375, -4.61767578125, -4.423828125, -4.22998046875, -4.0361328125, -3.84228515625, -3.6484375, -3.45458984375, -3.2607421875, -3.06689453125, -2.873046875, -2.67919921875, -2.4853515625, -2.29150390625, -2.09765625, -1.90380859375, -1.7099609375, -1.51611328125, -1.322265625, -1.12841796875, -0.9345703125, -0.74072265625, -0.546875, -0.35302734375, -0.1591796875, 0.03466796875, 0.228515625, 0.42236328125, 0.6162109375, 0.81005859375, 1.00390625, 1.19775390625, 1.3916015625, 1.58544921875, 1.779296875, 1.97314453125, 2.1669921875, 2.36083984375, 2.5546875, 2.74853515625, 2.9423828125, 3.13623046875, 3.330078125, 3.52392578125, 3.7177734375, 3.91162109375, 4.10546875, 4.29931640625, 4.4931640625, 4.68701171875, 4.880859375, 5.07470703125, 5.2685546875, 5.46240234375, 5.65625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 9.0, 10.0, 22.0, 26.0, 30.0, 39.0, 51.0, 59.0, 116.0, 149.0, 206.0, 373.0, 578.0, 1210.0, 2707.0, 7473.0, 29676.0, 183918.0, 1015312.0, 1962888.0, 820835.0, 133066.0, 24050.0, 6327.0, 2372.0, 1112.0, 588.0, 338.0, 217.0, 171.0, 82.0, 63.0, 46.0, 48.0, 22.0, 14.0, 19.0, 13.0, 14.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.28125, -8.9949951171875, -8.708740234375, -8.4224853515625, -8.13623046875, -7.8499755859375, -7.563720703125, -7.2774658203125, -6.9912109375, -6.7049560546875, -6.418701171875, -6.1324462890625, -5.84619140625, -5.5599365234375, -5.273681640625, -4.9874267578125, -4.701171875, -4.4149169921875, -4.128662109375, -3.8424072265625, -3.55615234375, -3.2698974609375, -2.983642578125, -2.6973876953125, -2.4111328125, -2.1248779296875, -1.838623046875, -1.5523681640625, -1.26611328125, -0.9798583984375, -0.693603515625, -0.4073486328125, -0.12109375, 0.1651611328125, 0.451416015625, 0.7376708984375, 1.02392578125, 1.3101806640625, 1.596435546875, 1.8826904296875, 2.1689453125, 2.4552001953125, 2.741455078125, 3.0277099609375, 3.31396484375, 3.6002197265625, 3.886474609375, 4.1727294921875, 4.458984375, 4.7452392578125, 5.031494140625, 5.3177490234375, 5.60400390625, 5.8902587890625, 6.176513671875, 6.4627685546875, 6.7490234375, 7.0352783203125, 7.321533203125, 7.6077880859375, 7.89404296875, 8.1802978515625, 8.466552734375, 8.7528076171875, 9.0390625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 8.0, 11.0, 16.0, 30.0, 37.0, 56.0, 68.0, 86.0, 119.0, 134.0, 209.0, 332.0, 396.0, 535.0, 506.0, 374.0, 281.0, 245.0, 178.0, 116.0, 95.0, 66.0, 46.0, 35.0, 26.0, 19.0, 17.0, 11.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.3631591796875, -11.906005859375, -11.4488525390625, -10.99169921875, -10.5345458984375, -10.077392578125, -9.6202392578125, -9.1630859375, -8.7059326171875, -8.248779296875, -7.7916259765625, -7.33447265625, -6.8773193359375, -6.420166015625, -5.9630126953125, -5.505859375, -5.0487060546875, -4.591552734375, -4.1343994140625, -3.67724609375, -3.2200927734375, -2.762939453125, -2.3057861328125, -1.8486328125, -1.3914794921875, -0.934326171875, -0.4771728515625, -0.02001953125, 0.4371337890625, 0.894287109375, 1.3514404296875, 1.80859375, 2.2657470703125, 2.722900390625, 3.1800537109375, 3.63720703125, 4.0943603515625, 4.551513671875, 5.0086669921875, 5.4658203125, 5.9229736328125, 6.380126953125, 6.8372802734375, 7.29443359375, 7.7515869140625, 8.208740234375, 8.6658935546875, 9.123046875, 9.5802001953125, 10.037353515625, 10.4945068359375, 10.95166015625, 11.4088134765625, 11.865966796875, 12.3231201171875, 12.7802734375, 13.2374267578125, 13.694580078125, 14.1517333984375, 14.60888671875, 15.0660400390625, 15.523193359375, 15.9803466796875, 16.4375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 9.0, 12.0, 18.0, 24.0, 25.0, 36.0, 37.0, 54.0, 87.0, 115.0, 167.0, 267.0, 429.0, 1373.0, 137776.0, 4044247.0, 7766.0, 740.0, 361.0, 201.0, 138.0, 110.0, 63.0, 53.0, 38.0, 33.0, 20.0, 16.0, 17.0, 8.0, 9.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15625, -59.95849609375, -57.7607421875, -55.56298828125, -53.365234375, -51.16748046875, -48.9697265625, -46.77197265625, -44.57421875, -42.37646484375, -40.1787109375, -37.98095703125, -35.783203125, -33.58544921875, -31.3876953125, -29.18994140625, -26.9921875, -24.79443359375, -22.5966796875, -20.39892578125, -18.201171875, -16.00341796875, -13.8056640625, -11.60791015625, -9.41015625, -7.21240234375, -5.0146484375, -2.81689453125, -0.619140625, 1.57861328125, 3.7763671875, 5.97412109375, 8.171875, 10.36962890625, 12.5673828125, 14.76513671875, 16.962890625, 19.16064453125, 21.3583984375, 23.55615234375, 25.75390625, 27.95166015625, 30.1494140625, 32.34716796875, 34.544921875, 36.74267578125, 38.9404296875, 41.13818359375, 43.3359375, 45.53369140625, 47.7314453125, 49.92919921875, 52.126953125, 54.32470703125, 56.5224609375, 58.72021484375, 60.91796875, 63.11572265625, 65.3134765625, 67.51123046875, 69.708984375, 71.90673828125, 74.1044921875, 76.30224609375, 78.5]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 16.0, 194.0, 529.0, 245.0, 28.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.300514221191406, -44.32118225097656, -36.34185028076172, -28.362516403198242, -20.3831844329834, -12.403850555419922, -4.424518585205078, 3.5548133850097656, 11.53414535522461, 19.513477325439453, 27.492809295654297, 35.472145080566406, 43.45147705078125, 51.430809020996094, 59.41014099121094, 67.38947296142578, 75.36880493164062, 83.34813690185547, 91.32746887207031, 99.30680084228516, 107.2861328125, 115.26547241210938, 123.24479675292969, 131.22413635253906, 139.20346069335938, 147.18280029296875, 155.16212463378906, 163.14146423339844, 171.12078857421875, 179.10012817382812, 187.07945251464844, 195.0587921142578, 203.0381317138672, 211.01747131347656, 218.99679565429688, 226.97613525390625, 234.95545959472656, 242.93479919433594, 250.91412353515625, 258.8934631347656, 266.872802734375, 274.8521423339844, 282.83148193359375, 290.810791015625, 298.7901306152344, 306.76947021484375, 314.7488098144531, 322.7281188964844, 330.70745849609375, 338.6867980957031, 346.6661376953125, 354.64544677734375, 362.6247863769531, 370.6041259765625, 378.5834655761719, 386.5627746582031, 394.5421142578125, 402.5214538574219, 410.50079345703125, 418.4801025390625, 426.4594421386719, 434.43878173828125, 442.4181213378906, 450.3974304199219, 458.37677001953125]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 7.0, 10.0, 13.0, 12.0, 14.0, 25.0, 22.0, 22.0, 31.0, 27.0, 27.0, 37.0, 38.0, 30.0, 41.0, 38.0, 34.0, 43.0, 45.0, 53.0, 42.0, 17.0, 42.0, 41.0, 26.0, 25.0, 33.0, 29.0, 27.0, 26.0, 26.0, 14.0, 13.0, 9.0, 13.0, 8.0, 3.0, 8.0, 8.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.74163055419922, -44.348087310791016, -42.95454788208008, -41.561004638671875, -40.16746520996094, -38.773921966552734, -37.38037872314453, -35.986839294433594, -34.59329605102539, -33.19975280761719, -31.80621337890625, -30.412670135498047, -29.019128799438477, -27.625587463378906, -26.232046127319336, -24.838504791259766, -23.444963455200195, -22.051422119140625, -20.657880783081055, -19.264339447021484, -17.87079620361328, -16.47725486755371, -15.08371353149414, -13.690171241760254, -12.296629905700684, -10.903088569641113, -9.509546279907227, -8.116004943847656, -6.722463130950928, -5.328921318054199, -3.935379981994629, -2.541837692260742, -1.1482963562011719, 0.2452453374862671, 1.638787031173706, 3.0323286056518555, 4.425870418548584, 5.8194122314453125, 7.212953567504883, 8.60649585723877, 10.00003719329834, 11.39357852935791, 12.787120819091797, 14.180662155151367, 15.574203491210938, 16.96774673461914, 18.361286163330078, 19.75482940673828, 21.14837074279785, 22.541912078857422, 23.935453414916992, 25.328994750976562, 26.722537994384766, 28.116079330444336, 29.509620666503906, 30.90316390991211, 32.29670333862305, 33.69024658203125, 35.08378601074219, 36.47732925415039, 37.87086868286133, 39.26441192626953, 40.65795135498047, 42.05149459838867, 43.445037841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 2.0, 6.0, 6.0, 14.0, 16.0, 9.0, 17.0, 15.0, 25.0, 37.0, 25.0, 25.0, 28.0, 36.0, 42.0, 49.0, 43.0, 47.0, 37.0, 51.0, 44.0, 43.0, 40.0, 37.0, 43.0, 33.0, 40.0, 24.0, 35.0, 26.0, 26.0, 17.0, 12.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.90234375, -6.6944580078125, -6.486572265625, -6.2786865234375, -6.07080078125, -5.8629150390625, -5.655029296875, -5.4471435546875, -5.2392578125, -5.0313720703125, -4.823486328125, -4.6156005859375, -4.40771484375, -4.1998291015625, -3.991943359375, -3.7840576171875, -3.576171875, -3.3682861328125, -3.160400390625, -2.9525146484375, -2.74462890625, -2.5367431640625, -2.328857421875, -2.1209716796875, -1.9130859375, -1.7052001953125, -1.497314453125, -1.2894287109375, -1.08154296875, -0.8736572265625, -0.665771484375, -0.4578857421875, -0.25, -0.0421142578125, 0.165771484375, 0.3736572265625, 0.58154296875, 0.7894287109375, 0.997314453125, 1.2052001953125, 1.4130859375, 1.6209716796875, 1.828857421875, 2.0367431640625, 2.24462890625, 2.4525146484375, 2.660400390625, 2.8682861328125, 3.076171875, 3.2840576171875, 3.491943359375, 3.6998291015625, 3.90771484375, 4.1156005859375, 4.323486328125, 4.5313720703125, 4.7392578125, 4.9471435546875, 5.155029296875, 5.3629150390625, 5.57080078125, 5.7786865234375, 5.986572265625, 6.1944580078125, 6.40234375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 15.0, 20.0, 24.0, 39.0, 61.0, 93.0, 133.0, 236.0, 333.0, 534.0, 864.0, 1294.0, 2130.0, 3409.0, 5581.0, 8892.0, 14662.0, 24440.0, 42134.0, 74351.0, 136709.0, 251402.0, 214002.0, 113439.0, 63492.0, 35997.0, 21129.0, 12519.0, 7876.0, 4749.0, 2916.0, 1851.0, 1167.0, 714.0, 469.0, 287.0, 229.0, 126.0, 77.0, 46.0, 42.0, 22.0, 15.0, 8.0, 7.0, 8.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9233932495117188, -0.8902435302734375, -0.8570938110351562, -0.823944091796875, -0.7907943725585938, -0.7576446533203125, -0.7244949340820312, -0.69134521484375, -0.6581954956054688, -0.6250457763671875, -0.5918960571289062, -0.558746337890625, -0.5255966186523438, -0.4924468994140625, -0.45929718017578125, -0.4261474609375, -0.39299774169921875, -0.3598480224609375, -0.32669830322265625, -0.293548583984375, -0.26039886474609375, -0.2272491455078125, -0.19409942626953125, -0.16094970703125, -0.12779998779296875, -0.0946502685546875, -0.06150054931640625, -0.028350830078125, 0.00479888916015625, 0.0379486083984375, 0.07109832763671875, 0.104248046875, 0.13739776611328125, 0.1705474853515625, 0.20369720458984375, 0.236846923828125, 0.26999664306640625, 0.3031463623046875, 0.33629608154296875, 0.36944580078125, 0.40259552001953125, 0.4357452392578125, 0.46889495849609375, 0.502044677734375, 0.5351943969726562, 0.5683441162109375, 0.6014938354492188, 0.6346435546875, 0.6677932739257812, 0.7009429931640625, 0.7340927124023438, 0.767242431640625, 0.8003921508789062, 0.8335418701171875, 0.8666915893554688, 0.89984130859375, 0.9329910278320312, 0.9661407470703125, 0.9992904663085938, 1.032440185546875, 1.0655899047851562, 1.0987396240234375, 1.1318893432617188, 1.1650390625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 4.0, 10.0, 8.0, 11.0, 10.0, 13.0, 26.0, 27.0, 13.0, 27.0, 35.0, 29.0, 29.0, 42.0, 35.0, 40.0, 33.0, 51.0, 48.0, 1065.0, 41.0, 41.0, 32.0, 41.0, 42.0, 31.0, 28.0, 36.0, 26.0, 16.0, 26.0, 19.0, 8.0, 14.0, 14.0, 6.0, 3.0, 9.0, 5.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.443359375, -3.325775146484375, -3.20819091796875, -3.090606689453125, -2.9730224609375, -2.855438232421875, -2.73785400390625, -2.620269775390625, -2.502685546875, -2.385101318359375, -2.26751708984375, -2.149932861328125, -2.0323486328125, -1.914764404296875, -1.79718017578125, -1.679595947265625, -1.56201171875, -1.444427490234375, -1.32684326171875, -1.209259033203125, -1.0916748046875, -0.974090576171875, -0.85650634765625, -0.738922119140625, -0.621337890625, -0.503753662109375, -0.38616943359375, -0.268585205078125, -0.1510009765625, -0.033416748046875, 0.08416748046875, 0.201751708984375, 0.3193359375, 0.436920166015625, 0.55450439453125, 0.672088623046875, 0.7896728515625, 0.907257080078125, 1.02484130859375, 1.142425537109375, 1.260009765625, 1.377593994140625, 1.49517822265625, 1.612762451171875, 1.7303466796875, 1.847930908203125, 1.96551513671875, 2.083099365234375, 2.20068359375, 2.318267822265625, 2.43585205078125, 2.553436279296875, 2.6710205078125, 2.788604736328125, 2.90618896484375, 3.023773193359375, 3.141357421875, 3.258941650390625, 3.37652587890625, 3.494110107421875, 3.6116943359375, 3.729278564453125, 3.84686279296875, 3.964447021484375, 4.08203125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 16.0, 11.0, 23.0, 45.0, 53.0, 97.0, 118.0, 214.0, 267.0, 421.0, 574.0, 856.0, 1314.0, 2002.0, 3115.0, 4649.0, 7316.0, 11763.0, 18493.0, 30250.0, 50059.0, 85780.0, 159367.0, 1323726.0, 170074.0, 89833.0, 52398.0, 31235.0, 19162.0, 11937.0, 7608.0, 4863.0, 3198.0, 2044.0, 1376.0, 983.0, 604.0, 392.0, 267.0, 199.0, 131.0, 100.0, 59.0, 45.0, 31.0, 27.0, 12.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.95556640625, -0.9270782470703125, -0.898590087890625, -0.8701019287109375, -0.84161376953125, -0.8131256103515625, -0.784637451171875, -0.7561492919921875, -0.7276611328125, -0.6991729736328125, -0.670684814453125, -0.6421966552734375, -0.61370849609375, -0.5852203369140625, -0.556732177734375, -0.5282440185546875, -0.499755859375, -0.4712677001953125, -0.442779541015625, -0.4142913818359375, -0.38580322265625, -0.3573150634765625, -0.328826904296875, -0.3003387451171875, -0.2718505859375, -0.2433624267578125, -0.214874267578125, -0.1863861083984375, -0.15789794921875, -0.1294097900390625, -0.100921630859375, -0.0724334716796875, -0.0439453125, -0.0154571533203125, 0.013031005859375, 0.0415191650390625, 0.07000732421875, 0.0984954833984375, 0.126983642578125, 0.1554718017578125, 0.1839599609375, 0.2124481201171875, 0.240936279296875, 0.2694244384765625, 0.29791259765625, 0.3264007568359375, 0.354888916015625, 0.3833770751953125, 0.411865234375, 0.4403533935546875, 0.468841552734375, 0.4973297119140625, 0.52581787109375, 0.5543060302734375, 0.582794189453125, 0.6112823486328125, 0.6397705078125, 0.6682586669921875, 0.696746826171875, 0.7252349853515625, 0.75372314453125, 0.7822113037109375, 0.810699462890625, 0.8391876220703125, 0.86767578125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 11.0, 11.0, 11.0, 22.0, 20.0, 26.0, 32.0, 36.0, 53.0, 71.0, 82.0, 69.0, 82.0, 78.0, 58.0, 76.0, 40.0, 41.0, 34.0, 33.0, 19.0, 21.0, 11.0, 10.0, 7.0, 11.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000858306884765625, -0.0008352473378181458, -0.0008121877908706665, -0.0007891282439231873, -0.000766068696975708, -0.0007430091500282288, -0.0007199496030807495, -0.0006968900561332703, -0.000673830509185791, -0.0006507709622383118, -0.0006277114152908325, -0.0006046518683433533, -0.000581592321395874, -0.0005585327744483948, -0.0005354732275009155, -0.0005124136805534363, -0.000489354133605957, -0.0004662945866584778, -0.00044323503971099854, -0.0004201754927635193, -0.00039711594581604004, -0.0003740563988685608, -0.00035099685192108154, -0.0003279373049736023, -0.00030487775802612305, -0.0002818182110786438, -0.00025875866413116455, -0.0002356991171836853, -0.00021263957023620605, -0.0001895800232887268, -0.00016652047634124756, -0.0001434609293937683, -0.00012040138244628906, -9.734183549880981e-05, -7.428228855133057e-05, -5.122274160385132e-05, -2.816319465637207e-05, -5.103647708892822e-06, 1.7955899238586426e-05, 4.1015446186065674e-05, 6.407499313354492e-05, 8.713454008102417e-05, 0.00011019408702850342, 0.00013325363397598267, 0.00015631318092346191, 0.00017937272787094116, 0.0002024322748184204, 0.00022549182176589966, 0.0002485513687133789, 0.00027161091566085815, 0.0002946704626083374, 0.00031773000955581665, 0.0003407895565032959, 0.00036384910345077515, 0.0003869086503982544, 0.00040996819734573364, 0.0004330277442932129, 0.00045608729124069214, 0.0004791468381881714, 0.0005022063851356506, 0.0005252659320831299, 0.0005483254790306091, 0.0005713850259780884, 0.0005944445729255676, 0.0006175041198730469]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 9.0, 4.0, 8.0, 4.0, 13.0, 15.0, 25.0, 28.0, 29.0, 45.0, 49.0, 98.0, 126.0, 229.0, 505.0, 2101.0, 1024475.0, 19171.0, 811.0, 314.0, 152.0, 94.0, 61.0, 45.0, 35.0, 24.0, 23.0, 17.0, 12.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01293182373046875, -0.01240837574005127, -0.011884927749633789, -0.011361479759216309, -0.010838031768798828, -0.010314583778381348, -0.009791135787963867, -0.009267687797546387, -0.008744239807128906, -0.008220791816711426, -0.007697343826293945, -0.007173895835876465, -0.006650447845458984, -0.006126999855041504, -0.0056035518646240234, -0.005080103874206543, -0.0045566558837890625, -0.004033207893371582, -0.0035097599029541016, -0.002986311912536621, -0.0024628639221191406, -0.0019394159317016602, -0.0014159679412841797, -0.0008925199508666992, -0.00036907196044921875, 0.00015437602996826172, 0.0006778240203857422, 0.0012012720108032227, 0.0017247200012207031, 0.0022481679916381836, 0.002771615982055664, 0.0032950639724731445, 0.003818511962890625, 0.0043419599533081055, 0.004865407943725586, 0.005388855934143066, 0.005912303924560547, 0.006435751914978027, 0.006959199905395508, 0.007482647895812988, 0.008006095886230469, 0.00852954387664795, 0.00905299186706543, 0.00957643985748291, 0.01009988784790039, 0.010623335838317871, 0.011146783828735352, 0.011670231819152832, 0.012193679809570312, 0.012717127799987793, 0.013240575790405273, 0.013764023780822754, 0.014287471771240234, 0.014810919761657715, 0.015334367752075195, 0.015857815742492676, 0.016381263732910156, 0.016904711723327637, 0.017428159713745117, 0.017951607704162598, 0.018475055694580078, 0.01899850368499756, 0.01952195167541504, 0.02004539966583252, 0.02056884765625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 206.0, 599.0, 181.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001273144967854023, -0.001213787472806871, -0.001154429977759719, -0.0010950724827125669, -0.0010357149876654148, -0.0009763575508259237, -0.0009170001139864326, -0.0008576426189392805, -0.0007982851238921285, -0.0007389276288449764, -0.0006795701337978244, -0.0006202126969583333, -0.0005608552019111812, -0.0005014977068640292, -0.0004421402409207076, -0.000382782774977386, -0.00032342527993023396, -0.0002640677848830819, -0.00020471031893976033, -0.0001453528384445235, -8.59953579492867e-05, -2.6637862902134657e-05, 3.271960304118693e-05, 9.207706898450851e-05, 0.00015143456403166056, 0.00021079204452689737, 0.0002701495250221342, 0.00032950699096545577, 0.0003888644860126078, 0.00044822198105975986, 0.000507579417899251, 0.000566936912946403, 0.0006262944079935551, 0.0006856519030407071, 0.0007450093980878592, 0.0008043668349273503, 0.0008637243299745023, 0.0009230818250216544, 0.0009824392618611455, 0.0010417967569082975, 0.0011011542519554496, 0.0011605117470026016, 0.0012198692420497537, 0.0012792267370969057, 0.001338584115728736, 0.0013979417271912098, 0.00145729910582304, 0.001516656600870192, 0.001576014095917344, 0.0016353715909644961, 0.0016947290860116482, 0.0017540865810588002, 0.0018134440761059523, 0.0018728014547377825, 0.0019321589497849345, 0.0019915164448320866, 0.0020508738234639168, 0.002110231202095747, 0.002169588813558221, 0.002228946192190051, 0.002288303803652525, 0.002347661182284355, 0.002407018793746829, 0.0024663761723786592, 0.002525733783841133]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 7.0, 8.0, 15.0, 13.0, 17.0, 12.0, 21.0, 20.0, 25.0, 31.0, 38.0, 41.0, 35.0, 35.0, 50.0, 38.0, 58.0, 40.0, 45.0, 39.0, 47.0, 53.0, 39.0, 48.0, 41.0, 23.0, 25.0, 28.0, 23.0, 22.0, 11.0, 13.0, 7.0, 9.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00037992000579833984, -0.0003685504198074341, -0.0003571808338165283, -0.00034581124782562256, -0.0003344416618347168, -0.00032307207584381104, -0.0003117024898529053, -0.0003003329038619995, -0.00028896331787109375, -0.000277593731880188, -0.0002662241458892822, -0.00025485455989837646, -0.0002434849739074707, -0.00023211538791656494, -0.00022074580192565918, -0.00020937621593475342, -0.00019800662994384766, -0.0001866370439529419, -0.00017526745796203613, -0.00016389787197113037, -0.0001525282859802246, -0.00014115869998931885, -0.00012978911399841309, -0.00011841952800750732, -0.00010704994201660156, -9.56803560256958e-05, -8.431077003479004e-05, -7.294118404388428e-05, -6.157159805297852e-05, -5.0202012062072754e-05, -3.883242607116699e-05, -2.746284008026123e-05, -1.609325408935547e-05, -4.723668098449707e-06, 6.645917892456055e-06, 1.8015503883361816e-05, 2.9385089874267578e-05, 4.075467586517334e-05, 5.21242618560791e-05, 6.349384784698486e-05, 7.486343383789062e-05, 8.623301982879639e-05, 9.760260581970215e-05, 0.00010897219181060791, 0.00012034177780151367, 0.00013171136379241943, 0.0001430809497833252, 0.00015445053577423096, 0.00016582012176513672, 0.00017718970775604248, 0.00018855929374694824, 0.000199928879737854, 0.00021129846572875977, 0.00022266805171966553, 0.0002340376377105713, 0.00024540722370147705, 0.0002567768096923828, 0.0002681463956832886, 0.00027951598167419434, 0.0002908855676651001, 0.00030225515365600586, 0.0003136247396469116, 0.0003249943256378174, 0.00033636391162872314, 0.0003477334976196289]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 2.0, 6.0, 6.0, 14.0, 16.0, 9.0, 17.0, 15.0, 25.0, 37.0, 25.0, 25.0, 28.0, 36.0, 42.0, 49.0, 43.0, 47.0, 37.0, 51.0, 44.0, 43.0, 40.0, 38.0, 42.0, 33.0, 40.0, 24.0, 35.0, 26.0, 26.0, 17.0, 12.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.90234375, -6.6944580078125, -6.486572265625, -6.2786865234375, -6.07080078125, -5.8629150390625, -5.655029296875, -5.4471435546875, -5.2392578125, -5.0313720703125, -4.823486328125, -4.6156005859375, -4.40771484375, -4.1998291015625, -3.991943359375, -3.7840576171875, -3.576171875, -3.3682861328125, -3.160400390625, -2.9525146484375, -2.74462890625, -2.5367431640625, -2.328857421875, -2.1209716796875, -1.9130859375, -1.7052001953125, -1.497314453125, -1.2894287109375, -1.08154296875, -0.8736572265625, -0.665771484375, -0.4578857421875, -0.25, -0.0421142578125, 0.165771484375, 0.3736572265625, 0.58154296875, 0.7894287109375, 0.997314453125, 1.2052001953125, 1.4130859375, 1.6209716796875, 1.828857421875, 2.0367431640625, 2.24462890625, 2.4525146484375, 2.660400390625, 2.8682861328125, 3.076171875, 3.2840576171875, 3.491943359375, 3.6998291015625, 3.90771484375, 4.1156005859375, 4.323486328125, 4.5313720703125, 4.7392578125, 4.9471435546875, 5.155029296875, 5.3629150390625, 5.57080078125, 5.7786865234375, 5.986572265625, 6.1944580078125, 6.40234375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 19.0, 18.0, 14.0, 22.0, 35.0, 65.0, 92.0, 106.0, 161.0, 232.0, 362.0, 594.0, 1046.0, 1934.0, 3851.0, 8274.0, 17506.0, 37971.0, 84670.0, 199725.0, 366990.0, 180739.0, 77462.0, 35009.0, 16119.0, 7426.0, 3543.0, 1886.0, 954.0, 566.0, 384.0, 244.0, 149.0, 115.0, 74.0, 61.0, 33.0, 30.0, 13.0, 13.0, 12.0, 12.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.75177001953125, -3.6285400390625, -3.50531005859375, -3.382080078125, -3.25885009765625, -3.1356201171875, -3.01239013671875, -2.88916015625, -2.76593017578125, -2.6427001953125, -2.51947021484375, -2.396240234375, -2.27301025390625, -2.1497802734375, -2.02655029296875, -1.9033203125, -1.78009033203125, -1.6568603515625, -1.53363037109375, -1.410400390625, -1.28717041015625, -1.1639404296875, -1.04071044921875, -0.91748046875, -0.79425048828125, -0.6710205078125, -0.54779052734375, -0.424560546875, -0.30133056640625, -0.1781005859375, -0.05487060546875, 0.068359375, 0.19158935546875, 0.3148193359375, 0.43804931640625, 0.561279296875, 0.68450927734375, 0.8077392578125, 0.93096923828125, 1.05419921875, 1.17742919921875, 1.3006591796875, 1.42388916015625, 1.547119140625, 1.67034912109375, 1.7935791015625, 1.91680908203125, 2.0400390625, 2.16326904296875, 2.2864990234375, 2.40972900390625, 2.532958984375, 2.65618896484375, 2.7794189453125, 2.90264892578125, 3.02587890625, 3.14910888671875, 3.2723388671875, 3.39556884765625, 3.518798828125, 3.64202880859375, 3.7652587890625, 3.88848876953125, 4.01171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 4.0, 3.0, 1.0, 4.0, 9.0, 10.0, 11.0, 11.0, 16.0, 24.0, 33.0, 31.0, 39.0, 25.0, 44.0, 53.0, 53.0, 61.0, 111.0, 1536.0, 454.0, 121.0, 58.0, 41.0, 48.0, 37.0, 32.0, 31.0, 30.0, 28.0, 17.0, 13.0, 12.0, 9.0, 10.0, 6.0, 8.0, 9.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-28.84375, -28.063720703125, -27.28369140625, -26.503662109375, -25.7236328125, -24.943603515625, -24.16357421875, -23.383544921875, -22.603515625, -21.823486328125, -21.04345703125, -20.263427734375, -19.4833984375, -18.703369140625, -17.92333984375, -17.143310546875, -16.36328125, -15.583251953125, -14.80322265625, -14.023193359375, -13.2431640625, -12.463134765625, -11.68310546875, -10.903076171875, -10.123046875, -9.343017578125, -8.56298828125, -7.782958984375, -7.0029296875, -6.222900390625, -5.44287109375, -4.662841796875, -3.8828125, -3.102783203125, -2.32275390625, -1.542724609375, -0.7626953125, 0.017333984375, 0.79736328125, 1.577392578125, 2.357421875, 3.137451171875, 3.91748046875, 4.697509765625, 5.4775390625, 6.257568359375, 7.03759765625, 7.817626953125, 8.59765625, 9.377685546875, 10.15771484375, 10.937744140625, 11.7177734375, 12.497802734375, 13.27783203125, 14.057861328125, 14.837890625, 15.617919921875, 16.39794921875, 17.177978515625, 17.9580078125, 18.738037109375, 19.51806640625, 20.298095703125, 21.078125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 8.0, 12.0, 10.0, 10.0, 20.0, 21.0, 22.0, 30.0, 48.0, 75.0, 94.0, 125.0, 164.0, 281.0, 456.0, 1595.0, 78745.0, 3056121.0, 5950.0, 705.0, 344.0, 238.0, 174.0, 105.0, 70.0, 72.0, 44.0, 39.0, 33.0, 15.0, 19.0, 12.0, 12.0, 9.0, 4.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.25, -46.4794921875, -44.708984375, -42.9384765625, -41.16796875, -39.3974609375, -37.626953125, -35.8564453125, -34.0859375, -32.3154296875, -30.544921875, -28.7744140625, -27.00390625, -25.2333984375, -23.462890625, -21.6923828125, -19.921875, -18.1513671875, -16.380859375, -14.6103515625, -12.83984375, -11.0693359375, -9.298828125, -7.5283203125, -5.7578125, -3.9873046875, -2.216796875, -0.4462890625, 1.32421875, 3.0947265625, 4.865234375, 6.6357421875, 8.40625, 10.1767578125, 11.947265625, 13.7177734375, 15.48828125, 17.2587890625, 19.029296875, 20.7998046875, 22.5703125, 24.3408203125, 26.111328125, 27.8818359375, 29.65234375, 31.4228515625, 33.193359375, 34.9638671875, 36.734375, 38.5048828125, 40.275390625, 42.0458984375, 43.81640625, 45.5869140625, 47.357421875, 49.1279296875, 50.8984375, 52.6689453125, 54.439453125, 56.2099609375, 57.98046875, 59.7509765625, 61.521484375, 63.2919921875, 65.0625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 34.0, 95.0, 232.0, 364.0, 198.0, 65.0, 14.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.634822845458984, -10.941692352294922, -9.248560905456543, -7.555429935455322, -5.862298965454102, -4.169168472290039, -2.47603702545166, -0.7829055786132812, 0.9102249145507812, 2.603355884552002, 4.296486854553223, 5.989617824554443, 7.682748794555664, 9.375879287719727, 11.069010734558105, 12.762142181396484, 14.455272674560547, 16.14840316772461, 17.841533660888672, 19.534666061401367, 21.22779655456543, 22.920927047729492, 24.614059448242188, 26.30718994140625, 28.000320434570312, 29.693450927734375, 31.386581420898438, 33.0797119140625, 34.77284240722656, 36.465972900390625, 38.15910720825195, 39.852237701416016, 41.54536437988281, 43.238494873046875, 44.93162536621094, 46.624755859375, 48.31788635253906, 50.011016845703125, 51.70415115356445, 53.397281646728516, 55.09041213989258, 56.78354263305664, 58.4766731262207, 60.169803619384766, 61.862937927246094, 63.556068420410156, 65.24919891357422, 66.94232940673828, 68.63545989990234, 70.3285903930664, 72.02172088623047, 73.71485137939453, 75.4079818725586, 77.10111236572266, 78.79424285888672, 80.48738098144531, 82.18051147460938, 83.87364196777344, 85.5667724609375, 87.25990295410156, 88.95303344726562, 90.64616394042969, 92.33929443359375, 94.03242492675781, 95.72555541992188]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 2.0, 6.0, 6.0, 11.0, 9.0, 9.0, 20.0, 21.0, 22.0, 29.0, 25.0, 31.0, 32.0, 47.0, 34.0, 43.0, 48.0, 46.0, 40.0, 49.0, 49.0, 62.0, 26.0, 48.0, 49.0, 37.0, 37.0, 37.0, 25.0, 20.0, 20.0, 21.0, 15.0, 7.0, 5.0, 4.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.82101058959961, -55.9080924987793, -53.995174407958984, -52.08225631713867, -50.169334411621094, -48.25641632080078, -46.34349822998047, -44.430580139160156, -42.517662048339844, -40.60474395751953, -38.69182586669922, -36.778907775878906, -34.865989685058594, -32.95307159423828, -31.040149688720703, -29.12723159790039, -27.214313507080078, -25.301395416259766, -23.388477325439453, -21.475557327270508, -19.562639236450195, -17.649721145629883, -15.736802101135254, -13.823883056640625, -11.910964965820312, -9.998046875, -8.085127830505371, -6.1722092628479, -4.25929069519043, -2.346372604370117, -0.4334535598754883, 1.4794654846191406, 3.3923873901367188, 5.3053059577941895, 7.21822452545166, 9.131143569946289, 11.044061660766602, 12.956979751586914, 14.869898796081543, 16.782817840576172, 18.695735931396484, 20.608654022216797, 22.52157211303711, 24.434492111206055, 26.347410202026367, 28.26032829284668, 30.173248291015625, 32.08616638183594, 33.99908447265625, 35.91200256347656, 37.824920654296875, 39.73783874511719, 41.6507568359375, 43.56367492675781, 45.47659683227539, 47.3895149230957, 49.302433013916016, 51.21535110473633, 53.12826919555664, 55.04118728637695, 56.95410919189453, 58.867027282714844, 60.779945373535156, 62.69286346435547, 64.60578155517578]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 4.0, 8.0, 16.0, 14.0, 11.0, 17.0, 25.0, 19.0, 23.0, 20.0, 41.0, 31.0, 37.0, 40.0, 36.0, 47.0, 54.0, 44.0, 46.0, 55.0, 38.0, 27.0, 40.0, 46.0, 38.0, 27.0, 38.0, 28.0, 23.0, 25.0, 26.0, 11.0, 10.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.97265625, -6.75579833984375, -6.5389404296875, -6.32208251953125, -6.105224609375, -5.88836669921875, -5.6715087890625, -5.45465087890625, -5.23779296875, -5.02093505859375, -4.8040771484375, -4.58721923828125, -4.370361328125, -4.15350341796875, -3.9366455078125, -3.71978759765625, -3.5029296875, -3.28607177734375, -3.0692138671875, -2.85235595703125, -2.635498046875, -2.41864013671875, -2.2017822265625, -1.98492431640625, -1.76806640625, -1.55120849609375, -1.3343505859375, -1.11749267578125, -0.900634765625, -0.68377685546875, -0.4669189453125, -0.25006103515625, -0.033203125, 0.18365478515625, 0.4005126953125, 0.61737060546875, 0.834228515625, 1.05108642578125, 1.2679443359375, 1.48480224609375, 1.70166015625, 1.91851806640625, 2.1353759765625, 2.35223388671875, 2.569091796875, 2.78594970703125, 3.0028076171875, 3.21966552734375, 3.4365234375, 3.65338134765625, 3.8702392578125, 4.08709716796875, 4.303955078125, 4.52081298828125, 4.7376708984375, 4.95452880859375, 5.17138671875, 5.38824462890625, 5.6051025390625, 5.82196044921875, 6.038818359375, 6.25567626953125, 6.4725341796875, 6.68939208984375, 6.90625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 6.0, 7.0, 14.0, 19.0, 16.0, 17.0, 24.0, 28.0, 33.0, 28.0, 43.0, 47.0, 86.0, 295.0, 1455.0, 31883.0, 2953219.0, 1195165.0, 10505.0, 816.0, 193.0, 77.0, 45.0, 48.0, 33.0, 33.0, 30.0, 24.0, 17.0, 22.0, 13.0, 5.0, 10.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.53125, -25.642578125, -24.75390625, -23.865234375, -22.9765625, -22.087890625, -21.19921875, -20.310546875, -19.421875, -18.533203125, -17.64453125, -16.755859375, -15.8671875, -14.978515625, -14.08984375, -13.201171875, -12.3125, -11.423828125, -10.53515625, -9.646484375, -8.7578125, -7.869140625, -6.98046875, -6.091796875, -5.203125, -4.314453125, -3.42578125, -2.537109375, -1.6484375, -0.759765625, 0.12890625, 1.017578125, 1.90625, 2.794921875, 3.68359375, 4.572265625, 5.4609375, 6.349609375, 7.23828125, 8.126953125, 9.015625, 9.904296875, 10.79296875, 11.681640625, 12.5703125, 13.458984375, 14.34765625, 15.236328125, 16.125, 17.013671875, 17.90234375, 18.791015625, 19.6796875, 20.568359375, 21.45703125, 22.345703125, 23.234375, 24.123046875, 25.01171875, 25.900390625, 26.7890625, 27.677734375, 28.56640625, 29.455078125, 30.34375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 9.0, 6.0, 12.0, 18.0, 16.0, 29.0, 19.0, 54.0, 64.0, 83.0, 97.0, 160.0, 167.0, 239.0, 297.0, 397.0, 482.0, 432.0, 350.0, 286.0, 206.0, 173.0, 118.0, 82.0, 87.0, 40.0, 41.0, 33.0, 21.0, 16.0, 13.0, 6.0, 12.0, 7.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1484375, -12.7479248046875, -12.347412109375, -11.9468994140625, -11.54638671875, -11.1458740234375, -10.745361328125, -10.3448486328125, -9.9443359375, -9.5438232421875, -9.143310546875, -8.7427978515625, -8.34228515625, -7.9417724609375, -7.541259765625, -7.1407470703125, -6.740234375, -6.3397216796875, -5.939208984375, -5.5386962890625, -5.13818359375, -4.7376708984375, -4.337158203125, -3.9366455078125, -3.5361328125, -3.1356201171875, -2.735107421875, -2.3345947265625, -1.93408203125, -1.5335693359375, -1.133056640625, -0.7325439453125, -0.33203125, 0.0684814453125, 0.468994140625, 0.8695068359375, 1.27001953125, 1.6705322265625, 2.071044921875, 2.4715576171875, 2.8720703125, 3.2725830078125, 3.673095703125, 4.0736083984375, 4.47412109375, 4.8746337890625, 5.275146484375, 5.6756591796875, 6.076171875, 6.4766845703125, 6.877197265625, 7.2777099609375, 7.67822265625, 8.0787353515625, 8.479248046875, 8.8797607421875, 9.2802734375, 9.6807861328125, 10.081298828125, 10.4818115234375, 10.88232421875, 11.2828369140625, 11.683349609375, 12.0838623046875, 12.484375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 16.0, 17.0, 14.0, 26.0, 18.0, 26.0, 41.0, 49.0, 74.0, 84.0, 138.0, 173.0, 288.0, 554.0, 2531.0, 1972171.0, 2213831.0, 2561.0, 603.0, 310.0, 208.0, 136.0, 90.0, 79.0, 48.0, 26.0, 34.0, 25.0, 24.0, 9.0, 10.0, 9.0, 11.0, 14.0, 3.0, 4.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.375, -63.2666015625, -61.158203125, -59.0498046875, -56.94140625, -54.8330078125, -52.724609375, -50.6162109375, -48.5078125, -46.3994140625, -44.291015625, -42.1826171875, -40.07421875, -37.9658203125, -35.857421875, -33.7490234375, -31.640625, -29.5322265625, -27.423828125, -25.3154296875, -23.20703125, -21.0986328125, -18.990234375, -16.8818359375, -14.7734375, -12.6650390625, -10.556640625, -8.4482421875, -6.33984375, -4.2314453125, -2.123046875, -0.0146484375, 2.09375, 4.2021484375, 6.310546875, 8.4189453125, 10.52734375, 12.6357421875, 14.744140625, 16.8525390625, 18.9609375, 21.0693359375, 23.177734375, 25.2861328125, 27.39453125, 29.5029296875, 31.611328125, 33.7197265625, 35.828125, 37.9365234375, 40.044921875, 42.1533203125, 44.26171875, 46.3701171875, 48.478515625, 50.5869140625, 52.6953125, 54.8037109375, 56.912109375, 59.0205078125, 61.12890625, 63.2373046875, 65.345703125, 67.4541015625, 69.5625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [4.0, 5.0, 100.0, 481.0, 361.0, 65.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.876556396484375, -22.218677520751953, -14.560799598693848, -6.902921676635742, 0.7549571990966797, 8.412834167480469, 16.07071304321289, 23.728591918945312, 31.386470794677734, 39.044349670410156, 46.70222854614258, 54.360107421875, 62.017982482910156, 69.67585754394531, 77.333740234375, 84.99162292480469, 92.64949798583984, 100.307373046875, 107.96525573730469, 115.62313079833984, 123.28101348876953, 130.9388885498047, 138.59677124023438, 146.254638671875, 153.9125213623047, 161.57040405273438, 169.228271484375, 176.8861541748047, 184.54403686523438, 192.201904296875, 199.8597869873047, 207.51766967773438, 215.17555236816406, 222.83343505859375, 230.49130249023438, 238.14918518066406, 245.80706787109375, 253.46493530273438, 261.1228332519531, 268.78070068359375, 276.4385681152344, 284.096435546875, 291.75433349609375, 299.4122009277344, 307.070068359375, 314.72796630859375, 322.3858337402344, 330.043701171875, 337.70159912109375, 345.3594665527344, 353.0173645019531, 360.67523193359375, 368.3330993652344, 375.9909973144531, 383.64886474609375, 391.3067626953125, 398.9646301269531, 406.62249755859375, 414.2803955078125, 421.9382629394531, 429.59613037109375, 437.2540283203125, 444.9118957519531, 452.56976318359375, 460.2276611328125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 7.0, 4.0, 8.0, 4.0, 13.0, 12.0, 22.0, 20.0, 16.0, 17.0, 26.0, 27.0, 19.0, 26.0, 20.0, 30.0, 44.0, 53.0, 39.0, 31.0, 43.0, 41.0, 43.0, 40.0, 40.0, 34.0, 29.0, 43.0, 31.0, 17.0, 25.0, 20.0, 28.0, 15.0, 18.0, 16.0, 17.0, 15.0, 8.0, 13.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0], "bins": [-43.180816650390625, -41.95011520385742, -40.71941375732422, -39.488712310791016, -38.25801086425781, -37.02730941772461, -35.796607971191406, -34.56590270996094, -33.335205078125, -32.1045036315918, -30.873802185058594, -29.64310073852539, -28.412399291992188, -27.181697845458984, -25.95099449157715, -24.720293045043945, -23.48958969116211, -22.258888244628906, -21.028186798095703, -19.7974853515625, -18.566783905029297, -17.336082458496094, -16.105379104614258, -14.874677658081055, -13.643976211547852, -12.413274765014648, -11.182573318481445, -9.951870918273926, -8.721169471740723, -7.4904680252075195, -6.259766101837158, -5.029064178466797, -3.798358917236328, -2.567657232284546, -1.3369555473327637, -0.10625386238098145, 1.1244478225708008, 2.355149269104004, 3.5858511924743652, 4.816553115844727, 6.04725456237793, 7.277956008911133, 8.508657455444336, 9.739359855651855, 10.970061302185059, 12.200762748718262, 13.431465148925781, 14.662166595458984, 15.892868041992188, 17.12356948852539, 18.354270935058594, 19.584972381591797, 20.815673828125, 22.046375274658203, 23.27707862854004, 24.507780075073242, 25.738481521606445, 26.96918296813965, 28.19988441467285, 29.430585861206055, 30.66128921508789, 31.891990661621094, 33.1226921081543, 34.3533935546875, 35.5840950012207]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 16.0, 14.0, 23.0, 18.0, 30.0, 24.0, 28.0, 35.0, 36.0, 33.0, 42.0, 46.0, 50.0, 44.0, 41.0, 45.0, 50.0, 38.0, 34.0, 41.0, 40.0, 37.0, 37.0, 31.0, 27.0, 26.0, 18.0, 13.0, 11.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.40625, -7.18658447265625, -6.9669189453125, -6.74725341796875, -6.527587890625, -6.30792236328125, -6.0882568359375, -5.86859130859375, -5.64892578125, -5.42926025390625, -5.2095947265625, -4.98992919921875, -4.770263671875, -4.55059814453125, -4.3309326171875, -4.11126708984375, -3.8916015625, -3.67193603515625, -3.4522705078125, -3.23260498046875, -3.012939453125, -2.79327392578125, -2.5736083984375, -2.35394287109375, -2.13427734375, -1.91461181640625, -1.6949462890625, -1.47528076171875, -1.255615234375, -1.03594970703125, -0.8162841796875, -0.59661865234375, -0.376953125, -0.15728759765625, 0.0623779296875, 0.28204345703125, 0.501708984375, 0.72137451171875, 0.9410400390625, 1.16070556640625, 1.38037109375, 1.60003662109375, 1.8197021484375, 2.03936767578125, 2.259033203125, 2.47869873046875, 2.6983642578125, 2.91802978515625, 3.1376953125, 3.35736083984375, 3.5770263671875, 3.79669189453125, 4.016357421875, 4.23602294921875, 4.4556884765625, 4.67535400390625, 4.89501953125, 5.11468505859375, 5.3343505859375, 5.55401611328125, 5.773681640625, 5.99334716796875, 6.2130126953125, 6.43267822265625, 6.65234375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 28.0, 30.0, 42.0, 59.0, 96.0, 119.0, 208.0, 312.0, 477.0, 735.0, 1123.0, 1750.0, 2727.0, 4466.0, 6779.0, 10907.0, 17343.0, 27910.0, 45204.0, 75650.0, 128731.0, 226243.0, 203187.0, 116444.0, 67905.0, 41163.0, 25756.0, 15902.0, 9932.0, 6246.0, 3893.0, 2545.0, 1611.0, 1035.0, 672.0, 477.0, 247.0, 191.0, 131.0, 80.0, 63.0, 38.0, 25.0, 14.0, 14.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.0224609375, -0.9913864135742188, -0.9603118896484375, -0.9292373657226562, -0.898162841796875, -0.8670883178710938, -0.8360137939453125, -0.8049392700195312, -0.77386474609375, -0.7427902221679688, -0.7117156982421875, -0.6806411743164062, -0.649566650390625, -0.6184921264648438, -0.5874176025390625, -0.5563430786132812, -0.5252685546875, -0.49419403076171875, -0.4631195068359375, -0.43204498291015625, -0.400970458984375, -0.36989593505859375, -0.3388214111328125, -0.30774688720703125, -0.27667236328125, -0.24559783935546875, -0.2145233154296875, -0.18344879150390625, -0.152374267578125, -0.12129974365234375, -0.0902252197265625, -0.05915069580078125, -0.028076171875, 0.00299835205078125, 0.0340728759765625, 0.06514739990234375, 0.096221923828125, 0.12729644775390625, 0.1583709716796875, 0.18944549560546875, 0.22052001953125, 0.25159454345703125, 0.2826690673828125, 0.31374359130859375, 0.344818115234375, 0.37589263916015625, 0.4069671630859375, 0.43804168701171875, 0.4691162109375, 0.5001907348632812, 0.5312652587890625, 0.5623397827148438, 0.593414306640625, 0.6244888305664062, 0.6555633544921875, 0.6866378784179688, 0.71771240234375, 0.7487869262695312, 0.7798614501953125, 0.8109359741210938, 0.842010498046875, 0.8730850219726562, 0.9041595458984375, 0.9352340698242188, 0.96630859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 8.0, 8.0, 10.0, 15.0, 10.0, 9.0, 22.0, 22.0, 31.0, 21.0, 35.0, 31.0, 28.0, 36.0, 25.0, 40.0, 44.0, 36.0, 21.0, 1074.0, 39.0, 47.0, 40.0, 45.0, 31.0, 31.0, 26.0, 33.0, 25.0, 22.0, 27.0, 15.0, 19.0, 13.0, 20.0, 10.0, 10.0, 6.0, 6.0, 1.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.23046875, -4.110504150390625, -3.99053955078125, -3.870574951171875, -3.7506103515625, -3.630645751953125, -3.51068115234375, -3.390716552734375, -3.270751953125, -3.150787353515625, -3.03082275390625, -2.910858154296875, -2.7908935546875, -2.670928955078125, -2.55096435546875, -2.430999755859375, -2.31103515625, -2.191070556640625, -2.07110595703125, -1.951141357421875, -1.8311767578125, -1.711212158203125, -1.59124755859375, -1.471282958984375, -1.351318359375, -1.231353759765625, -1.11138916015625, -0.991424560546875, -0.8714599609375, -0.751495361328125, -0.63153076171875, -0.511566162109375, -0.3916015625, -0.271636962890625, -0.15167236328125, -0.031707763671875, 0.0882568359375, 0.208221435546875, 0.32818603515625, 0.448150634765625, 0.568115234375, 0.688079833984375, 0.80804443359375, 0.928009033203125, 1.0479736328125, 1.167938232421875, 1.28790283203125, 1.407867431640625, 1.52783203125, 1.647796630859375, 1.76776123046875, 1.887725830078125, 2.0076904296875, 2.127655029296875, 2.24761962890625, 2.367584228515625, 2.487548828125, 2.607513427734375, 2.72747802734375, 2.847442626953125, 2.9674072265625, 3.087371826171875, 3.20733642578125, 3.327301025390625, 3.447265625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 7.0, 1.0, 12.0, 9.0, 16.0, 36.0, 42.0, 60.0, 100.0, 137.0, 226.0, 321.0, 480.0, 745.0, 1147.0, 1760.0, 2647.0, 4067.0, 6166.0, 9447.0, 14891.0, 23799.0, 38560.0, 63901.0, 110809.0, 207837.0, 1290866.0, 128780.0, 73040.0, 43675.0, 26538.0, 16804.0, 10623.0, 6832.0, 4327.0, 2890.0, 1933.0, 1219.0, 840.0, 520.0, 336.0, 214.0, 177.0, 104.0, 82.0, 37.0, 36.0, 16.0, 11.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89013671875, -0.8605880737304688, -0.8310394287109375, -0.8014907836914062, -0.771942138671875, -0.7423934936523438, -0.7128448486328125, -0.6832962036132812, -0.65374755859375, -0.6241989135742188, -0.5946502685546875, -0.5651016235351562, -0.535552978515625, -0.5060043334960938, -0.4764556884765625, -0.44690704345703125, -0.4173583984375, -0.38780975341796875, -0.3582611083984375, -0.32871246337890625, -0.299163818359375, -0.26961517333984375, -0.2400665283203125, -0.21051788330078125, -0.18096923828125, -0.15142059326171875, -0.1218719482421875, -0.09232330322265625, -0.062774658203125, -0.03322601318359375, -0.0036773681640625, 0.02587127685546875, 0.055419921875, 0.08496856689453125, 0.1145172119140625, 0.14406585693359375, 0.173614501953125, 0.20316314697265625, 0.2327117919921875, 0.26226043701171875, 0.29180908203125, 0.32135772705078125, 0.3509063720703125, 0.38045501708984375, 0.410003662109375, 0.43955230712890625, 0.4691009521484375, 0.49864959716796875, 0.5281982421875, 0.5577468872070312, 0.5872955322265625, 0.6168441772460938, 0.646392822265625, 0.6759414672851562, 0.7054901123046875, 0.7350387573242188, 0.76458740234375, 0.7941360473632812, 0.8236846923828125, 0.8532333374023438, 0.882781982421875, 0.9123306274414062, 0.9418792724609375, 0.9714279174804688, 1.0009765625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 8.0, 6.0, 14.0, 11.0, 16.0, 14.0, 23.0, 21.0, 31.0, 40.0, 57.0, 56.0, 68.0, 59.0, 74.0, 92.0, 77.0, 61.0, 63.0, 37.0, 29.0, 28.0, 25.0, 17.0, 14.0, 5.0, 10.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008139610290527344, -0.0007902905344963074, -0.0007666200399398804, -0.0007429495453834534, -0.0007192790508270264, -0.0006956085562705994, -0.0006719380617141724, -0.0006482675671577454, -0.0006245970726013184, -0.0006009265780448914, -0.0005772560834884644, -0.0005535855889320374, -0.0005299150943756104, -0.0005062445998191833, -0.00048257410526275635, -0.00045890361070632935, -0.00043523311614990234, -0.00041156262159347534, -0.00038789212703704834, -0.00036422163248062134, -0.00034055113792419434, -0.00031688064336776733, -0.00029321014881134033, -0.00026953965425491333, -0.00024586915969848633, -0.00022219866514205933, -0.00019852817058563232, -0.00017485767602920532, -0.00015118718147277832, -0.00012751668691635132, -0.00010384619235992432, -8.017569780349731e-05, -5.650520324707031e-05, -3.283470869064331e-05, -9.164214134216309e-06, 1.4506280422210693e-05, 3.8176774978637695e-05, 6.18472695350647e-05, 8.55177640914917e-05, 0.0001091882586479187, 0.0001328587532043457, 0.0001565292477607727, 0.0001801997423171997, 0.0002038702368736267, 0.0002275407314300537, 0.0002512112259864807, 0.0002748817205429077, 0.0002985522150993347, 0.0003222227096557617, 0.0003458932042121887, 0.0003695636987686157, 0.0003932341933250427, 0.0004169046878814697, 0.00044057518243789673, 0.00046424567699432373, 0.00048791617155075073, 0.0005115866661071777, 0.0005352571606636047, 0.0005589276552200317, 0.0005825981497764587, 0.0006062686443328857, 0.0006299391388893127, 0.0006536096334457397, 0.0006772801280021667, 0.0007009506225585938]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 11.0, 15.0, 18.0, 20.0, 40.0, 41.0, 80.0, 133.0, 251.0, 602.0, 3234.0, 1037664.0, 5091.0, 679.0, 228.0, 115.0, 77.0, 60.0, 36.0, 31.0, 16.0, 15.0, 6.0, 15.0, 9.0, 16.0, 5.0, 7.0, 3.0, 5.0, 2.0, 0.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.017578125, -0.01702094078063965, -0.016463756561279297, -0.015906572341918945, -0.015349388122558594, -0.014792203903198242, -0.01423501968383789, -0.013677835464477539, -0.013120651245117188, -0.012563467025756836, -0.012006282806396484, -0.011449098587036133, -0.010891914367675781, -0.01033473014831543, -0.009777545928955078, -0.009220361709594727, -0.008663177490234375, -0.008105993270874023, -0.007548809051513672, -0.00699162483215332, -0.006434440612792969, -0.005877256393432617, -0.005320072174072266, -0.004762887954711914, -0.0042057037353515625, -0.003648519515991211, -0.0030913352966308594, -0.002534151077270508, -0.0019769668579101562, -0.0014197826385498047, -0.0008625984191894531, -0.00030541419982910156, 0.00025177001953125, 0.0008089542388916016, 0.0013661384582519531, 0.0019233226776123047, 0.0024805068969726562, 0.003037691116333008, 0.0035948753356933594, 0.004152059555053711, 0.0047092437744140625, 0.005266427993774414, 0.005823612213134766, 0.006380796432495117, 0.006937980651855469, 0.00749516487121582, 0.008052349090576172, 0.008609533309936523, 0.009166717529296875, 0.009723901748657227, 0.010281085968017578, 0.01083827018737793, 0.011395454406738281, 0.011952638626098633, 0.012509822845458984, 0.013067007064819336, 0.013624191284179688, 0.014181375503540039, 0.01473855972290039, 0.015295743942260742, 0.015852928161621094, 0.016410112380981445, 0.016967296600341797, 0.01752448081970215, 0.0180816650390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 231.0, 734.0, 47.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005053344066254795, -0.0004097155178897083, -0.0003140966291539371, -0.00021847771131433547, -0.00012285882257856429, -2.7239933842793107e-05, 6.837898399680853e-05, 0.0001639978727325797, 0.0002596167614683509, 0.00035523565020412207, 0.00045085453893989325, 0.0005464734276756644, 0.0006420923164114356, 0.0007377112051472068, 0.0008333301520906389, 0.0009289490408264101, 0.0010245679877698421, 0.0011201868765056133, 0.0012158057652413845, 0.0013114246539771557, 0.0014070435427129269, 0.001502662431448698, 0.0015982813201844692, 0.0016939002089202404, 0.0017895190976560116, 0.0018851379863917828, 0.001980756875127554, 0.002076375763863325, 0.0021719946525990963, 0.0022676135413348675, 0.0023632324300706387, 0.00245885131880641, 0.0025544704403728247, 0.002650089329108596, 0.002745708217844367, 0.002841327106580138, 0.0029369459953159094, 0.0030325648840516806, 0.0031281837727874517, 0.003223802661523223, 0.003319421550258994, 0.0034150404389947653, 0.0035106593277305365, 0.0036062782164663076, 0.003701897105202079, 0.00379751599393785, 0.003893134882673621, 0.003988754004240036, 0.004084372892975807, 0.004179991781711578, 0.0042756106704473495, 0.004371229559183121, 0.004466848447918892, 0.004562467336654663, 0.004658086225390434, 0.0047537051141262054, 0.004849324002861977, 0.004944942891597748, 0.005040561780333519, 0.00513618066906929, 0.005231799557805061, 0.0053274184465408325, 0.005423037335276604, 0.005518656224012375, 0.005614275112748146]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 1.0, 2.0, 9.0, 8.0, 8.0, 9.0, 9.0, 16.0, 12.0, 22.0, 19.0, 25.0, 31.0, 39.0, 35.0, 35.0, 32.0, 24.0, 34.0, 40.0, 33.0, 36.0, 54.0, 54.0, 41.0, 32.0, 35.0, 39.0, 27.0, 21.0, 23.0, 22.0, 17.0, 28.0, 17.0, 12.0, 17.0, 13.0, 8.0, 9.0, 11.0, 5.0, 9.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00034803152084350586, -0.00033771153539419174, -0.0003273915499448776, -0.0003170715644955635, -0.0003067515790462494, -0.00029643159359693527, -0.00028611160814762115, -0.00027579162269830704, -0.0002654716372489929, -0.0002551516517996788, -0.0002448316663503647, -0.00023451168090105057, -0.00022419169545173645, -0.00021387171000242233, -0.00020355172455310822, -0.0001932317391037941, -0.00018291175365447998, -0.00017259176820516586, -0.00016227178275585175, -0.00015195179730653763, -0.0001416318118572235, -0.0001313118264079094, -0.00012099184095859528, -0.00011067185550928116, -0.00010035187005996704, -9.003188461065292e-05, -7.97118991613388e-05, -6.939191371202469e-05, -5.907192826271057e-05, -4.8751942813396454e-05, -3.8431957364082336e-05, -2.811197191476822e-05, -1.77919864654541e-05, -7.472001016139984e-06, 2.8479844331741333e-06, 1.316796988248825e-05, 2.3487955331802368e-05, 3.3807940781116486e-05, 4.41279262304306e-05, 5.444791167974472e-05, 6.476789712905884e-05, 7.508788257837296e-05, 8.540786802768707e-05, 9.572785347700119e-05, 0.00010604783892631531, 0.00011636782437562943, 0.00012668780982494354, 0.00013700779527425766, 0.00014732778072357178, 0.0001576477661728859, 0.0001679677516222, 0.00017828773707151413, 0.00018860772252082825, 0.00019892770797014236, 0.00020924769341945648, 0.0002195676788687706, 0.00022988766431808472, 0.00024020764976739883, 0.00025052763521671295, 0.00026084762066602707, 0.0002711676061153412, 0.0002814875915646553, 0.0002918075770139694, 0.00030212756246328354, 0.00031244754791259766]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 16.0, 14.0, 23.0, 18.0, 30.0, 24.0, 28.0, 35.0, 36.0, 33.0, 42.0, 46.0, 50.0, 44.0, 41.0, 45.0, 50.0, 38.0, 34.0, 41.0, 40.0, 37.0, 37.0, 31.0, 27.0, 26.0, 18.0, 13.0, 11.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.40625, -7.18658447265625, -6.9669189453125, -6.74725341796875, -6.527587890625, -6.30792236328125, -6.0882568359375, -5.86859130859375, -5.64892578125, -5.42926025390625, -5.2095947265625, -4.98992919921875, -4.770263671875, -4.55059814453125, -4.3309326171875, -4.11126708984375, -3.8916015625, -3.67193603515625, -3.4522705078125, -3.23260498046875, -3.012939453125, -2.79327392578125, -2.5736083984375, -2.35394287109375, -2.13427734375, -1.91461181640625, -1.6949462890625, -1.47528076171875, -1.255615234375, -1.03594970703125, -0.8162841796875, -0.59661865234375, -0.376953125, -0.15728759765625, 0.0623779296875, 0.28204345703125, 0.501708984375, 0.72137451171875, 0.9410400390625, 1.16070556640625, 1.38037109375, 1.60003662109375, 1.8197021484375, 2.03936767578125, 2.259033203125, 2.47869873046875, 2.6983642578125, 2.91802978515625, 3.1376953125, 3.35736083984375, 3.5770263671875, 3.79669189453125, 4.016357421875, 4.23602294921875, 4.4556884765625, 4.67535400390625, 4.89501953125, 5.11468505859375, 5.3343505859375, 5.55401611328125, 5.773681640625, 5.99334716796875, 6.2130126953125, 6.43267822265625, 6.65234375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 6.0, 10.0, 13.0, 15.0, 35.0, 28.0, 52.0, 47.0, 86.0, 107.0, 177.0, 235.0, 363.0, 543.0, 940.0, 1699.0, 3707.0, 9049.0, 23893.0, 69892.0, 207955.0, 466905.0, 170120.0, 57509.0, 20433.0, 7543.0, 3199.0, 1536.0, 851.0, 491.0, 314.0, 241.0, 165.0, 103.0, 68.0, 61.0, 51.0, 32.0, 21.0, 16.0, 4.0, 8.0, 9.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.453125, -5.2899169921875, -5.126708984375, -4.9635009765625, -4.80029296875, -4.6370849609375, -4.473876953125, -4.3106689453125, -4.1474609375, -3.9842529296875, -3.821044921875, -3.6578369140625, -3.49462890625, -3.3314208984375, -3.168212890625, -3.0050048828125, -2.841796875, -2.6785888671875, -2.515380859375, -2.3521728515625, -2.18896484375, -2.0257568359375, -1.862548828125, -1.6993408203125, -1.5361328125, -1.3729248046875, -1.209716796875, -1.0465087890625, -0.88330078125, -0.7200927734375, -0.556884765625, -0.3936767578125, -0.23046875, -0.0672607421875, 0.095947265625, 0.2591552734375, 0.42236328125, 0.5855712890625, 0.748779296875, 0.9119873046875, 1.0751953125, 1.2384033203125, 1.401611328125, 1.5648193359375, 1.72802734375, 1.8912353515625, 2.054443359375, 2.2176513671875, 2.380859375, 2.5440673828125, 2.707275390625, 2.8704833984375, 3.03369140625, 3.1968994140625, 3.360107421875, 3.5233154296875, 3.6865234375, 3.8497314453125, 4.012939453125, 4.1761474609375, 4.33935546875, 4.5025634765625, 4.665771484375, 4.8289794921875, 4.9921875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 1.0, 4.0, 4.0, 8.0, 7.0, 6.0, 8.0, 15.0, 13.0, 14.0, 13.0, 18.0, 28.0, 20.0, 26.0, 26.0, 37.0, 36.0, 38.0, 57.0, 80.0, 74.0, 317.0, 1597.0, 125.0, 70.0, 57.0, 59.0, 37.0, 45.0, 37.0, 28.0, 25.0, 23.0, 16.0, 20.0, 10.0, 8.0, 11.0, 11.0, 3.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.46875, -23.792236328125, -23.11572265625, -22.439208984375, -21.7626953125, -21.086181640625, -20.40966796875, -19.733154296875, -19.056640625, -18.380126953125, -17.70361328125, -17.027099609375, -16.3505859375, -15.674072265625, -14.99755859375, -14.321044921875, -13.64453125, -12.968017578125, -12.29150390625, -11.614990234375, -10.9384765625, -10.261962890625, -9.58544921875, -8.908935546875, -8.232421875, -7.555908203125, -6.87939453125, -6.202880859375, -5.5263671875, -4.849853515625, -4.17333984375, -3.496826171875, -2.8203125, -2.143798828125, -1.46728515625, -0.790771484375, -0.1142578125, 0.562255859375, 1.23876953125, 1.915283203125, 2.591796875, 3.268310546875, 3.94482421875, 4.621337890625, 5.2978515625, 5.974365234375, 6.65087890625, 7.327392578125, 8.00390625, 8.680419921875, 9.35693359375, 10.033447265625, 10.7099609375, 11.386474609375, 12.06298828125, 12.739501953125, 13.416015625, 14.092529296875, 14.76904296875, 15.445556640625, 16.1220703125, 16.798583984375, 17.47509765625, 18.151611328125, 18.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 20.0, 16.0, 19.0, 45.0, 53.0, 67.0, 105.0, 163.0, 217.0, 342.0, 694.0, 6205.0, 3121553.0, 14089.0, 876.0, 359.0, 227.0, 161.0, 124.0, 94.0, 54.0, 53.0, 30.0, 30.0, 26.0, 20.0, 14.0, 11.0, 4.0, 7.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-73.8125, -71.79443359375, -69.7763671875, -67.75830078125, -65.740234375, -63.72216796875, -61.7041015625, -59.68603515625, -57.66796875, -55.64990234375, -53.6318359375, -51.61376953125, -49.595703125, -47.57763671875, -45.5595703125, -43.54150390625, -41.5234375, -39.50537109375, -37.4873046875, -35.46923828125, -33.451171875, -31.43310546875, -29.4150390625, -27.39697265625, -25.37890625, -23.36083984375, -21.3427734375, -19.32470703125, -17.306640625, -15.28857421875, -13.2705078125, -11.25244140625, -9.234375, -7.21630859375, -5.1982421875, -3.18017578125, -1.162109375, 0.85595703125, 2.8740234375, 4.89208984375, 6.91015625, 8.92822265625, 10.9462890625, 12.96435546875, 14.982421875, 17.00048828125, 19.0185546875, 21.03662109375, 23.0546875, 25.07275390625, 27.0908203125, 29.10888671875, 31.126953125, 33.14501953125, 35.1630859375, 37.18115234375, 39.19921875, 41.21728515625, 43.2353515625, 45.25341796875, 47.271484375, 49.28955078125, 51.3076171875, 53.32568359375, 55.34375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 24.0, 117.0, 426.0, 339.0, 96.0, 8.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.97565841674805, -46.39053726196289, -43.805416107177734, -41.22029113769531, -38.635169982910156, -36.050048828125, -33.464927673339844, -30.879804611206055, -28.2946834564209, -25.709562301635742, -23.124439239501953, -20.539318084716797, -17.95419692993164, -15.369073867797852, -12.783952713012695, -10.198829650878906, -7.61370849609375, -5.028586387634277, -2.443464756011963, 0.14165687561035156, 2.726778984069824, 5.311901092529297, 7.897022247314453, 10.482145309448242, 13.067266464233398, 15.652388572692871, 18.237510681152344, 20.8226318359375, 23.407752990722656, 25.992876052856445, 28.5779972076416, 31.16312026977539, 33.74823760986328, 36.33335876464844, 38.918479919433594, 41.50360107421875, 44.08872604370117, 46.67384719848633, 49.258968353271484, 51.844093322753906, 54.42921447753906, 57.01433563232422, 59.599456787109375, 62.18457794189453, 64.76969909667969, 67.35482788085938, 69.93994140625, 72.52507019042969, 75.11018371582031, 77.69530487060547, 80.28042602539062, 82.86554718017578, 85.45066833496094, 88.03579711914062, 90.62091064453125, 93.20603942871094, 95.7911605834961, 98.37628173828125, 100.9614028930664, 103.54652404785156, 106.13164520263672, 108.71676635742188, 111.30189514160156, 113.88701629638672, 116.47213745117188]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 8.0, 8.0, 3.0, 7.0, 10.0, 13.0, 17.0, 15.0, 26.0, 20.0, 29.0, 21.0, 32.0, 36.0, 39.0, 39.0, 35.0, 35.0, 42.0, 41.0, 40.0, 28.0, 44.0, 52.0, 46.0, 26.0, 40.0, 27.0, 32.0, 22.0, 27.0, 24.0, 19.0, 12.0, 12.0, 16.0, 7.0, 9.0, 1.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-63.36546325683594, -61.41703414916992, -59.46860885620117, -57.520179748535156, -55.571754455566406, -53.62332534790039, -51.674896240234375, -49.726470947265625, -47.77804183959961, -45.829612731933594, -43.881187438964844, -41.93275833129883, -39.98432922363281, -38.03590393066406, -36.08747482299805, -34.13904571533203, -32.19062042236328, -30.2421932220459, -28.293766021728516, -26.3453369140625, -24.396909713745117, -22.448482513427734, -20.50005340576172, -18.551626205444336, -16.603199005126953, -14.65477180480957, -12.706343650817871, -10.757915496826172, -8.809488296508789, -6.861061096191406, -4.912632942199707, -2.964204788208008, -1.015777587890625, 0.932650089263916, 2.881077766418457, 4.829505443572998, 6.777933120727539, 8.726360321044922, 10.674788475036621, 12.62321662902832, 14.571643829345703, 16.520071029663086, 18.46849822998047, 20.416927337646484, 22.365354537963867, 24.31378173828125, 26.262210845947266, 28.21063804626465, 30.15906524658203, 32.10749435424805, 34.0559196472168, 36.00434875488281, 37.95277404785156, 39.90120315551758, 41.849632263183594, 43.798057556152344, 45.74648666381836, 47.694915771484375, 49.643341064453125, 51.59177017211914, 53.540199279785156, 55.488624572753906, 57.43705368041992, 59.38548278808594, 61.33390808105469]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 17.0, 19.0, 21.0, 22.0, 16.0, 28.0, 20.0, 44.0, 30.0, 30.0, 41.0, 47.0, 48.0, 44.0, 50.0, 41.0, 34.0, 34.0, 38.0, 37.0, 37.0, 40.0, 41.0, 32.0, 28.0, 21.0, 20.0, 18.0, 20.0, 14.0, 9.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.2109375, -6.98712158203125, -6.7633056640625, -6.53948974609375, -6.315673828125, -6.09185791015625, -5.8680419921875, -5.64422607421875, -5.42041015625, -5.19659423828125, -4.9727783203125, -4.74896240234375, -4.525146484375, -4.30133056640625, -4.0775146484375, -3.85369873046875, -3.6298828125, -3.40606689453125, -3.1822509765625, -2.95843505859375, -2.734619140625, -2.51080322265625, -2.2869873046875, -2.06317138671875, -1.83935546875, -1.61553955078125, -1.3917236328125, -1.16790771484375, -0.944091796875, -0.72027587890625, -0.4964599609375, -0.27264404296875, -0.048828125, 0.17498779296875, 0.3988037109375, 0.62261962890625, 0.846435546875, 1.07025146484375, 1.2940673828125, 1.51788330078125, 1.74169921875, 1.96551513671875, 2.1893310546875, 2.41314697265625, 2.636962890625, 2.86077880859375, 3.0845947265625, 3.30841064453125, 3.5322265625, 3.75604248046875, 3.9798583984375, 4.20367431640625, 4.427490234375, 4.65130615234375, 4.8751220703125, 5.09893798828125, 5.32275390625, 5.54656982421875, 5.7703857421875, 5.99420166015625, 6.218017578125, 6.44183349609375, 6.6656494140625, 6.88946533203125, 7.11328125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 12.0, 16.0, 11.0, 10.0, 17.0, 18.0, 24.0, 28.0, 23.0, 31.0, 40.0, 41.0, 72.0, 169.0, 553.0, 2700.0, 61131.0, 3086468.0, 1028382.0, 12504.0, 1251.0, 338.0, 106.0, 62.0, 41.0, 33.0, 35.0, 30.0, 12.0, 21.0, 23.0, 19.0, 11.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.171875, -24.3544921875, -23.537109375, -22.7197265625, -21.90234375, -21.0849609375, -20.267578125, -19.4501953125, -18.6328125, -17.8154296875, -16.998046875, -16.1806640625, -15.36328125, -14.5458984375, -13.728515625, -12.9111328125, -12.09375, -11.2763671875, -10.458984375, -9.6416015625, -8.82421875, -8.0068359375, -7.189453125, -6.3720703125, -5.5546875, -4.7373046875, -3.919921875, -3.1025390625, -2.28515625, -1.4677734375, -0.650390625, 0.1669921875, 0.984375, 1.8017578125, 2.619140625, 3.4365234375, 4.25390625, 5.0712890625, 5.888671875, 6.7060546875, 7.5234375, 8.3408203125, 9.158203125, 9.9755859375, 10.79296875, 11.6103515625, 12.427734375, 13.2451171875, 14.0625, 14.8798828125, 15.697265625, 16.5146484375, 17.33203125, 18.1494140625, 18.966796875, 19.7841796875, 20.6015625, 21.4189453125, 22.236328125, 23.0537109375, 23.87109375, 24.6884765625, 25.505859375, 26.3232421875, 27.140625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 7.0, 15.0, 19.0, 17.0, 32.0, 46.0, 43.0, 91.0, 103.0, 129.0, 168.0, 230.0, 320.0, 378.0, 442.0, 487.0, 385.0, 304.0, 218.0, 162.0, 123.0, 78.0, 64.0, 45.0, 46.0, 28.0, 20.0, 14.0, 10.0, 10.0, 5.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.071533203125, -10.65869140625, -10.245849609375, -9.8330078125, -9.420166015625, -9.00732421875, -8.594482421875, -8.181640625, -7.768798828125, -7.35595703125, -6.943115234375, -6.5302734375, -6.117431640625, -5.70458984375, -5.291748046875, -4.87890625, -4.466064453125, -4.05322265625, -3.640380859375, -3.2275390625, -2.814697265625, -2.40185546875, -1.989013671875, -1.576171875, -1.163330078125, -0.75048828125, -0.337646484375, 0.0751953125, 0.488037109375, 0.90087890625, 1.313720703125, 1.7265625, 2.139404296875, 2.55224609375, 2.965087890625, 3.3779296875, 3.790771484375, 4.20361328125, 4.616455078125, 5.029296875, 5.442138671875, 5.85498046875, 6.267822265625, 6.6806640625, 7.093505859375, 7.50634765625, 7.919189453125, 8.33203125, 8.744873046875, 9.15771484375, 9.570556640625, 9.9833984375, 10.396240234375, 10.80908203125, 11.221923828125, 11.634765625, 12.047607421875, 12.46044921875, 12.873291015625, 13.2861328125, 13.698974609375, 14.11181640625, 14.524658203125, 14.9375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 16.0, 18.0, 24.0, 23.0, 42.0, 51.0, 64.0, 82.0, 97.0, 139.0, 191.0, 237.0, 403.0, 732.0, 6149.0, 4022252.0, 160889.0, 1190.0, 476.0, 314.0, 206.0, 154.0, 121.0, 90.0, 73.0, 48.0, 38.0, 31.0, 29.0, 17.0, 13.0, 13.0, 14.0, 4.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.59375, -60.48876953125, -58.3837890625, -56.27880859375, -54.173828125, -52.06884765625, -49.9638671875, -47.85888671875, -45.75390625, -43.64892578125, -41.5439453125, -39.43896484375, -37.333984375, -35.22900390625, -33.1240234375, -31.01904296875, -28.9140625, -26.80908203125, -24.7041015625, -22.59912109375, -20.494140625, -18.38916015625, -16.2841796875, -14.17919921875, -12.07421875, -9.96923828125, -7.8642578125, -5.75927734375, -3.654296875, -1.54931640625, 0.5556640625, 2.66064453125, 4.765625, 6.87060546875, 8.9755859375, 11.08056640625, 13.185546875, 15.29052734375, 17.3955078125, 19.50048828125, 21.60546875, 23.71044921875, 25.8154296875, 27.92041015625, 30.025390625, 32.13037109375, 34.2353515625, 36.34033203125, 38.4453125, 40.55029296875, 42.6552734375, 44.76025390625, 46.865234375, 48.97021484375, 51.0751953125, 53.18017578125, 55.28515625, 57.39013671875, 59.4951171875, 61.60009765625, 63.705078125, 65.81005859375, 67.9150390625, 70.02001953125, 72.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 26.0, 204.0, 473.0, 267.0, 38.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.7817611694336, -80.40135955810547, -74.02095794677734, -67.64056396484375, -61.26015853881836, -54.879756927490234, -48.499359130859375, -42.11895751953125, -35.738555908203125, -29.358154296875, -22.977754592895508, -16.597354888916016, -10.21695327758789, -3.8365516662597656, 2.5438461303710938, 8.924247741699219, 15.304649353027344, 21.68505096435547, 28.06545066833496, 34.44585037231445, 40.82625198364258, 47.2066535949707, 53.58705139160156, 59.96745300292969, 66.34785461425781, 72.72825622558594, 79.10865783691406, 85.48905944824219, 91.86946105957031, 98.24986267089844, 104.63025665283203, 111.01065826416016, 117.39105224609375, 123.77145385742188, 130.15185546875, 136.53225708007812, 142.91265869140625, 149.29306030273438, 155.6734619140625, 162.05386352539062, 168.43426513671875, 174.81466674804688, 181.195068359375, 187.57546997070312, 193.95587158203125, 200.33627319335938, 206.7166748046875, 213.09707641601562, 219.4774627685547, 225.8578643798828, 232.23826599121094, 238.61866760253906, 244.9990692138672, 251.3794708251953, 257.7598571777344, 264.1402587890625, 270.5206604003906, 276.90106201171875, 283.2814636230469, 289.661865234375, 296.0422668457031, 302.42266845703125, 308.8030700683594, 315.1834716796875, 321.5638732910156]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 6.0, 12.0, 13.0, 17.0, 20.0, 17.0, 13.0, 29.0, 24.0, 23.0, 29.0, 35.0, 33.0, 29.0, 40.0, 39.0, 39.0, 28.0, 40.0, 41.0, 37.0, 32.0, 46.0, 41.0, 30.0, 32.0, 27.0, 30.0, 12.0, 36.0, 25.0, 22.0, 16.0, 5.0, 12.0, 11.0, 6.0, 7.0, 8.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.13287353515625, -38.885887145996094, -37.6389045715332, -36.39191818237305, -35.144935607910156, -33.89794921875, -32.650962829589844, -31.40397834777832, -30.156993865966797, -28.910009384155273, -27.66302490234375, -26.416038513183594, -25.16905403137207, -23.922069549560547, -22.67508316040039, -21.428098678588867, -20.181114196777344, -18.93412971496582, -17.687145233154297, -16.44015884399414, -15.193174362182617, -13.946189880371094, -12.699204444885254, -11.452219009399414, -10.20523452758789, -8.958250045776367, -7.711264610290527, -6.464279651641846, -5.217294692993164, -3.9703097343444824, -2.723324775695801, -1.476339340209961, -0.2293548583984375, 1.0176301002502441, 2.264615058898926, 3.5116000175476074, 4.758584976196289, 6.005569934844971, 7.252554893493652, 8.499540328979492, 9.746524810791016, 10.993509292602539, 12.240494728088379, 13.487480163574219, 14.734464645385742, 15.981449127197266, 17.228435516357422, 18.475419998168945, 19.72240447998047, 20.969388961791992, 22.216373443603516, 23.463359832763672, 24.710344314575195, 25.95732879638672, 27.204315185546875, 28.4512996673584, 29.698284149169922, 30.945268630981445, 32.19225311279297, 33.439239501953125, 34.68622589111328, 35.93320846557617, 37.18019485473633, 38.42717742919922, 39.674163818359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 4.0, 11.0, 15.0, 13.0, 24.0, 21.0, 32.0, 19.0, 33.0, 26.0, 44.0, 29.0, 41.0, 48.0, 41.0, 41.0, 32.0, 43.0, 43.0, 39.0, 36.0, 33.0, 42.0, 30.0, 30.0, 47.0, 33.0, 25.0, 13.0, 15.0, 14.0, 13.0, 12.0, 7.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.6307373046875, -6.417724609375, -6.2047119140625, -5.99169921875, -5.7786865234375, -5.565673828125, -5.3526611328125, -5.1396484375, -4.9266357421875, -4.713623046875, -4.5006103515625, -4.28759765625, -4.0745849609375, -3.861572265625, -3.6485595703125, -3.435546875, -3.2225341796875, -3.009521484375, -2.7965087890625, -2.58349609375, -2.3704833984375, -2.157470703125, -1.9444580078125, -1.7314453125, -1.5184326171875, -1.305419921875, -1.0924072265625, -0.87939453125, -0.6663818359375, -0.453369140625, -0.2403564453125, -0.02734375, 0.1856689453125, 0.398681640625, 0.6116943359375, 0.82470703125, 1.0377197265625, 1.250732421875, 1.4637451171875, 1.6767578125, 1.8897705078125, 2.102783203125, 2.3157958984375, 2.52880859375, 2.7418212890625, 2.954833984375, 3.1678466796875, 3.380859375, 3.5938720703125, 3.806884765625, 4.0198974609375, 4.23291015625, 4.4459228515625, 4.658935546875, 4.8719482421875, 5.0849609375, 5.2979736328125, 5.510986328125, 5.7239990234375, 5.93701171875, 6.1500244140625, 6.363037109375, 6.5760498046875, 6.7890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 15.0, 11.0, 26.0, 34.0, 45.0, 93.0, 132.0, 163.0, 278.0, 359.0, 503.0, 746.0, 1191.0, 1588.0, 2343.0, 3371.0, 5073.0, 7756.0, 11658.0, 17886.0, 27850.0, 43930.0, 69396.0, 114518.0, 196334.0, 210764.0, 124608.0, 74774.0, 46853.0, 29598.0, 19131.0, 12575.0, 8177.0, 5334.0, 3716.0, 2416.0, 1658.0, 1124.0, 725.0, 549.0, 382.0, 265.0, 198.0, 132.0, 89.0, 63.0, 43.0, 32.0, 16.0, 6.0, 8.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.95849609375, -0.9286117553710938, -0.8987274169921875, -0.8688430786132812, -0.838958740234375, -0.8090744018554688, -0.7791900634765625, -0.7493057250976562, -0.71942138671875, -0.6895370483398438, -0.6596527099609375, -0.6297683715820312, -0.599884033203125, -0.5699996948242188, -0.5401153564453125, -0.5102310180664062, -0.4803466796875, -0.45046234130859375, -0.4205780029296875, -0.39069366455078125, -0.360809326171875, -0.33092498779296875, -0.3010406494140625, -0.27115631103515625, -0.24127197265625, -0.21138763427734375, -0.1815032958984375, -0.15161895751953125, -0.121734619140625, -0.09185028076171875, -0.0619659423828125, -0.03208160400390625, -0.002197265625, 0.02768707275390625, 0.0575714111328125, 0.08745574951171875, 0.117340087890625, 0.14722442626953125, 0.1771087646484375, 0.20699310302734375, 0.23687744140625, 0.26676177978515625, 0.2966461181640625, 0.32653045654296875, 0.356414794921875, 0.38629913330078125, 0.4161834716796875, 0.44606781005859375, 0.4759521484375, 0.5058364868164062, 0.5357208251953125, 0.5656051635742188, 0.595489501953125, 0.6253738403320312, 0.6552581787109375, 0.6851425170898438, 0.71502685546875, 0.7449111938476562, 0.7747955322265625, 0.8046798706054688, 0.834564208984375, 0.8644485473632812, 0.8943328857421875, 0.9242172241210938, 0.9541015625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 11.0, 7.0, 11.0, 12.0, 12.0, 17.0, 20.0, 18.0, 23.0, 32.0, 35.0, 36.0, 36.0, 33.0, 41.0, 35.0, 61.0, 35.0, 1077.0, 41.0, 42.0, 47.0, 40.0, 27.0, 50.0, 26.0, 26.0, 25.0, 25.0, 19.0, 17.0, 11.0, 14.0, 8.0, 13.0, 6.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.41015625, -4.27276611328125, -4.1353759765625, -3.99798583984375, -3.860595703125, -3.72320556640625, -3.5858154296875, -3.44842529296875, -3.31103515625, -3.17364501953125, -3.0362548828125, -2.89886474609375, -2.761474609375, -2.62408447265625, -2.4866943359375, -2.34930419921875, -2.2119140625, -2.07452392578125, -1.9371337890625, -1.79974365234375, -1.662353515625, -1.52496337890625, -1.3875732421875, -1.25018310546875, -1.11279296875, -0.97540283203125, -0.8380126953125, -0.70062255859375, -0.563232421875, -0.42584228515625, -0.2884521484375, -0.15106201171875, -0.013671875, 0.12371826171875, 0.2611083984375, 0.39849853515625, 0.535888671875, 0.67327880859375, 0.8106689453125, 0.94805908203125, 1.08544921875, 1.22283935546875, 1.3602294921875, 1.49761962890625, 1.635009765625, 1.77239990234375, 1.9097900390625, 2.04718017578125, 2.1845703125, 2.32196044921875, 2.4593505859375, 2.59674072265625, 2.734130859375, 2.87152099609375, 3.0089111328125, 3.14630126953125, 3.28369140625, 3.42108154296875, 3.5584716796875, 3.69586181640625, 3.833251953125, 3.97064208984375, 4.1080322265625, 4.24542236328125, 4.3828125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 15.0, 20.0, 26.0, 47.0, 78.0, 120.0, 142.0, 252.0, 351.0, 507.0, 855.0, 1294.0, 2107.0, 3119.0, 4958.0, 7604.0, 12587.0, 20164.0, 34104.0, 58667.0, 107009.0, 209666.0, 1317679.0, 135846.0, 73397.0, 41919.0, 24468.0, 14898.0, 9211.0, 5696.0, 3616.0, 2314.0, 1574.0, 1021.0, 612.0, 396.0, 254.0, 174.0, 135.0, 68.0, 52.0, 44.0, 19.0, 19.0, 8.0, 8.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.016143798828125, -0.98248291015625, -0.948822021484375, -0.9151611328125, -0.881500244140625, -0.84783935546875, -0.814178466796875, -0.780517578125, -0.746856689453125, -0.71319580078125, -0.679534912109375, -0.6458740234375, -0.612213134765625, -0.57855224609375, -0.544891357421875, -0.51123046875, -0.477569580078125, -0.44390869140625, -0.410247802734375, -0.3765869140625, -0.342926025390625, -0.30926513671875, -0.275604248046875, -0.241943359375, -0.208282470703125, -0.17462158203125, -0.140960693359375, -0.1072998046875, -0.073638916015625, -0.03997802734375, -0.006317138671875, 0.02734375, 0.061004638671875, 0.09466552734375, 0.128326416015625, 0.1619873046875, 0.195648193359375, 0.22930908203125, 0.262969970703125, 0.296630859375, 0.330291748046875, 0.36395263671875, 0.397613525390625, 0.4312744140625, 0.464935302734375, 0.49859619140625, 0.532257080078125, 0.56591796875, 0.599578857421875, 0.63323974609375, 0.666900634765625, 0.7005615234375, 0.734222412109375, 0.76788330078125, 0.801544189453125, 0.835205078125, 0.868865966796875, 0.90252685546875, 0.936187744140625, 0.9698486328125, 1.003509521484375, 1.03717041015625, 1.070831298828125, 1.1044921875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 5.0, 15.0, 11.0, 16.0, 17.0, 21.0, 27.0, 26.0, 41.0, 32.0, 34.0, 49.0, 90.0, 70.0, 77.0, 54.0, 67.0, 55.0, 51.0, 49.0, 27.0, 25.0, 21.0, 16.0, 12.0, 10.0, 14.0, 6.0, 12.0, 7.0, 6.0, 3.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006728172302246094, -0.0006508305668830872, -0.0006288439035415649, -0.0006068572402000427, -0.0005848705768585205, -0.0005628839135169983, -0.0005408972501754761, -0.0005189105868339539, -0.0004969239234924316, -0.0004749372601509094, -0.0004529505968093872, -0.000430963933467865, -0.0004089772701263428, -0.00038699060678482056, -0.00036500394344329834, -0.0003430172801017761, -0.0003210306167602539, -0.0002990439534187317, -0.00027705729007720947, -0.00025507062673568726, -0.00023308396339416504, -0.00021109730005264282, -0.0001891106367111206, -0.0001671239733695984, -0.00014513731002807617, -0.00012315064668655396, -0.00010116398334503174, -7.917732000350952e-05, -5.7190656661987305e-05, -3.520399332046509e-05, -1.3217329978942871e-05, 8.769333362579346e-06, 3.075599670410156e-05, 5.274266004562378e-05, 7.4729323387146e-05, 9.671598672866821e-05, 0.00011870265007019043, 0.00014068931341171265, 0.00016267597675323486, 0.00018466264009475708, 0.0002066493034362793, 0.00022863596677780151, 0.00025062263011932373, 0.00027260929346084595, 0.00029459595680236816, 0.0003165826201438904, 0.0003385692834854126, 0.0003605559468269348, 0.00038254261016845703, 0.00040452927350997925, 0.00042651593685150146, 0.0004485026001930237, 0.0004704892635345459, 0.0004924759268760681, 0.0005144625902175903, 0.0005364492535591125, 0.0005584359169006348, 0.000580422580242157, 0.0006024092435836792, 0.0006243959069252014, 0.0006463825702667236, 0.0006683692336082458, 0.0006903558969497681, 0.0007123425602912903, 0.0007343292236328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 1.0, 8.0, 7.0, 6.0, 9.0, 10.0, 15.0, 10.0, 23.0, 28.0, 31.0, 40.0, 60.0, 89.0, 120.0, 252.0, 799.0, 9936.0, 1033213.0, 2591.0, 610.0, 230.0, 106.0, 80.0, 64.0, 34.0, 26.0, 38.0, 15.0, 22.0, 12.0, 15.0, 13.0, 7.0, 10.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016326904296875, -0.015822649002075195, -0.01531839370727539, -0.014814138412475586, -0.014309883117675781, -0.013805627822875977, -0.013301372528076172, -0.012797117233276367, -0.012292861938476562, -0.011788606643676758, -0.011284351348876953, -0.010780096054077148, -0.010275840759277344, -0.009771585464477539, -0.009267330169677734, -0.00876307487487793, -0.008258819580078125, -0.00775456428527832, -0.007250308990478516, -0.006746053695678711, -0.006241798400878906, -0.0057375431060791016, -0.005233287811279297, -0.004729032516479492, -0.0042247772216796875, -0.003720521926879883, -0.003216266632080078, -0.0027120113372802734, -0.0022077560424804688, -0.001703500747680664, -0.0011992454528808594, -0.0006949901580810547, -0.00019073486328125, 0.0003135204315185547, 0.0008177757263183594, 0.001322031021118164, 0.0018262863159179688, 0.0023305416107177734, 0.002834796905517578, 0.003339052200317383, 0.0038433074951171875, 0.004347562789916992, 0.004851818084716797, 0.0053560733795166016, 0.005860328674316406, 0.006364583969116211, 0.006868839263916016, 0.00737309455871582, 0.007877349853515625, 0.00838160514831543, 0.008885860443115234, 0.009390115737915039, 0.009894371032714844, 0.010398626327514648, 0.010902881622314453, 0.011407136917114258, 0.011911392211914062, 0.012415647506713867, 0.012919902801513672, 0.013424158096313477, 0.013928413391113281, 0.014432668685913086, 0.01493692398071289, 0.015441179275512695, 0.0159454345703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 14.0, 81.0, 199.0, 341.0, 241.0, 99.0, 26.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013728872872889042, -0.0013427898520603776, -0.001312692416831851, -0.0012825950980186462, -0.0012524976627901196, -0.001222400227561593, -0.0011923027923330665, -0.0011622053571045399, -0.0011321079218760133, -0.0011020104866474867, -0.00107191305141896, -0.0010418156161904335, -0.0010117182973772287, -0.0009816208621487021, -0.0009515234269201756, -0.000921425991691649, -0.0008913286728784442, -0.0008612312376499176, -0.0008311338606290519, -0.0008010364254005253, -0.0007709389901719987, -0.0007408416131511331, -0.0007107441779226065, -0.0006806467426940799, -0.0006505493074655533, -0.0006204518722370267, -0.000590354495216161, -0.0005602570599876344, -0.0005301596247591078, -0.0005000622477382421, -0.00046996481250971556, -0.0004398674063850194, -0.0004097700002603233, -0.00037967259413562715, -0.00034957515890710056, -0.0003194777527824044, -0.0002893803466577083, -0.00025928294053301215, -0.00022918550530448556, -0.00019908809917978942, -0.00016899067850317806, -0.0001388932578265667, -0.00010879585170187056, -7.86984310252592e-05, -4.860101762460545e-05, -1.8503604223951697e-05, 1.1593816452659667e-05, 4.16912225773558e-05, 7.178864325396717e-05, 0.00010188605665462092, 0.00013198347005527467, 0.00016208089073188603, 0.00019217829685658216, 0.00022227571753319353, 0.0002523731382098049, 0.00028247054433450103, 0.0003125679795630276, 0.00034266538568772376, 0.00037276282091625035, 0.0004028602270409465, 0.0004329576331656426, 0.00046305503929033875, 0.0004931524745188653, 0.000523249851539731, 0.0005533472867682576]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 6.0, 4.0, 5.0, 2.0, 3.0, 9.0, 13.0, 11.0, 11.0, 15.0, 18.0, 25.0, 26.0, 18.0, 30.0, 25.0, 26.0, 29.0, 37.0, 27.0, 44.0, 38.0, 41.0, 56.0, 40.0, 39.0, 32.0, 37.0, 25.0, 26.0, 16.0, 19.0, 34.0, 21.0, 28.0, 25.0, 21.0, 15.0, 15.0, 17.0, 11.0, 6.0, 17.0, 6.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003209710121154785, -0.0003109695389866829, -0.00030096806585788727, -0.00029096659272909164, -0.000280965119600296, -0.0002709636464715004, -0.0002609621733427048, -0.00025096070021390915, -0.00024095922708511353, -0.0002309577539563179, -0.00022095628082752228, -0.00021095480769872665, -0.00020095333456993103, -0.0001909518614411354, -0.00018095038831233978, -0.00017094891518354416, -0.00016094744205474854, -0.0001509459689259529, -0.0001409444957971573, -0.00013094302266836166, -0.00012094154953956604, -0.00011094007641077042, -0.00010093860328197479, -9.093713015317917e-05, -8.093565702438354e-05, -7.093418389558792e-05, -6.09327107667923e-05, -5.0931237637996674e-05, -4.092976450920105e-05, -3.0928291380405426e-05, -2.0926818251609802e-05, -1.0925345122814178e-05, -9.238719940185547e-07, 9.077601134777069e-06, 1.9079074263572693e-05, 2.9080547392368317e-05, 3.908202052116394e-05, 4.9083493649959564e-05, 5.908496677875519e-05, 6.908643990755081e-05, 7.908791303634644e-05, 8.908938616514206e-05, 9.909085929393768e-05, 0.00010909233242273331, 0.00011909380555152893, 0.00012909527868032455, 0.00013909675180912018, 0.0001490982249379158, 0.00015909969806671143, 0.00016910117119550705, 0.00017910264432430267, 0.0001891041174530983, 0.00019910559058189392, 0.00020910706371068954, 0.00021910853683948517, 0.0002291100099682808, 0.00023911148309707642, 0.00024911295622587204, 0.00025911442935466766, 0.0002691159024834633, 0.0002791173756122589, 0.00028911884874105453, 0.00029912032186985016, 0.0003091217949986458, 0.0003191232681274414]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 4.0, 11.0, 15.0, 13.0, 24.0, 22.0, 31.0, 19.0, 33.0, 26.0, 44.0, 29.0, 41.0, 48.0, 41.0, 41.0, 32.0, 43.0, 43.0, 39.0, 36.0, 33.0, 42.0, 30.0, 30.0, 47.0, 33.0, 25.0, 13.0, 15.0, 14.0, 13.0, 12.0, 7.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.6307373046875, -6.417724609375, -6.2047119140625, -5.99169921875, -5.7786865234375, -5.565673828125, -5.3526611328125, -5.1396484375, -4.9266357421875, -4.713623046875, -4.5006103515625, -4.28759765625, -4.0745849609375, -3.861572265625, -3.6485595703125, -3.435546875, -3.2225341796875, -3.009521484375, -2.7965087890625, -2.58349609375, -2.3704833984375, -2.157470703125, -1.9444580078125, -1.7314453125, -1.5184326171875, -1.305419921875, -1.0924072265625, -0.87939453125, -0.6663818359375, -0.453369140625, -0.2403564453125, -0.02734375, 0.1856689453125, 0.398681640625, 0.6116943359375, 0.82470703125, 1.0377197265625, 1.250732421875, 1.4637451171875, 1.6767578125, 1.8897705078125, 2.102783203125, 2.3157958984375, 2.52880859375, 2.7418212890625, 2.954833984375, 3.1678466796875, 3.380859375, 3.5938720703125, 3.806884765625, 4.0198974609375, 4.23291015625, 4.4459228515625, 4.658935546875, 4.8719482421875, 5.0849609375, 5.2979736328125, 5.510986328125, 5.7239990234375, 5.93701171875, 6.1500244140625, 6.363037109375, 6.5760498046875, 6.7890625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 14.0, 17.0, 32.0, 49.0, 73.0, 91.0, 131.0, 138.0, 227.0, 404.0, 658.0, 1118.0, 1902.0, 3429.0, 6830.0, 14724.0, 35121.0, 93736.0, 283319.0, 387929.0, 132503.0, 47770.0, 19549.0, 8787.0, 4395.0, 2235.0, 1255.0, 709.0, 444.0, 306.0, 195.0, 116.0, 101.0, 70.0, 40.0, 31.0, 25.0, 20.0, 18.0, 10.0, 3.0, 4.0, 5.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.12109375, -4.97119140625, -4.8212890625, -4.67138671875, -4.521484375, -4.37158203125, -4.2216796875, -4.07177734375, -3.921875, -3.77197265625, -3.6220703125, -3.47216796875, -3.322265625, -3.17236328125, -3.0224609375, -2.87255859375, -2.72265625, -2.57275390625, -2.4228515625, -2.27294921875, -2.123046875, -1.97314453125, -1.8232421875, -1.67333984375, -1.5234375, -1.37353515625, -1.2236328125, -1.07373046875, -0.923828125, -0.77392578125, -0.6240234375, -0.47412109375, -0.32421875, -0.17431640625, -0.0244140625, 0.12548828125, 0.275390625, 0.42529296875, 0.5751953125, 0.72509765625, 0.875, 1.02490234375, 1.1748046875, 1.32470703125, 1.474609375, 1.62451171875, 1.7744140625, 1.92431640625, 2.07421875, 2.22412109375, 2.3740234375, 2.52392578125, 2.673828125, 2.82373046875, 2.9736328125, 3.12353515625, 3.2734375, 3.42333984375, 3.5732421875, 3.72314453125, 3.873046875, 4.02294921875, 4.1728515625, 4.32275390625, 4.47265625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 4.0, 8.0, 14.0, 12.0, 10.0, 16.0, 18.0, 29.0, 21.0, 23.0, 23.0, 47.0, 35.0, 51.0, 45.0, 56.0, 93.0, 316.0, 1582.0, 123.0, 94.0, 57.0, 47.0, 38.0, 39.0, 33.0, 34.0, 32.0, 23.0, 15.0, 27.0, 10.0, 14.0, 8.0, 7.0, 7.0, 9.0, 6.0, 1.0, 1.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.484375, -21.80712890625, -21.1298828125, -20.45263671875, -19.775390625, -19.09814453125, -18.4208984375, -17.74365234375, -17.06640625, -16.38916015625, -15.7119140625, -15.03466796875, -14.357421875, -13.68017578125, -13.0029296875, -12.32568359375, -11.6484375, -10.97119140625, -10.2939453125, -9.61669921875, -8.939453125, -8.26220703125, -7.5849609375, -6.90771484375, -6.23046875, -5.55322265625, -4.8759765625, -4.19873046875, -3.521484375, -2.84423828125, -2.1669921875, -1.48974609375, -0.8125, -0.13525390625, 0.5419921875, 1.21923828125, 1.896484375, 2.57373046875, 3.2509765625, 3.92822265625, 4.60546875, 5.28271484375, 5.9599609375, 6.63720703125, 7.314453125, 7.99169921875, 8.6689453125, 9.34619140625, 10.0234375, 10.70068359375, 11.3779296875, 12.05517578125, 12.732421875, 13.40966796875, 14.0869140625, 14.76416015625, 15.44140625, 16.11865234375, 16.7958984375, 17.47314453125, 18.150390625, 18.82763671875, 19.5048828125, 20.18212890625, 20.859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 12.0, 13.0, 32.0, 54.0, 95.0, 182.0, 273.0, 495.0, 1754.0, 3133674.0, 7738.0, 613.0, 311.0, 187.0, 109.0, 59.0, 36.0, 21.0, 20.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.875, -137.41015625, -133.9453125, -130.48046875, -127.015625, -123.55078125, -120.0859375, -116.62109375, -113.15625, -109.69140625, -106.2265625, -102.76171875, -99.296875, -95.83203125, -92.3671875, -88.90234375, -85.4375, -81.97265625, -78.5078125, -75.04296875, -71.578125, -68.11328125, -64.6484375, -61.18359375, -57.71875, -54.25390625, -50.7890625, -47.32421875, -43.859375, -40.39453125, -36.9296875, -33.46484375, -30.0, -26.53515625, -23.0703125, -19.60546875, -16.140625, -12.67578125, -9.2109375, -5.74609375, -2.28125, 1.18359375, 4.6484375, 8.11328125, 11.578125, 15.04296875, 18.5078125, 21.97265625, 25.4375, 28.90234375, 32.3671875, 35.83203125, 39.296875, 42.76171875, 46.2265625, 49.69140625, 53.15625, 56.62109375, 60.0859375, 63.55078125, 67.015625, 70.48046875, 73.9453125, 77.41015625, 80.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [4.0, 937.0, 80.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.38177490234375, -7.355345726013184, 2.671083450317383, 12.697513580322266, 22.723941802978516, 32.750370025634766, 42.77680206298828, 52.80323028564453, 62.82965850830078, 72.85608673095703, 82.88251495361328, 92.90895080566406, 102.93537902832031, 112.96180725097656, 122.98823547363281, 133.01466369628906, 143.0410919189453, 153.06752014160156, 163.0939483642578, 173.12037658691406, 183.1468048095703, 193.17323303222656, 203.19967651367188, 213.22610473632812, 223.25253295898438, 233.27896118164062, 243.30538940429688, 253.33181762695312, 263.3582458496094, 273.3846740722656, 283.4111022949219, 293.4375305175781, 303.4639587402344, 313.4903869628906, 323.5168151855469, 333.5432434082031, 343.5696716308594, 353.5960998535156, 363.6225280761719, 373.6489562988281, 383.6753845214844, 393.7018127441406, 403.7282409667969, 413.7546691894531, 423.7810974121094, 433.8075256347656, 443.8339538574219, 453.8603820800781, 463.8868408203125, 473.91326904296875, 483.939697265625, 493.96612548828125, 503.9925537109375, 514.0189819335938, 524.04541015625, 534.0718383789062, 544.0982666015625, 554.1246948242188, 564.151123046875, 574.1775512695312, 584.2039794921875, 594.2304077148438, 604.2568359375, 614.2832641601562, 624.3096923828125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 10.0, 10.0, 8.0, 10.0, 14.0, 14.0, 14.0, 18.0, 20.0, 35.0, 25.0, 26.0, 30.0, 32.0, 29.0, 32.0, 45.0, 48.0, 43.0, 51.0, 43.0, 37.0, 45.0, 37.0, 35.0, 33.0, 32.0, 28.0, 31.0, 22.0, 23.0, 24.0, 12.0, 17.0, 10.0, 15.0, 14.0, 10.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.804561614990234, -57.924407958984375, -56.044254302978516, -54.164100646972656, -52.2839469909668, -50.40379333496094, -48.523643493652344, -46.64348602294922, -44.763336181640625, -42.883182525634766, -41.003028869628906, -39.12287521362305, -37.24272155761719, -35.36256790161133, -33.48241424560547, -31.602262496948242, -29.72210693359375, -27.84195327758789, -25.96179962158203, -24.081645965576172, -22.201492309570312, -20.321338653564453, -18.441186904907227, -16.561033248901367, -14.680879592895508, -12.800725936889648, -10.920572280883789, -9.040419578552246, -7.160265922546387, -5.280112266540527, -3.3999595642089844, -1.519805908203125, 0.3603477478027344, 2.2405011653900146, 4.120654582977295, 6.000807762145996, 7.8809614181518555, 9.761115074157715, 11.641267776489258, 13.521421432495117, 15.401575088500977, 17.281728744506836, 19.161882400512695, 21.042034149169922, 22.92218780517578, 24.80234146118164, 26.6824951171875, 28.56264877319336, 30.44280242919922, 32.32295608520508, 34.20310974121094, 36.0832633972168, 37.963417053222656, 39.843570709228516, 41.723724365234375, 43.60387420654297, 45.484031677246094, 47.36418533325195, 49.24433898925781, 51.12449264526367, 53.00464630126953, 54.88479995727539, 56.76495361328125, 58.645103454589844, 60.5252571105957]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 11.0, 6.0, 8.0, 16.0, 16.0, 17.0, 14.0, 21.0, 28.0, 30.0, 37.0, 42.0, 31.0, 43.0, 44.0, 41.0, 47.0, 42.0, 43.0, 37.0, 44.0, 33.0, 32.0, 33.0, 35.0, 33.0, 44.0, 36.0, 31.0, 16.0, 15.0, 8.0, 6.0, 16.0, 12.0, 6.0, 9.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12109375, -6.8931884765625, -6.665283203125, -6.4373779296875, -6.20947265625, -5.9815673828125, -5.753662109375, -5.5257568359375, -5.2978515625, -5.0699462890625, -4.842041015625, -4.6141357421875, -4.38623046875, -4.1583251953125, -3.930419921875, -3.7025146484375, -3.474609375, -3.2467041015625, -3.018798828125, -2.7908935546875, -2.56298828125, -2.3350830078125, -2.107177734375, -1.8792724609375, -1.6513671875, -1.4234619140625, -1.195556640625, -0.9676513671875, -0.73974609375, -0.5118408203125, -0.283935546875, -0.0560302734375, 0.171875, 0.3997802734375, 0.627685546875, 0.8555908203125, 1.08349609375, 1.3114013671875, 1.539306640625, 1.7672119140625, 1.9951171875, 2.2230224609375, 2.450927734375, 2.6788330078125, 2.90673828125, 3.1346435546875, 3.362548828125, 3.5904541015625, 3.818359375, 4.0462646484375, 4.274169921875, 4.5020751953125, 4.72998046875, 4.9578857421875, 5.185791015625, 5.4136962890625, 5.6416015625, 5.8695068359375, 6.097412109375, 6.3253173828125, 6.55322265625, 6.7811279296875, 7.009033203125, 7.2369384765625, 7.46484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 7.0, 5.0, 6.0, 9.0, 13.0, 12.0, 12.0, 10.0, 19.0, 27.0, 21.0, 31.0, 43.0, 49.0, 87.0, 116.0, 279.0, 796.0, 3136.0, 34569.0, 1201812.0, 2781809.0, 161368.0, 7689.0, 1352.0, 414.0, 176.0, 102.0, 76.0, 48.0, 33.0, 29.0, 24.0, 24.0, 18.0, 13.0, 9.0, 10.0, 6.0, 9.0, 6.0, 3.0, 7.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.540283203125, -16.93994140625, -16.339599609375, -15.7392578125, -15.138916015625, -14.53857421875, -13.938232421875, -13.337890625, -12.737548828125, -12.13720703125, -11.536865234375, -10.9365234375, -10.336181640625, -9.73583984375, -9.135498046875, -8.53515625, -7.934814453125, -7.33447265625, -6.734130859375, -6.1337890625, -5.533447265625, -4.93310546875, -4.332763671875, -3.732421875, -3.132080078125, -2.53173828125, -1.931396484375, -1.3310546875, -0.730712890625, -0.13037109375, 0.469970703125, 1.0703125, 1.670654296875, 2.27099609375, 2.871337890625, 3.4716796875, 4.072021484375, 4.67236328125, 5.272705078125, 5.873046875, 6.473388671875, 7.07373046875, 7.674072265625, 8.2744140625, 8.874755859375, 9.47509765625, 10.075439453125, 10.67578125, 11.276123046875, 11.87646484375, 12.476806640625, 13.0771484375, 13.677490234375, 14.27783203125, 14.878173828125, 15.478515625, 16.078857421875, 16.67919921875, 17.279541015625, 17.8798828125, 18.480224609375, 19.08056640625, 19.680908203125, 20.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 13.0, 6.0, 3.0, 9.0, 17.0, 12.0, 28.0, 24.0, 33.0, 39.0, 34.0, 63.0, 73.0, 90.0, 108.0, 140.0, 184.0, 232.0, 269.0, 372.0, 364.0, 344.0, 286.0, 280.0, 238.0, 165.0, 125.0, 112.0, 90.0, 63.0, 65.0, 41.0, 32.0, 29.0, 22.0, 14.0, 14.0, 5.0, 9.0, 6.0, 6.0, 7.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5743408203125, -8.265869140625, -7.9573974609375, -7.64892578125, -7.3404541015625, -7.031982421875, -6.7235107421875, -6.4150390625, -6.1065673828125, -5.798095703125, -5.4896240234375, -5.18115234375, -4.8726806640625, -4.564208984375, -4.2557373046875, -3.947265625, -3.6387939453125, -3.330322265625, -3.0218505859375, -2.71337890625, -2.4049072265625, -2.096435546875, -1.7879638671875, -1.4794921875, -1.1710205078125, -0.862548828125, -0.5540771484375, -0.24560546875, 0.0628662109375, 0.371337890625, 0.6798095703125, 0.98828125, 1.2967529296875, 1.605224609375, 1.9136962890625, 2.22216796875, 2.5306396484375, 2.839111328125, 3.1475830078125, 3.4560546875, 3.7645263671875, 4.072998046875, 4.3814697265625, 4.68994140625, 4.9984130859375, 5.306884765625, 5.6153564453125, 5.923828125, 6.2322998046875, 6.540771484375, 6.8492431640625, 7.15771484375, 7.4661865234375, 7.774658203125, 8.0831298828125, 8.3916015625, 8.7000732421875, 9.008544921875, 9.3170166015625, 9.62548828125, 9.9339599609375, 10.242431640625, 10.5509033203125, 10.859375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 20.0, 25.0, 28.0, 38.0, 38.0, 78.0, 108.0, 117.0, 160.0, 195.0, 344.0, 641.0, 3144.0, 4060837.0, 126119.0, 894.0, 441.0, 254.0, 188.0, 148.0, 114.0, 73.0, 58.0, 46.0, 40.0, 29.0, 19.0, 20.0, 10.0, 7.0, 3.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.625, -81.21875, -78.8125, -76.40625, -74.0, -71.59375, -69.1875, -66.78125, -64.375, -61.96875, -59.5625, -57.15625, -54.75, -52.34375, -49.9375, -47.53125, -45.125, -42.71875, -40.3125, -37.90625, -35.5, -33.09375, -30.6875, -28.28125, -25.875, -23.46875, -21.0625, -18.65625, -16.25, -13.84375, -11.4375, -9.03125, -6.625, -4.21875, -1.8125, 0.59375, 3.0, 5.40625, 7.8125, 10.21875, 12.625, 15.03125, 17.4375, 19.84375, 22.25, 24.65625, 27.0625, 29.46875, 31.875, 34.28125, 36.6875, 39.09375, 41.5, 43.90625, 46.3125, 48.71875, 51.125, 53.53125, 55.9375, 58.34375, 60.75, 63.15625, 65.5625, 67.96875, 70.375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 13.0, 17.0, 31.0, 31.0, 47.0, 59.0, 90.0, 85.0, 104.0, 91.0, 87.0, 76.0, 78.0, 66.0, 36.0, 31.0, 21.0, 10.0, 12.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.27195739746094, -32.10111999511719, -30.930282592773438, -29.759445190429688, -28.588607788085938, -27.417770385742188, -26.24693489074707, -25.07609748840332, -23.90526008605957, -22.73442268371582, -21.56358528137207, -20.39274787902832, -19.221912384033203, -18.051074981689453, -16.880237579345703, -15.709400177001953, -14.538562774658203, -13.367725372314453, -12.196887969970703, -11.02605152130127, -9.85521411895752, -8.68437671661377, -7.513539791107178, -6.342702865600586, -5.171865463256836, -4.001028060913086, -2.830191135406494, -1.6593539714813232, -0.48851680755615234, 0.6823205947875977, 1.8531575202941895, 3.0239944458007812, 4.194828033447266, 5.365665435791016, 6.536502361297607, 7.707339286804199, 8.87817668914795, 10.0490140914917, 11.219850540161133, 12.390687942504883, 13.561525344848633, 14.732362747192383, 15.903200149536133, 17.074037551879883, 18.244873046875, 19.41571044921875, 20.5865478515625, 21.75738525390625, 22.92822265625, 24.09906005859375, 25.2698974609375, 26.44073486328125, 27.611572265625, 28.78240966796875, 29.953245162963867, 31.124082565307617, 32.294921875, 33.46575927734375, 34.6365966796875, 35.80743408203125, 36.978271484375, 38.14910888671875, 39.3199462890625, 40.49078369140625, 41.661617279052734]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 10.0, 5.0, 9.0, 6.0, 11.0, 14.0, 12.0, 17.0, 17.0, 27.0, 25.0, 15.0, 29.0, 28.0, 38.0, 33.0, 31.0, 37.0, 49.0, 36.0, 33.0, 39.0, 47.0, 36.0, 47.0, 37.0, 29.0, 35.0, 24.0, 32.0, 28.0, 28.0, 25.0, 21.0, 11.0, 14.0, 16.0, 14.0, 7.0, 5.0, 5.0, 5.0, 6.0, 7.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.13691711425781, -37.85509490966797, -36.57327651977539, -35.29145431518555, -34.0096321105957, -32.72780990600586, -31.44599151611328, -30.164169311523438, -28.882347106933594, -27.600526809692383, -26.31870460510254, -25.036884307861328, -23.755062103271484, -22.473241806030273, -21.191421508789062, -19.90959930419922, -18.627779006958008, -17.345958709716797, -16.064136505126953, -14.782316207885742, -13.500494003295898, -12.218673706054688, -10.93685245513916, -9.655031204223633, -8.373209953308105, -7.091388702392578, -5.809567451477051, -4.527746677398682, -3.2459254264831543, -1.964104175567627, -0.6822834014892578, 0.5995378494262695, 1.8813591003417969, 3.163180351257324, 4.445001602172852, 5.726822376251221, 7.008643627166748, 8.290464401245117, 9.572285652160645, 10.854106903076172, 12.1359281539917, 13.417749404907227, 14.699570655822754, 15.981391906738281, 17.263212203979492, 18.545034408569336, 19.826854705810547, 21.10867691040039, 22.3904972076416, 23.672317504882812, 24.954139709472656, 26.235960006713867, 27.51778221130371, 28.799602508544922, 30.081424713134766, 31.363245010375977, 32.64506530761719, 33.92688751220703, 35.20870590209961, 36.49052810668945, 37.7723503112793, 39.05417251586914, 40.33599090576172, 41.61781311035156, 42.899635314941406]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 0.0, 8.0, 10.0, 7.0, 6.0, 10.0, 9.0, 14.0, 25.0, 29.0, 21.0, 39.0, 35.0, 29.0, 33.0, 45.0, 53.0, 45.0, 39.0, 46.0, 47.0, 32.0, 43.0, 38.0, 36.0, 36.0, 48.0, 27.0, 38.0, 21.0, 27.0, 13.0, 20.0, 15.0, 16.0, 8.0, 13.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9609375, -6.73858642578125, -6.5162353515625, -6.29388427734375, -6.071533203125, -5.84918212890625, -5.6268310546875, -5.40447998046875, -5.18212890625, -4.95977783203125, -4.7374267578125, -4.51507568359375, -4.292724609375, -4.07037353515625, -3.8480224609375, -3.62567138671875, -3.4033203125, -3.18096923828125, -2.9586181640625, -2.73626708984375, -2.513916015625, -2.29156494140625, -2.0692138671875, -1.84686279296875, -1.62451171875, -1.40216064453125, -1.1798095703125, -0.95745849609375, -0.735107421875, -0.51275634765625, -0.2904052734375, -0.06805419921875, 0.154296875, 0.37664794921875, 0.5989990234375, 0.82135009765625, 1.043701171875, 1.26605224609375, 1.4884033203125, 1.71075439453125, 1.93310546875, 2.15545654296875, 2.3778076171875, 2.60015869140625, 2.822509765625, 3.04486083984375, 3.2672119140625, 3.48956298828125, 3.7119140625, 3.93426513671875, 4.1566162109375, 4.37896728515625, 4.601318359375, 4.82366943359375, 5.0460205078125, 5.26837158203125, 5.49072265625, 5.71307373046875, 5.9354248046875, 6.15777587890625, 6.380126953125, 6.60247802734375, 6.8248291015625, 7.04718017578125, 7.26953125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 12.0, 10.0, 22.0, 42.0, 36.0, 74.0, 109.0, 172.0, 292.0, 463.0, 720.0, 1156.0, 1990.0, 3265.0, 5284.0, 8844.0, 15321.0, 26684.0, 47120.0, 85639.0, 162992.0, 283631.0, 185092.0, 95783.0, 52748.0, 29515.0, 16812.0, 9780.0, 5862.0, 3493.0, 2084.0, 1284.0, 825.0, 482.0, 336.0, 188.0, 129.0, 91.0, 56.0, 37.0, 25.0, 15.0, 12.0, 18.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3193359375, -1.280059814453125, -1.24078369140625, -1.201507568359375, -1.1622314453125, -1.122955322265625, -1.08367919921875, -1.044403076171875, -1.005126953125, -0.965850830078125, -0.92657470703125, -0.887298583984375, -0.8480224609375, -0.808746337890625, -0.76947021484375, -0.730194091796875, -0.69091796875, -0.651641845703125, -0.61236572265625, -0.573089599609375, -0.5338134765625, -0.494537353515625, -0.45526123046875, -0.415985107421875, -0.376708984375, -0.337432861328125, -0.29815673828125, -0.258880615234375, -0.2196044921875, -0.180328369140625, -0.14105224609375, -0.101776123046875, -0.0625, -0.023223876953125, 0.01605224609375, 0.055328369140625, 0.0946044921875, 0.133880615234375, 0.17315673828125, 0.212432861328125, 0.251708984375, 0.290985107421875, 0.33026123046875, 0.369537353515625, 0.4088134765625, 0.448089599609375, 0.48736572265625, 0.526641845703125, 0.56591796875, 0.605194091796875, 0.64447021484375, 0.683746337890625, 0.7230224609375, 0.762298583984375, 0.80157470703125, 0.840850830078125, 0.880126953125, 0.919403076171875, 0.95867919921875, 0.997955322265625, 1.0372314453125, 1.076507568359375, 1.11578369140625, 1.155059814453125, 1.1943359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 5.0, 7.0, 12.0, 7.0, 14.0, 13.0, 14.0, 20.0, 19.0, 24.0, 24.0, 29.0, 30.0, 31.0, 28.0, 36.0, 29.0, 25.0, 50.0, 33.0, 1061.0, 56.0, 51.0, 39.0, 41.0, 42.0, 29.0, 27.0, 37.0, 17.0, 24.0, 19.0, 21.0, 19.0, 9.0, 18.0, 16.0, 9.0, 7.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.67169189453125, -3.5465087890625, -3.42132568359375, -3.296142578125, -3.17095947265625, -3.0457763671875, -2.92059326171875, -2.79541015625, -2.67022705078125, -2.5450439453125, -2.41986083984375, -2.294677734375, -2.16949462890625, -2.0443115234375, -1.91912841796875, -1.7939453125, -1.66876220703125, -1.5435791015625, -1.41839599609375, -1.293212890625, -1.16802978515625, -1.0428466796875, -0.91766357421875, -0.79248046875, -0.66729736328125, -0.5421142578125, -0.41693115234375, -0.291748046875, -0.16656494140625, -0.0413818359375, 0.08380126953125, 0.208984375, 0.33416748046875, 0.4593505859375, 0.58453369140625, 0.709716796875, 0.83489990234375, 0.9600830078125, 1.08526611328125, 1.21044921875, 1.33563232421875, 1.4608154296875, 1.58599853515625, 1.711181640625, 1.83636474609375, 1.9615478515625, 2.08673095703125, 2.2119140625, 2.33709716796875, 2.4622802734375, 2.58746337890625, 2.712646484375, 2.83782958984375, 2.9630126953125, 3.08819580078125, 3.21337890625, 3.33856201171875, 3.4637451171875, 3.58892822265625, 3.714111328125, 3.83929443359375, 3.9644775390625, 4.08966064453125, 4.21484375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 12.0, 4.0, 9.0, 21.0, 28.0, 38.0, 56.0, 98.0, 139.0, 210.0, 315.0, 411.0, 636.0, 858.0, 1263.0, 1948.0, 2850.0, 4228.0, 6351.0, 9725.0, 14716.0, 22595.0, 35422.0, 57620.0, 95504.0, 173869.0, 1296970.0, 146503.0, 83497.0, 50449.0, 31439.0, 19929.0, 13267.0, 8578.0, 5797.0, 3756.0, 2492.0, 1715.0, 1206.0, 847.0, 562.0, 373.0, 262.0, 172.0, 136.0, 79.0, 65.0, 37.0, 20.0, 23.0, 18.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.9287109375, -0.9000167846679688, -0.8713226318359375, -0.8426284790039062, -0.813934326171875, -0.7852401733398438, -0.7565460205078125, -0.7278518676757812, -0.69915771484375, -0.6704635620117188, -0.6417694091796875, -0.6130752563476562, -0.584381103515625, -0.5556869506835938, -0.5269927978515625, -0.49829864501953125, -0.4696044921875, -0.44091033935546875, -0.4122161865234375, -0.38352203369140625, -0.354827880859375, -0.32613372802734375, -0.2974395751953125, -0.26874542236328125, -0.24005126953125, -0.21135711669921875, -0.1826629638671875, -0.15396881103515625, -0.125274658203125, -0.09658050537109375, -0.0678863525390625, -0.03919219970703125, -0.010498046875, 0.01819610595703125, 0.0468902587890625, 0.07558441162109375, 0.104278564453125, 0.13297271728515625, 0.1616668701171875, 0.19036102294921875, 0.21905517578125, 0.24774932861328125, 0.2764434814453125, 0.30513763427734375, 0.333831787109375, 0.36252593994140625, 0.3912200927734375, 0.41991424560546875, 0.4486083984375, 0.47730255126953125, 0.5059967041015625, 0.5346908569335938, 0.563385009765625, 0.5920791625976562, 0.6207733154296875, 0.6494674682617188, 0.67816162109375, 0.7068557739257812, 0.7355499267578125, 0.7642440795898438, 0.792938232421875, 0.8216323852539062, 0.8503265380859375, 0.8790206909179688, 0.90771484375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 12.0, 15.0, 20.0, 16.0, 31.0, 41.0, 39.0, 56.0, 67.0, 77.0, 75.0, 78.0, 77.0, 61.0, 56.0, 44.0, 44.0, 25.0, 30.0, 20.0, 19.0, 16.0, 6.0, 10.0, 10.0, 9.0, 6.0, 1.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0007271766662597656, -0.0007058605551719666, -0.0006845444440841675, -0.0006632283329963684, -0.0006419122219085693, -0.0006205961108207703, -0.0005992799997329712, -0.0005779638886451721, -0.000556647777557373, -0.000535331666469574, -0.0005140155553817749, -0.0004926994442939758, -0.00047138333320617676, -0.0004500672221183777, -0.0004287511110305786, -0.00040743499994277954, -0.00038611888885498047, -0.0003648027777671814, -0.0003434866666793823, -0.00032217055559158325, -0.0003008544445037842, -0.0002795383334159851, -0.00025822222232818604, -0.00023690611124038696, -0.0002155900001525879, -0.00019427388906478882, -0.00017295777797698975, -0.00015164166688919067, -0.0001303255558013916, -0.00010900944471359253, -8.769333362579346e-05, -6.637722253799438e-05, -4.506111145019531e-05, -2.374500036239624e-05, -2.428889274597168e-06, 1.8887221813201904e-05, 4.0203332901000977e-05, 6.151944398880005e-05, 8.283555507659912e-05, 0.0001041516661643982, 0.00012546777725219727, 0.00014678388833999634, 0.0001680999994277954, 0.00018941611051559448, 0.00021073222160339355, 0.00023204833269119263, 0.0002533644437789917, 0.00027468055486679077, 0.00029599666595458984, 0.0003173127770423889, 0.000338628888130188, 0.00035994499921798706, 0.00038126111030578613, 0.0004025772213935852, 0.0004238933324813843, 0.00044520944356918335, 0.0004665255546569824, 0.0004878416657447815, 0.0005091577768325806, 0.0005304738879203796, 0.0005517899990081787, 0.0005731061100959778, 0.0005944222211837769, 0.0006157383322715759, 0.000637054443359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 12.0, 11.0, 12.0, 17.0, 19.0, 21.0, 26.0, 35.0, 57.0, 64.0, 91.0, 162.0, 267.0, 784.0, 27787.0, 1016309.0, 1830.0, 431.0, 205.0, 120.0, 83.0, 46.0, 33.0, 32.0, 17.0, 16.0, 8.0, 14.0, 11.0, 4.0, 2.0, 2.0, 3.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01488494873046875, -0.014392971992492676, -0.013900995254516602, -0.013409018516540527, -0.012917041778564453, -0.012425065040588379, -0.011933088302612305, -0.01144111156463623, -0.010949134826660156, -0.010457158088684082, -0.009965181350708008, -0.009473204612731934, -0.00898122787475586, -0.008489251136779785, -0.007997274398803711, -0.007505297660827637, -0.0070133209228515625, -0.006521344184875488, -0.006029367446899414, -0.00553739070892334, -0.005045413970947266, -0.004553437232971191, -0.004061460494995117, -0.003569483757019043, -0.0030775070190429688, -0.0025855302810668945, -0.0020935535430908203, -0.001601576805114746, -0.0011096000671386719, -0.0006176233291625977, -0.00012564659118652344, 0.0003663301467895508, 0.000858306884765625, 0.0013502836227416992, 0.0018422603607177734, 0.0023342370986938477, 0.002826213836669922, 0.003318190574645996, 0.0038101673126220703, 0.0043021440505981445, 0.004794120788574219, 0.005286097526550293, 0.005778074264526367, 0.006270051002502441, 0.006762027740478516, 0.00725400447845459, 0.007745981216430664, 0.008237957954406738, 0.008729934692382812, 0.009221911430358887, 0.009713888168334961, 0.010205864906311035, 0.01069784164428711, 0.011189818382263184, 0.011681795120239258, 0.012173771858215332, 0.012665748596191406, 0.01315772533416748, 0.013649702072143555, 0.014141678810119629, 0.014633655548095703, 0.015125632286071777, 0.015617609024047852, 0.016109585762023926, 0.0166015625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 20.0, 33.0, 74.0, 99.0, 139.0, 186.0, 153.0, 128.0, 75.0, 46.0, 18.0, 17.0, 8.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003211433067917824, -0.00030575686832889915, -0.00029037045896984637, -0.00027498402050696313, -0.00025959761114791036, -0.0002442111726850271, -0.00022882474877405912, -0.0002134383248630911, -0.0001980519009521231, -0.0001826654770411551, -0.0001672790531301871, -0.0001518926292192191, -0.00013650619075633585, -0.00012111977412132546, -0.00010573334293439984, -9.034691902343184e-05, -7.496049511246383e-05, -5.9574071201495826e-05, -4.4187643652549013e-05, -2.88012161036022e-05, -1.3414792192634195e-05, 1.9716317183338106e-06, 1.735806290525943e-05, 3.2744486816227436e-05, 4.813091072719544e-05, 6.351733463816345e-05, 7.890375854913145e-05, 9.429018973605707e-05, 0.00010967661364702508, 0.00012506303028203547, 0.0001404494687449187, 0.0001558358926558867, 0.00017122231656685472, 0.00018660874047782272, 0.00020199516438879073, 0.00021738160285167396, 0.00023276801221072674, 0.00024815445067360997, 0.0002635408891364932, 0.000278927298495546, 0.00029431370785459876, 0.000309700146317482, 0.00032508655567653477, 0.000340472994139418, 0.0003558594034984708, 0.000371245841961354, 0.00038663228042423725, 0.00040201868978329003, 0.00041740512824617326, 0.0004327915667090565, 0.0004481779760681093, 0.0004635644145309925, 0.0004789508238900453, 0.0004943372332490981, 0.0005097236717119813, 0.0005251101101748645, 0.0005404965486377478, 0.000555882987100631, 0.0005712694255635142, 0.0005866558058187366, 0.0006020422442816198, 0.000617428682744503, 0.0006328151212073863, 0.0006482015596702695, 0.0006635879399254918]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 9.0, 14.0, 7.0, 10.0, 14.0, 15.0, 15.0, 20.0, 26.0, 27.0, 27.0, 24.0, 35.0, 24.0, 27.0, 28.0, 38.0, 30.0, 33.0, 32.0, 36.0, 33.0, 44.0, 48.0, 29.0, 41.0, 21.0, 29.0, 24.0, 22.0, 34.0, 22.0, 14.0, 22.0, 14.0, 21.0, 17.0, 19.0, 11.0, 7.0, 3.0, 3.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00028628110885620117, -0.0002773944288492203, -0.0002685077488422394, -0.0002596210688352585, -0.0002507343888282776, -0.0002418477088212967, -0.0002329610288143158, -0.0002240743488073349, -0.000215187668800354, -0.0002063009887933731, -0.0001974143087863922, -0.00018852762877941132, -0.00017964094877243042, -0.00017075426876544952, -0.00016186758875846863, -0.00015298090875148773, -0.00014409422874450684, -0.00013520754873752594, -0.00012632086873054504, -0.00011743418872356415, -0.00010854750871658325, -9.966082870960236e-05, -9.077414870262146e-05, -8.188746869564056e-05, -7.300078868865967e-05, -6.411410868167877e-05, -5.5227428674697876e-05, -4.634074866771698e-05, -3.7454068660736084e-05, -2.8567388653755188e-05, -1.9680708646774292e-05, -1.0794028639793396e-05, -1.9073486328125e-06, 6.979331374168396e-06, 1.5866011381149292e-05, 2.4752691388130188e-05, 3.3639371395111084e-05, 4.252605140209198e-05, 5.1412731409072876e-05, 6.029941141605377e-05, 6.918609142303467e-05, 7.807277143001556e-05, 8.695945143699646e-05, 9.584613144397736e-05, 0.00010473281145095825, 0.00011361949145793915, 0.00012250617146492004, 0.00013139285147190094, 0.00014027953147888184, 0.00014916621148586273, 0.00015805289149284363, 0.00016693957149982452, 0.00017582625150680542, 0.00018471293151378632, 0.0001935996115207672, 0.0002024862915277481, 0.000211372971534729, 0.0002202596515417099, 0.0002291463315486908, 0.0002380330115556717, 0.0002469196915626526, 0.0002558063715696335, 0.0002646930515766144, 0.0002735797315835953, 0.00028246641159057617]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 8.0, 10.0, 7.0, 6.0, 10.0, 9.0, 14.0, 25.0, 29.0, 21.0, 39.0, 35.0, 29.0, 33.0, 45.0, 53.0, 45.0, 39.0, 46.0, 47.0, 32.0, 43.0, 38.0, 36.0, 36.0, 48.0, 27.0, 38.0, 21.0, 27.0, 13.0, 20.0, 15.0, 16.0, 8.0, 13.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9609375, -6.73858642578125, -6.5162353515625, -6.29388427734375, -6.071533203125, -5.84918212890625, -5.6268310546875, -5.40447998046875, -5.18212890625, -4.95977783203125, -4.7374267578125, -4.51507568359375, -4.292724609375, -4.07037353515625, -3.8480224609375, -3.62567138671875, -3.4033203125, -3.18096923828125, -2.9586181640625, -2.73626708984375, -2.513916015625, -2.29156494140625, -2.0692138671875, -1.84686279296875, -1.62451171875, -1.40216064453125, -1.1798095703125, -0.95745849609375, -0.735107421875, -0.51275634765625, -0.2904052734375, -0.06805419921875, 0.154296875, 0.37664794921875, 0.5989990234375, 0.82135009765625, 1.043701171875, 1.26605224609375, 1.4884033203125, 1.71075439453125, 1.93310546875, 2.15545654296875, 2.3778076171875, 2.60015869140625, 2.822509765625, 3.04486083984375, 3.2672119140625, 3.48956298828125, 3.7119140625, 3.93426513671875, 4.1566162109375, 4.37896728515625, 4.601318359375, 4.82366943359375, 5.0460205078125, 5.26837158203125, 5.49072265625, 5.71307373046875, 5.9354248046875, 6.15777587890625, 6.380126953125, 6.60247802734375, 6.8248291015625, 7.04718017578125, 7.26953125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 0.0, 8.0, 10.0, 8.0, 10.0, 19.0, 27.0, 27.0, 50.0, 60.0, 81.0, 143.0, 238.0, 332.0, 682.0, 1499.0, 4242.0, 13220.0, 51743.0, 250789.0, 555620.0, 127779.0, 28861.0, 7977.0, 2707.0, 1118.0, 529.0, 266.0, 162.0, 94.0, 68.0, 44.0, 38.0, 21.0, 23.0, 13.0, 19.0, 6.0, 13.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.5380859375, -6.322265625, -6.1064453125, -5.890625, -5.6748046875, -5.458984375, -5.2431640625, -5.02734375, -4.8115234375, -4.595703125, -4.3798828125, -4.1640625, -3.9482421875, -3.732421875, -3.5166015625, -3.30078125, -3.0849609375, -2.869140625, -2.6533203125, -2.4375, -2.2216796875, -2.005859375, -1.7900390625, -1.57421875, -1.3583984375, -1.142578125, -0.9267578125, -0.7109375, -0.4951171875, -0.279296875, -0.0634765625, 0.15234375, 0.3681640625, 0.583984375, 0.7998046875, 1.015625, 1.2314453125, 1.447265625, 1.6630859375, 1.87890625, 2.0947265625, 2.310546875, 2.5263671875, 2.7421875, 2.9580078125, 3.173828125, 3.3896484375, 3.60546875, 3.8212890625, 4.037109375, 4.2529296875, 4.46875, 4.6845703125, 4.900390625, 5.1162109375, 5.33203125, 5.5478515625, 5.763671875, 5.9794921875, 6.1953125, 6.4111328125, 6.626953125, 6.8427734375, 7.05859375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 11.0, 10.0, 16.0, 21.0, 19.0, 28.0, 40.0, 40.0, 31.0, 37.0, 27.0, 45.0, 59.0, 110.0, 371.0, 1586.0, 111.0, 51.0, 42.0, 46.0, 32.0, 34.0, 39.0, 23.0, 29.0, 23.0, 15.0, 19.0, 21.0, 18.0, 9.0, 7.0, 11.0, 8.0, 5.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.5, -19.819580078125, -19.13916015625, -18.458740234375, -17.7783203125, -17.097900390625, -16.41748046875, -15.737060546875, -15.056640625, -14.376220703125, -13.69580078125, -13.015380859375, -12.3349609375, -11.654541015625, -10.97412109375, -10.293701171875, -9.61328125, -8.932861328125, -8.25244140625, -7.572021484375, -6.8916015625, -6.211181640625, -5.53076171875, -4.850341796875, -4.169921875, -3.489501953125, -2.80908203125, -2.128662109375, -1.4482421875, -0.767822265625, -0.08740234375, 0.593017578125, 1.2734375, 1.953857421875, 2.63427734375, 3.314697265625, 3.9951171875, 4.675537109375, 5.35595703125, 6.036376953125, 6.716796875, 7.397216796875, 8.07763671875, 8.758056640625, 9.4384765625, 10.118896484375, 10.79931640625, 11.479736328125, 12.16015625, 12.840576171875, 13.52099609375, 14.201416015625, 14.8818359375, 15.562255859375, 16.24267578125, 16.923095703125, 17.603515625, 18.283935546875, 18.96435546875, 19.644775390625, 20.3251953125, 21.005615234375, 21.68603515625, 22.366455078125, 23.046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 9.0, 13.0, 19.0, 28.0, 49.0, 58.0, 87.0, 133.0, 260.0, 422.0, 1275.0, 94034.0, 3046052.0, 2007.0, 512.0, 263.0, 179.0, 97.0, 63.0, 43.0, 28.0, 18.0, 11.0, 12.0, 6.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.3125, -76.5888671875, -73.865234375, -71.1416015625, -68.41796875, -65.6943359375, -62.970703125, -60.2470703125, -57.5234375, -54.7998046875, -52.076171875, -49.3525390625, -46.62890625, -43.9052734375, -41.181640625, -38.4580078125, -35.734375, -33.0107421875, -30.287109375, -27.5634765625, -24.83984375, -22.1162109375, -19.392578125, -16.6689453125, -13.9453125, -11.2216796875, -8.498046875, -5.7744140625, -3.05078125, -0.3271484375, 2.396484375, 5.1201171875, 7.84375, 10.5673828125, 13.291015625, 16.0146484375, 18.73828125, 21.4619140625, 24.185546875, 26.9091796875, 29.6328125, 32.3564453125, 35.080078125, 37.8037109375, 40.52734375, 43.2509765625, 45.974609375, 48.6982421875, 51.421875, 54.1455078125, 56.869140625, 59.5927734375, 62.31640625, 65.0400390625, 67.763671875, 70.4873046875, 73.2109375, 75.9345703125, 78.658203125, 81.3818359375, 84.10546875, 86.8291015625, 89.552734375, 92.2763671875, 95.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1010.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.07209396362305, -45.55060958862305, -33.02912139892578, -20.50763702392578, -7.986152648925781, 4.535331726074219, 17.056819915771484, 29.578304290771484, 42.099788665771484, 54.621273040771484, 67.14276123046875, 79.66424560546875, 92.18572998046875, 104.70721435546875, 117.22869873046875, 129.75018310546875, 142.27166748046875, 154.79315185546875, 167.31463623046875, 179.83612060546875, 192.35760498046875, 204.87908935546875, 217.40057373046875, 229.92205810546875, 242.4435577392578, 254.9650421142578, 267.4865417480469, 280.0080261230469, 292.5295104980469, 305.0509948730469, 317.5724792480469, 330.0939636230469, 342.6154479980469, 355.1369323730469, 367.6584167480469, 380.1799011230469, 392.7013854980469, 405.2228698730469, 417.7443542480469, 430.2658386230469, 442.7873229980469, 455.3088073730469, 467.8302917480469, 480.3517761230469, 492.8732604980469, 505.3947448730469, 517.916259765625, 530.437744140625, 542.959228515625, 555.480712890625, 568.002197265625, 580.523681640625, 593.045166015625, 605.566650390625, 618.088134765625, 630.609619140625, 643.131103515625, 655.652587890625, 668.174072265625, 680.695556640625, 693.217041015625, 705.738525390625, 718.260009765625, 730.781494140625, 743.302978515625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 9.0, 12.0, 17.0, 18.0, 15.0, 26.0, 23.0, 24.0, 33.0, 31.0, 25.0, 34.0, 40.0, 37.0, 30.0, 39.0, 39.0, 40.0, 43.0, 41.0, 44.0, 33.0, 29.0, 50.0, 34.0, 21.0, 23.0, 26.0, 22.0, 19.0, 19.0, 14.0, 8.0, 9.0, 17.0, 4.0, 3.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-65.43413543701172, -63.51478576660156, -61.59543991088867, -59.676090240478516, -57.756744384765625, -55.83739471435547, -53.91804504394531, -51.99869918823242, -50.07935333251953, -48.160003662109375, -46.240657806396484, -44.32130813598633, -42.40196228027344, -40.48261260986328, -38.563262939453125, -36.643917083740234, -34.72456741333008, -32.80521774291992, -30.88587188720703, -28.966522216796875, -27.047176361083984, -25.127826690673828, -23.208478927612305, -21.28913116455078, -19.369783401489258, -17.450435638427734, -15.531087875366211, -13.611739158630371, -11.692391395568848, -9.773043632507324, -7.853694915771484, -5.934347152709961, -4.0149993896484375, -2.095651388168335, -0.17630338668823242, 1.7430448532104492, 3.6623926162719727, 5.581740379333496, 7.501089096069336, 9.42043685913086, 11.339784622192383, 13.259132385253906, 15.17848014831543, 17.097827911376953, 19.01717758178711, 20.9365234375, 22.855873107910156, 24.77522087097168, 26.694568634033203, 28.613916397094727, 30.53326416015625, 32.452613830566406, 34.3719596862793, 36.29130935668945, 38.210655212402344, 40.1300048828125, 42.049354553222656, 43.96870422363281, 45.8880500793457, 47.80739974975586, 49.72674560546875, 51.646095275878906, 53.56544494628906, 55.48479080200195, 57.404136657714844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 9.0, 4.0, 7.0, 8.0, 16.0, 18.0, 21.0, 28.0, 30.0, 21.0, 45.0, 34.0, 39.0, 50.0, 42.0, 46.0, 54.0, 44.0, 42.0, 40.0, 39.0, 35.0, 37.0, 34.0, 37.0, 38.0, 35.0, 18.0, 20.0, 15.0, 19.0, 13.0, 15.0, 15.0, 7.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.72265625, -6.48919677734375, -6.2557373046875, -6.02227783203125, -5.788818359375, -5.55535888671875, -5.3218994140625, -5.08843994140625, -4.85498046875, -4.62152099609375, -4.3880615234375, -4.15460205078125, -3.921142578125, -3.68768310546875, -3.4542236328125, -3.22076416015625, -2.9873046875, -2.75384521484375, -2.5203857421875, -2.28692626953125, -2.053466796875, -1.82000732421875, -1.5865478515625, -1.35308837890625, -1.11962890625, -0.88616943359375, -0.6527099609375, -0.41925048828125, -0.185791015625, 0.04766845703125, 0.2811279296875, 0.51458740234375, 0.748046875, 0.98150634765625, 1.2149658203125, 1.44842529296875, 1.681884765625, 1.91534423828125, 2.1488037109375, 2.38226318359375, 2.61572265625, 2.84918212890625, 3.0826416015625, 3.31610107421875, 3.549560546875, 3.78302001953125, 4.0164794921875, 4.24993896484375, 4.4833984375, 4.71685791015625, 4.9503173828125, 5.18377685546875, 5.417236328125, 5.65069580078125, 5.8841552734375, 6.11761474609375, 6.35107421875, 6.58453369140625, 6.8179931640625, 7.05145263671875, 7.284912109375, 7.51837158203125, 7.7518310546875, 7.98529052734375, 8.21875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 0.0, 13.0, 10.0, 19.0, 18.0, 21.0, 32.0, 34.0, 37.0, 48.0, 60.0, 70.0, 136.0, 140.0, 246.0, 425.0, 1276.0, 6121.0, 110931.0, 2250592.0, 1753481.0, 63394.0, 4861.0, 1052.0, 391.0, 226.0, 151.0, 92.0, 72.0, 51.0, 46.0, 40.0, 40.0, 34.0, 34.0, 14.0, 12.0, 14.0, 10.0, 11.0, 6.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.1875, -15.60791015625, -15.0283203125, -14.44873046875, -13.869140625, -13.28955078125, -12.7099609375, -12.13037109375, -11.55078125, -10.97119140625, -10.3916015625, -9.81201171875, -9.232421875, -8.65283203125, -8.0732421875, -7.49365234375, -6.9140625, -6.33447265625, -5.7548828125, -5.17529296875, -4.595703125, -4.01611328125, -3.4365234375, -2.85693359375, -2.27734375, -1.69775390625, -1.1181640625, -0.53857421875, 0.041015625, 0.62060546875, 1.2001953125, 1.77978515625, 2.359375, 2.93896484375, 3.5185546875, 4.09814453125, 4.677734375, 5.25732421875, 5.8369140625, 6.41650390625, 6.99609375, 7.57568359375, 8.1552734375, 8.73486328125, 9.314453125, 9.89404296875, 10.4736328125, 11.05322265625, 11.6328125, 12.21240234375, 12.7919921875, 13.37158203125, 13.951171875, 14.53076171875, 15.1103515625, 15.68994140625, 16.26953125, 16.84912109375, 17.4287109375, 18.00830078125, 18.587890625, 19.16748046875, 19.7470703125, 20.32666015625, 20.90625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 13.0, 16.0, 14.0, 8.0, 21.0, 27.0, 38.0, 52.0, 69.0, 75.0, 97.0, 145.0, 192.0, 259.0, 335.0, 417.0, 428.0, 431.0, 343.0, 241.0, 219.0, 129.0, 110.0, 93.0, 79.0, 56.0, 37.0, 18.0, 24.0, 18.0, 16.0, 9.0, 8.0, 8.0, 6.0, 4.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.087158203125, -9.72119140625, -9.355224609375, -8.9892578125, -8.623291015625, -8.25732421875, -7.891357421875, -7.525390625, -7.159423828125, -6.79345703125, -6.427490234375, -6.0615234375, -5.695556640625, -5.32958984375, -4.963623046875, -4.59765625, -4.231689453125, -3.86572265625, -3.499755859375, -3.1337890625, -2.767822265625, -2.40185546875, -2.035888671875, -1.669921875, -1.303955078125, -0.93798828125, -0.572021484375, -0.2060546875, 0.159912109375, 0.52587890625, 0.891845703125, 1.2578125, 1.623779296875, 1.98974609375, 2.355712890625, 2.7216796875, 3.087646484375, 3.45361328125, 3.819580078125, 4.185546875, 4.551513671875, 4.91748046875, 5.283447265625, 5.6494140625, 6.015380859375, 6.38134765625, 6.747314453125, 7.11328125, 7.479248046875, 7.84521484375, 8.211181640625, 8.5771484375, 8.943115234375, 9.30908203125, 9.675048828125, 10.041015625, 10.406982421875, 10.77294921875, 11.138916015625, 11.5048828125, 11.870849609375, 12.23681640625, 12.602783203125, 12.96875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 7.0, 7.0, 10.0, 7.0, 13.0, 19.0, 14.0, 23.0, 26.0, 42.0, 50.0, 61.0, 97.0, 89.0, 121.0, 154.0, 177.0, 235.0, 367.0, 582.0, 3389.0, 3810469.0, 375065.0, 1336.0, 536.0, 336.0, 219.0, 165.0, 134.0, 104.0, 72.0, 78.0, 59.0, 45.0, 39.0, 36.0, 26.0, 18.0, 23.0, 10.0, 7.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.875, -61.8037109375, -59.732421875, -57.6611328125, -55.58984375, -53.5185546875, -51.447265625, -49.3759765625, -47.3046875, -45.2333984375, -43.162109375, -41.0908203125, -39.01953125, -36.9482421875, -34.876953125, -32.8056640625, -30.734375, -28.6630859375, -26.591796875, -24.5205078125, -22.44921875, -20.3779296875, -18.306640625, -16.2353515625, -14.1640625, -12.0927734375, -10.021484375, -7.9501953125, -5.87890625, -3.8076171875, -1.736328125, 0.3349609375, 2.40625, 4.4775390625, 6.548828125, 8.6201171875, 10.69140625, 12.7626953125, 14.833984375, 16.9052734375, 18.9765625, 21.0478515625, 23.119140625, 25.1904296875, 27.26171875, 29.3330078125, 31.404296875, 33.4755859375, 35.546875, 37.6181640625, 39.689453125, 41.7607421875, 43.83203125, 45.9033203125, 47.974609375, 50.0458984375, 52.1171875, 54.1884765625, 56.259765625, 58.3310546875, 60.40234375, 62.4736328125, 64.544921875, 66.6162109375, 68.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 62.0, 550.0, 379.0, 22.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.54374694824219, -113.67644500732422, -104.80913543701172, -95.94183349609375, -87.07452392578125, -78.20722198486328, -69.33992004394531, -60.47261428833008, -51.605308532714844, -42.73800277709961, -33.870697021484375, -25.003395080566406, -16.136089324951172, -7.2687835693359375, 1.5985183715820312, 10.465824127197266, 19.3331298828125, 28.200435638427734, 37.06774139404297, 45.93504333496094, 54.80234909057617, 63.669654846191406, 72.53695678710938, 81.40426635742188, 90.27156829833984, 99.13887023925781, 108.00617980957031, 116.87348175048828, 125.74078369140625, 134.60809326171875, 143.47540283203125, 152.3426971435547, 161.21002197265625, 170.07733154296875, 178.9446258544922, 187.8119354248047, 196.6792449951172, 205.54653930664062, 214.41384887695312, 223.28115844726562, 232.14846801757812, 241.01577758789062, 249.88307189941406, 258.7503662109375, 267.61767578125, 276.4849853515625, 285.352294921875, 294.2196044921875, 303.0869140625, 311.9542236328125, 320.821533203125, 329.6888427734375, 338.5561218261719, 347.4234313964844, 356.2907409667969, 365.1580505371094, 374.02532958984375, 382.89263916015625, 391.75994873046875, 400.62725830078125, 409.4945373535156, 418.3618469238281, 427.2291564941406, 436.0964660644531, 444.9637756347656]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 9.0, 16.0, 11.0, 16.0, 12.0, 26.0, 21.0, 32.0, 39.0, 35.0, 36.0, 45.0, 32.0, 38.0, 40.0, 38.0, 58.0, 48.0, 56.0, 44.0, 38.0, 29.0, 35.0, 32.0, 33.0, 31.0, 17.0, 29.0, 20.0, 10.0, 9.0, 9.0, 10.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.27734375, -44.82401657104492, -43.370689392089844, -41.917362213134766, -40.46403503417969, -39.010711669921875, -37.5573844909668, -36.10405731201172, -34.65073013305664, -33.19740295410156, -31.744075775146484, -30.29075050354004, -28.83742332458496, -27.384096145629883, -25.930770874023438, -24.47744369506836, -23.02411651611328, -21.570789337158203, -20.117462158203125, -18.66413688659668, -17.2108097076416, -15.757482528686523, -14.304156303405762, -12.850830078125, -11.397502899169922, -9.944175720214844, -8.490849494934082, -7.037522792816162, -5.584196090698242, -4.130869388580322, -2.6775426864624023, -1.2242164611816406, 0.2291107177734375, 1.6824374198913574, 3.1357641220092773, 4.589090824127197, 6.042417526245117, 7.495744228363037, 8.949070930480957, 10.402397155761719, 11.855724334716797, 13.309051513671875, 14.762377738952637, 16.2157039642334, 17.669031143188477, 19.122358322143555, 20.57568359375, 22.029010772705078, 23.482337951660156, 24.935665130615234, 26.388992309570312, 27.842317581176758, 29.295644760131836, 30.748971939086914, 32.20229721069336, 33.65562438964844, 35.108951568603516, 36.562278747558594, 38.01560592651367, 39.46893310546875, 40.92225646972656, 42.37558364868164, 43.82891082763672, 45.2822380065918, 46.735565185546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 8.0, 16.0, 11.0, 17.0, 25.0, 28.0, 32.0, 40.0, 22.0, 34.0, 34.0, 40.0, 36.0, 49.0, 30.0, 51.0, 47.0, 48.0, 42.0, 43.0, 34.0, 33.0, 34.0, 36.0, 28.0, 23.0, 23.0, 27.0, 18.0, 17.0, 9.0, 16.0, 15.0, 8.0, 7.0, 2.0, 5.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.2955322265625, -6.075439453125, -5.8553466796875, -5.63525390625, -5.4151611328125, -5.195068359375, -4.9749755859375, -4.7548828125, -4.5347900390625, -4.314697265625, -4.0946044921875, -3.87451171875, -3.6544189453125, -3.434326171875, -3.2142333984375, -2.994140625, -2.7740478515625, -2.553955078125, -2.3338623046875, -2.11376953125, -1.8936767578125, -1.673583984375, -1.4534912109375, -1.2333984375, -1.0133056640625, -0.793212890625, -0.5731201171875, -0.35302734375, -0.1329345703125, 0.087158203125, 0.3072509765625, 0.52734375, 0.7474365234375, 0.967529296875, 1.1876220703125, 1.40771484375, 1.6278076171875, 1.847900390625, 2.0679931640625, 2.2880859375, 2.5081787109375, 2.728271484375, 2.9483642578125, 3.16845703125, 3.3885498046875, 3.608642578125, 3.8287353515625, 4.048828125, 4.2689208984375, 4.489013671875, 4.7091064453125, 4.92919921875, 5.1492919921875, 5.369384765625, 5.5894775390625, 5.8095703125, 6.0296630859375, 6.249755859375, 6.4698486328125, 6.68994140625, 6.9100341796875, 7.130126953125, 7.3502197265625, 7.5703125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 24.0, 30.0, 33.0, 76.0, 90.0, 157.0, 233.0, 338.0, 539.0, 821.0, 1303.0, 2094.0, 3360.0, 5206.0, 8046.0, 13163.0, 20698.0, 34112.0, 57358.0, 101977.0, 196468.0, 267024.0, 141850.0, 77084.0, 44286.0, 26736.0, 16659.0, 10733.0, 6523.0, 4103.0, 2656.0, 1748.0, 1058.0, 701.0, 490.0, 277.0, 179.0, 117.0, 55.0, 48.0, 37.0, 16.0, 15.0, 12.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.17578125, -1.1414642333984375, -1.107147216796875, -1.0728302001953125, -1.03851318359375, -1.0041961669921875, -0.969879150390625, -0.9355621337890625, -0.9012451171875, -0.8669281005859375, -0.832611083984375, -0.7982940673828125, -0.76397705078125, -0.7296600341796875, -0.695343017578125, -0.6610260009765625, -0.626708984375, -0.5923919677734375, -0.558074951171875, -0.5237579345703125, -0.48944091796875, -0.4551239013671875, -0.420806884765625, -0.3864898681640625, -0.3521728515625, -0.3178558349609375, -0.283538818359375, -0.2492218017578125, -0.21490478515625, -0.1805877685546875, -0.146270751953125, -0.1119537353515625, -0.07763671875, -0.0433197021484375, -0.009002685546875, 0.0253143310546875, 0.05963134765625, 0.0939483642578125, 0.128265380859375, 0.1625823974609375, 0.1968994140625, 0.2312164306640625, 0.265533447265625, 0.2998504638671875, 0.33416748046875, 0.3684844970703125, 0.402801513671875, 0.4371185302734375, 0.471435546875, 0.5057525634765625, 0.540069580078125, 0.5743865966796875, 0.60870361328125, 0.6430206298828125, 0.677337646484375, 0.7116546630859375, 0.7459716796875, 0.7802886962890625, 0.814605712890625, 0.8489227294921875, 0.88323974609375, 0.9175567626953125, 0.951873779296875, 0.9861907958984375, 1.0205078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 3.0, 7.0, 13.0, 13.0, 9.0, 12.0, 21.0, 12.0, 23.0, 16.0, 24.0, 32.0, 18.0, 32.0, 38.0, 44.0, 35.0, 38.0, 37.0, 37.0, 1048.0, 30.0, 51.0, 29.0, 48.0, 43.0, 29.0, 34.0, 30.0, 28.0, 24.0, 22.0, 17.0, 10.0, 20.0, 13.0, 16.0, 12.0, 6.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.68359375, -3.56640625, -3.44921875, -3.33203125, -3.21484375, -3.09765625, -2.98046875, -2.86328125, -2.74609375, -2.62890625, -2.51171875, -2.39453125, -2.27734375, -2.16015625, -2.04296875, -1.92578125, -1.80859375, -1.69140625, -1.57421875, -1.45703125, -1.33984375, -1.22265625, -1.10546875, -0.98828125, -0.87109375, -0.75390625, -0.63671875, -0.51953125, -0.40234375, -0.28515625, -0.16796875, -0.05078125, 0.06640625, 0.18359375, 0.30078125, 0.41796875, 0.53515625, 0.65234375, 0.76953125, 0.88671875, 1.00390625, 1.12109375, 1.23828125, 1.35546875, 1.47265625, 1.58984375, 1.70703125, 1.82421875, 1.94140625, 2.05859375, 2.17578125, 2.29296875, 2.41015625, 2.52734375, 2.64453125, 2.76171875, 2.87890625, 2.99609375, 3.11328125, 3.23046875, 3.34765625, 3.46484375, 3.58203125, 3.69921875, 3.81640625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 13.0, 16.0, 21.0, 23.0, 47.0, 70.0, 105.0, 142.0, 218.0, 322.0, 465.0, 670.0, 951.0, 1319.0, 1787.0, 2746.0, 4008.0, 5913.0, 8744.0, 13147.0, 20511.0, 32149.0, 51895.0, 85973.0, 148626.0, 1289126.0, 169847.0, 96840.0, 58146.0, 36081.0, 22562.0, 14548.0, 9400.0, 6615.0, 4325.0, 2935.0, 2102.0, 1411.0, 1005.0, 724.0, 489.0, 356.0, 246.0, 151.0, 116.0, 70.0, 48.0, 40.0, 29.0, 15.0, 8.0, 7.0, 7.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.90478515625, -0.877044677734375, -0.84930419921875, -0.821563720703125, -0.7938232421875, -0.766082763671875, -0.73834228515625, -0.710601806640625, -0.682861328125, -0.655120849609375, -0.62738037109375, -0.599639892578125, -0.5718994140625, -0.544158935546875, -0.51641845703125, -0.488677978515625, -0.4609375, -0.433197021484375, -0.40545654296875, -0.377716064453125, -0.3499755859375, -0.322235107421875, -0.29449462890625, -0.266754150390625, -0.239013671875, -0.211273193359375, -0.18353271484375, -0.155792236328125, -0.1280517578125, -0.100311279296875, -0.07257080078125, -0.044830322265625, -0.01708984375, 0.010650634765625, 0.03839111328125, 0.066131591796875, 0.0938720703125, 0.121612548828125, 0.14935302734375, 0.177093505859375, 0.204833984375, 0.232574462890625, 0.26031494140625, 0.288055419921875, 0.3157958984375, 0.343536376953125, 0.37127685546875, 0.399017333984375, 0.4267578125, 0.454498291015625, 0.48223876953125, 0.509979248046875, 0.5377197265625, 0.565460205078125, 0.59320068359375, 0.620941162109375, 0.648681640625, 0.676422119140625, 0.70416259765625, 0.731903076171875, 0.7596435546875, 0.787384033203125, 0.81512451171875, 0.842864990234375, 0.87060546875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 13.0, 19.0, 27.0, 38.0, 45.0, 72.0, 76.0, 104.0, 124.0, 101.0, 91.0, 77.0, 49.0, 42.0, 30.0, 16.0, 26.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009589195251464844, -0.0009312108159065247, -0.0009035021066665649, -0.0008757933974266052, -0.0008480846881866455, -0.0008203759789466858, -0.0007926672697067261, -0.0007649585604667664, -0.0007372498512268066, -0.0007095411419868469, -0.0006818324327468872, -0.0006541237235069275, -0.0006264150142669678, -0.0005987063050270081, -0.0005709975957870483, -0.0005432888865470886, -0.0005155801773071289, -0.0004878714680671692, -0.00046016275882720947, -0.00043245404958724976, -0.00040474534034729004, -0.0003770366311073303, -0.0003493279218673706, -0.0003216192126274109, -0.00029391050338745117, -0.00026620179414749146, -0.00023849308490753174, -0.00021078437566757202, -0.0001830756664276123, -0.0001553669571876526, -0.00012765824794769287, -9.994953870773315e-05, -7.224082946777344e-05, -4.453212022781372e-05, -1.6823410987854004e-05, 1.0885298252105713e-05, 3.859400749206543e-05, 6.630271673202515e-05, 9.401142597198486e-05, 0.00012172013521194458, 0.0001494288444519043, 0.00017713755369186401, 0.00020484626293182373, 0.00023255497217178345, 0.00026026368141174316, 0.0002879723906517029, 0.0003156810998916626, 0.0003433898091316223, 0.00037109851837158203, 0.00039880722761154175, 0.00042651593685150146, 0.0004542246460914612, 0.0004819333553314209, 0.0005096420645713806, 0.0005373507738113403, 0.0005650594830513, 0.0005927681922912598, 0.0006204769015312195, 0.0006481856107711792, 0.0006758943200111389, 0.0007036030292510986, 0.0007313117384910583, 0.0007590204477310181, 0.0007867291569709778, 0.0008144378662109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 10.0, 7.0, 15.0, 14.0, 18.0, 38.0, 54.0, 85.0, 136.0, 224.0, 812.0, 788461.0, 257434.0, 661.0, 223.0, 120.0, 64.0, 52.0, 29.0, 26.0, 21.0, 12.0, 8.0, 5.0, 9.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019439697265625, -0.018790721893310547, -0.018141746520996094, -0.01749277114868164, -0.016843795776367188, -0.016194820404052734, -0.015545845031738281, -0.014896869659423828, -0.014247894287109375, -0.013598918914794922, -0.012949943542480469, -0.012300968170166016, -0.011651992797851562, -0.01100301742553711, -0.010354042053222656, -0.009705066680908203, -0.00905609130859375, -0.008407115936279297, -0.007758140563964844, -0.007109165191650391, -0.0064601898193359375, -0.005811214447021484, -0.005162239074707031, -0.004513263702392578, -0.003864288330078125, -0.003215312957763672, -0.0025663375854492188, -0.0019173622131347656, -0.0012683868408203125, -0.0006194114685058594, 2.956390380859375e-05, 0.0006785392761230469, 0.0013275146484375, 0.001976490020751953, 0.0026254653930664062, 0.0032744407653808594, 0.0039234161376953125, 0.004572391510009766, 0.005221366882324219, 0.005870342254638672, 0.006519317626953125, 0.007168292999267578, 0.007817268371582031, 0.008466243743896484, 0.009115219116210938, 0.00976419448852539, 0.010413169860839844, 0.011062145233154297, 0.01171112060546875, 0.012360095977783203, 0.013009071350097656, 0.01365804672241211, 0.014307022094726562, 0.014955997467041016, 0.015604972839355469, 0.016253948211669922, 0.016902923583984375, 0.017551898956298828, 0.01820087432861328, 0.018849849700927734, 0.019498825073242188, 0.02014780044555664, 0.020796775817871094, 0.021445751190185547, 0.0220947265625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 295.0, 711.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005777199403382838, -0.00046610942808911204, -0.0003544989158399403, -0.00024288837448693812, -0.00013127786223776639, -1.9667320884764194e-05, 9.194319136440754e-05, 0.00020355370361357927, 0.000315164215862751, 0.00042677472811192274, 0.0005383852403610945, 0.0006499957526102662, 0.0007616062648594379, 0.0008732168353162706, 0.0009848272893577814, 0.001096437918022275, 0.0012080483138561249, 0.0013196588261052966, 0.0014312693383544683, 0.00154287985060364, 0.0016544903628528118, 0.0017661009915173054, 0.0018777113873511553, 0.001989322016015649, 0.0021009324118494987, 0.0022125430405139923, 0.002324153436347842, 0.0024357640650123358, 0.0025473744608461857, 0.0026589850895106792, 0.002770595485344529, 0.0028822061140090227, 0.0029938167426735163, 0.00310542737133801, 0.0032170377671718597, 0.0033286483958363533, 0.003440258791670203, 0.0035518694203346968, 0.0036634798161685467, 0.0037750904448330402, 0.00388670084066689, 0.00399831123650074, 0.004109921865165234, 0.004221532493829727, 0.004333143122494221, 0.004444753285497427, 0.0045563639141619205, 0.004667974542826414, 0.004779585171490908, 0.004891195800155401, 0.005002806428819895, 0.005114416591823101, 0.005226027220487595, 0.005337637849152088, 0.005449248477816582, 0.005560858640819788, 0.0056724692694842815, 0.005784079898148775, 0.005895690526813269, 0.006007300689816475, 0.0061189113184809685, 0.006230521947145462, 0.006342132575809956, 0.006453742738813162, 0.006565353367477655]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 11.0, 10.0, 11.0, 16.0, 19.0, 19.0, 20.0, 10.0, 25.0, 28.0, 27.0, 35.0, 32.0, 33.0, 24.0, 34.0, 53.0, 38.0, 40.0, 42.0, 43.0, 37.0, 47.0, 35.0, 34.0, 33.0, 30.0, 28.0, 24.0, 18.0, 20.0, 15.0, 14.0, 11.0, 15.0, 10.0, 17.0, 6.0, 6.0, 3.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026416778564453125, -0.0002552289515733719, -0.0002462901175022125, -0.00023735128343105316, -0.0002284124493598938, -0.00021947361528873444, -0.00021053478121757507, -0.0002015959471464157, -0.00019265711307525635, -0.00018371827900409698, -0.00017477944493293762, -0.00016584061086177826, -0.0001569017767906189, -0.00014796294271945953, -0.00013902410864830017, -0.0001300852745771408, -0.00012114644050598145, -0.00011220760643482208, -0.00010326877236366272, -9.432993829250336e-05, -8.5391104221344e-05, -7.645227015018463e-05, -6.751343607902527e-05, -5.8574602007865906e-05, -4.963576793670654e-05, -4.069693386554718e-05, -3.175809979438782e-05, -2.2819265723228455e-05, -1.3880431652069092e-05, -4.941597580909729e-06, 3.997236490249634e-06, 1.2936070561408997e-05, 2.187490463256836e-05, 3.081373870372772e-05, 3.9752572774887085e-05, 4.869140684604645e-05, 5.763024091720581e-05, 6.656907498836517e-05, 7.550790905952454e-05, 8.44467431306839e-05, 9.338557720184326e-05, 0.00010232441127300262, 0.00011126324534416199, 0.00012020207941532135, 0.0001291409134864807, 0.00013807974755764008, 0.00014701858162879944, 0.0001559574156999588, 0.00016489624977111816, 0.00017383508384227753, 0.0001827739179134369, 0.00019171275198459625, 0.00020065158605575562, 0.00020959042012691498, 0.00021852925419807434, 0.0002274680882692337, 0.00023640692234039307, 0.00024534575641155243, 0.0002542845904827118, 0.00026322342455387115, 0.0002721622586250305, 0.0002811010926961899, 0.00029003992676734924, 0.0002989787608385086, 0.00030791759490966797]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 8.0, 16.0, 11.0, 17.0, 25.0, 28.0, 32.0, 40.0, 22.0, 34.0, 34.0, 40.0, 36.0, 49.0, 30.0, 51.0, 47.0, 48.0, 42.0, 43.0, 34.0, 33.0, 34.0, 36.0, 28.0, 23.0, 23.0, 27.0, 18.0, 17.0, 9.0, 16.0, 15.0, 8.0, 7.0, 2.0, 5.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.2955322265625, -6.075439453125, -5.8553466796875, -5.63525390625, -5.4151611328125, -5.195068359375, -4.9749755859375, -4.7548828125, -4.5347900390625, -4.314697265625, -4.0946044921875, -3.87451171875, -3.6544189453125, -3.434326171875, -3.2142333984375, -2.994140625, -2.7740478515625, -2.553955078125, -2.3338623046875, -2.11376953125, -1.8936767578125, -1.673583984375, -1.4534912109375, -1.2333984375, -1.0133056640625, -0.793212890625, -0.5731201171875, -0.35302734375, -0.1329345703125, 0.087158203125, 0.3072509765625, 0.52734375, 0.7474365234375, 0.967529296875, 1.1876220703125, 1.40771484375, 1.6278076171875, 1.847900390625, 2.0679931640625, 2.2880859375, 2.5081787109375, 2.728271484375, 2.9483642578125, 3.16845703125, 3.3885498046875, 3.608642578125, 3.8287353515625, 4.048828125, 4.2689208984375, 4.489013671875, 4.7091064453125, 4.92919921875, 5.1492919921875, 5.369384765625, 5.5894775390625, 5.8095703125, 6.0296630859375, 6.249755859375, 6.4698486328125, 6.68994140625, 6.9100341796875, 7.130126953125, 7.3502197265625, 7.5703125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 10.0, 6.0, 14.0, 11.0, 14.0, 26.0, 36.0, 44.0, 69.0, 138.0, 243.0, 410.0, 855.0, 1628.0, 3221.0, 6738.0, 14392.0, 32769.0, 82577.0, 225869.0, 405137.0, 165105.0, 61806.0, 25324.0, 11166.0, 5352.0, 2615.0, 1345.0, 681.0, 389.0, 210.0, 118.0, 57.0, 52.0, 32.0, 12.0, 18.0, 14.0, 9.0, 11.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.955078125, -3.8203125, -3.685546875, -3.55078125, -3.416015625, -3.28125, -3.146484375, -3.01171875, -2.876953125, -2.7421875, -2.607421875, -2.47265625, -2.337890625, -2.203125, -2.068359375, -1.93359375, -1.798828125, -1.6640625, -1.529296875, -1.39453125, -1.259765625, -1.125, -0.990234375, -0.85546875, -0.720703125, -0.5859375, -0.451171875, -0.31640625, -0.181640625, -0.046875, 0.087890625, 0.22265625, 0.357421875, 0.4921875, 0.626953125, 0.76171875, 0.896484375, 1.03125, 1.166015625, 1.30078125, 1.435546875, 1.5703125, 1.705078125, 1.83984375, 1.974609375, 2.109375, 2.244140625, 2.37890625, 2.513671875, 2.6484375, 2.783203125, 2.91796875, 3.052734375, 3.1875, 3.322265625, 3.45703125, 3.591796875, 3.7265625, 3.861328125, 3.99609375, 4.130859375, 4.265625, 4.400390625, 4.53515625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 7.0, 8.0, 7.0, 11.0, 10.0, 13.0, 21.0, 15.0, 17.0, 25.0, 31.0, 31.0, 42.0, 39.0, 50.0, 54.0, 87.0, 179.0, 1693.0, 186.0, 85.0, 58.0, 41.0, 38.0, 33.0, 33.0, 33.0, 29.0, 31.0, 20.0, 25.0, 10.0, 19.0, 10.0, 6.0, 4.0, 8.0, 8.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-21.3125, -20.634765625, -19.95703125, -19.279296875, -18.6015625, -17.923828125, -17.24609375, -16.568359375, -15.890625, -15.212890625, -14.53515625, -13.857421875, -13.1796875, -12.501953125, -11.82421875, -11.146484375, -10.46875, -9.791015625, -9.11328125, -8.435546875, -7.7578125, -7.080078125, -6.40234375, -5.724609375, -5.046875, -4.369140625, -3.69140625, -3.013671875, -2.3359375, -1.658203125, -0.98046875, -0.302734375, 0.375, 1.052734375, 1.73046875, 2.408203125, 3.0859375, 3.763671875, 4.44140625, 5.119140625, 5.796875, 6.474609375, 7.15234375, 7.830078125, 8.5078125, 9.185546875, 9.86328125, 10.541015625, 11.21875, 11.896484375, 12.57421875, 13.251953125, 13.9296875, 14.607421875, 15.28515625, 15.962890625, 16.640625, 17.318359375, 17.99609375, 18.673828125, 19.3515625, 20.029296875, 20.70703125, 21.384765625, 22.0625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 10.0, 12.0, 9.0, 9.0, 24.0, 21.0, 24.0, 32.0, 49.0, 61.0, 71.0, 105.0, 110.0, 139.0, 205.0, 332.0, 601.0, 2288.0, 419133.0, 2717268.0, 3339.0, 652.0, 296.0, 221.0, 148.0, 135.0, 73.0, 70.0, 54.0, 39.0, 40.0, 25.0, 19.0, 13.0, 11.0, 10.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-53.53125, -51.9130859375, -50.294921875, -48.6767578125, -47.05859375, -45.4404296875, -43.822265625, -42.2041015625, -40.5859375, -38.9677734375, -37.349609375, -35.7314453125, -34.11328125, -32.4951171875, -30.876953125, -29.2587890625, -27.640625, -26.0224609375, -24.404296875, -22.7861328125, -21.16796875, -19.5498046875, -17.931640625, -16.3134765625, -14.6953125, -13.0771484375, -11.458984375, -9.8408203125, -8.22265625, -6.6044921875, -4.986328125, -3.3681640625, -1.75, -0.1318359375, 1.486328125, 3.1044921875, 4.72265625, 6.3408203125, 7.958984375, 9.5771484375, 11.1953125, 12.8134765625, 14.431640625, 16.0498046875, 17.66796875, 19.2861328125, 20.904296875, 22.5224609375, 24.140625, 25.7587890625, 27.376953125, 28.9951171875, 30.61328125, 32.2314453125, 33.849609375, 35.4677734375, 37.0859375, 38.7041015625, 40.322265625, 41.9404296875, 43.55859375, 45.1767578125, 46.794921875, 48.4130859375, 50.03125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 9.0, 220.0, 652.0, 125.0, 12.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.327392578125, -16.333105087280273, -13.338817596435547, -10.34453010559082, -7.350242614746094, -4.355955123901367, -1.3616676330566406, 1.632619857788086, 4.6269073486328125, 7.621194839477539, 10.615482330322266, 13.609769821166992, 16.60405731201172, 19.598344802856445, 22.592632293701172, 25.5869197845459, 28.581207275390625, 31.57549476623535, 34.56978225708008, 37.56407165527344, 40.55835723876953, 43.552642822265625, 46.546932220458984, 49.541221618652344, 52.53550720214844, 55.52979278564453, 58.52408218383789, 61.51837158203125, 64.51265716552734, 67.50694274902344, 70.50123596191406, 73.49552154541016, 76.48980712890625, 79.48409271240234, 82.47837829589844, 85.47267150878906, 88.46695709228516, 91.46124267578125, 94.45553588867188, 97.44982147216797, 100.44410705566406, 103.43839263916016, 106.43267822265625, 109.42697143554688, 112.42125701904297, 115.41554260253906, 118.40983581542969, 121.40412139892578, 124.39840698242188, 127.39269256591797, 130.38697814941406, 133.3812713623047, 136.37554931640625, 139.36984252929688, 142.3641357421875, 145.35841369628906, 148.3527069091797, 151.3470001220703, 154.34127807617188, 157.3355712890625, 160.32986450195312, 163.3241424560547, 166.3184356689453, 169.31271362304688, 172.3070068359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 7.0, 7.0, 6.0, 11.0, 13.0, 20.0, 21.0, 11.0, 22.0, 29.0, 26.0, 27.0, 27.0, 28.0, 30.0, 37.0, 42.0, 38.0, 40.0, 37.0, 46.0, 48.0, 32.0, 46.0, 27.0, 39.0, 29.0, 28.0, 19.0, 28.0, 32.0, 18.0, 23.0, 20.0, 18.0, 14.0, 11.0, 9.0, 5.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.3079833984375, -46.60369110107422, -44.89939880371094, -43.195106506347656, -41.490814208984375, -39.786521911621094, -38.08222961425781, -36.37793731689453, -34.67364501953125, -32.96935272216797, -31.265060424804688, -29.560768127441406, -27.856475830078125, -26.152183532714844, -24.44788932800293, -22.74359703063965, -21.039302825927734, -19.335010528564453, -17.630718231201172, -15.926424980163574, -14.222132682800293, -12.517840385437012, -10.813547134399414, -9.109254837036133, -7.404962539672852, -5.70067024230957, -3.996377468109131, -2.2920846939086914, -0.5877923965454102, 1.116499900817871, 2.8207931518554688, 4.52508544921875, 6.229377746582031, 7.9336700439453125, 9.637962341308594, 11.342255592346191, 13.046547889709473, 14.750840187072754, 16.45513343811035, 18.159425735473633, 19.863718032836914, 21.568010330200195, 23.272302627563477, 24.97659683227539, 26.680889129638672, 28.385181427001953, 30.089473724365234, 31.793766021728516, 33.4980583190918, 35.20235061645508, 36.90664291381836, 38.61093521118164, 40.31522750854492, 42.0195198059082, 43.72381591796875, 45.42810821533203, 47.13240051269531, 48.836692810058594, 50.540985107421875, 52.245277404785156, 53.94956970214844, 55.65386199951172, 57.358154296875, 59.06244659423828, 60.76673889160156]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 3.0, 8.0, 11.0, 11.0, 14.0, 18.0, 16.0, 27.0, 34.0, 32.0, 33.0, 21.0, 48.0, 36.0, 47.0, 38.0, 41.0, 45.0, 42.0, 33.0, 51.0, 41.0, 35.0, 39.0, 42.0, 36.0, 26.0, 23.0, 18.0, 24.0, 15.0, 19.0, 16.0, 16.0, 8.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.2794189453125, -6.051025390625, -5.8226318359375, -5.59423828125, -5.3658447265625, -5.137451171875, -4.9090576171875, -4.6806640625, -4.4522705078125, -4.223876953125, -3.9954833984375, -3.76708984375, -3.5386962890625, -3.310302734375, -3.0819091796875, -2.853515625, -2.6251220703125, -2.396728515625, -2.1683349609375, -1.93994140625, -1.7115478515625, -1.483154296875, -1.2547607421875, -1.0263671875, -0.7979736328125, -0.569580078125, -0.3411865234375, -0.11279296875, 0.1156005859375, 0.343994140625, 0.5723876953125, 0.80078125, 1.0291748046875, 1.257568359375, 1.4859619140625, 1.71435546875, 1.9427490234375, 2.171142578125, 2.3995361328125, 2.6279296875, 2.8563232421875, 3.084716796875, 3.3131103515625, 3.54150390625, 3.7698974609375, 3.998291015625, 4.2266845703125, 4.455078125, 4.6834716796875, 4.911865234375, 5.1402587890625, 5.36865234375, 5.5970458984375, 5.825439453125, 6.0538330078125, 6.2822265625, 6.5106201171875, 6.739013671875, 6.9674072265625, 7.19580078125, 7.4241943359375, 7.652587890625, 7.8809814453125, 8.109375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 4.0, 13.0, 6.0, 13.0, 10.0, 22.0, 24.0, 33.0, 17.0, 48.0, 42.0, 66.0, 110.0, 220.0, 603.0, 2116.0, 20680.0, 1442369.0, 2674540.0, 48384.0, 3341.0, 813.0, 309.0, 159.0, 80.0, 39.0, 40.0, 33.0, 18.0, 17.0, 19.0, 17.0, 18.0, 11.0, 10.0, 10.0, 6.0, 1.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.63671875, -20.8671875, -20.09765625, -19.328125, -18.55859375, -17.7890625, -17.01953125, -16.25, -15.48046875, -14.7109375, -13.94140625, -13.171875, -12.40234375, -11.6328125, -10.86328125, -10.09375, -9.32421875, -8.5546875, -7.78515625, -7.015625, -6.24609375, -5.4765625, -4.70703125, -3.9375, -3.16796875, -2.3984375, -1.62890625, -0.859375, -0.08984375, 0.6796875, 1.44921875, 2.21875, 2.98828125, 3.7578125, 4.52734375, 5.296875, 6.06640625, 6.8359375, 7.60546875, 8.375, 9.14453125, 9.9140625, 10.68359375, 11.453125, 12.22265625, 12.9921875, 13.76171875, 14.53125, 15.30078125, 16.0703125, 16.83984375, 17.609375, 18.37890625, 19.1484375, 19.91796875, 20.6875, 21.45703125, 22.2265625, 22.99609375, 23.765625, 24.53515625, 25.3046875, 26.07421875, 26.84375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 14.0, 12.0, 13.0, 14.0, 36.0, 42.0, 46.0, 81.0, 99.0, 139.0, 214.0, 319.0, 456.0, 557.0, 570.0, 392.0, 316.0, 222.0, 149.0, 108.0, 85.0, 58.0, 37.0, 29.0, 25.0, 10.0, 11.0, 6.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.828125, -17.3585205078125, -16.888916015625, -16.4193115234375, -15.94970703125, -15.4801025390625, -15.010498046875, -14.5408935546875, -14.0712890625, -13.6016845703125, -13.132080078125, -12.6624755859375, -12.19287109375, -11.7232666015625, -11.253662109375, -10.7840576171875, -10.314453125, -9.8448486328125, -9.375244140625, -8.9056396484375, -8.43603515625, -7.9664306640625, -7.496826171875, -7.0272216796875, -6.5576171875, -6.0880126953125, -5.618408203125, -5.1488037109375, -4.67919921875, -4.2095947265625, -3.739990234375, -3.2703857421875, -2.80078125, -2.3311767578125, -1.861572265625, -1.3919677734375, -0.92236328125, -0.4527587890625, 0.016845703125, 0.4864501953125, 0.9560546875, 1.4256591796875, 1.895263671875, 2.3648681640625, 2.83447265625, 3.3040771484375, 3.773681640625, 4.2432861328125, 4.712890625, 5.1824951171875, 5.652099609375, 6.1217041015625, 6.59130859375, 7.0609130859375, 7.530517578125, 8.0001220703125, 8.4697265625, 8.9393310546875, 9.408935546875, 9.8785400390625, 10.34814453125, 10.8177490234375, 11.287353515625, 11.7569580078125, 12.2265625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 19.0, 22.0, 36.0, 44.0, 67.0, 86.0, 124.0, 165.0, 232.0, 322.0, 523.0, 1701.0, 4063190.0, 125500.0, 856.0, 397.0, 269.0, 176.0, 137.0, 104.0, 80.0, 67.0, 49.0, 29.0, 29.0, 20.0, 9.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.875, -107.8623046875, -104.849609375, -101.8369140625, -98.82421875, -95.8115234375, -92.798828125, -89.7861328125, -86.7734375, -83.7607421875, -80.748046875, -77.7353515625, -74.72265625, -71.7099609375, -68.697265625, -65.6845703125, -62.671875, -59.6591796875, -56.646484375, -53.6337890625, -50.62109375, -47.6083984375, -44.595703125, -41.5830078125, -38.5703125, -35.5576171875, -32.544921875, -29.5322265625, -26.51953125, -23.5068359375, -20.494140625, -17.4814453125, -14.46875, -11.4560546875, -8.443359375, -5.4306640625, -2.41796875, 0.5947265625, 3.607421875, 6.6201171875, 9.6328125, 12.6455078125, 15.658203125, 18.6708984375, 21.68359375, 24.6962890625, 27.708984375, 30.7216796875, 33.734375, 36.7470703125, 39.759765625, 42.7724609375, 45.78515625, 48.7978515625, 51.810546875, 54.8232421875, 57.8359375, 60.8486328125, 63.861328125, 66.8740234375, 69.88671875, 72.8994140625, 75.912109375, 78.9248046875, 81.9375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 164.0, 574.0, 249.0, 22.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.2158508300781, -278.1891784667969, -271.1625061035156, -264.1358337402344, -257.1091613769531, -250.0824737548828, -243.05580139160156, -236.0291290283203, -229.00245666503906, -221.9757843017578, -214.94911193847656, -207.92242431640625, -200.895751953125, -193.86907958984375, -186.8424072265625, -179.81573486328125, -172.7890625, -165.76239013671875, -158.7357177734375, -151.70904541015625, -144.68235778808594, -137.6556854248047, -130.62901306152344, -123.60234069824219, -116.57565307617188, -109.54898071289062, -102.52230072021484, -95.4956283569336, -88.46895599365234, -81.44227600097656, -74.41560363769531, -67.38893127441406, -60.36225891113281, -53.3355827331543, -46.30891036987305, -39.28223419189453, -32.25556182861328, -25.228885650634766, -18.20220947265625, -11.175537109375, -4.148860931396484, 2.8778138160705566, 9.904488563537598, 16.931163787841797, 23.95783805847168, 30.984512329101562, 38.01118850708008, 45.03786087036133, 52.064537048339844, 59.09121322631836, 66.11788940429688, 73.14456176757812, 80.17123413085938, 87.19790649414062, 94.2245864868164, 101.25125885009766, 108.27793884277344, 115.30461120605469, 122.33129119873047, 129.35797119140625, 136.3846435546875, 143.41131591796875, 150.43798828125, 157.46466064453125, 164.4913330078125]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 7.0, 15.0, 10.0, 15.0, 15.0, 11.0, 24.0, 17.0, 27.0, 32.0, 25.0, 21.0, 43.0, 36.0, 26.0, 37.0, 33.0, 35.0, 36.0, 48.0, 38.0, 36.0, 54.0, 47.0, 40.0, 30.0, 28.0, 28.0, 23.0, 21.0, 25.0, 17.0, 8.0, 16.0, 15.0, 14.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.587913513183594, -39.29560470581055, -38.003292083740234, -36.71098327636719, -35.41867446899414, -34.12636184692383, -32.83405303955078, -31.5417423248291, -30.249431610107422, -28.957120895385742, -27.664812088012695, -26.372501373291016, -25.080190658569336, -23.787879943847656, -22.49557113647461, -21.20326042175293, -19.910951614379883, -18.618640899658203, -17.326332092285156, -16.034021377563477, -14.741710662841797, -13.449400901794434, -12.15709114074707, -10.86478042602539, -9.572470664978027, -8.280160903930664, -6.987850189208984, -5.695540428161621, -4.4032301902771, -3.110919952392578, -1.8186101913452148, -0.5262994766235352, 0.7660102844238281, 2.0583205223083496, 3.350630521774292, 4.642940521240234, 5.935250759124756, 7.227560997009277, 8.51987075805664, 9.81218147277832, 11.104491233825684, 12.396800994873047, 13.689111709594727, 14.98142147064209, 16.273731231689453, 17.566041946411133, 18.858352661132812, 20.15066146850586, 21.44297218322754, 22.73528289794922, 24.027591705322266, 25.319902420043945, 26.612213134765625, 27.904521942138672, 29.19683265686035, 30.48914337158203, 31.781452178955078, 33.073760986328125, 34.36607360839844, 35.658382415771484, 36.95069122314453, 38.243003845214844, 39.53531265258789, 40.82762145996094, 42.11993408203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 8.0, 15.0, 13.0, 12.0, 15.0, 11.0, 23.0, 28.0, 33.0, 32.0, 31.0, 39.0, 42.0, 30.0, 48.0, 35.0, 37.0, 36.0, 35.0, 42.0, 56.0, 41.0, 35.0, 26.0, 24.0, 21.0, 32.0, 26.0, 27.0, 20.0, 29.0, 11.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 7.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.473876953125, -6.26416015625, -6.054443359375, -5.8447265625, -5.635009765625, -5.42529296875, -5.215576171875, -5.005859375, -4.796142578125, -4.58642578125, -4.376708984375, -4.1669921875, -3.957275390625, -3.74755859375, -3.537841796875, -3.328125, -3.118408203125, -2.90869140625, -2.698974609375, -2.4892578125, -2.279541015625, -2.06982421875, -1.860107421875, -1.650390625, -1.440673828125, -1.23095703125, -1.021240234375, -0.8115234375, -0.601806640625, -0.39208984375, -0.182373046875, 0.02734375, 0.237060546875, 0.44677734375, 0.656494140625, 0.8662109375, 1.075927734375, 1.28564453125, 1.495361328125, 1.705078125, 1.914794921875, 2.12451171875, 2.334228515625, 2.5439453125, 2.753662109375, 2.96337890625, 3.173095703125, 3.3828125, 3.592529296875, 3.80224609375, 4.011962890625, 4.2216796875, 4.431396484375, 4.64111328125, 4.850830078125, 5.060546875, 5.270263671875, 5.47998046875, 5.689697265625, 5.8994140625, 6.109130859375, 6.31884765625, 6.528564453125, 6.73828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 5.0, 11.0, 14.0, 15.0, 37.0, 42.0, 55.0, 103.0, 116.0, 186.0, 268.0, 370.0, 499.0, 701.0, 995.0, 1431.0, 2021.0, 2871.0, 4241.0, 6083.0, 8718.0, 12652.0, 18859.0, 29384.0, 45377.0, 72180.0, 115096.0, 191436.0, 198293.0, 121336.0, 75060.0, 47404.0, 29989.0, 20092.0, 13219.0, 8885.0, 6005.0, 4349.0, 2995.0, 2126.0, 1541.0, 1089.0, 713.0, 547.0, 353.0, 240.0, 177.0, 107.0, 79.0, 59.0, 49.0, 24.0, 18.0, 16.0, 17.0, 5.0, 8.0, 3.0, 2.0, 2.0], "bins": [-0.89111328125, -0.8633041381835938, -0.8354949951171875, -0.8076858520507812, -0.779876708984375, -0.7520675659179688, -0.7242584228515625, -0.6964492797851562, -0.66864013671875, -0.6408309936523438, -0.6130218505859375, -0.5852127075195312, -0.557403564453125, -0.5295944213867188, -0.5017852783203125, -0.47397613525390625, -0.4461669921875, -0.41835784912109375, -0.3905487060546875, -0.36273956298828125, -0.334930419921875, -0.30712127685546875, -0.2793121337890625, -0.25150299072265625, -0.22369384765625, -0.19588470458984375, -0.1680755615234375, -0.14026641845703125, -0.112457275390625, -0.08464813232421875, -0.0568389892578125, -0.02902984619140625, -0.001220703125, 0.02658843994140625, 0.0543975830078125, 0.08220672607421875, 0.110015869140625, 0.13782501220703125, 0.1656341552734375, 0.19344329833984375, 0.22125244140625, 0.24906158447265625, 0.2768707275390625, 0.30467987060546875, 0.332489013671875, 0.36029815673828125, 0.3881072998046875, 0.41591644287109375, 0.4437255859375, 0.47153472900390625, 0.4993438720703125, 0.5271530151367188, 0.554962158203125, 0.5827713012695312, 0.6105804443359375, 0.6383895874023438, 0.66619873046875, 0.6940078735351562, 0.7218170166015625, 0.7496261596679688, 0.777435302734375, 0.8052444458007812, 0.8330535888671875, 0.8608627319335938, 0.888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 9.0, 4.0, 7.0, 4.0, 4.0, 8.0, 10.0, 9.0, 10.0, 19.0, 19.0, 20.0, 13.0, 28.0, 20.0, 23.0, 20.0, 24.0, 21.0, 26.0, 28.0, 28.0, 32.0, 38.0, 27.0, 1052.0, 27.0, 29.0, 38.0, 36.0, 22.0, 31.0, 41.0, 32.0, 23.0, 28.0, 26.0, 23.0, 25.0, 18.0, 28.0, 21.0, 6.0, 18.0, 11.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.123046875, -3.01348876953125, -2.9039306640625, -2.79437255859375, -2.684814453125, -2.57525634765625, -2.4656982421875, -2.35614013671875, -2.24658203125, -2.13702392578125, -2.0274658203125, -1.91790771484375, -1.808349609375, -1.69879150390625, -1.5892333984375, -1.47967529296875, -1.3701171875, -1.26055908203125, -1.1510009765625, -1.04144287109375, -0.931884765625, -0.82232666015625, -0.7127685546875, -0.60321044921875, -0.49365234375, -0.38409423828125, -0.2745361328125, -0.16497802734375, -0.055419921875, 0.05413818359375, 0.1636962890625, 0.27325439453125, 0.3828125, 0.49237060546875, 0.6019287109375, 0.71148681640625, 0.821044921875, 0.93060302734375, 1.0401611328125, 1.14971923828125, 1.25927734375, 1.36883544921875, 1.4783935546875, 1.58795166015625, 1.697509765625, 1.80706787109375, 1.9166259765625, 2.02618408203125, 2.1357421875, 2.24530029296875, 2.3548583984375, 2.46441650390625, 2.573974609375, 2.68353271484375, 2.7930908203125, 2.90264892578125, 3.01220703125, 3.12176513671875, 3.2313232421875, 3.34088134765625, 3.450439453125, 3.55999755859375, 3.6695556640625, 3.77911376953125, 3.888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 7.0, 15.0, 13.0, 23.0, 33.0, 43.0, 76.0, 86.0, 165.0, 213.0, 314.0, 485.0, 682.0, 918.0, 1274.0, 1900.0, 2636.0, 3690.0, 5464.0, 7725.0, 11066.0, 15582.0, 23066.0, 34593.0, 51036.0, 79182.0, 126756.0, 1258390.0, 169149.0, 100755.0, 65098.0, 42784.0, 28927.0, 19746.0, 13450.0, 9479.0, 6679.0, 4618.0, 3335.0, 2235.0, 1643.0, 1184.0, 770.0, 597.0, 385.0, 272.0, 197.0, 134.0, 91.0, 55.0, 38.0, 37.0, 23.0, 6.0, 10.0, 4.0, 2.0, 2.0], "bins": [-0.8681640625, -0.8424606323242188, -0.8167572021484375, -0.7910537719726562, -0.765350341796875, -0.7396469116210938, -0.7139434814453125, -0.6882400512695312, -0.66253662109375, -0.6368331909179688, -0.6111297607421875, -0.5854263305664062, -0.559722900390625, -0.5340194702148438, -0.5083160400390625, -0.48261260986328125, -0.4569091796875, -0.43120574951171875, -0.4055023193359375, -0.37979888916015625, -0.354095458984375, -0.32839202880859375, -0.3026885986328125, -0.27698516845703125, -0.25128173828125, -0.22557830810546875, -0.1998748779296875, -0.17417144775390625, -0.148468017578125, -0.12276458740234375, -0.0970611572265625, -0.07135772705078125, -0.045654296875, -0.01995086669921875, 0.0057525634765625, 0.03145599365234375, 0.057159423828125, 0.08286285400390625, 0.1085662841796875, 0.13426971435546875, 0.15997314453125, 0.18567657470703125, 0.2113800048828125, 0.23708343505859375, 0.262786865234375, 0.28849029541015625, 0.3141937255859375, 0.33989715576171875, 0.3656005859375, 0.39130401611328125, 0.4170074462890625, 0.44271087646484375, 0.468414306640625, 0.49411773681640625, 0.5198211669921875, 0.5455245971679688, 0.57122802734375, 0.5969314575195312, 0.6226348876953125, 0.6483383178710938, 0.674041748046875, 0.6997451782226562, 0.7254486083984375, 0.7511520385742188, 0.77685546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 6.0, 10.0, 14.0, 19.0, 24.0, 26.0, 20.0, 37.0, 38.0, 26.0, 45.0, 64.0, 52.0, 74.0, 63.0, 65.0, 58.0, 54.0, 50.0, 39.0, 30.0, 33.0, 24.0, 28.0, 25.0, 8.0, 16.0, 5.0, 8.0, 7.0, 9.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0006403923034667969, -0.0006232447922229767, -0.0006060972809791565, -0.0005889497697353363, -0.0005718022584915161, -0.0005546547472476959, -0.0005375072360038757, -0.0005203597247600555, -0.0005032122135162354, -0.00048606470227241516, -0.00046891719102859497, -0.0004517696797847748, -0.0004346221685409546, -0.0004174746572971344, -0.0004003271460533142, -0.000383179634809494, -0.00036603212356567383, -0.00034888461232185364, -0.00033173710107803345, -0.00031458958983421326, -0.00029744207859039307, -0.0002802945673465729, -0.0002631470561027527, -0.0002459995448589325, -0.0002288520336151123, -0.00021170452237129211, -0.00019455701112747192, -0.00017740949988365173, -0.00016026198863983154, -0.00014311447739601135, -0.00012596696615219116, -0.00010881945490837097, -9.167194366455078e-05, -7.452443242073059e-05, -5.73769211769104e-05, -4.022940993309021e-05, -2.308189868927002e-05, -5.934387445449829e-06, 1.1213123798370361e-05, 2.8360635042190552e-05, 4.550814628601074e-05, 6.265565752983093e-05, 7.980316877365112e-05, 9.695068001747131e-05, 0.0001140981912612915, 0.0001312457025051117, 0.00014839321374893188, 0.00016554072499275208, 0.00018268823623657227, 0.00019983574748039246, 0.00021698325872421265, 0.00023413076996803284, 0.00025127828121185303, 0.0002684257924556732, 0.0002855733036994934, 0.0003027208149433136, 0.0003198683261871338, 0.000337015837430954, 0.00035416334867477417, 0.00037131085991859436, 0.00038845837116241455, 0.00040560588240623474, 0.00042275339365005493, 0.0004399009048938751, 0.0004570484161376953]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 11.0, 3.0, 7.0, 11.0, 16.0, 17.0, 24.0, 22.0, 35.0, 26.0, 43.0, 44.0, 63.0, 92.0, 149.0, 243.0, 594.0, 4455.0, 1032496.0, 8656.0, 703.0, 259.0, 140.0, 94.0, 75.0, 51.0, 47.0, 31.0, 28.0, 23.0, 23.0, 14.0, 8.0, 15.0, 8.0, 4.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0107574462890625, -0.010380744934082031, -0.010004043579101562, -0.009627342224121094, -0.009250640869140625, -0.008873939514160156, -0.008497238159179688, -0.008120536804199219, -0.00774383544921875, -0.007367134094238281, -0.0069904327392578125, -0.006613731384277344, -0.006237030029296875, -0.005860328674316406, -0.0054836273193359375, -0.005106925964355469, -0.004730224609375, -0.004353523254394531, -0.0039768218994140625, -0.0036001205444335938, -0.003223419189453125, -0.0028467178344726562, -0.0024700164794921875, -0.0020933151245117188, -0.00171661376953125, -0.0013399124145507812, -0.0009632110595703125, -0.0005865097045898438, -0.000209808349609375, 0.00016689300537109375, 0.0005435943603515625, 0.0009202957153320312, 0.0012969970703125, 0.0016736984252929688, 0.0020503997802734375, 0.0024271011352539062, 0.002803802490234375, 0.0031805038452148438, 0.0035572052001953125, 0.003933906555175781, 0.00431060791015625, 0.004687309265136719, 0.0050640106201171875, 0.005440711975097656, 0.005817413330078125, 0.006194114685058594, 0.0065708160400390625, 0.006947517395019531, 0.00732421875, 0.007700920104980469, 0.008077621459960938, 0.008454322814941406, 0.008831024169921875, 0.009207725524902344, 0.009584426879882812, 0.009961128234863281, 0.01033782958984375, 0.010714530944824219, 0.011091232299804688, 0.011467933654785156, 0.011844635009765625, 0.012221336364746094, 0.012598037719726562, 0.012974739074707031, 0.0133514404296875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 37.0, 287.0, 506.0, 162.0, 16.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0024123857729136944, -0.0023662885650992393, -0.0023201913572847843, -0.0022740941494703293, -0.0022279969416558743, -0.0021818997338414192, -0.002135802526026964, -0.002089705318212509, -0.002043608110398054, -0.001997510902583599, -0.001951413694769144, -0.001905316486954689, -0.001859219279140234, -0.001813122071325779, -0.001767024863511324, -0.001720927655696869, -0.0016748305642977357, -0.0016287333564832807, -0.0015826361486688256, -0.0015365389408543706, -0.0014904417330399156, -0.0014443445252254605, -0.0013982474338263273, -0.0013521502260118723, -0.0013060530181974173, -0.0012599558103829622, -0.0012138586025685072, -0.0011677613947540522, -0.0011216641869395971, -0.001075566979125142, -0.001029469771310687, -0.000983372563496232, -0.0009372754138894379, -0.0008911782060749829, -0.0008450809982605278, -0.0007989838486537337, -0.0007528866408392787, -0.0007067894330248237, -0.0006606922252103686, -0.0006145950173959136, -0.0005684978095814586, -0.0005224006017670035, -0.0004763033939525485, -0.00043020621524192393, -0.0003841090074274689, -0.00033801179961301386, -0.0002919146209023893, -0.00024581741308793426, -0.00019972020527347922, -0.0001536229974590242, -0.00010752580419648439, -6.142861093394458e-05, -1.533140311948955e-05, 3.076580469496548e-05, 7.686298340559006e-05, 0.0001229601912200451, 0.00016905739903450012, 0.00021515460684895515, 0.0002612518146634102, 0.00030734899337403476, 0.0003534462011884898, 0.0003995434090029448, 0.0004456405877135694, 0.0004917377955280244, 0.0005378350033424795]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 5.0, 11.0, 8.0, 13.0, 12.0, 18.0, 17.0, 15.0, 20.0, 27.0, 23.0, 29.0, 30.0, 25.0, 36.0, 36.0, 36.0, 33.0, 58.0, 35.0, 36.0, 43.0, 44.0, 33.0, 42.0, 45.0, 27.0, 28.0, 20.0, 30.0, 20.0, 19.0, 14.0, 17.0, 15.0, 10.0, 11.0, 13.0, 6.0, 10.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00025594234466552734, -0.0002481583505868912, -0.000240374356508255, -0.00023259036242961884, -0.00022480636835098267, -0.0002170223742723465, -0.00020923838019371033, -0.00020145438611507416, -0.000193670392036438, -0.00018588639795780182, -0.00017810240387916565, -0.00017031840980052948, -0.0001625344157218933, -0.00015475042164325714, -0.00014696642756462097, -0.0001391824334859848, -0.00013139843940734863, -0.00012361444532871246, -0.0001158304512500763, -0.00010804645717144012, -0.00010026246309280396, -9.247846901416779e-05, -8.469447493553162e-05, -7.691048085689545e-05, -6.912648677825928e-05, -6.134249269962311e-05, -5.355849862098694e-05, -4.577450454235077e-05, -3.79905104637146e-05, -3.020651638507843e-05, -2.242252230644226e-05, -1.4638528227806091e-05, -6.854534149169922e-06, 9.294599294662476e-07, 8.713454008102417e-06, 1.6497448086738586e-05, 2.4281442165374756e-05, 3.2065436244010925e-05, 3.9849430322647095e-05, 4.7633424401283264e-05, 5.5417418479919434e-05, 6.32014125585556e-05, 7.098540663719177e-05, 7.876940071582794e-05, 8.655339479446411e-05, 9.433738887310028e-05, 0.00010212138295173645, 0.00010990537703037262, 0.00011768937110900879, 0.00012547336518764496, 0.00013325735926628113, 0.0001410413533449173, 0.00014882534742355347, 0.00015660934150218964, 0.0001643933355808258, 0.00017217732965946198, 0.00017996132373809814, 0.00018774531781673431, 0.00019552931189537048, 0.00020331330597400665, 0.00021109730005264282, 0.000218881294131279, 0.00022666528820991516, 0.00023444928228855133, 0.0002422332763671875]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 8.0, 15.0, 13.0, 12.0, 15.0, 11.0, 23.0, 28.0, 33.0, 32.0, 31.0, 39.0, 42.0, 30.0, 48.0, 35.0, 37.0, 36.0, 35.0, 42.0, 56.0, 41.0, 35.0, 26.0, 24.0, 21.0, 32.0, 26.0, 27.0, 20.0, 29.0, 11.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 7.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.473876953125, -6.26416015625, -6.054443359375, -5.8447265625, -5.635009765625, -5.42529296875, -5.215576171875, -5.005859375, -4.796142578125, -4.58642578125, -4.376708984375, -4.1669921875, -3.957275390625, -3.74755859375, -3.537841796875, -3.328125, -3.118408203125, -2.90869140625, -2.698974609375, -2.4892578125, -2.279541015625, -2.06982421875, -1.860107421875, -1.650390625, -1.440673828125, -1.23095703125, -1.021240234375, -0.8115234375, -0.601806640625, -0.39208984375, -0.182373046875, 0.02734375, 0.237060546875, 0.44677734375, 0.656494140625, 0.8662109375, 1.075927734375, 1.28564453125, 1.495361328125, 1.705078125, 1.914794921875, 2.12451171875, 2.334228515625, 2.5439453125, 2.753662109375, 2.96337890625, 3.173095703125, 3.3828125, 3.592529296875, 3.80224609375, 4.011962890625, 4.2216796875, 4.431396484375, 4.64111328125, 4.850830078125, 5.060546875, 5.270263671875, 5.47998046875, 5.689697265625, 5.8994140625, 6.109130859375, 6.31884765625, 6.528564453125, 6.73828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 7.0, 10.0, 18.0, 14.0, 28.0, 41.0, 50.0, 64.0, 87.0, 103.0, 133.0, 176.0, 316.0, 546.0, 1190.0, 2891.0, 8457.0, 27007.0, 87651.0, 316758.0, 432949.0, 116460.0, 35437.0, 11276.0, 3724.0, 1384.0, 636.0, 300.0, 221.0, 142.0, 120.0, 82.0, 59.0, 51.0, 29.0, 38.0, 27.0, 12.0, 7.0, 9.0, 5.0, 10.0, 6.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.9609375, -6.74420166015625, -6.5274658203125, -6.31072998046875, -6.093994140625, -5.87725830078125, -5.6605224609375, -5.44378662109375, -5.22705078125, -5.01031494140625, -4.7935791015625, -4.57684326171875, -4.360107421875, -4.14337158203125, -3.9266357421875, -3.70989990234375, -3.4931640625, -3.27642822265625, -3.0596923828125, -2.84295654296875, -2.626220703125, -2.40948486328125, -2.1927490234375, -1.97601318359375, -1.75927734375, -1.54254150390625, -1.3258056640625, -1.10906982421875, -0.892333984375, -0.67559814453125, -0.4588623046875, -0.24212646484375, -0.025390625, 0.19134521484375, 0.4080810546875, 0.62481689453125, 0.841552734375, 1.05828857421875, 1.2750244140625, 1.49176025390625, 1.70849609375, 1.92523193359375, 2.1419677734375, 2.35870361328125, 2.575439453125, 2.79217529296875, 3.0089111328125, 3.22564697265625, 3.4423828125, 3.65911865234375, 3.8758544921875, 4.09259033203125, 4.309326171875, 4.52606201171875, 4.7427978515625, 4.95953369140625, 5.17626953125, 5.39300537109375, 5.6097412109375, 5.82647705078125, 6.043212890625, 6.25994873046875, 6.4766845703125, 6.69342041015625, 6.91015625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 7.0, 9.0, 11.0, 17.0, 23.0, 26.0, 30.0, 30.0, 31.0, 46.0, 45.0, 32.0, 50.0, 74.0, 119.0, 1814.0, 237.0, 68.0, 49.0, 49.0, 43.0, 36.0, 35.0, 24.0, 26.0, 30.0, 21.0, 15.0, 22.0, 14.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.25, -28.43115234375, -27.6123046875, -26.79345703125, -25.974609375, -25.15576171875, -24.3369140625, -23.51806640625, -22.69921875, -21.88037109375, -21.0615234375, -20.24267578125, -19.423828125, -18.60498046875, -17.7861328125, -16.96728515625, -16.1484375, -15.32958984375, -14.5107421875, -13.69189453125, -12.873046875, -12.05419921875, -11.2353515625, -10.41650390625, -9.59765625, -8.77880859375, -7.9599609375, -7.14111328125, -6.322265625, -5.50341796875, -4.6845703125, -3.86572265625, -3.046875, -2.22802734375, -1.4091796875, -0.59033203125, 0.228515625, 1.04736328125, 1.8662109375, 2.68505859375, 3.50390625, 4.32275390625, 5.1416015625, 5.96044921875, 6.779296875, 7.59814453125, 8.4169921875, 9.23583984375, 10.0546875, 10.87353515625, 11.6923828125, 12.51123046875, 13.330078125, 14.14892578125, 14.9677734375, 15.78662109375, 16.60546875, 17.42431640625, 18.2431640625, 19.06201171875, 19.880859375, 20.69970703125, 21.5185546875, 22.33740234375, 23.15625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 10.0, 6.0, 8.0, 20.0, 23.0, 62.0, 61.0, 81.0, 121.0, 179.0, 297.0, 606.0, 3398.0, 3129633.0, 9421.0, 817.0, 349.0, 201.0, 119.0, 98.0, 61.0, 44.0, 29.0, 23.0, 13.0, 10.0, 8.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.75, -68.2763671875, -65.802734375, -63.3291015625, -60.85546875, -58.3818359375, -55.908203125, -53.4345703125, -50.9609375, -48.4873046875, -46.013671875, -43.5400390625, -41.06640625, -38.5927734375, -36.119140625, -33.6455078125, -31.171875, -28.6982421875, -26.224609375, -23.7509765625, -21.27734375, -18.8037109375, -16.330078125, -13.8564453125, -11.3828125, -8.9091796875, -6.435546875, -3.9619140625, -1.48828125, 0.9853515625, 3.458984375, 5.9326171875, 8.40625, 10.8798828125, 13.353515625, 15.8271484375, 18.30078125, 20.7744140625, 23.248046875, 25.7216796875, 28.1953125, 30.6689453125, 33.142578125, 35.6162109375, 38.08984375, 40.5634765625, 43.037109375, 45.5107421875, 47.984375, 50.4580078125, 52.931640625, 55.4052734375, 57.87890625, 60.3525390625, 62.826171875, 65.2998046875, 67.7734375, 70.2470703125, 72.720703125, 75.1943359375, 77.66796875, 80.1416015625, 82.615234375, 85.0888671875, 87.5625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 41.0, 667.0, 294.0, 11.0, 1.0, 0.0, 1.0], "bins": [-240.0944366455078, -236.007080078125, -231.91973876953125, -227.83238220214844, -223.74502563476562, -219.65768432617188, -215.57032775878906, -211.48297119140625, -207.3956298828125, -203.3082733154297, -199.22093200683594, -195.13357543945312, -191.0462188720703, -186.9588623046875, -182.87152099609375, -178.78416442871094, -174.69680786132812, -170.6094512939453, -166.52210998535156, -162.43475341796875, -158.34739685058594, -154.26004028320312, -150.17269897460938, -146.08534240722656, -141.99798583984375, -137.91062927246094, -133.8232879638672, -129.73593139648438, -125.64857482910156, -121.56122589111328, -117.473876953125, -113.38652038574219, -109.29917907714844, -105.21183013916016, -101.12447357177734, -97.03712463378906, -92.94976806640625, -88.86241912841797, -84.77507019042969, -80.68771362304688, -76.6003646850586, -72.51301574707031, -68.4256591796875, -64.33831024169922, -60.25095748901367, -56.163604736328125, -52.076255798339844, -47.9889030456543, -43.90155029296875, -39.8141975402832, -35.726844787597656, -31.639495849609375, -27.552143096923828, -23.46479034423828, -19.377439498901367, -15.290088653564453, -11.202737808227539, -7.115386009216309, -3.028034210205078, 1.0593175888061523, 5.146669387817383, 9.23402214050293, 13.321372985839844, 17.408723831176758, 21.496076583862305]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 6.0, 9.0, 11.0, 15.0, 12.0, 6.0, 23.0, 20.0, 26.0, 25.0, 21.0, 24.0, 41.0, 27.0, 35.0, 36.0, 46.0, 38.0, 40.0, 50.0, 42.0, 41.0, 41.0, 38.0, 37.0, 34.0, 27.0, 39.0, 17.0, 23.0, 23.0, 23.0, 15.0, 9.0, 13.0, 13.0, 11.0, 5.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-59.17918395996094, -57.40391540527344, -55.62864685058594, -53.8533821105957, -52.0781135559082, -50.3028450012207, -48.52758026123047, -46.75231170654297, -44.97704315185547, -43.20177459716797, -41.42650604248047, -39.651241302490234, -37.875972747802734, -36.100704193115234, -34.325439453125, -32.5501708984375, -30.77490234375, -28.9996337890625, -27.224367141723633, -25.449100494384766, -23.673831939697266, -21.898563385009766, -20.1232967376709, -18.34803009033203, -16.57276153564453, -14.797493934631348, -13.022226333618164, -11.24695873260498, -9.471691131591797, -7.696423530578613, -5.92115592956543, -4.145888328552246, -2.370624542236328, -0.5953569412231445, 1.179910659790039, 2.9551782608032227, 4.730445861816406, 6.50571346282959, 8.280981063842773, 10.056248664855957, 11.83151626586914, 13.606783866882324, 15.382051467895508, 17.157318115234375, 18.932586669921875, 20.707855224609375, 22.483121871948242, 24.25838851928711, 26.03365707397461, 27.80892562866211, 29.584192276000977, 31.359458923339844, 33.134727478027344, 34.909996032714844, 36.685264587402344, 38.46052932739258, 40.23579788208008, 42.01106643676758, 43.78633117675781, 45.56159973144531, 47.33686828613281, 49.11213684082031, 50.88740539550781, 52.66267013549805, 54.43793869018555]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 7.0, 8.0, 9.0, 12.0, 17.0, 19.0, 14.0, 12.0, 26.0, 28.0, 33.0, 37.0, 39.0, 27.0, 39.0, 39.0, 33.0, 39.0, 30.0, 34.0, 43.0, 36.0, 45.0, 37.0, 42.0, 26.0, 21.0, 29.0, 28.0, 21.0, 25.0, 20.0, 21.0, 17.0, 16.0, 12.0, 6.0, 10.0, 7.0, 4.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.7109375, -6.50421142578125, -6.2974853515625, -6.09075927734375, -5.884033203125, -5.67730712890625, -5.4705810546875, -5.26385498046875, -5.05712890625, -4.85040283203125, -4.6436767578125, -4.43695068359375, -4.230224609375, -4.02349853515625, -3.8167724609375, -3.61004638671875, -3.4033203125, -3.19659423828125, -2.9898681640625, -2.78314208984375, -2.576416015625, -2.36968994140625, -2.1629638671875, -1.95623779296875, -1.74951171875, -1.54278564453125, -1.3360595703125, -1.12933349609375, -0.922607421875, -0.71588134765625, -0.5091552734375, -0.30242919921875, -0.095703125, 0.11102294921875, 0.3177490234375, 0.52447509765625, 0.731201171875, 0.93792724609375, 1.1446533203125, 1.35137939453125, 1.55810546875, 1.76483154296875, 1.9715576171875, 2.17828369140625, 2.385009765625, 2.59173583984375, 2.7984619140625, 3.00518798828125, 3.2119140625, 3.41864013671875, 3.6253662109375, 3.83209228515625, 4.038818359375, 4.24554443359375, 4.4522705078125, 4.65899658203125, 4.86572265625, 5.07244873046875, 5.2791748046875, 5.48590087890625, 5.692626953125, 5.89935302734375, 6.1060791015625, 6.31280517578125, 6.51953125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 6.0, 5.0, 9.0, 6.0, 9.0, 18.0, 12.0, 19.0, 19.0, 31.0, 48.0, 60.0, 75.0, 91.0, 156.0, 202.0, 415.0, 1106.0, 6842.0, 290235.0, 3570370.0, 314713.0, 7392.0, 1223.0, 417.0, 229.0, 126.0, 97.0, 71.0, 63.0, 42.0, 48.0, 23.0, 20.0, 16.0, 8.0, 13.0, 8.0, 7.0, 8.0, 6.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.015625, -24.290771484375, -23.56591796875, -22.841064453125, -22.1162109375, -21.391357421875, -20.66650390625, -19.941650390625, -19.216796875, -18.491943359375, -17.76708984375, -17.042236328125, -16.3173828125, -15.592529296875, -14.86767578125, -14.142822265625, -13.41796875, -12.693115234375, -11.96826171875, -11.243408203125, -10.5185546875, -9.793701171875, -9.06884765625, -8.343994140625, -7.619140625, -6.894287109375, -6.16943359375, -5.444580078125, -4.7197265625, -3.994873046875, -3.27001953125, -2.545166015625, -1.8203125, -1.095458984375, -0.37060546875, 0.354248046875, 1.0791015625, 1.803955078125, 2.52880859375, 3.253662109375, 3.978515625, 4.703369140625, 5.42822265625, 6.153076171875, 6.8779296875, 7.602783203125, 8.32763671875, 9.052490234375, 9.77734375, 10.502197265625, 11.22705078125, 11.951904296875, 12.6767578125, 13.401611328125, 14.12646484375, 14.851318359375, 15.576171875, 16.301025390625, 17.02587890625, 17.750732421875, 18.4755859375, 19.200439453125, 19.92529296875, 20.650146484375, 21.375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 18.0, 26.0, 38.0, 51.0, 75.0, 77.0, 101.0, 156.0, 230.0, 349.0, 528.0, 580.0, 580.0, 411.0, 252.0, 180.0, 127.0, 86.0, 49.0, 51.0, 30.0, 16.0, 9.0, 13.0, 9.0, 0.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7109375, -14.244873046875, -13.77880859375, -13.312744140625, -12.8466796875, -12.380615234375, -11.91455078125, -11.448486328125, -10.982421875, -10.516357421875, -10.05029296875, -9.584228515625, -9.1181640625, -8.652099609375, -8.18603515625, -7.719970703125, -7.25390625, -6.787841796875, -6.32177734375, -5.855712890625, -5.3896484375, -4.923583984375, -4.45751953125, -3.991455078125, -3.525390625, -3.059326171875, -2.59326171875, -2.127197265625, -1.6611328125, -1.195068359375, -0.72900390625, -0.262939453125, 0.203125, 0.669189453125, 1.13525390625, 1.601318359375, 2.0673828125, 2.533447265625, 2.99951171875, 3.465576171875, 3.931640625, 4.397705078125, 4.86376953125, 5.329833984375, 5.7958984375, 6.261962890625, 6.72802734375, 7.194091796875, 7.66015625, 8.126220703125, 8.59228515625, 9.058349609375, 9.5244140625, 9.990478515625, 10.45654296875, 10.922607421875, 11.388671875, 11.854736328125, 12.32080078125, 12.786865234375, 13.2529296875, 13.718994140625, 14.18505859375, 14.651123046875, 15.1171875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 13.0, 12.0, 16.0, 30.0, 32.0, 53.0, 49.0, 103.0, 104.0, 124.0, 182.0, 255.0, 347.0, 610.0, 3026.0, 4030765.0, 155985.0, 974.0, 373.0, 279.0, 213.0, 135.0, 113.0, 98.0, 85.0, 64.0, 54.0, 50.0, 29.0, 38.0, 14.0, 12.0, 11.0, 13.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.4375, -75.8896484375, -73.341796875, -70.7939453125, -68.24609375, -65.6982421875, -63.150390625, -60.6025390625, -58.0546875, -55.5068359375, -52.958984375, -50.4111328125, -47.86328125, -45.3154296875, -42.767578125, -40.2197265625, -37.671875, -35.1240234375, -32.576171875, -30.0283203125, -27.48046875, -24.9326171875, -22.384765625, -19.8369140625, -17.2890625, -14.7412109375, -12.193359375, -9.6455078125, -7.09765625, -4.5498046875, -2.001953125, 0.5458984375, 3.09375, 5.6416015625, 8.189453125, 10.7373046875, 13.28515625, 15.8330078125, 18.380859375, 20.9287109375, 23.4765625, 26.0244140625, 28.572265625, 31.1201171875, 33.66796875, 36.2158203125, 38.763671875, 41.3115234375, 43.859375, 46.4072265625, 48.955078125, 51.5029296875, 54.05078125, 56.5986328125, 59.146484375, 61.6943359375, 64.2421875, 66.7900390625, 69.337890625, 71.8857421875, 74.43359375, 76.9814453125, 79.529296875, 82.0771484375, 84.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 43.0, 274.0, 447.0, 204.0, 34.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.85195922851562, -217.94973754882812, -213.04751586914062, -208.14529418945312, -203.24307250976562, -198.3408660888672, -193.4386444091797, -188.5364227294922, -183.6342010498047, -178.7319793701172, -173.8297576904297, -168.9275360107422, -164.02532958984375, -159.12310791015625, -154.22088623046875, -149.31866455078125, -144.41644287109375, -139.51422119140625, -134.61199951171875, -129.70977783203125, -124.80756378173828, -119.90534210205078, -115.00312805175781, -110.10090637207031, -105.19868469238281, -100.29646301269531, -95.39424133300781, -90.49202728271484, -85.58980560302734, -80.68758392333984, -75.78536987304688, -70.88314819335938, -65.9809341430664, -61.078712463378906, -56.17649459838867, -51.27427673339844, -46.37205505371094, -41.46983337402344, -36.5676155090332, -31.66539764404297, -26.76317596435547, -21.8609561920166, -16.958736419677734, -12.056516647338867, -7.154296875, -2.252077102661133, 2.6501426696777344, 7.552360534667969, 12.454582214355469, 17.356801986694336, 22.259021759033203, 27.16124153137207, 32.06346130371094, 36.96568298339844, 41.86790084838867, 46.770118713378906, 51.672340393066406, 56.574562072753906, 61.47677993774414, 66.37899780273438, 71.28121948242188, 76.18344116210938, 81.08566284179688, 85.98787689208984, 90.89009857177734]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 7.0, 10.0, 10.0, 20.0, 13.0, 22.0, 10.0, 40.0, 25.0, 38.0, 32.0, 29.0, 40.0, 36.0, 40.0, 42.0, 34.0, 38.0, 32.0, 37.0, 44.0, 33.0, 39.0, 34.0, 30.0, 25.0, 37.0, 20.0, 16.0, 21.0, 16.0, 21.0, 13.0, 10.0, 8.0, 13.0, 5.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-39.63624572753906, -38.40560531616211, -37.17496871948242, -35.94432830810547, -34.71369171142578, -33.48305130004883, -32.252410888671875, -31.021772384643555, -29.791133880615234, -28.560495376586914, -27.329856872558594, -26.09921646118164, -24.86857795715332, -23.637939453125, -22.407299041748047, -21.176660537719727, -19.946022033691406, -18.715383529663086, -17.484745025634766, -16.254104614257812, -15.023466110229492, -13.792827606201172, -12.562188148498535, -11.331548690795898, -10.100910186767578, -8.870271682739258, -7.639632225036621, -6.408993244171143, -5.178354263305664, -3.9477152824401855, -2.717076301574707, -1.4864368438720703, -0.2557945251464844, 0.9748444557189941, 2.2054834365844727, 3.436122417449951, 4.66676139831543, 5.897400379180908, 7.128039360046387, 8.358678817749023, 9.589317321777344, 10.819955825805664, 12.0505952835083, 13.281234741210938, 14.511873245239258, 15.742511749267578, 16.97315216064453, 18.20379066467285, 19.434429168701172, 20.665067672729492, 21.895706176757812, 23.126346588134766, 24.356985092163086, 25.587623596191406, 26.81826400756836, 28.04890251159668, 29.279541015625, 30.51017951965332, 31.74081802368164, 32.971458435058594, 34.20209503173828, 35.432735443115234, 36.66337585449219, 37.894012451171875, 39.12465286254883]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 11.0, 12.0, 15.0, 18.0, 12.0, 23.0, 28.0, 19.0, 28.0, 27.0, 36.0, 35.0, 44.0, 33.0, 47.0, 46.0, 50.0, 33.0, 39.0, 39.0, 37.0, 33.0, 28.0, 36.0, 39.0, 26.0, 26.0, 26.0, 23.0, 24.0, 14.0, 19.0, 10.0, 10.0, 15.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3212890625, -6.099609375, -5.8779296875, -5.65625, -5.4345703125, -5.212890625, -4.9912109375, -4.76953125, -4.5478515625, -4.326171875, -4.1044921875, -3.8828125, -3.6611328125, -3.439453125, -3.2177734375, -2.99609375, -2.7744140625, -2.552734375, -2.3310546875, -2.109375, -1.8876953125, -1.666015625, -1.4443359375, -1.22265625, -1.0009765625, -0.779296875, -0.5576171875, -0.3359375, -0.1142578125, 0.107421875, 0.3291015625, 0.55078125, 0.7724609375, 0.994140625, 1.2158203125, 1.4375, 1.6591796875, 1.880859375, 2.1025390625, 2.32421875, 2.5458984375, 2.767578125, 2.9892578125, 3.2109375, 3.4326171875, 3.654296875, 3.8759765625, 4.09765625, 4.3193359375, 4.541015625, 4.7626953125, 4.984375, 5.2060546875, 5.427734375, 5.6494140625, 5.87109375, 6.0927734375, 6.314453125, 6.5361328125, 6.7578125, 6.9794921875, 7.201171875, 7.4228515625, 7.64453125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 5.0, 12.0, 10.0, 17.0, 27.0, 42.0, 56.0, 73.0, 99.0, 175.0, 248.0, 360.0, 491.0, 790.0, 1167.0, 1654.0, 2565.0, 3856.0, 5926.0, 9279.0, 14653.0, 23762.0, 38019.0, 63856.0, 108400.0, 192852.0, 236447.0, 137716.0, 79264.0, 47644.0, 28962.0, 17869.0, 11261.0, 7100.0, 4692.0, 3045.0, 1999.0, 1291.0, 941.0, 569.0, 443.0, 284.0, 200.0, 140.0, 95.0, 60.0, 40.0, 24.0, 29.0, 25.0, 8.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0], "bins": [-1.150390625, -1.115753173828125, -1.08111572265625, -1.046478271484375, -1.0118408203125, -0.977203369140625, -0.94256591796875, -0.907928466796875, -0.873291015625, -0.838653564453125, -0.80401611328125, -0.769378662109375, -0.7347412109375, -0.700103759765625, -0.66546630859375, -0.630828857421875, -0.59619140625, -0.561553955078125, -0.52691650390625, -0.492279052734375, -0.4576416015625, -0.423004150390625, -0.38836669921875, -0.353729248046875, -0.319091796875, -0.284454345703125, -0.24981689453125, -0.215179443359375, -0.1805419921875, -0.145904541015625, -0.11126708984375, -0.076629638671875, -0.0419921875, -0.007354736328125, 0.02728271484375, 0.061920166015625, 0.0965576171875, 0.131195068359375, 0.16583251953125, 0.200469970703125, 0.235107421875, 0.269744873046875, 0.30438232421875, 0.339019775390625, 0.3736572265625, 0.408294677734375, 0.44293212890625, 0.477569580078125, 0.51220703125, 0.546844482421875, 0.58148193359375, 0.616119384765625, 0.6507568359375, 0.685394287109375, 0.72003173828125, 0.754669189453125, 0.789306640625, 0.823944091796875, 0.85858154296875, 0.893218994140625, 0.9278564453125, 0.962493896484375, 0.99713134765625, 1.031768798828125, 1.06640625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 12.0, 14.0, 22.0, 13.0, 16.0, 19.0, 20.0, 27.0, 30.0, 33.0, 38.0, 45.0, 42.0, 50.0, 35.0, 69.0, 1063.0, 56.0, 36.0, 39.0, 41.0, 43.0, 32.0, 44.0, 27.0, 25.0, 17.0, 23.0, 15.0, 23.0, 16.0, 4.0, 7.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9921875, -4.83648681640625, -4.6807861328125, -4.52508544921875, -4.369384765625, -4.21368408203125, -4.0579833984375, -3.90228271484375, -3.74658203125, -3.59088134765625, -3.4351806640625, -3.27947998046875, -3.123779296875, -2.96807861328125, -2.8123779296875, -2.65667724609375, -2.5009765625, -2.34527587890625, -2.1895751953125, -2.03387451171875, -1.878173828125, -1.72247314453125, -1.5667724609375, -1.41107177734375, -1.25537109375, -1.09967041015625, -0.9439697265625, -0.78826904296875, -0.632568359375, -0.47686767578125, -0.3211669921875, -0.16546630859375, -0.009765625, 0.14593505859375, 0.3016357421875, 0.45733642578125, 0.613037109375, 0.76873779296875, 0.9244384765625, 1.08013916015625, 1.23583984375, 1.39154052734375, 1.5472412109375, 1.70294189453125, 1.858642578125, 2.01434326171875, 2.1700439453125, 2.32574462890625, 2.4814453125, 2.63714599609375, 2.7928466796875, 2.94854736328125, 3.104248046875, 3.25994873046875, 3.4156494140625, 3.57135009765625, 3.72705078125, 3.88275146484375, 4.0384521484375, 4.19415283203125, 4.349853515625, 4.50555419921875, 4.6612548828125, 4.81695556640625, 4.97265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 17.0, 25.0, 25.0, 43.0, 72.0, 84.0, 167.0, 222.0, 351.0, 571.0, 829.0, 1403.0, 2175.0, 3327.0, 5270.0, 8255.0, 13209.0, 22526.0, 38718.0, 68479.0, 123478.0, 1290857.0, 235396.0, 119917.0, 66549.0, 37954.0, 21848.0, 12909.0, 8115.0, 5102.0, 3317.0, 2125.0, 1331.0, 902.0, 520.0, 351.0, 223.0, 155.0, 102.0, 64.0, 45.0, 37.0, 17.0, 18.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0279998779296875, -0.992523193359375, -0.9570465087890625, -0.92156982421875, -0.8860931396484375, -0.850616455078125, -0.8151397705078125, -0.7796630859375, -0.7441864013671875, -0.708709716796875, -0.6732330322265625, -0.63775634765625, -0.6022796630859375, -0.566802978515625, -0.5313262939453125, -0.495849609375, -0.4603729248046875, -0.424896240234375, -0.3894195556640625, -0.35394287109375, -0.3184661865234375, -0.282989501953125, -0.2475128173828125, -0.2120361328125, -0.1765594482421875, -0.141082763671875, -0.1056060791015625, -0.07012939453125, -0.0346527099609375, 0.000823974609375, 0.0363006591796875, 0.07177734375, 0.1072540283203125, 0.142730712890625, 0.1782073974609375, 0.21368408203125, 0.2491607666015625, 0.284637451171875, 0.3201141357421875, 0.3555908203125, 0.3910675048828125, 0.426544189453125, 0.4620208740234375, 0.49749755859375, 0.5329742431640625, 0.568450927734375, 0.6039276123046875, 0.639404296875, 0.6748809814453125, 0.710357666015625, 0.7458343505859375, 0.78131103515625, 0.8167877197265625, 0.852264404296875, 0.8877410888671875, 0.9232177734375, 0.9586944580078125, 0.994171142578125, 1.0296478271484375, 1.06512451171875, 1.1006011962890625, 1.136077880859375, 1.1715545654296875, 1.20703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 0.0, 5.0, 4.0, 5.0, 4.0, 10.0, 10.0, 10.0, 18.0, 11.0, 16.0, 25.0, 19.0, 33.0, 36.0, 29.0, 42.0, 49.0, 58.0, 60.0, 49.0, 56.0, 44.0, 46.0, 51.0, 48.0, 45.0, 34.0, 33.0, 23.0, 17.0, 22.0, 16.0, 17.0, 9.0, 13.0, 5.0, 8.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00040340423583984375, -0.00038740038871765137, -0.000371396541595459, -0.0003553926944732666, -0.0003393888473510742, -0.00032338500022888184, -0.00030738115310668945, -0.00029137730598449707, -0.0002753734588623047, -0.0002593696117401123, -0.00024336576461791992, -0.00022736191749572754, -0.00021135807037353516, -0.00019535422325134277, -0.0001793503761291504, -0.000163346529006958, -0.00014734268188476562, -0.00013133883476257324, -0.00011533498764038086, -9.933114051818848e-05, -8.33272933959961e-05, -6.732344627380371e-05, -5.131959915161133e-05, -3.5315752029418945e-05, -1.9311904907226562e-05, -3.3080577850341797e-06, 1.2695789337158203e-05, 2.8699636459350586e-05, 4.470348358154297e-05, 6.070733070373535e-05, 7.671117782592773e-05, 9.271502494812012e-05, 0.0001087188720703125, 0.00012472271919250488, 0.00014072656631469727, 0.00015673041343688965, 0.00017273426055908203, 0.00018873810768127441, 0.0002047419548034668, 0.00022074580192565918, 0.00023674964904785156, 0.00025275349617004395, 0.00026875734329223633, 0.0002847611904144287, 0.0003007650375366211, 0.0003167688846588135, 0.00033277273178100586, 0.00034877657890319824, 0.0003647804260253906, 0.000380784273147583, 0.0003967881202697754, 0.0004127919673919678, 0.00042879581451416016, 0.00044479966163635254, 0.0004608035087585449, 0.0004768073558807373, 0.0004928112030029297, 0.0005088150501251221, 0.0005248188972473145, 0.0005408227443695068, 0.0005568265914916992, 0.0005728304386138916, 0.000588834285736084, 0.0006048381328582764, 0.0006208419799804688]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 7.0, 6.0, 5.0, 19.0, 14.0, 13.0, 27.0, 34.0, 46.0, 56.0, 76.0, 98.0, 146.0, 270.0, 736.0, 43407.0, 1001008.0, 1531.0, 414.0, 197.0, 108.0, 81.0, 59.0, 42.0, 39.0, 29.0, 21.0, 16.0, 11.0, 11.0, 9.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0182037353515625, -0.017739534378051758, -0.017275333404541016, -0.016811132431030273, -0.01634693145751953, -0.01588273048400879, -0.015418529510498047, -0.014954328536987305, -0.014490127563476562, -0.01402592658996582, -0.013561725616455078, -0.013097524642944336, -0.012633323669433594, -0.012169122695922852, -0.01170492172241211, -0.011240720748901367, -0.010776519775390625, -0.010312318801879883, -0.00984811782836914, -0.009383916854858398, -0.008919715881347656, -0.008455514907836914, -0.007991313934326172, -0.00752711296081543, -0.0070629119873046875, -0.006598711013793945, -0.006134510040283203, -0.005670309066772461, -0.005206108093261719, -0.0047419071197509766, -0.004277706146240234, -0.003813505172729492, -0.00334930419921875, -0.002885103225708008, -0.0024209022521972656, -0.0019567012786865234, -0.0014925003051757812, -0.001028299331665039, -0.0005640983581542969, -9.989738464355469e-05, 0.0003643035888671875, 0.0008285045623779297, 0.0012927055358886719, 0.001756906509399414, 0.0022211074829101562, 0.0026853084564208984, 0.0031495094299316406, 0.003613710403442383, 0.004077911376953125, 0.004542112350463867, 0.005006313323974609, 0.0054705142974853516, 0.005934715270996094, 0.006398916244506836, 0.006863117218017578, 0.00732731819152832, 0.0077915191650390625, 0.008255720138549805, 0.008719921112060547, 0.009184122085571289, 0.009648323059082031, 0.010112524032592773, 0.010576725006103516, 0.011040925979614258, 0.011505126953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 16.0, 26.0, 74.0, 132.0, 192.0, 230.0, 164.0, 102.0, 44.0, 17.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005026980652473867, -0.00048484522267244756, -0.0004669924092013389, -0.00044913956662639976, -0.0004312867531552911, -0.00041343391058035195, -0.0003955810680054128, -0.00037772825453430414, -0.00035987544106319547, -0.00034202259848825634, -0.00032416978501714766, -0.00030631694244220853, -0.00028846412897109985, -0.0002706112863961607, -0.0002527584438212216, -0.00023490563035011292, -0.00021705278777517378, -0.00019919995975214988, -0.00018134713172912598, -0.00016349428915418684, -0.00014564147568307817, -0.00012778863310813904, -0.00010993580508511513, -9.208297706209123e-05, -7.423014903906733e-05, -5.6377321016043425e-05, -3.8524489355040714e-05, -2.0671657694038004e-05, -2.8188296710141003e-06, 1.5033998352009803e-05, 3.288683365099132e-05, 5.0739661674015224e-05, 6.859248969703913e-05, 8.644531772006303e-05, 0.00010429814574308693, 0.00012215098831802607, 0.00014000380178913474, 0.00015785664436407387, 0.00017570947238709778, 0.00019356230041012168, 0.00021141512843314558, 0.00022926795645616949, 0.0002471207990311086, 0.0002649736125022173, 0.0002828264550771564, 0.0003006792685482651, 0.00031853211112320423, 0.0003363849245943129, 0.00035423776716925204, 0.00037209060974419117, 0.00038994342321529984, 0.000407796265790239, 0.00042564907926134765, 0.0004435019218362868, 0.00046135473530739546, 0.0004792075778823346, 0.0004970604204572737, 0.0005149132339283824, 0.000532766105607152, 0.0005506189190782607, 0.0005684717325493693, 0.000586324546020478, 0.0006041774176992476, 0.0006220302311703563, 0.000639883044641465]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 12.0, 14.0, 14.0, 26.0, 16.0, 20.0, 32.0, 31.0, 42.0, 23.0, 28.0, 38.0, 41.0, 34.0, 43.0, 50.0, 49.0, 42.0, 35.0, 42.0, 34.0, 31.0, 43.0, 35.0, 27.0, 32.0, 29.0, 21.0, 21.0, 16.0, 14.0, 17.0, 8.0, 8.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00031960010528564453, -0.00031033530831336975, -0.00030107051134109497, -0.0002918057143688202, -0.0002825409173965454, -0.00027327612042427063, -0.00026401132345199585, -0.00025474652647972107, -0.0002454817295074463, -0.0002362169325351715, -0.00022695213556289673, -0.00021768733859062195, -0.00020842254161834717, -0.0001991577446460724, -0.0001898929476737976, -0.00018062815070152283, -0.00017136335372924805, -0.00016209855675697327, -0.00015283375978469849, -0.0001435689628124237, -0.00013430416584014893, -0.00012503936886787415, -0.00011577457189559937, -0.00010650977492332458, -9.72449779510498e-05, -8.798018097877502e-05, -7.871538400650024e-05, -6.945058703422546e-05, -6.0185790061950684e-05, -5.09209930896759e-05, -4.165619611740112e-05, -3.239139914512634e-05, -2.3126602172851562e-05, -1.3861805200576782e-05, -4.597008228302002e-06, 4.667788743972778e-06, 1.3932585716247559e-05, 2.319738268852234e-05, 3.246217966079712e-05, 4.17269766330719e-05, 5.099177360534668e-05, 6.025657057762146e-05, 6.952136754989624e-05, 7.878616452217102e-05, 8.80509614944458e-05, 9.731575846672058e-05, 0.00010658055543899536, 0.00011584535241127014, 0.00012511014938354492, 0.0001343749463558197, 0.00014363974332809448, 0.00015290454030036926, 0.00016216933727264404, 0.00017143413424491882, 0.0001806989312171936, 0.00018996372818946838, 0.00019922852516174316, 0.00020849332213401794, 0.00021775811910629272, 0.0002270229160785675, 0.00023628771305084229, 0.00024555251002311707, 0.00025481730699539185, 0.0002640821039676666, 0.0002733469009399414]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 11.0, 12.0, 15.0, 18.0, 12.0, 23.0, 28.0, 19.0, 28.0, 27.0, 36.0, 35.0, 44.0, 33.0, 47.0, 46.0, 50.0, 33.0, 39.0, 39.0, 37.0, 33.0, 28.0, 36.0, 39.0, 26.0, 26.0, 26.0, 23.0, 24.0, 14.0, 19.0, 10.0, 10.0, 15.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3212890625, -6.099609375, -5.8779296875, -5.65625, -5.4345703125, -5.212890625, -4.9912109375, -4.76953125, -4.5478515625, -4.326171875, -4.1044921875, -3.8828125, -3.6611328125, -3.439453125, -3.2177734375, -2.99609375, -2.7744140625, -2.552734375, -2.3310546875, -2.109375, -1.8876953125, -1.666015625, -1.4443359375, -1.22265625, -1.0009765625, -0.779296875, -0.5576171875, -0.3359375, -0.1142578125, 0.107421875, 0.3291015625, 0.55078125, 0.7724609375, 0.994140625, 1.2158203125, 1.4375, 1.6591796875, 1.880859375, 2.1025390625, 2.32421875, 2.5458984375, 2.767578125, 2.9892578125, 3.2109375, 3.4326171875, 3.654296875, 3.8759765625, 4.09765625, 4.3193359375, 4.541015625, 4.7626953125, 4.984375, 5.2060546875, 5.427734375, 5.6494140625, 5.87109375, 6.0927734375, 6.314453125, 6.5361328125, 6.7578125, 6.9794921875, 7.201171875, 7.4228515625, 7.64453125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 9.0, 6.0, 17.0, 23.0, 21.0, 28.0, 28.0, 50.0, 62.0, 84.0, 101.0, 170.0, 216.0, 370.0, 573.0, 1073.0, 3416.0, 25175.0, 364112.0, 609130.0, 36368.0, 4442.0, 1187.0, 633.0, 373.0, 257.0, 155.0, 107.0, 88.0, 64.0, 58.0, 31.0, 22.0, 28.0, 10.0, 19.0, 16.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.1070556640625, -11.690673828125, -11.2742919921875, -10.85791015625, -10.4415283203125, -10.025146484375, -9.6087646484375, -9.1923828125, -8.7760009765625, -8.359619140625, -7.9432373046875, -7.52685546875, -7.1104736328125, -6.694091796875, -6.2777099609375, -5.861328125, -5.4449462890625, -5.028564453125, -4.6121826171875, -4.19580078125, -3.7794189453125, -3.363037109375, -2.9466552734375, -2.5302734375, -2.1138916015625, -1.697509765625, -1.2811279296875, -0.86474609375, -0.4483642578125, -0.031982421875, 0.3843994140625, 0.80078125, 1.2171630859375, 1.633544921875, 2.0499267578125, 2.46630859375, 2.8826904296875, 3.299072265625, 3.7154541015625, 4.1318359375, 4.5482177734375, 4.964599609375, 5.3809814453125, 5.79736328125, 6.2137451171875, 6.630126953125, 7.0465087890625, 7.462890625, 7.8792724609375, 8.295654296875, 8.7120361328125, 9.12841796875, 9.5447998046875, 9.961181640625, 10.3775634765625, 10.7939453125, 11.2103271484375, 11.626708984375, 12.0430908203125, 12.45947265625, 12.8758544921875, 13.292236328125, 13.7086181640625, 14.125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 7.0, 3.0, 10.0, 7.0, 8.0, 9.0, 18.0, 15.0, 10.0, 21.0, 34.0, 23.0, 24.0, 38.0, 41.0, 49.0, 37.0, 58.0, 70.0, 175.0, 1748.0, 157.0, 60.0, 42.0, 49.0, 35.0, 41.0, 43.0, 24.0, 16.0, 29.0, 30.0, 22.0, 13.0, 13.0, 9.0, 10.0, 11.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-22.28125, -21.615234375, -20.94921875, -20.283203125, -19.6171875, -18.951171875, -18.28515625, -17.619140625, -16.953125, -16.287109375, -15.62109375, -14.955078125, -14.2890625, -13.623046875, -12.95703125, -12.291015625, -11.625, -10.958984375, -10.29296875, -9.626953125, -8.9609375, -8.294921875, -7.62890625, -6.962890625, -6.296875, -5.630859375, -4.96484375, -4.298828125, -3.6328125, -2.966796875, -2.30078125, -1.634765625, -0.96875, -0.302734375, 0.36328125, 1.029296875, 1.6953125, 2.361328125, 3.02734375, 3.693359375, 4.359375, 5.025390625, 5.69140625, 6.357421875, 7.0234375, 7.689453125, 8.35546875, 9.021484375, 9.6875, 10.353515625, 11.01953125, 11.685546875, 12.3515625, 13.017578125, 13.68359375, 14.349609375, 15.015625, 15.681640625, 16.34765625, 17.013671875, 17.6796875, 18.345703125, 19.01171875, 19.677734375, 20.34375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 1.0, 3.0, 4.0, 8.0, 5.0, 9.0, 14.0, 14.0, 12.0, 11.0, 17.0, 29.0, 40.0, 26.0, 37.0, 41.0, 71.0, 79.0, 120.0, 186.0, 359.0, 863.0, 14169.0, 3122304.0, 5640.0, 678.0, 293.0, 171.0, 121.0, 74.0, 62.0, 47.0, 31.0, 35.0, 21.0, 19.0, 13.0, 16.0, 11.0, 10.0, 11.0, 8.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-61.375, -59.3564453125, -57.337890625, -55.3193359375, -53.30078125, -51.2822265625, -49.263671875, -47.2451171875, -45.2265625, -43.2080078125, -41.189453125, -39.1708984375, -37.15234375, -35.1337890625, -33.115234375, -31.0966796875, -29.078125, -27.0595703125, -25.041015625, -23.0224609375, -21.00390625, -18.9853515625, -16.966796875, -14.9482421875, -12.9296875, -10.9111328125, -8.892578125, -6.8740234375, -4.85546875, -2.8369140625, -0.818359375, 1.2001953125, 3.21875, 5.2373046875, 7.255859375, 9.2744140625, 11.29296875, 13.3115234375, 15.330078125, 17.3486328125, 19.3671875, 21.3857421875, 23.404296875, 25.4228515625, 27.44140625, 29.4599609375, 31.478515625, 33.4970703125, 35.515625, 37.5341796875, 39.552734375, 41.5712890625, 43.58984375, 45.6083984375, 47.626953125, 49.6455078125, 51.6640625, 53.6826171875, 55.701171875, 57.7197265625, 59.73828125, 61.7568359375, 63.775390625, 65.7939453125, 67.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 18.0, 22.0, 37.0, 63.0, 90.0, 118.0, 123.0, 129.0, 132.0, 99.0, 76.0, 49.0, 27.0, 14.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-26.973709106445312, -26.45728874206543, -25.940868377685547, -25.424448013305664, -24.90802764892578, -24.391605377197266, -23.875186920166016, -23.3587646484375, -22.842344284057617, -22.325923919677734, -21.80950355529785, -21.29308319091797, -20.776662826538086, -20.260242462158203, -19.743820190429688, -19.227399826049805, -18.710979461669922, -18.19455909729004, -17.678138732910156, -17.161718368530273, -16.64529800415039, -16.128875732421875, -15.612456321716309, -15.096035957336426, -14.57961654663086, -14.063196182250977, -13.546775817871094, -13.030355453491211, -12.513934135437012, -11.997513771057129, -11.481093406677246, -10.964673042297363, -10.448253631591797, -9.931833267211914, -9.415412902832031, -8.898992538452148, -8.38257122039795, -7.866150856018066, -7.349730491638184, -6.833310127258301, -6.316888809204102, -5.800468444824219, -5.284047603607178, -4.767627239227295, -4.251206398010254, -3.734786033630371, -3.2183656692504883, -2.7019450664520264, -2.1855244636535645, -1.6691038608551025, -1.1526833772659302, -0.6362628936767578, -0.1198422908782959, 0.396578311920166, 0.9129986763000488, 1.4294192790985107, 1.9458398818969727, 2.4622604846954346, 2.9786810874938965, 3.4951014518737793, 4.01152229309082, 4.527942657470703, 5.044363021850586, 5.560783386230469, 6.07720422744751]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 9.0, 7.0, 9.0, 8.0, 9.0, 10.0, 21.0, 11.0, 19.0, 19.0, 25.0, 22.0, 36.0, 31.0, 27.0, 31.0, 31.0, 32.0, 33.0, 40.0, 31.0, 39.0, 38.0, 38.0, 38.0, 36.0, 28.0, 32.0, 29.0, 27.0, 27.0, 27.0, 20.0, 22.0, 18.0, 23.0, 20.0, 13.0, 10.0, 7.0, 6.0, 7.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-58.09512710571289, -56.42301559448242, -54.75090789794922, -53.07879638671875, -51.40668487548828, -49.73457717895508, -48.06246566772461, -46.390357971191406, -44.71824645996094, -43.04613494873047, -41.374027252197266, -39.7019157409668, -38.029808044433594, -36.357696533203125, -34.685585021972656, -33.01347351074219, -31.341365814208984, -29.66925621032715, -27.997146606445312, -26.325035095214844, -24.652925491333008, -22.980815887451172, -21.308704376220703, -19.636594772338867, -17.96448516845703, -16.292375564575195, -14.620265007019043, -12.94815444946289, -11.276044845581055, -9.603935241699219, -7.931824684143066, -6.259714126586914, -4.587608337402344, -2.9154982566833496, -1.2433881759643555, 0.42872190475463867, 2.100831985473633, 3.7729415893554688, 5.445052146911621, 7.117162704467773, 8.78927230834961, 10.461381912231445, 12.133492469787598, 13.80560302734375, 15.477712631225586, 17.149822235107422, 18.82193374633789, 20.494043350219727, 22.166152954101562, 23.8382625579834, 25.510372161865234, 27.182483673095703, 28.85459327697754, 30.526702880859375, 32.198814392089844, 33.87092590332031, 35.543033599853516, 37.215145111083984, 38.88725280761719, 40.559364318847656, 42.231475830078125, 43.90358352661133, 45.5756950378418, 47.247802734375, 48.91991424560547]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 7.0, 8.0, 15.0, 12.0, 11.0, 26.0, 25.0, 29.0, 19.0, 28.0, 33.0, 29.0, 41.0, 37.0, 47.0, 43.0, 43.0, 53.0, 49.0, 33.0, 37.0, 38.0, 42.0, 29.0, 37.0, 26.0, 27.0, 27.0, 35.0, 20.0, 12.0, 19.0, 16.0, 11.0, 8.0, 8.0, 4.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5859375, -7.341552734375, -7.09716796875, -6.852783203125, -6.6083984375, -6.364013671875, -6.11962890625, -5.875244140625, -5.630859375, -5.386474609375, -5.14208984375, -4.897705078125, -4.6533203125, -4.408935546875, -4.16455078125, -3.920166015625, -3.67578125, -3.431396484375, -3.18701171875, -2.942626953125, -2.6982421875, -2.453857421875, -2.20947265625, -1.965087890625, -1.720703125, -1.476318359375, -1.23193359375, -0.987548828125, -0.7431640625, -0.498779296875, -0.25439453125, -0.010009765625, 0.234375, 0.478759765625, 0.72314453125, 0.967529296875, 1.2119140625, 1.456298828125, 1.70068359375, 1.945068359375, 2.189453125, 2.433837890625, 2.67822265625, 2.922607421875, 3.1669921875, 3.411376953125, 3.65576171875, 3.900146484375, 4.14453125, 4.388916015625, 4.63330078125, 4.877685546875, 5.1220703125, 5.366455078125, 5.61083984375, 5.855224609375, 6.099609375, 6.343994140625, 6.58837890625, 6.832763671875, 7.0771484375, 7.321533203125, 7.56591796875, 7.810302734375, 8.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 17.0, 15.0, 22.0, 24.0, 32.0, 57.0, 68.0, 103.0, 139.0, 246.0, 441.0, 781.0, 1879.0, 5200.0, 18019.0, 81141.0, 416757.0, 1360626.0, 1578434.0, 578609.0, 115101.0, 24645.0, 7009.0, 2524.0, 1030.0, 500.0, 256.0, 159.0, 132.0, 72.0, 61.0, 38.0, 46.0, 21.0, 19.0, 11.0, 8.0, 14.0, 2.0, 5.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.53125, -10.2396240234375, -9.947998046875, -9.6563720703125, -9.36474609375, -9.0731201171875, -8.781494140625, -8.4898681640625, -8.1982421875, -7.9066162109375, -7.614990234375, -7.3233642578125, -7.03173828125, -6.7401123046875, -6.448486328125, -6.1568603515625, -5.865234375, -5.5736083984375, -5.281982421875, -4.9903564453125, -4.69873046875, -4.4071044921875, -4.115478515625, -3.8238525390625, -3.5322265625, -3.2406005859375, -2.948974609375, -2.6573486328125, -2.36572265625, -2.0740966796875, -1.782470703125, -1.4908447265625, -1.19921875, -0.9075927734375, -0.615966796875, -0.3243408203125, -0.03271484375, 0.2589111328125, 0.550537109375, 0.8421630859375, 1.1337890625, 1.4254150390625, 1.717041015625, 2.0086669921875, 2.30029296875, 2.5919189453125, 2.883544921875, 3.1751708984375, 3.466796875, 3.7584228515625, 4.050048828125, 4.3416748046875, 4.63330078125, 4.9249267578125, 5.216552734375, 5.5081787109375, 5.7998046875, 6.0914306640625, 6.383056640625, 6.6746826171875, 6.96630859375, 7.2579345703125, 7.549560546875, 7.8411865234375, 8.1328125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 5.0, 5.0, 5.0, 12.0, 5.0, 4.0, 18.0, 27.0, 29.0, 39.0, 42.0, 45.0, 62.0, 78.0, 93.0, 133.0, 140.0, 206.0, 234.0, 297.0, 304.0, 372.0, 352.0, 298.0, 254.0, 188.0, 175.0, 124.0, 106.0, 84.0, 74.0, 61.0, 41.0, 38.0, 32.0, 24.0, 15.0, 15.0, 10.0, 9.0, 10.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.390625, -12.0433349609375, -11.696044921875, -11.3487548828125, -11.00146484375, -10.6541748046875, -10.306884765625, -9.9595947265625, -9.6123046875, -9.2650146484375, -8.917724609375, -8.5704345703125, -8.22314453125, -7.8758544921875, -7.528564453125, -7.1812744140625, -6.833984375, -6.4866943359375, -6.139404296875, -5.7921142578125, -5.44482421875, -5.0975341796875, -4.750244140625, -4.4029541015625, -4.0556640625, -3.7083740234375, -3.361083984375, -3.0137939453125, -2.66650390625, -2.3192138671875, -1.971923828125, -1.6246337890625, -1.27734375, -0.9300537109375, -0.582763671875, -0.2354736328125, 0.11181640625, 0.4591064453125, 0.806396484375, 1.1536865234375, 1.5009765625, 1.8482666015625, 2.195556640625, 2.5428466796875, 2.89013671875, 3.2374267578125, 3.584716796875, 3.9320068359375, 4.279296875, 4.6265869140625, 4.973876953125, 5.3211669921875, 5.66845703125, 6.0157470703125, 6.363037109375, 6.7103271484375, 7.0576171875, 7.4049072265625, 7.752197265625, 8.0994873046875, 8.44677734375, 8.7940673828125, 9.141357421875, 9.4886474609375, 9.8359375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 7.0, 7.0, 13.0, 14.0, 22.0, 29.0, 26.0, 46.0, 60.0, 86.0, 87.0, 108.0, 138.0, 188.0, 218.0, 280.0, 404.0, 700.0, 2289.0, 155133.0, 4018232.0, 12902.0, 1253.0, 500.0, 344.0, 228.0, 181.0, 154.0, 135.0, 100.0, 87.0, 63.0, 54.0, 45.0, 35.0, 33.0, 15.0, 15.0, 21.0, 9.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.5625, -62.68017578125, -60.7978515625, -58.91552734375, -57.033203125, -55.15087890625, -53.2685546875, -51.38623046875, -49.50390625, -47.62158203125, -45.7392578125, -43.85693359375, -41.974609375, -40.09228515625, -38.2099609375, -36.32763671875, -34.4453125, -32.56298828125, -30.6806640625, -28.79833984375, -26.916015625, -25.03369140625, -23.1513671875, -21.26904296875, -19.38671875, -17.50439453125, -15.6220703125, -13.73974609375, -11.857421875, -9.97509765625, -8.0927734375, -6.21044921875, -4.328125, -2.44580078125, -0.5634765625, 1.31884765625, 3.201171875, 5.08349609375, 6.9658203125, 8.84814453125, 10.73046875, 12.61279296875, 14.4951171875, 16.37744140625, 18.259765625, 20.14208984375, 22.0244140625, 23.90673828125, 25.7890625, 27.67138671875, 29.5537109375, 31.43603515625, 33.318359375, 35.20068359375, 37.0830078125, 38.96533203125, 40.84765625, 42.72998046875, 44.6123046875, 46.49462890625, 48.376953125, 50.25927734375, 52.1416015625, 54.02392578125, 55.90625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 55.0, 113.0, 245.0, 274.0, 191.0, 87.0, 30.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.8114242553711, -97.7901382446289, -94.76885986328125, -91.74757385253906, -88.72628784179688, -85.70500183105469, -82.68372344970703, -79.66243743896484, -76.64115142822266, -73.61986541748047, -70.59858703613281, -67.57730102539062, -64.55601501464844, -61.534732818603516, -58.513450622558594, -55.492164611816406, -52.470882415771484, -49.44960021972656, -46.428314208984375, -43.40703201293945, -40.385746002197266, -37.364463806152344, -34.343177795410156, -31.321895599365234, -28.30061149597168, -25.279327392578125, -22.25804328918457, -19.236759185791016, -16.215476989746094, -13.194191932678223, -10.172908782958984, -7.15162467956543, -4.130340576171875, -1.1090567111968994, 1.9122271537780762, 4.933510780334473, 7.954794883728027, 10.976078987121582, 13.99736213684082, 17.018646240234375, 20.03993034362793, 23.061214447021484, 26.08249855041504, 29.103782653808594, 32.125064849853516, 35.1463508605957, 38.167633056640625, 41.18891906738281, 44.210201263427734, 47.231483459472656, 50.252769470214844, 53.274051666259766, 56.29533767700195, 59.316619873046875, 62.33790588378906, 65.35919189453125, 68.3804702758789, 71.4017562866211, 74.42303466796875, 77.44432067871094, 80.46560668945312, 83.48689270019531, 86.50817108154297, 89.52945709228516, 92.55074310302734]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 9.0, 9.0, 19.0, 10.0, 23.0, 13.0, 19.0, 21.0, 23.0, 27.0, 30.0, 30.0, 35.0, 31.0, 36.0, 36.0, 42.0, 41.0, 40.0, 42.0, 40.0, 35.0, 34.0, 36.0, 30.0, 23.0, 21.0, 34.0, 14.0, 24.0, 27.0, 19.0, 16.0, 17.0, 9.0, 6.0, 15.0, 10.0, 6.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-42.974578857421875, -41.634178161621094, -40.29378128051758, -38.95338439941406, -37.61298370361328, -36.2725830078125, -34.932186126708984, -33.59178924560547, -32.25138854980469, -30.91098976135254, -29.57059097290039, -28.230192184448242, -26.889793395996094, -25.549394607543945, -24.208995819091797, -22.86859703063965, -21.5281982421875, -20.18779945373535, -18.847400665283203, -17.507001876831055, -16.166603088378906, -14.826204299926758, -13.48580551147461, -12.145406723022461, -10.805007934570312, -9.464609146118164, -8.124210357666016, -6.783811569213867, -5.443412780761719, -4.10301399230957, -2.762615203857422, -1.4222164154052734, -0.081817626953125, 1.2585811614990234, 2.598979949951172, 3.9393787384033203, 5.279777526855469, 6.620176315307617, 7.960575103759766, 9.300973892211914, 10.641372680664062, 11.981771469116211, 13.32217025756836, 14.662569046020508, 16.002967834472656, 17.343366622924805, 18.683765411376953, 20.0241641998291, 21.36456298828125, 22.7049617767334, 24.045360565185547, 25.385759353637695, 26.726158142089844, 28.066556930541992, 29.40695571899414, 30.74735450744629, 32.08775329589844, 33.42815399169922, 34.768550872802734, 36.10894775390625, 37.44934844970703, 38.78974914550781, 40.13014602661133, 41.470542907714844, 42.810943603515625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 10.0, 11.0, 17.0, 13.0, 16.0, 15.0, 18.0, 19.0, 29.0, 26.0, 38.0, 29.0, 24.0, 37.0, 31.0, 28.0, 41.0, 38.0, 47.0, 35.0, 46.0, 33.0, 35.0, 27.0, 29.0, 26.0, 28.0, 21.0, 34.0, 18.0, 30.0, 12.0, 25.0, 13.0, 10.0, 11.0, 11.0, 14.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.50262451171875, -5.3021240234375, -5.10162353515625, -4.901123046875, -4.70062255859375, -4.5001220703125, -4.29962158203125, -4.09912109375, -3.89862060546875, -3.6981201171875, -3.49761962890625, -3.297119140625, -3.09661865234375, -2.8961181640625, -2.69561767578125, -2.4951171875, -2.29461669921875, -2.0941162109375, -1.89361572265625, -1.693115234375, -1.49261474609375, -1.2921142578125, -1.09161376953125, -0.89111328125, -0.69061279296875, -0.4901123046875, -0.28961181640625, -0.089111328125, 0.11138916015625, 0.3118896484375, 0.51239013671875, 0.712890625, 0.91339111328125, 1.1138916015625, 1.31439208984375, 1.514892578125, 1.71539306640625, 1.9158935546875, 2.11639404296875, 2.31689453125, 2.51739501953125, 2.7178955078125, 2.91839599609375, 3.118896484375, 3.31939697265625, 3.5198974609375, 3.72039794921875, 3.9208984375, 4.12139892578125, 4.3218994140625, 4.52239990234375, 4.722900390625, 4.92340087890625, 5.1239013671875, 5.32440185546875, 5.52490234375, 5.72540283203125, 5.9259033203125, 6.12640380859375, 6.326904296875, 6.52740478515625, 6.7279052734375, 6.92840576171875, 7.12890625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 14.0, 11.0, 19.0, 21.0, 38.0, 50.0, 91.0, 96.0, 179.0, 260.0, 397.0, 595.0, 921.0, 1399.0, 2105.0, 3267.0, 5011.0, 7685.0, 11946.0, 18854.0, 30442.0, 49725.0, 83379.0, 140386.0, 236192.0, 181602.0, 106525.0, 63446.0, 38736.0, 23339.0, 14738.0, 9397.0, 5954.0, 4087.0, 2549.0, 1739.0, 1120.0, 776.0, 476.0, 316.0, 214.0, 155.0, 105.0, 61.0, 55.0, 25.0, 25.0, 15.0, 11.0, 6.0, 6.0, 1.0, 2.0, 3.0], "bins": [-1.177734375, -1.143829345703125, -1.10992431640625, -1.076019287109375, -1.0421142578125, -1.008209228515625, -0.97430419921875, -0.940399169921875, -0.906494140625, -0.872589111328125, -0.83868408203125, -0.804779052734375, -0.7708740234375, -0.736968994140625, -0.70306396484375, -0.669158935546875, -0.63525390625, -0.601348876953125, -0.56744384765625, -0.533538818359375, -0.4996337890625, -0.465728759765625, -0.43182373046875, -0.397918701171875, -0.364013671875, -0.330108642578125, -0.29620361328125, -0.262298583984375, -0.2283935546875, -0.194488525390625, -0.16058349609375, -0.126678466796875, -0.0927734375, -0.058868408203125, -0.02496337890625, 0.008941650390625, 0.0428466796875, 0.076751708984375, 0.11065673828125, 0.144561767578125, 0.178466796875, 0.212371826171875, 0.24627685546875, 0.280181884765625, 0.3140869140625, 0.347991943359375, 0.38189697265625, 0.415802001953125, 0.44970703125, 0.483612060546875, 0.51751708984375, 0.551422119140625, 0.5853271484375, 0.619232177734375, 0.65313720703125, 0.687042236328125, 0.720947265625, 0.754852294921875, 0.78875732421875, 0.822662353515625, 0.8565673828125, 0.890472412109375, 0.92437744140625, 0.958282470703125, 0.9921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 4.0, 10.0, 12.0, 14.0, 10.0, 12.0, 17.0, 20.0, 22.0, 17.0, 33.0, 26.0, 28.0, 28.0, 20.0, 34.0, 27.0, 31.0, 35.0, 32.0, 1058.0, 34.0, 43.0, 34.0, 47.0, 37.0, 39.0, 26.0, 26.0, 23.0, 29.0, 27.0, 25.0, 20.0, 20.0, 15.0, 18.0, 13.0, 10.0, 8.0, 3.0, 7.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.2265625, -4.101776123046875, -3.97698974609375, -3.852203369140625, -3.7274169921875, -3.602630615234375, -3.47784423828125, -3.353057861328125, -3.228271484375, -3.103485107421875, -2.97869873046875, -2.853912353515625, -2.7291259765625, -2.604339599609375, -2.47955322265625, -2.354766845703125, -2.22998046875, -2.105194091796875, -1.98040771484375, -1.855621337890625, -1.7308349609375, -1.606048583984375, -1.48126220703125, -1.356475830078125, -1.231689453125, -1.106903076171875, -0.98211669921875, -0.857330322265625, -0.7325439453125, -0.607757568359375, -0.48297119140625, -0.358184814453125, -0.2333984375, -0.108612060546875, 0.01617431640625, 0.140960693359375, 0.2657470703125, 0.390533447265625, 0.51531982421875, 0.640106201171875, 0.764892578125, 0.889678955078125, 1.01446533203125, 1.139251708984375, 1.2640380859375, 1.388824462890625, 1.51361083984375, 1.638397216796875, 1.76318359375, 1.887969970703125, 2.01275634765625, 2.137542724609375, 2.2623291015625, 2.387115478515625, 2.51190185546875, 2.636688232421875, 2.761474609375, 2.886260986328125, 3.01104736328125, 3.135833740234375, 3.2606201171875, 3.385406494140625, 3.51019287109375, 3.634979248046875, 3.759765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 8.0, 22.0, 37.0, 48.0, 64.0, 110.0, 152.0, 225.0, 346.0, 506.0, 697.0, 1035.0, 1610.0, 2275.0, 3166.0, 4654.0, 6856.0, 10163.0, 14832.0, 21779.0, 33249.0, 50151.0, 77952.0, 127717.0, 1267885.0, 176097.0, 102730.0, 64591.0, 42067.0, 27772.0, 18826.0, 12480.0, 8484.0, 5906.0, 3951.0, 2748.0, 1874.0, 1280.0, 904.0, 621.0, 390.0, 320.0, 178.0, 117.0, 80.0, 59.0, 39.0, 23.0, 15.0, 14.0, 9.0, 8.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.923828125, -0.8956527709960938, -0.8674774169921875, -0.8393020629882812, -0.811126708984375, -0.7829513549804688, -0.7547760009765625, -0.7266006469726562, -0.69842529296875, -0.6702499389648438, -0.6420745849609375, -0.6138992309570312, -0.585723876953125, -0.5575485229492188, -0.5293731689453125, -0.5011978149414062, -0.4730224609375, -0.44484710693359375, -0.4166717529296875, -0.38849639892578125, -0.360321044921875, -0.33214569091796875, -0.3039703369140625, -0.27579498291015625, -0.24761962890625, -0.21944427490234375, -0.1912689208984375, -0.16309356689453125, -0.134918212890625, -0.10674285888671875, -0.0785675048828125, -0.05039215087890625, -0.022216796875, 0.00595855712890625, 0.0341339111328125, 0.06230926513671875, 0.090484619140625, 0.11865997314453125, 0.1468353271484375, 0.17501068115234375, 0.20318603515625, 0.23136138916015625, 0.2595367431640625, 0.28771209716796875, 0.315887451171875, 0.34406280517578125, 0.3722381591796875, 0.40041351318359375, 0.4285888671875, 0.45676422119140625, 0.4849395751953125, 0.5131149291992188, 0.541290283203125, 0.5694656372070312, 0.5976409912109375, 0.6258163452148438, 0.65399169921875, 0.6821670532226562, 0.7103424072265625, 0.7385177612304688, 0.766693115234375, 0.7948684692382812, 0.8230438232421875, 0.8512191772460938, 0.87939453125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 10.0, 11.0, 19.0, 21.0, 28.0, 26.0, 30.0, 24.0, 45.0, 53.0, 52.0, 44.0, 64.0, 51.0, 53.0, 39.0, 55.0, 48.0, 44.0, 28.0, 27.0, 28.0, 36.0, 24.0, 23.0, 14.0, 13.0, 13.0, 9.0, 9.0, 5.0, 8.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004916191101074219, -0.00047466158866882324, -0.0004577040672302246, -0.000440746545791626, -0.00042378902435302734, -0.0004068315029144287, -0.0003898739814758301, -0.00037291646003723145, -0.0003559589385986328, -0.0003390014171600342, -0.00032204389572143555, -0.0003050863742828369, -0.0002881288528442383, -0.00027117133140563965, -0.000254213809967041, -0.00023725628852844238, -0.00022029876708984375, -0.00020334124565124512, -0.00018638372421264648, -0.00016942620277404785, -0.00015246868133544922, -0.00013551115989685059, -0.00011855363845825195, -0.00010159611701965332, -8.463859558105469e-05, -6.768107414245605e-05, -5.072355270385742e-05, -3.376603126525879e-05, -1.6808509826660156e-05, 1.4901161193847656e-07, 1.710653305053711e-05, 3.406405448913574e-05, 5.1021575927734375e-05, 6.797909736633301e-05, 8.493661880493164e-05, 0.00010189414024353027, 0.0001188516616821289, 0.00013580918312072754, 0.00015276670455932617, 0.0001697242259979248, 0.00018668174743652344, 0.00020363926887512207, 0.0002205967903137207, 0.00023755431175231934, 0.00025451183319091797, 0.0002714693546295166, 0.00028842687606811523, 0.00030538439750671387, 0.0003223419189453125, 0.00033929944038391113, 0.00035625696182250977, 0.0003732144832611084, 0.00039017200469970703, 0.00040712952613830566, 0.0004240870475769043, 0.00044104456901550293, 0.00045800209045410156, 0.0004749596118927002, 0.0004919171333312988, 0.0005088746547698975, 0.0005258321762084961, 0.0005427896976470947, 0.0005597472190856934, 0.000576704740524292, 0.0005936622619628906]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 9.0, 8.0, 7.0, 16.0, 8.0, 23.0, 14.0, 25.0, 27.0, 38.0, 40.0, 57.0, 68.0, 95.0, 142.0, 245.0, 496.0, 1596.0, 903343.0, 140159.0, 1022.0, 412.0, 167.0, 125.0, 84.0, 59.0, 45.0, 41.0, 35.0, 27.0, 22.0, 17.0, 13.0, 15.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01318359375, -0.012794256210327148, -0.012404918670654297, -0.012015581130981445, -0.011626243591308594, -0.011236906051635742, -0.01084756851196289, -0.010458230972290039, -0.010068893432617188, -0.009679555892944336, -0.009290218353271484, -0.008900880813598633, -0.008511543273925781, -0.00812220573425293, -0.007732868194580078, -0.0073435306549072266, -0.006954193115234375, -0.0065648555755615234, -0.006175518035888672, -0.00578618049621582, -0.005396842956542969, -0.005007505416870117, -0.004618167877197266, -0.004228830337524414, -0.0038394927978515625, -0.003450155258178711, -0.0030608177185058594, -0.002671480178833008, -0.0022821426391601562, -0.0018928050994873047, -0.0015034675598144531, -0.0011141300201416016, -0.00072479248046875, -0.00033545494079589844, 5.3882598876953125e-05, 0.0004432201385498047, 0.0008325576782226562, 0.0012218952178955078, 0.0016112327575683594, 0.002000570297241211, 0.0023899078369140625, 0.002779245376586914, 0.0031685829162597656, 0.003557920455932617, 0.003947257995605469, 0.00433659553527832, 0.004725933074951172, 0.0051152706146240234, 0.005504608154296875, 0.0058939456939697266, 0.006283283233642578, 0.00667262077331543, 0.007061958312988281, 0.007451295852661133, 0.007840633392333984, 0.008229970932006836, 0.008619308471679688, 0.009008646011352539, 0.00939798355102539, 0.009787321090698242, 0.010176658630371094, 0.010565996170043945, 0.010955333709716797, 0.011344671249389648, 0.0117340087890625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 75.0, 728.0, 208.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004281291738152504, -0.004202988464385271, -0.004124685190618038, -0.004046381916850805, -0.003968078643083572, -0.003889775602146983, -0.003811472561210394, -0.003733169287443161, -0.003654866013675928, -0.0035765627399086952, -0.0034982594661414623, -0.003419956425204873, -0.00334165315143764, -0.0032633498776704073, -0.003185046836733818, -0.003106743562966585, -0.0030284402891993523, -0.0029501370154321194, -0.0028718337416648865, -0.0027935307007282972, -0.0027152274269610643, -0.0026369241531938314, -0.002558621112257242, -0.0024803178384900093, -0.0024020145647227764, -0.0023237112909555435, -0.0022454080171883106, -0.0021671049762517214, -0.0020888017024844885, -0.0020104984287172556, -0.0019321952713653445, -0.0018538921140134335, -0.0017755888402462006, -0.0016972855664789677, -0.0016189824091270566, -0.0015406792517751455, -0.0014623759780079126, -0.0013840727042406797, -0.0013057695468887687, -0.0012274663895368576, -0.0011491631157696247, -0.0010708598420023918, -0.0009925566846504807, -0.0009142534690909088, -0.0008359502535313368, -0.0007576470379717648, -0.0006793438224121928, -0.0006010406068526208, -0.0005227374495007098, -0.0004444342339411378, -0.0003661310183815658, -0.00028782780282199383, -0.00020952458726242185, -0.00013122137170284986, -5.2918156143277884e-05, 2.5385059416294098e-05, 0.00010368827497586608, 0.00018199149053543806, 0.00026029470609501004, 0.000338597921654582, 0.000416901137214154, 0.000495204352773726, 0.000573507568333298, 0.00065181078389287, 0.0007301139994524419]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 4.0, 4.0, 9.0, 13.0, 19.0, 14.0, 16.0, 20.0, 20.0, 27.0, 32.0, 32.0, 33.0, 39.0, 28.0, 34.0, 38.0, 38.0, 50.0, 27.0, 42.0, 41.0, 24.0, 33.0, 45.0, 41.0, 32.0, 36.0, 36.0, 28.0, 16.0, 16.0, 15.0, 15.0, 13.0, 6.0, 14.0, 16.0, 12.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026291608810424805, -0.000253492034971714, -0.00024406798183918, -0.00023464392870664597, -0.00022521987557411194, -0.0002157958224415779, -0.00020637176930904388, -0.00019694771617650986, -0.00018752366304397583, -0.0001780996099114418, -0.00016867555677890778, -0.00015925150364637375, -0.00014982745051383972, -0.0001404033973813057, -0.00013097934424877167, -0.00012155529111623764, -0.00011213123798370361, -0.00010270718485116959, -9.328313171863556e-05, -8.385907858610153e-05, -7.44350254535675e-05, -6.501097232103348e-05, -5.558691918849945e-05, -4.6162866055965424e-05, -3.6738812923431396e-05, -2.731475979089737e-05, -1.7890706658363342e-05, -8.466653525829315e-06, 9.57399606704712e-07, 1.0381452739238739e-05, 1.9805505871772766e-05, 2.9229559004306793e-05, 3.865361213684082e-05, 4.807766526937485e-05, 5.7501718401908875e-05, 6.69257715344429e-05, 7.634982466697693e-05, 8.577387779951096e-05, 9.519793093204498e-05, 0.00010462198406457901, 0.00011404603719711304, 0.00012347009032964706, 0.0001328941434621811, 0.00014231819659471512, 0.00015174224972724915, 0.00016116630285978317, 0.0001705903559923172, 0.00018001440912485123, 0.00018943846225738525, 0.00019886251538991928, 0.0002082865685224533, 0.00021771062165498734, 0.00022713467478752136, 0.0002365587279200554, 0.0002459827810525894, 0.00025540683418512344, 0.00026483088731765747, 0.0002742549404501915, 0.0002836789935827255, 0.00029310304671525955, 0.0003025270998477936, 0.0003119511529803276, 0.00032137520611286163, 0.00033079925924539566, 0.0003402233123779297]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 10.0, 11.0, 17.0, 13.0, 16.0, 15.0, 18.0, 19.0, 29.0, 26.0, 39.0, 28.0, 24.0, 37.0, 31.0, 28.0, 41.0, 38.0, 47.0, 35.0, 46.0, 33.0, 35.0, 27.0, 29.0, 26.0, 28.0, 21.0, 34.0, 18.0, 30.0, 12.0, 25.0, 13.0, 10.0, 11.0, 11.0, 14.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.50262451171875, -5.3021240234375, -5.10162353515625, -4.901123046875, -4.70062255859375, -4.5001220703125, -4.29962158203125, -4.09912109375, -3.89862060546875, -3.6981201171875, -3.49761962890625, -3.297119140625, -3.09661865234375, -2.8961181640625, -2.69561767578125, -2.4951171875, -2.29461669921875, -2.0941162109375, -1.89361572265625, -1.693115234375, -1.49261474609375, -1.2921142578125, -1.09161376953125, -0.89111328125, -0.69061279296875, -0.4901123046875, -0.28961181640625, -0.089111328125, 0.11138916015625, 0.3118896484375, 0.51239013671875, 0.712890625, 0.91339111328125, 1.1138916015625, 1.31439208984375, 1.514892578125, 1.71539306640625, 1.9158935546875, 2.11639404296875, 2.31689453125, 2.51739501953125, 2.7178955078125, 2.91839599609375, 3.118896484375, 3.31939697265625, 3.5198974609375, 3.72039794921875, 3.9208984375, 4.12139892578125, 4.3218994140625, 4.52239990234375, 4.722900390625, 4.92340087890625, 5.1239013671875, 5.32440185546875, 5.52490234375, 5.72540283203125, 5.9259033203125, 6.12640380859375, 6.326904296875, 6.52740478515625, 6.7279052734375, 6.92840576171875, 7.12890625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 9.0, 14.0, 6.0, 12.0, 10.0, 20.0, 24.0, 26.0, 32.0, 27.0, 39.0, 72.0, 110.0, 150.0, 310.0, 567.0, 1153.0, 2482.0, 5271.0, 11522.0, 25285.0, 56511.0, 135683.0, 335220.0, 280620.0, 108054.0, 46079.0, 21153.0, 9485.0, 4291.0, 2007.0, 1025.0, 472.0, 252.0, 167.0, 95.0, 68.0, 39.0, 37.0, 28.0, 30.0, 15.0, 19.0, 16.0, 13.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.10546875, -4.94012451171875, -4.7747802734375, -4.60943603515625, -4.444091796875, -4.27874755859375, -4.1134033203125, -3.94805908203125, -3.78271484375, -3.61737060546875, -3.4520263671875, -3.28668212890625, -3.121337890625, -2.95599365234375, -2.7906494140625, -2.62530517578125, -2.4599609375, -2.29461669921875, -2.1292724609375, -1.96392822265625, -1.798583984375, -1.63323974609375, -1.4678955078125, -1.30255126953125, -1.13720703125, -0.97186279296875, -0.8065185546875, -0.64117431640625, -0.475830078125, -0.31048583984375, -0.1451416015625, 0.02020263671875, 0.185546875, 0.35089111328125, 0.5162353515625, 0.68157958984375, 0.846923828125, 1.01226806640625, 1.1776123046875, 1.34295654296875, 1.50830078125, 1.67364501953125, 1.8389892578125, 2.00433349609375, 2.169677734375, 2.33502197265625, 2.5003662109375, 2.66571044921875, 2.8310546875, 2.99639892578125, 3.1617431640625, 3.32708740234375, 3.492431640625, 3.65777587890625, 3.8231201171875, 3.98846435546875, 4.15380859375, 4.31915283203125, 4.4844970703125, 4.64984130859375, 4.815185546875, 4.98052978515625, 5.1458740234375, 5.31121826171875, 5.4765625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 6.0, 4.0, 14.0, 14.0, 10.0, 16.0, 25.0, 22.0, 18.0, 28.0, 33.0, 38.0, 35.0, 29.0, 50.0, 50.0, 72.0, 176.0, 1561.0, 287.0, 87.0, 51.0, 53.0, 44.0, 41.0, 36.0, 21.0, 24.0, 31.0, 16.0, 29.0, 21.0, 15.0, 14.0, 13.0, 14.0, 15.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.328125, -19.666015625, -19.00390625, -18.341796875, -17.6796875, -17.017578125, -16.35546875, -15.693359375, -15.03125, -14.369140625, -13.70703125, -13.044921875, -12.3828125, -11.720703125, -11.05859375, -10.396484375, -9.734375, -9.072265625, -8.41015625, -7.748046875, -7.0859375, -6.423828125, -5.76171875, -5.099609375, -4.4375, -3.775390625, -3.11328125, -2.451171875, -1.7890625, -1.126953125, -0.46484375, 0.197265625, 0.859375, 1.521484375, 2.18359375, 2.845703125, 3.5078125, 4.169921875, 4.83203125, 5.494140625, 6.15625, 6.818359375, 7.48046875, 8.142578125, 8.8046875, 9.466796875, 10.12890625, 10.791015625, 11.453125, 12.115234375, 12.77734375, 13.439453125, 14.1015625, 14.763671875, 15.42578125, 16.087890625, 16.75, 17.412109375, 18.07421875, 18.736328125, 19.3984375, 20.060546875, 20.72265625, 21.384765625, 22.046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 8.0, 8.0, 12.0, 14.0, 18.0, 29.0, 24.0, 33.0, 29.0, 55.0, 62.0, 74.0, 97.0, 121.0, 151.0, 227.0, 371.0, 610.0, 1595.0, 44790.0, 3042972.0, 50818.0, 1687.0, 632.0, 341.0, 228.0, 180.0, 120.0, 86.0, 54.0, 48.0, 51.0, 29.0, 29.0, 18.0, 10.0, 12.0, 12.0, 9.0, 7.0, 5.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.16015625, -34.0078125, -32.85546875, -31.703125, -30.55078125, -29.3984375, -28.24609375, -27.09375, -25.94140625, -24.7890625, -23.63671875, -22.484375, -21.33203125, -20.1796875, -19.02734375, -17.875, -16.72265625, -15.5703125, -14.41796875, -13.265625, -12.11328125, -10.9609375, -9.80859375, -8.65625, -7.50390625, -6.3515625, -5.19921875, -4.046875, -2.89453125, -1.7421875, -0.58984375, 0.5625, 1.71484375, 2.8671875, 4.01953125, 5.171875, 6.32421875, 7.4765625, 8.62890625, 9.78125, 10.93359375, 12.0859375, 13.23828125, 14.390625, 15.54296875, 16.6953125, 17.84765625, 19.0, 20.15234375, 21.3046875, 22.45703125, 23.609375, 24.76171875, 25.9140625, 27.06640625, 28.21875, 29.37109375, 30.5234375, 31.67578125, 32.828125, 33.98046875, 35.1328125, 36.28515625, 37.4375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 29.0, 123.0, 348.0, 343.0, 125.0, 28.0, 13.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.078289031982422, -22.232301712036133, -20.386314392089844, -18.540327072143555, -16.694339752197266, -14.848352432250977, -13.002365112304688, -11.156377792358398, -9.31039047241211, -7.46440315246582, -5.618415832519531, -3.772428512573242, -1.9264411926269531, -0.08045387268066406, 1.765533447265625, 3.611520767211914, 5.457508087158203, 7.303495407104492, 9.149482727050781, 10.99547004699707, 12.84145736694336, 14.687444686889648, 16.533432006835938, 18.379419326782227, 20.225406646728516, 22.071393966674805, 23.917381286621094, 25.763368606567383, 27.609355926513672, 29.45534324645996, 31.30133056640625, 33.147315979003906, 34.99330139160156, 36.83928680419922, 38.68527603149414, 40.53126525878906, 42.37725067138672, 44.223236083984375, 46.0692253112793, 47.91521453857422, 49.761199951171875, 51.60718536376953, 53.45317459106445, 55.299163818359375, 57.14514923095703, 58.99113464355469, 60.83712387084961, 62.68311309814453, 64.52909851074219, 66.37508392333984, 68.2210693359375, 70.06706237792969, 71.91304779052734, 73.759033203125, 75.60502624511719, 77.45101165771484, 79.2969970703125, 81.14298248291016, 82.98896789550781, 84.8349609375, 86.68094635009766, 88.52693176269531, 90.3729248046875, 92.21891021728516, 94.06489562988281]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 1.0, 5.0, 4.0, 8.0, 10.0, 10.0, 9.0, 11.0, 10.0, 12.0, 26.0, 15.0, 18.0, 25.0, 22.0, 26.0, 42.0, 27.0, 41.0, 42.0, 40.0, 35.0, 44.0, 37.0, 53.0, 35.0, 40.0, 34.0, 37.0, 26.0, 34.0, 31.0, 23.0, 24.0, 16.0, 19.0, 21.0, 16.0, 13.0, 12.0, 11.0, 8.0, 9.0, 3.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-51.13607406616211, -49.5098762512207, -47.8836784362793, -46.25748062133789, -44.631282806396484, -43.00508499145508, -41.37888717651367, -39.752689361572266, -38.12649154663086, -36.50029373168945, -34.87409591674805, -33.24789810180664, -31.621700286865234, -29.995502471923828, -28.369304656982422, -26.743106842041016, -25.11690902709961, -23.490711212158203, -21.864513397216797, -20.23831558227539, -18.612117767333984, -16.985919952392578, -15.359722137451172, -13.733524322509766, -12.10732650756836, -10.481128692626953, -8.854930877685547, -7.228733062744141, -5.602535247802734, -3.976337432861328, -2.350139617919922, -0.7239418029785156, 0.9022598266601562, 2.5284576416015625, 4.154655456542969, 5.780853271484375, 7.407051086425781, 9.033248901367188, 10.659446716308594, 12.28564453125, 13.911842346191406, 15.538040161132812, 17.16423797607422, 18.790435791015625, 20.41663360595703, 22.042831420898438, 23.669029235839844, 25.29522705078125, 26.921424865722656, 28.547622680664062, 30.17382049560547, 31.800018310546875, 33.42621612548828, 35.05241394042969, 36.678611755371094, 38.3048095703125, 39.931007385253906, 41.55720520019531, 43.18340301513672, 44.809600830078125, 46.43579864501953, 48.06199645996094, 49.688194274902344, 51.31439208984375, 52.940589904785156]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 1.0, 13.0, 8.0, 10.0, 13.0, 15.0, 17.0, 19.0, 14.0, 25.0, 25.0, 30.0, 26.0, 26.0, 38.0, 35.0, 43.0, 32.0, 42.0, 45.0, 41.0, 33.0, 36.0, 46.0, 33.0, 36.0, 37.0, 29.0, 32.0, 26.0, 19.0, 19.0, 27.0, 15.0, 18.0, 11.0, 12.0, 11.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.0191650390625, -5.800048828125, -5.5809326171875, -5.36181640625, -5.1427001953125, -4.923583984375, -4.7044677734375, -4.4853515625, -4.2662353515625, -4.047119140625, -3.8280029296875, -3.60888671875, -3.3897705078125, -3.170654296875, -2.9515380859375, -2.732421875, -2.5133056640625, -2.294189453125, -2.0750732421875, -1.85595703125, -1.6368408203125, -1.417724609375, -1.1986083984375, -0.9794921875, -0.7603759765625, -0.541259765625, -0.3221435546875, -0.10302734375, 0.1160888671875, 0.335205078125, 0.5543212890625, 0.7734375, 0.9925537109375, 1.211669921875, 1.4307861328125, 1.64990234375, 1.8690185546875, 2.088134765625, 2.3072509765625, 2.5263671875, 2.7454833984375, 2.964599609375, 3.1837158203125, 3.40283203125, 3.6219482421875, 3.841064453125, 4.0601806640625, 4.279296875, 4.4984130859375, 4.717529296875, 4.9366455078125, 5.15576171875, 5.3748779296875, 5.593994140625, 5.8131103515625, 6.0322265625, 6.2513427734375, 6.470458984375, 6.6895751953125, 6.90869140625, 7.1278076171875, 7.346923828125, 7.5660400390625, 7.78515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 13.0, 6.0, 17.0, 16.0, 13.0, 21.0, 16.0, 30.0, 24.0, 45.0, 47.0, 51.0, 79.0, 112.0, 178.0, 382.0, 1490.0, 15290.0, 571202.0, 3377851.0, 217059.0, 8317.0, 1083.0, 292.0, 180.0, 96.0, 56.0, 63.0, 31.0, 33.0, 37.0, 22.0, 24.0, 18.0, 13.0, 9.0, 14.0, 11.0, 8.0, 5.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.203125, -21.49560546875, -20.7880859375, -20.08056640625, -19.373046875, -18.66552734375, -17.9580078125, -17.25048828125, -16.54296875, -15.83544921875, -15.1279296875, -14.42041015625, -13.712890625, -13.00537109375, -12.2978515625, -11.59033203125, -10.8828125, -10.17529296875, -9.4677734375, -8.76025390625, -8.052734375, -7.34521484375, -6.6376953125, -5.93017578125, -5.22265625, -4.51513671875, -3.8076171875, -3.10009765625, -2.392578125, -1.68505859375, -0.9775390625, -0.27001953125, 0.4375, 1.14501953125, 1.8525390625, 2.56005859375, 3.267578125, 3.97509765625, 4.6826171875, 5.39013671875, 6.09765625, 6.80517578125, 7.5126953125, 8.22021484375, 8.927734375, 9.63525390625, 10.3427734375, 11.05029296875, 11.7578125, 12.46533203125, 13.1728515625, 13.88037109375, 14.587890625, 15.29541015625, 16.0029296875, 16.71044921875, 17.41796875, 18.12548828125, 18.8330078125, 19.54052734375, 20.248046875, 20.95556640625, 21.6630859375, 22.37060546875, 23.078125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 5.0, 6.0, 4.0, 8.0, 6.0, 17.0, 19.0, 24.0, 25.0, 41.0, 58.0, 60.0, 92.0, 95.0, 135.0, 146.0, 236.0, 310.0, 363.0, 416.0, 431.0, 330.0, 289.0, 198.0, 146.0, 140.0, 96.0, 82.0, 72.0, 54.0, 39.0, 29.0, 26.0, 19.0, 13.0, 9.0, 8.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.3587646484375, -9.022216796875, -8.6856689453125, -8.34912109375, -8.0125732421875, -7.676025390625, -7.3394775390625, -7.0029296875, -6.6663818359375, -6.329833984375, -5.9932861328125, -5.65673828125, -5.3201904296875, -4.983642578125, -4.6470947265625, -4.310546875, -3.9739990234375, -3.637451171875, -3.3009033203125, -2.96435546875, -2.6278076171875, -2.291259765625, -1.9547119140625, -1.6181640625, -1.2816162109375, -0.945068359375, -0.6085205078125, -0.27197265625, 0.0645751953125, 0.401123046875, 0.7376708984375, 1.07421875, 1.4107666015625, 1.747314453125, 2.0838623046875, 2.42041015625, 2.7569580078125, 3.093505859375, 3.4300537109375, 3.7666015625, 4.1031494140625, 4.439697265625, 4.7762451171875, 5.11279296875, 5.4493408203125, 5.785888671875, 6.1224365234375, 6.458984375, 6.7955322265625, 7.132080078125, 7.4686279296875, 7.80517578125, 8.1417236328125, 8.478271484375, 8.8148193359375, 9.1513671875, 9.4879150390625, 9.824462890625, 10.1610107421875, 10.49755859375, 10.8341064453125, 11.170654296875, 11.5072021484375, 11.84375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 9.0, 9.0, 17.0, 12.0, 29.0, 32.0, 58.0, 50.0, 71.0, 80.0, 107.0, 135.0, 230.0, 273.0, 366.0, 867.0, 11938.0, 4132243.0, 45128.0, 1049.0, 440.0, 280.0, 172.0, 136.0, 118.0, 85.0, 71.0, 56.0, 50.0, 34.0, 26.0, 30.0, 16.0, 15.0, 13.0, 11.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.625, -76.3525390625, -74.080078125, -71.8076171875, -69.53515625, -67.2626953125, -64.990234375, -62.7177734375, -60.4453125, -58.1728515625, -55.900390625, -53.6279296875, -51.35546875, -49.0830078125, -46.810546875, -44.5380859375, -42.265625, -39.9931640625, -37.720703125, -35.4482421875, -33.17578125, -30.9033203125, -28.630859375, -26.3583984375, -24.0859375, -21.8134765625, -19.541015625, -17.2685546875, -14.99609375, -12.7236328125, -10.451171875, -8.1787109375, -5.90625, -3.6337890625, -1.361328125, 0.9111328125, 3.18359375, 5.4560546875, 7.728515625, 10.0009765625, 12.2734375, 14.5458984375, 16.818359375, 19.0908203125, 21.36328125, 23.6357421875, 25.908203125, 28.1806640625, 30.453125, 32.7255859375, 34.998046875, 37.2705078125, 39.54296875, 41.8154296875, 44.087890625, 46.3603515625, 48.6328125, 50.9052734375, 53.177734375, 55.4501953125, 57.72265625, 59.9951171875, 62.267578125, 64.5400390625, 66.8125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 47.0, 296.0, 471.0, 181.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-288.2147216796875, -282.9056701660156, -277.5966491699219, -272.28759765625, -266.9785461425781, -261.66949462890625, -256.3604736328125, -251.05142211914062, -245.74237060546875, -240.43333435058594, -235.12428283691406, -229.81524658203125, -224.50619506835938, -219.19715881347656, -213.8881072998047, -208.57907104492188, -203.27001953125, -197.9609832763672, -192.6519317626953, -187.3428955078125, -182.03384399414062, -176.7248077392578, -171.41575622558594, -166.10671997070312, -160.7976837158203, -155.4886474609375, -150.17959594726562, -144.8705596923828, -139.56150817871094, -134.25247192382812, -128.94342041015625, -123.63438415527344, -118.3253173828125, -113.01627349853516, -107.70722961425781, -102.39818572998047, -97.08914184570312, -91.78009796142578, -86.47105407714844, -81.16201782226562, -75.85297393798828, -70.54393005371094, -65.2348861694336, -59.92584228515625, -54.616798400878906, -49.30775451660156, -43.998714447021484, -38.68967056274414, -33.3806266784668, -28.071582794189453, -22.76253890991211, -17.4534969329834, -12.144453048706055, -6.835409164428711, -1.5263671875, 3.7826766967773438, 9.091720581054688, 14.400764465332031, 19.709808349609375, 25.018850326538086, 30.32789421081543, 35.636940002441406, 40.945980072021484, 46.25502395629883, 51.56406784057617]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 2.0, 8.0, 16.0, 9.0, 14.0, 15.0, 22.0, 20.0, 13.0, 24.0, 18.0, 22.0, 33.0, 34.0, 32.0, 30.0, 28.0, 53.0, 42.0, 29.0, 35.0, 42.0, 37.0, 26.0, 40.0, 30.0, 27.0, 35.0, 32.0, 27.0, 27.0, 29.0, 24.0, 20.0, 21.0, 8.0, 13.0, 14.0, 6.0, 8.0, 3.0, 11.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.510982513427734, -35.232784271240234, -33.95458984375, -32.6763916015625, -31.398197174072266, -30.119998931884766, -28.8418025970459, -27.56360626220703, -26.285409927368164, -25.007213592529297, -23.72901725769043, -22.450820922851562, -21.172622680664062, -19.894428253173828, -18.616230010986328, -17.33803367614746, -16.059837341308594, -14.781641006469727, -13.50344467163086, -12.225247383117676, -10.947051048278809, -9.668854713439941, -8.390657424926758, -7.112461090087891, -5.834264755249023, -4.556068420410156, -3.277871608734131, -1.9996750354766846, -0.7214784622192383, 0.5567178726196289, 1.8349146842956543, 3.1131114959716797, 4.391304016113281, 5.669500350952148, 6.947697162628174, 8.2258939743042, 9.504090309143066, 10.782286643981934, 12.060483932495117, 13.338680267333984, 14.616876602172852, 15.895072937011719, 17.173269271850586, 18.451465606689453, 19.729663848876953, 21.007858276367188, 22.286056518554688, 23.564252853393555, 24.842449188232422, 26.12064552307129, 27.398841857910156, 28.677038192749023, 29.95523452758789, 31.23343276977539, 32.511627197265625, 33.789825439453125, 35.068023681640625, 36.346221923828125, 37.62441635131836, 38.90261459350586, 40.180809020996094, 41.459007263183594, 42.73720169067383, 44.01539993286133, 45.29359436035156]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 7.0, 18.0, 4.0, 21.0, 18.0, 23.0, 18.0, 23.0, 31.0, 32.0, 39.0, 33.0, 44.0, 29.0, 30.0, 36.0, 41.0, 58.0, 33.0, 43.0, 39.0, 35.0, 39.0, 38.0, 37.0, 28.0, 25.0, 24.0, 20.0, 17.0, 16.0, 17.0, 10.0, 14.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.22265625, -6.9989013671875, -6.775146484375, -6.5513916015625, -6.32763671875, -6.1038818359375, -5.880126953125, -5.6563720703125, -5.4326171875, -5.2088623046875, -4.985107421875, -4.7613525390625, -4.53759765625, -4.3138427734375, -4.090087890625, -3.8663330078125, -3.642578125, -3.4188232421875, -3.195068359375, -2.9713134765625, -2.74755859375, -2.5238037109375, -2.300048828125, -2.0762939453125, -1.8525390625, -1.6287841796875, -1.405029296875, -1.1812744140625, -0.95751953125, -0.7337646484375, -0.510009765625, -0.2862548828125, -0.0625, 0.1612548828125, 0.385009765625, 0.6087646484375, 0.83251953125, 1.0562744140625, 1.280029296875, 1.5037841796875, 1.7275390625, 1.9512939453125, 2.175048828125, 2.3988037109375, 2.62255859375, 2.8463134765625, 3.070068359375, 3.2938232421875, 3.517578125, 3.7413330078125, 3.965087890625, 4.1888427734375, 4.41259765625, 4.6363525390625, 4.860107421875, 5.0838623046875, 5.3076171875, 5.5313720703125, 5.755126953125, 5.9788818359375, 6.20263671875, 6.4263916015625, 6.650146484375, 6.8739013671875, 7.09765625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 18.0, 9.0, 21.0, 37.0, 56.0, 89.0, 137.0, 197.0, 273.0, 389.0, 508.0, 835.0, 1161.0, 1809.0, 2614.0, 3555.0, 5347.0, 7661.0, 11707.0, 17198.0, 26013.0, 40268.0, 62867.0, 101520.0, 166013.0, 219074.0, 138209.0, 84316.0, 53444.0, 34393.0, 22360.0, 14777.0, 10096.0, 6778.0, 4682.0, 3170.0, 2118.0, 1504.0, 1055.0, 713.0, 512.0, 333.0, 224.0, 178.0, 106.0, 71.0, 43.0, 30.0, 26.0, 19.0, 6.0, 11.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0478515625, -1.0154266357421875, -0.983001708984375, -0.9505767822265625, -0.91815185546875, -0.8857269287109375, -0.853302001953125, -0.8208770751953125, -0.7884521484375, -0.7560272216796875, -0.723602294921875, -0.6911773681640625, -0.65875244140625, -0.6263275146484375, -0.593902587890625, -0.5614776611328125, -0.529052734375, -0.4966278076171875, -0.464202880859375, -0.4317779541015625, -0.39935302734375, -0.3669281005859375, -0.334503173828125, -0.3020782470703125, -0.2696533203125, -0.2372283935546875, -0.204803466796875, -0.1723785400390625, -0.13995361328125, -0.1075286865234375, -0.075103759765625, -0.0426788330078125, -0.01025390625, 0.0221710205078125, 0.054595947265625, 0.0870208740234375, 0.11944580078125, 0.1518707275390625, 0.184295654296875, 0.2167205810546875, 0.2491455078125, 0.2815704345703125, 0.313995361328125, 0.3464202880859375, 0.37884521484375, 0.4112701416015625, 0.443695068359375, 0.4761199951171875, 0.508544921875, 0.5409698486328125, 0.573394775390625, 0.6058197021484375, 0.63824462890625, 0.6706695556640625, 0.703094482421875, 0.7355194091796875, 0.7679443359375, 0.8003692626953125, 0.832794189453125, 0.8652191162109375, 0.89764404296875, 0.9300689697265625, 0.962493896484375, 0.9949188232421875, 1.02734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 10.0, 14.0, 15.0, 12.0, 25.0, 19.0, 33.0, 17.0, 31.0, 36.0, 29.0, 40.0, 38.0, 37.0, 36.0, 44.0, 1061.0, 44.0, 40.0, 51.0, 44.0, 43.0, 33.0, 29.0, 31.0, 29.0, 28.0, 27.0, 18.0, 26.0, 17.0, 9.0, 14.0, 10.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.5655517578125, -4.416259765625, -4.2669677734375, -4.11767578125, -3.9683837890625, -3.819091796875, -3.6697998046875, -3.5205078125, -3.3712158203125, -3.221923828125, -3.0726318359375, -2.92333984375, -2.7740478515625, -2.624755859375, -2.4754638671875, -2.326171875, -2.1768798828125, -2.027587890625, -1.8782958984375, -1.72900390625, -1.5797119140625, -1.430419921875, -1.2811279296875, -1.1318359375, -0.9825439453125, -0.833251953125, -0.6839599609375, -0.53466796875, -0.3853759765625, -0.236083984375, -0.0867919921875, 0.0625, 0.2117919921875, 0.361083984375, 0.5103759765625, 0.65966796875, 0.8089599609375, 0.958251953125, 1.1075439453125, 1.2568359375, 1.4061279296875, 1.555419921875, 1.7047119140625, 1.85400390625, 2.0032958984375, 2.152587890625, 2.3018798828125, 2.451171875, 2.6004638671875, 2.749755859375, 2.8990478515625, 3.04833984375, 3.1976318359375, 3.346923828125, 3.4962158203125, 3.6455078125, 3.7947998046875, 3.944091796875, 4.0933837890625, 4.24267578125, 4.3919677734375, 4.541259765625, 4.6905517578125, 4.83984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 11.0, 18.0, 29.0, 45.0, 64.0, 91.0, 156.0, 195.0, 304.0, 455.0, 685.0, 1131.0, 1801.0, 2766.0, 4228.0, 6660.0, 10720.0, 16682.0, 27192.0, 44273.0, 74358.0, 129473.0, 1284186.0, 205998.0, 113577.0, 66363.0, 39350.0, 24453.0, 15231.0, 9548.0, 6178.0, 3904.0, 2426.0, 1568.0, 1044.0, 685.0, 423.0, 292.0, 167.0, 142.0, 88.0, 52.0, 38.0, 28.0, 12.0, 14.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.063232421875, -1.02880859375, -0.994384765625, -0.9599609375, -0.925537109375, -0.89111328125, -0.856689453125, -0.822265625, -0.787841796875, -0.75341796875, -0.718994140625, -0.6845703125, -0.650146484375, -0.61572265625, -0.581298828125, -0.546875, -0.512451171875, -0.47802734375, -0.443603515625, -0.4091796875, -0.374755859375, -0.34033203125, -0.305908203125, -0.271484375, -0.237060546875, -0.20263671875, -0.168212890625, -0.1337890625, -0.099365234375, -0.06494140625, -0.030517578125, 0.00390625, 0.038330078125, 0.07275390625, 0.107177734375, 0.1416015625, 0.176025390625, 0.21044921875, 0.244873046875, 0.279296875, 0.313720703125, 0.34814453125, 0.382568359375, 0.4169921875, 0.451416015625, 0.48583984375, 0.520263671875, 0.5546875, 0.589111328125, 0.62353515625, 0.657958984375, 0.6923828125, 0.726806640625, 0.76123046875, 0.795654296875, 0.830078125, 0.864501953125, 0.89892578125, 0.933349609375, 0.9677734375, 1.002197265625, 1.03662109375, 1.071044921875, 1.10546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 6.0, 8.0, 5.0, 8.0, 16.0, 13.0, 16.0, 35.0, 40.0, 40.0, 56.0, 62.0, 69.0, 97.0, 102.0, 69.0, 75.0, 63.0, 50.0, 42.0, 25.0, 20.0, 16.0, 9.0, 17.0, 5.0, 6.0, 7.0, 8.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009007453918457031, -0.0008743852376937866, -0.0008480250835418701, -0.0008216649293899536, -0.0007953047752380371, -0.0007689446210861206, -0.0007425844669342041, -0.0007162243127822876, -0.0006898641586303711, -0.0006635040044784546, -0.0006371438503265381, -0.0006107836961746216, -0.0005844235420227051, -0.0005580633878707886, -0.0005317032337188721, -0.0005053430795669556, -0.00047898292541503906, -0.00045262277126312256, -0.00042626261711120605, -0.00039990246295928955, -0.00037354230880737305, -0.00034718215465545654, -0.00032082200050354004, -0.00029446184635162354, -0.00026810169219970703, -0.00024174153804779053, -0.00021538138389587402, -0.00018902122974395752, -0.00016266107559204102, -0.0001363009214401245, -0.00010994076728820801, -8.35806131362915e-05, -5.7220458984375e-05, -3.0860304832458496e-05, -4.500150680541992e-06, 2.1860003471374512e-05, 4.8220157623291016e-05, 7.458031177520752e-05, 0.00010094046592712402, 0.00012730062007904053, 0.00015366077423095703, 0.00018002092838287354, 0.00020638108253479004, 0.00023274123668670654, 0.00025910139083862305, 0.00028546154499053955, 0.00031182169914245605, 0.00033818185329437256, 0.00036454200744628906, 0.00039090216159820557, 0.00041726231575012207, 0.0004436224699020386, 0.0004699826240539551, 0.0004963427782058716, 0.0005227029323577881, 0.0005490630865097046, 0.0005754232406616211, 0.0006017833948135376, 0.0006281435489654541, 0.0006545037031173706, 0.0006808638572692871, 0.0007072240114212036, 0.0007335841655731201, 0.0007599443197250366, 0.0007863044738769531]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 9.0, 13.0, 9.0, 15.0, 23.0, 27.0, 36.0, 55.0, 76.0, 153.0, 243.0, 423.0, 1709.0, 1037379.0, 6986.0, 645.0, 266.0, 151.0, 98.0, 57.0, 39.0, 40.0, 20.0, 15.0, 13.0, 8.0, 7.0, 4.0, 7.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.017974853515625, -0.017368793487548828, -0.016762733459472656, -0.016156673431396484, -0.015550613403320312, -0.01494455337524414, -0.014338493347167969, -0.013732433319091797, -0.013126373291015625, -0.012520313262939453, -0.011914253234863281, -0.01130819320678711, -0.010702133178710938, -0.010096073150634766, -0.009490013122558594, -0.008883953094482422, -0.00827789306640625, -0.007671833038330078, -0.007065773010253906, -0.006459712982177734, -0.0058536529541015625, -0.005247592926025391, -0.004641532897949219, -0.004035472869873047, -0.003429412841796875, -0.002823352813720703, -0.0022172927856445312, -0.0016112327575683594, -0.0010051727294921875, -0.0003991127014160156, 0.00020694732666015625, 0.0008130073547363281, 0.0014190673828125, 0.002025127410888672, 0.0026311874389648438, 0.0032372474670410156, 0.0038433074951171875, 0.004449367523193359, 0.005055427551269531, 0.005661487579345703, 0.006267547607421875, 0.006873607635498047, 0.007479667663574219, 0.00808572769165039, 0.008691787719726562, 0.009297847747802734, 0.009903907775878906, 0.010509967803955078, 0.01111602783203125, 0.011722087860107422, 0.012328147888183594, 0.012934207916259766, 0.013540267944335938, 0.01414632797241211, 0.014752388000488281, 0.015358448028564453, 0.015964508056640625, 0.016570568084716797, 0.01717662811279297, 0.01778268814086914, 0.018388748168945312, 0.018994808197021484, 0.019600868225097656, 0.020206928253173828, 0.02081298828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 13.0, 31.0, 175.0, 306.0, 311.0, 135.0, 35.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016441349871456623, -0.0016124630346894264, -0.0015807910822331905, -0.0015491191297769547, -0.0015174472937360406, -0.0014857753412798047, -0.0014541033888235688, -0.001422431436367333, -0.001390759483911097, -0.0013590875314548612, -0.0013274155789986253, -0.0012957437429577112, -0.0012640717905014753, -0.0012323998380452394, -0.0012007278855890036, -0.0011690559331327677, -0.0011373839806765318, -0.001105712028220296, -0.00107404007576406, -0.0010423681233078241, -0.00101069628726691, -0.0009790243348106742, -0.0009473523823544383, -0.0009156804298982024, -0.0008840085938572884, -0.0008523366414010525, -0.0008206647471524775, -0.0007889927946962416, -0.0007573208422400057, -0.0007256489479914308, -0.0006939769955351949, -0.000662305043078959, -0.000630633148830384, -0.0005989611963741481, -0.0005672893021255732, -0.0005356173496693373, -0.0005039453972131014, -0.00047227347386069596, -0.00044060155050829053, -0.00040892959805205464, -0.0003772576746996492, -0.0003455857513472438, -0.0003139137988910079, -0.00028224187553860247, -0.00025056995218619704, -0.00021889799972996116, -0.00018722607637755573, -0.00015555413847323507, -0.0001238822005689144, -9.221026266459376e-05, -6.053833203623071e-05, -2.886640140786767e-05, 2.805536496452987e-06, 3.4477474400773644e-05, 6.614939775317907e-05, 9.782133565749973e-05, 0.0001294932735618204, 0.00016116521146614105, 0.0001928371493704617, 0.00022450907272286713, 0.00025618099607527256, 0.00028785294853150845, 0.0003195248718839139, 0.0003511967952363193, 0.0003828687476925552]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 9.0, 10.0, 16.0, 8.0, 15.0, 15.0, 26.0, 21.0, 19.0, 28.0, 36.0, 28.0, 33.0, 26.0, 30.0, 38.0, 34.0, 31.0, 51.0, 38.0, 43.0, 37.0, 42.0, 30.0, 38.0, 42.0, 37.0, 31.0, 22.0, 23.0, 20.0, 13.0, 11.0, 21.0, 14.0, 10.0, 8.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003153681755065918, -0.00030407775193452835, -0.0002927873283624649, -0.00028149690479040146, -0.000270206481218338, -0.00025891605764627457, -0.0002476256340742111, -0.00023633521050214767, -0.00022504478693008423, -0.00021375436335802078, -0.00020246393978595734, -0.0001911735162138939, -0.00017988309264183044, -0.000168592669069767, -0.00015730224549770355, -0.0001460118219256401, -0.00013472139835357666, -0.00012343097478151321, -0.00011214055120944977, -0.00010085012763738632, -8.955970406532288e-05, -7.826928049325943e-05, -6.697885692119598e-05, -5.568843334913254e-05, -4.439800977706909e-05, -3.3107586205005646e-05, -2.18171626329422e-05, -1.0526739060878754e-05, 7.636845111846924e-07, 1.2054108083248138e-05, 2.3344531655311584e-05, 3.463495522737503e-05, 4.5925378799438477e-05, 5.721580237150192e-05, 6.850622594356537e-05, 7.979664951562881e-05, 9.108707308769226e-05, 0.00010237749665975571, 0.00011366792023181915, 0.0001249583438038826, 0.00013624876737594604, 0.0001475391909480095, 0.00015882961452007294, 0.00017012003809213638, 0.00018141046166419983, 0.00019270088523626328, 0.00020399130880832672, 0.00021528173238039017, 0.0002265721559524536, 0.00023786257952451706, 0.0002491530030965805, 0.00026044342666864395, 0.0002717338502407074, 0.00028302427381277084, 0.0002943146973848343, 0.00030560512095689774, 0.0003168955445289612, 0.00032818596810102463, 0.0003394763916730881, 0.0003507668152451515, 0.00036205723881721497, 0.0003733476623892784, 0.00038463808596134186, 0.0003959285095334053, 0.00040721893310546875]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 7.0, 18.0, 4.0, 21.0, 18.0, 23.0, 18.0, 23.0, 31.0, 32.0, 39.0, 33.0, 44.0, 29.0, 30.0, 36.0, 41.0, 58.0, 33.0, 43.0, 39.0, 35.0, 39.0, 38.0, 37.0, 28.0, 25.0, 24.0, 20.0, 17.0, 16.0, 17.0, 10.0, 14.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.22265625, -6.9989013671875, -6.775146484375, -6.5513916015625, -6.32763671875, -6.1038818359375, -5.880126953125, -5.6563720703125, -5.4326171875, -5.2088623046875, -4.985107421875, -4.7613525390625, -4.53759765625, -4.3138427734375, -4.090087890625, -3.8663330078125, -3.642578125, -3.4188232421875, -3.195068359375, -2.9713134765625, -2.74755859375, -2.5238037109375, -2.300048828125, -2.0762939453125, -1.8525390625, -1.6287841796875, -1.405029296875, -1.1812744140625, -0.95751953125, -0.7337646484375, -0.510009765625, -0.2862548828125, -0.0625, 0.1612548828125, 0.385009765625, 0.6087646484375, 0.83251953125, 1.0562744140625, 1.280029296875, 1.5037841796875, 1.7275390625, 1.9512939453125, 2.175048828125, 2.3988037109375, 2.62255859375, 2.8463134765625, 3.070068359375, 3.2938232421875, 3.517578125, 3.7413330078125, 3.965087890625, 4.1888427734375, 4.41259765625, 4.6363525390625, 4.860107421875, 5.0838623046875, 5.3076171875, 5.5313720703125, 5.755126953125, 5.9788818359375, 6.20263671875, 6.4263916015625, 6.650146484375, 6.8739013671875, 7.09765625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 5.0, 11.0, 10.0, 12.0, 13.0, 20.0, 33.0, 39.0, 43.0, 56.0, 72.0, 105.0, 171.0, 221.0, 362.0, 633.0, 1956.0, 11205.0, 94921.0, 766244.0, 151262.0, 16517.0, 2624.0, 753.0, 382.0, 242.0, 183.0, 115.0, 72.0, 63.0, 41.0, 31.0, 30.0, 28.0, 13.0, 17.0, 11.0, 8.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.34375, -13.9036865234375, -13.463623046875, -13.0235595703125, -12.58349609375, -12.1434326171875, -11.703369140625, -11.2633056640625, -10.8232421875, -10.3831787109375, -9.943115234375, -9.5030517578125, -9.06298828125, -8.6229248046875, -8.182861328125, -7.7427978515625, -7.302734375, -6.8626708984375, -6.422607421875, -5.9825439453125, -5.54248046875, -5.1024169921875, -4.662353515625, -4.2222900390625, -3.7822265625, -3.3421630859375, -2.902099609375, -2.4620361328125, -2.02197265625, -1.5819091796875, -1.141845703125, -0.7017822265625, -0.26171875, 0.1783447265625, 0.618408203125, 1.0584716796875, 1.49853515625, 1.9385986328125, 2.378662109375, 2.8187255859375, 3.2587890625, 3.6988525390625, 4.138916015625, 4.5789794921875, 5.01904296875, 5.4591064453125, 5.899169921875, 6.3392333984375, 6.779296875, 7.2193603515625, 7.659423828125, 8.0994873046875, 8.53955078125, 8.9796142578125, 9.419677734375, 9.8597412109375, 10.2998046875, 10.7398681640625, 11.179931640625, 11.6199951171875, 12.06005859375, 12.5001220703125, 12.940185546875, 13.3802490234375, 13.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 7.0, 12.0, 6.0, 10.0, 12.0, 10.0, 23.0, 21.0, 25.0, 22.0, 34.0, 32.0, 41.0, 36.0, 48.0, 56.0, 74.0, 247.0, 1677.0, 178.0, 57.0, 51.0, 43.0, 36.0, 42.0, 24.0, 35.0, 33.0, 18.0, 14.0, 17.0, 22.0, 16.0, 11.0, 5.0, 14.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.484375, -22.781005859375, -22.07763671875, -21.374267578125, -20.6708984375, -19.967529296875, -19.26416015625, -18.560791015625, -17.857421875, -17.154052734375, -16.45068359375, -15.747314453125, -15.0439453125, -14.340576171875, -13.63720703125, -12.933837890625, -12.23046875, -11.527099609375, -10.82373046875, -10.120361328125, -9.4169921875, -8.713623046875, -8.01025390625, -7.306884765625, -6.603515625, -5.900146484375, -5.19677734375, -4.493408203125, -3.7900390625, -3.086669921875, -2.38330078125, -1.679931640625, -0.9765625, -0.273193359375, 0.43017578125, 1.133544921875, 1.8369140625, 2.540283203125, 3.24365234375, 3.947021484375, 4.650390625, 5.353759765625, 6.05712890625, 6.760498046875, 7.4638671875, 8.167236328125, 8.87060546875, 9.573974609375, 10.27734375, 10.980712890625, 11.68408203125, 12.387451171875, 13.0908203125, 13.794189453125, 14.49755859375, 15.200927734375, 15.904296875, 16.607666015625, 17.31103515625, 18.014404296875, 18.7177734375, 19.421142578125, 20.12451171875, 20.827880859375, 21.53125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 8.0, 3.0, 11.0, 12.0, 12.0, 16.0, 23.0, 18.0, 17.0, 23.0, 42.0, 40.0, 53.0, 86.0, 88.0, 168.0, 288.0, 557.0, 2357.0, 801157.0, 2336245.0, 2886.0, 636.0, 321.0, 173.0, 103.0, 72.0, 62.0, 42.0, 29.0, 30.0, 29.0, 17.0, 13.0, 15.0, 9.0, 8.0, 11.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-49.9375, -48.32861328125, -46.7197265625, -45.11083984375, -43.501953125, -41.89306640625, -40.2841796875, -38.67529296875, -37.06640625, -35.45751953125, -33.8486328125, -32.23974609375, -30.630859375, -29.02197265625, -27.4130859375, -25.80419921875, -24.1953125, -22.58642578125, -20.9775390625, -19.36865234375, -17.759765625, -16.15087890625, -14.5419921875, -12.93310546875, -11.32421875, -9.71533203125, -8.1064453125, -6.49755859375, -4.888671875, -3.27978515625, -1.6708984375, -0.06201171875, 1.546875, 3.15576171875, 4.7646484375, 6.37353515625, 7.982421875, 9.59130859375, 11.2001953125, 12.80908203125, 14.41796875, 16.02685546875, 17.6357421875, 19.24462890625, 20.853515625, 22.46240234375, 24.0712890625, 25.68017578125, 27.2890625, 28.89794921875, 30.5068359375, 32.11572265625, 33.724609375, 35.33349609375, 36.9423828125, 38.55126953125, 40.16015625, 41.76904296875, 43.3779296875, 44.98681640625, 46.595703125, 48.20458984375, 49.8134765625, 51.42236328125, 53.03125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 13.0, 792.0, 206.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.23040008544922, -15.555150985717773, -9.879901885986328, -4.204652786254883, 1.4705963134765625, 7.145845413208008, 12.821094512939453, 18.49634552001953, 24.171592712402344, 29.84684181213379, 35.522090911865234, 41.19734191894531, 46.872589111328125, 52.54783630371094, 58.223087310791016, 63.898338317871094, 69.5735855102539, 75.24883270263672, 80.92408752441406, 86.59933471679688, 92.27458190917969, 97.9498291015625, 103.62507629394531, 109.30033111572266, 114.97557830810547, 120.65082550048828, 126.32608032226562, 132.00132751464844, 137.67657470703125, 143.35182189941406, 149.02706909179688, 154.70233154296875, 160.3775634765625, 166.0528106689453, 171.72805786132812, 177.40330505371094, 183.07855224609375, 188.75381469726562, 194.42906188964844, 200.10430908203125, 205.77955627441406, 211.45480346679688, 217.1300506591797, 222.8052978515625, 228.48056030273438, 234.1558074951172, 239.8310546875, 245.5063018798828, 251.18154907226562, 256.8568115234375, 262.53204345703125, 268.2073059082031, 273.8825378417969, 279.55780029296875, 285.2330322265625, 290.9082946777344, 296.58355712890625, 302.2588195800781, 307.9340515136719, 313.60931396484375, 319.2845458984375, 324.9598083496094, 330.6350402832031, 336.310302734375, 341.98553466796875]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 8.0, 4.0, 5.0, 11.0, 11.0, 13.0, 13.0, 13.0, 21.0, 26.0, 21.0, 28.0, 30.0, 32.0, 34.0, 51.0, 40.0, 36.0, 38.0, 49.0, 37.0, 44.0, 41.0, 34.0, 38.0, 41.0, 33.0, 30.0, 27.0, 22.0, 22.0, 31.0, 14.0, 12.0, 15.0, 16.0, 8.0, 9.0, 8.0, 12.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0], "bins": [-56.44456481933594, -54.778480529785156, -53.11240005493164, -51.446319580078125, -49.780235290527344, -48.11415100097656, -46.44807052612305, -44.78199005126953, -43.11590576171875, -41.44982147216797, -39.78374099731445, -38.11766052246094, -36.451576232910156, -34.785491943359375, -33.11941146850586, -31.45332908630371, -29.787246704101562, -28.121164321899414, -26.455081939697266, -24.788999557495117, -23.12291717529297, -21.45683479309082, -19.790752410888672, -18.124670028686523, -16.458587646484375, -14.792505264282227, -13.126422882080078, -11.46034049987793, -9.794258117675781, -8.128175735473633, -6.462093353271484, -4.796010971069336, -3.129932403564453, -1.4638500213623047, 0.20223236083984375, 1.8683147430419922, 3.5343971252441406, 5.200479507446289, 6.8665618896484375, 8.532644271850586, 10.198726654052734, 11.864809036254883, 13.530891418457031, 15.19697380065918, 16.863056182861328, 18.529138565063477, 20.195220947265625, 21.861303329467773, 23.527385711669922, 25.19346809387207, 26.85955047607422, 28.525632858276367, 30.191715240478516, 31.857797622680664, 33.52388000488281, 35.189964294433594, 36.85604476928711, 38.522125244140625, 40.188209533691406, 41.85429382324219, 43.5203742980957, 45.18645477294922, 46.8525390625, 48.51862335205078, 50.1847038269043]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 3.0, 5.0, 10.0, 14.0, 5.0, 17.0, 11.0, 26.0, 19.0, 30.0, 23.0, 37.0, 38.0, 36.0, 26.0, 33.0, 40.0, 41.0, 39.0, 44.0, 46.0, 35.0, 33.0, 38.0, 39.0, 44.0, 37.0, 31.0, 20.0, 25.0, 33.0, 21.0, 17.0, 14.0, 12.0, 9.0, 10.0, 9.0, 5.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.2734375, -7.04437255859375, -6.8153076171875, -6.58624267578125, -6.357177734375, -6.12811279296875, -5.8990478515625, -5.66998291015625, -5.44091796875, -5.21185302734375, -4.9827880859375, -4.75372314453125, -4.524658203125, -4.29559326171875, -4.0665283203125, -3.83746337890625, -3.6083984375, -3.37933349609375, -3.1502685546875, -2.92120361328125, -2.692138671875, -2.46307373046875, -2.2340087890625, -2.00494384765625, -1.77587890625, -1.54681396484375, -1.3177490234375, -1.08868408203125, -0.859619140625, -0.63055419921875, -0.4014892578125, -0.17242431640625, 0.056640625, 0.28570556640625, 0.5147705078125, 0.74383544921875, 0.972900390625, 1.20196533203125, 1.4310302734375, 1.66009521484375, 1.88916015625, 2.11822509765625, 2.3472900390625, 2.57635498046875, 2.805419921875, 3.03448486328125, 3.2635498046875, 3.49261474609375, 3.7216796875, 3.95074462890625, 4.1798095703125, 4.40887451171875, 4.637939453125, 4.86700439453125, 5.0960693359375, 5.32513427734375, 5.55419921875, 5.78326416015625, 6.0123291015625, 6.24139404296875, 6.470458984375, 6.69952392578125, 6.9285888671875, 7.15765380859375, 7.38671875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 8.0, 2.0, 8.0, 3.0, 14.0, 14.0, 25.0, 13.0, 24.0, 37.0, 45.0, 51.0, 79.0, 115.0, 257.0, 493.0, 1388.0, 7257.0, 99731.0, 2508775.0, 1521832.0, 47588.0, 4475.0, 1061.0, 371.0, 189.0, 98.0, 79.0, 65.0, 37.0, 31.0, 23.0, 25.0, 16.0, 13.0, 11.0, 5.0, 5.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.03125, -22.3515625, -21.671875, -20.9921875, -20.3125, -19.6328125, -18.953125, -18.2734375, -17.59375, -16.9140625, -16.234375, -15.5546875, -14.875, -14.1953125, -13.515625, -12.8359375, -12.15625, -11.4765625, -10.796875, -10.1171875, -9.4375, -8.7578125, -8.078125, -7.3984375, -6.71875, -6.0390625, -5.359375, -4.6796875, -4.0, -3.3203125, -2.640625, -1.9609375, -1.28125, -0.6015625, 0.078125, 0.7578125, 1.4375, 2.1171875, 2.796875, 3.4765625, 4.15625, 4.8359375, 5.515625, 6.1953125, 6.875, 7.5546875, 8.234375, 8.9140625, 9.59375, 10.2734375, 10.953125, 11.6328125, 12.3125, 12.9921875, 13.671875, 14.3515625, 15.03125, 15.7109375, 16.390625, 17.0703125, 17.75, 18.4296875, 19.109375, 19.7890625, 20.46875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 12.0, 11.0, 14.0, 17.0, 16.0, 23.0, 39.0, 47.0, 53.0, 86.0, 76.0, 114.0, 146.0, 188.0, 252.0, 330.0, 402.0, 374.0, 345.0, 338.0, 262.0, 192.0, 151.0, 127.0, 110.0, 69.0, 59.0, 41.0, 37.0, 24.0, 21.0, 21.0, 12.0, 16.0, 5.0, 4.0, 8.0, 7.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6171875, -9.292724609375, -8.96826171875, -8.643798828125, -8.3193359375, -7.994873046875, -7.67041015625, -7.345947265625, -7.021484375, -6.697021484375, -6.37255859375, -6.048095703125, -5.7236328125, -5.399169921875, -5.07470703125, -4.750244140625, -4.42578125, -4.101318359375, -3.77685546875, -3.452392578125, -3.1279296875, -2.803466796875, -2.47900390625, -2.154541015625, -1.830078125, -1.505615234375, -1.18115234375, -0.856689453125, -0.5322265625, -0.207763671875, 0.11669921875, 0.441162109375, 0.765625, 1.090087890625, 1.41455078125, 1.739013671875, 2.0634765625, 2.387939453125, 2.71240234375, 3.036865234375, 3.361328125, 3.685791015625, 4.01025390625, 4.334716796875, 4.6591796875, 4.983642578125, 5.30810546875, 5.632568359375, 5.95703125, 6.281494140625, 6.60595703125, 6.930419921875, 7.2548828125, 7.579345703125, 7.90380859375, 8.228271484375, 8.552734375, 8.877197265625, 9.20166015625, 9.526123046875, 9.8505859375, 10.175048828125, 10.49951171875, 10.823974609375, 11.1484375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 5.0, 9.0, 16.0, 21.0, 22.0, 38.0, 46.0, 52.0, 72.0, 92.0, 120.0, 161.0, 297.0, 517.0, 1835.0, 298296.0, 3885713.0, 5136.0, 680.0, 360.0, 218.0, 154.0, 93.0, 81.0, 50.0, 43.0, 31.0, 38.0, 20.0, 14.0, 10.0, 10.0, 6.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.625, -66.3505859375, -64.076171875, -61.8017578125, -59.52734375, -57.2529296875, -54.978515625, -52.7041015625, -50.4296875, -48.1552734375, -45.880859375, -43.6064453125, -41.33203125, -39.0576171875, -36.783203125, -34.5087890625, -32.234375, -29.9599609375, -27.685546875, -25.4111328125, -23.13671875, -20.8623046875, -18.587890625, -16.3134765625, -14.0390625, -11.7646484375, -9.490234375, -7.2158203125, -4.94140625, -2.6669921875, -0.392578125, 1.8818359375, 4.15625, 6.4306640625, 8.705078125, 10.9794921875, 13.25390625, 15.5283203125, 17.802734375, 20.0771484375, 22.3515625, 24.6259765625, 26.900390625, 29.1748046875, 31.44921875, 33.7236328125, 35.998046875, 38.2724609375, 40.546875, 42.8212890625, 45.095703125, 47.3701171875, 49.64453125, 51.9189453125, 54.193359375, 56.4677734375, 58.7421875, 61.0166015625, 63.291015625, 65.5654296875, 67.83984375, 70.1142578125, 72.388671875, 74.6630859375, 76.9375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 19.0, 49.0, 118.0, 135.0, 177.0, 173.0, 136.0, 86.0, 58.0, 29.0, 20.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.96239471435547, -64.2294692993164, -62.49654006958008, -60.763614654541016, -59.03068542480469, -57.297760009765625, -55.56483459472656, -53.831905364990234, -52.098976135253906, -50.366050720214844, -48.633121490478516, -46.90019607543945, -45.167266845703125, -43.43434143066406, -41.701416015625, -39.96848678588867, -38.23556137084961, -36.50263595581055, -34.76970672607422, -33.036781311035156, -31.303852081298828, -29.570926666259766, -27.83799934387207, -26.105072021484375, -24.37214469909668, -22.639217376708984, -20.90629005432129, -19.173362731933594, -17.44043731689453, -15.70750904083252, -13.97458267211914, -12.241655349731445, -10.508731842041016, -8.77580451965332, -7.042877674102783, -5.309950828552246, -3.577023506164551, -1.8440961837768555, -0.11116981506347656, 1.6217575073242188, 3.354684829711914, 5.087612152099609, 6.8205389976501465, 8.553465843200684, 10.286393165588379, 12.019320487976074, 13.752246856689453, 15.485174179077148, 17.218101501464844, 18.95102882385254, 20.683956146240234, 22.416881561279297, 24.149810791015625, 25.882736206054688, 27.615663528442383, 29.348590850830078, 31.081518173217773, 32.81444549560547, 34.54737091064453, 36.28030014038086, 38.01322555541992, 39.74615478515625, 41.47908020019531, 43.212005615234375, 44.9449348449707]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 4.0, 4.0, 11.0, 5.0, 9.0, 10.0, 22.0, 21.0, 26.0, 32.0, 31.0, 31.0, 33.0, 37.0, 36.0, 41.0, 42.0, 45.0, 44.0, 40.0, 45.0, 42.0, 48.0, 51.0, 27.0, 41.0, 32.0, 29.0, 24.0, 23.0, 25.0, 17.0, 18.0, 11.0, 9.0, 9.0, 9.0, 6.0, 8.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.00720977783203, -34.65553665161133, -33.30386734008789, -31.952194213867188, -30.600522994995117, -29.248851776123047, -27.897178649902344, -26.545507431030273, -25.193836212158203, -23.842164993286133, -22.490493774414062, -21.13882064819336, -19.78714942932129, -18.43547821044922, -17.083805084228516, -15.732133865356445, -14.380462646484375, -13.028791427612305, -11.677119255065918, -10.325447082519531, -8.973775863647461, -7.622104167938232, -6.270432472229004, -4.918760299682617, -3.567089080810547, -2.2154173851013184, -0.8637456893920898, 0.48792600631713867, 1.8395977020263672, 3.1912693977355957, 4.542941093444824, 5.894613265991211, 7.246284484863281, 8.597955703735352, 9.949627876281738, 11.301300048828125, 12.652971267700195, 14.004642486572266, 15.356314659118652, 16.70798683166504, 18.05965805053711, 19.41132926940918, 20.76300048828125, 22.114673614501953, 23.466344833374023, 24.818016052246094, 26.169689178466797, 27.521360397338867, 28.873031616210938, 30.224702835083008, 31.576374053955078, 32.92804718017578, 34.27971649169922, 35.63138961791992, 36.983062744140625, 38.33473205566406, 39.686405181884766, 41.03807830810547, 42.389747619628906, 43.74142074584961, 45.09309387207031, 46.44476318359375, 47.79643630981445, 49.148109436035156, 50.499778747558594]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 11.0, 16.0, 19.0, 18.0, 27.0, 18.0, 32.0, 17.0, 30.0, 40.0, 38.0, 27.0, 46.0, 40.0, 35.0, 44.0, 44.0, 41.0, 38.0, 34.0, 30.0, 49.0, 38.0, 34.0, 29.0, 30.0, 30.0, 21.0, 19.0, 11.0, 9.0, 14.0, 7.0, 7.0, 7.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.4053955078125, -7.166259765625, -6.9271240234375, -6.68798828125, -6.4488525390625, -6.209716796875, -5.9705810546875, -5.7314453125, -5.4923095703125, -5.253173828125, -5.0140380859375, -4.77490234375, -4.5357666015625, -4.296630859375, -4.0574951171875, -3.818359375, -3.5792236328125, -3.340087890625, -3.1009521484375, -2.86181640625, -2.6226806640625, -2.383544921875, -2.1444091796875, -1.9052734375, -1.6661376953125, -1.427001953125, -1.1878662109375, -0.94873046875, -0.7095947265625, -0.470458984375, -0.2313232421875, 0.0078125, 0.2469482421875, 0.486083984375, 0.7252197265625, 0.96435546875, 1.2034912109375, 1.442626953125, 1.6817626953125, 1.9208984375, 2.1600341796875, 2.399169921875, 2.6383056640625, 2.87744140625, 3.1165771484375, 3.355712890625, 3.5948486328125, 3.833984375, 4.0731201171875, 4.312255859375, 4.5513916015625, 4.79052734375, 5.0296630859375, 5.268798828125, 5.5079345703125, 5.7470703125, 5.9862060546875, 6.225341796875, 6.4644775390625, 6.70361328125, 6.9427490234375, 7.181884765625, 7.4210205078125, 7.66015625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 10.0, 11.0, 24.0, 32.0, 50.0, 72.0, 115.0, 204.0, 267.0, 425.0, 693.0, 1047.0, 1715.0, 2774.0, 4702.0, 7510.0, 12860.0, 22268.0, 39603.0, 71632.0, 134059.0, 263851.0, 223538.0, 115850.0, 62138.0, 34519.0, 19674.0, 11494.0, 6704.0, 4149.0, 2420.0, 1510.0, 966.0, 608.0, 369.0, 248.0, 121.0, 110.0, 57.0, 43.0, 33.0, 22.0, 18.0, 8.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.3505859375, -1.306854248046875, -1.26312255859375, -1.219390869140625, -1.1756591796875, -1.131927490234375, -1.08819580078125, -1.044464111328125, -1.000732421875, -0.957000732421875, -0.91326904296875, -0.869537353515625, -0.8258056640625, -0.782073974609375, -0.73834228515625, -0.694610595703125, -0.65087890625, -0.607147216796875, -0.56341552734375, -0.519683837890625, -0.4759521484375, -0.432220458984375, -0.38848876953125, -0.344757080078125, -0.301025390625, -0.257293701171875, -0.21356201171875, -0.169830322265625, -0.1260986328125, -0.082366943359375, -0.03863525390625, 0.005096435546875, 0.048828125, 0.092559814453125, 0.13629150390625, 0.180023193359375, 0.2237548828125, 0.267486572265625, 0.31121826171875, 0.354949951171875, 0.398681640625, 0.442413330078125, 0.48614501953125, 0.529876708984375, 0.5736083984375, 0.617340087890625, 0.66107177734375, 0.704803466796875, 0.74853515625, 0.792266845703125, 0.83599853515625, 0.879730224609375, 0.9234619140625, 0.967193603515625, 1.01092529296875, 1.054656982421875, 1.098388671875, 1.142120361328125, 1.18585205078125, 1.229583740234375, 1.2733154296875, 1.317047119140625, 1.36077880859375, 1.404510498046875, 1.4482421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 10.0, 7.0, 12.0, 9.0, 13.0, 6.0, 20.0, 20.0, 16.0, 18.0, 22.0, 33.0, 24.0, 29.0, 35.0, 31.0, 32.0, 38.0, 42.0, 43.0, 1064.0, 30.0, 29.0, 37.0, 37.0, 37.0, 32.0, 33.0, 24.0, 36.0, 26.0, 29.0, 17.0, 13.0, 15.0, 20.0, 17.0, 14.0, 18.0, 9.0, 5.0, 4.0, 1.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.07470703125, -3.9384765625, -3.80224609375, -3.666015625, -3.52978515625, -3.3935546875, -3.25732421875, -3.12109375, -2.98486328125, -2.8486328125, -2.71240234375, -2.576171875, -2.43994140625, -2.3037109375, -2.16748046875, -2.03125, -1.89501953125, -1.7587890625, -1.62255859375, -1.486328125, -1.35009765625, -1.2138671875, -1.07763671875, -0.94140625, -0.80517578125, -0.6689453125, -0.53271484375, -0.396484375, -0.26025390625, -0.1240234375, 0.01220703125, 0.1484375, 0.28466796875, 0.4208984375, 0.55712890625, 0.693359375, 0.82958984375, 0.9658203125, 1.10205078125, 1.23828125, 1.37451171875, 1.5107421875, 1.64697265625, 1.783203125, 1.91943359375, 2.0556640625, 2.19189453125, 2.328125, 2.46435546875, 2.6005859375, 2.73681640625, 2.873046875, 3.00927734375, 3.1455078125, 3.28173828125, 3.41796875, 3.55419921875, 3.6904296875, 3.82666015625, 3.962890625, 4.09912109375, 4.2353515625, 4.37158203125, 4.5078125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 10.0, 12.0, 18.0, 30.0, 47.0, 78.0, 88.0, 154.0, 234.0, 327.0, 463.0, 670.0, 995.0, 1450.0, 2050.0, 3068.0, 4617.0, 6708.0, 9916.0, 14897.0, 22525.0, 35266.0, 55791.0, 89944.0, 152458.0, 1286924.0, 155574.0, 91525.0, 56529.0, 35573.0, 22872.0, 15071.0, 10132.0, 6850.0, 4493.0, 3126.0, 2108.0, 1423.0, 975.0, 672.0, 475.0, 329.0, 220.0, 144.0, 103.0, 65.0, 43.0, 31.0, 23.0, 9.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.048828125, -1.016571044921875, -0.98431396484375, -0.952056884765625, -0.9197998046875, -0.887542724609375, -0.85528564453125, -0.823028564453125, -0.790771484375, -0.758514404296875, -0.72625732421875, -0.694000244140625, -0.6617431640625, -0.629486083984375, -0.59722900390625, -0.564971923828125, -0.53271484375, -0.500457763671875, -0.46820068359375, -0.435943603515625, -0.4036865234375, -0.371429443359375, -0.33917236328125, -0.306915283203125, -0.274658203125, -0.242401123046875, -0.21014404296875, -0.177886962890625, -0.1456298828125, -0.113372802734375, -0.08111572265625, -0.048858642578125, -0.0166015625, 0.015655517578125, 0.04791259765625, 0.080169677734375, 0.1124267578125, 0.144683837890625, 0.17694091796875, 0.209197998046875, 0.241455078125, 0.273712158203125, 0.30596923828125, 0.338226318359375, 0.3704833984375, 0.402740478515625, 0.43499755859375, 0.467254638671875, 0.49951171875, 0.531768798828125, 0.56402587890625, 0.596282958984375, 0.6285400390625, 0.660797119140625, 0.69305419921875, 0.725311279296875, 0.757568359375, 0.789825439453125, 0.82208251953125, 0.854339599609375, 0.8865966796875, 0.918853759765625, 0.95111083984375, 0.983367919921875, 1.015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 8.0, 9.0, 15.0, 15.0, 23.0, 21.0, 26.0, 37.0, 39.0, 57.0, 57.0, 53.0, 63.0, 40.0, 71.0, 40.0, 60.0, 39.0, 40.0, 40.0, 35.0, 23.0, 28.0, 23.0, 9.0, 15.0, 13.0, 12.0, 9.0, 15.0, 9.0, 4.0, 2.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006341934204101562, -0.0006148815155029297, -0.0005955696105957031, -0.0005762577056884766, -0.00055694580078125, -0.0005376338958740234, -0.0005183219909667969, -0.0004990100860595703, -0.00047969818115234375, -0.0004603862762451172, -0.0004410743713378906, -0.00042176246643066406, -0.0004024505615234375, -0.00038313865661621094, -0.0003638267517089844, -0.0003445148468017578, -0.00032520294189453125, -0.0003058910369873047, -0.0002865791320800781, -0.00026726722717285156, -0.000247955322265625, -0.00022864341735839844, -0.00020933151245117188, -0.0001900196075439453, -0.00017070770263671875, -0.0001513957977294922, -0.00013208389282226562, -0.00011277198791503906, -9.34600830078125e-05, -7.414817810058594e-05, -5.4836273193359375e-05, -3.552436828613281e-05, -1.621246337890625e-05, 3.0994415283203125e-06, 2.2411346435546875e-05, 4.172325134277344e-05, 6.103515625e-05, 8.034706115722656e-05, 9.965896606445312e-05, 0.00011897087097167969, 0.00013828277587890625, 0.0001575946807861328, 0.00017690658569335938, 0.00019621849060058594, 0.0002155303955078125, 0.00023484230041503906, 0.0002541542053222656, 0.0002734661102294922, 0.00029277801513671875, 0.0003120899200439453, 0.0003314018249511719, 0.00035071372985839844, 0.000370025634765625, 0.00038933753967285156, 0.0004086494445800781, 0.0004279613494873047, 0.00044727325439453125, 0.0004665851593017578, 0.0004858970642089844, 0.0005052089691162109, 0.0005245208740234375, 0.0005438327789306641, 0.0005631446838378906, 0.0005824565887451172, 0.0006017684936523438]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 9.0, 14.0, 13.0, 12.0, 26.0, 24.0, 26.0, 25.0, 52.0, 48.0, 76.0, 95.0, 127.0, 230.0, 482.0, 1099.0, 318087.0, 725454.0, 1328.0, 478.0, 243.0, 138.0, 121.0, 78.0, 49.0, 32.0, 35.0, 32.0, 22.0, 15.0, 18.0, 10.0, 9.0, 8.0, 7.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01404571533203125, -0.013607501983642578, -0.013169288635253906, -0.012731075286865234, -0.012292861938476562, -0.01185464859008789, -0.011416435241699219, -0.010978221893310547, -0.010540008544921875, -0.010101795196533203, -0.009663581848144531, -0.00922536849975586, -0.008787155151367188, -0.008348941802978516, -0.007910728454589844, -0.007472515106201172, -0.0070343017578125, -0.006596088409423828, -0.006157875061035156, -0.005719661712646484, -0.0052814483642578125, -0.004843235015869141, -0.004405021667480469, -0.003966808319091797, -0.003528594970703125, -0.003090381622314453, -0.0026521682739257812, -0.0022139549255371094, -0.0017757415771484375, -0.0013375282287597656, -0.0008993148803710938, -0.0004611015319824219, -2.288818359375e-05, 0.0004153251647949219, 0.0008535385131835938, 0.0012917518615722656, 0.0017299652099609375, 0.0021681785583496094, 0.0026063919067382812, 0.003044605255126953, 0.003482818603515625, 0.003921031951904297, 0.004359245300292969, 0.004797458648681641, 0.0052356719970703125, 0.005673885345458984, 0.006112098693847656, 0.006550312042236328, 0.006988525390625, 0.007426738739013672, 0.007864952087402344, 0.008303165435791016, 0.008741378784179688, 0.00917959213256836, 0.009617805480957031, 0.010056018829345703, 0.010494232177734375, 0.010932445526123047, 0.011370658874511719, 0.01180887222290039, 0.012247085571289062, 0.012685298919677734, 0.013123512268066406, 0.013561725616455078, 0.01399993896484375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 12.0, 76.0, 304.0, 397.0, 183.0, 33.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001418866217136383, -0.001380834262818098, -0.001342802424915135, -0.00130477047059685, -0.001266738516278565, -0.0012287066783756018, -0.0011906747240573168, -0.0011526427697390318, -0.0011146108154207468, -0.0010765788611024618, -0.0010385470231994987, -0.0010005150688812137, -0.0009624831145629287, -0.0009244512184523046, -0.0008864193223416805, -0.0008483873680233955, -0.0008103555301204324, -0.0007723236340098083, -0.0007342916796915233, -0.0006962597835808992, -0.0006582278292626143, -0.0006201959331519902, -0.0005821640370413661, -0.0005441320827230811, -0.000506100186612457, -0.0004680682613980025, -0.000430036336183548, -0.0003920044400729239, -0.00035397251485846937, -0.00031594058964401484, -0.00027790869353339076, -0.00023987676831893623, -0.00020184495951980352, -0.000163813034305349, -0.0001257811236428097, -8.774920570431277e-05, -4.9717287765815854e-05, -1.1685362551361322e-05, 2.634654811117798e-05, 6.437845877371728e-05, 0.00010241038398817182, 0.00014044230920262635, 0.00017847421986516565, 0.00021650613052770495, 0.0002545380557421595, 0.000292569980956614, 0.0003306018770672381, 0.0003686338022816926, 0.00040666572749614716, 0.0004446976527106017, 0.0004827295779250562, 0.0005207614740356803, 0.0005587934283539653, 0.0005968253244645894, 0.0006348572205752134, 0.0006728891748934984, 0.0007109210710041225, 0.0007489529671147466, 0.0007869849214330316, 0.0008250168175436556, 0.0008630487136542797, 0.0009010806679725647, 0.0009391125640831888, 0.0009771444601938128, 0.0010151764145120978]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 6.0, 4.0, 10.0, 7.0, 8.0, 9.0, 7.0, 20.0, 20.0, 19.0, 26.0, 24.0, 30.0, 31.0, 44.0, 33.0, 34.0, 23.0, 38.0, 38.0, 46.0, 30.0, 40.0, 56.0, 32.0, 41.0, 44.0, 36.0, 26.0, 31.0, 16.0, 30.0, 28.0, 18.0, 20.0, 14.0, 13.0, 9.0, 11.0, 13.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003337860107421875, -0.00032325461506843567, -0.00031272321939468384, -0.000302191823720932, -0.0002916604280471802, -0.00028112903237342834, -0.0002705976366996765, -0.0002600662410259247, -0.00024953484535217285, -0.00023900344967842102, -0.0002284720540046692, -0.00021794065833091736, -0.00020740926265716553, -0.0001968778669834137, -0.00018634647130966187, -0.00017581507563591003, -0.0001652836799621582, -0.00015475228428840637, -0.00014422088861465454, -0.0001336894929409027, -0.00012315809726715088, -0.00011262670159339905, -0.00010209530591964722, -9.156391024589539e-05, -8.103251457214355e-05, -7.050111889839172e-05, -5.996972322463989e-05, -4.943832755088806e-05, -3.890693187713623e-05, -2.83755362033844e-05, -1.784414052963257e-05, -7.312744855880737e-06, 3.2186508178710938e-06, 1.3750046491622925e-05, 2.4281442165374756e-05, 3.481283783912659e-05, 4.534423351287842e-05, 5.587562918663025e-05, 6.640702486038208e-05, 7.693842053413391e-05, 8.746981620788574e-05, 9.800121188163757e-05, 0.0001085326075553894, 0.00011906400322914124, 0.00012959539890289307, 0.0001401267945766449, 0.00015065819025039673, 0.00016118958592414856, 0.0001717209815979004, 0.00018225237727165222, 0.00019278377294540405, 0.00020331516861915588, 0.00021384656429290771, 0.00022437795996665955, 0.00023490935564041138, 0.0002454407513141632, 0.00025597214698791504, 0.00026650354266166687, 0.0002770349383354187, 0.00028756633400917053, 0.00029809772968292236, 0.0003086291253566742, 0.000319160521030426, 0.00032969191670417786, 0.0003402233123779297]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 11.0, 16.0, 19.0, 18.0, 27.0, 18.0, 32.0, 17.0, 30.0, 40.0, 38.0, 27.0, 46.0, 40.0, 35.0, 44.0, 44.0, 41.0, 38.0, 34.0, 30.0, 49.0, 38.0, 34.0, 29.0, 30.0, 30.0, 21.0, 19.0, 11.0, 9.0, 14.0, 7.0, 7.0, 7.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.4053955078125, -7.166259765625, -6.9271240234375, -6.68798828125, -6.4488525390625, -6.209716796875, -5.9705810546875, -5.7314453125, -5.4923095703125, -5.253173828125, -5.0140380859375, -4.77490234375, -4.5357666015625, -4.296630859375, -4.0574951171875, -3.818359375, -3.5792236328125, -3.340087890625, -3.1009521484375, -2.86181640625, -2.6226806640625, -2.383544921875, -2.1444091796875, -1.9052734375, -1.6661376953125, -1.427001953125, -1.1878662109375, -0.94873046875, -0.7095947265625, -0.470458984375, -0.2313232421875, 0.0078125, 0.2469482421875, 0.486083984375, 0.7252197265625, 0.96435546875, 1.2034912109375, 1.442626953125, 1.6817626953125, 1.9208984375, 2.1600341796875, 2.399169921875, 2.6383056640625, 2.87744140625, 3.1165771484375, 3.355712890625, 3.5948486328125, 3.833984375, 4.0731201171875, 4.312255859375, 4.5513916015625, 4.79052734375, 5.0296630859375, 5.268798828125, 5.5079345703125, 5.7470703125, 5.9862060546875, 6.225341796875, 6.4644775390625, 6.70361328125, 6.9427490234375, 7.181884765625, 7.4210205078125, 7.66015625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 6.0, 11.0, 15.0, 17.0, 24.0, 28.0, 50.0, 61.0, 88.0, 108.0, 138.0, 180.0, 244.0, 342.0, 497.0, 706.0, 1279.0, 4113.0, 26305.0, 595492.0, 390516.0, 21036.0, 3641.0, 1120.0, 651.0, 488.0, 358.0, 284.0, 192.0, 137.0, 102.0, 77.0, 55.0, 36.0, 22.0, 34.0, 22.0, 16.0, 12.0, 10.0, 7.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.34375, -18.73828125, -18.1328125, -17.52734375, -16.921875, -16.31640625, -15.7109375, -15.10546875, -14.5, -13.89453125, -13.2890625, -12.68359375, -12.078125, -11.47265625, -10.8671875, -10.26171875, -9.65625, -9.05078125, -8.4453125, -7.83984375, -7.234375, -6.62890625, -6.0234375, -5.41796875, -4.8125, -4.20703125, -3.6015625, -2.99609375, -2.390625, -1.78515625, -1.1796875, -0.57421875, 0.03125, 0.63671875, 1.2421875, 1.84765625, 2.453125, 3.05859375, 3.6640625, 4.26953125, 4.875, 5.48046875, 6.0859375, 6.69140625, 7.296875, 7.90234375, 8.5078125, 9.11328125, 9.71875, 10.32421875, 10.9296875, 11.53515625, 12.140625, 12.74609375, 13.3515625, 13.95703125, 14.5625, 15.16796875, 15.7734375, 16.37890625, 16.984375, 17.58984375, 18.1953125, 18.80078125, 19.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 4.0, 7.0, 18.0, 15.0, 16.0, 13.0, 25.0, 29.0, 26.0, 23.0, 39.0, 39.0, 41.0, 56.0, 52.0, 105.0, 1564.0, 428.0, 90.0, 54.0, 45.0, 49.0, 40.0, 38.0, 36.0, 32.0, 18.0, 25.0, 19.0, 16.0, 14.0, 16.0, 13.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.09375, -23.3623046875, -22.630859375, -21.8994140625, -21.16796875, -20.4365234375, -19.705078125, -18.9736328125, -18.2421875, -17.5107421875, -16.779296875, -16.0478515625, -15.31640625, -14.5849609375, -13.853515625, -13.1220703125, -12.390625, -11.6591796875, -10.927734375, -10.1962890625, -9.46484375, -8.7333984375, -8.001953125, -7.2705078125, -6.5390625, -5.8076171875, -5.076171875, -4.3447265625, -3.61328125, -2.8818359375, -2.150390625, -1.4189453125, -0.6875, 0.0439453125, 0.775390625, 1.5068359375, 2.23828125, 2.9697265625, 3.701171875, 4.4326171875, 5.1640625, 5.8955078125, 6.626953125, 7.3583984375, 8.08984375, 8.8212890625, 9.552734375, 10.2841796875, 11.015625, 11.7470703125, 12.478515625, 13.2099609375, 13.94140625, 14.6728515625, 15.404296875, 16.1357421875, 16.8671875, 17.5986328125, 18.330078125, 19.0615234375, 19.79296875, 20.5244140625, 21.255859375, 21.9873046875, 22.71875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 1.0, 3.0, 5.0, 3.0, 13.0, 10.0, 19.0, 14.0, 19.0, 20.0, 27.0, 30.0, 28.0, 37.0, 60.0, 70.0, 103.0, 197.0, 326.0, 959.0, 19838.0, 3113929.0, 8364.0, 758.0, 304.0, 164.0, 99.0, 50.0, 43.0, 31.0, 32.0, 33.0, 26.0, 16.0, 21.0, 16.0, 10.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.625, -62.5673828125, -60.509765625, -58.4521484375, -56.39453125, -54.3369140625, -52.279296875, -50.2216796875, -48.1640625, -46.1064453125, -44.048828125, -41.9912109375, -39.93359375, -37.8759765625, -35.818359375, -33.7607421875, -31.703125, -29.6455078125, -27.587890625, -25.5302734375, -23.47265625, -21.4150390625, -19.357421875, -17.2998046875, -15.2421875, -13.1845703125, -11.126953125, -9.0693359375, -7.01171875, -4.9541015625, -2.896484375, -0.8388671875, 1.21875, 3.2763671875, 5.333984375, 7.3916015625, 9.44921875, 11.5068359375, 13.564453125, 15.6220703125, 17.6796875, 19.7373046875, 21.794921875, 23.8525390625, 25.91015625, 27.9677734375, 30.025390625, 32.0830078125, 34.140625, 36.1982421875, 38.255859375, 40.3134765625, 42.37109375, 44.4287109375, 46.486328125, 48.5439453125, 50.6015625, 52.6591796875, 54.716796875, 56.7744140625, 58.83203125, 60.8896484375, 62.947265625, 65.0048828125, 67.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 226.0, 643.0, 131.0, 8.0, 0.0, 0.0, 1.0], "bins": [-178.9009552001953, -175.83958435058594, -172.7781982421875, -169.71682739257812, -166.6554412841797, -163.5940704345703, -160.53268432617188, -157.4713134765625, -154.40992736816406, -151.3485565185547, -148.28717041015625, -145.22579956054688, -142.16441345214844, -139.10304260253906, -136.04165649414062, -132.98028564453125, -129.91891479492188, -126.85753631591797, -123.79615783691406, -120.73477935791016, -117.67340087890625, -114.61203002929688, -111.55064392089844, -108.48927307128906, -105.42788696289062, -102.36650848388672, -99.30513000488281, -96.2437515258789, -93.182373046875, -90.12100219726562, -87.05961608886719, -83.99824523925781, -80.93685913085938, -77.87548065185547, -74.81410217285156, -71.75272369384766, -68.69134521484375, -65.62997436523438, -62.5685920715332, -59.50721740722656, -56.445838928222656, -53.38446044921875, -50.323081970214844, -47.26170349121094, -44.2003288269043, -41.13895034790039, -38.077571868896484, -35.016197204589844, -31.954818725585938, -28.89344024658203, -25.832063674926758, -22.77068519592285, -19.709308624267578, -16.647930145263672, -13.586551666259766, -10.525175094604492, -7.463796615600586, -4.402419090270996, -1.341041088104248, 1.7203369140625, 4.78171443939209, 7.84309196472168, 10.904470443725586, 13.96584701538086, 17.027225494384766]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 6.0, 4.0, 5.0, 15.0, 9.0, 9.0, 10.0, 23.0, 15.0, 17.0, 23.0, 29.0, 18.0, 38.0, 42.0, 28.0, 35.0, 43.0, 46.0, 39.0, 51.0, 38.0, 51.0, 35.0, 39.0, 38.0, 24.0, 38.0, 29.0, 39.0, 24.0, 21.0, 11.0, 20.0, 19.0, 10.0, 17.0, 10.0, 7.0, 6.0, 5.0, 10.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-55.071990966796875, -53.43459701538086, -51.797203063964844, -50.15980529785156, -48.52241134643555, -46.88501739501953, -45.247623443603516, -43.6102294921875, -41.972835540771484, -40.33544158935547, -38.69804763793945, -37.06065368652344, -35.423255920410156, -33.78586196899414, -32.148468017578125, -30.51107406616211, -28.87367820739746, -27.236284255981445, -25.598888397216797, -23.96149444580078, -22.324100494384766, -20.68670654296875, -19.0493106842041, -17.411916732788086, -15.774521827697754, -14.137126922607422, -12.499732971191406, -10.862338066101074, -9.224943161010742, -7.587549209594727, -5.9501543045043945, -4.312760353088379, -2.675365447998047, -1.0379709005355835, 0.5994236469268799, 2.236818313598633, 3.8742127418518066, 5.5116071701049805, 7.1490020751953125, 8.786396026611328, 10.42379093170166, 12.061185836791992, 13.698579788208008, 15.33597469329834, 16.973369598388672, 18.610763549804688, 20.248157501220703, 21.88555145263672, 23.522947311401367, 25.160341262817383, 26.79773712158203, 28.435131072998047, 30.072525024414062, 31.709918975830078, 33.347312927246094, 34.984710693359375, 36.62210464477539, 38.259498596191406, 39.89689254760742, 41.53428649902344, 43.17168426513672, 44.809078216552734, 46.44647216796875, 48.083866119384766, 49.72126007080078]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 12.0, 8.0, 13.0, 14.0, 12.0, 21.0, 16.0, 18.0, 26.0, 31.0, 26.0, 22.0, 27.0, 30.0, 39.0, 41.0, 39.0, 31.0, 36.0, 40.0, 38.0, 38.0, 30.0, 42.0, 38.0, 35.0, 44.0, 28.0, 23.0, 22.0, 24.0, 21.0, 18.0, 9.0, 13.0, 10.0, 13.0, 11.0, 11.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.07391357421875, -6.8470458984375, -6.62017822265625, -6.393310546875, -6.16644287109375, -5.9395751953125, -5.71270751953125, -5.48583984375, -5.25897216796875, -5.0321044921875, -4.80523681640625, -4.578369140625, -4.35150146484375, -4.1246337890625, -3.89776611328125, -3.6708984375, -3.44403076171875, -3.2171630859375, -2.99029541015625, -2.763427734375, -2.53656005859375, -2.3096923828125, -2.08282470703125, -1.85595703125, -1.62908935546875, -1.4022216796875, -1.17535400390625, -0.948486328125, -0.72161865234375, -0.4947509765625, -0.26788330078125, -0.041015625, 0.18585205078125, 0.4127197265625, 0.63958740234375, 0.866455078125, 1.09332275390625, 1.3201904296875, 1.54705810546875, 1.77392578125, 2.00079345703125, 2.2276611328125, 2.45452880859375, 2.681396484375, 2.90826416015625, 3.1351318359375, 3.36199951171875, 3.5888671875, 3.81573486328125, 4.0426025390625, 4.26947021484375, 4.496337890625, 4.72320556640625, 4.9500732421875, 5.17694091796875, 5.40380859375, 5.63067626953125, 5.8575439453125, 6.08441162109375, 6.311279296875, 6.53814697265625, 6.7650146484375, 6.99188232421875, 7.21875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 7.0, 2.0, 5.0, 6.0, 1.0, 10.0, 11.0, 3.0, 24.0, 28.0, 23.0, 46.0, 58.0, 62.0, 65.0, 95.0, 116.0, 183.0, 250.0, 377.0, 656.0, 1349.0, 3568.0, 13821.0, 129338.0, 1938843.0, 1947696.0, 136701.0, 14029.0, 3599.0, 1385.0, 604.0, 371.0, 217.0, 180.0, 127.0, 88.0, 74.0, 65.0, 30.0, 34.0, 30.0, 21.0, 19.0, 21.0, 11.0, 13.0, 10.0, 4.0, 5.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.1162109375, -15.560546875, -15.0048828125, -14.44921875, -13.8935546875, -13.337890625, -12.7822265625, -12.2265625, -11.6708984375, -11.115234375, -10.5595703125, -10.00390625, -9.4482421875, -8.892578125, -8.3369140625, -7.78125, -7.2255859375, -6.669921875, -6.1142578125, -5.55859375, -5.0029296875, -4.447265625, -3.8916015625, -3.3359375, -2.7802734375, -2.224609375, -1.6689453125, -1.11328125, -0.5576171875, -0.001953125, 0.5537109375, 1.109375, 1.6650390625, 2.220703125, 2.7763671875, 3.33203125, 3.8876953125, 4.443359375, 4.9990234375, 5.5546875, 6.1103515625, 6.666015625, 7.2216796875, 7.77734375, 8.3330078125, 8.888671875, 9.4443359375, 10.0, 10.5556640625, 11.111328125, 11.6669921875, 12.22265625, 12.7783203125, 13.333984375, 13.8896484375, 14.4453125, 15.0009765625, 15.556640625, 16.1123046875, 16.66796875, 17.2236328125, 17.779296875, 18.3349609375, 18.890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 10.0, 17.0, 19.0, 20.0, 44.0, 62.0, 84.0, 117.0, 148.0, 249.0, 399.0, 563.0, 616.0, 575.0, 392.0, 250.0, 165.0, 92.0, 81.0, 59.0, 32.0, 25.0, 15.0, 13.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.31005859375, -13.8076171875, -13.30517578125, -12.802734375, -12.30029296875, -11.7978515625, -11.29541015625, -10.79296875, -10.29052734375, -9.7880859375, -9.28564453125, -8.783203125, -8.28076171875, -7.7783203125, -7.27587890625, -6.7734375, -6.27099609375, -5.7685546875, -5.26611328125, -4.763671875, -4.26123046875, -3.7587890625, -3.25634765625, -2.75390625, -2.25146484375, -1.7490234375, -1.24658203125, -0.744140625, -0.24169921875, 0.2607421875, 0.76318359375, 1.265625, 1.76806640625, 2.2705078125, 2.77294921875, 3.275390625, 3.77783203125, 4.2802734375, 4.78271484375, 5.28515625, 5.78759765625, 6.2900390625, 6.79248046875, 7.294921875, 7.79736328125, 8.2998046875, 8.80224609375, 9.3046875, 9.80712890625, 10.3095703125, 10.81201171875, 11.314453125, 11.81689453125, 12.3193359375, 12.82177734375, 13.32421875, 13.82666015625, 14.3291015625, 14.83154296875, 15.333984375, 15.83642578125, 16.3388671875, 16.84130859375, 17.34375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 9.0, 15.0, 20.0, 23.0, 34.0, 43.0, 54.0, 78.0, 114.0, 125.0, 184.0, 313.0, 668.0, 2208.0, 45152.0, 4049742.0, 90533.0, 3013.0, 780.0, 324.0, 217.0, 131.0, 110.0, 104.0, 73.0, 41.0, 36.0, 25.0, 15.0, 24.0, 10.0, 19.0, 5.0, 5.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.9375, -49.21484375, -47.4921875, -45.76953125, -44.046875, -42.32421875, -40.6015625, -38.87890625, -37.15625, -35.43359375, -33.7109375, -31.98828125, -30.265625, -28.54296875, -26.8203125, -25.09765625, -23.375, -21.65234375, -19.9296875, -18.20703125, -16.484375, -14.76171875, -13.0390625, -11.31640625, -9.59375, -7.87109375, -6.1484375, -4.42578125, -2.703125, -0.98046875, 0.7421875, 2.46484375, 4.1875, 5.91015625, 7.6328125, 9.35546875, 11.078125, 12.80078125, 14.5234375, 16.24609375, 17.96875, 19.69140625, 21.4140625, 23.13671875, 24.859375, 26.58203125, 28.3046875, 30.02734375, 31.75, 33.47265625, 35.1953125, 36.91796875, 38.640625, 40.36328125, 42.0859375, 43.80859375, 45.53125, 47.25390625, 48.9765625, 50.69921875, 52.421875, 54.14453125, 55.8671875, 57.58984375, 59.3125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 37.0, 138.0, 304.0, 348.0, 131.0, 36.0, 8.0, 2.0, 4.0], "bins": [-213.93435668945312, -210.24412536621094, -206.55389404296875, -202.86366271972656, -199.17343139648438, -195.48321533203125, -191.79298400878906, -188.10275268554688, -184.4125213623047, -180.7222900390625, -177.0320587158203, -173.34182739257812, -169.65159606933594, -165.96136474609375, -162.27114868164062, -158.58091735839844, -154.89068603515625, -151.20045471191406, -147.51022338867188, -143.8199920654297, -140.1297607421875, -136.43954467773438, -132.7493133544922, -129.05908203125, -125.36884307861328, -121.6786117553711, -117.9883804321289, -114.29815673828125, -110.60792541503906, -106.91769409179688, -103.22746276855469, -99.5372314453125, -95.84700012207031, -92.15676879882812, -88.46653747558594, -84.77631378173828, -81.0860824584961, -77.3958511352539, -73.70561981201172, -70.01539611816406, -66.32516479492188, -62.63493347167969, -58.944705963134766, -55.25447463989258, -51.564247131347656, -47.87401580810547, -44.18378448486328, -40.49355697631836, -36.80332946777344, -33.11309814453125, -29.422870635986328, -25.73263931274414, -22.04241180419922, -18.35218048095703, -14.661951065063477, -10.971721649169922, -7.281492233276367, -3.5912625789642334, 0.09896707534790039, 3.7891969680786133, 7.479426383972168, 11.169656753540039, 14.859886169433594, 18.55011558532715, 22.240345001220703]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 5.0, 6.0, 3.0, 4.0, 10.0, 11.0, 10.0, 14.0, 15.0, 17.0, 19.0, 26.0, 27.0, 25.0, 19.0, 24.0, 29.0, 37.0, 38.0, 39.0, 40.0, 31.0, 32.0, 34.0, 46.0, 31.0, 47.0, 33.0, 26.0, 32.0, 47.0, 23.0, 23.0, 13.0, 18.0, 14.0, 25.0, 16.0, 16.0, 9.0, 15.0, 12.0, 10.0, 3.0, 11.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-35.75941467285156, -34.63930130004883, -33.51919174194336, -32.399078369140625, -31.27896499633789, -30.15885353088379, -29.038742065429688, -27.918628692626953, -26.79851722717285, -25.67840576171875, -24.558292388916016, -23.438180923461914, -22.318069458007812, -21.197956085205078, -20.077844619750977, -18.957733154296875, -17.83761978149414, -16.71750831604004, -15.597394943237305, -14.477283477783203, -13.357171058654785, -12.237058639526367, -11.116947174072266, -9.996834754943848, -8.87672233581543, -7.756609916687012, -6.636497974395752, -5.516386032104492, -4.396273612976074, -3.2761611938476562, -2.1560492515563965, -1.0359373092651367, 0.08417510986328125, 1.2042872905731201, 2.324399471282959, 3.444511651992798, 4.564623832702637, 5.684736251831055, 6.8048481941223145, 7.924960136413574, 9.045072555541992, 10.16518497467041, 11.285297393798828, 12.40540885925293, 13.525521278381348, 14.645633697509766, 15.765745162963867, 16.88585662841797, 18.005970001220703, 19.126081466674805, 20.24619483947754, 21.36630630493164, 22.486419677734375, 23.606531143188477, 24.726642608642578, 25.846755981445312, 26.966867446899414, 28.086978912353516, 29.20709228515625, 30.32720375061035, 31.447315216064453, 32.56742858886719, 33.68754196166992, 34.80765151977539, 35.927764892578125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 6.0, 6.0, 12.0, 13.0, 6.0, 22.0, 17.0, 19.0, 23.0, 34.0, 22.0, 27.0, 28.0, 37.0, 42.0, 34.0, 31.0, 43.0, 35.0, 40.0, 43.0, 46.0, 38.0, 31.0, 33.0, 30.0, 33.0, 30.0, 28.0, 22.0, 27.0, 14.0, 18.0, 19.0, 16.0, 13.0, 9.0, 9.0, 10.0, 4.0, 8.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51953125, -7.28167724609375, -7.0438232421875, -6.80596923828125, -6.568115234375, -6.33026123046875, -6.0924072265625, -5.85455322265625, -5.61669921875, -5.37884521484375, -5.1409912109375, -4.90313720703125, -4.665283203125, -4.42742919921875, -4.1895751953125, -3.95172119140625, -3.7138671875, -3.47601318359375, -3.2381591796875, -3.00030517578125, -2.762451171875, -2.52459716796875, -2.2867431640625, -2.04888916015625, -1.81103515625, -1.57318115234375, -1.3353271484375, -1.09747314453125, -0.859619140625, -0.62176513671875, -0.3839111328125, -0.14605712890625, 0.091796875, 0.32965087890625, 0.5675048828125, 0.80535888671875, 1.043212890625, 1.28106689453125, 1.5189208984375, 1.75677490234375, 1.99462890625, 2.23248291015625, 2.4703369140625, 2.70819091796875, 2.946044921875, 3.18389892578125, 3.4217529296875, 3.65960693359375, 3.8974609375, 4.13531494140625, 4.3731689453125, 4.61102294921875, 4.848876953125, 5.08673095703125, 5.3245849609375, 5.56243896484375, 5.80029296875, 6.03814697265625, 6.2760009765625, 6.51385498046875, 6.751708984375, 6.98956298828125, 7.2274169921875, 7.46527099609375, 7.703125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 4.0, 9.0, 7.0, 20.0, 22.0, 37.0, 43.0, 85.0, 105.0, 166.0, 227.0, 354.0, 438.0, 709.0, 1024.0, 1466.0, 2186.0, 3143.0, 4669.0, 6694.0, 10090.0, 15057.0, 22638.0, 34451.0, 53758.0, 85829.0, 141256.0, 224005.0, 163757.0, 98493.0, 61074.0, 39031.0, 25544.0, 16981.0, 11381.0, 7714.0, 5004.0, 3476.0, 2380.0, 1603.0, 1092.0, 778.0, 511.0, 378.0, 290.0, 189.0, 141.0, 77.0, 46.0, 44.0, 38.0, 16.0, 13.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0791015625, -1.0449981689453125, -1.010894775390625, -0.9767913818359375, -0.94268798828125, -0.9085845947265625, -0.874481201171875, -0.8403778076171875, -0.8062744140625, -0.7721710205078125, -0.738067626953125, -0.7039642333984375, -0.66986083984375, -0.6357574462890625, -0.601654052734375, -0.5675506591796875, -0.533447265625, -0.4993438720703125, -0.465240478515625, -0.4311370849609375, -0.39703369140625, -0.3629302978515625, -0.328826904296875, -0.2947235107421875, -0.2606201171875, -0.2265167236328125, -0.192413330078125, -0.1583099365234375, -0.12420654296875, -0.0901031494140625, -0.055999755859375, -0.0218963623046875, 0.01220703125, 0.0463104248046875, 0.080413818359375, 0.1145172119140625, 0.14862060546875, 0.1827239990234375, 0.216827392578125, 0.2509307861328125, 0.2850341796875, 0.3191375732421875, 0.353240966796875, 0.3873443603515625, 0.42144775390625, 0.4555511474609375, 0.489654541015625, 0.5237579345703125, 0.557861328125, 0.5919647216796875, 0.626068115234375, 0.6601715087890625, 0.69427490234375, 0.7283782958984375, 0.762481689453125, 0.7965850830078125, 0.8306884765625, 0.8647918701171875, 0.898895263671875, 0.9329986572265625, 0.96710205078125, 1.0012054443359375, 1.035308837890625, 1.0694122314453125, 1.103515625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 8.0, 10.0, 10.0, 8.0, 18.0, 13.0, 27.0, 23.0, 28.0, 29.0, 25.0, 25.0, 23.0, 34.0, 41.0, 45.0, 34.0, 37.0, 1069.0, 38.0, 34.0, 30.0, 50.0, 37.0, 35.0, 40.0, 40.0, 23.0, 24.0, 29.0, 19.0, 19.0, 11.0, 13.0, 12.0, 5.0, 9.0, 6.0, 12.0, 1.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2972412109375, -5.141357421875, -4.9854736328125, -4.82958984375, -4.6737060546875, -4.517822265625, -4.3619384765625, -4.2060546875, -4.0501708984375, -3.894287109375, -3.7384033203125, -3.58251953125, -3.4266357421875, -3.270751953125, -3.1148681640625, -2.958984375, -2.8031005859375, -2.647216796875, -2.4913330078125, -2.33544921875, -2.1795654296875, -2.023681640625, -1.8677978515625, -1.7119140625, -1.5560302734375, -1.400146484375, -1.2442626953125, -1.08837890625, -0.9324951171875, -0.776611328125, -0.6207275390625, -0.46484375, -0.3089599609375, -0.153076171875, 0.0028076171875, 0.15869140625, 0.3145751953125, 0.470458984375, 0.6263427734375, 0.7822265625, 0.9381103515625, 1.093994140625, 1.2498779296875, 1.40576171875, 1.5616455078125, 1.717529296875, 1.8734130859375, 2.029296875, 2.1851806640625, 2.341064453125, 2.4969482421875, 2.65283203125, 2.8087158203125, 2.964599609375, 3.1204833984375, 3.2763671875, 3.4322509765625, 3.588134765625, 3.7440185546875, 3.89990234375, 4.0557861328125, 4.211669921875, 4.3675537109375, 4.5234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 9.0, 12.0, 25.0, 41.0, 46.0, 91.0, 138.0, 172.0, 277.0, 379.0, 615.0, 920.0, 1456.0, 2094.0, 3098.0, 4694.0, 7172.0, 10883.0, 17039.0, 26863.0, 44315.0, 74643.0, 131300.0, 1289586.0, 201971.0, 110593.0, 63961.0, 38149.0, 23508.0, 14746.0, 9713.0, 6277.0, 4163.0, 2711.0, 1828.0, 1251.0, 801.0, 558.0, 353.0, 229.0, 158.0, 102.0, 63.0, 48.0, 28.0, 17.0, 13.0, 8.0, 4.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.169921875, -1.1320037841796875, -1.094085693359375, -1.0561676025390625, -1.01824951171875, -0.9803314208984375, -0.942413330078125, -0.9044952392578125, -0.8665771484375, -0.8286590576171875, -0.790740966796875, -0.7528228759765625, -0.71490478515625, -0.6769866943359375, -0.639068603515625, -0.6011505126953125, -0.563232421875, -0.5253143310546875, -0.487396240234375, -0.4494781494140625, -0.41156005859375, -0.3736419677734375, -0.335723876953125, -0.2978057861328125, -0.2598876953125, -0.2219696044921875, -0.184051513671875, -0.1461334228515625, -0.10821533203125, -0.0702972412109375, -0.032379150390625, 0.0055389404296875, 0.04345703125, 0.0813751220703125, 0.119293212890625, 0.1572113037109375, 0.19512939453125, 0.2330474853515625, 0.270965576171875, 0.3088836669921875, 0.3468017578125, 0.3847198486328125, 0.422637939453125, 0.4605560302734375, 0.49847412109375, 0.5363922119140625, 0.574310302734375, 0.6122283935546875, 0.650146484375, 0.6880645751953125, 0.725982666015625, 0.7639007568359375, 0.80181884765625, 0.8397369384765625, 0.877655029296875, 0.9155731201171875, 0.9534912109375, 0.9914093017578125, 1.029327392578125, 1.0672454833984375, 1.10516357421875, 1.1430816650390625, 1.180999755859375, 1.2189178466796875, 1.2568359375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 4.0, 3.0, 7.0, 16.0, 12.0, 17.0, 17.0, 18.0, 29.0, 37.0, 53.0, 68.0, 71.0, 91.0, 84.0, 84.0, 79.0, 69.0, 42.0, 47.0, 33.0, 27.0, 19.0, 21.0, 14.0, 12.0, 6.0, 10.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010671615600585938, -0.0010363012552261353, -0.0010054409503936768, -0.0009745806455612183, -0.0009437203407287598, -0.0009128600358963013, -0.0008819997310638428, -0.0008511394262313843, -0.0008202791213989258, -0.0007894188165664673, -0.0007585585117340088, -0.0007276982069015503, -0.0006968379020690918, -0.0006659775972366333, -0.0006351172924041748, -0.0006042569875717163, -0.0005733966827392578, -0.0005425363779067993, -0.0005116760730743408, -0.0004808157682418823, -0.00044995546340942383, -0.00041909515857696533, -0.00038823485374450684, -0.00035737454891204834, -0.00032651424407958984, -0.00029565393924713135, -0.00026479363441467285, -0.00023393332958221436, -0.00020307302474975586, -0.00017221271991729736, -0.00014135241508483887, -0.00011049211025238037, -7.963180541992188e-05, -4.877150058746338e-05, -1.7911195755004883e-05, 1.2949109077453613e-05, 4.380941390991211e-05, 7.46697187423706e-05, 0.0001055300235748291, 0.0001363903284072876, 0.0001672506332397461, 0.0001981109380722046, 0.00022897124290466309, 0.0002598315477371216, 0.0002906918525695801, 0.0003215521574020386, 0.00035241246223449707, 0.00038327276706695557, 0.00041413307189941406, 0.00044499337673187256, 0.00047585368156433105, 0.0005067139863967896, 0.000537574291229248, 0.0005684345960617065, 0.000599294900894165, 0.0006301552057266235, 0.000661015510559082, 0.0006918758153915405, 0.000722736120223999, 0.0007535964250564575, 0.000784456729888916, 0.0008153170347213745, 0.000846177339553833, 0.0008770376443862915, 0.00090789794921875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 15.0, 11.0, 15.0, 24.0, 36.0, 38.0, 47.0, 70.0, 98.0, 157.0, 308.0, 575.0, 3473.0, 1038840.0, 3403.0, 605.0, 287.0, 164.0, 91.0, 68.0, 59.0, 42.0, 26.0, 26.0, 11.0, 20.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.018646240234375, -0.018014192581176758, -0.017382144927978516, -0.016750097274780273, -0.01611804962158203, -0.015486001968383789, -0.014853954315185547, -0.014221906661987305, -0.013589859008789062, -0.01295781135559082, -0.012325763702392578, -0.011693716049194336, -0.011061668395996094, -0.010429620742797852, -0.00979757308959961, -0.009165525436401367, -0.008533477783203125, -0.007901430130004883, -0.007269382476806641, -0.0066373348236083984, -0.006005287170410156, -0.005373239517211914, -0.004741191864013672, -0.00410914421081543, -0.0034770965576171875, -0.0028450489044189453, -0.002213001251220703, -0.001580953598022461, -0.0009489059448242188, -0.00031685829162597656, 0.0003151893615722656, 0.0009472370147705078, 0.00157928466796875, 0.002211332321166992, 0.0028433799743652344, 0.0034754276275634766, 0.004107475280761719, 0.004739522933959961, 0.005371570587158203, 0.006003618240356445, 0.0066356658935546875, 0.00726771354675293, 0.007899761199951172, 0.008531808853149414, 0.009163856506347656, 0.009795904159545898, 0.01042795181274414, 0.011059999465942383, 0.011692047119140625, 0.012324094772338867, 0.01295614242553711, 0.013588190078735352, 0.014220237731933594, 0.014852285385131836, 0.015484333038330078, 0.01611638069152832, 0.016748428344726562, 0.017380475997924805, 0.018012523651123047, 0.01864457130432129, 0.01927661895751953, 0.019908666610717773, 0.020540714263916016, 0.021172761917114258, 0.0218048095703125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 12.0, 14.0, 38.0, 64.0, 118.0, 160.0, 200.0, 158.0, 100.0, 68.0, 39.0, 18.0, 17.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004894381272606552, -0.0004709027416538447, -0.00045236735604703426, -0.0004338319704402238, -0.00041529658483341336, -0.00039676117012277246, -0.000378225784515962, -0.00035969039890915155, -0.0003411550133023411, -0.00032261962769553065, -0.0003040842420887202, -0.00028554885648190975, -0.00026701344177126884, -0.00024847808526828885, -0.00022994267055764794, -0.0002114072849508375, -0.00019287189934402704, -0.0001743365137372166, -0.00015580112813040614, -0.00013726572797168046, -0.00011873034236487001, -0.00010019495675805956, -8.16595638752915e-05, -6.312417099252343e-05, -4.458878538571298e-05, -2.6053396140923724e-05, -7.518006896134466e-06, 1.1017382348654792e-05, 2.955277159344405e-05, 4.80881572002545e-05, 6.662355008302256e-05, 8.515894296579063e-05, 0.00010369427036494017, 0.00012222965597175062, 0.00014076504157856107, 0.00015930044173728675, 0.0001778358273440972, 0.00019637121295090765, 0.00021490661310963333, 0.00023344199871644378, 0.00025197738432325423, 0.0002705127699300647, 0.00028904815553687513, 0.0003075835411436856, 0.0003261189558543265, 0.0003446543123573065, 0.0003631897270679474, 0.00038172511267475784, 0.0004002604982815683, 0.00041879588388837874, 0.0004373312694951892, 0.00045586665510199964, 0.0004744020407088101, 0.000492937455419451, 0.000511472811922431, 0.0005300082266330719, 0.0005485436413437128, 0.0005670790560543537, 0.0005856144125573337, 0.0006041498272679746, 0.0006226851837709546, 0.0006412205984815955, 0.0006597559549845755, 0.0006782913696952164, 0.0006968267261981964]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 4.0, 5.0, 8.0, 13.0, 11.0, 14.0, 18.0, 17.0, 19.0, 26.0, 20.0, 27.0, 29.0, 30.0, 48.0, 32.0, 23.0, 40.0, 41.0, 27.0, 33.0, 47.0, 40.0, 41.0, 27.0, 39.0, 38.0, 25.0, 26.0, 32.0, 23.0, 15.0, 21.0, 21.0, 18.0, 10.0, 13.0, 11.0, 8.0, 17.0, 5.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003337264060974121, -0.0003224192187190056, -0.00031111203134059906, -0.00029980484396219254, -0.000288497656583786, -0.0002771904692053795, -0.00026588328182697296, -0.00025457609444856644, -0.0002432689070701599, -0.0002319617196917534, -0.00022065453231334686, -0.00020934734493494034, -0.0001980401575565338, -0.0001867329701781273, -0.00017542578279972076, -0.00016411859542131424, -0.00015281140804290771, -0.0001415042206645012, -0.00013019703328609467, -0.00011888984590768814, -0.00010758265852928162, -9.627547115087509e-05, -8.496828377246857e-05, -7.366109639406204e-05, -6.235390901565552e-05, -5.104672163724899e-05, -3.973953425884247e-05, -2.8432346880435944e-05, -1.712515950202942e-05, -5.817972123622894e-06, 5.48921525478363e-06, 1.6796402633190155e-05, 2.810359001159668e-05, 3.9410777390003204e-05, 5.071796476840973e-05, 6.202515214681625e-05, 7.333233952522278e-05, 8.46395269036293e-05, 9.594671428203583e-05, 0.00010725390166044235, 0.00011856108903884888, 0.0001298682764172554, 0.00014117546379566193, 0.00015248265117406845, 0.00016378983855247498, 0.0001750970259308815, 0.00018640421330928802, 0.00019771140068769455, 0.00020901858806610107, 0.0002203257754445076, 0.00023163296282291412, 0.00024294015020132065, 0.00025424733757972717, 0.0002655545249581337, 0.0002768617123365402, 0.00028816889971494675, 0.00029947608709335327, 0.0003107832744717598, 0.0003220904618501663, 0.00033339764922857285, 0.00034470483660697937, 0.0003560120239853859, 0.0003673192113637924, 0.00037862639874219894, 0.00038993358612060547]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 6.0, 6.0, 12.0, 13.0, 6.0, 22.0, 17.0, 19.0, 23.0, 34.0, 22.0, 27.0, 28.0, 37.0, 42.0, 34.0, 31.0, 43.0, 35.0, 40.0, 43.0, 46.0, 38.0, 31.0, 34.0, 29.0, 33.0, 30.0, 28.0, 22.0, 27.0, 14.0, 18.0, 19.0, 16.0, 13.0, 9.0, 9.0, 10.0, 4.0, 8.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51953125, -7.28167724609375, -7.0438232421875, -6.80596923828125, -6.568115234375, -6.33026123046875, -6.0924072265625, -5.85455322265625, -5.61669921875, -5.37884521484375, -5.1409912109375, -4.90313720703125, -4.665283203125, -4.42742919921875, -4.1895751953125, -3.95172119140625, -3.7138671875, -3.47601318359375, -3.2381591796875, -3.00030517578125, -2.762451171875, -2.52459716796875, -2.2867431640625, -2.04888916015625, -1.81103515625, -1.57318115234375, -1.3353271484375, -1.09747314453125, -0.859619140625, -0.62176513671875, -0.3839111328125, -0.14605712890625, 0.091796875, 0.32965087890625, 0.5675048828125, 0.80535888671875, 1.043212890625, 1.28106689453125, 1.5189208984375, 1.75677490234375, 1.99462890625, 2.23248291015625, 2.4703369140625, 2.70819091796875, 2.946044921875, 3.18389892578125, 3.4217529296875, 3.65960693359375, 3.8974609375, 4.13531494140625, 4.3731689453125, 4.61102294921875, 4.848876953125, 5.08673095703125, 5.3245849609375, 5.56243896484375, 5.80029296875, 6.03814697265625, 6.2760009765625, 6.51385498046875, 6.751708984375, 6.98956298828125, 7.2274169921875, 7.46527099609375, 7.703125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 8.0, 7.0, 11.0, 17.0, 24.0, 29.0, 24.0, 53.0, 54.0, 61.0, 105.0, 132.0, 182.0, 279.0, 497.0, 923.0, 1895.0, 4584.0, 11531.0, 34365.0, 116285.0, 450872.0, 308114.0, 78761.0, 24335.0, 8412.0, 3412.0, 1494.0, 728.0, 436.0, 240.0, 167.0, 128.0, 87.0, 55.0, 45.0, 56.0, 29.0, 25.0, 19.0, 16.0, 12.0, 10.0, 9.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6875, -9.38330078125, -9.0791015625, -8.77490234375, -8.470703125, -8.16650390625, -7.8623046875, -7.55810546875, -7.25390625, -6.94970703125, -6.6455078125, -6.34130859375, -6.037109375, -5.73291015625, -5.4287109375, -5.12451171875, -4.8203125, -4.51611328125, -4.2119140625, -3.90771484375, -3.603515625, -3.29931640625, -2.9951171875, -2.69091796875, -2.38671875, -2.08251953125, -1.7783203125, -1.47412109375, -1.169921875, -0.86572265625, -0.5615234375, -0.25732421875, 0.046875, 0.35107421875, 0.6552734375, 0.95947265625, 1.263671875, 1.56787109375, 1.8720703125, 2.17626953125, 2.48046875, 2.78466796875, 3.0888671875, 3.39306640625, 3.697265625, 4.00146484375, 4.3056640625, 4.60986328125, 4.9140625, 5.21826171875, 5.5224609375, 5.82666015625, 6.130859375, 6.43505859375, 6.7392578125, 7.04345703125, 7.34765625, 7.65185546875, 7.9560546875, 8.26025390625, 8.564453125, 8.86865234375, 9.1728515625, 9.47705078125, 9.78125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 5.0, 10.0, 14.0, 10.0, 10.0, 12.0, 19.0, 17.0, 25.0, 24.0, 26.0, 26.0, 23.0, 34.0, 48.0, 40.0, 51.0, 64.0, 108.0, 221.0, 1490.0, 209.0, 95.0, 64.0, 46.0, 50.0, 29.0, 43.0, 37.0, 22.0, 27.0, 19.0, 21.0, 17.0, 16.0, 16.0, 16.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.859375, -20.217041015625, -19.57470703125, -18.932373046875, -18.2900390625, -17.647705078125, -17.00537109375, -16.363037109375, -15.720703125, -15.078369140625, -14.43603515625, -13.793701171875, -13.1513671875, -12.509033203125, -11.86669921875, -11.224365234375, -10.58203125, -9.939697265625, -9.29736328125, -8.655029296875, -8.0126953125, -7.370361328125, -6.72802734375, -6.085693359375, -5.443359375, -4.801025390625, -4.15869140625, -3.516357421875, -2.8740234375, -2.231689453125, -1.58935546875, -0.947021484375, -0.3046875, 0.337646484375, 0.97998046875, 1.622314453125, 2.2646484375, 2.906982421875, 3.54931640625, 4.191650390625, 4.833984375, 5.476318359375, 6.11865234375, 6.760986328125, 7.4033203125, 8.045654296875, 8.68798828125, 9.330322265625, 9.97265625, 10.614990234375, 11.25732421875, 11.899658203125, 12.5419921875, 13.184326171875, 13.82666015625, 14.468994140625, 15.111328125, 15.753662109375, 16.39599609375, 17.038330078125, 17.6806640625, 18.322998046875, 18.96533203125, 19.607666015625, 20.25]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 10.0, 6.0, 12.0, 19.0, 25.0, 30.0, 43.0, 57.0, 91.0, 144.0, 197.0, 331.0, 657.0, 2585.0, 91752.0, 3014966.0, 31735.0, 1522.0, 559.0, 336.0, 182.0, 133.0, 90.0, 61.0, 35.0, 32.0, 28.0, 21.0, 12.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.09423828125, -32.7509765625, -31.40771484375, -30.064453125, -28.72119140625, -27.3779296875, -26.03466796875, -24.69140625, -23.34814453125, -22.0048828125, -20.66162109375, -19.318359375, -17.97509765625, -16.6318359375, -15.28857421875, -13.9453125, -12.60205078125, -11.2587890625, -9.91552734375, -8.572265625, -7.22900390625, -5.8857421875, -4.54248046875, -3.19921875, -1.85595703125, -0.5126953125, 0.83056640625, 2.173828125, 3.51708984375, 4.8603515625, 6.20361328125, 7.546875, 8.89013671875, 10.2333984375, 11.57666015625, 12.919921875, 14.26318359375, 15.6064453125, 16.94970703125, 18.29296875, 19.63623046875, 20.9794921875, 22.32275390625, 23.666015625, 25.00927734375, 26.3525390625, 27.69580078125, 29.0390625, 30.38232421875, 31.7255859375, 33.06884765625, 34.412109375, 35.75537109375, 37.0986328125, 38.44189453125, 39.78515625, 41.12841796875, 42.4716796875, 43.81494140625, 45.158203125, 46.50146484375, 47.8447265625, 49.18798828125, 50.53125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 52.0, 878.0, 85.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.468585968017578, -9.919108390808105, -3.369630813598633, 3.1798477172851562, 9.729324340820312, 16.27880096435547, 22.82828140258789, 29.377758026123047, 35.9272346496582, 42.47671127319336, 49.02619171142578, 55.57566833496094, 62.125144958496094, 68.67462158203125, 75.22410583496094, 81.77357482910156, 88.32305908203125, 94.8725357055664, 101.42201232910156, 107.97149658203125, 114.52096557617188, 121.07044982910156, 127.61992645263672, 134.16940307617188, 140.7188720703125, 147.2683563232422, 153.8178253173828, 160.3673095703125, 166.91677856445312, 173.4662628173828, 180.0157470703125, 186.56521606445312, 193.11468505859375, 199.66416931152344, 206.21363830566406, 212.76312255859375, 219.31259155273438, 225.86207580566406, 232.41156005859375, 238.96102905273438, 245.510498046875, 252.0599822998047, 258.6094665527344, 265.158935546875, 271.7084045410156, 278.25787353515625, 284.807373046875, 291.3568420410156, 297.90631103515625, 304.4557800292969, 311.0052795410156, 317.55474853515625, 324.1042175292969, 330.6536865234375, 337.20318603515625, 343.7526550292969, 350.3021545410156, 356.85162353515625, 363.401123046875, 369.9505920410156, 376.50006103515625, 383.0495300292969, 389.5990295410156, 396.14849853515625, 402.6979675292969]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 6.0, 3.0, 12.0, 9.0, 12.0, 16.0, 19.0, 24.0, 24.0, 21.0, 24.0, 23.0, 26.0, 24.0, 33.0, 24.0, 38.0, 27.0, 35.0, 40.0, 44.0, 47.0, 41.0, 41.0, 37.0, 33.0, 37.0, 26.0, 38.0, 29.0, 15.0, 24.0, 25.0, 14.0, 14.0, 24.0, 6.0, 13.0, 7.0, 7.0, 8.0, 2.0, 8.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.56782913208008, -43.14304733276367, -41.71826934814453, -40.293487548828125, -38.86870574951172, -37.44392395019531, -36.019142150878906, -34.594364166259766, -33.16958236694336, -31.744800567626953, -30.32002067565918, -28.895240783691406, -27.470458984375, -26.045677185058594, -24.62089729309082, -23.196117401123047, -21.77133560180664, -20.346553802490234, -18.92177391052246, -17.496994018554688, -16.07221221923828, -14.647431373596191, -13.222650527954102, -11.797869682312012, -10.373088836669922, -8.948307991027832, -7.523527145385742, -6.098746299743652, -4.6739654541015625, -3.2491846084594727, -1.8244037628173828, -0.39962291717529297, 1.0251579284667969, 2.4499387741088867, 3.8747196197509766, 5.299500465393066, 6.724281311035156, 8.149062156677246, 9.573843002319336, 10.998623847961426, 12.423404693603516, 13.848185539245605, 15.272966384887695, 16.69774627685547, 18.122528076171875, 19.54730987548828, 20.972089767456055, 22.396869659423828, 23.821651458740234, 25.24643325805664, 26.671213150024414, 28.095993041992188, 29.520774841308594, 30.945556640625, 32.370338439941406, 33.79511642456055, 35.21989822387695, 36.64468002319336, 38.0694580078125, 39.494239807128906, 40.91902160644531, 42.34380340576172, 43.768585205078125, 45.193363189697266, 46.61814498901367]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 3.0, 9.0, 9.0, 9.0, 12.0, 18.0, 18.0, 19.0, 14.0, 16.0, 33.0, 31.0, 24.0, 29.0, 34.0, 44.0, 38.0, 34.0, 37.0, 31.0, 29.0, 51.0, 34.0, 37.0, 43.0, 26.0, 37.0, 26.0, 23.0, 28.0, 27.0, 24.0, 24.0, 18.0, 18.0, 12.0, 15.0, 9.0, 8.0, 6.0, 8.0, 3.0, 9.0, 1.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.921875, -7.6856689453125, -7.449462890625, -7.2132568359375, -6.97705078125, -6.7408447265625, -6.504638671875, -6.2684326171875, -6.0322265625, -5.7960205078125, -5.559814453125, -5.3236083984375, -5.08740234375, -4.8511962890625, -4.614990234375, -4.3787841796875, -4.142578125, -3.9063720703125, -3.670166015625, -3.4339599609375, -3.19775390625, -2.9615478515625, -2.725341796875, -2.4891357421875, -2.2529296875, -2.0167236328125, -1.780517578125, -1.5443115234375, -1.30810546875, -1.0718994140625, -0.835693359375, -0.5994873046875, -0.36328125, -0.1270751953125, 0.109130859375, 0.3453369140625, 0.58154296875, 0.8177490234375, 1.053955078125, 1.2901611328125, 1.5263671875, 1.7625732421875, 1.998779296875, 2.2349853515625, 2.47119140625, 2.7073974609375, 2.943603515625, 3.1798095703125, 3.416015625, 3.6522216796875, 3.888427734375, 4.1246337890625, 4.36083984375, 4.5970458984375, 4.833251953125, 5.0694580078125, 5.3056640625, 5.5418701171875, 5.778076171875, 6.0142822265625, 6.25048828125, 6.4866943359375, 6.722900390625, 6.9591064453125, 7.1953125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 14.0, 5.0, 13.0, 19.0, 23.0, 13.0, 24.0, 35.0, 32.0, 41.0, 49.0, 89.0, 161.0, 349.0, 1218.0, 5671.0, 73331.0, 3047073.0, 1041844.0, 19964.0, 2909.0, 718.0, 245.0, 110.0, 53.0, 47.0, 30.0, 28.0, 28.0, 17.0, 21.0, 16.0, 14.0, 8.0, 15.0, 7.0, 9.0, 3.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.46875, -26.546875, -25.625, -24.703125, -23.78125, -22.859375, -21.9375, -21.015625, -20.09375, -19.171875, -18.25, -17.328125, -16.40625, -15.484375, -14.5625, -13.640625, -12.71875, -11.796875, -10.875, -9.953125, -9.03125, -8.109375, -7.1875, -6.265625, -5.34375, -4.421875, -3.5, -2.578125, -1.65625, -0.734375, 0.1875, 1.109375, 2.03125, 2.953125, 3.875, 4.796875, 5.71875, 6.640625, 7.5625, 8.484375, 9.40625, 10.328125, 11.25, 12.171875, 13.09375, 14.015625, 14.9375, 15.859375, 16.78125, 17.703125, 18.625, 19.546875, 20.46875, 21.390625, 22.3125, 23.234375, 24.15625, 25.078125, 26.0, 26.921875, 27.84375, 28.765625, 29.6875, 30.609375, 31.53125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 8.0, 7.0, 7.0, 10.0, 8.0, 20.0, 27.0, 21.0, 34.0, 50.0, 59.0, 75.0, 110.0, 171.0, 254.0, 352.0, 430.0, 539.0, 494.0, 427.0, 281.0, 188.0, 157.0, 81.0, 66.0, 52.0, 38.0, 25.0, 25.0, 12.0, 13.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.7119140625, -11.353515625, -10.9951171875, -10.63671875, -10.2783203125, -9.919921875, -9.5615234375, -9.203125, -8.8447265625, -8.486328125, -8.1279296875, -7.76953125, -7.4111328125, -7.052734375, -6.6943359375, -6.3359375, -5.9775390625, -5.619140625, -5.2607421875, -4.90234375, -4.5439453125, -4.185546875, -3.8271484375, -3.46875, -3.1103515625, -2.751953125, -2.3935546875, -2.03515625, -1.6767578125, -1.318359375, -0.9599609375, -0.6015625, -0.2431640625, 0.115234375, 0.4736328125, 0.83203125, 1.1904296875, 1.548828125, 1.9072265625, 2.265625, 2.6240234375, 2.982421875, 3.3408203125, 3.69921875, 4.0576171875, 4.416015625, 4.7744140625, 5.1328125, 5.4912109375, 5.849609375, 6.2080078125, 6.56640625, 6.9248046875, 7.283203125, 7.6416015625, 8.0, 8.3583984375, 8.716796875, 9.0751953125, 9.43359375, 9.7919921875, 10.150390625, 10.5087890625, 10.8671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 12.0, 12.0, 21.0, 26.0, 28.0, 68.0, 77.0, 174.0, 325.0, 914.0, 4254.0, 53604.0, 3535002.0, 581137.0, 15267.0, 2089.0, 602.0, 246.0, 131.0, 89.0, 60.0, 44.0, 22.0, 20.0, 8.0, 9.0, 6.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-42.0625, -40.919189453125, -39.77587890625, -38.632568359375, -37.4892578125, -36.345947265625, -35.20263671875, -34.059326171875, -32.916015625, -31.772705078125, -30.62939453125, -29.486083984375, -28.3427734375, -27.199462890625, -26.05615234375, -24.912841796875, -23.76953125, -22.626220703125, -21.48291015625, -20.339599609375, -19.1962890625, -18.052978515625, -16.90966796875, -15.766357421875, -14.623046875, -13.479736328125, -12.33642578125, -11.193115234375, -10.0498046875, -8.906494140625, -7.76318359375, -6.619873046875, -5.4765625, -4.333251953125, -3.18994140625, -2.046630859375, -0.9033203125, 0.239990234375, 1.38330078125, 2.526611328125, 3.669921875, 4.813232421875, 5.95654296875, 7.099853515625, 8.2431640625, 9.386474609375, 10.52978515625, 11.673095703125, 12.81640625, 13.959716796875, 15.10302734375, 16.246337890625, 17.3896484375, 18.532958984375, 19.67626953125, 20.819580078125, 21.962890625, 23.106201171875, 24.24951171875, 25.392822265625, 26.5361328125, 27.679443359375, 28.82275390625, 29.966064453125, 31.109375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 46.0, 296.0, 457.0, 190.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.51425170898438, -162.16485595703125, -156.81544494628906, -151.46604919433594, -146.11663818359375, -140.76724243164062, -135.4178466796875, -130.0684356689453, -124.71903991699219, -119.36963653564453, -114.02023315429688, -108.67083740234375, -103.3214340209961, -97.97203063964844, -92.62262725830078, -87.27322387695312, -81.92382049560547, -76.57441711425781, -71.22501373291016, -65.8756103515625, -60.526214599609375, -55.17681121826172, -49.82740783691406, -44.47800827026367, -39.128604888916016, -33.77920150756836, -28.42980194091797, -23.080398559570312, -17.73099708557129, -12.381595611572266, -7.032192230224609, -1.6827926635742188, 3.6666107177734375, 9.016012191772461, 14.3654146194458, 19.71481704711914, 25.064218521118164, 30.413619995117188, 35.763023376464844, 41.112422943115234, 46.46182632446289, 51.81122970581055, 57.16062927246094, 62.510032653808594, 67.85943603515625, 73.20883178710938, 78.55824279785156, 83.90763854980469, 89.25704193115234, 94.6064453125, 99.95584869384766, 105.30525207519531, 110.65464782714844, 116.0040512084961, 121.35345458984375, 126.70285034179688, 132.05226135253906, 137.4016571044922, 142.75106811523438, 148.1004638671875, 153.4498748779297, 158.7992706298828, 164.148681640625, 169.49807739257812, 174.84747314453125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 11.0, 13.0, 18.0, 18.0, 23.0, 34.0, 27.0, 36.0, 23.0, 23.0, 31.0, 28.0, 36.0, 40.0, 21.0, 36.0, 38.0, 41.0, 53.0, 24.0, 41.0, 49.0, 31.0, 25.0, 22.0, 31.0, 33.0, 25.0, 14.0, 23.0, 15.0, 15.0, 9.0, 15.0, 7.0, 10.0, 8.0, 6.0, 3.0, 6.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.921142578125, -30.824615478515625, -29.72808837890625, -28.631561279296875, -27.5350341796875, -26.438507080078125, -25.34197998046875, -24.245452880859375, -23.14892578125, -22.052398681640625, -20.95587158203125, -19.859344482421875, -18.7628173828125, -17.666290283203125, -16.56976318359375, -15.473236083984375, -14.376708984375, -13.280181884765625, -12.18365478515625, -11.087127685546875, -9.9906005859375, -8.894073486328125, -7.79754638671875, -6.701019287109375, -5.6044921875, -4.507965087890625, -3.41143798828125, -2.314910888671875, -1.2183837890625, -0.121856689453125, 0.97467041015625, 2.071197509765625, 3.167724609375, 4.264251708984375, 5.36077880859375, 6.457305908203125, 7.5538330078125, 8.650360107421875, 9.74688720703125, 10.843414306640625, 11.93994140625, 13.036468505859375, 14.13299560546875, 15.229522705078125, 16.3260498046875, 17.422576904296875, 18.51910400390625, 19.615631103515625, 20.712158203125, 21.808685302734375, 22.90521240234375, 24.001739501953125, 25.0982666015625, 26.194793701171875, 27.29132080078125, 28.387847900390625, 29.484375, 30.580902099609375, 31.67742919921875, 32.773956298828125, 33.8704833984375, 34.967010498046875, 36.06353759765625, 37.160064697265625, 38.256591796875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 5.0, 14.0, 17.0, 16.0, 16.0, 20.0, 21.0, 17.0, 25.0, 35.0, 35.0, 39.0, 38.0, 30.0, 32.0, 32.0, 34.0, 31.0, 35.0, 53.0, 42.0, 29.0, 36.0, 34.0, 27.0, 29.0, 27.0, 35.0, 30.0, 23.0, 17.0, 21.0, 18.0, 12.0, 18.0, 3.0, 15.0, 3.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.453125, -8.20648193359375, -7.9598388671875, -7.71319580078125, -7.466552734375, -7.21990966796875, -6.9732666015625, -6.72662353515625, -6.47998046875, -6.23333740234375, -5.9866943359375, -5.74005126953125, -5.493408203125, -5.24676513671875, -5.0001220703125, -4.75347900390625, -4.5068359375, -4.26019287109375, -4.0135498046875, -3.76690673828125, -3.520263671875, -3.27362060546875, -3.0269775390625, -2.78033447265625, -2.53369140625, -2.28704833984375, -2.0404052734375, -1.79376220703125, -1.547119140625, -1.30047607421875, -1.0538330078125, -0.80718994140625, -0.560546875, -0.31390380859375, -0.0672607421875, 0.17938232421875, 0.426025390625, 0.67266845703125, 0.9193115234375, 1.16595458984375, 1.41259765625, 1.65924072265625, 1.9058837890625, 2.15252685546875, 2.399169921875, 2.64581298828125, 2.8924560546875, 3.13909912109375, 3.3857421875, 3.63238525390625, 3.8790283203125, 4.12567138671875, 4.372314453125, 4.61895751953125, 4.8656005859375, 5.11224365234375, 5.35888671875, 5.60552978515625, 5.8521728515625, 6.09881591796875, 6.345458984375, 6.59210205078125, 6.8387451171875, 7.08538818359375, 7.33203125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 28.0, 29.0, 61.0, 77.0, 125.0, 173.0, 275.0, 450.0, 704.0, 1105.0, 1686.0, 2702.0, 4171.0, 6606.0, 10400.0, 16147.0, 25838.0, 41588.0, 67314.0, 111828.0, 202906.0, 230200.0, 125667.0, 74728.0, 46022.0, 28516.0, 17783.0, 11332.0, 7248.0, 4648.0, 2935.0, 1870.0, 1196.0, 793.0, 490.0, 322.0, 208.0, 130.0, 88.0, 59.0, 26.0, 21.0, 14.0, 9.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3192596435546875, -1.278167724609375, -1.2370758056640625, -1.19598388671875, -1.1548919677734375, -1.113800048828125, -1.0727081298828125, -1.0316162109375, -0.9905242919921875, -0.949432373046875, -0.9083404541015625, -0.86724853515625, -0.8261566162109375, -0.785064697265625, -0.7439727783203125, -0.702880859375, -0.6617889404296875, -0.620697021484375, -0.5796051025390625, -0.53851318359375, -0.4974212646484375, -0.456329345703125, -0.4152374267578125, -0.3741455078125, -0.3330535888671875, -0.291961669921875, -0.2508697509765625, -0.20977783203125, -0.1686859130859375, -0.127593994140625, -0.0865020751953125, -0.04541015625, -0.0043182373046875, 0.036773681640625, 0.0778656005859375, 0.11895751953125, 0.1600494384765625, 0.201141357421875, 0.2422332763671875, 0.2833251953125, 0.3244171142578125, 0.365509033203125, 0.4066009521484375, 0.44769287109375, 0.4887847900390625, 0.529876708984375, 0.5709686279296875, 0.612060546875, 0.6531524658203125, 0.694244384765625, 0.7353363037109375, 0.77642822265625, 0.8175201416015625, 0.858612060546875, 0.8997039794921875, 0.9407958984375, 0.9818878173828125, 1.022979736328125, 1.0640716552734375, 1.10516357421875, 1.1462554931640625, 1.187347412109375, 1.2284393310546875, 1.26953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 6.0, 8.0, 10.0, 14.0, 12.0, 16.0, 25.0, 18.0, 25.0, 32.0, 30.0, 33.0, 26.0, 36.0, 36.0, 49.0, 35.0, 42.0, 45.0, 1061.0, 37.0, 48.0, 53.0, 25.0, 40.0, 30.0, 27.0, 42.0, 27.0, 20.0, 16.0, 22.0, 12.0, 7.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.65625, -5.4903564453125, -5.324462890625, -5.1585693359375, -4.99267578125, -4.8267822265625, -4.660888671875, -4.4949951171875, -4.3291015625, -4.1632080078125, -3.997314453125, -3.8314208984375, -3.66552734375, -3.4996337890625, -3.333740234375, -3.1678466796875, -3.001953125, -2.8360595703125, -2.670166015625, -2.5042724609375, -2.33837890625, -2.1724853515625, -2.006591796875, -1.8406982421875, -1.6748046875, -1.5089111328125, -1.343017578125, -1.1771240234375, -1.01123046875, -0.8453369140625, -0.679443359375, -0.5135498046875, -0.34765625, -0.1817626953125, -0.015869140625, 0.1500244140625, 0.31591796875, 0.4818115234375, 0.647705078125, 0.8135986328125, 0.9794921875, 1.1453857421875, 1.311279296875, 1.4771728515625, 1.64306640625, 1.8089599609375, 1.974853515625, 2.1407470703125, 2.306640625, 2.4725341796875, 2.638427734375, 2.8043212890625, 2.97021484375, 3.1361083984375, 3.302001953125, 3.4678955078125, 3.6337890625, 3.7996826171875, 3.965576171875, 4.1314697265625, 4.29736328125, 4.4632568359375, 4.629150390625, 4.7950439453125, 4.9609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 4.0, 13.0, 24.0, 24.0, 32.0, 50.0, 93.0, 131.0, 181.0, 271.0, 444.0, 640.0, 908.0, 1373.0, 1979.0, 2951.0, 4389.0, 6773.0, 10523.0, 16655.0, 26665.0, 43635.0, 74338.0, 130586.0, 1299009.0, 204016.0, 108605.0, 61908.0, 37097.0, 22763.0, 14380.0, 8926.0, 5919.0, 3800.0, 2586.0, 1772.0, 1199.0, 795.0, 552.0, 359.0, 253.0, 169.0, 104.0, 81.0, 54.0, 37.0, 25.0, 12.0, 11.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2509765625, -1.2116851806640625, -1.172393798828125, -1.1331024169921875, -1.09381103515625, -1.0545196533203125, -1.015228271484375, -0.9759368896484375, -0.9366455078125, -0.8973541259765625, -0.858062744140625, -0.8187713623046875, -0.77947998046875, -0.7401885986328125, -0.700897216796875, -0.6616058349609375, -0.622314453125, -0.5830230712890625, -0.543731689453125, -0.5044403076171875, -0.46514892578125, -0.4258575439453125, -0.386566162109375, -0.3472747802734375, -0.3079833984375, -0.2686920166015625, -0.229400634765625, -0.1901092529296875, -0.15081787109375, -0.1115264892578125, -0.072235107421875, -0.0329437255859375, 0.00634765625, 0.0456390380859375, 0.084930419921875, 0.1242218017578125, 0.16351318359375, 0.2028045654296875, 0.242095947265625, 0.2813873291015625, 0.3206787109375, 0.3599700927734375, 0.399261474609375, 0.4385528564453125, 0.47784423828125, 0.5171356201171875, 0.556427001953125, 0.5957183837890625, 0.635009765625, 0.6743011474609375, 0.713592529296875, 0.7528839111328125, 0.79217529296875, 0.8314666748046875, 0.870758056640625, 0.9100494384765625, 0.9493408203125, 0.9886322021484375, 1.027923583984375, 1.0672149658203125, 1.10650634765625, 1.1457977294921875, 1.185089111328125, 1.2243804931640625, 1.263671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 2.0, 6.0, 7.0, 6.0, 6.0, 9.0, 12.0, 19.0, 25.0, 17.0, 22.0, 31.0, 41.0, 37.0, 58.0, 54.0, 58.0, 73.0, 57.0, 55.0, 71.0, 61.0, 46.0, 40.0, 35.0, 22.0, 27.0, 22.0, 20.0, 13.0, 13.0, 6.0, 2.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0009264945983886719, -0.000896550714969635, -0.0008666068315505981, -0.0008366629481315613, -0.0008067190647125244, -0.0007767751812934875, -0.0007468312978744507, -0.0007168874144554138, -0.000686943531036377, -0.0006569996476173401, -0.0006270557641983032, -0.0005971118807792664, -0.0005671679973602295, -0.0005372241139411926, -0.0005072802305221558, -0.0004773363471031189, -0.00044739246368408203, -0.00041744858026504517, -0.0003875046968460083, -0.00035756081342697144, -0.00032761693000793457, -0.0002976730465888977, -0.00026772916316986084, -0.00023778527975082397, -0.0002078413963317871, -0.00017789751291275024, -0.00014795362949371338, -0.00011800974607467651, -8.806586265563965e-05, -5.812197923660278e-05, -2.8178095817565918e-05, 1.7657876014709473e-06, 3.170967102050781e-05, 6.165355443954468e-05, 9.159743785858154e-05, 0.00012154132127761841, 0.00015148520469665527, 0.00018142908811569214, 0.000211372971534729, 0.00024131685495376587, 0.00027126073837280273, 0.0003012046217918396, 0.00033114850521087646, 0.00036109238862991333, 0.0003910362720489502, 0.00042098015546798706, 0.0004509240388870239, 0.0004808679223060608, 0.0005108118057250977, 0.0005407556891441345, 0.0005706995725631714, 0.0006006434559822083, 0.0006305873394012451, 0.000660531222820282, 0.0006904751062393188, 0.0007204189896583557, 0.0007503628730773926, 0.0007803067564964294, 0.0008102506399154663, 0.0008401945233345032, 0.00087013840675354, 0.0009000822901725769, 0.0009300261735916138, 0.0009599700570106506, 0.0009899139404296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 7.0, 6.0, 11.0, 13.0, 8.0, 10.0, 22.0, 25.0, 27.0, 38.0, 48.0, 62.0, 92.0, 110.0, 186.0, 338.0, 703.0, 12171.0, 1030639.0, 2360.0, 592.0, 292.0, 207.0, 139.0, 98.0, 82.0, 47.0, 42.0, 28.0, 36.0, 27.0, 15.0, 12.0, 19.0, 10.0, 9.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019622802734375, -0.019016265869140625, -0.01840972900390625, -0.017803192138671875, -0.0171966552734375, -0.016590118408203125, -0.01598358154296875, -0.015377044677734375, -0.0147705078125, -0.014163970947265625, -0.01355743408203125, -0.012950897216796875, -0.0123443603515625, -0.011737823486328125, -0.01113128662109375, -0.010524749755859375, -0.009918212890625, -0.009311676025390625, -0.00870513916015625, -0.008098602294921875, -0.0074920654296875, -0.006885528564453125, -0.00627899169921875, -0.005672454833984375, -0.00506591796875, -0.004459381103515625, -0.00385284423828125, -0.003246307373046875, -0.0026397705078125, -0.002033233642578125, -0.00142669677734375, -0.000820159912109375, -0.000213623046875, 0.000392913818359375, 0.00099945068359375, 0.001605987548828125, 0.0022125244140625, 0.002819061279296875, 0.00342559814453125, 0.004032135009765625, 0.004638671875, 0.005245208740234375, 0.00585174560546875, 0.006458282470703125, 0.0070648193359375, 0.007671356201171875, 0.00827789306640625, 0.008884429931640625, 0.009490966796875, 0.010097503662109375, 0.01070404052734375, 0.011310577392578125, 0.0119171142578125, 0.012523651123046875, 0.01313018798828125, 0.013736724853515625, 0.01434326171875, 0.014949798583984375, 0.01555633544921875, 0.016162872314453125, 0.0167694091796875, 0.017375946044921875, 0.01798248291015625, 0.018589019775390625, 0.019195556640625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 20.0, 209.0, 563.0, 200.0, 18.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015271920710802078, -0.0014648339711129665, -0.0014024758711457253, -0.0013401176547631621, -0.0012777595547959208, -0.0012154014548286796, -0.0011530432384461164, -0.0010906851384788752, -0.0010283270385116339, -0.0009659689385443926, -0.0009036107803694904, -0.0008412526221945882, -0.0007788945222273469, -0.0007165364222601056, -0.0006541782640852034, -0.0005918201059103012, -0.0005294620059430599, -0.0004671038768719882, -0.00040474574780091643, -0.0003423876187298447, -0.00028002948965877295, -0.0002176713605877012, -0.00015531323151662946, -9.295510244555771e-05, -3.059697337448597e-05, 3.1761155696585774e-05, 9.411928476765752e-05, 0.00015647741383872926, 0.000218835542909801, 0.00028119367198087275, 0.0003435518010519445, 0.00040590993012301624, 0.000468268059194088, 0.0005306261591613293, 0.0005929843173362315, 0.0006553424755111337, 0.000717700575478375, 0.0007800586754456162, 0.0008424168336205184, 0.0009047749917954206, 0.0009671330917626619, 0.0010294911917299032, 0.0010918492916971445, 0.0011542075080797076, 0.001216565608046949, 0.0012789237080141902, 0.0013412819243967533, 0.0014036400243639946, 0.0014659981243312359, 0.0015283562242984772, 0.0015907143242657185, 0.0016530725406482816, 0.0017154306406155229, 0.0017777887405827641, 0.0018401469569653273, 0.0019025050569325686, 0.00196486315689981, 0.002027221256867051, 0.0020895793568342924, 0.0021519374568015337, 0.0022142957895994186, 0.00227665388956666, 0.002339011989533901, 0.0024013700895011425, 0.002463728189468384]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 5.0, 10.0, 12.0, 13.0, 7.0, 21.0, 10.0, 19.0, 26.0, 20.0, 34.0, 34.0, 39.0, 38.0, 34.0, 32.0, 37.0, 38.0, 36.0, 40.0, 49.0, 43.0, 43.0, 36.0, 39.0, 35.0, 35.0, 24.0, 28.0, 25.0, 15.0, 19.0, 21.0, 17.0, 5.0, 12.0, 11.0, 8.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004550814628601074, -0.00044012628495693207, -0.0004251711070537567, -0.00041021592915058136, -0.000395260751247406, -0.00038030557334423065, -0.0003653503954410553, -0.00035039521753787994, -0.0003354400396347046, -0.00032048486173152924, -0.0003055296838283539, -0.00029057450592517853, -0.0002756193280220032, -0.0002606641501188278, -0.00024570897221565247, -0.0002307537943124771, -0.00021579861640930176, -0.0002008434385061264, -0.00018588826060295105, -0.0001709330826997757, -0.00015597790479660034, -0.000141022726893425, -0.00012606754899024963, -0.00011111237108707428, -9.615719318389893e-05, -8.120201528072357e-05, -6.624683737754822e-05, -5.1291659474372864e-05, -3.633648157119751e-05, -2.1381303668022156e-05, -6.426125764846802e-06, 8.529052138328552e-06, 2.3484230041503906e-05, 3.843940794467926e-05, 5.3394585847854614e-05, 6.834976375102997e-05, 8.330494165420532e-05, 9.826011955738068e-05, 0.00011321529746055603, 0.00012817047536373138, 0.00014312565326690674, 0.0001580808311700821, 0.00017303600907325745, 0.0001879911869764328, 0.00020294636487960815, 0.0002179015427827835, 0.00023285672068595886, 0.0002478118985891342, 0.00026276707649230957, 0.0002777222543954849, 0.0002926774322986603, 0.00030763261020183563, 0.000322587788105011, 0.00033754296600818634, 0.0003524981439113617, 0.00036745332181453705, 0.0003824084997177124, 0.00039736367762088776, 0.0004123188555240631, 0.00042727403342723846, 0.0004422292113304138, 0.00045718438923358917, 0.0004721395671367645, 0.0004870947450399399, 0.0005020499229431152]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 5.0, 14.0, 17.0, 16.0, 16.0, 20.0, 21.0, 17.0, 25.0, 35.0, 35.0, 39.0, 38.0, 30.0, 32.0, 32.0, 34.0, 31.0, 35.0, 53.0, 42.0, 29.0, 36.0, 34.0, 27.0, 29.0, 27.0, 35.0, 30.0, 23.0, 16.0, 22.0, 18.0, 12.0, 18.0, 3.0, 15.0, 3.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.453125, -8.20648193359375, -7.9598388671875, -7.71319580078125, -7.466552734375, -7.21990966796875, -6.9732666015625, -6.72662353515625, -6.47998046875, -6.23333740234375, -5.9866943359375, -5.74005126953125, -5.493408203125, -5.24676513671875, -5.0001220703125, -4.75347900390625, -4.5068359375, -4.26019287109375, -4.0135498046875, -3.76690673828125, -3.520263671875, -3.27362060546875, -3.0269775390625, -2.78033447265625, -2.53369140625, -2.28704833984375, -2.0404052734375, -1.79376220703125, -1.547119140625, -1.30047607421875, -1.0538330078125, -0.80718994140625, -0.560546875, -0.31390380859375, -0.0672607421875, 0.17938232421875, 0.426025390625, 0.67266845703125, 0.9193115234375, 1.16595458984375, 1.41259765625, 1.65924072265625, 1.9058837890625, 2.15252685546875, 2.399169921875, 2.64581298828125, 2.8924560546875, 3.13909912109375, 3.3857421875, 3.63238525390625, 3.8790283203125, 4.12567138671875, 4.372314453125, 4.61895751953125, 4.8656005859375, 5.11224365234375, 5.35888671875, 5.60552978515625, 5.8521728515625, 6.09881591796875, 6.345458984375, 6.59210205078125, 6.8387451171875, 7.08538818359375, 7.33203125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 13.0, 16.0, 10.0, 22.0, 31.0, 40.0, 69.0, 85.0, 102.0, 142.0, 199.0, 298.0, 407.0, 583.0, 793.0, 1384.0, 2260.0, 4482.0, 10544.0, 28521.0, 91423.0, 299861.0, 402354.0, 135432.0, 41900.0, 14100.0, 5792.0, 2872.0, 1573.0, 997.0, 627.0, 429.0, 310.0, 238.0, 195.0, 122.0, 79.0, 79.0, 45.0, 34.0, 30.0, 18.0, 10.0, 12.0, 6.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4765625, -8.195556640625, -7.91455078125, -7.633544921875, -7.3525390625, -7.071533203125, -6.79052734375, -6.509521484375, -6.228515625, -5.947509765625, -5.66650390625, -5.385498046875, -5.1044921875, -4.823486328125, -4.54248046875, -4.261474609375, -3.98046875, -3.699462890625, -3.41845703125, -3.137451171875, -2.8564453125, -2.575439453125, -2.29443359375, -2.013427734375, -1.732421875, -1.451416015625, -1.17041015625, -0.889404296875, -0.6083984375, -0.327392578125, -0.04638671875, 0.234619140625, 0.515625, 0.796630859375, 1.07763671875, 1.358642578125, 1.6396484375, 1.920654296875, 2.20166015625, 2.482666015625, 2.763671875, 3.044677734375, 3.32568359375, 3.606689453125, 3.8876953125, 4.168701171875, 4.44970703125, 4.730712890625, 5.01171875, 5.292724609375, 5.57373046875, 5.854736328125, 6.1357421875, 6.416748046875, 6.69775390625, 6.978759765625, 7.259765625, 7.540771484375, 7.82177734375, 8.102783203125, 8.3837890625, 8.664794921875, 8.94580078125, 9.226806640625, 9.5078125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 3.0, 5.0, 8.0, 14.0, 16.0, 8.0, 25.0, 11.0, 23.0, 27.0, 35.0, 35.0, 38.0, 36.0, 57.0, 74.0, 109.0, 253.0, 1538.0, 185.0, 102.0, 65.0, 46.0, 42.0, 41.0, 35.0, 34.0, 31.0, 19.0, 25.0, 21.0, 12.0, 11.0, 8.0, 8.0, 11.0, 5.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0], "bins": [-22.484375, -21.8486328125, -21.212890625, -20.5771484375, -19.94140625, -19.3056640625, -18.669921875, -18.0341796875, -17.3984375, -16.7626953125, -16.126953125, -15.4912109375, -14.85546875, -14.2197265625, -13.583984375, -12.9482421875, -12.3125, -11.6767578125, -11.041015625, -10.4052734375, -9.76953125, -9.1337890625, -8.498046875, -7.8623046875, -7.2265625, -6.5908203125, -5.955078125, -5.3193359375, -4.68359375, -4.0478515625, -3.412109375, -2.7763671875, -2.140625, -1.5048828125, -0.869140625, -0.2333984375, 0.40234375, 1.0380859375, 1.673828125, 2.3095703125, 2.9453125, 3.5810546875, 4.216796875, 4.8525390625, 5.48828125, 6.1240234375, 6.759765625, 7.3955078125, 8.03125, 8.6669921875, 9.302734375, 9.9384765625, 10.57421875, 11.2099609375, 11.845703125, 12.4814453125, 13.1171875, 13.7529296875, 14.388671875, 15.0244140625, 15.66015625, 16.2958984375, 16.931640625, 17.5673828125, 18.203125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 7.0, 9.0, 9.0, 11.0, 9.0, 28.0, 35.0, 37.0, 54.0, 62.0, 97.0, 141.0, 179.0, 319.0, 454.0, 1237.0, 12762.0, 2677807.0, 444495.0, 5881.0, 829.0, 402.0, 247.0, 172.0, 105.0, 81.0, 55.0, 46.0, 34.0, 30.0, 22.0, 11.0, 10.0, 10.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-37.71875, -36.4970703125, -35.275390625, -34.0537109375, -32.83203125, -31.6103515625, -30.388671875, -29.1669921875, -27.9453125, -26.7236328125, -25.501953125, -24.2802734375, -23.05859375, -21.8369140625, -20.615234375, -19.3935546875, -18.171875, -16.9501953125, -15.728515625, -14.5068359375, -13.28515625, -12.0634765625, -10.841796875, -9.6201171875, -8.3984375, -7.1767578125, -5.955078125, -4.7333984375, -3.51171875, -2.2900390625, -1.068359375, 0.1533203125, 1.375, 2.5966796875, 3.818359375, 5.0400390625, 6.26171875, 7.4833984375, 8.705078125, 9.9267578125, 11.1484375, 12.3701171875, 13.591796875, 14.8134765625, 16.03515625, 17.2568359375, 18.478515625, 19.7001953125, 20.921875, 22.1435546875, 23.365234375, 24.5869140625, 25.80859375, 27.0302734375, 28.251953125, 29.4736328125, 30.6953125, 31.9169921875, 33.138671875, 34.3603515625, 35.58203125, 36.8037109375, 38.025390625, 39.2470703125, 40.46875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 244.0, 766.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.1175079345703, -183.98941040039062, -173.86129760742188, -163.7332000732422, -153.60508728027344, -143.47698974609375, -133.348876953125, -123.22077941894531, -113.0926742553711, -102.96456909179688, -92.83646392822266, -82.70835876464844, -72.58026123046875, -62.452152252197266, -52.32405090332031, -42.195945739746094, -32.067840576171875, -21.939735412597656, -11.81163215637207, -1.6835289001464844, 8.444576263427734, 18.572681427001953, 28.700782775878906, 38.828887939453125, 48.956993103027344, 59.08509826660156, 69.21320343017578, 79.34130859375, 89.46940612792969, 99.59751892089844, 109.72561645507812, 119.85372161865234, 129.9818115234375, 140.1099090576172, 150.23802185058594, 160.36611938476562, 170.49423217773438, 180.62232971191406, 190.75042724609375, 200.8785400390625, 211.00665283203125, 221.13475036621094, 231.2628631591797, 241.39096069335938, 251.51907348632812, 261.6471862792969, 271.7752685546875, 281.90338134765625, 292.031494140625, 302.15960693359375, 312.2876892089844, 322.4158020019531, 332.5439147949219, 342.6720275878906, 352.80010986328125, 362.92822265625, 373.0563049316406, 383.1844177246094, 393.3125, 403.44061279296875, 413.5687255859375, 423.69683837890625, 433.8249206542969, 443.9530334472656, 454.0811462402344]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 11.0, 7.0, 8.0, 11.0, 5.0, 4.0, 21.0, 17.0, 12.0, 22.0, 20.0, 20.0, 27.0, 29.0, 25.0, 31.0, 29.0, 41.0, 30.0, 36.0, 42.0, 42.0, 39.0, 41.0, 29.0, 39.0, 27.0, 33.0, 40.0, 26.0, 18.0, 23.0, 32.0, 18.0, 27.0, 12.0, 12.0, 17.0, 19.0, 9.0, 8.0, 13.0, 11.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.38108825683594, -36.10797119140625, -34.83485794067383, -33.561744689941406, -32.28862762451172, -31.015512466430664, -29.74239730834961, -28.469282150268555, -27.1961669921875, -25.923051834106445, -24.64993667602539, -23.376821517944336, -22.10370635986328, -20.830591201782227, -19.557476043701172, -18.284360885620117, -17.011245727539062, -15.738130569458008, -14.465015411376953, -13.191900253295898, -11.918785095214844, -10.645669937133789, -9.372554779052734, -8.09943962097168, -6.826324462890625, -5.55320930480957, -4.280094146728516, -3.006978988647461, -1.7338638305664062, -0.46074867248535156, 0.8123664855957031, 2.085481643676758, 3.3585968017578125, 4.631711959838867, 5.904827117919922, 7.177942276000977, 8.451057434082031, 9.724172592163086, 10.99728775024414, 12.270402908325195, 13.54351806640625, 14.816633224487305, 16.08974838256836, 17.362863540649414, 18.63597869873047, 19.909093856811523, 21.182209014892578, 22.455324172973633, 23.728439331054688, 25.001554489135742, 26.274669647216797, 27.54778480529785, 28.820899963378906, 30.09401512145996, 31.367130279541016, 32.64024353027344, 33.913360595703125, 35.18647766113281, 36.459590911865234, 37.732704162597656, 39.005821228027344, 40.27893829345703, 41.55205154418945, 42.825164794921875, 44.09828186035156]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 12.0, 12.0, 6.0, 12.0, 20.0, 21.0, 31.0, 27.0, 26.0, 37.0, 21.0, 28.0, 41.0, 47.0, 29.0, 40.0, 54.0, 49.0, 38.0, 46.0, 26.0, 43.0, 36.0, 35.0, 35.0, 34.0, 28.0, 33.0, 18.0, 28.0, 15.0, 14.0, 18.0, 9.0, 7.0, 3.0, 10.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-9.765625, -9.49163818359375, -9.2176513671875, -8.94366455078125, -8.669677734375, -8.39569091796875, -8.1217041015625, -7.84771728515625, -7.57373046875, -7.29974365234375, -7.0257568359375, -6.75177001953125, -6.477783203125, -6.20379638671875, -5.9298095703125, -5.65582275390625, -5.3818359375, -5.10784912109375, -4.8338623046875, -4.55987548828125, -4.285888671875, -4.01190185546875, -3.7379150390625, -3.46392822265625, -3.18994140625, -2.91595458984375, -2.6419677734375, -2.36798095703125, -2.093994140625, -1.82000732421875, -1.5460205078125, -1.27203369140625, -0.998046875, -0.72406005859375, -0.4500732421875, -0.17608642578125, 0.097900390625, 0.37188720703125, 0.6458740234375, 0.91986083984375, 1.19384765625, 1.46783447265625, 1.7418212890625, 2.01580810546875, 2.289794921875, 2.56378173828125, 2.8377685546875, 3.11175537109375, 3.3857421875, 3.65972900390625, 3.9337158203125, 4.20770263671875, 4.481689453125, 4.75567626953125, 5.0296630859375, 5.30364990234375, 5.57763671875, 5.85162353515625, 6.1256103515625, 6.39959716796875, 6.673583984375, 6.94757080078125, 7.2215576171875, 7.49554443359375, 7.76953125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 16.0, 11.0, 18.0, 20.0, 27.0, 27.0, 52.0, 50.0, 77.0, 86.0, 122.0, 176.0, 254.0, 289.0, 404.0, 490.0, 21437.0, 4168190.0, 784.0, 401.0, 304.0, 261.0, 190.0, 120.0, 109.0, 68.0, 58.0, 44.0, 39.0, 25.0, 25.0, 23.0, 10.0, 15.0, 8.0, 6.0, 7.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-237.625, -229.744140625, -221.86328125, -213.982421875, -206.1015625, -198.220703125, -190.33984375, -182.458984375, -174.578125, -166.697265625, -158.81640625, -150.935546875, -143.0546875, -135.173828125, -127.29296875, -119.412109375, -111.53125, -103.650390625, -95.76953125, -87.888671875, -80.0078125, -72.126953125, -64.24609375, -56.365234375, -48.484375, -40.603515625, -32.72265625, -24.841796875, -16.9609375, -9.080078125, -1.19921875, 6.681640625, 14.5625, 22.443359375, 30.32421875, 38.205078125, 46.0859375, 53.966796875, 61.84765625, 69.728515625, 77.609375, 85.490234375, 93.37109375, 101.251953125, 109.1328125, 117.013671875, 124.89453125, 132.775390625, 140.65625, 148.537109375, 156.41796875, 164.298828125, 172.1796875, 180.060546875, 187.94140625, 195.822265625, 203.703125, 211.583984375, 219.46484375, 227.345703125, 235.2265625, 243.107421875, 250.98828125, 258.869140625, 266.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 9.0, 6.0, 3.0, 9.0, 17.0, 16.0, 37.0, 62.0, 99.0, 153.0, 281.0, 555.0, 938.0, 894.0, 449.0, 223.0, 111.0, 67.0, 62.0, 26.0, 19.0, 15.0, 13.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.546875, -23.8623046875, -23.177734375, -22.4931640625, -21.80859375, -21.1240234375, -20.439453125, -19.7548828125, -19.0703125, -18.3857421875, -17.701171875, -17.0166015625, -16.33203125, -15.6474609375, -14.962890625, -14.2783203125, -13.59375, -12.9091796875, -12.224609375, -11.5400390625, -10.85546875, -10.1708984375, -9.486328125, -8.8017578125, -8.1171875, -7.4326171875, -6.748046875, -6.0634765625, -5.37890625, -4.6943359375, -4.009765625, -3.3251953125, -2.640625, -1.9560546875, -1.271484375, -0.5869140625, 0.09765625, 0.7822265625, 1.466796875, 2.1513671875, 2.8359375, 3.5205078125, 4.205078125, 4.8896484375, 5.57421875, 6.2587890625, 6.943359375, 7.6279296875, 8.3125, 8.9970703125, 9.681640625, 10.3662109375, 11.05078125, 11.7353515625, 12.419921875, 13.1044921875, 13.7890625, 14.4736328125, 15.158203125, 15.8427734375, 16.52734375, 17.2119140625, 17.896484375, 18.5810546875, 19.265625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 15.0, 13.0, 18.0, 31.0, 46.0, 60.0, 85.0, 105.0, 335.0, 3426790.0, 766139.0, 271.0, 108.0, 77.0, 48.0, 42.0, 35.0, 19.0, 16.0, 12.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-309.25, -301.8828125, -294.515625, -287.1484375, -279.78125, -272.4140625, -265.046875, -257.6796875, -250.3125, -242.9453125, -235.578125, -228.2109375, -220.84375, -213.4765625, -206.109375, -198.7421875, -191.375, -184.0078125, -176.640625, -169.2734375, -161.90625, -154.5390625, -147.171875, -139.8046875, -132.4375, -125.0703125, -117.703125, -110.3359375, -102.96875, -95.6015625, -88.234375, -80.8671875, -73.5, -66.1328125, -58.765625, -51.3984375, -44.03125, -36.6640625, -29.296875, -21.9296875, -14.5625, -7.1953125, 0.171875, 7.5390625, 14.90625, 22.2734375, 29.640625, 37.0078125, 44.375, 51.7421875, 59.109375, 66.4765625, 73.84375, 81.2109375, 88.578125, 95.9453125, 103.3125, 110.6796875, 118.046875, 125.4140625, 132.78125, 140.1484375, 147.515625, 154.8828125, 162.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 166.0, 590.0, 233.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.12466430664062, -245.7600555419922, -239.39544677734375, -233.03085327148438, -226.66624450683594, -220.3016357421875, -213.93702697753906, -207.57241821289062, -201.2078094482422, -194.84320068359375, -188.4785919189453, -182.11398315429688, -175.7493896484375, -169.38478088378906, -163.02017211914062, -156.6555633544922, -150.29095458984375, -143.9263458251953, -137.56173706054688, -131.1971435546875, -124.83252716064453, -118.46792602539062, -112.10331726074219, -105.73870849609375, -99.37411499023438, -93.00950622558594, -86.64490509033203, -80.2802963256836, -73.91568756103516, -67.55108642578125, -61.18647766113281, -54.821868896484375, -48.45726013183594, -42.092655181884766, -35.72804641723633, -29.363441467285156, -22.99883460998535, -16.634227752685547, -10.269622802734375, -3.9050140380859375, 2.4595909118652344, 8.824197769165039, 15.188803672790527, 21.553409576416016, 27.91801643371582, 34.282623291015625, 40.6472282409668, 47.011837005615234, 53.376441955566406, 59.74104690551758, 66.10565185546875, 72.47026062011719, 78.83486938476562, 85.19947814941406, 91.56407928466797, 97.9286880493164, 104.29328918457031, 110.65789794921875, 117.02249908447266, 123.3871078491211, 129.751708984375, 136.11631774902344, 142.48092651367188, 148.8455352783203, 155.21014404296875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 1.0, 1.0, 5.0, 7.0, 8.0, 6.0, 9.0, 13.0, 15.0, 17.0, 25.0, 17.0, 27.0, 25.0, 28.0, 30.0, 40.0, 30.0, 30.0, 33.0, 40.0, 41.0, 42.0, 47.0, 46.0, 31.0, 33.0, 38.0, 34.0, 38.0, 28.0, 35.0, 21.0, 23.0, 18.0, 23.0, 23.0, 15.0, 9.0, 14.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-45.00749206542969, -43.69382858276367, -42.38016891479492, -41.066505432128906, -39.752845764160156, -38.43918228149414, -37.12552261352539, -35.811859130859375, -34.498199462890625, -33.18453598022461, -31.87087631225586, -30.557214736938477, -29.243553161621094, -27.929889678955078, -26.616228103637695, -25.302566528320312, -23.988903045654297, -22.675241470336914, -21.36157989501953, -20.04791831970215, -18.734256744384766, -17.42059326171875, -16.106931686401367, -14.793270111083984, -13.479608535766602, -12.165946960449219, -10.852285385131836, -9.538622856140137, -8.224961280822754, -6.911299705505371, -5.59763765335083, -4.283975601196289, -2.9703140258789062, -1.6566522121429443, -0.3429903984069824, 0.9706714153289795, 2.2843332290649414, 3.597994804382324, 4.911656856536865, 6.225318908691406, 7.538980484008789, 8.852642059326172, 10.166303634643555, 11.479966163635254, 12.793627738952637, 14.10728931427002, 15.420951843261719, 16.7346134185791, 18.048274993896484, 19.361936569213867, 20.67559814453125, 21.989259719848633, 23.302921295166016, 24.61658477783203, 25.930246353149414, 27.243907928466797, 28.55756950378418, 29.871231079101562, 31.184892654418945, 32.49855422973633, 33.812217712402344, 35.125877380371094, 36.43954086303711, 37.753204345703125, 39.066864013671875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 10.0, 6.0, 11.0, 13.0, 12.0, 23.0, 23.0, 17.0, 25.0, 23.0, 28.0, 23.0, 28.0, 27.0, 44.0, 32.0, 31.0, 41.0, 34.0, 29.0, 44.0, 39.0, 36.0, 42.0, 39.0, 37.0, 29.0, 25.0, 19.0, 28.0, 22.0, 25.0, 17.0, 28.0, 23.0, 14.0, 11.0, 8.0, 6.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.87506103515625, -6.6368408203125, -6.39862060546875, -6.160400390625, -5.92218017578125, -5.6839599609375, -5.44573974609375, -5.20751953125, -4.96929931640625, -4.7310791015625, -4.49285888671875, -4.254638671875, -4.01641845703125, -3.7781982421875, -3.53997802734375, -3.3017578125, -3.06353759765625, -2.8253173828125, -2.58709716796875, -2.348876953125, -2.11065673828125, -1.8724365234375, -1.63421630859375, -1.39599609375, -1.15777587890625, -0.9195556640625, -0.68133544921875, -0.443115234375, -0.20489501953125, 0.0333251953125, 0.27154541015625, 0.509765625, 0.74798583984375, 0.9862060546875, 1.22442626953125, 1.462646484375, 1.70086669921875, 1.9390869140625, 2.17730712890625, 2.41552734375, 2.65374755859375, 2.8919677734375, 3.13018798828125, 3.368408203125, 3.60662841796875, 3.8448486328125, 4.08306884765625, 4.3212890625, 4.55950927734375, 4.7977294921875, 5.03594970703125, 5.274169921875, 5.51239013671875, 5.7506103515625, 5.98883056640625, 6.22705078125, 6.46527099609375, 6.7034912109375, 6.94171142578125, 7.179931640625, 7.41815185546875, 7.6563720703125, 7.89459228515625, 8.1328125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 9.0, 7.0, 19.0, 19.0, 34.0, 58.0, 79.0, 129.0, 174.0, 277.0, 451.0, 679.0, 1055.0, 1628.0, 2514.0, 3986.0, 6182.0, 9278.0, 14787.0, 22706.0, 34954.0, 54965.0, 88466.0, 152187.0, 251405.0, 155173.0, 91144.0, 55507.0, 35591.0, 23072.0, 14925.0, 9502.0, 6199.0, 4038.0, 2567.0, 1703.0, 1090.0, 696.0, 440.0, 304.0, 206.0, 127.0, 78.0, 49.0, 33.0, 23.0, 17.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.245635986328125, -1.20611572265625, -1.166595458984375, -1.1270751953125, -1.087554931640625, -1.04803466796875, -1.008514404296875, -0.968994140625, -0.929473876953125, -0.88995361328125, -0.850433349609375, -0.8109130859375, -0.771392822265625, -0.73187255859375, -0.692352294921875, -0.65283203125, -0.613311767578125, -0.57379150390625, -0.534271240234375, -0.4947509765625, -0.455230712890625, -0.41571044921875, -0.376190185546875, -0.336669921875, -0.297149658203125, -0.25762939453125, -0.218109130859375, -0.1785888671875, -0.139068603515625, -0.09954833984375, -0.060028076171875, -0.0205078125, 0.019012451171875, 0.05853271484375, 0.098052978515625, 0.1375732421875, 0.177093505859375, 0.21661376953125, 0.256134033203125, 0.295654296875, 0.335174560546875, 0.37469482421875, 0.414215087890625, 0.4537353515625, 0.493255615234375, 0.53277587890625, 0.572296142578125, 0.61181640625, 0.651336669921875, 0.69085693359375, 0.730377197265625, 0.7698974609375, 0.809417724609375, 0.84893798828125, 0.888458251953125, 0.927978515625, 0.967498779296875, 1.00701904296875, 1.046539306640625, 1.0860595703125, 1.125579833984375, 1.16510009765625, 1.204620361328125, 1.244140625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 13.0, 14.0, 11.0, 12.0, 24.0, 17.0, 25.0, 20.0, 25.0, 35.0, 26.0, 33.0, 28.0, 27.0, 33.0, 40.0, 46.0, 39.0, 1061.0, 32.0, 27.0, 37.0, 23.0, 27.0, 38.0, 30.0, 29.0, 28.0, 19.0, 20.0, 19.0, 24.0, 16.0, 19.0, 16.0, 12.0, 8.0, 8.0, 5.0, 9.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.0703125, -3.932373046875, -3.79443359375, -3.656494140625, -3.5185546875, -3.380615234375, -3.24267578125, -3.104736328125, -2.966796875, -2.828857421875, -2.69091796875, -2.552978515625, -2.4150390625, -2.277099609375, -2.13916015625, -2.001220703125, -1.86328125, -1.725341796875, -1.58740234375, -1.449462890625, -1.3115234375, -1.173583984375, -1.03564453125, -0.897705078125, -0.759765625, -0.621826171875, -0.48388671875, -0.345947265625, -0.2080078125, -0.070068359375, 0.06787109375, 0.205810546875, 0.34375, 0.481689453125, 0.61962890625, 0.757568359375, 0.8955078125, 1.033447265625, 1.17138671875, 1.309326171875, 1.447265625, 1.585205078125, 1.72314453125, 1.861083984375, 1.9990234375, 2.136962890625, 2.27490234375, 2.412841796875, 2.55078125, 2.688720703125, 2.82666015625, 2.964599609375, 3.1025390625, 3.240478515625, 3.37841796875, 3.516357421875, 3.654296875, 3.792236328125, 3.93017578125, 4.068115234375, 4.2060546875, 4.343994140625, 4.48193359375, 4.619873046875, 4.7578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 6.0, 17.0, 19.0, 19.0, 37.0, 64.0, 86.0, 116.0, 192.0, 264.0, 407.0, 564.0, 813.0, 1254.0, 1804.0, 2646.0, 3938.0, 5717.0, 8449.0, 12644.0, 18760.0, 28894.0, 43980.0, 69117.0, 113843.0, 199641.0, 1257802.0, 118639.0, 72086.0, 45711.0, 29391.0, 19482.0, 13224.0, 8718.0, 5975.0, 4068.0, 2788.0, 1890.0, 1306.0, 836.0, 635.0, 439.0, 273.0, 207.0, 127.0, 85.0, 55.0, 41.0, 27.0, 18.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0], "bins": [-1.1396484375, -1.106170654296875, -1.07269287109375, -1.039215087890625, -1.0057373046875, -0.972259521484375, -0.93878173828125, -0.905303955078125, -0.871826171875, -0.838348388671875, -0.80487060546875, -0.771392822265625, -0.7379150390625, -0.704437255859375, -0.67095947265625, -0.637481689453125, -0.60400390625, -0.570526123046875, -0.53704833984375, -0.503570556640625, -0.4700927734375, -0.436614990234375, -0.40313720703125, -0.369659423828125, -0.336181640625, -0.302703857421875, -0.26922607421875, -0.235748291015625, -0.2022705078125, -0.168792724609375, -0.13531494140625, -0.101837158203125, -0.068359375, -0.034881591796875, -0.00140380859375, 0.032073974609375, 0.0655517578125, 0.099029541015625, 0.13250732421875, 0.165985107421875, 0.199462890625, 0.232940673828125, 0.26641845703125, 0.299896240234375, 0.3333740234375, 0.366851806640625, 0.40032958984375, 0.433807373046875, 0.46728515625, 0.500762939453125, 0.53424072265625, 0.567718505859375, 0.6011962890625, 0.634674072265625, 0.66815185546875, 0.701629638671875, 0.735107421875, 0.768585205078125, 0.80206298828125, 0.835540771484375, 0.8690185546875, 0.902496337890625, 0.93597412109375, 0.969451904296875, 1.0029296875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 3.0, 5.0, 9.0, 6.0, 18.0, 21.0, 18.0, 28.0, 51.0, 71.0, 94.0, 104.0, 134.0, 121.0, 89.0, 66.0, 38.0, 17.0, 25.0, 15.0, 13.0, 13.0, 5.0, 5.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014142990112304688, -0.0013765990734100342, -0.0013388991355895996, -0.001301199197769165, -0.0012634992599487305, -0.001225799322128296, -0.0011880993843078613, -0.0011503994464874268, -0.0011126995086669922, -0.0010749995708465576, -0.001037299633026123, -0.0009995996952056885, -0.0009618997573852539, -0.0009241998195648193, -0.0008864998817443848, -0.0008487999439239502, -0.0008111000061035156, -0.0007734000682830811, -0.0007357001304626465, -0.0006980001926422119, -0.0006603002548217773, -0.0006226003170013428, -0.0005849003791809082, -0.0005472004413604736, -0.0005095005035400391, -0.0004718005657196045, -0.0004341006278991699, -0.00039640069007873535, -0.0003587007522583008, -0.0003210008144378662, -0.00028330087661743164, -0.00024560093879699707, -0.0002079010009765625, -0.00017020106315612793, -0.00013250112533569336, -9.480118751525879e-05, -5.710124969482422e-05, -1.940131187438965e-05, 1.8298625946044922e-05, 5.599856376647949e-05, 9.369850158691406e-05, 0.00013139843940734863, 0.0001690983772277832, 0.00020679831504821777, 0.00024449825286865234, 0.0002821981906890869, 0.0003198981285095215, 0.00035759806632995605, 0.0003952980041503906, 0.0004329979419708252, 0.00047069787979125977, 0.0005083978176116943, 0.0005460977554321289, 0.0005837976932525635, 0.000621497631072998, 0.0006591975688934326, 0.0006968975067138672, 0.0007345974445343018, 0.0007722973823547363, 0.0008099973201751709, 0.0008476972579956055, 0.00088539719581604, 0.0009230971336364746, 0.0009607970714569092, 0.0009984970092773438]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 8.0, 11.0, 16.0, 14.0, 13.0, 23.0, 42.0, 39.0, 67.0, 95.0, 167.0, 267.0, 409.0, 1045.0, 559244.0, 484729.0, 1044.0, 469.0, 273.0, 175.0, 97.0, 76.0, 58.0, 42.0, 31.0, 14.0, 19.0, 18.0, 7.0, 14.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01666259765625, -0.016045331954956055, -0.01542806625366211, -0.014810800552368164, -0.014193534851074219, -0.013576269149780273, -0.012959003448486328, -0.012341737747192383, -0.011724472045898438, -0.011107206344604492, -0.010489940643310547, -0.009872674942016602, -0.009255409240722656, -0.008638143539428711, -0.008020877838134766, -0.00740361213684082, -0.006786346435546875, -0.00616908073425293, -0.005551815032958984, -0.004934549331665039, -0.004317283630371094, -0.0037000179290771484, -0.003082752227783203, -0.002465486526489258, -0.0018482208251953125, -0.0012309551239013672, -0.0006136894226074219, 3.5762786865234375e-06, 0.0006208419799804688, 0.001238107681274414, 0.0018553733825683594, 0.0024726390838623047, 0.00308990478515625, 0.0037071704864501953, 0.004324436187744141, 0.004941701889038086, 0.005558967590332031, 0.0061762332916259766, 0.006793498992919922, 0.007410764694213867, 0.008028030395507812, 0.008645296096801758, 0.009262561798095703, 0.009879827499389648, 0.010497093200683594, 0.011114358901977539, 0.011731624603271484, 0.01234889030456543, 0.012966156005859375, 0.01358342170715332, 0.014200687408447266, 0.014817953109741211, 0.015435218811035156, 0.0160524845123291, 0.016669750213623047, 0.017287015914916992, 0.017904281616210938, 0.018521547317504883, 0.019138813018798828, 0.019756078720092773, 0.02037334442138672, 0.020990610122680664, 0.02160787582397461, 0.022225141525268555, 0.0228424072265625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 686.0, 309.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00072041607927531, -0.0006152072455734015, -0.0005099984118714929, -0.0004047896363772452, -0.0002995808026753366, -0.000194371968973428, -8.916319347918034e-05, 1.6045640222728252e-05, 0.00012125447392463684, 0.0002264632930746302, 0.00033167211222462356, 0.0004368809168227017, 0.0005420897505246103, 0.0006472985842265189, 0.0007525073597207665, 0.0008577161934226751, 0.0009629250271245837, 0.0010681338608264923, 0.001173342694528401, 0.0012785515282303095, 0.0013837602455168962, 0.0014889691956341267, 0.0015941779129207134, 0.001699386746622622, 0.0018045955803245306, 0.0019098044140264392, 0.0020150132477283478, 0.0021202219650149345, 0.002225430915132165, 0.0023306396324187517, 0.002435848582535982, 0.002541057299822569, 0.0026462660171091557, 0.0027514747343957424, 0.002856683684512973, 0.0029618924017995596, 0.00306710135191679, 0.0031723100692033768, 0.0032775187864899635, 0.003382727736607194, 0.0034879366867244244, 0.003593145404011011, 0.0036983543541282415, 0.0038035630714148283, 0.003908772021532059, 0.0040139807388186455, 0.004119189456105232, 0.004224398173391819, 0.004329606890678406, 0.0044348156079649925, 0.004540024325251579, 0.004645233508199453, 0.00475044222548604, 0.004855650942772627, 0.004960859660059214, 0.005066068843007088, 0.0051712775602936745, 0.005276486277580261, 0.005381694994866848, 0.005486904177814722, 0.005592112895101309, 0.005697321612387896, 0.005802530329674482, 0.005907739512622356, 0.006012948229908943]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 2.0, 8.0, 17.0, 6.0, 10.0, 6.0, 15.0, 12.0, 21.0, 23.0, 27.0, 16.0, 23.0, 30.0, 34.0, 28.0, 34.0, 35.0, 42.0, 48.0, 50.0, 30.0, 33.0, 38.0, 28.0, 38.0, 31.0, 28.0, 36.0, 21.0, 33.0, 27.0, 25.0, 20.0, 17.0, 13.0, 21.0, 17.0, 13.0, 2.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003616213798522949, -0.00034914351999759674, -0.00033666566014289856, -0.0003241878002882004, -0.0003117099404335022, -0.000299232080578804, -0.00028675422072410583, -0.00027427636086940765, -0.00026179850101470947, -0.0002493206411600113, -0.0002368427813053131, -0.00022436492145061493, -0.00021188706159591675, -0.00019940920174121857, -0.00018693134188652039, -0.0001744534820318222, -0.00016197562217712402, -0.00014949776232242584, -0.00013701990246772766, -0.00012454204261302948, -0.0001120641827583313, -9.958632290363312e-05, -8.710846304893494e-05, -7.463060319423676e-05, -6.215274333953857e-05, -4.967488348484039e-05, -3.719702363014221e-05, -2.471916377544403e-05, -1.224130392074585e-05, 2.3655593395233154e-07, 1.2714415788650513e-05, 2.5192275643348694e-05, 3.7670135498046875e-05, 5.0147995352745056e-05, 6.262585520744324e-05, 7.510371506214142e-05, 8.75815749168396e-05, 0.00010005943477153778, 0.00011253729462623596, 0.00012501515448093414, 0.00013749301433563232, 0.0001499708741903305, 0.0001624487340450287, 0.00017492659389972687, 0.00018740445375442505, 0.00019988231360912323, 0.0002123601734638214, 0.0002248380333185196, 0.00023731589317321777, 0.00024979375302791595, 0.00026227161288261414, 0.0002747494727373123, 0.0002872273325920105, 0.0002997051924467087, 0.00031218305230140686, 0.00032466091215610504, 0.0003371387720108032, 0.0003496166318655014, 0.0003620944917201996, 0.00037457235157489777, 0.00038705021142959595, 0.00039952807128429413, 0.0004120059311389923, 0.0004244837909936905, 0.00043696165084838867]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 10.0, 6.0, 11.0, 13.0, 12.0, 23.0, 23.0, 17.0, 25.0, 23.0, 28.0, 23.0, 28.0, 27.0, 44.0, 32.0, 31.0, 41.0, 33.0, 30.0, 44.0, 39.0, 36.0, 42.0, 39.0, 37.0, 29.0, 25.0, 19.0, 28.0, 22.0, 25.0, 17.0, 28.0, 23.0, 14.0, 11.0, 8.0, 6.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.87506103515625, -6.6368408203125, -6.39862060546875, -6.160400390625, -5.92218017578125, -5.6839599609375, -5.44573974609375, -5.20751953125, -4.96929931640625, -4.7310791015625, -4.49285888671875, -4.254638671875, -4.01641845703125, -3.7781982421875, -3.53997802734375, -3.3017578125, -3.06353759765625, -2.8253173828125, -2.58709716796875, -2.348876953125, -2.11065673828125, -1.8724365234375, -1.63421630859375, -1.39599609375, -1.15777587890625, -0.9195556640625, -0.68133544921875, -0.443115234375, -0.20489501953125, 0.0333251953125, 0.27154541015625, 0.509765625, 0.74798583984375, 0.9862060546875, 1.22442626953125, 1.462646484375, 1.70086669921875, 1.9390869140625, 2.17730712890625, 2.41552734375, 2.65374755859375, 2.8919677734375, 3.13018798828125, 3.368408203125, 3.60662841796875, 3.8448486328125, 4.08306884765625, 4.3212890625, 4.55950927734375, 4.7977294921875, 5.03594970703125, 5.274169921875, 5.51239013671875, 5.7506103515625, 5.98883056640625, 6.22705078125, 6.46527099609375, 6.7034912109375, 6.94171142578125, 7.179931640625, 7.41815185546875, 7.6563720703125, 7.89459228515625, 8.1328125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 2.0, 5.0, 23.0, 13.0, 22.0, 33.0, 40.0, 56.0, 92.0, 108.0, 135.0, 200.0, 206.0, 299.0, 373.0, 450.0, 564.0, 714.0, 857.0, 1165.0, 1975.0, 4425.0, 13642.0, 57837.0, 256005.0, 505602.0, 150958.0, 34322.0, 8929.0, 3009.0, 1559.0, 1010.0, 786.0, 662.0, 571.0, 426.0, 356.0, 267.0, 220.0, 151.0, 123.0, 99.0, 66.0, 46.0, 39.0, 24.0, 25.0, 20.0, 6.0, 10.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0], "bins": [-11.3984375, -11.0457763671875, -10.693115234375, -10.3404541015625, -9.98779296875, -9.6351318359375, -9.282470703125, -8.9298095703125, -8.5771484375, -8.2244873046875, -7.871826171875, -7.5191650390625, -7.16650390625, -6.8138427734375, -6.461181640625, -6.1085205078125, -5.755859375, -5.4031982421875, -5.050537109375, -4.6978759765625, -4.34521484375, -3.9925537109375, -3.639892578125, -3.2872314453125, -2.9345703125, -2.5819091796875, -2.229248046875, -1.8765869140625, -1.52392578125, -1.1712646484375, -0.818603515625, -0.4659423828125, -0.11328125, 0.2393798828125, 0.592041015625, 0.9447021484375, 1.29736328125, 1.6500244140625, 2.002685546875, 2.3553466796875, 2.7080078125, 3.0606689453125, 3.413330078125, 3.7659912109375, 4.11865234375, 4.4713134765625, 4.823974609375, 5.1766357421875, 5.529296875, 5.8819580078125, 6.234619140625, 6.5872802734375, 6.93994140625, 7.2926025390625, 7.645263671875, 7.9979248046875, 8.3505859375, 8.7032470703125, 9.055908203125, 9.4085693359375, 9.76123046875, 10.1138916015625, 10.466552734375, 10.8192138671875, 11.171875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 8.0, 6.0, 6.0, 11.0, 18.0, 12.0, 23.0, 12.0, 18.0, 29.0, 38.0, 40.0, 55.0, 49.0, 60.0, 106.0, 280.0, 1605.0, 151.0, 67.0, 64.0, 49.0, 51.0, 41.0, 42.0, 37.0, 31.0, 26.0, 16.0, 17.0, 15.0, 11.0, 8.0, 8.0, 4.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.640625, -15.982177734375, -15.32373046875, -14.665283203125, -14.0068359375, -13.348388671875, -12.68994140625, -12.031494140625, -11.373046875, -10.714599609375, -10.05615234375, -9.397705078125, -8.7392578125, -8.080810546875, -7.42236328125, -6.763916015625, -6.10546875, -5.447021484375, -4.78857421875, -4.130126953125, -3.4716796875, -2.813232421875, -2.15478515625, -1.496337890625, -0.837890625, -0.179443359375, 0.47900390625, 1.137451171875, 1.7958984375, 2.454345703125, 3.11279296875, 3.771240234375, 4.4296875, 5.088134765625, 5.74658203125, 6.405029296875, 7.0634765625, 7.721923828125, 8.38037109375, 9.038818359375, 9.697265625, 10.355712890625, 11.01416015625, 11.672607421875, 12.3310546875, 12.989501953125, 13.64794921875, 14.306396484375, 14.96484375, 15.623291015625, 16.28173828125, 16.940185546875, 17.5986328125, 18.257080078125, 18.91552734375, 19.573974609375, 20.232421875, 20.890869140625, 21.54931640625, 22.207763671875, 22.8662109375, 23.524658203125, 24.18310546875, 24.841552734375, 25.5]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 8.0, 5.0, 7.0, 9.0, 10.0, 15.0, 22.0, 30.0, 26.0, 41.0, 38.0, 65.0, 100.0, 147.0, 240.0, 346.0, 680.0, 2053.0, 2903397.0, 235483.0, 1523.0, 564.0, 312.0, 163.0, 114.0, 81.0, 55.0, 48.0, 25.0, 18.0, 15.0, 17.0, 14.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.0625, -66.8974609375, -64.732421875, -62.5673828125, -60.40234375, -58.2373046875, -56.072265625, -53.9072265625, -51.7421875, -49.5771484375, -47.412109375, -45.2470703125, -43.08203125, -40.9169921875, -38.751953125, -36.5869140625, -34.421875, -32.2568359375, -30.091796875, -27.9267578125, -25.76171875, -23.5966796875, -21.431640625, -19.2666015625, -17.1015625, -14.9365234375, -12.771484375, -10.6064453125, -8.44140625, -6.2763671875, -4.111328125, -1.9462890625, 0.21875, 2.3837890625, 4.548828125, 6.7138671875, 8.87890625, 11.0439453125, 13.208984375, 15.3740234375, 17.5390625, 19.7041015625, 21.869140625, 24.0341796875, 26.19921875, 28.3642578125, 30.529296875, 32.6943359375, 34.859375, 37.0244140625, 39.189453125, 41.3544921875, 43.51953125, 45.6845703125, 47.849609375, 50.0146484375, 52.1796875, 54.3447265625, 56.509765625, 58.6748046875, 60.83984375, 63.0048828125, 65.169921875, 67.3349609375, 69.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 848.0, 155.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.08770751953125, -261.9179992675781, -251.74827575683594, -241.57855224609375, -231.40884399414062, -221.2391357421875, -211.0694122314453, -200.89968872070312, -190.72998046875, -180.56027221679688, -170.3905487060547, -160.2208251953125, -150.05111694335938, -139.88140869140625, -129.71168518066406, -119.5419692993164, -109.37225341796875, -99.2025375366211, -89.03282165527344, -78.86310577392578, -68.69338989257812, -58.52367401123047, -48.35395812988281, -38.184242248535156, -28.0145263671875, -17.844810485839844, -7.6750946044921875, 2.4946212768554688, 12.664337158203125, 22.83405303955078, 33.00376892089844, 43.173484802246094, 53.343170166015625, 63.51288604736328, 73.68260192871094, 83.8523178100586, 94.02203369140625, 104.1917495727539, 114.36146545410156, 124.53118133544922, 134.70089721679688, 144.87060546875, 155.0403289794922, 165.21005249023438, 175.3797607421875, 185.54946899414062, 195.7191925048828, 205.888916015625, 216.05862426757812, 226.22833251953125, 236.39805603027344, 246.56777954101562, 256.73748779296875, 266.9071960449219, 277.076904296875, 287.24664306640625, 297.4163513183594, 307.5860595703125, 317.75579833984375, 327.9255065917969, 338.09521484375, 348.2649230957031, 358.43463134765625, 368.6043701171875, 378.7740783691406]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 6.0, 9.0, 12.0, 21.0, 17.0, 16.0, 24.0, 22.0, 36.0, 28.0, 26.0, 34.0, 23.0, 40.0, 26.0, 41.0, 55.0, 51.0, 47.0, 51.0, 34.0, 34.0, 24.0, 39.0, 38.0, 37.0, 29.0, 31.0, 19.0, 19.0, 18.0, 21.0, 7.0, 17.0, 9.0, 10.0, 7.0, 4.0, 5.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.91034698486328, -50.182552337646484, -48.45476150512695, -46.726966857910156, -44.999176025390625, -43.27138137817383, -41.54358673095703, -39.8157958984375, -38.0880012512207, -36.360206604003906, -34.632415771484375, -32.90462112426758, -31.176828384399414, -29.44903564453125, -27.721240997314453, -25.99344825744629, -24.265655517578125, -22.53786277770996, -20.810070037841797, -19.082275390625, -17.354482650756836, -15.626689910888672, -13.898896217346191, -12.171102523803711, -10.443309783935547, -8.715517044067383, -6.987723350524902, -5.25993013381958, -3.532136917114258, -1.8043441772460938, -0.07655048370361328, 1.6512432098388672, 3.3790359497070312, 5.1068291664123535, 6.834622383117676, 8.562416076660156, 10.29020881652832, 12.018001556396484, 13.745795249938965, 15.473588943481445, 17.20138168334961, 18.929174423217773, 20.656967163085938, 22.384761810302734, 24.1125545501709, 25.840347290039062, 27.56814193725586, 29.295934677124023, 31.023727416992188, 32.751522064208984, 34.479312896728516, 36.20710754394531, 37.934898376464844, 39.66269302368164, 41.39048767089844, 43.11827850341797, 44.846073150634766, 46.57386779785156, 48.301658630371094, 50.02945327758789, 51.75724792480469, 53.48503875732422, 55.212833404541016, 56.94062805175781, 58.668418884277344]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 8.0, 12.0, 7.0, 24.0, 10.0, 13.0, 21.0, 23.0, 34.0, 25.0, 43.0, 39.0, 40.0, 39.0, 48.0, 51.0, 43.0, 56.0, 42.0, 46.0, 42.0, 40.0, 42.0, 34.0, 26.0, 28.0, 27.0, 24.0, 25.0, 14.0, 22.0, 16.0, 12.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.1971435546875, -7.917724609375, -7.6383056640625, -7.35888671875, -7.0794677734375, -6.800048828125, -6.5206298828125, -6.2412109375, -5.9617919921875, -5.682373046875, -5.4029541015625, -5.12353515625, -4.8441162109375, -4.564697265625, -4.2852783203125, -4.005859375, -3.7264404296875, -3.447021484375, -3.1676025390625, -2.88818359375, -2.6087646484375, -2.329345703125, -2.0499267578125, -1.7705078125, -1.4910888671875, -1.211669921875, -0.9322509765625, -0.65283203125, -0.3734130859375, -0.093994140625, 0.1854248046875, 0.46484375, 0.7442626953125, 1.023681640625, 1.3031005859375, 1.58251953125, 1.8619384765625, 2.141357421875, 2.4207763671875, 2.7001953125, 2.9796142578125, 3.259033203125, 3.5384521484375, 3.81787109375, 4.0972900390625, 4.376708984375, 4.6561279296875, 4.935546875, 5.2149658203125, 5.494384765625, 5.7738037109375, 6.05322265625, 6.3326416015625, 6.612060546875, 6.8914794921875, 7.1708984375, 7.4503173828125, 7.729736328125, 8.0091552734375, 8.28857421875, 8.5679931640625, 8.847412109375, 9.1268310546875, 9.40625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 8.0, 10.0, 11.0, 15.0, 24.0, 30.0, 41.0, 58.0, 63.0, 83.0, 99.0, 120.0, 159.0, 245.0, 417.0, 984.0, 4015.0, 42689.0, 2030262.0, 2065570.0, 42800.0, 4167.0, 1052.0, 378.0, 224.0, 152.0, 135.0, 95.0, 72.0, 54.0, 52.0, 40.0, 37.0, 26.0, 20.0, 20.0, 11.0, 11.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.421875, -26.537353515625, -25.65283203125, -24.768310546875, -23.8837890625, -22.999267578125, -22.11474609375, -21.230224609375, -20.345703125, -19.461181640625, -18.57666015625, -17.692138671875, -16.8076171875, -15.923095703125, -15.03857421875, -14.154052734375, -13.26953125, -12.385009765625, -11.50048828125, -10.615966796875, -9.7314453125, -8.846923828125, -7.96240234375, -7.077880859375, -6.193359375, -5.308837890625, -4.42431640625, -3.539794921875, -2.6552734375, -1.770751953125, -0.88623046875, -0.001708984375, 0.8828125, 1.767333984375, 2.65185546875, 3.536376953125, 4.4208984375, 5.305419921875, 6.18994140625, 7.074462890625, 7.958984375, 8.843505859375, 9.72802734375, 10.612548828125, 11.4970703125, 12.381591796875, 13.26611328125, 14.150634765625, 15.03515625, 15.919677734375, 16.80419921875, 17.688720703125, 18.5732421875, 19.457763671875, 20.34228515625, 21.226806640625, 22.111328125, 22.995849609375, 23.88037109375, 24.764892578125, 25.6494140625, 26.533935546875, 27.41845703125, 28.302978515625, 29.1875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 13.0, 11.0, 17.0, 31.0, 39.0, 49.0, 71.0, 107.0, 110.0, 149.0, 222.0, 300.0, 425.0, 591.0, 516.0, 425.0, 237.0, 173.0, 150.0, 99.0, 86.0, 66.0, 42.0, 38.0, 25.0, 12.0, 19.0, 11.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.309814453125, -12.86181640625, -12.413818359375, -11.9658203125, -11.517822265625, -11.06982421875, -10.621826171875, -10.173828125, -9.725830078125, -9.27783203125, -8.829833984375, -8.3818359375, -7.933837890625, -7.48583984375, -7.037841796875, -6.58984375, -6.141845703125, -5.69384765625, -5.245849609375, -4.7978515625, -4.349853515625, -3.90185546875, -3.453857421875, -3.005859375, -2.557861328125, -2.10986328125, -1.661865234375, -1.2138671875, -0.765869140625, -0.31787109375, 0.130126953125, 0.578125, 1.026123046875, 1.47412109375, 1.922119140625, 2.3701171875, 2.818115234375, 3.26611328125, 3.714111328125, 4.162109375, 4.610107421875, 5.05810546875, 5.506103515625, 5.9541015625, 6.402099609375, 6.85009765625, 7.298095703125, 7.74609375, 8.194091796875, 8.64208984375, 9.090087890625, 9.5380859375, 9.986083984375, 10.43408203125, 10.882080078125, 11.330078125, 11.778076171875, 12.22607421875, 12.674072265625, 13.1220703125, 13.570068359375, 14.01806640625, 14.466064453125, 14.9140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 8.0, 15.0, 15.0, 44.0, 60.0, 134.0, 257.0, 813.0, 5636.0, 4060491.0, 124258.0, 1738.0, 426.0, 168.0, 104.0, 45.0, 28.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.9375, -79.435546875, -76.93359375, -74.431640625, -71.9296875, -69.427734375, -66.92578125, -64.423828125, -61.921875, -59.419921875, -56.91796875, -54.416015625, -51.9140625, -49.412109375, -46.91015625, -44.408203125, -41.90625, -39.404296875, -36.90234375, -34.400390625, -31.8984375, -29.396484375, -26.89453125, -24.392578125, -21.890625, -19.388671875, -16.88671875, -14.384765625, -11.8828125, -9.380859375, -6.87890625, -4.376953125, -1.875, 0.626953125, 3.12890625, 5.630859375, 8.1328125, 10.634765625, 13.13671875, 15.638671875, 18.140625, 20.642578125, 23.14453125, 25.646484375, 28.1484375, 30.650390625, 33.15234375, 35.654296875, 38.15625, 40.658203125, 43.16015625, 45.662109375, 48.1640625, 50.666015625, 53.16796875, 55.669921875, 58.171875, 60.673828125, 63.17578125, 65.677734375, 68.1796875, 70.681640625, 73.18359375, 75.685546875, 78.1875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 18.0, 410.0, 567.0, 18.0, 3.0, 2.0, 0.0, 1.0], "bins": [-562.8705444335938, -553.1758422851562, -543.4810791015625, -533.786376953125, -524.0916748046875, -514.3969116210938, -504.70220947265625, -495.00750732421875, -485.3127746582031, -475.6180419921875, -465.92333984375, -456.2286071777344, -446.53387451171875, -436.83917236328125, -427.1444396972656, -417.44970703125, -407.7550048828125, -398.0602722167969, -388.3655700683594, -378.67083740234375, -368.9761047363281, -359.2814025878906, -349.586669921875, -339.8919677734375, -330.19720458984375, -320.5024719238281, -310.8077697753906, -301.113037109375, -291.4183044433594, -281.7236022949219, -272.02886962890625, -262.33416748046875, -252.63941955566406, -242.9447021484375, -233.24996948242188, -223.5552520751953, -213.86053466796875, -204.16580200195312, -194.47108459472656, -184.7763671875, -175.08163452148438, -165.3869171142578, -155.6921844482422, -145.99746704101562, -136.30274963378906, -126.60802459716797, -116.91329956054688, -107.21858215332031, -97.52386474609375, -87.82913970947266, -78.1344223022461, -68.439697265625, -58.74497604370117, -49.050254821777344, -39.35552978515625, -29.660812377929688, -19.966087341308594, -10.27136516571045, -0.5766429901123047, 9.118080139160156, 18.812801361083984, 28.507522583007812, 38.202247619628906, 47.89696502685547, 57.59169006347656]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 5.0, 12.0, 18.0, 16.0, 14.0, 20.0, 30.0, 27.0, 18.0, 27.0, 35.0, 46.0, 53.0, 45.0, 52.0, 46.0, 41.0, 41.0, 41.0, 49.0, 34.0, 49.0, 39.0, 36.0, 27.0, 20.0, 21.0, 17.0, 16.0, 19.0, 9.0, 12.0, 10.0, 8.0, 6.0, 9.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.919647216796875, -47.3433723449707, -45.76709747314453, -44.19082260131836, -42.61454772949219, -41.03827667236328, -39.46200180053711, -37.88572692871094, -36.309452056884766, -34.733177185058594, -33.15690231323242, -31.580629348754883, -30.00435447692871, -28.42807960510254, -26.851806640625, -25.275531768798828, -23.699256896972656, -22.122982025146484, -20.546707153320312, -18.970434188842773, -17.3941593170166, -15.81788444519043, -14.241610527038574, -12.665336608886719, -11.089061737060547, -9.512786865234375, -7.9365129470825195, -6.360238552093506, -4.783964157104492, -3.2076897621154785, -1.6314153671264648, -0.055141448974609375, 1.5211334228515625, 3.097407817840576, 4.67368221282959, 6.2499566078186035, 7.826231002807617, 9.402505874633789, 10.978779792785645, 12.5550537109375, 14.131328582763672, 15.707603454589844, 17.283878326416016, 18.860151290893555, 20.436426162719727, 22.0127010345459, 23.588973999023438, 25.16524887084961, 26.74152374267578, 28.317798614501953, 29.894073486328125, 31.470346450805664, 33.04662322998047, 34.622894287109375, 36.19916915893555, 37.77544403076172, 39.35171890258789, 40.92799377441406, 42.504268646240234, 44.080543518066406, 45.65681457519531, 47.233089447021484, 48.809364318847656, 50.38563919067383, 51.9619140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 14.0, 21.0, 21.0, 14.0, 25.0, 24.0, 42.0, 38.0, 30.0, 36.0, 48.0, 34.0, 33.0, 44.0, 52.0, 59.0, 50.0, 44.0, 39.0, 45.0, 46.0, 38.0, 30.0, 22.0, 27.0, 22.0, 20.0, 18.0, 12.0, 12.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.48248291015625, -7.2540283203125, -7.02557373046875, -6.797119140625, -6.56866455078125, -6.3402099609375, -6.11175537109375, -5.88330078125, -5.65484619140625, -5.4263916015625, -5.19793701171875, -4.969482421875, -4.74102783203125, -4.5125732421875, -4.28411865234375, -4.0556640625, -3.82720947265625, -3.5987548828125, -3.37030029296875, -3.141845703125, -2.91339111328125, -2.6849365234375, -2.45648193359375, -2.22802734375, -1.99957275390625, -1.7711181640625, -1.54266357421875, -1.314208984375, -1.08575439453125, -0.8572998046875, -0.62884521484375, -0.400390625, -0.17193603515625, 0.0565185546875, 0.28497314453125, 0.513427734375, 0.74188232421875, 0.9703369140625, 1.19879150390625, 1.42724609375, 1.65570068359375, 1.8841552734375, 2.11260986328125, 2.341064453125, 2.56951904296875, 2.7979736328125, 3.02642822265625, 3.2548828125, 3.48333740234375, 3.7117919921875, 3.94024658203125, 4.168701171875, 4.39715576171875, 4.6256103515625, 4.85406494140625, 5.08251953125, 5.31097412109375, 5.5394287109375, 5.76788330078125, 5.996337890625, 6.22479248046875, 6.4532470703125, 6.68170166015625, 6.91015625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 11.0, 8.0, 21.0, 35.0, 48.0, 70.0, 103.0, 135.0, 239.0, 402.0, 581.0, 851.0, 1368.0, 2148.0, 3559.0, 5660.0, 9228.0, 14969.0, 24545.0, 40881.0, 68386.0, 121283.0, 235941.0, 230607.0, 118275.0, 66884.0, 39696.0, 24247.0, 14510.0, 8974.0, 5524.0, 3426.0, 2076.0, 1449.0, 837.0, 530.0, 361.0, 256.0, 139.0, 90.0, 71.0, 51.0, 25.0, 19.0, 13.0, 8.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.021392822265625, -0.98614501953125, -0.950897216796875, -0.9156494140625, -0.880401611328125, -0.84515380859375, -0.809906005859375, -0.774658203125, -0.739410400390625, -0.70416259765625, -0.668914794921875, -0.6336669921875, -0.598419189453125, -0.56317138671875, -0.527923583984375, -0.49267578125, -0.457427978515625, -0.42218017578125, -0.386932373046875, -0.3516845703125, -0.316436767578125, -0.28118896484375, -0.245941162109375, -0.210693359375, -0.175445556640625, -0.14019775390625, -0.104949951171875, -0.0697021484375, -0.034454345703125, 0.00079345703125, 0.036041259765625, 0.0712890625, 0.106536865234375, 0.14178466796875, 0.177032470703125, 0.2122802734375, 0.247528076171875, 0.28277587890625, 0.318023681640625, 0.353271484375, 0.388519287109375, 0.42376708984375, 0.459014892578125, 0.4942626953125, 0.529510498046875, 0.56475830078125, 0.600006103515625, 0.63525390625, 0.670501708984375, 0.70574951171875, 0.740997314453125, 0.7762451171875, 0.811492919921875, 0.84674072265625, 0.881988525390625, 0.917236328125, 0.952484130859375, 0.98773193359375, 1.022979736328125, 1.0582275390625, 1.093475341796875, 1.12872314453125, 1.163970947265625, 1.19921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 11.0, 11.0, 18.0, 19.0, 16.0, 15.0, 26.0, 26.0, 27.0, 32.0, 28.0, 24.0, 34.0, 37.0, 32.0, 38.0, 39.0, 1081.0, 33.0, 30.0, 38.0, 42.0, 46.0, 32.0, 47.0, 23.0, 30.0, 33.0, 27.0, 17.0, 20.0, 12.0, 12.0, 8.0, 12.0, 5.0, 3.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.3671875, -4.237152099609375, -4.10711669921875, -3.977081298828125, -3.8470458984375, -3.717010498046875, -3.58697509765625, -3.456939697265625, -3.326904296875, -3.196868896484375, -3.06683349609375, -2.936798095703125, -2.8067626953125, -2.676727294921875, -2.54669189453125, -2.416656494140625, -2.28662109375, -2.156585693359375, -2.02655029296875, -1.896514892578125, -1.7664794921875, -1.636444091796875, -1.50640869140625, -1.376373291015625, -1.246337890625, -1.116302490234375, -0.98626708984375, -0.856231689453125, -0.7261962890625, -0.596160888671875, -0.46612548828125, -0.336090087890625, -0.2060546875, -0.076019287109375, 0.05401611328125, 0.184051513671875, 0.3140869140625, 0.444122314453125, 0.57415771484375, 0.704193115234375, 0.834228515625, 0.964263916015625, 1.09429931640625, 1.224334716796875, 1.3543701171875, 1.484405517578125, 1.61444091796875, 1.744476318359375, 1.87451171875, 2.004547119140625, 2.13458251953125, 2.264617919921875, 2.3946533203125, 2.524688720703125, 2.65472412109375, 2.784759521484375, 2.914794921875, 3.044830322265625, 3.17486572265625, 3.304901123046875, 3.4349365234375, 3.564971923828125, 3.69500732421875, 3.825042724609375, 3.955078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 8.0, 10.0, 10.0, 9.0, 32.0, 35.0, 45.0, 79.0, 118.0, 205.0, 281.0, 445.0, 633.0, 944.0, 1404.0, 2033.0, 3222.0, 4869.0, 7306.0, 11425.0, 17637.0, 27430.0, 43137.0, 69060.0, 113360.0, 204137.0, 1266911.0, 121157.0, 73469.0, 45648.0, 28908.0, 18343.0, 11704.0, 7883.0, 5112.0, 3407.0, 2282.0, 1526.0, 937.0, 610.0, 439.0, 305.0, 218.0, 140.0, 84.0, 71.0, 51.0, 22.0, 15.0, 14.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89501953125, -0.8652420043945312, -0.8354644775390625, -0.8056869506835938, -0.775909423828125, -0.7461318969726562, -0.7163543701171875, -0.6865768432617188, -0.65679931640625, -0.6270217895507812, -0.5972442626953125, -0.5674667358398438, -0.537689208984375, -0.5079116821289062, -0.4781341552734375, -0.44835662841796875, -0.4185791015625, -0.38880157470703125, -0.3590240478515625, -0.32924652099609375, -0.299468994140625, -0.26969146728515625, -0.2399139404296875, -0.21013641357421875, -0.18035888671875, -0.15058135986328125, -0.1208038330078125, -0.09102630615234375, -0.061248779296875, -0.03147125244140625, -0.0016937255859375, 0.02808380126953125, 0.057861328125, 0.08763885498046875, 0.1174163818359375, 0.14719390869140625, 0.176971435546875, 0.20674896240234375, 0.2365264892578125, 0.26630401611328125, 0.29608154296875, 0.32585906982421875, 0.3556365966796875, 0.38541412353515625, 0.415191650390625, 0.44496917724609375, 0.4747467041015625, 0.5045242309570312, 0.5343017578125, 0.5640792846679688, 0.5938568115234375, 0.6236343383789062, 0.653411865234375, 0.6831893920898438, 0.7129669189453125, 0.7427444458007812, 0.77252197265625, 0.8022994995117188, 0.8320770263671875, 0.8618545532226562, 0.891632080078125, 0.9214096069335938, 0.9511871337890625, 0.9809646606445312, 1.0107421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 10.0, 7.0, 14.0, 22.0, 26.0, 26.0, 33.0, 34.0, 53.0, 64.0, 72.0, 82.0, 89.0, 82.0, 74.0, 57.0, 45.0, 44.0, 23.0, 35.0, 13.0, 14.0, 12.0, 13.0, 15.0, 6.0, 6.0, 10.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005064010620117188, -0.00048795342445373535, -0.00046950578689575195, -0.00045105814933776855, -0.00043261051177978516, -0.00041416287422180176, -0.00039571523666381836, -0.00037726759910583496, -0.00035881996154785156, -0.00034037232398986816, -0.00032192468643188477, -0.00030347704887390137, -0.00028502941131591797, -0.00026658177375793457, -0.00024813413619995117, -0.00022968649864196777, -0.00021123886108398438, -0.00019279122352600098, -0.00017434358596801758, -0.00015589594841003418, -0.00013744831085205078, -0.00011900067329406738, -0.00010055303573608398, -8.210539817810059e-05, -6.365776062011719e-05, -4.521012306213379e-05, -2.676248550415039e-05, -8.314847946166992e-06, 1.0132789611816406e-05, 2.8580427169799805e-05, 4.70280647277832e-05, 6.54757022857666e-05, 8.392333984375e-05, 0.0001023709774017334, 0.0001208186149597168, 0.0001392662525177002, 0.0001577138900756836, 0.000176161527633667, 0.0001946091651916504, 0.0002130568027496338, 0.0002315044403076172, 0.0002499520778656006, 0.000268399715423584, 0.0002868473529815674, 0.0003052949905395508, 0.0003237426280975342, 0.0003421902656555176, 0.000360637903213501, 0.0003790855407714844, 0.0003975331783294678, 0.00041598081588745117, 0.00043442845344543457, 0.00045287609100341797, 0.00047132372856140137, 0.0004897713661193848, 0.0005082190036773682, 0.0005266666412353516, 0.000545114278793335, 0.0005635619163513184, 0.0005820095539093018, 0.0006004571914672852, 0.0006189048290252686, 0.000637352466583252, 0.0006558001041412354, 0.0006742477416992188]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 8.0, 13.0, 21.0, 12.0, 29.0, 21.0, 44.0, 49.0, 49.0, 73.0, 115.0, 175.0, 266.0, 391.0, 777.0, 3341.0, 1028392.0, 12477.0, 869.0, 504.0, 287.0, 153.0, 137.0, 85.0, 59.0, 48.0, 45.0, 22.0, 21.0, 19.0, 10.0, 4.0, 10.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0120086669921875, -0.011640310287475586, -0.011271953582763672, -0.010903596878051758, -0.010535240173339844, -0.01016688346862793, -0.009798526763916016, -0.009430170059204102, -0.009061813354492188, -0.008693456649780273, -0.00832509994506836, -0.007956743240356445, -0.007588386535644531, -0.007220029830932617, -0.006851673126220703, -0.006483316421508789, -0.006114959716796875, -0.005746603012084961, -0.005378246307373047, -0.005009889602661133, -0.004641532897949219, -0.004273176193237305, -0.0039048194885253906, -0.0035364627838134766, -0.0031681060791015625, -0.0027997493743896484, -0.0024313926696777344, -0.0020630359649658203, -0.0016946792602539062, -0.0013263225555419922, -0.0009579658508300781, -0.0005896091461181641, -0.00022125244140625, 0.00014710426330566406, 0.0005154609680175781, 0.0008838176727294922, 0.0012521743774414062, 0.0016205310821533203, 0.0019888877868652344, 0.0023572444915771484, 0.0027256011962890625, 0.0030939579010009766, 0.0034623146057128906, 0.0038306713104248047, 0.004199028015136719, 0.004567384719848633, 0.004935741424560547, 0.005304098129272461, 0.005672454833984375, 0.006040811538696289, 0.006409168243408203, 0.006777524948120117, 0.007145881652832031, 0.007514238357543945, 0.00788259506225586, 0.008250951766967773, 0.008619308471679688, 0.008987665176391602, 0.009356021881103516, 0.00972437858581543, 0.010092735290527344, 0.010461091995239258, 0.010829448699951172, 0.011197805404663086, 0.011566162109375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 42.0, 417.0, 478.0, 71.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007842280901968479, -0.0007322087767533958, -0.0006801894633099437, -0.0006281701498664916, -0.0005761508364230394, -0.0005241315229795873, -0.0004721122095361352, -0.0004200928960926831, -0.00036807358264923096, -0.00031605426920577884, -0.0002640349557623267, -0.0002120156423188746, -0.00015999632887542248, -0.00010797701543197036, -5.595770198851824e-05, -3.938388545066118e-06, 4.8080924898386e-05, 0.00010010023834183812, 0.00015211955178529024, 0.00020413886522874236, 0.0002561581786721945, 0.0003081774921156466, 0.0003601968055590987, 0.00041221611900255084, 0.00046423543244600296, 0.0005162547458894551, 0.0005682740593329072, 0.0006202933727763593, 0.0006723126862198114, 0.0007243319996632636, 0.0007763513131067157, 0.0008283706265501678, 0.0008803899399936199, 0.000932409253437072, 0.0009844285668805242, 0.0010364479385316372, 0.0010884671937674284, 0.0011404864490032196, 0.0011925058206543326, 0.0012445251923054457, 0.0012965444475412369, 0.001348563702777028, 0.0014005830744281411, 0.0014526024460792542, 0.0015046217013150454, 0.0015566409565508366, 0.0016086603282019496, 0.0016606796998530626, 0.0017126989550888538, 0.001764718210324645, 0.001816737581975758, 0.0018687569536268711, 0.0019207762088626623, 0.0019727954640984535, 0.0020248149521648884, 0.0020768342074006796, 0.002128853462636471, 0.002180872717872262, 0.002232891973108053, 0.002284911461174488, 0.0023369307164102793, 0.0023889499716460705, 0.0024409694597125053, 0.0024929887149482965, 0.0025450079701840878]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 5.0, 9.0, 6.0, 8.0, 13.0, 20.0, 14.0, 15.0, 26.0, 25.0, 25.0, 21.0, 29.0, 37.0, 44.0, 43.0, 40.0, 35.0, 43.0, 45.0, 40.0, 52.0, 47.0, 37.0, 41.0, 41.0, 36.0, 38.0, 27.0, 19.0, 27.0, 24.0, 16.0, 11.0, 8.0, 8.0, 8.0, 2.0, 4.0, 2.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002828240394592285, -0.0002743285149335861, -0.0002658329904079437, -0.00025733746588230133, -0.00024884194135665894, -0.00024034641683101654, -0.00023185089230537415, -0.00022335536777973175, -0.00021485984325408936, -0.00020636431872844696, -0.00019786879420280457, -0.00018937326967716217, -0.00018087774515151978, -0.00017238222062587738, -0.00016388669610023499, -0.0001553911715745926, -0.0001468956470489502, -0.0001384001225233078, -0.0001299045979976654, -0.00012140907347202301, -0.00011291354894638062, -0.00010441802442073822, -9.592249989509583e-05, -8.742697536945343e-05, -7.893145084381104e-05, -7.043592631816864e-05, -6.194040179252625e-05, -5.344487726688385e-05, -4.4949352741241455e-05, -3.645382821559906e-05, -2.7958303689956665e-05, -1.946277916431427e-05, -1.0967254638671875e-05, -2.47173011302948e-06, 6.023794412612915e-06, 1.451931893825531e-05, 2.3014843463897705e-05, 3.15103679895401e-05, 4.0005892515182495e-05, 4.850141704082489e-05, 5.6996941566467285e-05, 6.549246609210968e-05, 7.398799061775208e-05, 8.248351514339447e-05, 9.097903966903687e-05, 9.947456419467926e-05, 0.00010797008872032166, 0.00011646561324596405, 0.00012496113777160645, 0.00013345666229724884, 0.00014195218682289124, 0.00015044771134853363, 0.00015894323587417603, 0.00016743876039981842, 0.00017593428492546082, 0.0001844298094511032, 0.0001929253339767456, 0.000201420858502388, 0.0002099163830280304, 0.0002184119075536728, 0.00022690743207931519, 0.00023540295660495758, 0.00024389848113059998, 0.00025239400565624237, 0.00026088953018188477]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 14.0, 21.0, 21.0, 14.0, 25.0, 24.0, 42.0, 38.0, 30.0, 36.0, 48.0, 34.0, 33.0, 44.0, 52.0, 59.0, 50.0, 44.0, 39.0, 45.0, 46.0, 38.0, 30.0, 22.0, 27.0, 22.0, 20.0, 18.0, 12.0, 12.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.48248291015625, -7.2540283203125, -7.02557373046875, -6.797119140625, -6.56866455078125, -6.3402099609375, -6.11175537109375, -5.88330078125, -5.65484619140625, -5.4263916015625, -5.19793701171875, -4.969482421875, -4.74102783203125, -4.5125732421875, -4.28411865234375, -4.0556640625, -3.82720947265625, -3.5987548828125, -3.37030029296875, -3.141845703125, -2.91339111328125, -2.6849365234375, -2.45648193359375, -2.22802734375, -1.99957275390625, -1.7711181640625, -1.54266357421875, -1.314208984375, -1.08575439453125, -0.8572998046875, -0.62884521484375, -0.400390625, -0.17193603515625, 0.0565185546875, 0.28497314453125, 0.513427734375, 0.74188232421875, 0.9703369140625, 1.19879150390625, 1.42724609375, 1.65570068359375, 1.8841552734375, 2.11260986328125, 2.341064453125, 2.56951904296875, 2.7979736328125, 3.02642822265625, 3.2548828125, 3.48333740234375, 3.7117919921875, 3.94024658203125, 4.168701171875, 4.39715576171875, 4.6256103515625, 4.85406494140625, 5.08251953125, 5.31097412109375, 5.5394287109375, 5.76788330078125, 5.996337890625, 6.22479248046875, 6.4532470703125, 6.68170166015625, 6.91015625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 12.0, 15.0, 11.0, 20.0, 39.0, 60.0, 79.0, 136.0, 201.0, 292.0, 424.0, 677.0, 1091.0, 1732.0, 3107.0, 6679.0, 27989.0, 373184.0, 574544.0, 41568.0, 8039.0, 3390.0, 1919.0, 1171.0, 769.0, 489.0, 319.0, 184.0, 112.0, 90.0, 73.0, 49.0, 25.0, 14.0, 24.0, 3.0, 4.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.55712890625, -16.9736328125, -16.39013671875, -15.806640625, -15.22314453125, -14.6396484375, -14.05615234375, -13.47265625, -12.88916015625, -12.3056640625, -11.72216796875, -11.138671875, -10.55517578125, -9.9716796875, -9.38818359375, -8.8046875, -8.22119140625, -7.6376953125, -7.05419921875, -6.470703125, -5.88720703125, -5.3037109375, -4.72021484375, -4.13671875, -3.55322265625, -2.9697265625, -2.38623046875, -1.802734375, -1.21923828125, -0.6357421875, -0.05224609375, 0.53125, 1.11474609375, 1.6982421875, 2.28173828125, 2.865234375, 3.44873046875, 4.0322265625, 4.61572265625, 5.19921875, 5.78271484375, 6.3662109375, 6.94970703125, 7.533203125, 8.11669921875, 8.7001953125, 9.28369140625, 9.8671875, 10.45068359375, 11.0341796875, 11.61767578125, 12.201171875, 12.78466796875, 13.3681640625, 13.95166015625, 14.53515625, 15.11865234375, 15.7021484375, 16.28564453125, 16.869140625, 17.45263671875, 18.0361328125, 18.61962890625, 19.203125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 3.0, 7.0, 9.0, 14.0, 17.0, 18.0, 29.0, 33.0, 27.0, 41.0, 46.0, 48.0, 43.0, 79.0, 204.0, 1624.0, 279.0, 97.0, 63.0, 47.0, 57.0, 46.0, 28.0, 43.0, 26.0, 21.0, 12.0, 12.0, 13.0, 9.0, 7.0, 3.0, 6.0, 5.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.875, -18.2978515625, -17.720703125, -17.1435546875, -16.56640625, -15.9892578125, -15.412109375, -14.8349609375, -14.2578125, -13.6806640625, -13.103515625, -12.5263671875, -11.94921875, -11.3720703125, -10.794921875, -10.2177734375, -9.640625, -9.0634765625, -8.486328125, -7.9091796875, -7.33203125, -6.7548828125, -6.177734375, -5.6005859375, -5.0234375, -4.4462890625, -3.869140625, -3.2919921875, -2.71484375, -2.1376953125, -1.560546875, -0.9833984375, -0.40625, 0.1708984375, 0.748046875, 1.3251953125, 1.90234375, 2.4794921875, 3.056640625, 3.6337890625, 4.2109375, 4.7880859375, 5.365234375, 5.9423828125, 6.51953125, 7.0966796875, 7.673828125, 8.2509765625, 8.828125, 9.4052734375, 9.982421875, 10.5595703125, 11.13671875, 11.7138671875, 12.291015625, 12.8681640625, 13.4453125, 14.0224609375, 14.599609375, 15.1767578125, 15.75390625, 16.3310546875, 16.908203125, 17.4853515625, 18.0625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 8.0, 7.0, 4.0, 9.0, 14.0, 29.0, 20.0, 27.0, 40.0, 43.0, 60.0, 57.0, 102.0, 124.0, 168.0, 267.0, 477.0, 1117.0, 7103.0, 3107598.0, 25295.0, 1459.0, 586.0, 305.0, 181.0, 134.0, 107.0, 83.0, 48.0, 57.0, 42.0, 26.0, 19.0, 18.0, 20.0, 9.0, 5.0, 12.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -45.9677734375, -44.466796875, -42.9658203125, -41.46484375, -39.9638671875, -38.462890625, -36.9619140625, -35.4609375, -33.9599609375, -32.458984375, -30.9580078125, -29.45703125, -27.9560546875, -26.455078125, -24.9541015625, -23.453125, -21.9521484375, -20.451171875, -18.9501953125, -17.44921875, -15.9482421875, -14.447265625, -12.9462890625, -11.4453125, -9.9443359375, -8.443359375, -6.9423828125, -5.44140625, -3.9404296875, -2.439453125, -0.9384765625, 0.5625, 2.0634765625, 3.564453125, 5.0654296875, 6.56640625, 8.0673828125, 9.568359375, 11.0693359375, 12.5703125, 14.0712890625, 15.572265625, 17.0732421875, 18.57421875, 20.0751953125, 21.576171875, 23.0771484375, 24.578125, 26.0791015625, 27.580078125, 29.0810546875, 30.58203125, 32.0830078125, 33.583984375, 35.0849609375, 36.5859375, 38.0869140625, 39.587890625, 41.0888671875, 42.58984375, 44.0908203125, 45.591796875, 47.0927734375, 48.59375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 17.0, 40.0, 70.0, 114.0, 164.0, 167.0, 180.0, 107.0, 72.0, 28.0, 20.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.86111831665039, -41.53313446044922, -40.20515060424805, -38.87716293334961, -37.54917907714844, -36.221195220947266, -34.893211364746094, -33.56522750854492, -32.23724365234375, -30.909259796142578, -29.581274032592773, -28.2532901763916, -26.925304412841797, -25.597320556640625, -24.269336700439453, -22.94135284423828, -21.613365173339844, -20.285381317138672, -18.957395553588867, -17.629411697387695, -16.30142593383789, -14.973442077636719, -13.645458221435547, -12.317473411560059, -10.98948860168457, -9.661503791809082, -8.333518981933594, -7.005535125732422, -5.677550315856934, -4.349565505981445, -3.0215811729431152, -1.6935968399047852, -0.36560821533203125, 0.9623763561248779, 2.290360927581787, 3.6183454990386963, 4.9463300704956055, 6.274314880371094, 7.602299213409424, 8.930283546447754, 10.258268356323242, 11.58625316619873, 12.914237976074219, 14.24222183227539, 15.570206642150879, 16.898191452026367, 18.22617530822754, 19.554161071777344, 20.882144927978516, 22.210128784179688, 23.538114547729492, 24.866098403930664, 26.19408416748047, 27.52206802368164, 28.850051879882812, 30.178035736083984, 31.50602149963379, 32.834007263183594, 34.161991119384766, 35.48997497558594, 36.81795883178711, 38.14594268798828, 39.47393035888672, 40.80191421508789, 42.12989807128906]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 9.0, 12.0, 7.0, 14.0, 14.0, 19.0, 18.0, 33.0, 39.0, 26.0, 21.0, 40.0, 41.0, 48.0, 37.0, 39.0, 55.0, 49.0, 47.0, 30.0, 48.0, 31.0, 19.0, 33.0, 36.0, 24.0, 22.0, 34.0, 19.0, 25.0, 16.0, 16.0, 9.0, 14.0, 9.0, 11.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-54.39656066894531, -52.722900390625, -51.04924392700195, -49.37558364868164, -47.701927185058594, -46.02826690673828, -44.354610443115234, -42.68095016479492, -41.007293701171875, -39.33363342285156, -37.659976959228516, -35.9863166809082, -34.312660217285156, -32.638999938964844, -30.965343475341797, -29.291683197021484, -27.618024826049805, -25.944366455078125, -24.270708084106445, -22.597049713134766, -20.923391342163086, -19.249732971191406, -17.576072692871094, -15.90241527557373, -14.22875690460205, -12.555098533630371, -10.881440162658691, -9.207780838012695, -7.534122943878174, -5.860464096069336, -4.186805725097656, -2.5131473541259766, -0.8394889831542969, 0.8341695070266724, 2.5078279972076416, 4.1814866065979, 5.85514497756958, 7.528803825378418, 9.202462196350098, 10.876120567321777, 12.549778938293457, 14.223437309265137, 15.897095680236816, 17.570755004882812, 19.244413375854492, 20.918071746826172, 22.59173011779785, 24.26538848876953, 25.93904685974121, 27.61270523071289, 29.28636360168457, 30.96002197265625, 32.63368225097656, 34.30733871459961, 35.98099899291992, 37.65465545654297, 39.32831573486328, 41.001976013183594, 42.67563247680664, 44.34929275512695, 46.02294921875, 47.69660949707031, 49.37026596069336, 51.04392623901367, 52.71758270263672]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 9.0, 9.0, 4.0, 15.0, 15.0, 16.0, 23.0, 22.0, 20.0, 34.0, 51.0, 33.0, 35.0, 52.0, 58.0, 52.0, 54.0, 41.0, 54.0, 34.0, 46.0, 41.0, 39.0, 37.0, 29.0, 29.0, 26.0, 20.0, 17.0, 34.0, 17.0, 12.0, 5.0, 8.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.140625, -8.8951416015625, -8.649658203125, -8.4041748046875, -8.15869140625, -7.9132080078125, -7.667724609375, -7.4222412109375, -7.1767578125, -6.9312744140625, -6.685791015625, -6.4403076171875, -6.19482421875, -5.9493408203125, -5.703857421875, -5.4583740234375, -5.212890625, -4.9674072265625, -4.721923828125, -4.4764404296875, -4.23095703125, -3.9854736328125, -3.739990234375, -3.4945068359375, -3.2490234375, -3.0035400390625, -2.758056640625, -2.5125732421875, -2.26708984375, -2.0216064453125, -1.776123046875, -1.5306396484375, -1.28515625, -1.0396728515625, -0.794189453125, -0.5487060546875, -0.30322265625, -0.0577392578125, 0.187744140625, 0.4332275390625, 0.6787109375, 0.9241943359375, 1.169677734375, 1.4151611328125, 1.66064453125, 1.9061279296875, 2.151611328125, 2.3970947265625, 2.642578125, 2.8880615234375, 3.133544921875, 3.3790283203125, 3.62451171875, 3.8699951171875, 4.115478515625, 4.3609619140625, 4.6064453125, 4.8519287109375, 5.097412109375, 5.3428955078125, 5.58837890625, 5.8338623046875, 6.079345703125, 6.3248291015625, 6.5703125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 14.0, 24.0, 26.0, 21.0, 43.0, 36.0, 76.0, 95.0, 145.0, 183.0, 325.0, 469.0, 785.0, 1252.0, 2412.0, 5423.0, 15014.0, 66552.0, 489791.0, 2062971.0, 1298972.0, 198383.0, 33438.0, 9602.0, 3630.0, 1808.0, 1013.0, 566.0, 371.0, 266.0, 157.0, 113.0, 81.0, 69.0, 41.0, 28.0, 24.0, 12.0, 15.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0], "bins": [-12.5234375, -12.1734619140625, -11.823486328125, -11.4735107421875, -11.12353515625, -10.7735595703125, -10.423583984375, -10.0736083984375, -9.7236328125, -9.3736572265625, -9.023681640625, -8.6737060546875, -8.32373046875, -7.9737548828125, -7.623779296875, -7.2738037109375, -6.923828125, -6.5738525390625, -6.223876953125, -5.8739013671875, -5.52392578125, -5.1739501953125, -4.823974609375, -4.4739990234375, -4.1240234375, -3.7740478515625, -3.424072265625, -3.0740966796875, -2.72412109375, -2.3741455078125, -2.024169921875, -1.6741943359375, -1.32421875, -0.9742431640625, -0.624267578125, -0.2742919921875, 0.07568359375, 0.4256591796875, 0.775634765625, 1.1256103515625, 1.4755859375, 1.8255615234375, 2.175537109375, 2.5255126953125, 2.87548828125, 3.2254638671875, 3.575439453125, 3.9254150390625, 4.275390625, 4.6253662109375, 4.975341796875, 5.3253173828125, 5.67529296875, 6.0252685546875, 6.375244140625, 6.7252197265625, 7.0751953125, 7.4251708984375, 7.775146484375, 8.1251220703125, 8.47509765625, 8.8250732421875, 9.175048828125, 9.5250244140625, 9.875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 13.0, 15.0, 41.0, 108.0, 393.0, 1098.0, 1620.0, 561.0, 167.0, 50.0, 10.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.03125, -41.650390625, -40.26953125, -38.888671875, -37.5078125, -36.126953125, -34.74609375, -33.365234375, -31.984375, -30.603515625, -29.22265625, -27.841796875, -26.4609375, -25.080078125, -23.69921875, -22.318359375, -20.9375, -19.556640625, -18.17578125, -16.794921875, -15.4140625, -14.033203125, -12.65234375, -11.271484375, -9.890625, -8.509765625, -7.12890625, -5.748046875, -4.3671875, -2.986328125, -1.60546875, -0.224609375, 1.15625, 2.537109375, 3.91796875, 5.298828125, 6.6796875, 8.060546875, 9.44140625, 10.822265625, 12.203125, 13.583984375, 14.96484375, 16.345703125, 17.7265625, 19.107421875, 20.48828125, 21.869140625, 23.25, 24.630859375, 26.01171875, 27.392578125, 28.7734375, 30.154296875, 31.53515625, 32.916015625, 34.296875, 35.677734375, 37.05859375, 38.439453125, 39.8203125, 41.201171875, 42.58203125, 43.962890625, 45.34375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 4.0, 19.0, 42.0, 75.0, 205.0, 756.0, 4187.0, 4170022.0, 17055.0, 1309.0, 360.0, 130.0, 48.0, 21.0, 12.0, 8.0, 8.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.3125, -87.548828125, -84.78515625, -82.021484375, -79.2578125, -76.494140625, -73.73046875, -70.966796875, -68.203125, -65.439453125, -62.67578125, -59.912109375, -57.1484375, -54.384765625, -51.62109375, -48.857421875, -46.09375, -43.330078125, -40.56640625, -37.802734375, -35.0390625, -32.275390625, -29.51171875, -26.748046875, -23.984375, -21.220703125, -18.45703125, -15.693359375, -12.9296875, -10.166015625, -7.40234375, -4.638671875, -1.875, 0.888671875, 3.65234375, 6.416015625, 9.1796875, 11.943359375, 14.70703125, 17.470703125, 20.234375, 22.998046875, 25.76171875, 28.525390625, 31.2890625, 34.052734375, 36.81640625, 39.580078125, 42.34375, 45.107421875, 47.87109375, 50.634765625, 53.3984375, 56.162109375, 58.92578125, 61.689453125, 64.453125, 67.216796875, 69.98046875, 72.744140625, 75.5078125, 78.271484375, 81.03515625, 83.798828125, 86.5625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 85.0, 592.0, 319.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.76255798339844, -240.84356689453125, -233.92457580566406, -227.00558471679688, -220.08657836914062, -213.16758728027344, -206.24859619140625, -199.32960510253906, -192.41061401367188, -185.4916229248047, -178.5726318359375, -171.65362548828125, -164.73463439941406, -157.81564331054688, -150.8966522216797, -143.9776611328125, -137.05865478515625, -130.13966369628906, -123.22066497802734, -116.30167388916016, -109.38267517089844, -102.46368408203125, -95.54469299316406, -88.62570190429688, -81.70670318603516, -74.78771209716797, -67.86871337890625, -60.94972229003906, -54.03072738647461, -47.111732482910156, -40.19274139404297, -33.273746490478516, -26.354736328125, -19.435741424560547, -12.516748428344727, -5.597755432128906, 1.3212394714355469, 8.240234375, 15.159225463867188, 22.07822036743164, 28.997215270996094, 35.91621017456055, 42.835205078125, 49.75419616699219, 56.67319107055664, 63.592185974121094, 70.51117706298828, 77.43017578125, 84.34916687011719, 91.26815795898438, 98.1871566772461, 105.10614776611328, 112.025146484375, 118.94413757324219, 125.86312866210938, 132.78211975097656, 139.70111083984375, 146.62010192871094, 153.53909301757812, 160.45809936523438, 167.37709045410156, 174.29608154296875, 181.21507263183594, 188.13406372070312, 195.05307006835938]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 7.0, 13.0, 12.0, 14.0, 14.0, 18.0, 18.0, 31.0, 30.0, 29.0, 29.0, 26.0, 55.0, 52.0, 41.0, 48.0, 42.0, 34.0, 46.0, 29.0, 48.0, 38.0, 38.0, 32.0, 28.0, 36.0, 23.0, 23.0, 26.0, 17.0, 19.0, 26.0, 9.0, 9.0, 6.0, 6.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.628509521484375, -38.98917770385742, -37.3498420715332, -35.71051025390625, -34.0711784362793, -32.431846618652344, -30.792510986328125, -29.153179168701172, -27.513845443725586, -25.87451171875, -24.235179901123047, -22.59584617614746, -20.956512451171875, -19.317180633544922, -17.677846908569336, -16.03851318359375, -14.399181365966797, -12.759848594665527, -11.120515823364258, -9.481182098388672, -7.841849327087402, -6.202516555786133, -4.563182830810547, -2.9238500595092773, -1.2845172882080078, 0.3548157215118408, 1.9941487312316895, 3.633481979370117, 5.272814750671387, 6.912147521972656, 8.551481246948242, 10.190814018249512, 11.830146789550781, 13.46947956085205, 15.10881233215332, 16.748146057128906, 18.38747787475586, 20.026811599731445, 21.66614532470703, 23.305477142333984, 24.94481086730957, 26.584144592285156, 28.22347640991211, 29.862810134887695, 31.50214385986328, 33.141475677490234, 34.78080749511719, 36.420143127441406, 38.05947494506836, 39.69880676269531, 41.33814239501953, 42.977474212646484, 44.61680603027344, 46.256141662597656, 47.89547348022461, 49.53480529785156, 51.17414093017578, 52.813472747802734, 54.45280838012695, 56.092140197753906, 57.73147201538086, 59.37080383300781, 61.01013946533203, 62.649471282958984, 64.28880310058594]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 12.0, 7.0, 13.0, 12.0, 12.0, 13.0, 15.0, 18.0, 25.0, 25.0, 28.0, 23.0, 26.0, 41.0, 38.0, 35.0, 37.0, 42.0, 43.0, 51.0, 38.0, 36.0, 30.0, 38.0, 44.0, 27.0, 29.0, 32.0, 31.0, 25.0, 18.0, 21.0, 14.0, 14.0, 11.0, 6.0, 9.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.62109375, -4.46685791015625, -4.3126220703125, -4.15838623046875, -4.004150390625, -3.84991455078125, -3.6956787109375, -3.54144287109375, -3.38720703125, -3.23297119140625, -3.0787353515625, -2.92449951171875, -2.770263671875, -2.61602783203125, -2.4617919921875, -2.30755615234375, -2.1533203125, -1.99908447265625, -1.8448486328125, -1.69061279296875, -1.536376953125, -1.38214111328125, -1.2279052734375, -1.07366943359375, -0.91943359375, -0.76519775390625, -0.6109619140625, -0.45672607421875, -0.302490234375, -0.14825439453125, 0.0059814453125, 0.16021728515625, 0.314453125, 0.46868896484375, 0.6229248046875, 0.77716064453125, 0.931396484375, 1.08563232421875, 1.2398681640625, 1.39410400390625, 1.54833984375, 1.70257568359375, 1.8568115234375, 2.01104736328125, 2.165283203125, 2.31951904296875, 2.4737548828125, 2.62799072265625, 2.7822265625, 2.93646240234375, 3.0906982421875, 3.24493408203125, 3.399169921875, 3.55340576171875, 3.7076416015625, 3.86187744140625, 4.01611328125, 4.17034912109375, 4.3245849609375, 4.47882080078125, 4.633056640625, 4.78729248046875, 4.9415283203125, 5.09576416015625, 5.25]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 17.0, 10.0, 29.0, 60.0, 76.0, 120.0, 199.0, 333.0, 531.0, 823.0, 1387.0, 2300.0, 3780.0, 6559.0, 11006.0, 18940.0, 32984.0, 59873.0, 112297.0, 224341.0, 271457.0, 136546.0, 71385.0, 39389.0, 22318.0, 12918.0, 7511.0, 4451.0, 2707.0, 1603.0, 946.0, 589.0, 384.0, 262.0, 150.0, 92.0, 51.0, 44.0, 22.0, 14.0, 14.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.962890625, -0.9298553466796875, -0.896820068359375, -0.8637847900390625, -0.83074951171875, -0.7977142333984375, -0.764678955078125, -0.7316436767578125, -0.6986083984375, -0.6655731201171875, -0.632537841796875, -0.5995025634765625, -0.56646728515625, -0.5334320068359375, -0.500396728515625, -0.4673614501953125, -0.434326171875, -0.4012908935546875, -0.368255615234375, -0.3352203369140625, -0.30218505859375, -0.2691497802734375, -0.236114501953125, -0.2030792236328125, -0.1700439453125, -0.1370086669921875, -0.103973388671875, -0.0709381103515625, -0.03790283203125, -0.0048675537109375, 0.028167724609375, 0.0612030029296875, 0.09423828125, 0.1272735595703125, 0.160308837890625, 0.1933441162109375, 0.22637939453125, 0.2594146728515625, 0.292449951171875, 0.3254852294921875, 0.3585205078125, 0.3915557861328125, 0.424591064453125, 0.4576263427734375, 0.49066162109375, 0.5236968994140625, 0.556732177734375, 0.5897674560546875, 0.622802734375, 0.6558380126953125, 0.688873291015625, 0.7219085693359375, 0.75494384765625, 0.7879791259765625, 0.821014404296875, 0.8540496826171875, 0.8870849609375, 0.9201202392578125, 0.953155517578125, 0.9861907958984375, 1.01922607421875, 1.0522613525390625, 1.085296630859375, 1.1183319091796875, 1.1513671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 14.0, 11.0, 18.0, 13.0, 12.0, 29.0, 26.0, 21.0, 25.0, 27.0, 34.0, 33.0, 37.0, 59.0, 44.0, 30.0, 1086.0, 34.0, 45.0, 45.0, 43.0, 39.0, 39.0, 32.0, 31.0, 25.0, 25.0, 26.0, 14.0, 18.0, 21.0, 10.0, 5.0, 9.0, 9.0, 7.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.10302734375, -2.9912109375, -2.87939453125, -2.767578125, -2.65576171875, -2.5439453125, -2.43212890625, -2.3203125, -2.20849609375, -2.0966796875, -1.98486328125, -1.873046875, -1.76123046875, -1.6494140625, -1.53759765625, -1.42578125, -1.31396484375, -1.2021484375, -1.09033203125, -0.978515625, -0.86669921875, -0.7548828125, -0.64306640625, -0.53125, -0.41943359375, -0.3076171875, -0.19580078125, -0.083984375, 0.02783203125, 0.1396484375, 0.25146484375, 0.36328125, 0.47509765625, 0.5869140625, 0.69873046875, 0.810546875, 0.92236328125, 1.0341796875, 1.14599609375, 1.2578125, 1.36962890625, 1.4814453125, 1.59326171875, 1.705078125, 1.81689453125, 1.9287109375, 2.04052734375, 2.15234375, 2.26416015625, 2.3759765625, 2.48779296875, 2.599609375, 2.71142578125, 2.8232421875, 2.93505859375, 3.046875, 3.15869140625, 3.2705078125, 3.38232421875, 3.494140625, 3.60595703125, 3.7177734375, 3.82958984375, 3.94140625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 11.0, 24.0, 20.0, 53.0, 73.0, 115.0, 152.0, 261.0, 377.0, 560.0, 819.0, 1430.0, 2106.0, 3165.0, 4943.0, 7481.0, 11731.0, 18655.0, 29653.0, 48221.0, 80743.0, 144426.0, 1299193.0, 184080.0, 101107.0, 59432.0, 36068.0, 22623.0, 14003.0, 9042.0, 5726.0, 3860.0, 2417.0, 1577.0, 1022.0, 708.0, 445.0, 272.0, 191.0, 113.0, 88.0, 49.0, 35.0, 18.0, 16.0, 7.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.86572265625, -0.8400344848632812, -0.8143463134765625, -0.7886581420898438, -0.762969970703125, -0.7372817993164062, -0.7115936279296875, -0.6859054565429688, -0.66021728515625, -0.6345291137695312, -0.6088409423828125, -0.5831527709960938, -0.557464599609375, -0.5317764282226562, -0.5060882568359375, -0.48040008544921875, -0.4547119140625, -0.42902374267578125, -0.4033355712890625, -0.37764739990234375, -0.351959228515625, -0.32627105712890625, -0.3005828857421875, -0.27489471435546875, -0.24920654296875, -0.22351837158203125, -0.1978302001953125, -0.17214202880859375, -0.146453857421875, -0.12076568603515625, -0.0950775146484375, -0.06938934326171875, -0.043701171875, -0.01801300048828125, 0.0076751708984375, 0.03336334228515625, 0.059051513671875, 0.08473968505859375, 0.1104278564453125, 0.13611602783203125, 0.16180419921875, 0.18749237060546875, 0.2131805419921875, 0.23886871337890625, 0.264556884765625, 0.29024505615234375, 0.3159332275390625, 0.34162139892578125, 0.3673095703125, 0.39299774169921875, 0.4186859130859375, 0.44437408447265625, 0.470062255859375, 0.49575042724609375, 0.5214385986328125, 0.5471267700195312, 0.57281494140625, 0.5985031127929688, 0.6241912841796875, 0.6498794555664062, 0.675567626953125, 0.7012557983398438, 0.7269439697265625, 0.7526321411132812, 0.7783203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 11.0, 13.0, 19.0, 31.0, 29.0, 38.0, 52.0, 54.0, 73.0, 66.0, 76.0, 68.0, 74.0, 71.0, 61.0, 51.0, 35.0, 31.0, 17.0, 16.0, 19.0, 17.0, 7.0, 8.0, 7.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007786750793457031, -0.0007538646459579468, -0.0007290542125701904, -0.0007042437791824341, -0.0006794333457946777, -0.0006546229124069214, -0.000629812479019165, -0.0006050020456314087, -0.0005801916122436523, -0.000555381178855896, -0.0005305707454681396, -0.0005057603120803833, -0.00048094987869262695, -0.0004561394453048706, -0.00043132901191711426, -0.0004065185785293579, -0.00038170814514160156, -0.0003568977117538452, -0.00033208727836608887, -0.0003072768449783325, -0.00028246641159057617, -0.0002576559782028198, -0.00023284554481506348, -0.00020803511142730713, -0.00018322467803955078, -0.00015841424465179443, -0.00013360381126403809, -0.00010879337787628174, -8.398294448852539e-05, -5.917251110076904e-05, -3.4362077713012695e-05, -9.551644325256348e-06, 1.52587890625e-05, 4.006922245025635e-05, 6.48796558380127e-05, 8.969008922576904e-05, 0.00011450052261352539, 0.00013931095600128174, 0.00016412138938903809, 0.00018893182277679443, 0.00021374225616455078, 0.00023855268955230713, 0.0002633631229400635, 0.0002881735563278198, 0.00031298398971557617, 0.0003377944231033325, 0.00036260485649108887, 0.0003874152898788452, 0.00041222572326660156, 0.0004370361566543579, 0.00046184659004211426, 0.0004866570234298706, 0.000511467456817627, 0.0005362778902053833, 0.0005610883235931396, 0.000585898756980896, 0.0006107091903686523, 0.0006355196237564087, 0.000660330057144165, 0.0006851404905319214, 0.0007099509239196777, 0.0007347613573074341, 0.0007595717906951904, 0.0007843822240829468, 0.0008091926574707031]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 11.0, 12.0, 13.0, 18.0, 15.0, 33.0, 31.0, 34.0, 53.0, 72.0, 92.0, 144.0, 218.0, 280.0, 497.0, 1020.0, 23066.0, 1019262.0, 1576.0, 707.0, 397.0, 254.0, 175.0, 146.0, 96.0, 69.0, 55.0, 46.0, 35.0, 28.0, 18.0, 21.0, 12.0, 12.0, 4.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01226806640625, -0.011887550354003906, -0.011507034301757812, -0.011126518249511719, -0.010746002197265625, -0.010365486145019531, -0.009984970092773438, -0.009604454040527344, -0.00922393798828125, -0.008843421936035156, -0.008462905883789062, -0.008082389831542969, -0.007701873779296875, -0.007321357727050781, -0.0069408416748046875, -0.006560325622558594, -0.0061798095703125, -0.005799293518066406, -0.0054187774658203125, -0.005038261413574219, -0.004657745361328125, -0.004277229309082031, -0.0038967132568359375, -0.0035161972045898438, -0.00313568115234375, -0.0027551651000976562, -0.0023746490478515625, -0.0019941329956054688, -0.001613616943359375, -0.0012331008911132812, -0.0008525848388671875, -0.00047206878662109375, -9.1552734375e-05, 0.00028896331787109375, 0.0006694793701171875, 0.0010499954223632812, 0.001430511474609375, 0.0018110275268554688, 0.0021915435791015625, 0.0025720596313476562, 0.00295257568359375, 0.0033330917358398438, 0.0037136077880859375, 0.004094123840332031, 0.004474639892578125, 0.004855155944824219, 0.0052356719970703125, 0.005616188049316406, 0.0059967041015625, 0.006377220153808594, 0.0067577362060546875, 0.007138252258300781, 0.007518768310546875, 0.007899284362792969, 0.008279800415039062, 0.008660316467285156, 0.00904083251953125, 0.009421348571777344, 0.009801864624023438, 0.010182380676269531, 0.010562896728515625, 0.010943412780761719, 0.011323928833007812, 0.011704444885253906, 0.0120849609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 815.0, 192.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019121458753943443, -0.0018243335653096437, -0.0017365212552249432, -0.0016487089451402426, -0.0015608965186402202, -0.0014730842085555196, -0.001385271898470819, -0.0012974594719707966, -0.001209647161886096, -0.0011218348518013954, -0.0010340225417166948, -0.0009462101734243333, -0.0008583978051319718, -0.0007705854950472713, -0.0006827731849625707, -0.0005949608166702092, -0.0005071485647931695, -0.00041933622560463846, -0.0003315238864161074, -0.00024371157633140683, -0.0001558992371428758, -6.808689795434475e-05, 1.9725412130355835e-05, 0.00010753778042271733, 0.00019535009050741792, 0.00028316242969594896, 0.00037097476888448, 0.0004587870789691806, 0.0005465993890538812, 0.0006344117573462427, 0.0007222240674309433, 0.0008100364357233047, 0.0008978487458080053, 0.000985661055892706, 0.0010734733659774065, 0.001161285676062107, 0.0012490981025621295, 0.00133691041264683, 0.0014247227227315307, 0.001512535149231553, 0.0016003474593162537, 0.0016881597694009542, 0.0017759720794856548, 0.0018637843895703554, 0.0019515968160703778, 0.0020394092425704002, 0.002127221319824457, 0.0022150338627398014, 0.0023028459399938583, 0.002390658250078559, 0.0024784705601632595, 0.00256628287024796, 0.0026540951803326607, 0.002741907723248005, 0.002829719800502062, 0.002917532343417406, 0.0030053446535021067, 0.0030931569635868073, 0.003180969273671508, 0.0032687815837562084, 0.003356593893840909, 0.0034444062039256096, 0.003532218746840954, 0.0036200310569256544, 0.003707843367010355]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 6.0, 4.0, 10.0, 10.0, 10.0, 9.0, 11.0, 13.0, 17.0, 17.0, 23.0, 33.0, 28.0, 30.0, 43.0, 33.0, 40.0, 34.0, 42.0, 47.0, 35.0, 40.0, 40.0, 33.0, 41.0, 37.0, 39.0, 33.0, 28.0, 34.0, 25.0, 28.0, 22.0, 11.0, 21.0, 14.0, 8.0, 13.0, 13.0, 6.0, 4.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000335693359375, -0.0003247419372200966, -0.0003137905150651932, -0.00030283909291028976, -0.00029188767075538635, -0.00028093624860048294, -0.00026998482644557953, -0.0002590334042906761, -0.0002480819821357727, -0.0002371305599808693, -0.00022617913782596588, -0.00021522771567106247, -0.00020427629351615906, -0.00019332487136125565, -0.00018237344920635223, -0.00017142202705144882, -0.0001604706048965454, -0.000149519182741642, -0.00013856776058673859, -0.00012761633843183517, -0.00011666491627693176, -0.00010571349412202835, -9.476207196712494e-05, -8.381064981222153e-05, -7.285922765731812e-05, -6.19078055024147e-05, -5.095638334751129e-05, -4.000496119260788e-05, -2.9053539037704468e-05, -1.8102116882801056e-05, -7.150694727897644e-06, 3.800727427005768e-06, 1.475214958190918e-05, 2.570357173681259e-05, 3.6654993891716003e-05, 4.7606416046619415e-05, 5.855783820152283e-05, 6.950926035642624e-05, 8.046068251132965e-05, 9.141210466623306e-05, 0.00010236352682113647, 0.00011331494897603989, 0.0001242663711309433, 0.0001352177932858467, 0.00014616921544075012, 0.00015712063759565353, 0.00016807205975055695, 0.00017902348190546036, 0.00018997490406036377, 0.00020092632621526718, 0.0002118777483701706, 0.000222829170525074, 0.00023378059267997742, 0.00024473201483488083, 0.00025568343698978424, 0.00026663485914468765, 0.00027758628129959106, 0.0002885377034544945, 0.0002994891256093979, 0.0003104405477643013, 0.0003213919699192047, 0.0003323433920741081, 0.00034329481422901154, 0.00035424623638391495, 0.00036519765853881836]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 12.0, 7.0, 13.0, 12.0, 12.0, 13.0, 15.0, 18.0, 25.0, 25.0, 28.0, 23.0, 26.0, 41.0, 38.0, 35.0, 37.0, 42.0, 43.0, 51.0, 38.0, 36.0, 30.0, 38.0, 44.0, 27.0, 29.0, 32.0, 30.0, 26.0, 18.0, 21.0, 14.0, 14.0, 11.0, 6.0, 9.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.62109375, -4.46685791015625, -4.3126220703125, -4.15838623046875, -4.004150390625, -3.84991455078125, -3.6956787109375, -3.54144287109375, -3.38720703125, -3.23297119140625, -3.0787353515625, -2.92449951171875, -2.770263671875, -2.61602783203125, -2.4617919921875, -2.30755615234375, -2.1533203125, -1.99908447265625, -1.8448486328125, -1.69061279296875, -1.536376953125, -1.38214111328125, -1.2279052734375, -1.07366943359375, -0.91943359375, -0.76519775390625, -0.6109619140625, -0.45672607421875, -0.302490234375, -0.14825439453125, 0.0059814453125, 0.16021728515625, 0.314453125, 0.46868896484375, 0.6229248046875, 0.77716064453125, 0.931396484375, 1.08563232421875, 1.2398681640625, 1.39410400390625, 1.54833984375, 1.70257568359375, 1.8568115234375, 2.01104736328125, 2.165283203125, 2.31951904296875, 2.4737548828125, 2.62799072265625, 2.7822265625, 2.93646240234375, 3.0906982421875, 3.24493408203125, 3.399169921875, 3.55340576171875, 3.7076416015625, 3.86187744140625, 4.01611328125, 4.17034912109375, 4.3245849609375, 4.47882080078125, 4.633056640625, 4.78729248046875, 4.9415283203125, 5.09576416015625, 5.25]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 11.0, 13.0, 18.0, 21.0, 29.0, 29.0, 47.0, 40.0, 80.0, 88.0, 134.0, 177.0, 254.0, 378.0, 604.0, 1000.0, 1737.0, 3690.0, 8814.0, 25052.0, 98952.0, 542341.0, 282807.0, 54008.0, 15715.0, 5930.0, 2650.0, 1400.0, 817.0, 529.0, 326.0, 224.0, 173.0, 112.0, 76.0, 59.0, 52.0, 36.0, 28.0, 22.0, 16.0, 12.0, 5.0, 9.0, 4.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-8.890625, -8.6019287109375, -8.313232421875, -8.0245361328125, -7.73583984375, -7.4471435546875, -7.158447265625, -6.8697509765625, -6.5810546875, -6.2923583984375, -6.003662109375, -5.7149658203125, -5.42626953125, -5.1375732421875, -4.848876953125, -4.5601806640625, -4.271484375, -3.9827880859375, -3.694091796875, -3.4053955078125, -3.11669921875, -2.8280029296875, -2.539306640625, -2.2506103515625, -1.9619140625, -1.6732177734375, -1.384521484375, -1.0958251953125, -0.80712890625, -0.5184326171875, -0.229736328125, 0.0589599609375, 0.34765625, 0.6363525390625, 0.925048828125, 1.2137451171875, 1.50244140625, 1.7911376953125, 2.079833984375, 2.3685302734375, 2.6572265625, 2.9459228515625, 3.234619140625, 3.5233154296875, 3.81201171875, 4.1007080078125, 4.389404296875, 4.6781005859375, 4.966796875, 5.2554931640625, 5.544189453125, 5.8328857421875, 6.12158203125, 6.4102783203125, 6.698974609375, 6.9876708984375, 7.2763671875, 7.5650634765625, 7.853759765625, 8.1424560546875, 8.43115234375, 8.7198486328125, 9.008544921875, 9.2972412109375, 9.5859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 12.0, 9.0, 18.0, 14.0, 17.0, 22.0, 39.0, 41.0, 48.0, 61.0, 64.0, 86.0, 264.0, 1801.0, 151.0, 76.0, 52.0, 46.0, 39.0, 43.0, 29.0, 29.0, 16.0, 16.0, 15.0, 7.0, 11.0, 4.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.939208984375, -16.36279296875, -15.786376953125, -15.2099609375, -14.633544921875, -14.05712890625, -13.480712890625, -12.904296875, -12.327880859375, -11.75146484375, -11.175048828125, -10.5986328125, -10.022216796875, -9.44580078125, -8.869384765625, -8.29296875, -7.716552734375, -7.14013671875, -6.563720703125, -5.9873046875, -5.410888671875, -4.83447265625, -4.258056640625, -3.681640625, -3.105224609375, -2.52880859375, -1.952392578125, -1.3759765625, -0.799560546875, -0.22314453125, 0.353271484375, 0.9296875, 1.506103515625, 2.08251953125, 2.658935546875, 3.2353515625, 3.811767578125, 4.38818359375, 4.964599609375, 5.541015625, 6.117431640625, 6.69384765625, 7.270263671875, 7.8466796875, 8.423095703125, 8.99951171875, 9.575927734375, 10.15234375, 10.728759765625, 11.30517578125, 11.881591796875, 12.4580078125, 13.034423828125, 13.61083984375, 14.187255859375, 14.763671875, 15.340087890625, 15.91650390625, 16.492919921875, 17.0693359375, 17.645751953125, 18.22216796875, 18.798583984375, 19.375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 8.0, 9.0, 13.0, 16.0, 23.0, 24.0, 41.0, 48.0, 62.0, 113.0, 241.0, 540.0, 1557.0, 3074440.0, 66520.0, 1073.0, 440.0, 195.0, 96.0, 80.0, 38.0, 29.0, 25.0, 19.0, 12.0, 10.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.15625, -53.4775390625, -51.798828125, -50.1201171875, -48.44140625, -46.7626953125, -45.083984375, -43.4052734375, -41.7265625, -40.0478515625, -38.369140625, -36.6904296875, -35.01171875, -33.3330078125, -31.654296875, -29.9755859375, -28.296875, -26.6181640625, -24.939453125, -23.2607421875, -21.58203125, -19.9033203125, -18.224609375, -16.5458984375, -14.8671875, -13.1884765625, -11.509765625, -9.8310546875, -8.15234375, -6.4736328125, -4.794921875, -3.1162109375, -1.4375, 0.2412109375, 1.919921875, 3.5986328125, 5.27734375, 6.9560546875, 8.634765625, 10.3134765625, 11.9921875, 13.6708984375, 15.349609375, 17.0283203125, 18.70703125, 20.3857421875, 22.064453125, 23.7431640625, 25.421875, 27.1005859375, 28.779296875, 30.4580078125, 32.13671875, 33.8154296875, 35.494140625, 37.1728515625, 38.8515625, 40.5302734375, 42.208984375, 43.8876953125, 45.56640625, 47.2451171875, 48.923828125, 50.6025390625, 52.28125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 84.0, 550.0, 348.0, 28.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-89.81062316894531, -87.4964828491211, -85.18234252929688, -82.86819458007812, -80.5540542602539, -78.23991394042969, -75.92576599121094, -73.61162567138672, -71.2974853515625, -68.98334503173828, -66.66920471191406, -64.35505676269531, -62.040916442871094, -59.726776123046875, -57.41263198852539, -55.098487854003906, -52.78434753417969, -50.47020721435547, -48.156063079833984, -45.8419189453125, -43.52777862548828, -41.21363830566406, -38.89949417114258, -36.585350036621094, -34.271209716796875, -31.957067489624023, -29.642925262451172, -27.32878303527832, -25.01464080810547, -22.700498580932617, -20.386356353759766, -18.072214126586914, -15.758068084716797, -13.443925857543945, -11.129783630371094, -8.815641403198242, -6.501499176025391, -4.187356948852539, -1.8732147216796875, 0.44092750549316406, 2.7550697326660156, 5.069211959838867, 7.383354187011719, 9.69749641418457, 12.011638641357422, 14.325780868530273, 16.639923095703125, 18.954065322875977, 21.268207550048828, 23.58234977722168, 25.89649200439453, 28.210634231567383, 30.524776458740234, 32.83892059326172, 35.15306091308594, 37.467201232910156, 39.78134536743164, 42.095489501953125, 44.409629821777344, 46.72377014160156, 49.03791427612305, 51.35205841064453, 53.66619873046875, 55.98033905029297, 58.29448318481445]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 8.0, 10.0, 6.0, 9.0, 26.0, 16.0, 17.0, 18.0, 24.0, 29.0, 34.0, 27.0, 23.0, 36.0, 35.0, 39.0, 34.0, 52.0, 53.0, 36.0, 51.0, 50.0, 43.0, 36.0, 29.0, 37.0, 26.0, 33.0, 25.0, 19.0, 22.0, 11.0, 13.0, 4.0, 17.0, 7.0, 4.0, 11.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-33.075252532958984, -32.07883834838867, -31.08242416381836, -30.086009979248047, -29.089595794677734, -28.093181610107422, -27.096765518188477, -26.100351333618164, -25.10393714904785, -24.10752296447754, -23.111108779907227, -22.114694595336914, -21.11827850341797, -20.121864318847656, -19.125450134277344, -18.12903594970703, -17.13262176513672, -16.136207580566406, -15.139793395996094, -14.143378257751465, -13.146964073181152, -12.15054988861084, -11.154134750366211, -10.157720565795898, -9.161306381225586, -8.164892196655273, -7.168477535247803, -6.172062873840332, -5.1756486892700195, -4.179234504699707, -3.1828198432922363, -2.1864051818847656, -1.1899909973144531, -0.19357657432556152, 0.8028378486633301, 1.7992522716522217, 2.7956666946411133, 3.792080879211426, 4.7884955406188965, 5.784910202026367, 6.78132438659668, 7.777738571166992, 8.774152755737305, 9.770567893981934, 10.766982078552246, 11.763396263122559, 12.759811401367188, 13.7562255859375, 14.752639770507812, 15.749053955078125, 16.745468139648438, 17.74188232421875, 18.738296508789062, 19.734710693359375, 20.73112678527832, 21.727540969848633, 22.723955154418945, 23.720369338989258, 24.71678352355957, 25.713197708129883, 26.709613800048828, 27.70602798461914, 28.702442169189453, 29.698856353759766, 30.695270538330078]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 3.0, 13.0, 7.0, 7.0, 14.0, 10.0, 9.0, 17.0, 19.0, 19.0, 26.0, 21.0, 22.0, 34.0, 38.0, 49.0, 42.0, 51.0, 37.0, 40.0, 56.0, 48.0, 39.0, 33.0, 37.0, 47.0, 32.0, 29.0, 29.0, 32.0, 22.0, 18.0, 19.0, 18.0, 8.0, 9.0, 11.0, 13.0, 2.0, 4.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.880859375, -5.6796875, -5.478515625, -5.27734375, -5.076171875, -4.875, -4.673828125, -4.47265625, -4.271484375, -4.0703125, -3.869140625, -3.66796875, -3.466796875, -3.265625, -3.064453125, -2.86328125, -2.662109375, -2.4609375, -2.259765625, -2.05859375, -1.857421875, -1.65625, -1.455078125, -1.25390625, -1.052734375, -0.8515625, -0.650390625, -0.44921875, -0.248046875, -0.046875, 0.154296875, 0.35546875, 0.556640625, 0.7578125, 0.958984375, 1.16015625, 1.361328125, 1.5625, 1.763671875, 1.96484375, 2.166015625, 2.3671875, 2.568359375, 2.76953125, 2.970703125, 3.171875, 3.373046875, 3.57421875, 3.775390625, 3.9765625, 4.177734375, 4.37890625, 4.580078125, 4.78125, 4.982421875, 5.18359375, 5.384765625, 5.5859375, 5.787109375, 5.98828125, 6.189453125, 6.390625, 6.591796875, 6.79296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 12.0, 16.0, 21.0, 27.0, 34.0, 35.0, 44.0, 66.0, 54.0, 94.0, 74.0, 122.0, 175.0, 216.0, 319.0, 489.0, 900.0, 2054.0, 14125.0, 2930471.0, 1233033.0, 7681.0, 1772.0, 719.0, 436.0, 288.0, 241.0, 166.0, 119.0, 82.0, 59.0, 57.0, 46.0, 44.0, 36.0, 31.0, 19.0, 20.0, 14.0, 17.0, 12.0, 8.0, 10.0, 7.0, 0.0, 1.0, 4.0, 2.0], "bins": [-44.8125, -43.56396484375, -42.3154296875, -41.06689453125, -39.818359375, -38.56982421875, -37.3212890625, -36.07275390625, -34.82421875, -33.57568359375, -32.3271484375, -31.07861328125, -29.830078125, -28.58154296875, -27.3330078125, -26.08447265625, -24.8359375, -23.58740234375, -22.3388671875, -21.09033203125, -19.841796875, -18.59326171875, -17.3447265625, -16.09619140625, -14.84765625, -13.59912109375, -12.3505859375, -11.10205078125, -9.853515625, -8.60498046875, -7.3564453125, -6.10791015625, -4.859375, -3.61083984375, -2.3623046875, -1.11376953125, 0.134765625, 1.38330078125, 2.6318359375, 3.88037109375, 5.12890625, 6.37744140625, 7.6259765625, 8.87451171875, 10.123046875, 11.37158203125, 12.6201171875, 13.86865234375, 15.1171875, 16.36572265625, 17.6142578125, 18.86279296875, 20.111328125, 21.35986328125, 22.6083984375, 23.85693359375, 25.10546875, 26.35400390625, 27.6025390625, 28.85107421875, 30.099609375, 31.34814453125, 32.5966796875, 33.84521484375, 35.09375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 12.0, 21.0, 23.0, 56.0, 82.0, 186.0, 375.0, 685.0, 951.0, 729.0, 428.0, 237.0, 114.0, 58.0, 45.0, 18.0, 10.0, 8.0, 7.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3515625, -12.8302001953125, -12.308837890625, -11.7874755859375, -11.26611328125, -10.7447509765625, -10.223388671875, -9.7020263671875, -9.1806640625, -8.6593017578125, -8.137939453125, -7.6165771484375, -7.09521484375, -6.5738525390625, -6.052490234375, -5.5311279296875, -5.009765625, -4.4884033203125, -3.967041015625, -3.4456787109375, -2.92431640625, -2.4029541015625, -1.881591796875, -1.3602294921875, -0.8388671875, -0.3175048828125, 0.203857421875, 0.7252197265625, 1.24658203125, 1.7679443359375, 2.289306640625, 2.8106689453125, 3.33203125, 3.8533935546875, 4.374755859375, 4.8961181640625, 5.41748046875, 5.9388427734375, 6.460205078125, 6.9815673828125, 7.5029296875, 8.0242919921875, 8.545654296875, 9.0670166015625, 9.58837890625, 10.1097412109375, 10.631103515625, 11.1524658203125, 11.673828125, 12.1951904296875, 12.716552734375, 13.2379150390625, 13.75927734375, 14.2806396484375, 14.802001953125, 15.3233642578125, 15.8447265625, 16.3660888671875, 16.887451171875, 17.4088134765625, 17.93017578125, 18.4515380859375, 18.972900390625, 19.4942626953125, 20.015625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 17.0, 24.0, 50.0, 120.0, 186.0, 492.0, 1762.0, 10817.0, 349651.0, 3759685.0, 64873.0, 4799.0, 1037.0, 373.0, 138.0, 93.0, 63.0, 25.0, 12.0, 4.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.5625, -20.80078125, -20.0390625, -19.27734375, -18.515625, -17.75390625, -16.9921875, -16.23046875, -15.46875, -14.70703125, -13.9453125, -13.18359375, -12.421875, -11.66015625, -10.8984375, -10.13671875, -9.375, -8.61328125, -7.8515625, -7.08984375, -6.328125, -5.56640625, -4.8046875, -4.04296875, -3.28125, -2.51953125, -1.7578125, -0.99609375, -0.234375, 0.52734375, 1.2890625, 2.05078125, 2.8125, 3.57421875, 4.3359375, 5.09765625, 5.859375, 6.62109375, 7.3828125, 8.14453125, 8.90625, 9.66796875, 10.4296875, 11.19140625, 11.953125, 12.71484375, 13.4765625, 14.23828125, 15.0, 15.76171875, 16.5234375, 17.28515625, 18.046875, 18.80859375, 19.5703125, 20.33203125, 21.09375, 21.85546875, 22.6171875, 23.37890625, 24.140625, 24.90234375, 25.6640625, 26.42578125, 27.1875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 2.0, 9.0, 13.0, 23.0, 32.0, 52.0, 106.0, 143.0, 145.0, 113.0, 135.0, 86.0, 52.0, 34.0, 26.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.99544525146484, -69.30860900878906, -66.62176513671875, -63.93492889404297, -61.24809265136719, -58.561256408691406, -55.87441635131836, -53.18757629394531, -50.50074005126953, -47.81390380859375, -45.1270637512207, -42.440223693847656, -39.753387451171875, -37.066551208496094, -34.37971115112305, -31.692873001098633, -29.00603485107422, -26.319196701049805, -23.63235855102539, -20.945520401000977, -18.258682250976562, -15.571844100952148, -12.885005950927734, -10.19816780090332, -7.511329650878906, -4.824491500854492, -2.137653350830078, 0.5491847991943359, 3.23602294921875, 5.922861099243164, 8.609699249267578, 11.296537399291992, 13.983367919921875, 16.67020606994629, 19.357044219970703, 22.043882369995117, 24.73072052001953, 27.417558670043945, 30.10439682006836, 32.791236877441406, 35.47807312011719, 38.16490936279297, 40.851749420166016, 43.53858947753906, 46.225425720214844, 48.912261962890625, 51.59910202026367, 54.28594207763672, 56.9727783203125, 59.65961456298828, 62.34645462036133, 65.03329467773438, 67.72013092041016, 70.40696716308594, 73.09381103515625, 75.78064727783203, 78.46748352050781, 81.1543197631836, 83.84115600585938, 86.52799987792969, 89.21483612060547, 91.90167236328125, 94.58851623535156, 97.27535247802734, 99.96218872070312]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 8.0, 9.0, 11.0, 16.0, 17.0, 20.0, 16.0, 21.0, 25.0, 32.0, 27.0, 41.0, 31.0, 44.0, 39.0, 40.0, 38.0, 39.0, 48.0, 41.0, 36.0, 34.0, 40.0, 33.0, 34.0, 35.0, 25.0, 28.0, 24.0, 30.0, 14.0, 17.0, 20.0, 10.0, 6.0, 6.0, 10.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.24128723144531, -31.13075065612793, -30.020212173461914, -28.90967559814453, -27.799137115478516, -26.688600540161133, -25.57806396484375, -24.467525482177734, -23.35698890686035, -22.24645233154297, -21.135913848876953, -20.02537727355957, -18.914840698242188, -17.804302215576172, -16.69376564025879, -15.58322811126709, -14.47269058227539, -13.362153053283691, -12.251615524291992, -11.14107894897461, -10.03054141998291, -8.920003890991211, -7.80946683883667, -6.698929786682129, -5.58839225769043, -4.4778547286987305, -3.3673176765441895, -2.2567803859710693, -1.1462430953979492, -0.03570556640625, 1.074831485748291, 2.185368537902832, 3.2959060668945312, 4.4064435958862305, 5.5169806480407715, 6.6275177001953125, 7.738055229187012, 8.848592758178711, 9.959129333496094, 11.069666862487793, 12.180204391479492, 13.290741920471191, 14.40127944946289, 15.511816024780273, 16.622352600097656, 17.732891082763672, 18.843427658081055, 19.953964233398438, 21.064502716064453, 22.175039291381836, 23.28557777404785, 24.396114349365234, 25.50665283203125, 26.617189407348633, 27.727725982666016, 28.83826446533203, 29.948801040649414, 31.059337615966797, 32.16987609863281, 33.28041458129883, 34.39094924926758, 35.501487731933594, 36.61202621459961, 37.72256088256836, 38.833099365234375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 11.0, 22.0, 16.0, 23.0, 30.0, 23.0, 24.0, 39.0, 35.0, 38.0, 36.0, 53.0, 39.0, 50.0, 39.0, 41.0, 44.0, 40.0, 40.0, 28.0, 43.0, 30.0, 34.0, 29.0, 23.0, 16.0, 28.0, 12.0, 15.0, 11.0, 8.0, 10.0, 10.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.60986328125, -45.8759765625, -44.14208984375, -42.408203125, -40.67431640625, -38.9404296875, -37.20654296875, -35.47265625, -33.73876953125, -32.0048828125, -30.27099609375, -28.537109375, -26.80322265625, -25.0693359375, -23.33544921875, -21.6015625, -19.86767578125, -18.1337890625, -16.39990234375, -14.666015625, -12.93212890625, -11.1982421875, -9.46435546875, -7.73046875, -5.99658203125, -4.2626953125, -2.52880859375, -0.794921875, 0.93896484375, 2.6728515625, 4.40673828125, 6.140625, 7.87451171875, 9.6083984375, 11.34228515625, 13.076171875, 14.81005859375, 16.5439453125, 18.27783203125, 20.01171875, 21.74560546875, 23.4794921875, 25.21337890625, 26.947265625, 28.68115234375, 30.4150390625, 32.14892578125, 33.8828125, 35.61669921875, 37.3505859375, 39.08447265625, 40.818359375, 42.55224609375, 44.2861328125, 46.02001953125, 47.75390625, 49.48779296875, 51.2216796875, 52.95556640625, 54.689453125, 56.42333984375, 58.1572265625, 59.89111328125, 61.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 11.0, 16.0, 21.0, 21.0, 24.0, 46.0, 80.0, 86.0, 150.0, 246.0, 498.0, 788.0, 1433.0, 2427.0, 4171.0, 7434.0, 13343.0, 25150.0, 48245.0, 95708.0, 194768.0, 303926.0, 172069.0, 84490.0, 42984.0, 22600.0, 12007.0, 6716.0, 3771.0, 2179.0, 1328.0, 691.0, 438.0, 260.0, 142.0, 96.0, 75.0, 38.0, 27.0, 11.0, 13.0, 9.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -10.120361328125, -9.76416015625, -9.407958984375, -9.0517578125, -8.695556640625, -8.33935546875, -7.983154296875, -7.626953125, -7.270751953125, -6.91455078125, -6.558349609375, -6.2021484375, -5.845947265625, -5.48974609375, -5.133544921875, -4.77734375, -4.421142578125, -4.06494140625, -3.708740234375, -3.3525390625, -2.996337890625, -2.64013671875, -2.283935546875, -1.927734375, -1.571533203125, -1.21533203125, -0.859130859375, -0.5029296875, -0.146728515625, 0.20947265625, 0.565673828125, 0.921875, 1.278076171875, 1.63427734375, 1.990478515625, 2.3466796875, 2.702880859375, 3.05908203125, 3.415283203125, 3.771484375, 4.127685546875, 4.48388671875, 4.840087890625, 5.1962890625, 5.552490234375, 5.90869140625, 6.264892578125, 6.62109375, 6.977294921875, 7.33349609375, 7.689697265625, 8.0458984375, 8.402099609375, 8.75830078125, 9.114501953125, 9.470703125, 9.826904296875, 10.18310546875, 10.539306640625, 10.8955078125, 11.251708984375, 11.60791015625, 11.964111328125, 12.3203125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 14.0, 16.0, 18.0, 12.0, 21.0, 26.0, 20.0, 31.0, 24.0, 27.0, 37.0, 40.0, 31.0, 34.0, 41.0, 39.0, 1070.0, 31.0, 46.0, 42.0, 40.0, 32.0, 32.0, 33.0, 28.0, 31.0, 21.0, 31.0, 20.0, 15.0, 17.0, 11.0, 10.0, 12.0, 7.0, 11.0, 7.0, 6.0, 7.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.59375, -33.569580078125, -32.54541015625, -31.521240234375, -30.4970703125, -29.472900390625, -28.44873046875, -27.424560546875, -26.400390625, -25.376220703125, -24.35205078125, -23.327880859375, -22.3037109375, -21.279541015625, -20.25537109375, -19.231201171875, -18.20703125, -17.182861328125, -16.15869140625, -15.134521484375, -14.1103515625, -13.086181640625, -12.06201171875, -11.037841796875, -10.013671875, -8.989501953125, -7.96533203125, -6.941162109375, -5.9169921875, -4.892822265625, -3.86865234375, -2.844482421875, -1.8203125, -0.796142578125, 0.22802734375, 1.252197265625, 2.2763671875, 3.300537109375, 4.32470703125, 5.348876953125, 6.373046875, 7.397216796875, 8.42138671875, 9.445556640625, 10.4697265625, 11.493896484375, 12.51806640625, 13.542236328125, 14.56640625, 15.590576171875, 16.61474609375, 17.638916015625, 18.6630859375, 19.687255859375, 20.71142578125, 21.735595703125, 22.759765625, 23.783935546875, 24.80810546875, 25.832275390625, 26.8564453125, 27.880615234375, 28.90478515625, 29.928955078125, 30.953125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 6.0, 13.0, 19.0, 28.0, 50.0, 69.0, 116.0, 148.0, 224.0, 368.0, 489.0, 856.0, 1244.0, 1912.0, 2789.0, 4096.0, 6190.0, 9393.0, 14672.0, 22080.0, 33854.0, 52633.0, 82189.0, 134749.0, 1268514.0, 171920.0, 103131.0, 64621.0, 41634.0, 26906.0, 17779.0, 11482.0, 7640.0, 5130.0, 3435.0, 2298.0, 1526.0, 1003.0, 657.0, 422.0, 300.0, 201.0, 112.0, 66.0, 69.0, 35.0, 20.0, 18.0, 8.0, 7.0, 7.0, 4.0, 0.0, 2.0, 1.0], "bins": [-7.8984375, -7.664306640625, -7.43017578125, -7.196044921875, -6.9619140625, -6.727783203125, -6.49365234375, -6.259521484375, -6.025390625, -5.791259765625, -5.55712890625, -5.322998046875, -5.0888671875, -4.854736328125, -4.62060546875, -4.386474609375, -4.15234375, -3.918212890625, -3.68408203125, -3.449951171875, -3.2158203125, -2.981689453125, -2.74755859375, -2.513427734375, -2.279296875, -2.045166015625, -1.81103515625, -1.576904296875, -1.3427734375, -1.108642578125, -0.87451171875, -0.640380859375, -0.40625, -0.172119140625, 0.06201171875, 0.296142578125, 0.5302734375, 0.764404296875, 0.99853515625, 1.232666015625, 1.466796875, 1.700927734375, 1.93505859375, 2.169189453125, 2.4033203125, 2.637451171875, 2.87158203125, 3.105712890625, 3.33984375, 3.573974609375, 3.80810546875, 4.042236328125, 4.2763671875, 4.510498046875, 4.74462890625, 4.978759765625, 5.212890625, 5.447021484375, 5.68115234375, 5.915283203125, 6.1494140625, 6.383544921875, 6.61767578125, 6.851806640625, 7.0859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 7.0, 9.0, 18.0, 15.0, 12.0, 19.0, 26.0, 31.0, 29.0, 38.0, 36.0, 36.0, 44.0, 56.0, 55.0, 72.0, 69.0, 56.0, 49.0, 38.0, 51.0, 34.0, 31.0, 30.0, 23.0, 18.0, 19.0, 22.0, 9.0, 10.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007305145263671875, -0.007081449031829834, -0.006857752799987793, -0.006634056568145752, -0.006410360336303711, -0.00618666410446167, -0.005962967872619629, -0.005739271640777588, -0.005515575408935547, -0.005291879177093506, -0.005068182945251465, -0.004844486713409424, -0.004620790481567383, -0.004397094249725342, -0.004173398017883301, -0.00394970178604126, -0.0037260055541992188, -0.0035023093223571777, -0.0032786130905151367, -0.0030549168586730957, -0.0028312206268310547, -0.0026075243949890137, -0.0023838281631469727, -0.0021601319313049316, -0.0019364356994628906, -0.0017127394676208496, -0.0014890432357788086, -0.0012653470039367676, -0.0010416507720947266, -0.0008179545402526855, -0.0005942583084106445, -0.0003705620765686035, -0.0001468658447265625, 7.683038711547852e-05, 0.00030052661895751953, 0.0005242228507995605, 0.0007479190826416016, 0.0009716153144836426, 0.0011953115463256836, 0.0014190077781677246, 0.0016427040100097656, 0.0018664002418518066, 0.0020900964736938477, 0.0023137927055358887, 0.0025374889373779297, 0.0027611851692199707, 0.0029848814010620117, 0.0032085776329040527, 0.0034322738647460938, 0.0036559700965881348, 0.0038796663284301758, 0.004103362560272217, 0.004327058792114258, 0.004550755023956299, 0.00477445125579834, 0.004998147487640381, 0.005221843719482422, 0.005445539951324463, 0.005669236183166504, 0.005892932415008545, 0.006116628646850586, 0.006340324878692627, 0.006564021110534668, 0.006787717342376709, 0.00701141357421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 16.0, 15.0, 13.0, 24.0, 26.0, 40.0, 66.0, 77.0, 108.0, 175.0, 252.0, 385.0, 634.0, 1109.0, 2881.0, 10136.0, 50185.0, 340683.0, 533954.0, 85041.0, 15307.0, 3879.0, 1479.0, 696.0, 402.0, 262.0, 203.0, 141.0, 100.0, 71.0, 55.0, 29.0, 23.0, 19.0, 20.0, 8.0, 6.0, 8.0, 7.0, 0.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.056182861328125, -0.05448770523071289, -0.05279254913330078, -0.05109739303588867, -0.04940223693847656, -0.04770708084106445, -0.046011924743652344, -0.044316768646240234, -0.042621612548828125, -0.040926456451416016, -0.039231300354003906, -0.0375361442565918, -0.03584098815917969, -0.03414583206176758, -0.03245067596435547, -0.03075551986694336, -0.02906036376953125, -0.02736520767211914, -0.02567005157470703, -0.023974895477294922, -0.022279739379882812, -0.020584583282470703, -0.018889427185058594, -0.017194271087646484, -0.015499114990234375, -0.013803958892822266, -0.012108802795410156, -0.010413646697998047, -0.008718490600585938, -0.007023334503173828, -0.005328178405761719, -0.0036330223083496094, -0.0019378662109375, -0.00024271011352539062, 0.0014524459838867188, 0.003147602081298828, 0.0048427581787109375, 0.006537914276123047, 0.008233070373535156, 0.009928226470947266, 0.011623382568359375, 0.013318538665771484, 0.015013694763183594, 0.016708850860595703, 0.018404006958007812, 0.020099163055419922, 0.02179431915283203, 0.02348947525024414, 0.02518463134765625, 0.02687978744506836, 0.02857494354248047, 0.030270099639892578, 0.03196525573730469, 0.0336604118347168, 0.035355567932128906, 0.037050724029541016, 0.038745880126953125, 0.040441036224365234, 0.042136192321777344, 0.04383134841918945, 0.04552650451660156, 0.04722166061401367, 0.04891681671142578, 0.05061197280883789, 0.05230712890625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 14.0, 16.0, 25.0, 51.0, 95.0, 139.0, 170.0, 173.0, 139.0, 74.0, 56.0, 28.0, 13.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.014539824798703194, -0.014208639971911907, -0.013877456076443195, -0.013546271249651909, -0.013215087354183197, -0.01288390252739191, -0.012552717700600624, -0.012221533805131912, -0.0118903499096632, -0.011559165082871914, -0.011227981187403202, -0.010896796360611916, -0.010565612465143204, -0.010234427638351917, -0.00990324281156063, -0.009572058916091919, -0.009240874089300632, -0.008909689262509346, -0.008578505367040634, -0.008247320540249348, -0.007916136644780636, -0.007584951817989349, -0.00725376745685935, -0.006922583095729351, -0.006591398734599352, -0.006260214373469353, -0.0059290300123393536, -0.005597845651209354, -0.005266660824418068, -0.004935476928949356, -0.00460429210215807, -0.0042731077410280704, -0.003941923845559359, -0.0036107394844293594, -0.0032795551232993603, -0.0029483705293387175, -0.0026171861682087183, -0.002286001807078719, -0.0019548172131180763, -0.0016236328519880772, -0.001292448490858078, -0.0009612640715204179, -0.0006300796521827579, -0.00029889517463743687, 3.2289186492562294e-05, 0.00036347354762256145, 0.0006946581415832043, 0.0010258425027132034, 0.0013570268638432026, 0.0016882112249732018, 0.002019395586103201, 0.0023505801800638437, 0.002681764541193843, 0.003012948902323842, 0.003344133496284485, 0.003675317857414484, 0.004006502218544483, 0.004337686579674482, 0.0046688709408044815, 0.005000055767595768, 0.00533123966306448, 0.005662424489855766, 0.0059936088509857655, 0.006324793212115765, 0.006655977573245764]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 4.0, 5.0, 10.0, 9.0, 13.0, 11.0, 20.0, 20.0, 22.0, 26.0, 29.0, 19.0, 30.0, 25.0, 40.0, 23.0, 33.0, 31.0, 40.0, 53.0, 41.0, 40.0, 46.0, 28.0, 37.0, 28.0, 31.0, 32.0, 31.0, 29.0, 20.0, 28.0, 19.0, 20.0, 14.0, 17.0, 10.0, 17.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.003273904323577881, -0.003166566602885723, -0.0030592288821935654, -0.0029518911615014076, -0.00284455344080925, -0.002737215720117092, -0.0026298779994249344, -0.0025225402787327766, -0.002415202558040619, -0.002307864837348461, -0.0022005271166563034, -0.0020931893959641457, -0.001985851675271988, -0.0018785139545798302, -0.0017711762338876724, -0.0016638385131955147, -0.001556500792503357, -0.0014491630718111992, -0.0013418253511190414, -0.0012344876304268837, -0.001127149909734726, -0.0010198121890425682, -0.0009124744683504105, -0.0008051367476582527, -0.000697799026966095, -0.0005904613062739372, -0.0004831235855817795, -0.00037578586488962173, -0.000268448144197464, -0.00016111042350530624, -5.37727028131485e-05, 5.356501787900925e-05, 0.000160902738571167, 0.00026824045926332474, 0.0003755781799554825, 0.00048291590064764023, 0.000590253621339798, 0.0006975913420319557, 0.0008049290627241135, 0.0009122667834162712, 0.001019604504108429, 0.0011269422248005867, 0.0012342799454927444, 0.0013416176661849022, 0.00144895538687706, 0.0015562931075692177, 0.0016636308282613754, 0.0017709685489535332, 0.001878306269645691, 0.0019856439903378487, 0.0020929817110300064, 0.002200319431722164, 0.002307657152414322, 0.0024149948731064796, 0.0025223325937986374, 0.002629670314490795, 0.002737008035182953, 0.0028443457558751106, 0.0029516834765672684, 0.003059021197259426, 0.003166358917951584, 0.0032736966386437416, 0.0033810343593358994, 0.003488372080028057, 0.003595709800720215]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 11.0, 22.0, 16.0, 23.0, 30.0, 24.0, 23.0, 39.0, 34.0, 39.0, 36.0, 53.0, 40.0, 49.0, 39.0, 44.0, 41.0, 40.0, 40.0, 28.0, 43.0, 30.0, 34.0, 29.0, 23.0, 18.0, 26.0, 12.0, 15.0, 11.0, 8.0, 10.0, 10.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.609375, -45.875, -44.140625, -42.40625, -40.671875, -38.9375, -37.203125, -35.46875, -33.734375, -32.0, -30.265625, -28.53125, -26.796875, -25.0625, -23.328125, -21.59375, -19.859375, -18.125, -16.390625, -14.65625, -12.921875, -11.1875, -9.453125, -7.71875, -5.984375, -4.25, -2.515625, -0.78125, 0.953125, 2.6875, 4.421875, 6.15625, 7.890625, 9.625, 11.359375, 13.09375, 14.828125, 16.5625, 18.296875, 20.03125, 21.765625, 23.5, 25.234375, 26.96875, 28.703125, 30.4375, 32.171875, 33.90625, 35.640625, 37.375, 39.109375, 40.84375, 42.578125, 44.3125, 46.046875, 47.78125, 49.515625, 51.25, 52.984375, 54.71875, 56.453125, 58.1875, 59.921875, 61.65625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 11.0, 21.0, 22.0, 18.0, 33.0, 48.0, 76.0, 107.0, 167.0, 266.0, 498.0, 890.0, 1829.0, 3895.0, 9665.0, 35704.0, 241512.0, 621348.0, 100866.0, 19355.0, 6368.0, 2755.0, 1337.0, 704.0, 411.0, 196.0, 132.0, 88.0, 52.0, 45.0, 34.0, 22.0, 22.0, 18.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8828125, -13.3338623046875, -12.784912109375, -12.2359619140625, -11.68701171875, -11.1380615234375, -10.589111328125, -10.0401611328125, -9.4912109375, -8.9422607421875, -8.393310546875, -7.8443603515625, -7.29541015625, -6.7464599609375, -6.197509765625, -5.6485595703125, -5.099609375, -4.5506591796875, -4.001708984375, -3.4527587890625, -2.90380859375, -2.3548583984375, -1.805908203125, -1.2569580078125, -0.7080078125, -0.1590576171875, 0.389892578125, 0.9388427734375, 1.48779296875, 2.0367431640625, 2.585693359375, 3.1346435546875, 3.68359375, 4.2325439453125, 4.781494140625, 5.3304443359375, 5.87939453125, 6.4283447265625, 6.977294921875, 7.5262451171875, 8.0751953125, 8.6241455078125, 9.173095703125, 9.7220458984375, 10.27099609375, 10.8199462890625, 11.368896484375, 11.9178466796875, 12.466796875, 13.0157470703125, 13.564697265625, 14.1136474609375, 14.66259765625, 15.2115478515625, 15.760498046875, 16.3094482421875, 16.8583984375, 17.4073486328125, 17.956298828125, 18.5052490234375, 19.05419921875, 19.6031494140625, 20.152099609375, 20.7010498046875, 21.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 11.0, 14.0, 28.0, 28.0, 36.0, 48.0, 70.0, 103.0, 101.0, 2147.0, 107.0, 80.0, 84.0, 54.0, 41.0, 32.0, 24.0, 11.0, 11.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-162.5, -157.533203125, -152.56640625, -147.599609375, -142.6328125, -137.666015625, -132.69921875, -127.732421875, -122.765625, -117.798828125, -112.83203125, -107.865234375, -102.8984375, -97.931640625, -92.96484375, -87.998046875, -83.03125, -78.064453125, -73.09765625, -68.130859375, -63.1640625, -58.197265625, -53.23046875, -48.263671875, -43.296875, -38.330078125, -33.36328125, -28.396484375, -23.4296875, -18.462890625, -13.49609375, -8.529296875, -3.5625, 1.404296875, 6.37109375, 11.337890625, 16.3046875, 21.271484375, 26.23828125, 31.205078125, 36.171875, 41.138671875, 46.10546875, 51.072265625, 56.0390625, 61.005859375, 65.97265625, 70.939453125, 75.90625, 80.873046875, 85.83984375, 90.806640625, 95.7734375, 100.740234375, 105.70703125, 110.673828125, 115.640625, 120.607421875, 125.57421875, 130.541015625, 135.5078125, 140.474609375, 145.44140625, 150.408203125, 155.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 7.0, 12.0, 23.0, 33.0, 53.0, 72.0, 104.0, 248.0, 590.0, 1407.0, 5013.0, 162847.0, 2955788.0, 15637.0, 2225.0, 850.0, 357.0, 156.0, 91.0, 60.0, 37.0, 32.0, 18.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.84375, -39.6142578125, -38.384765625, -37.1552734375, -35.92578125, -34.6962890625, -33.466796875, -32.2373046875, -31.0078125, -29.7783203125, -28.548828125, -27.3193359375, -26.08984375, -24.8603515625, -23.630859375, -22.4013671875, -21.171875, -19.9423828125, -18.712890625, -17.4833984375, -16.25390625, -15.0244140625, -13.794921875, -12.5654296875, -11.3359375, -10.1064453125, -8.876953125, -7.6474609375, -6.41796875, -5.1884765625, -3.958984375, -2.7294921875, -1.5, -0.2705078125, 0.958984375, 2.1884765625, 3.41796875, 4.6474609375, 5.876953125, 7.1064453125, 8.3359375, 9.5654296875, 10.794921875, 12.0244140625, 13.25390625, 14.4833984375, 15.712890625, 16.9423828125, 18.171875, 19.4013671875, 20.630859375, 21.8603515625, 23.08984375, 24.3193359375, 25.548828125, 26.7783203125, 28.0078125, 29.2373046875, 30.466796875, 31.6962890625, 32.92578125, 34.1552734375, 35.384765625, 36.6142578125, 37.84375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 16.0, 37.0, 70.0, 194.0, 354.0, 196.0, 67.0, 32.0, 10.0, 12.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.33833312988281, -79.69783020019531, -72.05732727050781, -64.41683197021484, -56.776329040527344, -49.135826110839844, -41.49532699584961, -33.854827880859375, -26.214324951171875, -18.573823928833008, -10.93332290649414, -3.2928218841552734, 4.347679138183594, 11.988182067871094, 19.628681182861328, 27.269180297851562, 34.90968322753906, 42.55018615722656, 50.1906852722168, 57.83118438720703, 65.47168731689453, 73.11219024658203, 80.752685546875, 88.3931884765625, 96.03369140625, 103.6741943359375, 111.314697265625, 118.95519256591797, 126.59569549560547, 134.2362060546875, 141.87669372558594, 149.51719665527344, 157.15768432617188, 164.79818725585938, 172.43869018554688, 180.07919311523438, 187.71969604492188, 195.36019897460938, 203.0006866455078, 210.6411895751953, 218.2816925048828, 225.9221954345703, 233.5626983642578, 241.2032012939453, 248.84368896484375, 256.48419189453125, 264.12469482421875, 271.76519775390625, 279.40570068359375, 287.04620361328125, 294.68670654296875, 302.32720947265625, 309.96771240234375, 317.60821533203125, 325.24871826171875, 332.88922119140625, 340.52972412109375, 348.17022705078125, 355.81072998046875, 363.45123291015625, 371.09173583984375, 378.73223876953125, 386.37274169921875, 394.01324462890625, 401.6537170410156]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 11.0, 8.0, 5.0, 7.0, 14.0, 16.0, 17.0, 17.0, 18.0, 22.0, 17.0, 37.0, 40.0, 39.0, 52.0, 50.0, 40.0, 52.0, 54.0, 49.0, 33.0, 37.0, 47.0, 52.0, 34.0, 28.0, 32.0, 27.0, 20.0, 20.0, 17.0, 14.0, 10.0, 7.0, 9.0, 11.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-96.98023986816406, -93.855224609375, -90.73020935058594, -87.60519409179688, -84.48017120361328, -81.35515594482422, -78.23014068603516, -75.1051254272461, -71.98011016845703, -68.85509490966797, -65.7300796508789, -62.60506057739258, -59.480045318603516, -56.35502624511719, -53.230010986328125, -50.10499572753906, -46.979976654052734, -43.85496139526367, -40.729942321777344, -37.60492706298828, -34.47991180419922, -31.354894638061523, -28.229877471923828, -25.104862213134766, -21.97984504699707, -18.854827880859375, -15.729812622070312, -12.604795455932617, -9.479779243469238, -6.354763031005859, -3.229745864868164, -0.10473060607910156, 3.0202865600585938, 6.145302772521973, 9.270318984985352, 12.395336151123047, 15.520352363586426, 18.645368576049805, 21.7703857421875, 24.895401000976562, 28.020418167114258, 31.145435333251953, 34.270450592041016, 37.395469665527344, 40.520484924316406, 43.64550018310547, 46.77051544189453, 49.895530700683594, 53.02054977416992, 56.145565032958984, 59.27058410644531, 62.395599365234375, 65.52061462402344, 68.6456298828125, 71.77064514160156, 74.89566040039062, 78.02068328857422, 81.14569854736328, 84.27071380615234, 87.39573669433594, 90.520751953125, 93.64576721191406, 96.77078247070312, 99.89579772949219, 103.02081298828125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 8.0, 9.0, 18.0, 30.0, 50.0, 57.0, 97.0, 160.0, 231.0, 346.0, 496.0, 721.0, 1221.0, 1041009.0, 1458.0, 876.0, 593.0, 392.0, 259.0, 180.0, 136.0, 76.0, 48.0, 33.0, 16.0, 14.0, 9.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.42410659790039, -38.71892547607422, -37.01374816894531, -35.30856704711914, -33.603389739990234, -31.898208618164062, -30.193029403686523, -28.487850189208984, -26.782670974731445, -25.077491760253906, -23.372312545776367, -21.667133331298828, -19.961952209472656, -18.25677490234375, -16.551593780517578, -14.846414566040039, -13.1412353515625, -11.436056137084961, -9.730876922607422, -8.025696754455566, -6.320517539978027, -4.615338325500488, -2.910158157348633, -1.2049789428710938, 0.5002002716064453, 2.2053797245025635, 3.9105591773986816, 5.615738868713379, 7.320918083190918, 9.026097297668457, 10.731277465820312, 12.436456680297852, 14.141632080078125, 15.846811294555664, 17.551990509033203, 19.257171630859375, 20.96234893798828, 22.667530059814453, 24.372709274291992, 26.07788848876953, 27.78306770324707, 29.48824691772461, 31.19342613220215, 32.89860534667969, 34.60378646850586, 36.308963775634766, 38.01414489746094, 39.719322204589844, 41.424503326416016, 43.12968444824219, 44.834861755371094, 46.540042877197266, 48.24522018432617, 49.950401306152344, 51.65557861328125, 53.36075973510742, 55.065940856933594, 56.771121978759766, 58.47629928588867, 60.181480407714844, 61.88665771484375, 63.59183883666992, 65.2970199584961, 67.002197265625, 68.7073745727539]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 13.0, 9.0, 12.0, 7.0, 9.0, 13.0, 29.0, 54.0, 425.0, 51462200.0, 191.0, 64.0, 27.0, 19.0, 7.0, 4.0, 4.0, 3.0, 4.0, 6.0, 11.0, 3.0, 3.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4720.0, -4518.69091796875, -4317.3818359375, -4116.07275390625, -3914.763671875, -3713.45458984375, -3512.1455078125, -3310.83642578125, -3109.52734375, -2908.21826171875, -2706.9091796875, -2505.60009765625, -2304.291015625, -2102.98193359375, -1901.6729736328125, -1700.3638916015625, -1499.054931640625, -1297.745849609375, -1096.436767578125, -895.1277465820312, -693.8186645507812, -492.50958251953125, -291.2005615234375, -89.8914794921875, 111.4176025390625, 312.7266845703125, 514.0357666015625, 715.3447875976562, 916.6538696289062, 1117.962890625, 1319.27197265625, 1520.5810546875, 1721.89013671875, 1923.19921875, 2124.50830078125, 2325.8173828125, 2527.12646484375, 2728.435546875, 2929.74462890625, 3131.0537109375, 3332.36279296875, 3533.671875, 3734.98095703125, 3936.2900390625, 4137.59912109375, 4338.908203125, 4540.21728515625, 4741.5263671875, 4942.8349609375, 5144.14404296875, 5345.453125, 5546.76220703125, 5748.0712890625, 5949.38037109375, 6150.689453125, 6351.99853515625, 6553.3076171875, 6754.61669921875, 6955.92578125, 7157.23486328125, 7358.5439453125, 7559.85302734375, 7761.162109375, 7962.47119140625, 8163.7802734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 9.0, 12.0, 6.0, 13.0, 20.0, 21.0, 34.0, 51.0, 94.0, 121.0, 172.0, 271.0, 365.0, 599.0, 845.0, 1368.0, 2096.0, 3248.0, 5217.0, 8273.0, 13101.0, 21116.0, 34397.0, 57158.0, 98917.0, 175744.0, 340485.0, 1365169.0, 3323656.0, 378720.0, 193464.0, 106601.0, 62497.0, 37086.0, 22284.0, 13949.0, 8834.0, 5599.0, 3397.0, 2212.0, 1386.0, 915.0, 616.0, 424.0, 281.0, 202.0, 121.0, 72.0, 74.0, 55.0, 27.0, 14.0, 14.0, 12.0, 7.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.06640625, -4.9132080078125, -4.760009765625, -4.6068115234375, -4.45361328125, -4.3004150390625, -4.147216796875, -3.9940185546875, -3.8408203125, -3.6876220703125, -3.534423828125, -3.3812255859375, -3.22802734375, -3.0748291015625, -2.921630859375, -2.7684326171875, -2.615234375, -2.4620361328125, -2.308837890625, -2.1556396484375, -2.00244140625, -1.8492431640625, -1.696044921875, -1.5428466796875, -1.3896484375, -1.2364501953125, -1.083251953125, -0.9300537109375, -0.77685546875, -0.6236572265625, -0.470458984375, -0.3172607421875, -0.1640625, -0.0108642578125, 0.142333984375, 0.2955322265625, 0.44873046875, 0.6019287109375, 0.755126953125, 0.9083251953125, 1.0615234375, 1.2147216796875, 1.367919921875, 1.5211181640625, 1.67431640625, 1.8275146484375, 1.980712890625, 2.1339111328125, 2.287109375, 2.4403076171875, 2.593505859375, 2.7467041015625, 2.89990234375, 3.0531005859375, 3.206298828125, 3.3594970703125, 3.5126953125, 3.6658935546875, 3.819091796875, 3.9722900390625, 4.12548828125, 4.2786865234375, 4.431884765625, 4.5850830078125, 4.73828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 2.0, 4.0, 10.0, 9.0, 11.0, 12.0, 16.0, 9.0, 20.0, 17.0, 27.0, 23.0, 29.0, 28.0, 31.0, 44.0, 34.0, 39.0, 50.0, 117.0, 355.0, 600.0, 101.0, 55.0, 40.0, 30.0, 34.0, 29.0, 37.0, 27.0, 27.0, 22.0, 18.0, 20.0, 17.0, 9.0, 12.0, 11.0, 8.0, 10.0, 6.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.5703125, -11.1998291015625, -10.829345703125, -10.4588623046875, -10.08837890625, -9.7178955078125, -9.347412109375, -8.9769287109375, -8.6064453125, -8.2359619140625, -7.865478515625, -7.4949951171875, -7.12451171875, -6.7540283203125, -6.383544921875, -6.0130615234375, -5.642578125, -5.2720947265625, -4.901611328125, -4.5311279296875, -4.16064453125, -3.7901611328125, -3.419677734375, -3.0491943359375, -2.6787109375, -2.3082275390625, -1.937744140625, -1.5672607421875, -1.19677734375, -0.8262939453125, -0.455810546875, -0.0853271484375, 0.28515625, 0.6556396484375, 1.026123046875, 1.3966064453125, 1.76708984375, 2.1375732421875, 2.508056640625, 2.8785400390625, 3.2490234375, 3.6195068359375, 3.989990234375, 4.3604736328125, 4.73095703125, 5.1014404296875, 5.471923828125, 5.8424072265625, 6.212890625, 6.5833740234375, 6.953857421875, 7.3243408203125, 7.69482421875, 8.0653076171875, 8.435791015625, 8.8062744140625, 9.1767578125, 9.5472412109375, 9.917724609375, 10.2882080078125, 10.65869140625, 11.0291748046875, 11.399658203125, 11.7701416015625, 12.140625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 7.0, 6.0, 11.0, 13.0, 22.0, 21.0, 55.0, 53.0, 120.0, 159.0, 326.0, 477.0, 773.0, 1331.0, 2328.0, 4158.0, 7435.0, 13803.0, 25708.0, 48981.0, 97003.0, 197367.0, 487541.0, 4177988.0, 730017.0, 250647.0, 118100.0, 58908.0, 30915.0, 16659.0, 8923.0, 4864.0, 2681.0, 1609.0, 913.0, 600.0, 342.0, 227.0, 132.0, 82.0, 40.0, 18.0, 19.0, 25.0, 16.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0], "bins": [-7.53515625, -7.31121826171875, -7.0872802734375, -6.86334228515625, -6.639404296875, -6.41546630859375, -6.1915283203125, -5.96759033203125, -5.74365234375, -5.51971435546875, -5.2957763671875, -5.07183837890625, -4.847900390625, -4.62396240234375, -4.4000244140625, -4.17608642578125, -3.9521484375, -3.72821044921875, -3.5042724609375, -3.28033447265625, -3.056396484375, -2.83245849609375, -2.6085205078125, -2.38458251953125, -2.16064453125, -1.93670654296875, -1.7127685546875, -1.48883056640625, -1.264892578125, -1.04095458984375, -0.8170166015625, -0.59307861328125, -0.369140625, -0.14520263671875, 0.0787353515625, 0.30267333984375, 0.526611328125, 0.75054931640625, 0.9744873046875, 1.19842529296875, 1.42236328125, 1.64630126953125, 1.8702392578125, 2.09417724609375, 2.318115234375, 2.54205322265625, 2.7659912109375, 2.98992919921875, 3.2138671875, 3.43780517578125, 3.6617431640625, 3.88568115234375, 4.109619140625, 4.33355712890625, 4.5574951171875, 4.78143310546875, 5.00537109375, 5.22930908203125, 5.4532470703125, 5.67718505859375, 5.901123046875, 6.12506103515625, 6.3489990234375, 6.57293701171875, 6.796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 12.0, 10.0, 12.0, 10.0, 19.0, 21.0, 24.0, 26.0, 26.0, 29.0, 44.0, 36.0, 42.0, 62.0, 67.0, 215.0, 624.0, 220.0, 81.0, 65.0, 46.0, 43.0, 28.0, 36.0, 32.0, 27.0, 29.0, 24.0, 19.0, 20.0, 14.0, 17.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.5546875, -9.2708740234375, -8.987060546875, -8.7032470703125, -8.41943359375, -8.1356201171875, -7.851806640625, -7.5679931640625, -7.2841796875, -7.0003662109375, -6.716552734375, -6.4327392578125, -6.14892578125, -5.8651123046875, -5.581298828125, -5.2974853515625, -5.013671875, -4.7298583984375, -4.446044921875, -4.1622314453125, -3.87841796875, -3.5946044921875, -3.310791015625, -3.0269775390625, -2.7431640625, -2.4593505859375, -2.175537109375, -1.8917236328125, -1.60791015625, -1.3240966796875, -1.040283203125, -0.7564697265625, -0.47265625, -0.1888427734375, 0.094970703125, 0.3787841796875, 0.66259765625, 0.9464111328125, 1.230224609375, 1.5140380859375, 1.7978515625, 2.0816650390625, 2.365478515625, 2.6492919921875, 2.93310546875, 3.2169189453125, 3.500732421875, 3.7845458984375, 4.068359375, 4.3521728515625, 4.635986328125, 4.9197998046875, 5.20361328125, 5.4874267578125, 5.771240234375, 6.0550537109375, 6.3388671875, 6.6226806640625, 6.906494140625, 7.1903076171875, 7.47412109375, 7.7579345703125, 8.041748046875, 8.3255615234375, 8.609375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 7.0, 5.0, 7.0, 18.0, 1.0, 5.0, 34.0, 33.0, 31.0, 30.0, 64.0, 66.0, 89.0, 118.0, 146.0, 196.0, 250.0, 299.0, 443.0, 562.0, 860.0, 1045.0, 1550.0, 2413.0, 3574.0, 6380.0, 12575.0, 28197.0, 86109.0, 5842378.0, 215349.0, 46719.0, 18404.0, 8920.0, 4907.0, 2859.0, 1835.0, 1389.0, 847.0, 685.0, 450.0, 382.0, 247.0, 220.0, 165.0, 129.0, 104.0, 89.0, 49.0, 48.0, 46.0, 13.0, 14.0, 26.0, 21.0, 23.0, 14.0, 1.0, 3.0, 9.0], "bins": [-16.90625, -16.4053955078125, -15.904541015625, -15.4036865234375, -14.90283203125, -14.4019775390625, -13.901123046875, -13.4002685546875, -12.8994140625, -12.3985595703125, -11.897705078125, -11.3968505859375, -10.89599609375, -10.3951416015625, -9.894287109375, -9.3934326171875, -8.892578125, -8.3917236328125, -7.890869140625, -7.3900146484375, -6.88916015625, -6.3883056640625, -5.887451171875, -5.3865966796875, -4.8857421875, -4.3848876953125, -3.884033203125, -3.3831787109375, -2.88232421875, -2.3814697265625, -1.880615234375, -1.3797607421875, -0.87890625, -0.3780517578125, 0.122802734375, 0.6236572265625, 1.12451171875, 1.6253662109375, 2.126220703125, 2.6270751953125, 3.1279296875, 3.6287841796875, 4.129638671875, 4.6304931640625, 5.13134765625, 5.6322021484375, 6.133056640625, 6.6339111328125, 7.134765625, 7.6356201171875, 8.136474609375, 8.6373291015625, 9.13818359375, 9.6390380859375, 10.139892578125, 10.6407470703125, 11.1416015625, 11.6424560546875, 12.143310546875, 12.6441650390625, 13.14501953125, 13.6458740234375, 14.146728515625, 14.6475830078125, 15.1484375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 6.0, 9.0, 7.0, 7.0, 17.0, 7.0, 12.0, 15.0, 18.0, 18.0, 19.0, 27.0, 36.0, 31.0, 36.0, 52.0, 53.0, 70.0, 114.0, 212.0, 443.0, 236.0, 107.0, 72.0, 54.0, 42.0, 30.0, 34.0, 39.0, 25.0, 25.0, 24.0, 14.0, 21.0, 10.0, 13.0, 16.0, 9.0, 7.0, 4.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.94140625, -5.76544189453125, -5.5894775390625, -5.41351318359375, -5.237548828125, -5.06158447265625, -4.8856201171875, -4.70965576171875, -4.53369140625, -4.35772705078125, -4.1817626953125, -4.00579833984375, -3.829833984375, -3.65386962890625, -3.4779052734375, -3.30194091796875, -3.1259765625, -2.95001220703125, -2.7740478515625, -2.59808349609375, -2.422119140625, -2.24615478515625, -2.0701904296875, -1.89422607421875, -1.71826171875, -1.54229736328125, -1.3663330078125, -1.19036865234375, -1.014404296875, -0.83843994140625, -0.6624755859375, -0.48651123046875, -0.310546875, -0.13458251953125, 0.0413818359375, 0.21734619140625, 0.393310546875, 0.56927490234375, 0.7452392578125, 0.92120361328125, 1.09716796875, 1.27313232421875, 1.4490966796875, 1.62506103515625, 1.801025390625, 1.97698974609375, 2.1529541015625, 2.32891845703125, 2.5048828125, 2.68084716796875, 2.8568115234375, 3.03277587890625, 3.208740234375, 3.38470458984375, 3.5606689453125, 3.73663330078125, 3.91259765625, 4.08856201171875, 4.2645263671875, 4.44049072265625, 4.616455078125, 4.79241943359375, 4.9683837890625, 5.14434814453125, 5.3203125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 16.0, 72.0, 251.0, 535.0, 92.0, 23.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-100.04877471923828, -98.23719787597656, -96.42562103271484, -94.6140365600586, -92.80245971679688, -90.99088287353516, -89.17930603027344, -87.36772918701172, -85.55615234375, -83.74457550048828, -81.93299865722656, -80.12141418457031, -78.3098373413086, -76.49826049804688, -74.68668365478516, -72.87510681152344, -71.06352233886719, -69.25194549560547, -67.44036865234375, -65.6287841796875, -63.81720733642578, -62.00563049316406, -60.194053649902344, -58.382476806640625, -56.57089614868164, -54.75931930541992, -52.94773864746094, -51.13616180419922, -49.3245849609375, -47.513004302978516, -45.7014274597168, -43.88984680175781, -42.07827377319336, -40.26669692993164, -38.455116271972656, -36.64353942871094, -34.83196258544922, -33.020381927490234, -31.208805084228516, -29.397226333618164, -27.585647583007812, -25.77406883239746, -23.96249008178711, -22.15091323852539, -20.33933448791504, -18.527755737304688, -16.71617889404297, -14.904600143432617, -13.093021392822266, -11.281442642211914, -9.469864845275879, -7.6582865715026855, -5.846708297729492, -4.035129547119141, -2.2235517501831055, -0.4119739532470703, 1.3996047973632812, 3.2111830711364746, 5.022761344909668, 6.834339618682861, 8.645917892456055, 10.457496643066406, 12.269074440002441, 14.080652236938477, 15.892230987548828]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 5.0, 5.0, 7.0, 13.0, 22.0, 14.0, 19.0, 32.0, 27.0, 29.0, 27.0, 38.0, 45.0, 43.0, 38.0, 41.0, 54.0, 49.0, 46.0, 33.0, 59.0, 43.0, 37.0, 41.0, 44.0, 22.0, 28.0, 26.0, 22.0, 28.0, 17.0, 14.0, 9.0, 8.0, 7.0, 3.0, 1.0, 8.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.205036163330078, -8.905710220336914, -8.60638427734375, -8.307058334350586, -8.007732391357422, -7.708406925201416, -7.409080982208252, -7.109755516052246, -6.810429573059082, -6.511103630065918, -6.211777687072754, -5.91245174407959, -5.613126277923584, -5.31380033493042, -5.014474391937256, -4.71514892578125, -4.415822505950928, -4.116496562957764, -3.8171708583831787, -3.5178449153900146, -3.2185192108154297, -2.9191932678222656, -2.6198673248291016, -2.3205416202545166, -2.0212156772613525, -1.721889853477478, -1.4225640296936035, -1.1232380867004395, -0.8239122629165649, -0.5245864391326904, -0.22526049613952637, 0.0740652084350586, 0.37339115142822266, 0.6727169752120972, 0.9720428586006165, 1.2713687419891357, 1.5706945657730103, 1.8700203895568848, 2.169346332550049, 2.468672037124634, 2.767997980117798, 3.067323923110962, 3.366649627685547, 3.665975570678711, 3.965301513671875, 4.264627456665039, 4.563953399658203, 4.863278865814209, 5.162604808807373, 5.461930751800537, 5.761256694793701, 6.060582160949707, 6.359908103942871, 6.659234046936035, 6.958559989929199, 7.257885932922363, 7.557211875915527, 7.856537818908691, 8.155863761901855, 8.45518970489502, 8.754515647888184, 9.053840637207031, 9.353166580200195, 9.65249252319336, 9.951818466186523]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 5.0, 5.0, 6.0, 5.0, 8.0, 14.0, 19.0, 23.0, 26.0, 45.0, 59.0, 79.0, 144.0, 223.0, 348.0, 572.0, 959.0, 1741.0, 3219.0, 7224.0, 21686.0, 3264130.0, 858073.0, 22007.0, 7435.0, 3115.0, 1447.0, 696.0, 360.0, 210.0, 139.0, 74.0, 51.0, 33.0, 28.0, 21.0, 14.0, 9.0, 4.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.035125732421875, -0.03412199020385742, -0.033118247985839844, -0.032114505767822266, -0.031110763549804688, -0.03010702133178711, -0.02910327911376953, -0.028099536895751953, -0.027095794677734375, -0.026092052459716797, -0.02508831024169922, -0.02408456802368164, -0.023080825805664062, -0.022077083587646484, -0.021073341369628906, -0.020069599151611328, -0.01906585693359375, -0.018062114715576172, -0.017058372497558594, -0.016054630279541016, -0.015050888061523438, -0.01404714584350586, -0.013043403625488281, -0.012039661407470703, -0.011035919189453125, -0.010032176971435547, -0.009028434753417969, -0.00802469253540039, -0.0070209503173828125, -0.006017208099365234, -0.005013465881347656, -0.004009723663330078, -0.0030059814453125, -0.002002239227294922, -0.0009984970092773438, 5.245208740234375e-06, 0.0010089874267578125, 0.0020127296447753906, 0.0030164718627929688, 0.004020214080810547, 0.005023956298828125, 0.006027698516845703, 0.007031440734863281, 0.00803518295288086, 0.009038925170898438, 0.010042667388916016, 0.011046409606933594, 0.012050151824951172, 0.01305389404296875, 0.014057636260986328, 0.015061378479003906, 0.016065120697021484, 0.017068862915039062, 0.01807260513305664, 0.01907634735107422, 0.020080089569091797, 0.021083831787109375, 0.022087574005126953, 0.02309131622314453, 0.02409505844116211, 0.025098800659179688, 0.026102542877197266, 0.027106285095214844, 0.028110027313232422, 0.02911376953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 5.0, 7.0, 6.0, 10.0, 6.0, 10.0, 6.0, 11.0, 14.0, 79.0, 499.0, 223.0, 23.0, 8.0, 9.0, 8.0, 10.0, 5.0, 11.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0016803741455078125, -0.0016288608312606812, -0.0015773475170135498, -0.0015258342027664185, -0.0014743208885192871, -0.0014228075742721558, -0.0013712942600250244, -0.001319780945777893, -0.0012682676315307617, -0.0012167543172836304, -0.001165241003036499, -0.0011137276887893677, -0.0010622143745422363, -0.001010701060295105, -0.0009591877460479736, -0.0009076744318008423, -0.0008561611175537109, -0.0008046478033065796, -0.0007531344890594482, -0.0007016211748123169, -0.0006501078605651855, -0.0005985945463180542, -0.0005470812320709229, -0.0004955679178237915, -0.00044405460357666016, -0.0003925412893295288, -0.00034102797508239746, -0.0002895146608352661, -0.00023800134658813477, -0.00018648803234100342, -0.00013497471809387207, -8.346140384674072e-05, -3.1948089599609375e-05, 1.9565224647521973e-05, 7.107853889465332e-05, 0.00012259185314178467, 0.00017410516738891602, 0.00022561848163604736, 0.0002771317958831787, 0.00032864511013031006, 0.0003801584243774414, 0.00043167173862457275, 0.0004831850528717041, 0.0005346983671188354, 0.0005862116813659668, 0.0006377249956130981, 0.0006892383098602295, 0.0007407516241073608, 0.0007922649383544922, 0.0008437782526016235, 0.0008952915668487549, 0.0009468048810958862, 0.0009983181953430176, 0.001049831509590149, 0.0011013448238372803, 0.0011528581380844116, 0.001204371452331543, 0.0012558847665786743, 0.0013073980808258057, 0.001358911395072937, 0.0014104247093200684, 0.0014619380235671997, 0.001513451337814331, 0.0015649646520614624, 0.0016164779663085938]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 14.0, 11.0, 9.0, 11.0, 19.0, 20.0, 31.0, 48.0, 78.0, 144.0, 213.0, 374.0, 689.0, 1334.0, 3684.0, 16811.0, 771253.0, 3372090.0, 20338.0, 3981.0, 1446.0, 680.0, 393.0, 217.0, 129.0, 75.0, 64.0, 34.0, 31.0, 13.0, 13.0, 9.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043060302734375, -0.041407108306884766, -0.03975391387939453, -0.0381007194519043, -0.03644752502441406, -0.03479433059692383, -0.033141136169433594, -0.03148794174194336, -0.029834747314453125, -0.02818155288696289, -0.026528358459472656, -0.024875164031982422, -0.023221969604492188, -0.021568775177001953, -0.01991558074951172, -0.018262386322021484, -0.01660919189453125, -0.014955997467041016, -0.013302803039550781, -0.011649608612060547, -0.009996414184570312, -0.008343219757080078, -0.006690025329589844, -0.005036830902099609, -0.003383636474609375, -0.0017304420471191406, -7.724761962890625e-05, 0.0015759468078613281, 0.0032291412353515625, 0.004882335662841797, 0.006535530090332031, 0.008188724517822266, 0.0098419189453125, 0.011495113372802734, 0.013148307800292969, 0.014801502227783203, 0.016454696655273438, 0.018107891082763672, 0.019761085510253906, 0.02141427993774414, 0.023067474365234375, 0.02472066879272461, 0.026373863220214844, 0.028027057647705078, 0.029680252075195312, 0.03133344650268555, 0.03298664093017578, 0.034639835357666016, 0.03629302978515625, 0.037946224212646484, 0.03959941864013672, 0.04125261306762695, 0.04290580749511719, 0.04455900192260742, 0.046212196350097656, 0.04786539077758789, 0.049518585205078125, 0.05117177963256836, 0.052824974060058594, 0.05447816848754883, 0.05613136291503906, 0.0577845573425293, 0.05943775177001953, 0.061090946197509766, 0.062744140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 11.0, 15.0, 20.0, 24.0, 23.0, 41.0, 44.0, 54.0, 68.0, 99.0, 128.0, 175.0, 298.0, 1478.0, 699.0, 233.0, 166.0, 122.0, 71.0, 66.0, 59.0, 33.0, 29.0, 28.0, 16.0, 12.0, 17.0, 9.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0033664703369140625, -0.0032411515712738037, -0.003115832805633545, -0.002990514039993286, -0.0028651952743530273, -0.0027398765087127686, -0.0026145577430725098, -0.002489238977432251, -0.002363920211791992, -0.0022386014461517334, -0.0021132826805114746, -0.001987963914871216, -0.001862645149230957, -0.0017373263835906982, -0.0016120076179504395, -0.0014866888523101807, -0.0013613700866699219, -0.001236051321029663, -0.0011107325553894043, -0.0009854137897491455, -0.0008600950241088867, -0.0007347762584686279, -0.0006094574928283691, -0.00048413872718811035, -0.00035881996154785156, -0.00023350119590759277, -0.00010818243026733398, 1.7136335372924805e-05, 0.0001424551010131836, 0.0002677738666534424, 0.00039309263229370117, 0.00051841139793396, 0.0006437301635742188, 0.0007690489292144775, 0.0008943676948547363, 0.0010196864604949951, 0.001145005226135254, 0.0012703239917755127, 0.0013956427574157715, 0.0015209615230560303, 0.001646280288696289, 0.0017715990543365479, 0.0018969178199768066, 0.0020222365856170654, 0.0021475553512573242, 0.002272874116897583, 0.002398192882537842, 0.0025235116481781006, 0.0026488304138183594, 0.002774149179458618, 0.002899467945098877, 0.0030247867107391357, 0.0031501054763793945, 0.0032754242420196533, 0.003400743007659912, 0.003526061773300171, 0.0036513805389404297, 0.0037766993045806885, 0.0039020180702209473, 0.004027336835861206, 0.004152655601501465, 0.004277974367141724, 0.004403293132781982, 0.004528611898422241, 0.0046539306640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 10.0, 18.0, 66.0, 231.0, 472.0, 136.0, 39.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0440877303481102, -0.04168759286403656, -0.03928745537996292, -0.03688731789588928, -0.03448718041181564, -0.032087042927742004, -0.029686905443668365, -0.027286767959594727, -0.024886630475521088, -0.02248649299144745, -0.02008635550737381, -0.01768621802330017, -0.015286080539226532, -0.012885943055152893, -0.010485805571079254, -0.008085668087005615, -0.005685530602931976, -0.0032853931188583374, -0.0008852556347846985, 0.0015148818492889404, 0.003915019333362579, 0.006315156817436218, 0.008715294301509857, 0.011115431785583496, 0.013515569269657135, 0.015915706753730774, 0.018315844237804413, 0.020715981721878052, 0.02311611920595169, 0.02551625669002533, 0.02791639417409897, 0.030316531658172607, 0.03271667659282684, 0.03511681407690048, 0.03751695156097412, 0.03991708904504776, 0.0423172265291214, 0.04471736401319504, 0.04711750149726868, 0.049517638981342316, 0.051917776465415955, 0.054317913949489594, 0.05671805143356323, 0.05911818891763687, 0.06151832640171051, 0.06391846388578415, 0.06631860136985779, 0.06871873885393143, 0.07111887633800507, 0.0735190138220787, 0.07591915130615234, 0.07831928879022598, 0.08071942627429962, 0.08311956375837326, 0.0855197012424469, 0.08791983872652054, 0.09031997621059418, 0.09272011369466782, 0.09512025117874146, 0.0975203886628151, 0.09992052614688873, 0.10232066363096237, 0.10472080111503601, 0.10712093859910965, 0.10952107608318329]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 13.0, 9.0, 21.0, 24.0, 33.0, 25.0, 35.0, 37.0, 53.0, 45.0, 47.0, 54.0, 61.0, 43.0, 60.0, 36.0, 48.0, 45.0, 55.0, 44.0, 29.0, 31.0, 28.0, 20.0, 21.0, 12.0, 15.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.013874709606170654, -0.013360245153307915, -0.012845780700445175, -0.012331316247582436, -0.011816851794719696, -0.011302387341856956, -0.010787922888994217, -0.010273458436131477, -0.009758993983268738, -0.009244529530405998, -0.008730065077543259, -0.008215600624680519, -0.0077011361718177795, -0.00718667171895504, -0.0066722072660923, -0.006157742813229561, -0.005643278360366821, -0.005128813907504082, -0.004614349454641342, -0.004099885001778603, -0.003585420548915863, -0.0030709560960531235, -0.002556491643190384, -0.0020420271903276443, -0.0015275627374649048, -0.0010130982846021652, -0.0004986338317394257, 1.5830621123313904e-05, 0.0005302950739860535, 0.001044759526848793, 0.0015592239797115326, 0.002073688432574272, 0.0025881528854370117, 0.0031026173382997513, 0.003617081791162491, 0.00413154624402523, 0.00464601069688797, 0.0051604751497507095, 0.005674939602613449, 0.006189404055476189, 0.006703868508338928, 0.007218332961201668, 0.007732797414064407, 0.008247261866927147, 0.008761726319789886, 0.009276190772652626, 0.009790655225515366, 0.010305119678378105, 0.010819584131240845, 0.011334048584103584, 0.011848513036966324, 0.012362977489829063, 0.012877441942691803, 0.013391906395554543, 0.013906370848417282, 0.014420835301280022, 0.014935299754142761, 0.0154497642070055, 0.01596422865986824, 0.01647869311273098, 0.01699315756559372, 0.01750762201845646, 0.0180220864713192, 0.018536550924181938, 0.019051015377044678]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 12.0, 20.0, 23.0, 19.0, 32.0, 43.0, 57.0, 80.0, 89.0, 141.0, 195.0, 277.0, 333.0, 544.0, 732.0, 1039.0, 1465.0, 2224.0, 3380.0, 5384.0, 8461.0, 15292.0, 34971.0, 819884.0, 100946.0, 21920.0, 11352.0, 6620.0, 4237.0, 2709.0, 1807.0, 1241.0, 843.0, 604.0, 420.0, 284.0, 232.0, 166.0, 138.0, 95.0, 62.0, 36.0, 38.0, 24.0, 17.0, 17.0, 9.0, 7.0, 8.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0], "bins": [-0.01934814453125, -0.018757343292236328, -0.018166542053222656, -0.017575740814208984, -0.016984939575195312, -0.01639413833618164, -0.01580333709716797, -0.015212535858154297, -0.014621734619140625, -0.014030933380126953, -0.013440132141113281, -0.01284933090209961, -0.012258529663085938, -0.011667728424072266, -0.011076927185058594, -0.010486125946044922, -0.00989532470703125, -0.009304523468017578, -0.008713722229003906, -0.008122920989990234, -0.0075321197509765625, -0.006941318511962891, -0.006350517272949219, -0.005759716033935547, -0.005168914794921875, -0.004578113555908203, -0.003987312316894531, -0.0033965110778808594, -0.0028057098388671875, -0.0022149085998535156, -0.0016241073608398438, -0.0010333061218261719, -0.0004425048828125, 0.00014829635620117188, 0.0007390975952148438, 0.0013298988342285156, 0.0019207000732421875, 0.0025115013122558594, 0.0031023025512695312, 0.003693103790283203, 0.004283905029296875, 0.004874706268310547, 0.005465507507324219, 0.006056308746337891, 0.0066471099853515625, 0.007237911224365234, 0.007828712463378906, 0.008419513702392578, 0.00901031494140625, 0.009601116180419922, 0.010191917419433594, 0.010782718658447266, 0.011373519897460938, 0.01196432113647461, 0.012555122375488281, 0.013145923614501953, 0.013736724853515625, 0.014327526092529297, 0.014918327331542969, 0.01550912857055664, 0.016099929809570312, 0.016690731048583984, 0.017281532287597656, 0.017872333526611328, 0.018463134765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 9.0, 7.0, 9.0, 13.0, 11.0, 65.0, 333.0, 341.0, 72.0, 19.0, 7.0, 11.0, 7.0, 9.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0017604827880859375, -0.001710057258605957, -0.0016596317291259766, -0.001609206199645996, -0.0015587806701660156, -0.0015083551406860352, -0.0014579296112060547, -0.0014075040817260742, -0.0013570785522460938, -0.0013066530227661133, -0.0012562274932861328, -0.0012058019638061523, -0.0011553764343261719, -0.0011049509048461914, -0.001054525375366211, -0.0010040998458862305, -0.00095367431640625, -0.0009032487869262695, -0.0008528232574462891, -0.0008023977279663086, -0.0007519721984863281, -0.0007015466690063477, -0.0006511211395263672, -0.0006006956100463867, -0.0005502700805664062, -0.0004998445510864258, -0.0004494190216064453, -0.00039899349212646484, -0.0003485679626464844, -0.0002981424331665039, -0.00024771690368652344, -0.00019729137420654297, -0.0001468658447265625, -9.644031524658203e-05, -4.601478576660156e-05, 4.410743713378906e-06, 5.4836273193359375e-05, 0.00010526180267333984, 0.0001556873321533203, 0.00020611286163330078, 0.00025653839111328125, 0.0003069639205932617, 0.0003573894500732422, 0.00040781497955322266, 0.0004582405090332031, 0.0005086660385131836, 0.0005590915679931641, 0.0006095170974731445, 0.000659942626953125, 0.0007103681564331055, 0.0007607936859130859, 0.0008112192153930664, 0.0008616447448730469, 0.0009120702743530273, 0.0009624958038330078, 0.0010129213333129883, 0.0010633468627929688, 0.0011137723922729492, 0.0011641979217529297, 0.0012146234512329102, 0.0012650489807128906, 0.001315474510192871, 0.0013659000396728516, 0.001416325569152832, 0.0014667510986328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 4.0, 3.0, 7.0, 5.0, 5.0, 16.0, 9.0, 19.0, 25.0, 24.0, 40.0, 39.0, 67.0, 66.0, 107.0, 188.0, 253.0, 307.0, 511.0, 791.0, 1293.0, 2166.0, 4475.0, 11437.0, 57456.0, 854643.0, 88800.0, 14125.0, 5240.0, 2424.0, 1380.0, 849.0, 517.0, 331.0, 233.0, 206.0, 133.0, 79.0, 71.0, 53.0, 43.0, 29.0, 19.0, 19.0, 10.0, 15.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.0357666015625, -0.034668922424316406, -0.03357124328613281, -0.03247356414794922, -0.031375885009765625, -0.03027820587158203, -0.029180526733398438, -0.028082847595214844, -0.02698516845703125, -0.025887489318847656, -0.024789810180664062, -0.02369213104248047, -0.022594451904296875, -0.02149677276611328, -0.020399093627929688, -0.019301414489746094, -0.0182037353515625, -0.017106056213378906, -0.016008377075195312, -0.014910697937011719, -0.013813018798828125, -0.012715339660644531, -0.011617660522460938, -0.010519981384277344, -0.00942230224609375, -0.008324623107910156, -0.0072269439697265625, -0.006129264831542969, -0.005031585693359375, -0.003933906555175781, -0.0028362274169921875, -0.0017385482788085938, -0.000640869140625, 0.00045680999755859375, 0.0015544891357421875, 0.0026521682739257812, 0.003749847412109375, 0.004847526550292969, 0.0059452056884765625, 0.007042884826660156, 0.00814056396484375, 0.009238243103027344, 0.010335922241210938, 0.011433601379394531, 0.012531280517578125, 0.013628959655761719, 0.014726638793945312, 0.015824317932128906, 0.0169219970703125, 0.018019676208496094, 0.019117355346679688, 0.02021503448486328, 0.021312713623046875, 0.02241039276123047, 0.023508071899414062, 0.024605751037597656, 0.02570343017578125, 0.026801109313964844, 0.027898788452148438, 0.02899646759033203, 0.030094146728515625, 0.03119182586669922, 0.03228950500488281, 0.033387184143066406, 0.03448486328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 6.0, 14.0, 11.0, 9.0, 12.0, 11.0, 18.0, 21.0, 28.0, 26.0, 30.0, 23.0, 41.0, 39.0, 37.0, 40.0, 46.0, 42.0, 39.0, 40.0, 37.0, 34.0, 47.0, 42.0, 41.0, 30.0, 26.0, 31.0, 40.0, 21.0, 18.0, 15.0, 17.0, 13.0, 7.0, 10.0, 6.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007640838623046875, -0.00741344690322876, -0.0071860551834106445, -0.006958663463592529, -0.006731271743774414, -0.006503880023956299, -0.006276488304138184, -0.006049096584320068, -0.005821704864501953, -0.005594313144683838, -0.005366921424865723, -0.005139529705047607, -0.004912137985229492, -0.004684746265411377, -0.004457354545593262, -0.0042299628257751465, -0.004002571105957031, -0.003775179386138916, -0.0035477876663208008, -0.0033203959465026855, -0.0030930042266845703, -0.002865612506866455, -0.00263822078704834, -0.0024108290672302246, -0.0021834373474121094, -0.001956045627593994, -0.001728653907775879, -0.0015012621879577637, -0.0012738704681396484, -0.0010464787483215332, -0.000819087028503418, -0.0005916953086853027, -0.0003643035888671875, -0.00013691186904907227, 9.047985076904297e-05, 0.0003178715705871582, 0.0005452632904052734, 0.0007726550102233887, 0.001000046730041504, 0.0012274384498596191, 0.0014548301696777344, 0.0016822218894958496, 0.0019096136093139648, 0.00213700532913208, 0.0023643970489501953, 0.0025917887687683105, 0.0028191804885864258, 0.003046572208404541, 0.0032739639282226562, 0.0035013556480407715, 0.0037287473678588867, 0.003956139087677002, 0.004183530807495117, 0.004410922527313232, 0.004638314247131348, 0.004865705966949463, 0.005093097686767578, 0.005320489406585693, 0.005547881126403809, 0.005775272846221924, 0.006002664566040039, 0.006230056285858154, 0.0064574480056762695, 0.006684839725494385, 0.0069122314453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 4.0, 9.0, 10.0, 8.0, 21.0, 42.0, 44.0, 86.0, 208.0, 671.0, 4318.0, 896820.0, 142225.0, 3062.0, 609.0, 164.0, 86.0, 39.0, 23.0, 12.0, 20.0, 12.0, 5.0, 10.0, 11.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0294189453125, -0.02868199348449707, -0.02794504165649414, -0.02720808982849121, -0.02647113800048828, -0.02573418617248535, -0.024997234344482422, -0.024260282516479492, -0.023523330688476562, -0.022786378860473633, -0.022049427032470703, -0.021312475204467773, -0.020575523376464844, -0.019838571548461914, -0.019101619720458984, -0.018364667892456055, -0.017627716064453125, -0.016890764236450195, -0.016153812408447266, -0.015416860580444336, -0.014679908752441406, -0.013942956924438477, -0.013206005096435547, -0.012469053268432617, -0.011732101440429688, -0.010995149612426758, -0.010258197784423828, -0.009521245956420898, -0.008784294128417969, -0.008047342300415039, -0.007310390472412109, -0.00657343864440918, -0.00583648681640625, -0.00509953498840332, -0.004362583160400391, -0.003625631332397461, -0.0028886795043945312, -0.0021517276763916016, -0.0014147758483886719, -0.0006778240203857422, 5.91278076171875e-05, 0.0007960796356201172, 0.0015330314636230469, 0.0022699832916259766, 0.0030069351196289062, 0.003743886947631836, 0.004480838775634766, 0.005217790603637695, 0.005954742431640625, 0.006691694259643555, 0.007428646087646484, 0.008165597915649414, 0.008902549743652344, 0.009639501571655273, 0.010376453399658203, 0.011113405227661133, 0.011850357055664062, 0.012587308883666992, 0.013324260711669922, 0.014061212539672852, 0.014798164367675781, 0.015535116195678711, 0.01627206802368164, 0.01700901985168457, 0.0177459716796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 14.0, 10.0, 16.0, 24.0, 37.0, 57.0, 89.0, 110.0, 125.0, 124.0, 114.0, 77.0, 63.0, 30.0, 35.0, 22.0, 7.0, 10.0, 13.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0471553802490234e-05, -3.940518945455551e-05, -3.833882510662079e-05, -3.7272460758686066e-05, -3.620609641075134e-05, -3.513973206281662e-05, -3.40733677148819e-05, -3.3007003366947174e-05, -3.194063901901245e-05, -3.087427467107773e-05, -2.9807910323143005e-05, -2.8741545975208282e-05, -2.767518162727356e-05, -2.6608817279338837e-05, -2.5542452931404114e-05, -2.447608858346939e-05, -2.3409724235534668e-05, -2.2343359887599945e-05, -2.1276995539665222e-05, -2.02106311917305e-05, -1.9144266843795776e-05, -1.8077902495861053e-05, -1.701153814792633e-05, -1.5945173799991608e-05, -1.4878809452056885e-05, -1.3812445104122162e-05, -1.2746080756187439e-05, -1.1679716408252716e-05, -1.0613352060317993e-05, -9.54698771238327e-06, -8.480623364448547e-06, -7.4142590165138245e-06, -6.3478946685791016e-06, -5.281530320644379e-06, -4.215165972709656e-06, -3.148801624774933e-06, -2.08243727684021e-06, -1.016072928905487e-06, 5.029141902923584e-08, 1.1166557669639587e-06, 2.1830201148986816e-06, 3.2493844628334045e-06, 4.3157488107681274e-06, 5.38211315870285e-06, 6.448477506637573e-06, 7.514841854572296e-06, 8.581206202507019e-06, 9.647570550441742e-06, 1.0713934898376465e-05, 1.1780299246311188e-05, 1.284666359424591e-05, 1.3913027942180634e-05, 1.4979392290115356e-05, 1.604575663805008e-05, 1.7112120985984802e-05, 1.8178485333919525e-05, 1.9244849681854248e-05, 2.031121402978897e-05, 2.1377578377723694e-05, 2.2443942725658417e-05, 2.351030707359314e-05, 2.4576671421527863e-05, 2.5643035769462585e-05, 2.670940011739731e-05, 2.777576446533203e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 4.0, 6.0, 11.0, 12.0, 15.0, 44.0, 57.0, 81.0, 111.0, 179.0, 293.0, 496.0, 993.0, 2428.0, 9335.0, 769458.0, 252584.0, 8059.0, 2137.0, 934.0, 508.0, 288.0, 157.0, 92.0, 69.0, 51.0, 42.0, 31.0, 13.0, 18.0, 7.0, 8.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0278778076171875, -0.027005434036254883, -0.026133060455322266, -0.02526068687438965, -0.02438831329345703, -0.023515939712524414, -0.022643566131591797, -0.02177119255065918, -0.020898818969726562, -0.020026445388793945, -0.019154071807861328, -0.01828169822692871, -0.017409324645996094, -0.016536951065063477, -0.01566457748413086, -0.014792203903198242, -0.013919830322265625, -0.013047456741333008, -0.01217508316040039, -0.011302709579467773, -0.010430335998535156, -0.009557962417602539, -0.008685588836669922, -0.007813215255737305, -0.0069408416748046875, -0.00606846809387207, -0.005196094512939453, -0.004323720932006836, -0.0034513473510742188, -0.0025789737701416016, -0.0017066001892089844, -0.0008342266082763672, 3.814697265625e-05, 0.0009105205535888672, 0.0017828941345214844, 0.0026552677154541016, 0.0035276412963867188, 0.004400014877319336, 0.005272388458251953, 0.00614476203918457, 0.0070171356201171875, 0.007889509201049805, 0.008761882781982422, 0.009634256362915039, 0.010506629943847656, 0.011379003524780273, 0.01225137710571289, 0.013123750686645508, 0.013996124267578125, 0.014868497848510742, 0.01574087142944336, 0.016613245010375977, 0.017485618591308594, 0.01835799217224121, 0.019230365753173828, 0.020102739334106445, 0.020975112915039062, 0.02184748649597168, 0.022719860076904297, 0.023592233657836914, 0.02446460723876953, 0.02533698081970215, 0.026209354400634766, 0.027081727981567383, 0.0279541015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 12.0, 12.0, 14.0, 22.0, 23.0, 34.0, 51.0, 74.0, 141.0, 195.0, 162.0, 81.0, 33.0, 32.0, 28.0, 17.0, 11.0, 7.0, 7.0, 6.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00684356689453125, -0.006638944149017334, -0.006434321403503418, -0.006229698657989502, -0.006025075912475586, -0.00582045316696167, -0.005615830421447754, -0.005411207675933838, -0.005206584930419922, -0.005001962184906006, -0.00479733943939209, -0.004592716693878174, -0.004388093948364258, -0.004183471202850342, -0.003978848457336426, -0.0037742257118225098, -0.0035696029663085938, -0.0033649802207946777, -0.0031603574752807617, -0.0029557347297668457, -0.0027511119842529297, -0.0025464892387390137, -0.0023418664932250977, -0.0021372437477111816, -0.0019326210021972656, -0.0017279982566833496, -0.0015233755111694336, -0.0013187527656555176, -0.0011141300201416016, -0.0009095072746276855, -0.0007048845291137695, -0.0005002617835998535, -0.0002956390380859375, -9.101629257202148e-05, 0.00011360645294189453, 0.00031822919845581055, 0.0005228519439697266, 0.0007274746894836426, 0.0009320974349975586, 0.0011367201805114746, 0.0013413429260253906, 0.0015459656715393066, 0.0017505884170532227, 0.0019552111625671387, 0.0021598339080810547, 0.0023644566535949707, 0.0025690793991088867, 0.0027737021446228027, 0.0029783248901367188, 0.0031829476356506348, 0.0033875703811645508, 0.003592193126678467, 0.003796815872192383, 0.004001438617706299, 0.004206061363220215, 0.004410684108734131, 0.004615306854248047, 0.004819929599761963, 0.005024552345275879, 0.005229175090789795, 0.005433797836303711, 0.005638420581817627, 0.005843043327331543, 0.006047666072845459, 0.006252288818359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 9.0, 8.0, 23.0, 154.0, 666.0, 63.0, 23.0, 21.0, 13.0, 3.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3244737386703491, -0.3105740547180176, -0.29667437076568604, -0.2827746570110321, -0.26887497305870056, -0.254975289106369, -0.24107559025287628, -0.22717589139938354, -0.213276207447052, -0.19937652349472046, -0.18547682464122772, -0.17157712578773499, -0.15767744183540344, -0.1437777578830719, -0.12987805902957916, -0.11597836762666702, -0.10207867622375488, -0.08817898482084274, -0.0742792934179306, -0.06037960201501846, -0.04647991061210632, -0.03258021920919418, -0.018680527806282043, -0.0047808364033699036, 0.009118854999542236, 0.023018546402454376, 0.036918237805366516, 0.050817929208278656, 0.0647176206111908, 0.07861731201410294, 0.09251700341701508, 0.10641669481992722, 0.12031638622283936, 0.1342160701751709, 0.14811576902866364, 0.16201546788215637, 0.17591515183448792, 0.18981483578681946, 0.2037145346403122, 0.21761423349380493, 0.23151391744613647, 0.24541360139846802, 0.25931328535079956, 0.2732129991054535, 0.28711268305778503, 0.3010123670101166, 0.3149120807647705, 0.32881176471710205, 0.3427114486694336, 0.35661113262176514, 0.3705108165740967, 0.3844105303287506, 0.39831021428108215, 0.4122098982334137, 0.4261096119880676, 0.44000929594039917, 0.4539089798927307, 0.46780866384506226, 0.4817083477973938, 0.49560806155204773, 0.5095077753067017, 0.5234074592590332, 0.5373071432113647, 0.5512068271636963, 0.5651065111160278]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 5.0, 8.0, 7.0, 7.0, 9.0, 20.0, 30.0, 53.0, 107.0, 126.0, 179.0, 150.0, 108.0, 60.0, 32.0, 18.0, 14.0, 11.0, 6.0, 5.0, 5.0, 9.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12328165769577026, -0.11845885217189789, -0.11363604664802551, -0.10881324112415314, -0.10399043560028076, -0.09916763007640839, -0.09434483200311661, -0.08952202647924423, -0.08469922095537186, -0.07987641543149948, -0.0750536099076271, -0.07023080438375473, -0.06540800631046295, -0.06058519706130028, -0.0557623952627182, -0.050939589738845825, -0.04611678421497345, -0.041293978691101074, -0.0364711731672287, -0.03164837136864662, -0.026825565844774246, -0.02200276032090187, -0.017179956659674644, -0.012357152998447418, -0.007534347474575043, -0.002711542882025242, 0.002111261710524559, 0.00693406630307436, 0.01175687089562416, 0.016579676419496536, 0.021402480080723763, 0.02622528374195099, 0.031048089265823364, 0.03587089478969574, 0.040693700313568115, 0.04551650211215019, 0.05033930763602257, 0.05516211315989494, 0.05998491495847702, 0.0648077204823494, 0.06963052600622177, 0.07445333153009415, 0.07927613705396652, 0.0840989425778389, 0.08892174065113068, 0.09374454617500305, 0.09856735169887543, 0.1033901572227478, 0.10821296274662018, 0.11303576827049255, 0.11785857379436493, 0.1226813793182373, 0.12750418484210968, 0.13232699036598206, 0.13714979588985443, 0.1419726014137268, 0.146795392036438, 0.15161819756031036, 0.15644100308418274, 0.16126380860805511, 0.1660866141319275, 0.17090941965579987, 0.17573222517967224, 0.18055501580238342, 0.185377836227417]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 10.0, 14.0, 18.0, 17.0, 20.0, 34.0, 58.0, 147.0, 1190.0, 50004.0, 4139548.0, 2817.0, 150.0, 50.0, 38.0, 26.0, 23.0, 21.0, 14.0, 13.0, 6.0, 3.0, 5.0, 10.0, 1.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.90625, -2.8321075439453125, -2.757965087890625, -2.6838226318359375, -2.60968017578125, -2.5355377197265625, -2.461395263671875, -2.3872528076171875, -2.3131103515625, -2.2389678955078125, -2.164825439453125, -2.0906829833984375, -2.01654052734375, -1.9423980712890625, -1.868255615234375, -1.7941131591796875, -1.719970703125, -1.6458282470703125, -1.571685791015625, -1.4975433349609375, -1.42340087890625, -1.3492584228515625, -1.275115966796875, -1.2009735107421875, -1.1268310546875, -1.0526885986328125, -0.978546142578125, -0.9044036865234375, -0.83026123046875, -0.7561187744140625, -0.681976318359375, -0.6078338623046875, -0.53369140625, -0.4595489501953125, -0.385406494140625, -0.3112640380859375, -0.23712158203125, -0.1629791259765625, -0.088836669921875, -0.0146942138671875, 0.0594482421875, 0.1335906982421875, 0.207733154296875, 0.2818756103515625, 0.35601806640625, 0.4301605224609375, 0.504302978515625, 0.5784454345703125, 0.652587890625, 0.7267303466796875, 0.800872802734375, 0.8750152587890625, 0.94915771484375, 1.0233001708984375, 1.097442626953125, 1.1715850830078125, 1.2457275390625, 1.3198699951171875, 1.394012451171875, 1.4681549072265625, 1.54229736328125, 1.6164398193359375, 1.690582275390625, 1.7647247314453125, 1.8388671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 5.0, 4.0, 9.0, 7.0, 9.0, 9.0, 24.0, 84.0, 283.0, 323.0, 97.0, 24.0, 15.0, 7.0, 7.0, 11.0, 7.0, 9.0, 7.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0014324188232421875, -0.0013889670372009277, -0.001345515251159668, -0.0013020634651184082, -0.0012586116790771484, -0.0012151598930358887, -0.001171708106994629, -0.0011282563209533691, -0.0010848045349121094, -0.0010413527488708496, -0.0009979009628295898, -0.0009544491767883301, -0.0009109973907470703, -0.0008675456047058105, -0.0008240938186645508, -0.000780642032623291, -0.0007371902465820312, -0.0006937384605407715, -0.0006502866744995117, -0.000606834888458252, -0.0005633831024169922, -0.0005199313163757324, -0.00047647953033447266, -0.0004330277442932129, -0.0003895759582519531, -0.00034612417221069336, -0.0003026723861694336, -0.00025922060012817383, -0.00021576881408691406, -0.0001723170280456543, -0.00012886524200439453, -8.541345596313477e-05, -4.1961669921875e-05, 1.4901161193847656e-06, 4.494190216064453e-05, 8.83936882019043e-05, 0.00013184547424316406, 0.00017529726028442383, 0.0002187490463256836, 0.00026220083236694336, 0.0003056526184082031, 0.0003491044044494629, 0.00039255619049072266, 0.0004360079765319824, 0.0004794597625732422, 0.000522911548614502, 0.0005663633346557617, 0.0006098151206970215, 0.0006532669067382812, 0.000696718692779541, 0.0007401704788208008, 0.0007836222648620605, 0.0008270740509033203, 0.0008705258369445801, 0.0009139776229858398, 0.0009574294090270996, 0.0010008811950683594, 0.0010443329811096191, 0.001087784767150879, 0.0011312365531921387, 0.0011746883392333984, 0.0012181401252746582, 0.001261591911315918, 0.0013050436973571777, 0.0013484954833984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 1.0, 18.0, 14.0, 36.0, 45.0, 78.0, 128.0, 208.0, 350.0, 106355.0, 4085870.0, 459.0, 233.0, 184.0, 120.0, 75.0, 49.0, 30.0, 22.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3667106628417969, -0.33864593505859375, -0.3105812072753906, -0.2825164794921875, -0.2544517517089844, -0.22638702392578125, -0.19832229614257812, -0.170257568359375, -0.14219284057617188, -0.11412811279296875, -0.08606338500976562, -0.0579986572265625, -0.029933929443359375, -0.00186920166015625, 0.026195526123046875, 0.05426025390625, 0.08232498168945312, 0.11038970947265625, 0.13845443725585938, 0.1665191650390625, 0.19458389282226562, 0.22264862060546875, 0.2507133483886719, 0.278778076171875, 0.3068428039550781, 0.33490753173828125, 0.3629722595214844, 0.3910369873046875, 0.4191017150878906, 0.44716644287109375, 0.4752311706542969, 0.5032958984375, 0.5313606262207031, 0.5594253540039062, 0.5874900817871094, 0.6155548095703125, 0.6436195373535156, 0.6716842651367188, 0.6997489929199219, 0.727813720703125, 0.7558784484863281, 0.7839431762695312, 0.8120079040527344, 0.8400726318359375, 0.8681373596191406, 0.8962020874023438, 0.9242668151855469, 0.95233154296875, 0.9803962707519531, 1.0084609985351562, 1.0365257263183594, 1.0645904541015625, 1.0926551818847656, 1.1207199096679688, 1.1487846374511719, 1.176849365234375, 1.2049140930175781, 1.2329788208007812, 1.2610435485839844, 1.2891082763671875, 1.3171730041503906, 1.3452377319335938, 1.3733024597167969, 1.4013671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 8.0, 15.0, 22.0, 36.0, 48.0, 100.0, 144.0, 236.0, 380.0, 1459.0, 581.0, 321.0, 234.0, 188.0, 111.0, 82.0, 48.0, 29.0, 21.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027332305908203125, -0.002521008253097534, -0.002308785915374756, -0.0020965635776519775, -0.0018843412399291992, -0.001672118902206421, -0.0014598965644836426, -0.0012476742267608643, -0.001035451889038086, -0.0008232295513153076, -0.0006110072135925293, -0.000398784875869751, -0.00018656253814697266, 2.5659799575805664e-05, 0.00023788213729858398, 0.0004501044750213623, 0.0006623268127441406, 0.0008745491504669189, 0.0010867714881896973, 0.0012989938259124756, 0.001511216163635254, 0.0017234385013580322, 0.0019356608390808105, 0.002147883176803589, 0.002360105514526367, 0.0025723278522491455, 0.002784550189971924, 0.002996772527694702, 0.0032089948654174805, 0.003421217203140259, 0.003633439540863037, 0.0038456618785858154, 0.004057884216308594, 0.004270106554031372, 0.00448232889175415, 0.004694551229476929, 0.004906773567199707, 0.005118995904922485, 0.005331218242645264, 0.005543440580368042, 0.00575566291809082, 0.005967885255813599, 0.006180107593536377, 0.006392329931259155, 0.006604552268981934, 0.006816774606704712, 0.00702899694442749, 0.0072412192821502686, 0.007453441619873047, 0.007665663957595825, 0.007877886295318604, 0.008090108633041382, 0.00830233097076416, 0.008514553308486938, 0.008726775646209717, 0.008938997983932495, 0.009151220321655273, 0.009363442659378052, 0.00957566499710083, 0.009787887334823608, 0.010000109672546387, 0.010212332010269165, 0.010424554347991943, 0.010636776685714722, 0.0108489990234375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [616.0, 389.0, 17.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0585235059261322, 0.003385651856660843, 0.06529480963945389, 0.12720397114753723, 0.18911312520503998, 0.2510222792625427, 0.31293144822120667, 0.3748405873775482, 0.43674975633621216, 0.4986589252948761, 0.56056809425354, 0.6224772334098816, 0.6843863725662231, 0.7462955713272095, 0.808204710483551, 0.8701138496398926, 0.9320230484008789, 0.9939321875572205, 1.055841326713562, 1.1177505254745483, 1.1796597242355347, 1.2415688037872314, 1.3034780025482178, 1.365387201309204, 1.4272962808609009, 1.4892054796218872, 1.551114559173584, 1.6130237579345703, 1.6749329566955566, 1.7368420362472534, 1.7987512350082397, 1.8606603145599365, 1.9225696325302124, 1.9844788312911987, 2.0463879108428955, 2.108297109603882, 2.170206308364868, 2.2321155071258545, 2.2940244674682617, 2.355933666229248, 2.4178428649902344, 2.4797520637512207, 2.541661262512207, 2.6035704612731934, 2.6654794216156006, 2.727388620376587, 2.7892978191375732, 2.8512070178985596, 2.913116216659546, 2.9750254154205322, 3.0369346141815186, 3.098843574523926, 3.160752773284912, 3.2226619720458984, 3.2845711708068848, 3.346480369567871, 3.4083893299102783, 3.4702985286712646, 3.532207727432251, 3.594116687774658, 3.6560258865356445, 3.717935085296631, 3.779844284057617, 3.8417534828186035, 3.90366268157959]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 40.0, 84.0, 118.0, 157.0, 179.0, 160.0, 119.0, 59.0, 35.0, 13.0, 12.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05067789554595947, -0.04592546075582504, -0.04117302596569061, -0.03642059490084648, -0.03166816011071205, -0.02691572532057762, -0.02216329239308834, -0.01741085946559906, -0.01265842467546463, -0.007905990816652775, -0.0031535569578409195, 0.0015988769009709358, 0.006351310759782791, 0.011103745549917221, 0.015856178477406502, 0.020608611404895782, 0.025361046195030212, 0.030113480985164642, 0.03486591577529907, 0.039618346840143204, 0.044370781630277634, 0.049123216420412064, 0.053875647485256195, 0.058628082275390625, 0.06338051706552505, 0.06813295185565948, 0.07288538664579391, 0.07763782143592834, 0.08239024877548218, 0.0871426910161972, 0.09189511835575104, 0.09664755314588547, 0.1013999879360199, 0.10615242272615433, 0.11090485751628876, 0.11565729230642319, 0.12040972709655762, 0.12516215443611145, 0.12991459667682648, 0.1346670240163803, 0.13941946625709534, 0.14417189359664917, 0.1489243358373642, 0.15367676317691803, 0.15842920541763306, 0.1631816327571869, 0.16793407499790192, 0.17268650233745575, 0.17743892967700958, 0.18219135701656342, 0.18694379925727844, 0.19169622659683228, 0.1964486688375473, 0.20120109617710114, 0.20595353841781616, 0.21070596575737, 0.21545839309692383, 0.22021082043647766, 0.2249632626771927, 0.22971569001674652, 0.23446813225746155, 0.23922055959701538, 0.2439730018377304, 0.24872542917728424, 0.25347787141799927]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 3.0, 9.0, 10.0, 24.0, 21.0, 46.0, 57.0, 86.0, 91.0, 131.0, 150.0, 206.0, 313.0, 452.0, 593.0, 799.0, 1159.0, 1507.0, 2261.0, 3063.0, 4583.0, 6814.0, 10889.0, 20465.0, 87547.0, 771677.0, 82316.0, 20096.0, 10755.0, 6754.0, 4612.0, 3134.0, 2187.0, 1515.0, 1180.0, 817.0, 567.0, 478.0, 283.0, 226.0, 173.0, 123.0, 97.0, 85.0, 51.0, 41.0, 26.0, 28.0, 18.0, 9.0, 15.0, 2.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.023101806640625, -0.022368192672729492, -0.021634578704833984, -0.020900964736938477, -0.02016735076904297, -0.01943373680114746, -0.018700122833251953, -0.017966508865356445, -0.017232894897460938, -0.01649928092956543, -0.015765666961669922, -0.015032052993774414, -0.014298439025878906, -0.013564825057983398, -0.01283121109008789, -0.012097597122192383, -0.011363983154296875, -0.010630369186401367, -0.00989675521850586, -0.009163141250610352, -0.008429527282714844, -0.007695913314819336, -0.006962299346923828, -0.00622868537902832, -0.0054950714111328125, -0.004761457443237305, -0.004027843475341797, -0.003294229507446289, -0.0025606155395507812, -0.0018270015716552734, -0.0010933876037597656, -0.0003597736358642578, 0.00037384033203125, 0.0011074542999267578, 0.0018410682678222656, 0.0025746822357177734, 0.0033082962036132812, 0.004041910171508789, 0.004775524139404297, 0.005509138107299805, 0.0062427520751953125, 0.00697636604309082, 0.007709980010986328, 0.008443593978881836, 0.009177207946777344, 0.009910821914672852, 0.01064443588256836, 0.011378049850463867, 0.012111663818359375, 0.012845277786254883, 0.01357889175415039, 0.014312505722045898, 0.015046119689941406, 0.015779733657836914, 0.016513347625732422, 0.01724696159362793, 0.017980575561523438, 0.018714189529418945, 0.019447803497314453, 0.02018141746520996, 0.02091503143310547, 0.021648645401000977, 0.022382259368896484, 0.023115873336791992, 0.0238494873046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 4.0, 3.0, 5.0, 6.0, 11.0, 3.0, 7.0, 8.0, 7.0, 18.0, 26.0, 88.0, 201.0, 246.0, 183.0, 74.0, 20.0, 11.0, 10.0, 8.0, 9.0, 7.0, 9.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014486312866210938, -0.0014037638902664185, -0.0013588964939117432, -0.0013140290975570679, -0.0012691617012023926, -0.0012242943048477173, -0.001179426908493042, -0.0011345595121383667, -0.0010896921157836914, -0.0010448247194290161, -0.0009999573230743408, -0.0009550899267196655, -0.0009102225303649902, -0.0008653551340103149, -0.0008204877376556396, -0.0007756203413009644, -0.0007307529449462891, -0.0006858855485916138, -0.0006410181522369385, -0.0005961507558822632, -0.0005512833595275879, -0.0005064159631729126, -0.0004615485668182373, -0.000416681170463562, -0.0003718137741088867, -0.0003269463777542114, -0.00028207898139953613, -0.00023721158504486084, -0.00019234418869018555, -0.00014747679233551025, -0.00010260939598083496, -5.774199962615967e-05, -1.2874603271484375e-05, 3.199279308319092e-05, 7.686018943786621e-05, 0.0001217275857925415, 0.0001665949821472168, 0.0002114623785018921, 0.0002563297748565674, 0.0003011971712112427, 0.00034606456756591797, 0.00039093196392059326, 0.00043579936027526855, 0.00048066675662994385, 0.0005255341529846191, 0.0005704015493392944, 0.0006152689456939697, 0.000660136342048645, 0.0007050037384033203, 0.0007498711347579956, 0.0007947385311126709, 0.0008396059274673462, 0.0008844733238220215, 0.0009293407201766968, 0.0009742081165313721, 0.0010190755128860474, 0.0010639429092407227, 0.001108810305595398, 0.0011536777019500732, 0.0011985450983047485, 0.0012434124946594238, 0.0012882798910140991, 0.0013331472873687744, 0.0013780146837234497, 0.001422882080078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 3.0, 7.0, 7.0, 9.0, 10.0, 12.0, 20.0, 14.0, 12.0, 13.0, 16.0, 21.0, 22.0, 20.0, 33.0, 30.0, 33.0, 52.0, 87.0, 259.0, 1271.0, 10789.0, 949243.0, 81908.0, 3709.0, 489.0, 106.0, 52.0, 29.0, 26.0, 32.0, 20.0, 32.0, 19.0, 17.0, 21.0, 14.0, 10.0, 18.0, 12.0, 13.0, 7.0, 5.0, 6.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.07745361328125, -0.07509040832519531, -0.07272720336914062, -0.07036399841308594, -0.06800079345703125, -0.06563758850097656, -0.06327438354492188, -0.06091117858886719, -0.0585479736328125, -0.05618476867675781, -0.053821563720703125, -0.05145835876464844, -0.04909515380859375, -0.04673194885253906, -0.044368743896484375, -0.04200553894042969, -0.039642333984375, -0.03727912902832031, -0.034915924072265625, -0.03255271911621094, -0.03018951416015625, -0.027826309204101562, -0.025463104248046875, -0.023099899291992188, -0.0207366943359375, -0.018373489379882812, -0.016010284423828125, -0.013647079467773438, -0.01128387451171875, -0.008920669555664062, -0.006557464599609375, -0.0041942596435546875, -0.0018310546875, 0.0005321502685546875, 0.002895355224609375, 0.0052585601806640625, 0.00762176513671875, 0.009984970092773438, 0.012348175048828125, 0.014711380004882812, 0.0170745849609375, 0.019437789916992188, 0.021800994873046875, 0.024164199829101562, 0.02652740478515625, 0.028890609741210938, 0.031253814697265625, 0.03361701965332031, 0.035980224609375, 0.03834342956542969, 0.040706634521484375, 0.04306983947753906, 0.04543304443359375, 0.04779624938964844, 0.050159454345703125, 0.05252265930175781, 0.0548858642578125, 0.05724906921386719, 0.059612274169921875, 0.06197547912597656, 0.06433868408203125, 0.06670188903808594, 0.06906509399414062, 0.07142829895019531, 0.07379150390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 2.0, 5.0, 3.0, 5.0, 6.0, 9.0, 12.0, 12.0, 12.0, 13.0, 15.0, 16.0, 18.0, 23.0, 35.0, 27.0, 31.0, 35.0, 32.0, 35.0, 41.0, 38.0, 45.0, 38.0, 41.0, 26.0, 36.0, 39.0, 42.0, 28.0, 39.0, 28.0, 25.0, 27.0, 25.0, 13.0, 20.0, 13.0, 13.0, 13.0, 18.0, 9.0, 7.0, 9.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004245758056640625, -0.0041138529777526855, -0.003981947898864746, -0.0038500428199768066, -0.003718137741088867, -0.0035862326622009277, -0.0034543275833129883, -0.003322422504425049, -0.0031905174255371094, -0.00305861234664917, -0.0029267072677612305, -0.002794802188873291, -0.0026628971099853516, -0.002530992031097412, -0.0023990869522094727, -0.002267181873321533, -0.0021352767944335938, -0.0020033717155456543, -0.0018714666366577148, -0.0017395615577697754, -0.001607656478881836, -0.0014757513999938965, -0.001343846321105957, -0.0012119412422180176, -0.0010800361633300781, -0.0009481310844421387, -0.0008162260055541992, -0.0006843209266662598, -0.0005524158477783203, -0.00042051076889038086, -0.0002886056900024414, -0.00015670061111450195, -2.47955322265625e-05, 0.00010710954666137695, 0.0002390146255493164, 0.00037091970443725586, 0.0005028247833251953, 0.0006347298622131348, 0.0007666349411010742, 0.0008985400199890137, 0.0010304450988769531, 0.0011623501777648926, 0.001294255256652832, 0.0014261603355407715, 0.001558065414428711, 0.0016899704933166504, 0.0018218755722045898, 0.0019537806510925293, 0.0020856857299804688, 0.002217590808868408, 0.0023494958877563477, 0.002481400966644287, 0.0026133060455322266, 0.002745211124420166, 0.0028771162033081055, 0.003009021282196045, 0.0031409263610839844, 0.003272831439971924, 0.0034047365188598633, 0.0035366415977478027, 0.003668546676635742, 0.0038004517555236816, 0.003932356834411621, 0.0040642619132995605, 0.0041961669921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 20.0, 23.0, 58.0, 146.0, 899.0, 967740.0, 78803.0, 610.0, 99.0, 58.0, 31.0, 12.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0650634765625, -0.06364703178405762, -0.062230587005615234, -0.06081414222717285, -0.05939769744873047, -0.057981252670288086, -0.0565648078918457, -0.05514836311340332, -0.05373191833496094, -0.052315473556518555, -0.05089902877807617, -0.04948258399963379, -0.048066139221191406, -0.04664969444274902, -0.04523324966430664, -0.04381680488586426, -0.042400360107421875, -0.04098391532897949, -0.03956747055053711, -0.03815102577209473, -0.036734580993652344, -0.03531813621520996, -0.03390169143676758, -0.032485246658325195, -0.031068801879882812, -0.02965235710144043, -0.028235912322998047, -0.026819467544555664, -0.02540302276611328, -0.0239865779876709, -0.022570133209228516, -0.021153688430786133, -0.01973724365234375, -0.018320798873901367, -0.016904354095458984, -0.015487909317016602, -0.014071464538574219, -0.012655019760131836, -0.011238574981689453, -0.00982213020324707, -0.008405685424804688, -0.006989240646362305, -0.005572795867919922, -0.004156351089477539, -0.0027399063110351562, -0.0013234615325927734, 9.298324584960938e-05, 0.0015094280242919922, 0.002925872802734375, 0.004342317581176758, 0.005758762359619141, 0.0071752071380615234, 0.008591651916503906, 0.010008096694946289, 0.011424541473388672, 0.012840986251831055, 0.014257431030273438, 0.01567387580871582, 0.017090320587158203, 0.018506765365600586, 0.01992321014404297, 0.02133965492248535, 0.022756099700927734, 0.024172544479370117, 0.0255889892578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 11.0, 21.0, 72.0, 415.0, 369.0, 58.0, 18.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002791881561279297, -0.0002709701657295227, -0.0002627521753311157, -0.00025453418493270874, -0.00024631619453430176, -0.00023809820413589478, -0.0002298802137374878, -0.0002216622233390808, -0.00021344423294067383, -0.00020522624254226685, -0.00019700825214385986, -0.00018879026174545288, -0.0001805722713470459, -0.00017235428094863892, -0.00016413629055023193, -0.00015591830015182495, -0.00014770030975341797, -0.00013948231935501099, -0.000131264328956604, -0.00012304633855819702, -0.00011482834815979004, -0.00010661035776138306, -9.839236736297607e-05, -9.017437696456909e-05, -8.195638656616211e-05, -7.373839616775513e-05, -6.552040576934814e-05, -5.730241537094116e-05, -4.908442497253418e-05, -4.08664345741272e-05, -3.2648444175720215e-05, -2.4430453777313232e-05, -1.621246337890625e-05, -7.994472980499268e-06, 2.2351741790771484e-07, 8.441507816314697e-06, 1.665949821472168e-05, 2.4877488613128662e-05, 3.3095479011535645e-05, 4.131346940994263e-05, 4.953145980834961e-05, 5.774945020675659e-05, 6.596744060516357e-05, 7.418543100357056e-05, 8.240342140197754e-05, 9.062141180038452e-05, 9.88394021987915e-05, 0.00010705739259719849, 0.00011527538299560547, 0.00012349337339401245, 0.00013171136379241943, 0.00013992935419082642, 0.0001481473445892334, 0.00015636533498764038, 0.00016458332538604736, 0.00017280131578445435, 0.00018101930618286133, 0.0001892372965812683, 0.0001974552869796753, 0.00020567327737808228, 0.00021389126777648926, 0.00022210925817489624, 0.00023032724857330322, 0.0002385452389717102, 0.0002467632293701172]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 3.0, 13.0, 17.0, 29.0, 61.0, 231.0, 1288.0, 36434.0, 1006640.0, 3276.0, 373.0, 99.0, 37.0, 11.0, 13.0, 10.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048492431640625, -0.04703187942504883, -0.045571327209472656, -0.044110774993896484, -0.04265022277832031, -0.04118967056274414, -0.03972911834716797, -0.0382685661315918, -0.036808013916015625, -0.03534746170043945, -0.03388690948486328, -0.03242635726928711, -0.030965805053710938, -0.029505252838134766, -0.028044700622558594, -0.026584148406982422, -0.02512359619140625, -0.023663043975830078, -0.022202491760253906, -0.020741939544677734, -0.019281387329101562, -0.01782083511352539, -0.01636028289794922, -0.014899730682373047, -0.013439178466796875, -0.011978626251220703, -0.010518074035644531, -0.00905752182006836, -0.0075969696044921875, -0.006136417388916016, -0.004675865173339844, -0.003215312957763672, -0.0017547607421875, -0.0002942085266113281, 0.0011663436889648438, 0.0026268959045410156, 0.0040874481201171875, 0.005548000335693359, 0.007008552551269531, 0.008469104766845703, 0.009929656982421875, 0.011390209197998047, 0.012850761413574219, 0.01431131362915039, 0.015771865844726562, 0.017232418060302734, 0.018692970275878906, 0.020153522491455078, 0.02161407470703125, 0.023074626922607422, 0.024535179138183594, 0.025995731353759766, 0.027456283569335938, 0.02891683578491211, 0.03037738800048828, 0.03183794021606445, 0.033298492431640625, 0.0347590446472168, 0.03621959686279297, 0.03768014907836914, 0.03914070129394531, 0.040601253509521484, 0.042061805725097656, 0.04352235794067383, 0.04498291015625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 15.0, 16.0, 42.0, 81.0, 148.0, 452.0, 93.0, 38.0, 25.0, 14.0, 19.0, 10.0, 10.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00852203369140625, -0.00831061601638794, -0.008099198341369629, -0.007887780666351318, -0.007676362991333008, -0.007464945316314697, -0.007253527641296387, -0.007042109966278076, -0.006830692291259766, -0.006619274616241455, -0.0064078569412231445, -0.006196439266204834, -0.0059850215911865234, -0.005773603916168213, -0.005562186241149902, -0.005350768566131592, -0.005139350891113281, -0.004927933216094971, -0.00471651554107666, -0.00450509786605835, -0.004293680191040039, -0.0040822625160217285, -0.003870844841003418, -0.0036594271659851074, -0.003448009490966797, -0.0032365918159484863, -0.0030251741409301758, -0.0028137564659118652, -0.0026023387908935547, -0.002390921115875244, -0.0021795034408569336, -0.001968085765838623, -0.0017566680908203125, -0.001545250415802002, -0.0013338327407836914, -0.0011224150657653809, -0.0009109973907470703, -0.0006995797157287598, -0.0004881620407104492, -0.00027674436569213867, -6.532669067382812e-05, 0.00014609098434448242, 0.00035750865936279297, 0.0005689263343811035, 0.0007803440093994141, 0.0009917616844177246, 0.0012031793594360352, 0.0014145970344543457, 0.0016260147094726562, 0.0018374323844909668, 0.0020488500595092773, 0.002260267734527588, 0.0024716854095458984, 0.002683103084564209, 0.0028945207595825195, 0.00310593843460083, 0.0033173561096191406, 0.003528773784637451, 0.0037401914596557617, 0.003951609134674072, 0.004163026809692383, 0.004374444484710693, 0.004585862159729004, 0.0047972798347473145, 0.005008697509765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 8.0, 10.0, 11.0, 13.0, 30.0, 86.0, 339.0, 326.0, 88.0, 27.0, 15.0, 13.0, 7.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08528926968574524, -0.08200879395008087, -0.07872831076383591, -0.07544783502817154, -0.07216735929250717, -0.06888687610626221, -0.06560640037059784, -0.06232592463493347, -0.059045445173978806, -0.05576496571302414, -0.05248448997735977, -0.049204010516405106, -0.04592353105545044, -0.04264305531978607, -0.039362575858831406, -0.03608209639787674, -0.03280162066221237, -0.029521143063902855, -0.026240665465593338, -0.022960186004638672, -0.019679708406329155, -0.016399230808019638, -0.013118751347064972, -0.009838273748755455, -0.006557796150445938, -0.003277318086475134, 3.1599774956703186e-06, 0.003283638507127762, 0.006564116105437279, 0.009844593703746796, 0.013125073164701462, 0.01640555076301098, 0.0196860209107399, 0.022966498509049416, 0.026246976107358932, 0.0295274555683136, 0.032807931303977966, 0.03608841076493263, 0.0393688902258873, 0.042649365961551666, 0.04592984542250633, 0.049210324883461, 0.052490800619125366, 0.05577128008008003, 0.0590517595410347, 0.062332235276699066, 0.06561271846294403, 0.0688931941986084, 0.07217366993427277, 0.07545414566993713, 0.0787346288561821, 0.08201510459184647, 0.08529558032751083, 0.0885760635137558, 0.09185653924942017, 0.09513701498508453, 0.0984174907207489, 0.10169796645641327, 0.10497844964265823, 0.1082589253783226, 0.11153940111398697, 0.11481988430023193, 0.1181003600358963, 0.12138083577156067, 0.12466131895780563]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 2.0, 5.0, 3.0, 8.0, 16.0, 21.0, 18.0, 36.0, 27.0, 47.0, 67.0, 66.0, 92.0, 89.0, 90.0, 72.0, 61.0, 70.0, 43.0, 36.0, 29.0, 24.0, 24.0, 11.0, 5.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0361018180847168, -0.03461151570081711, -0.03312121331691742, -0.03163091093301773, -0.030140608549118042, -0.028650306165218353, -0.027160003781318665, -0.025669701397418976, -0.024179399013519287, -0.0226890966296196, -0.02119879424571991, -0.01970849186182022, -0.018218189477920532, -0.016727887094020844, -0.015237584710121155, -0.013747282326221466, -0.012256979942321777, -0.010766677558422089, -0.0092763751745224, -0.007786072790622711, -0.0062957704067230225, -0.004805468022823334, -0.003315165638923645, -0.0018248632550239563, -0.0003345608711242676, 0.0011557415127754211, 0.00264604389667511, 0.004136346280574799, 0.005626648664474487, 0.007116951048374176, 0.008607253432273865, 0.010097555816173553, 0.011587858200073242, 0.013078160583972931, 0.01456846296787262, 0.01605876535177231, 0.017549067735671997, 0.019039370119571686, 0.020529672503471375, 0.022019974887371063, 0.023510277271270752, 0.02500057965517044, 0.02649088203907013, 0.027981184422969818, 0.029471486806869507, 0.030961789190769196, 0.032452091574668884, 0.03394239395856857, 0.03543269634246826, 0.03692299872636795, 0.03841330111026764, 0.03990360349416733, 0.04139390587806702, 0.042884208261966705, 0.044374510645866394, 0.04586481302976608, 0.04735511541366577, 0.04884541779756546, 0.05033572018146515, 0.05182602256536484, 0.053316324949264526, 0.054806627333164215, 0.056296929717063904, 0.05778723210096359, 0.05927753448486328]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 6.0, 8.0, 6.0, 6.0, 8.0, 4.0, 14.0, 7.0, 13.0, 12.0, 10.0, 12.0, 10.0, 34.0, 24.0, 112.0, 1803.0, 4191749.0, 220.0, 38.0, 30.0, 14.0, 8.0, 12.0, 14.0, 16.0, 12.0, 0.0, 4.0, 10.0, 6.0, 2.0, 16.0, 6.0, 2.0, 8.0, 4.0, 0.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.9111328125, -1.8597412109375, -1.808349609375, -1.7569580078125, -1.70556640625, -1.6541748046875, -1.602783203125, -1.5513916015625, -1.5, -1.4486083984375, -1.397216796875, -1.3458251953125, -1.29443359375, -1.2430419921875, -1.191650390625, -1.1402587890625, -1.0888671875, -1.0374755859375, -0.986083984375, -0.9346923828125, -0.88330078125, -0.8319091796875, -0.780517578125, -0.7291259765625, -0.677734375, -0.6263427734375, -0.574951171875, -0.5235595703125, -0.47216796875, -0.4207763671875, -0.369384765625, -0.3179931640625, -0.2666015625, -0.2152099609375, -0.163818359375, -0.1124267578125, -0.06103515625, -0.0096435546875, 0.041748046875, 0.0931396484375, 0.14453125, 0.1959228515625, 0.247314453125, 0.2987060546875, 0.35009765625, 0.4014892578125, 0.452880859375, 0.5042724609375, 0.5556640625, 0.6070556640625, 0.658447265625, 0.7098388671875, 0.76123046875, 0.8126220703125, 0.864013671875, 0.9154052734375, 0.966796875, 1.0181884765625, 1.069580078125, 1.1209716796875, 1.17236328125, 1.2237548828125, 1.275146484375, 1.3265380859375, 1.3779296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 5.0, 2.0, 6.0, 3.0, 5.0, 4.0, 11.0, 4.0, 6.0, 9.0, 14.0, 21.0, 49.0, 118.0, 175.0, 230.0, 147.0, 65.0, 32.0, 14.0, 10.0, 7.0, 8.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012407302856445312, -0.0012008696794509888, -0.0011610090732574463, -0.0011211484670639038, -0.0010812878608703613, -0.0010414272546768188, -0.0010015666484832764, -0.0009617060422897339, -0.0009218454360961914, -0.0008819848299026489, -0.0008421242237091064, -0.000802263617515564, -0.0007624030113220215, -0.000722542405128479, -0.0006826817989349365, -0.000642821192741394, -0.0006029605865478516, -0.0005630999803543091, -0.0005232393741607666, -0.0004833787679672241, -0.00044351816177368164, -0.00040365755558013916, -0.0003637969493865967, -0.0003239363431930542, -0.0002840757369995117, -0.00024421513080596924, -0.00020435452461242676, -0.00016449391841888428, -0.0001246333122253418, -8.477270603179932e-05, -4.4912099838256836e-05, -5.0514936447143555e-06, 3.4809112548828125e-05, 7.46697187423706e-05, 0.00011453032493591309, 0.00015439093112945557, 0.00019425153732299805, 0.00023411214351654053, 0.000273972749710083, 0.0003138333559036255, 0.00035369396209716797, 0.00039355456829071045, 0.00043341517448425293, 0.0004732757806777954, 0.0005131363868713379, 0.0005529969930648804, 0.0005928575992584229, 0.0006327182054519653, 0.0006725788116455078, 0.0007124394178390503, 0.0007523000240325928, 0.0007921606302261353, 0.0008320212364196777, 0.0008718818426132202, 0.0009117424488067627, 0.0009516030550003052, 0.0009914636611938477, 0.0010313242673873901, 0.0010711848735809326, 0.001111045479774475, 0.0011509060859680176, 0.00119076669216156, 0.0012306272983551025, 0.001270487904548645, 0.0013103485107421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 10.0, 19.0, 35.0, 88.0, 199.0, 883.0, 4192156.0, 642.0, 143.0, 46.0, 30.0, 16.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.982421875, -1.94384765625, -1.9052734375, -1.86669921875, -1.828125, -1.78955078125, -1.7509765625, -1.71240234375, -1.673828125, -1.63525390625, -1.5966796875, -1.55810546875, -1.51953125, -1.48095703125, -1.4423828125, -1.40380859375, -1.365234375, -1.32666015625, -1.2880859375, -1.24951171875, -1.2109375, -1.17236328125, -1.1337890625, -1.09521484375, -1.056640625, -1.01806640625, -0.9794921875, -0.94091796875, -0.90234375, -0.86376953125, -0.8251953125, -0.78662109375, -0.748046875, -0.70947265625, -0.6708984375, -0.63232421875, -0.59375, -0.55517578125, -0.5166015625, -0.47802734375, -0.439453125, -0.40087890625, -0.3623046875, -0.32373046875, -0.28515625, -0.24658203125, -0.2080078125, -0.16943359375, -0.130859375, -0.09228515625, -0.0537109375, -0.01513671875, 0.0234375, 0.06201171875, 0.1005859375, 0.13916015625, 0.177734375, 0.21630859375, 0.2548828125, 0.29345703125, 0.33203125, 0.37060546875, 0.4091796875, 0.44775390625, 0.486328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 15.0, 18.0, 38.0, 92.0, 126.0, 297.0, 974.0, 1818.0, 371.0, 166.0, 73.0, 34.0, 23.0, 15.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0030727386474609375, -0.0028822720050811768, -0.002691805362701416, -0.0025013387203216553, -0.0023108720779418945, -0.002120405435562134, -0.001929938793182373, -0.0017394721508026123, -0.0015490055084228516, -0.0013585388660430908, -0.00116807222366333, -0.0009776055812835693, -0.0007871389389038086, -0.0005966722965240479, -0.0004062056541442871, -0.00021573901176452637, -2.5272369384765625e-05, 0.00016519427299499512, 0.00035566091537475586, 0.0005461275577545166, 0.0007365942001342773, 0.0009270608425140381, 0.0011175274848937988, 0.0013079941272735596, 0.0014984607696533203, 0.001688927412033081, 0.0018793940544128418, 0.0020698606967926025, 0.0022603273391723633, 0.002450793981552124, 0.0026412606239318848, 0.0028317272663116455, 0.0030221939086914062, 0.003212660551071167, 0.0034031271934509277, 0.0035935938358306885, 0.0037840604782104492, 0.00397452712059021, 0.004164993762969971, 0.0043554604053497314, 0.004545927047729492, 0.004736393690109253, 0.004926860332489014, 0.005117326974868774, 0.005307793617248535, 0.005498260259628296, 0.005688726902008057, 0.005879193544387817, 0.006069660186767578, 0.006260126829147339, 0.0064505934715271, 0.00664106011390686, 0.006831526756286621, 0.007021993398666382, 0.007212460041046143, 0.007402926683425903, 0.007593393325805664, 0.007783859968185425, 0.007974326610565186, 0.008164793252944946, 0.008355259895324707, 0.008545726537704468, 0.008736193180084229, 0.00892665982246399, 0.00911712646484375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 1007.0, 1.0, 0.0, 2.0], "bins": [-4.851652145385742, -4.771372318267822, -4.691092491149902, -4.610812664031982, -4.5305328369140625, -4.450253009796143, -4.369973182678223, -4.2896928787231445, -4.209413051605225, -4.129133224487305, -4.048853397369385, -3.968573570251465, -3.888293504714966, -3.808013677597046, -3.727733850479126, -3.647454023361206, -3.5671744346618652, -3.4868946075439453, -3.4066147804260254, -3.3263349533081055, -3.2460548877716064, -3.1657750606536865, -3.0854952335357666, -3.0052154064178467, -2.9249353408813477, -2.8446555137634277, -2.764375686645508, -2.684095859527588, -2.603815793991089, -2.523535966873169, -2.443256139755249, -2.362976312637329, -2.2826967239379883, -2.2024168968200684, -2.1221370697021484, -2.0418572425842285, -1.961577296257019, -1.8812973499298096, -1.8010175228118896, -1.7207376956939697, -1.6404577493667603, -1.5601779222488403, -1.4798979759216309, -1.399618148803711, -1.319338321685791, -1.239058494567871, -1.1587785482406616, -1.0784987211227417, -0.9982188940048218, -0.9179390072822571, -0.8376591801643372, -0.7573792934417725, -0.6770994663238525, -0.5968195796012878, -0.5165396928787231, -0.4362598657608032, -0.35597994923591614, -0.27570009231567383, -0.19542022049427032, -0.11514034867286682, -0.03486049175262451, 0.0454193651676178, 0.1256992518901825, 0.20597907900810242, 0.2862589657306671]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 19.0, 56.0, 104.0, 201.0, 248.0, 186.0, 117.0, 43.0, 18.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04269814491271973, -0.03907020390033722, -0.03544226661324501, -0.0318143293261528, -0.028186388313770294, -0.024558449164032936, -0.020930510014295578, -0.01730257086455822, -0.013674631714820862, -0.010046692565083504, -0.006418753415346146, -0.0027908142656087875, 0.0008371248841285706, 0.004465064033865929, 0.008093003183603287, 0.011720942333340645, 0.015348881483078003, 0.01897682063281536, 0.02260475978255272, 0.026232698932290077, 0.029860638082027435, 0.03348857909440994, 0.03711651638150215, 0.04074445366859436, 0.04437239468097687, 0.048000335693359375, 0.051628272980451584, 0.05525621026754379, 0.0588841512799263, 0.06251209229230881, 0.06614002585411072, 0.06976796686649323, 0.07339590787887573, 0.07702384889125824, 0.08065178990364075, 0.08427972346544266, 0.08790766447782516, 0.09153560549020767, 0.09516353905200958, 0.09879148006439209, 0.1024194210767746, 0.1060473620891571, 0.10967530310153961, 0.11330323666334152, 0.11693117767572403, 0.12055911868810654, 0.12418705224990845, 0.12781499326229095, 0.13144293427467346, 0.13507087528705597, 0.13869881629943848, 0.14232675731182098, 0.1459546983242035, 0.1495826244354248, 0.1532105654478073, 0.15683850646018982, 0.16046644747257233, 0.16409438848495483, 0.16772232949733734, 0.17135027050971985, 0.17497819662094116, 0.17860613763332367, 0.18223407864570618, 0.18586201965808868, 0.1894899606704712]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 6.0, 6.0, 16.0, 8.0, 15.0, 18.0, 12.0, 17.0, 17.0, 18.0, 13.0, 21.0, 31.0, 41.0, 37.0, 36.0, 36.0, 37.0, 72.0, 249.0, 219949.0, 826988.0, 413.0, 92.0, 67.0, 33.0, 34.0, 33.0, 16.0, 27.0, 28.0, 29.0, 23.0, 18.0, 10.0, 21.0, 10.0, 10.0, 9.0, 5.0, 7.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.58935546875, -0.5720596313476562, -0.5547637939453125, -0.5374679565429688, -0.520172119140625, -0.5028762817382812, -0.4855804443359375, -0.46828460693359375, -0.45098876953125, -0.43369293212890625, -0.4163970947265625, -0.39910125732421875, -0.381805419921875, -0.36450958251953125, -0.3472137451171875, -0.32991790771484375, -0.3126220703125, -0.29532623291015625, -0.2780303955078125, -0.26073455810546875, -0.243438720703125, -0.22614288330078125, -0.2088470458984375, -0.19155120849609375, -0.17425537109375, -0.15695953369140625, -0.1396636962890625, -0.12236785888671875, -0.105072021484375, -0.08777618408203125, -0.0704803466796875, -0.05318450927734375, -0.035888671875, -0.01859283447265625, -0.0012969970703125, 0.01599884033203125, 0.033294677734375, 0.05059051513671875, 0.0678863525390625, 0.08518218994140625, 0.10247802734375, 0.11977386474609375, 0.1370697021484375, 0.15436553955078125, 0.171661376953125, 0.18895721435546875, 0.2062530517578125, 0.22354888916015625, 0.2408447265625, 0.25814056396484375, 0.2754364013671875, 0.29273223876953125, 0.310028076171875, 0.32732391357421875, 0.3446197509765625, 0.36191558837890625, 0.37921142578125, 0.39650726318359375, 0.4138031005859375, 0.43109893798828125, 0.448394775390625, 0.46569061279296875, 0.4829864501953125, 0.5002822875976562, 0.517578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [27.0, 273.0, 590.0, 121.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004947662353515625, -0.0028790831565856934, -0.0008105039596557617, 0.00125807523727417, 0.0033266544342041016, 0.005395233631134033, 0.007463812828063965, 0.009532392024993896, 0.011600971221923828, 0.01366955041885376, 0.01573812961578369, 0.017806708812713623, 0.019875288009643555, 0.021943867206573486, 0.024012446403503418, 0.02608102560043335, 0.02814960479736328, 0.030218183994293213, 0.032286763191223145, 0.034355342388153076, 0.03642392158508301, 0.03849250078201294, 0.04056107997894287, 0.0426296591758728, 0.044698238372802734, 0.046766817569732666, 0.0488353967666626, 0.05090397596359253, 0.05297255516052246, 0.05504113435745239, 0.057109713554382324, 0.059178292751312256, 0.06124687194824219, 0.06331545114517212, 0.06538403034210205, 0.06745260953903198, 0.06952118873596191, 0.07158976793289185, 0.07365834712982178, 0.07572692632675171, 0.07779550552368164, 0.07986408472061157, 0.0819326639175415, 0.08400124311447144, 0.08606982231140137, 0.0881384015083313, 0.09020698070526123, 0.09227555990219116, 0.0943441390991211, 0.09641271829605103, 0.09848129749298096, 0.10054987668991089, 0.10261845588684082, 0.10468703508377075, 0.10675561428070068, 0.10882419347763062, 0.11089277267456055, 0.11296135187149048, 0.11502993106842041, 0.11709851026535034, 0.11916708946228027, 0.1212356686592102, 0.12330424785614014, 0.12537282705307007, 0.12744140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 4.0, 7.0, 8.0, 16.0, 15.0, 24.0, 31.0, 27.0, 49.0, 64.0, 123.0, 202.0, 503.0, 1448.0, 5697.0, 32482.0, 381129.0, 570476.0, 45758.0, 7334.0, 1860.0, 640.0, 265.0, 122.0, 70.0, 35.0, 32.0, 28.0, 18.0, 14.0, 6.0, 16.0, 12.0, 7.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2357177734375, -0.22837066650390625, -0.2210235595703125, -0.21367645263671875, -0.206329345703125, -0.19898223876953125, -0.1916351318359375, -0.18428802490234375, -0.17694091796875, -0.16959381103515625, -0.1622467041015625, -0.15489959716796875, -0.147552490234375, -0.14020538330078125, -0.1328582763671875, -0.12551116943359375, -0.1181640625, -0.11081695556640625, -0.1034698486328125, -0.09612274169921875, -0.088775634765625, -0.08142852783203125, -0.0740814208984375, -0.06673431396484375, -0.05938720703125, -0.05204010009765625, -0.0446929931640625, -0.03734588623046875, -0.029998779296875, -0.02265167236328125, -0.0153045654296875, -0.00795745849609375, -0.0006103515625, 0.00673675537109375, 0.0140838623046875, 0.02143096923828125, 0.028778076171875, 0.03612518310546875, 0.0434722900390625, 0.05081939697265625, 0.05816650390625, 0.06551361083984375, 0.0728607177734375, 0.08020782470703125, 0.087554931640625, 0.09490203857421875, 0.1022491455078125, 0.10959625244140625, 0.116943359375, 0.12429046630859375, 0.1316375732421875, 0.13898468017578125, 0.146331787109375, 0.15367889404296875, 0.1610260009765625, 0.16837310791015625, 0.17572021484375, 0.18306732177734375, 0.1904144287109375, 0.19776153564453125, 0.205108642578125, 0.21245574951171875, 0.2198028564453125, 0.22714996337890625, 0.2344970703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 7.0, 12.0, 13.0, 15.0, 20.0, 26.0, 27.0, 29.0, 38.0, 45.0, 49.0, 52.0, 50.0, 65.0, 55.0, 73.0, 53.0, 51.0, 54.0, 38.0, 39.0, 33.0, 21.0, 25.0, 24.0, 12.0, 14.0, 11.0, 1.0, 4.0, 13.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.1256103515625, -0.12235069274902344, -0.11909103393554688, -0.11583137512207031, -0.11257171630859375, -0.10931205749511719, -0.10605239868164062, -0.10279273986816406, -0.0995330810546875, -0.09627342224121094, -0.09301376342773438, -0.08975410461425781, -0.08649444580078125, -0.08323478698730469, -0.07997512817382812, -0.07671546936035156, -0.073455810546875, -0.07019615173339844, -0.06693649291992188, -0.06367683410644531, -0.06041717529296875, -0.05715751647949219, -0.053897857666015625, -0.05063819885253906, -0.0473785400390625, -0.04411888122558594, -0.040859222412109375, -0.03759956359863281, -0.03433990478515625, -0.031080245971679688, -0.027820587158203125, -0.024560928344726562, -0.02130126953125, -0.018041610717773438, -0.014781951904296875, -0.011522293090820312, -0.00826263427734375, -0.0050029754638671875, -0.001743316650390625, 0.0015163421630859375, 0.0047760009765625, 0.008035659790039062, 0.011295318603515625, 0.014554977416992188, 0.01781463623046875, 0.021074295043945312, 0.024333953857421875, 0.027593612670898438, 0.030853271484375, 0.03411293029785156, 0.037372589111328125, 0.04063224792480469, 0.04389190673828125, 0.04715156555175781, 0.050411224365234375, 0.05367088317871094, 0.0569305419921875, 0.06019020080566406, 0.06344985961914062, 0.06670951843261719, 0.06996917724609375, 0.07322883605957031, 0.07648849487304688, 0.07974815368652344, 0.0830078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 2.0, 5.0, 7.0, 10.0, 15.0, 26.0, 27.0, 46.0, 85.0, 135.0, 295.0, 574.0, 1525.0, 4876.0, 24841.0, 591626.0, 397082.0, 20427.0, 4345.0, 1428.0, 541.0, 273.0, 124.0, 71.0, 47.0, 34.0, 25.0, 24.0, 11.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22418975830078125, -0.2164459228515625, -0.20870208740234375, -0.200958251953125, -0.19321441650390625, -0.1854705810546875, -0.17772674560546875, -0.16998291015625, -0.16223907470703125, -0.1544952392578125, -0.14675140380859375, -0.139007568359375, -0.13126373291015625, -0.1235198974609375, -0.11577606201171875, -0.1080322265625, -0.10028839111328125, -0.0925445556640625, -0.08480072021484375, -0.077056884765625, -0.06931304931640625, -0.0615692138671875, -0.05382537841796875, -0.04608154296875, -0.03833770751953125, -0.0305938720703125, -0.02285003662109375, -0.015106201171875, -0.00736236572265625, 0.0003814697265625, 0.00812530517578125, 0.015869140625, 0.02361297607421875, 0.0313568115234375, 0.03910064697265625, 0.046844482421875, 0.05458831787109375, 0.0623321533203125, 0.07007598876953125, 0.07781982421875, 0.08556365966796875, 0.0933074951171875, 0.10105133056640625, 0.108795166015625, 0.11653900146484375, 0.1242828369140625, 0.13202667236328125, 0.1397705078125, 0.14751434326171875, 0.1552581787109375, 0.16300201416015625, 0.170745849609375, 0.17848968505859375, 0.1862335205078125, 0.19397735595703125, 0.20172119140625, 0.20946502685546875, 0.2172088623046875, 0.22495269775390625, 0.232696533203125, 0.24044036865234375, 0.2481842041015625, 0.25592803955078125, 0.263671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 6.0, 8.0, 10.0, 13.0, 18.0, 18.0, 37.0, 45.0, 68.0, 105.0, 156.0, 102.0, 112.0, 88.0, 58.0, 31.0, 23.0, 23.0, 19.0, 6.0, 9.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7702579498291016e-05, -1.7132610082626343e-05, -1.656264066696167e-05, -1.5992671251296997e-05, -1.5422701835632324e-05, -1.4852732419967651e-05, -1.4282763004302979e-05, -1.3712793588638306e-05, -1.3142824172973633e-05, -1.257285475730896e-05, -1.2002885341644287e-05, -1.1432915925979614e-05, -1.0862946510314941e-05, -1.0292977094650269e-05, -9.723007678985596e-06, -9.153038263320923e-06, -8.58306884765625e-06, -8.013099431991577e-06, -7.443130016326904e-06, -6.8731606006622314e-06, -6.303191184997559e-06, -5.733221769332886e-06, -5.163252353668213e-06, -4.59328293800354e-06, -4.023313522338867e-06, -3.4533441066741943e-06, -2.8833746910095215e-06, -2.3134052753448486e-06, -1.7434358596801758e-06, -1.173466444015503e-06, -6.034970283508301e-07, -3.3527612686157227e-08, 5.364418029785156e-07, 1.1064112186431885e-06, 1.6763806343078613e-06, 2.246350049972534e-06, 2.816319465637207e-06, 3.38628888130188e-06, 3.956258296966553e-06, 4.526227712631226e-06, 5.0961971282958984e-06, 5.666166543960571e-06, 6.236135959625244e-06, 6.806105375289917e-06, 7.37607479095459e-06, 7.946044206619263e-06, 8.516013622283936e-06, 9.085983037948608e-06, 9.655952453613281e-06, 1.0225921869277954e-05, 1.0795891284942627e-05, 1.13658607006073e-05, 1.1935830116271973e-05, 1.2505799531936646e-05, 1.3075768947601318e-05, 1.3645738363265991e-05, 1.4215707778930664e-05, 1.4785677194595337e-05, 1.535564661026001e-05, 1.5925616025924683e-05, 1.6495585441589355e-05, 1.706555485725403e-05, 1.76355242729187e-05, 1.8205493688583374e-05, 1.8775463104248047e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 13.0, 16.0, 36.0, 54.0, 86.0, 252.0, 995.0, 13498.0, 997796.0, 33814.0, 1510.0, 279.0, 89.0, 45.0, 23.0, 11.0, 13.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68408203125, -0.6676445007324219, -0.6512069702148438, -0.6347694396972656, -0.6183319091796875, -0.6018943786621094, -0.5854568481445312, -0.5690193176269531, -0.552581787109375, -0.5361442565917969, -0.5197067260742188, -0.5032691955566406, -0.4868316650390625, -0.4703941345214844, -0.45395660400390625, -0.4375190734863281, -0.42108154296875, -0.4046440124511719, -0.38820648193359375, -0.3717689514160156, -0.3553314208984375, -0.3388938903808594, -0.32245635986328125, -0.3060188293457031, -0.289581298828125, -0.2731437683105469, -0.25670623779296875, -0.24026870727539062, -0.2238311767578125, -0.20739364624023438, -0.19095611572265625, -0.17451858520507812, -0.1580810546875, -0.14164352416992188, -0.12520599365234375, -0.10876846313476562, -0.0923309326171875, -0.07589340209960938, -0.05945587158203125, -0.043018341064453125, -0.026580810546875, -0.010143280029296875, 0.00629425048828125, 0.022731781005859375, 0.0391693115234375, 0.055606842041015625, 0.07204437255859375, 0.08848190307617188, 0.10491943359375, 0.12135696411132812, 0.13779449462890625, 0.15423202514648438, 0.1706695556640625, 0.18710708618164062, 0.20354461669921875, 0.21998214721679688, 0.236419677734375, 0.2528572082519531, 0.26929473876953125, 0.2857322692871094, 0.3021697998046875, 0.3186073303222656, 0.33504486083984375, 0.3514823913574219, 0.367919921875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 0.0, 5.0, 9.0, 9.0, 10.0, 20.0, 20.0, 28.0, 66.0, 129.0, 285.0, 209.0, 92.0, 45.0, 30.0, 11.0, 9.0, 9.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275390625, -0.268951416015625, -0.26251220703125, -0.256072998046875, -0.2496337890625, -0.243194580078125, -0.23675537109375, -0.230316162109375, -0.223876953125, -0.217437744140625, -0.21099853515625, -0.204559326171875, -0.1981201171875, -0.191680908203125, -0.18524169921875, -0.178802490234375, -0.17236328125, -0.165924072265625, -0.15948486328125, -0.153045654296875, -0.1466064453125, -0.140167236328125, -0.13372802734375, -0.127288818359375, -0.120849609375, -0.114410400390625, -0.10797119140625, -0.101531982421875, -0.0950927734375, -0.088653564453125, -0.08221435546875, -0.075775146484375, -0.0693359375, -0.062896728515625, -0.05645751953125, -0.050018310546875, -0.0435791015625, -0.037139892578125, -0.03070068359375, -0.024261474609375, -0.017822265625, -0.011383056640625, -0.00494384765625, 0.001495361328125, 0.0079345703125, 0.014373779296875, 0.02081298828125, 0.027252197265625, 0.03369140625, 0.040130615234375, 0.04656982421875, 0.053009033203125, 0.0594482421875, 0.065887451171875, 0.07232666015625, 0.078765869140625, 0.085205078125, 0.091644287109375, 0.09808349609375, 0.104522705078125, 0.1109619140625, 0.117401123046875, 0.12384033203125, 0.130279541015625, 0.13671875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 12.0, 186.0, 814.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9015557765960693, -2.4335384368896484, -1.9655213356018066, -1.4975041151046753, -1.029486894607544, -0.5614697933197021, -0.09345245361328125, 0.37456488609313965, 0.8425819873809814, 1.3105992078781128, 1.7786164283752441, 2.246633529663086, 2.714650869369507, 3.1826679706573486, 3.6506853103637695, 4.1187028884887695, 4.586719512939453, 5.054736614227295, 5.522753715515137, 5.990771293640137, 6.4587883949279785, 6.92680549621582, 7.39482307434082, 7.862840175628662, 8.330857276916504, 8.798874855041504, 9.266891479492188, 9.734909057617188, 10.202926635742188, 10.670943260192871, 11.138960838317871, 11.606977462768555, 12.074995040893555, 12.543012619018555, 13.011029243469238, 13.479046821594238, 13.947063446044922, 14.415081024169922, 14.883098602294922, 15.351116180419922, 15.819132804870605, 16.28714942932129, 16.75516700744629, 17.22318458557129, 17.69120216369629, 18.159217834472656, 18.627235412597656, 19.095252990722656, 19.563270568847656, 20.031288146972656, 20.499305725097656, 20.967321395874023, 21.435338973999023, 21.903356552124023, 22.371374130249023, 22.839391708374023, 23.30740737915039, 23.77542495727539, 24.24344253540039, 24.711458206176758, 25.179475784301758, 25.647493362426758, 26.115510940551758, 26.583528518676758, 27.051546096801758]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 3.0, 26.0, 30.0, 49.0, 59.0, 71.0, 102.0, 96.0, 105.0, 101.0, 94.0, 90.0, 71.0, 40.0, 27.0, 19.0, 9.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.814208984375, -0.7695979475975037, -0.7249868512153625, -0.6803758144378662, -0.6357647180557251, -0.5911536812782288, -0.5465426445007324, -0.5019315481185913, -0.45732051134109497, -0.41270944476127625, -0.3680983781814575, -0.3234873414039612, -0.27887627482414246, -0.23426520824432373, -0.1896541714668274, -0.14504310488700867, -0.10043203830718994, -0.05582097917795181, -0.011209920048713684, 0.03340113162994385, 0.07801219820976257, 0.1226232647895813, 0.16723430156707764, 0.21184536814689636, 0.2564564347267151, 0.3010675013065338, 0.34567856788635254, 0.3902896046638489, 0.4349006712436676, 0.47951173782348633, 0.5241227746009827, 0.568733811378479, 0.6133449077606201, 0.6579559445381165, 0.7025670409202576, 0.7471780776977539, 0.791789174079895, 0.8364002108573914, 0.8810112476348877, 0.9256223440170288, 0.9702333807945251, 1.0148444175720215, 1.0594555139541626, 1.1040666103363037, 1.1486775875091553, 1.1932886838912964, 1.2378997802734375, 1.282510757446289, 1.3271218538284302, 1.3717329502105713, 1.4163439273834229, 1.460955023765564, 1.505566120147705, 1.5501770973205566, 1.5947881937026978, 1.6393992900848389, 1.6840102672576904, 1.7286213636398315, 1.773232340812683, 1.8178434371948242, 1.8624545335769653, 1.9070656299591064, 1.951676607131958, 1.9962877035140991, 2.0408987998962402]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 12.0, 50.0, 265.0, 16782.0, 4175799.0, 907.0, 230.0, 102.0, 59.0, 44.0, 20.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.54974365234375, -0.4432373046875, -0.33673095703125, -0.230224609375, -0.12371826171875, -0.0172119140625, 0.08929443359375, 0.19580078125, 0.30230712890625, 0.4088134765625, 0.51531982421875, 0.621826171875, 0.72833251953125, 0.8348388671875, 0.94134521484375, 1.0478515625, 1.15435791015625, 1.2608642578125, 1.36737060546875, 1.473876953125, 1.58038330078125, 1.6868896484375, 1.79339599609375, 1.89990234375, 2.00640869140625, 2.1129150390625, 2.21942138671875, 2.325927734375, 2.43243408203125, 2.5389404296875, 2.64544677734375, 2.751953125, 2.85845947265625, 2.9649658203125, 3.07147216796875, 3.177978515625, 3.28448486328125, 3.3909912109375, 3.49749755859375, 3.60400390625, 3.71051025390625, 3.8170166015625, 3.92352294921875, 4.030029296875, 4.13653564453125, 4.2430419921875, 4.34954833984375, 4.4560546875, 4.56256103515625, 4.6690673828125, 4.77557373046875, 4.882080078125, 4.98858642578125, 5.0950927734375, 5.20159912109375, 5.30810546875, 5.41461181640625, 5.5211181640625, 5.62762451171875, 5.734130859375, 5.84063720703125, 5.9471435546875, 6.05364990234375, 6.16015625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 10.0, 59.0, 141.0, 284.0, 304.0, 157.0, 37.0, 22.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0188446044921875, -0.016173601150512695, -0.01350259780883789, -0.010831594467163086, -0.008160591125488281, -0.0054895877838134766, -0.002818584442138672, -0.0001475811004638672, 0.0025234222412109375, 0.005194425582885742, 0.007865428924560547, 0.010536432266235352, 0.013207435607910156, 0.01587843894958496, 0.018549442291259766, 0.02122044563293457, 0.023891448974609375, 0.02656245231628418, 0.029233455657958984, 0.03190445899963379, 0.034575462341308594, 0.0372464656829834, 0.0399174690246582, 0.04258847236633301, 0.04525947570800781, 0.04793047904968262, 0.05060148239135742, 0.05327248573303223, 0.05594348907470703, 0.058614492416381836, 0.06128549575805664, 0.06395649909973145, 0.06662750244140625, 0.06929850578308105, 0.07196950912475586, 0.07464051246643066, 0.07731151580810547, 0.07998251914978027, 0.08265352249145508, 0.08532452583312988, 0.08799552917480469, 0.09066653251647949, 0.0933375358581543, 0.0960085391998291, 0.0986795425415039, 0.10135054588317871, 0.10402154922485352, 0.10669255256652832, 0.10936355590820312, 0.11203455924987793, 0.11470556259155273, 0.11737656593322754, 0.12004756927490234, 0.12271857261657715, 0.12538957595825195, 0.12806057929992676, 0.13073158264160156, 0.13340258598327637, 0.13607358932495117, 0.13874459266662598, 0.14141559600830078, 0.14408659934997559, 0.1467576026916504, 0.1494286060333252, 0.152099609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 8.0, 23.0, 62.0, 92.0, 120.0, 219.0, 497.0, 96348.0, 4095591.0, 537.0, 247.0, 170.0, 132.0, 76.0, 57.0, 39.0, 33.0, 8.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.326385498046875, -3.18206787109375, -3.037750244140625, -2.8934326171875, -2.749114990234375, -2.60479736328125, -2.460479736328125, -2.316162109375, -2.171844482421875, -2.02752685546875, -1.883209228515625, -1.7388916015625, -1.594573974609375, -1.45025634765625, -1.305938720703125, -1.16162109375, -1.017303466796875, -0.87298583984375, -0.728668212890625, -0.5843505859375, -0.440032958984375, -0.29571533203125, -0.151397705078125, -0.007080078125, 0.137237548828125, 0.28155517578125, 0.425872802734375, 0.5701904296875, 0.714508056640625, 0.85882568359375, 1.003143310546875, 1.1474609375, 1.291778564453125, 1.43609619140625, 1.580413818359375, 1.7247314453125, 1.869049072265625, 2.01336669921875, 2.157684326171875, 2.302001953125, 2.446319580078125, 2.59063720703125, 2.734954833984375, 2.8792724609375, 3.023590087890625, 3.16790771484375, 3.312225341796875, 3.45654296875, 3.600860595703125, 3.74517822265625, 3.889495849609375, 4.0338134765625, 4.178131103515625, 4.32244873046875, 4.466766357421875, 4.611083984375, 4.755401611328125, 4.89971923828125, 5.044036865234375, 5.1883544921875, 5.332672119140625, 5.47698974609375, 5.621307373046875, 5.765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 24.0, 131.0, 3686.0, 226.0, 10.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12420654296875, -0.10988330841064453, -0.09556007385253906, -0.0812368392944336, -0.06691360473632812, -0.052590370178222656, -0.03826713562011719, -0.02394390106201172, -0.00962066650390625, 0.004702568054199219, 0.019025802612304688, 0.033349037170410156, 0.047672271728515625, 0.061995506286621094, 0.07631874084472656, 0.09064197540283203, 0.1049652099609375, 0.11928844451904297, 0.13361167907714844, 0.1479349136352539, 0.16225814819335938, 0.17658138275146484, 0.1909046173095703, 0.20522785186767578, 0.21955108642578125, 0.23387432098388672, 0.2481975555419922, 0.26252079010009766, 0.2768440246582031, 0.2911672592163086, 0.30549049377441406, 0.31981372833251953, 0.334136962890625, 0.34846019744873047, 0.36278343200683594, 0.3771066665649414, 0.3914299011230469, 0.40575313568115234, 0.4200763702392578, 0.4343996047973633, 0.44872283935546875, 0.4630460739135742, 0.4773693084716797, 0.49169254302978516, 0.5060157775878906, 0.5203390121459961, 0.5346622467041016, 0.548985481262207, 0.5633087158203125, 0.577631950378418, 0.5919551849365234, 0.6062784194946289, 0.6206016540527344, 0.6349248886108398, 0.6492481231689453, 0.6635713577270508, 0.6778945922851562, 0.6922178268432617, 0.7065410614013672, 0.7208642959594727, 0.7351875305175781, 0.7495107650756836, 0.7638339996337891, 0.7781572341918945, 0.79248046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 12.0, 55.0, 476.0, 428.0, 32.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884055137634277, -0.9903718829154968, -0.7923382520675659, -0.594304621219635, -0.3962709903717041, -0.1982373595237732, -0.00020372867584228516, 0.1978299617767334, 0.39586353302001953, 0.5938971638679504, 0.7919307947158813, 0.9899644255638123, 1.1879980564117432, 1.3860316276550293, 1.584065318107605, 1.7820990085601807, 1.9801325798034668, 2.178166151046753, 2.376199722290039, 2.5742335319519043, 2.7722671031951904, 2.9703006744384766, 3.168334484100342, 3.366368055343628, 3.564401626586914, 3.7624351978302, 3.9604687690734863, 4.158502578735352, 4.356535911560059, 4.554569721221924, 4.752603530883789, 4.950636863708496, 5.148670196533203, 5.346704006195068, 5.544737339019775, 5.742771148681641, 5.940804481506348, 6.138838291168213, 6.336872100830078, 6.534905433654785, 6.73293924331665, 6.930973052978516, 7.129006385803223, 7.327040195465088, 7.525074005126953, 7.72310733795166, 7.921141147613525, 8.11917495727539, 8.317208290100098, 8.515241622924805, 8.713275909423828, 8.911309242248535, 9.109342575073242, 9.307376861572266, 9.505410194396973, 9.70344352722168, 9.901477813720703, 10.09951114654541, 10.297545433044434, 10.49557876586914, 10.693612098693848, 10.891646385192871, 11.089679718017578, 11.287713050842285, 11.485746383666992]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 14.0, 17.0, 65.0, 80.0, 96.0, 150.0, 169.0, 143.0, 105.0, 74.0, 39.0, 25.0, 13.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.661320686340332, -2.579507827758789, -2.497695207595825, -2.4158823490142822, -2.3340697288513184, -2.2522568702697754, -2.1704442501068115, -2.0886313915252686, -2.0068187713623047, -1.9250060319900513, -1.8431932926177979, -1.7613805532455444, -1.679567813873291, -1.597754955291748, -1.5159422159194946, -1.4341294765472412, -1.3523166179656982, -1.2705038785934448, -1.1886911392211914, -1.106878399848938, -1.0250656604766846, -0.9432528614997864, -0.8614400625228882, -0.7796273231506348, -0.6978145837783813, -0.6160018444061279, -0.5341891050338745, -0.4523763060569763, -0.3705635666847229, -0.2887508273124695, -0.20693805813789368, -0.12512528896331787, -0.04331254959106445, 0.03850020468235016, 0.12031295895576477, 0.20212571322917938, 0.283938467502594, 0.3657512068748474, 0.4475639760494232, 0.529376745223999, 0.6111894845962524, 0.6930022239685059, 0.7748149633407593, 0.8566277623176575, 0.9384405016899109, 1.0202531814575195, 1.1020660400390625, 1.183878779411316, 1.2656915187835693, 1.3475042581558228, 1.4293169975280762, 1.5111297369003296, 1.592942476272583, 1.674755334854126, 1.7565680742263794, 1.8383808135986328, 1.9201935529708862, 2.0020062923431396, 2.0838191509246826, 2.1656317710876465, 2.2474446296691895, 2.3292572498321533, 2.4110701084136963, 2.49288272857666, 2.574695587158203]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 16.0, 26.0, 18.0, 22.0, 41.0, 69.0, 97.0, 235.0, 468.0, 1264.0, 4637.0, 54883.0, 909519.0, 69523.0, 5327.0, 1327.0, 508.0, 231.0, 102.0, 76.0, 38.0, 28.0, 20.0, 19.0, 12.0, 15.0, 7.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.07464599609375, -1.0369873046875, -0.99932861328125, -0.961669921875, -0.92401123046875, -0.8863525390625, -0.84869384765625, -0.81103515625, -0.77337646484375, -0.7357177734375, -0.69805908203125, -0.660400390625, -0.62274169921875, -0.5850830078125, -0.54742431640625, -0.509765625, -0.47210693359375, -0.4344482421875, -0.39678955078125, -0.359130859375, -0.32147216796875, -0.2838134765625, -0.24615478515625, -0.20849609375, -0.17083740234375, -0.1331787109375, -0.09552001953125, -0.057861328125, -0.02020263671875, 0.0174560546875, 0.05511474609375, 0.0927734375, 0.13043212890625, 0.1680908203125, 0.20574951171875, 0.243408203125, 0.28106689453125, 0.3187255859375, 0.35638427734375, 0.39404296875, 0.43170166015625, 0.4693603515625, 0.50701904296875, 0.544677734375, 0.58233642578125, 0.6199951171875, 0.65765380859375, 0.6953125, 0.73297119140625, 0.7706298828125, 0.80828857421875, 0.845947265625, 0.88360595703125, 0.9212646484375, 0.95892333984375, 0.99658203125, 1.03424072265625, 1.0718994140625, 1.10955810546875, 1.147216796875, 1.18487548828125, 1.2225341796875, 1.26019287109375, 1.2978515625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 14.0, 33.0, 49.0, 86.0, 128.0, 190.0, 162.0, 136.0, 94.0, 56.0, 34.0, 14.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.101806640625, -0.09648704528808594, -0.09116744995117188, -0.08584785461425781, -0.08052825927734375, -0.07520866394042969, -0.06988906860351562, -0.06456947326660156, -0.0592498779296875, -0.05393028259277344, -0.048610687255859375, -0.04329109191894531, -0.03797149658203125, -0.03265190124511719, -0.027332305908203125, -0.022012710571289062, -0.016693115234375, -0.011373519897460938, -0.006053924560546875, -0.0007343292236328125, 0.00458526611328125, 0.009904861450195312, 0.015224456787109375, 0.020544052124023438, 0.0258636474609375, 0.031183242797851562, 0.036502838134765625, 0.04182243347167969, 0.04714202880859375, 0.05246162414550781, 0.057781219482421875, 0.06310081481933594, 0.06842041015625, 0.07374000549316406, 0.07905960083007812, 0.08437919616699219, 0.08969879150390625, 0.09501838684082031, 0.10033798217773438, 0.10565757751464844, 0.1109771728515625, 0.11629676818847656, 0.12161636352539062, 0.1269359588623047, 0.13225555419921875, 0.1375751495361328, 0.14289474487304688, 0.14821434020996094, 0.153533935546875, 0.15885353088378906, 0.16417312622070312, 0.1694927215576172, 0.17481231689453125, 0.1801319122314453, 0.18545150756835938, 0.19077110290527344, 0.1960906982421875, 0.20141029357910156, 0.20672988891601562, 0.2120494842529297, 0.21736907958984375, 0.2226886749267578, 0.22800827026367188, 0.23332786560058594, 0.2386474609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 11.0, 9.0, 13.0, 24.0, 20.0, 42.0, 60.0, 80.0, 163.0, 395.0, 1140.0, 4874.0, 36280.0, 717816.0, 265930.0, 17211.0, 2912.0, 836.0, 320.0, 139.0, 83.0, 59.0, 26.0, 22.0, 20.0, 22.0, 7.0, 2.0, 11.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5893630981445312, -0.5673980712890625, -0.5454330444335938, -0.523468017578125, -0.5015029907226562, -0.4795379638671875, -0.45757293701171875, -0.43560791015625, -0.41364288330078125, -0.3916778564453125, -0.36971282958984375, -0.347747802734375, -0.32578277587890625, -0.3038177490234375, -0.28185272216796875, -0.2598876953125, -0.23792266845703125, -0.2159576416015625, -0.19399261474609375, -0.172027587890625, -0.15006256103515625, -0.1280975341796875, -0.10613250732421875, -0.08416748046875, -0.06220245361328125, -0.0402374267578125, -0.01827239990234375, 0.003692626953125, 0.02565765380859375, 0.0476226806640625, 0.06958770751953125, 0.091552734375, 0.11351776123046875, 0.1354827880859375, 0.15744781494140625, 0.179412841796875, 0.20137786865234375, 0.2233428955078125, 0.24530792236328125, 0.26727294921875, 0.28923797607421875, 0.3112030029296875, 0.33316802978515625, 0.355133056640625, 0.37709808349609375, 0.3990631103515625, 0.42102813720703125, 0.4429931640625, 0.46495819091796875, 0.4869232177734375, 0.5088882446289062, 0.530853271484375, 0.5528182983398438, 0.5747833251953125, 0.5967483520507812, 0.61871337890625, 0.6406784057617188, 0.6626434326171875, 0.6846084594726562, 0.706573486328125, 0.7285385131835938, 0.7505035400390625, 0.7724685668945312, 0.79443359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 16.0, 17.0, 14.0, 26.0, 28.0, 26.0, 30.0, 52.0, 47.0, 64.0, 69.0, 52.0, 60.0, 66.0, 66.0, 61.0, 51.0, 47.0, 44.0, 26.0, 27.0, 20.0, 16.0, 10.0, 7.0, 8.0, 6.0, 10.0, 1.0, 5.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.27091217041015625, -0.2613067626953125, -0.25170135498046875, -0.242095947265625, -0.23249053955078125, -0.2228851318359375, -0.21327972412109375, -0.20367431640625, -0.19406890869140625, -0.1844635009765625, -0.17485809326171875, -0.165252685546875, -0.15564727783203125, -0.1460418701171875, -0.13643646240234375, -0.1268310546875, -0.11722564697265625, -0.1076202392578125, -0.09801483154296875, -0.088409423828125, -0.07880401611328125, -0.0691986083984375, -0.05959320068359375, -0.04998779296875, -0.04038238525390625, -0.0307769775390625, -0.02117156982421875, -0.011566162109375, -0.00196075439453125, 0.0076446533203125, 0.01725006103515625, 0.02685546875, 0.03646087646484375, 0.0460662841796875, 0.05567169189453125, 0.065277099609375, 0.07488250732421875, 0.0844879150390625, 0.09409332275390625, 0.10369873046875, 0.11330413818359375, 0.1229095458984375, 0.13251495361328125, 0.142120361328125, 0.15172576904296875, 0.1613311767578125, 0.17093658447265625, 0.1805419921875, 0.19014739990234375, 0.1997528076171875, 0.20935821533203125, 0.218963623046875, 0.22856903076171875, 0.2381744384765625, 0.24777984619140625, 0.25738525390625, 0.26699066162109375, 0.2765960693359375, 0.28620147705078125, 0.295806884765625, 0.30541229248046875, 0.3150177001953125, 0.32462310791015625, 0.334228515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 15.0, 26.0, 55.0, 121.0, 357.0, 1336.0, 11917.0, 968466.0, 62416.0, 2901.0, 593.0, 201.0, 75.0, 35.0, 21.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451416015625, -0.4331474304199219, -0.41487884521484375, -0.3966102600097656, -0.3783416748046875, -0.3600730895996094, -0.34180450439453125, -0.3235359191894531, -0.305267333984375, -0.2869987487792969, -0.26873016357421875, -0.2504615783691406, -0.2321929931640625, -0.21392440795898438, -0.19565582275390625, -0.17738723754882812, -0.15911865234375, -0.14085006713867188, -0.12258148193359375, -0.10431289672851562, -0.0860443115234375, -0.06777572631835938, -0.04950714111328125, -0.031238555908203125, -0.012969970703125, 0.005298614501953125, 0.02356719970703125, 0.041835784912109375, 0.0601043701171875, 0.07837295532226562, 0.09664154052734375, 0.11491012573242188, 0.1331787109375, 0.15144729614257812, 0.16971588134765625, 0.18798446655273438, 0.2062530517578125, 0.22452163696289062, 0.24279022216796875, 0.2610588073730469, 0.279327392578125, 0.2975959777832031, 0.31586456298828125, 0.3341331481933594, 0.3524017333984375, 0.3706703186035156, 0.38893890380859375, 0.4072074890136719, 0.42547607421875, 0.4437446594238281, 0.46201324462890625, 0.4802818298339844, 0.4985504150390625, 0.5168190002441406, 0.5350875854492188, 0.5533561706542969, 0.571624755859375, 0.5898933410644531, 0.6081619262695312, 0.6264305114746094, 0.6446990966796875, 0.6629676818847656, 0.6812362670898438, 0.6995048522949219, 0.7177734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 18.0, 12.0, 24.0, 21.0, 34.0, 53.0, 58.0, 82.0, 88.0, 97.0, 103.0, 87.0, 78.0, 59.0, 47.0, 38.0, 17.0, 19.0, 16.0, 9.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.823902130126953e-05, -1.7666257917881012e-05, -1.7093494534492493e-05, -1.6520731151103973e-05, -1.5947967767715454e-05, -1.5375204384326935e-05, -1.4802441000938416e-05, -1.4229677617549896e-05, -1.3656914234161377e-05, -1.3084150850772858e-05, -1.2511387467384338e-05, -1.1938624083995819e-05, -1.13658607006073e-05, -1.079309731721878e-05, -1.0220333933830261e-05, -9.647570550441742e-06, -9.074807167053223e-06, -8.502043783664703e-06, -7.929280400276184e-06, -7.356517016887665e-06, -6.7837536334991455e-06, -6.210990250110626e-06, -5.638226866722107e-06, -5.065463483333588e-06, -4.492700099945068e-06, -3.919936716556549e-06, -3.3471733331680298e-06, -2.7744099497795105e-06, -2.201646566390991e-06, -1.628883183002472e-06, -1.0561197996139526e-06, -4.833564162254333e-07, 8.940696716308594e-08, 6.621703505516052e-07, 1.2349337339401245e-06, 1.8076971173286438e-06, 2.380460500717163e-06, 2.9532238841056824e-06, 3.5259872674942017e-06, 4.098750650882721e-06, 4.67151403427124e-06, 5.2442774176597595e-06, 5.817040801048279e-06, 6.389804184436798e-06, 6.962567567825317e-06, 7.535330951213837e-06, 8.108094334602356e-06, 8.680857717990875e-06, 9.253621101379395e-06, 9.826384484767914e-06, 1.0399147868156433e-05, 1.0971911251544952e-05, 1.1544674634933472e-05, 1.2117438018321991e-05, 1.269020140171051e-05, 1.326296478509903e-05, 1.3835728168487549e-05, 1.4408491551876068e-05, 1.4981254935264587e-05, 1.5554018318653107e-05, 1.6126781702041626e-05, 1.6699545085430145e-05, 1.7272308468818665e-05, 1.7845071852207184e-05, 1.8417835235595703e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 11.0, 20.0, 13.0, 29.0, 56.0, 104.0, 183.0, 574.0, 2249.0, 35003.0, 977870.0, 29338.0, 2050.0, 544.0, 235.0, 105.0, 59.0, 36.0, 23.0, 12.0, 15.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.3297882080078125, -0.316314697265625, -0.3028411865234375, -0.28936767578125, -0.2758941650390625, -0.262420654296875, -0.2489471435546875, -0.2354736328125, -0.2220001220703125, -0.208526611328125, -0.1950531005859375, -0.18157958984375, -0.1681060791015625, -0.154632568359375, -0.1411590576171875, -0.127685546875, -0.1142120361328125, -0.100738525390625, -0.0872650146484375, -0.07379150390625, -0.0603179931640625, -0.046844482421875, -0.0333709716796875, -0.0198974609375, -0.0064239501953125, 0.007049560546875, 0.0205230712890625, 0.03399658203125, 0.0474700927734375, 0.060943603515625, 0.0744171142578125, 0.087890625, 0.1013641357421875, 0.114837646484375, 0.1283111572265625, 0.14178466796875, 0.1552581787109375, 0.168731689453125, 0.1822052001953125, 0.1956787109375, 0.2091522216796875, 0.222625732421875, 0.2360992431640625, 0.24957275390625, 0.2630462646484375, 0.276519775390625, 0.2899932861328125, 0.303466796875, 0.3169403076171875, 0.330413818359375, 0.3438873291015625, 0.35736083984375, 0.3708343505859375, 0.384307861328125, 0.3977813720703125, 0.4112548828125, 0.4247283935546875, 0.438201904296875, 0.4516754150390625, 0.46514892578125, 0.4786224365234375, 0.492095947265625, 0.5055694580078125, 0.51904296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 5.0, 12.0, 20.0, 16.0, 32.0, 60.0, 96.0, 155.0, 183.0, 140.0, 90.0, 57.0, 35.0, 31.0, 12.0, 12.0, 16.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10589599609375, -0.10045719146728516, -0.09501838684082031, -0.08957958221435547, -0.08414077758789062, -0.07870197296142578, -0.07326316833496094, -0.0678243637084961, -0.06238555908203125, -0.056946754455566406, -0.05150794982910156, -0.04606914520263672, -0.040630340576171875, -0.03519153594970703, -0.029752731323242188, -0.024313926696777344, -0.0188751220703125, -0.013436317443847656, -0.007997512817382812, -0.0025587081909179688, 0.002880096435546875, 0.008318901062011719, 0.013757705688476562, 0.019196510314941406, 0.02463531494140625, 0.030074119567871094, 0.03551292419433594, 0.04095172882080078, 0.046390533447265625, 0.05182933807373047, 0.05726814270019531, 0.06270694732666016, 0.068145751953125, 0.07358455657958984, 0.07902336120605469, 0.08446216583251953, 0.08990097045898438, 0.09533977508544922, 0.10077857971191406, 0.1062173843383789, 0.11165618896484375, 0.1170949935913086, 0.12253379821777344, 0.12797260284423828, 0.13341140747070312, 0.13885021209716797, 0.1442890167236328, 0.14972782135009766, 0.1551666259765625, 0.16060543060302734, 0.1660442352294922, 0.17148303985595703, 0.17692184448242188, 0.18236064910888672, 0.18779945373535156, 0.1932382583618164, 0.19867706298828125, 0.2041158676147461, 0.20955467224121094, 0.21499347686767578, 0.22043228149414062, 0.22587108612060547, 0.2313098907470703, 0.23674869537353516, 0.2421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 54.0, 904.0, 54.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.636589050292969, -8.08128833770752, -7.525986671447754, -6.970685958862305, -6.415384292602539, -5.86008358001709, -5.304782390594482, -4.749481201171875, -4.194180011749268, -3.63887882232666, -3.0835776329040527, -2.5282766819000244, -1.972975492477417, -1.4176743030548096, -0.8623733520507812, -0.30707216262817383, 0.2482290267944336, 0.8035301566123962, 1.3588312864303589, 1.9141323566436768, 2.469433546066284, 3.0247347354888916, 3.58003568649292, 4.135336875915527, 4.690638065338135, 5.245939254760742, 5.80124044418335, 6.356541633605957, 6.911842346191406, 7.467144012451172, 8.022444725036621, 8.57774543762207, 9.133047103881836, 9.688347816467285, 10.24364948272705, 10.7989501953125, 11.354251861572266, 11.909552574157715, 12.464853286743164, 13.02015495300293, 13.575456619262695, 14.130757331848145, 14.68605899810791, 15.24135971069336, 15.796661376953125, 16.35196304321289, 16.907262802124023, 17.46256446838379, 18.017864227294922, 18.573165893554688, 19.12846565246582, 19.683767318725586, 20.23906898498535, 20.794370651245117, 21.34967041015625, 21.904972076416016, 22.46027374267578, 23.015575408935547, 23.57087516784668, 24.126176834106445, 24.68147850036621, 25.236780166625977, 25.79207992553711, 26.347381591796875, 26.90268325805664]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 11.0, 8.0, 17.0, 23.0, 28.0, 42.0, 41.0, 41.0, 61.0, 64.0, 62.0, 69.0, 61.0, 62.0, 57.0, 59.0, 49.0, 57.0, 47.0, 35.0, 21.0, 19.0, 19.0, 6.0, 8.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1347343921661377, -2.068380117416382, -2.002025604248047, -1.9356712102890015, -1.869316816329956, -1.8029624223709106, -1.7366080284118652, -1.6702537536621094, -1.6038992404937744, -1.537544846534729, -1.4711904525756836, -1.4048360586166382, -1.3384816646575928, -1.2721272706985474, -1.205772876739502, -1.139418601989746, -1.0730642080307007, -1.0067098140716553, -0.9403554201126099, -0.8740010261535645, -0.807646632194519, -0.7412922382354736, -0.674937903881073, -0.6085835099220276, -0.5422291159629822, -0.47587472200393677, -0.40952032804489136, -0.34316596388816833, -0.2768115699291229, -0.21045717597007751, -0.1441028118133545, -0.07774841785430908, -0.011394023895263672, 0.05496036261320114, 0.12131474912166595, 0.18766912817955017, 0.2540235221385956, 0.320377916097641, 0.386732280254364, 0.4530866742134094, 0.5194410681724548, 0.5857954621315002, 0.6521498560905457, 0.7185041904449463, 0.7848585844039917, 0.8512129783630371, 0.9175673723220825, 0.9839217662811279, 1.0502761602401733, 1.1166305541992188, 1.1829849481582642, 1.2493393421173096, 1.315693736076355, 1.3820481300354004, 1.4484024047851562, 1.5147569179534912, 1.581111192703247, 1.6474655866622925, 1.713819980621338, 1.7801743745803833, 1.8465287685394287, 1.9128831624984741, 1.9792375564575195, 2.0455918312072754, 2.1119463443756104]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 3.0, 4.0, 11.0, 14.0, 35.0, 107.0, 196.0, 504.0, 1500.0, 5215.0, 22996.0, 585576.0, 3537854.0, 30744.0, 6015.0, 1758.0, 721.0, 362.0, 205.0, 127.0, 67.0, 58.0, 40.0, 36.0, 21.0, 15.0, 13.0, 13.0, 9.0, 8.0, 8.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44482421875, -0.41082000732421875, -0.3768157958984375, -0.34281158447265625, -0.308807373046875, -0.27480316162109375, -0.2407989501953125, -0.20679473876953125, -0.17279052734375, -0.13878631591796875, -0.1047821044921875, -0.07077789306640625, -0.036773681640625, -0.00276947021484375, 0.0312347412109375, 0.06523895263671875, 0.0992431640625, 0.13324737548828125, 0.1672515869140625, 0.20125579833984375, 0.235260009765625, 0.26926422119140625, 0.3032684326171875, 0.33727264404296875, 0.37127685546875, 0.40528106689453125, 0.4392852783203125, 0.47328948974609375, 0.507293701171875, 0.5412979125976562, 0.5753021240234375, 0.6093063354492188, 0.643310546875, 0.6773147583007812, 0.7113189697265625, 0.7453231811523438, 0.779327392578125, 0.8133316040039062, 0.8473358154296875, 0.8813400268554688, 0.91534423828125, 0.9493484497070312, 0.9833526611328125, 1.0173568725585938, 1.051361083984375, 1.0853652954101562, 1.1193695068359375, 1.1533737182617188, 1.1873779296875, 1.2213821411132812, 1.2553863525390625, 1.2893905639648438, 1.323394775390625, 1.3573989868164062, 1.3914031982421875, 1.4254074096679688, 1.45941162109375, 1.4934158325195312, 1.5274200439453125, 1.5614242553710938, 1.595428466796875, 1.6294326782226562, 1.6634368896484375, 1.6974411010742188, 1.7314453125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 14.0, 21.0, 29.0, 49.0, 61.0, 116.0, 129.0, 154.0, 123.0, 104.0, 77.0, 60.0, 31.0, 14.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06976318359375, -0.0649557113647461, -0.06014823913574219, -0.05534076690673828, -0.050533294677734375, -0.04572582244873047, -0.04091835021972656, -0.036110877990722656, -0.03130340576171875, -0.026495933532714844, -0.021688461303710938, -0.01688098907470703, -0.012073516845703125, -0.007266044616699219, -0.0024585723876953125, 0.0023488998413085938, 0.0071563720703125, 0.011963844299316406, 0.016771316528320312, 0.02157878875732422, 0.026386260986328125, 0.03119373321533203, 0.03600120544433594, 0.040808677673339844, 0.04561614990234375, 0.050423622131347656, 0.05523109436035156, 0.06003856658935547, 0.06484603881835938, 0.06965351104736328, 0.07446098327636719, 0.0792684555053711, 0.084075927734375, 0.0888833999633789, 0.09369087219238281, 0.09849834442138672, 0.10330581665039062, 0.10811328887939453, 0.11292076110839844, 0.11772823333740234, 0.12253570556640625, 0.12734317779541016, 0.13215065002441406, 0.13695812225341797, 0.14176559448242188, 0.14657306671142578, 0.1513805389404297, 0.1561880111694336, 0.1609954833984375, 0.1658029556274414, 0.1706104278564453, 0.17541790008544922, 0.18022537231445312, 0.18503284454345703, 0.18984031677246094, 0.19464778900146484, 0.19945526123046875, 0.20426273345947266, 0.20907020568847656, 0.21387767791748047, 0.21868515014648438, 0.22349262237548828, 0.2283000946044922, 0.2331075668334961, 0.2379150390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 12.0, 19.0, 46.0, 113.0, 586.0, 4132447.0, 59990.0, 702.0, 224.0, 73.0, 41.0, 24.0, 12.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.837158203125, -3.59619140625, -3.355224609375, -3.1142578125, -2.873291015625, -2.63232421875, -2.391357421875, -2.150390625, -1.909423828125, -1.66845703125, -1.427490234375, -1.1865234375, -0.945556640625, -0.70458984375, -0.463623046875, -0.22265625, 0.018310546875, 0.25927734375, 0.500244140625, 0.7412109375, 0.982177734375, 1.22314453125, 1.464111328125, 1.705078125, 1.946044921875, 2.18701171875, 2.427978515625, 2.6689453125, 2.909912109375, 3.15087890625, 3.391845703125, 3.6328125, 3.873779296875, 4.11474609375, 4.355712890625, 4.5966796875, 4.837646484375, 5.07861328125, 5.319580078125, 5.560546875, 5.801513671875, 6.04248046875, 6.283447265625, 6.5244140625, 6.765380859375, 7.00634765625, 7.247314453125, 7.48828125, 7.729248046875, 7.97021484375, 8.211181640625, 8.4521484375, 8.693115234375, 8.93408203125, 9.175048828125, 9.416015625, 9.656982421875, 9.89794921875, 10.138916015625, 10.3798828125, 10.620849609375, 10.86181640625, 11.102783203125, 11.34375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 10.0, 28.0, 117.0, 3439.0, 402.0, 54.0, 17.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1568603515625, -0.13651084899902344, -0.11616134643554688, -0.09581184387207031, -0.07546234130859375, -0.05511283874511719, -0.034763336181640625, -0.014413833618164062, 0.0059356689453125, 0.026285171508789062, 0.046634674072265625, 0.06698417663574219, 0.08733367919921875, 0.10768318176269531, 0.12803268432617188, 0.14838218688964844, 0.168731689453125, 0.18908119201660156, 0.20943069458007812, 0.2297801971435547, 0.25012969970703125, 0.2704792022705078, 0.2908287048339844, 0.31117820739746094, 0.3315277099609375, 0.35187721252441406, 0.3722267150878906, 0.3925762176513672, 0.41292572021484375, 0.4332752227783203, 0.4536247253417969, 0.47397422790527344, 0.49432373046875, 0.5146732330322266, 0.5350227355957031, 0.5553722381591797, 0.5757217407226562, 0.5960712432861328, 0.6164207458496094, 0.6367702484130859, 0.6571197509765625, 0.6774692535400391, 0.6978187561035156, 0.7181682586669922, 0.7385177612304688, 0.7588672637939453, 0.7792167663574219, 0.7995662689208984, 0.819915771484375, 0.8402652740478516, 0.8606147766113281, 0.8809642791748047, 0.9013137817382812, 0.9216632843017578, 0.9420127868652344, 0.9623622894287109, 0.9827117919921875, 1.003061294555664, 1.0234107971191406, 1.0437602996826172, 1.0641098022460938, 1.0844593048095703, 1.1048088073730469, 1.1251583099365234, 1.1455078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 9.0, 19.0, 206.0, 676.0, 69.0, 15.0, 6.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.629086971282959, -5.429607391357422, -5.230128288269043, -5.030648708343506, -4.831169128417969, -4.63169002532959, -4.432210445404053, -4.232730865478516, -4.033251762390137, -3.8337724208831787, -3.6342928409576416, -3.4348134994506836, -3.2353339195251465, -3.0358545780181885, -2.8363752365112305, -2.6368956565856934, -2.4374160766601562, -2.2379367351531982, -2.038457155227661, -1.8389778137207031, -1.6394983530044556, -1.440018892288208, -1.24053955078125, -1.0410600900650024, -0.8415806293487549, -0.6421011686325073, -0.44262176752090454, -0.24314236640930176, -0.0436629056930542, 0.15581655502319336, 0.35529589653015137, 0.5547753572463989, 0.7542543411254883, 0.9537338018417358, 1.1532132625579834, 1.3526926040649414, 1.552172064781189, 1.7516515254974365, 1.9511308670043945, 2.1506104469299316, 2.3500897884368896, 2.5495691299438477, 2.7490487098693848, 2.9485280513763428, 3.148007392883301, 3.347486972808838, 3.546966314315796, 3.746445655822754, 3.945925235748291, 4.145404815673828, 4.344883918762207, 4.544363498687744, 4.743843078613281, 4.94332218170166, 5.142801761627197, 5.342281341552734, 5.541760444641113, 5.74124002456665, 5.940719127655029, 6.140198707580566, 6.3396782875061035, 6.539157867431641, 6.7386369705200195, 6.938116550445557, 7.137596130371094]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 14.0, 26.0, 33.0, 57.0, 72.0, 79.0, 84.0, 97.0, 101.0, 122.0, 78.0, 62.0, 49.0, 48.0, 37.0, 10.0, 13.0, 6.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9486967325210571, -1.88349449634552, -1.818292260169983, -1.7530900239944458, -1.6878877878189087, -1.6226855516433716, -1.557483434677124, -1.492281198501587, -1.4270789623260498, -1.3618767261505127, -1.2966744899749756, -1.2314722537994385, -1.1662700176239014, -1.1010677814483643, -1.0358655452728271, -0.9706633687019348, -0.9054610729217529, -0.8402588367462158, -0.7750566005706787, -0.7098543643951416, -0.6446521282196045, -0.5794498920440674, -0.514247715473175, -0.44904547929763794, -0.38384324312210083, -0.3186410069465637, -0.2534387707710266, -0.1882365643978119, -0.12303432822227478, -0.05783209204673767, 0.007370114326477051, 0.07257235050201416, 0.13777470588684082, 0.20297694206237793, 0.26817917823791504, 0.33338138461112976, 0.39858362078666687, 0.463785856962204, 0.5289880633354187, 0.5941902995109558, 0.6593925356864929, 0.72459477186203, 0.7897970080375671, 0.8549991846084595, 0.9202014207839966, 0.9854036569595337, 1.0506058931350708, 1.115808129310608, 1.181010365486145, 1.2462126016616821, 1.3114148378372192, 1.3766170740127563, 1.4418193101882935, 1.5070215463638306, 1.5722236633300781, 1.6374258995056152, 1.7026281356811523, 1.7678303718566895, 1.8330326080322266, 1.8982348442077637, 1.9634370803833008, 2.028639316558838, 2.093841552734375, 2.159043788909912, 2.224246025085449]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 5.0, 10.0, 19.0, 21.0, 22.0, 27.0, 42.0, 50.0, 73.0, 102.0, 134.0, 194.0, 347.0, 654.0, 1207.0, 2839.0, 8151.0, 32208.0, 192188.0, 667237.0, 110906.0, 21350.0, 5985.0, 2221.0, 995.0, 519.0, 307.0, 222.0, 144.0, 103.0, 68.0, 59.0, 31.0, 27.0, 11.0, 13.0, 9.0, 5.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.697265625, -0.6743011474609375, -0.651336669921875, -0.6283721923828125, -0.60540771484375, -0.5824432373046875, -0.559478759765625, -0.5365142822265625, -0.5135498046875, -0.4905853271484375, -0.467620849609375, -0.4446563720703125, -0.42169189453125, -0.3987274169921875, -0.375762939453125, -0.3527984619140625, -0.329833984375, -0.3068695068359375, -0.283905029296875, -0.2609405517578125, -0.23797607421875, -0.2150115966796875, -0.192047119140625, -0.1690826416015625, -0.1461181640625, -0.1231536865234375, -0.100189208984375, -0.0772247314453125, -0.05426025390625, -0.0312957763671875, -0.008331298828125, 0.0146331787109375, 0.03759765625, 0.0605621337890625, 0.083526611328125, 0.1064910888671875, 0.12945556640625, 0.1524200439453125, 0.175384521484375, 0.1983489990234375, 0.2213134765625, 0.2442779541015625, 0.267242431640625, 0.2902069091796875, 0.31317138671875, 0.3361358642578125, 0.359100341796875, 0.3820648193359375, 0.405029296875, 0.4279937744140625, 0.450958251953125, 0.4739227294921875, 0.49688720703125, 0.5198516845703125, 0.542816162109375, 0.5657806396484375, 0.5887451171875, 0.6117095947265625, 0.634674072265625, 0.6576385498046875, 0.68060302734375, 0.7035675048828125, 0.726531982421875, 0.7494964599609375, 0.7724609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 12.0, 18.0, 31.0, 31.0, 66.0, 64.0, 87.0, 91.0, 101.0, 106.0, 94.0, 72.0, 68.0, 44.0, 44.0, 34.0, 13.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11504077911376953, -0.10929298400878906, -0.1035451889038086, -0.09779739379882812, -0.09204959869384766, -0.08630180358886719, -0.08055400848388672, -0.07480621337890625, -0.06905841827392578, -0.06331062316894531, -0.057562828063964844, -0.051815032958984375, -0.046067237854003906, -0.04031944274902344, -0.03457164764404297, -0.0288238525390625, -0.02307605743408203, -0.017328262329101562, -0.011580467224121094, -0.005832672119140625, -8.487701416015625e-05, 0.0056629180908203125, 0.011410713195800781, 0.01715850830078125, 0.02290630340576172, 0.028654098510742188, 0.034401893615722656, 0.040149688720703125, 0.045897483825683594, 0.05164527893066406, 0.05739307403564453, 0.063140869140625, 0.06888866424560547, 0.07463645935058594, 0.0803842544555664, 0.08613204956054688, 0.09187984466552734, 0.09762763977050781, 0.10337543487548828, 0.10912322998046875, 0.11487102508544922, 0.12061882019042969, 0.12636661529541016, 0.13211441040039062, 0.1378622055053711, 0.14361000061035156, 0.14935779571533203, 0.1551055908203125, 0.16085338592529297, 0.16660118103027344, 0.1723489761352539, 0.17809677124023438, 0.18384456634521484, 0.1895923614501953, 0.19534015655517578, 0.20108795166015625, 0.20683574676513672, 0.2125835418701172, 0.21833133697509766, 0.22407913208007812, 0.2298269271850586, 0.23557472229003906, 0.24132251739501953, 0.2470703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 6.0, 7.0, 15.0, 15.0, 23.0, 35.0, 47.0, 77.0, 119.0, 246.0, 491.0, 1025.0, 2864.0, 9099.0, 40351.0, 322658.0, 584789.0, 66704.0, 13451.0, 3846.0, 1360.0, 594.0, 286.0, 143.0, 95.0, 66.0, 36.0, 29.0, 12.0, 16.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.66015625, -0.639617919921875, -0.61907958984375, -0.598541259765625, -0.5780029296875, -0.557464599609375, -0.53692626953125, -0.516387939453125, -0.495849609375, -0.475311279296875, -0.45477294921875, -0.434234619140625, -0.4136962890625, -0.393157958984375, -0.37261962890625, -0.352081298828125, -0.33154296875, -0.311004638671875, -0.29046630859375, -0.269927978515625, -0.2493896484375, -0.228851318359375, -0.20831298828125, -0.187774658203125, -0.167236328125, -0.146697998046875, -0.12615966796875, -0.105621337890625, -0.0850830078125, -0.064544677734375, -0.04400634765625, -0.023468017578125, -0.0029296875, 0.017608642578125, 0.03814697265625, 0.058685302734375, 0.0792236328125, 0.099761962890625, 0.12030029296875, 0.140838623046875, 0.161376953125, 0.181915283203125, 0.20245361328125, 0.222991943359375, 0.2435302734375, 0.264068603515625, 0.28460693359375, 0.305145263671875, 0.32568359375, 0.346221923828125, 0.36676025390625, 0.387298583984375, 0.4078369140625, 0.428375244140625, 0.44891357421875, 0.469451904296875, 0.489990234375, 0.510528564453125, 0.53106689453125, 0.551605224609375, 0.5721435546875, 0.592681884765625, 0.61322021484375, 0.633758544921875, 0.654296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 4.0, 10.0, 21.0, 11.0, 21.0, 24.0, 35.0, 43.0, 41.0, 53.0, 52.0, 62.0, 64.0, 62.0, 46.0, 71.0, 45.0, 54.0, 41.0, 53.0, 33.0, 26.0, 30.0, 16.0, 12.0, 10.0, 10.0, 10.0, 4.0, 9.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49951171875, -0.48384857177734375, -0.4681854248046875, -0.45252227783203125, -0.436859130859375, -0.42119598388671875, -0.4055328369140625, -0.38986968994140625, -0.37420654296875, -0.35854339599609375, -0.3428802490234375, -0.32721710205078125, -0.311553955078125, -0.29589080810546875, -0.2802276611328125, -0.26456451416015625, -0.2489013671875, -0.23323822021484375, -0.2175750732421875, -0.20191192626953125, -0.186248779296875, -0.17058563232421875, -0.1549224853515625, -0.13925933837890625, -0.12359619140625, -0.10793304443359375, -0.0922698974609375, -0.07660675048828125, -0.060943603515625, -0.04528045654296875, -0.0296173095703125, -0.01395416259765625, 0.001708984375, 0.01737213134765625, 0.0330352783203125, 0.04869842529296875, 0.064361572265625, 0.08002471923828125, 0.0956878662109375, 0.11135101318359375, 0.12701416015625, 0.14267730712890625, 0.1583404541015625, 0.17400360107421875, 0.189666748046875, 0.20532989501953125, 0.2209930419921875, 0.23665618896484375, 0.2523193359375, 0.26798248291015625, 0.2836456298828125, 0.29930877685546875, 0.314971923828125, 0.33063507080078125, 0.3462982177734375, 0.36196136474609375, 0.37762451171875, 0.39328765869140625, 0.4089508056640625, 0.42461395263671875, 0.440277099609375, 0.45594024658203125, 0.4716033935546875, 0.48726654052734375, 0.5029296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 11.0, 12.0, 16.0, 28.0, 38.0, 47.0, 90.0, 169.0, 420.0, 1284.0, 5783.0, 92392.0, 909461.0, 33629.0, 3640.0, 890.0, 298.0, 117.0, 81.0, 40.0, 30.0, 25.0, 19.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337646484375, -0.3265266418457031, -0.31540679931640625, -0.3042869567871094, -0.2931671142578125, -0.2820472717285156, -0.27092742919921875, -0.2598075866699219, -0.248687744140625, -0.23756790161132812, -0.22644805908203125, -0.21532821655273438, -0.2042083740234375, -0.19308853149414062, -0.18196868896484375, -0.17084884643554688, -0.15972900390625, -0.14860916137695312, -0.13748931884765625, -0.12636947631835938, -0.1152496337890625, -0.10412979125976562, -0.09300994873046875, -0.08189010620117188, -0.070770263671875, -0.059650421142578125, -0.04853057861328125, -0.037410736083984375, -0.0262908935546875, -0.015171051025390625, -0.00405120849609375, 0.007068634033203125, 0.0181884765625, 0.029308319091796875, 0.04042816162109375, 0.051548004150390625, 0.0626678466796875, 0.07378768920898438, 0.08490753173828125, 0.09602737426757812, 0.107147216796875, 0.11826705932617188, 0.12938690185546875, 0.14050674438476562, 0.1516265869140625, 0.16274642944335938, 0.17386627197265625, 0.18498611450195312, 0.19610595703125, 0.20722579956054688, 0.21834564208984375, 0.22946548461914062, 0.2405853271484375, 0.2517051696777344, 0.26282501220703125, 0.2739448547363281, 0.285064697265625, 0.2961845397949219, 0.30730438232421875, 0.3184242248535156, 0.3295440673828125, 0.3406639099121094, 0.35178375244140625, 0.3629035949707031, 0.3740234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 11.0, 11.0, 9.0, 16.0, 17.0, 23.0, 29.0, 32.0, 42.0, 43.0, 63.0, 68.0, 65.0, 66.0, 77.0, 76.0, 61.0, 51.0, 35.0, 37.0, 39.0, 23.0, 18.0, 27.0, 8.0, 8.0, 7.0, 5.0, 3.0, 5.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4781951904296875e-05, -1.433398574590683e-05, -1.3886019587516785e-05, -1.343805342912674e-05, -1.2990087270736694e-05, -1.254212111234665e-05, -1.2094154953956604e-05, -1.1646188795566559e-05, -1.1198222637176514e-05, -1.0750256478786469e-05, -1.0302290320396423e-05, -9.854324162006378e-06, -9.406358003616333e-06, -8.958391845226288e-06, -8.510425686836243e-06, -8.062459528446198e-06, -7.614493370056152e-06, -7.166527211666107e-06, -6.718561053276062e-06, -6.270594894886017e-06, -5.822628736495972e-06, -5.3746625781059265e-06, -4.926696419715881e-06, -4.478730261325836e-06, -4.030764102935791e-06, -3.582797944545746e-06, -3.1348317861557007e-06, -2.6868656277656555e-06, -2.2388994693756104e-06, -1.7909333109855652e-06, -1.34296715259552e-06, -8.950009942054749e-07, -4.470348358154297e-07, 9.313225746154785e-10, 4.4889748096466064e-07, 8.968636393547058e-07, 1.344829797744751e-06, 1.7927959561347961e-06, 2.2407621145248413e-06, 2.6887282729148865e-06, 3.1366944313049316e-06, 3.584660589694977e-06, 4.032626748085022e-06, 4.480592906475067e-06, 4.928559064865112e-06, 5.3765252232551575e-06, 5.824491381645203e-06, 6.272457540035248e-06, 6.720423698425293e-06, 7.168389856815338e-06, 7.616356015205383e-06, 8.064322173595428e-06, 8.512288331985474e-06, 8.960254490375519e-06, 9.408220648765564e-06, 9.856186807155609e-06, 1.0304152965545654e-05, 1.07521191239357e-05, 1.1200085282325745e-05, 1.164805144071579e-05, 1.2096017599105835e-05, 1.254398375749588e-05, 1.2991949915885925e-05, 1.343991607427597e-05, 1.3887882232666016e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 11.0, 8.0, 21.0, 28.0, 29.0, 80.0, 104.0, 192.0, 474.0, 1109.0, 3620.0, 17935.0, 297673.0, 682779.0, 36124.0, 5563.0, 1597.0, 590.0, 252.0, 134.0, 77.0, 43.0, 33.0, 20.0, 6.0, 4.0, 7.0, 5.0, 2.0, 7.0, 5.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.228759765625, -0.2214183807373047, -0.21407699584960938, -0.20673561096191406, -0.19939422607421875, -0.19205284118652344, -0.18471145629882812, -0.1773700714111328, -0.1700286865234375, -0.1626873016357422, -0.15534591674804688, -0.14800453186035156, -0.14066314697265625, -0.13332176208496094, -0.12598037719726562, -0.11863899230957031, -0.111297607421875, -0.10395622253417969, -0.09661483764648438, -0.08927345275878906, -0.08193206787109375, -0.07459068298339844, -0.06724929809570312, -0.05990791320800781, -0.0525665283203125, -0.04522514343261719, -0.037883758544921875, -0.030542373657226562, -0.02320098876953125, -0.015859603881835938, -0.008518218994140625, -0.0011768341064453125, 0.00616455078125, 0.013505935668945312, 0.020847320556640625, 0.028188705444335938, 0.03553009033203125, 0.04287147521972656, 0.050212860107421875, 0.05755424499511719, 0.0648956298828125, 0.07223701477050781, 0.07957839965820312, 0.08691978454589844, 0.09426116943359375, 0.10160255432128906, 0.10894393920898438, 0.11628532409667969, 0.123626708984375, 0.1309680938720703, 0.13830947875976562, 0.14565086364746094, 0.15299224853515625, 0.16033363342285156, 0.16767501831054688, 0.1750164031982422, 0.1823577880859375, 0.1896991729736328, 0.19704055786132812, 0.20438194274902344, 0.21172332763671875, 0.21906471252441406, 0.22640609741210938, 0.2337474822998047, 0.2410888671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 13.0, 10.0, 23.0, 18.0, 34.0, 56.0, 79.0, 96.0, 121.0, 148.0, 121.0, 80.0, 55.0, 38.0, 27.0, 25.0, 13.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.162841796875, -0.1579151153564453, -0.15298843383789062, -0.14806175231933594, -0.14313507080078125, -0.13820838928222656, -0.13328170776367188, -0.1283550262451172, -0.1234283447265625, -0.11850166320800781, -0.11357498168945312, -0.10864830017089844, -0.10372161865234375, -0.09879493713378906, -0.09386825561523438, -0.08894157409667969, -0.084014892578125, -0.07908821105957031, -0.07416152954101562, -0.06923484802246094, -0.06430816650390625, -0.05938148498535156, -0.054454803466796875, -0.04952812194824219, -0.0446014404296875, -0.03967475891113281, -0.034748077392578125, -0.029821395874023438, -0.02489471435546875, -0.019968032836914062, -0.015041351318359375, -0.010114669799804688, -0.00518798828125, -0.0002613067626953125, 0.004665374755859375, 0.009592056274414062, 0.01451873779296875, 0.019445419311523438, 0.024372100830078125, 0.029298782348632812, 0.0342254638671875, 0.03915214538574219, 0.044078826904296875, 0.04900550842285156, 0.05393218994140625, 0.05885887145996094, 0.06378555297851562, 0.06871223449707031, 0.073638916015625, 0.07856559753417969, 0.08349227905273438, 0.08841896057128906, 0.09334564208984375, 0.09827232360839844, 0.10319900512695312, 0.10812568664550781, 0.1130523681640625, 0.11797904968261719, 0.12290573120117188, 0.12783241271972656, 0.13275909423828125, 0.13768577575683594, 0.14261245727539062, 0.1475391387939453, 0.1524658203125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 9.0, 14.0, 25.0, 58.0, 101.0, 244.0, 301.0, 134.0, 55.0, 30.0, 12.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.129291534423828, -1.997900366783142, -1.8665093183517456, -1.7351181507110596, -1.603727102279663, -1.472335934638977, -1.340944766998291, -1.2095537185668945, -1.0781625509262085, -0.9467714428901672, -0.815380334854126, -0.6839891672134399, -0.5525980591773987, -0.4212069511413574, -0.2898157835006714, -0.15842467546463013, -0.027033567428588867, 0.10435755550861359, 0.23574867844581604, 0.3671398162841797, 0.49853092432022095, 0.6299220323562622, 0.7613131999969482, 0.8927043080329895, 1.0240954160690308, 1.1554865837097168, 1.2868776321411133, 1.4182687997817993, 1.5496599674224854, 1.6810510158538818, 1.8124421834945679, 1.943833351135254, 2.0752243995666504, 2.206615447998047, 2.3380067348480225, 2.469397783279419, 2.6007888317108154, 2.732180118560791, 2.8635711669921875, 2.994962215423584, 3.1263532638549805, 3.257744312286377, 3.3891355991363525, 3.520526647567749, 3.6519176959991455, 3.783308982849121, 3.9147000312805176, 4.046091079711914, 4.177482604980469, 4.308873653411865, 4.440264701843262, 4.571656227111816, 4.703047275543213, 4.834438323974609, 4.965829372406006, 5.097220420837402, 5.228611469268799, 5.360002517700195, 5.491393566131592, 5.622784614562988, 5.754176139831543, 5.8855671882629395, 6.016958236694336, 6.148349285125732, 6.279740333557129]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 5.0, 7.0, 16.0, 22.0, 19.0, 26.0, 31.0, 24.0, 30.0, 45.0, 39.0, 49.0, 37.0, 65.0, 61.0, 48.0, 69.0, 59.0, 35.0, 40.0, 40.0, 33.0, 30.0, 29.0, 25.0, 18.0, 10.0, 11.0, 8.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2502613067626953, -2.168671131134033, -2.087080955505371, -2.005490779876709, -1.9239004850387573, -1.8423101902008057, -1.7607200145721436, -1.6791298389434814, -1.5975396633148193, -1.5159494876861572, -1.4343591928482056, -1.3527690172195435, -1.2711788415908813, -1.1895885467529297, -1.1079983711242676, -1.0264081954956055, -0.9448179006576538, -0.8632276654243469, -0.7816374897956848, -0.7000472545623779, -0.6184570789337158, -0.5368668437004089, -0.45527660846710205, -0.37368643283843994, -0.29209619760513306, -0.21050599217414856, -0.12891577184200287, -0.04732555150985718, 0.03426465392112732, 0.11585485935211182, 0.1974450945854187, 0.2790352702140808, 0.3606255054473877, 0.4422157108783722, 0.5238059163093567, 0.6053961515426636, 0.6869863271713257, 0.7685765624046326, 0.8501667976379395, 0.9317569732666016, 1.0133471488952637, 1.0949373245239258, 1.1765276193618774, 1.2581177949905396, 1.3397079706192017, 1.4212982654571533, 1.5028884410858154, 1.5844786167144775, 1.6660689115524292, 1.7476590871810913, 1.829249382019043, 1.910839557647705, 1.9924297332763672, 2.0740199089050293, 2.1556100845336914, 2.2372002601623535, 2.3187906742095947, 2.400380849838257, 2.481971025466919, 2.56356143951416, 2.6451516151428223, 2.7267417907714844, 2.8083319664001465, 2.8899221420288086, 2.9715123176574707]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 6.0, 9.0, 8.0, 5.0, 23.0, 9.0, 34.0, 66.0, 130.0, 204.0, 436.0, 827.0, 1890.0, 5315.0, 21035.0, 215583.0, 3864410.0, 66281.0, 11279.0, 3431.0, 1450.0, 684.0, 390.0, 215.0, 157.0, 115.0, 60.0, 59.0, 42.0, 31.0, 27.0, 14.0, 7.0, 8.0, 8.0, 9.0, 1.0, 9.0, 4.0, 0.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.61083984375, -0.5846328735351562, -0.5584259033203125, -0.5322189331054688, -0.506011962890625, -0.47980499267578125, -0.4535980224609375, -0.42739105224609375, -0.40118408203125, -0.37497711181640625, -0.3487701416015625, -0.32256317138671875, -0.296356201171875, -0.27014923095703125, -0.2439422607421875, -0.21773529052734375, -0.1915283203125, -0.16532135009765625, -0.1391143798828125, -0.11290740966796875, -0.086700439453125, -0.06049346923828125, -0.0342864990234375, -0.00807952880859375, 0.01812744140625, 0.04433441162109375, 0.0705413818359375, 0.09674835205078125, 0.122955322265625, 0.14916229248046875, 0.1753692626953125, 0.20157623291015625, 0.227783203125, 0.25399017333984375, 0.2801971435546875, 0.30640411376953125, 0.332611083984375, 0.35881805419921875, 0.3850250244140625, 0.41123199462890625, 0.43743896484375, 0.46364593505859375, 0.4898529052734375, 0.5160598754882812, 0.542266845703125, 0.5684738159179688, 0.5946807861328125, 0.6208877563476562, 0.6470947265625, 0.6733016967773438, 0.6995086669921875, 0.7257156372070312, 0.751922607421875, 0.7781295776367188, 0.8043365478515625, 0.8305435180664062, 0.85675048828125, 0.8829574584960938, 0.9091644287109375, 0.9353713989257812, 0.961578369140625, 0.9877853393554688, 1.0139923095703125, 1.0401992797851562, 1.06640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 13.0, 12.0, 34.0, 29.0, 49.0, 63.0, 59.0, 91.0, 96.0, 86.0, 99.0, 87.0, 69.0, 65.0, 44.0, 37.0, 26.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12211418151855469, -0.11617660522460938, -0.11023902893066406, -0.10430145263671875, -0.09836387634277344, -0.09242630004882812, -0.08648872375488281, -0.0805511474609375, -0.07461357116699219, -0.06867599487304688, -0.06273841857910156, -0.05680084228515625, -0.05086326599121094, -0.044925689697265625, -0.03898811340332031, -0.033050537109375, -0.027112960815429688, -0.021175384521484375, -0.015237808227539062, -0.00930023193359375, -0.0033626556396484375, 0.002574920654296875, 0.008512496948242188, 0.0144500732421875, 0.020387649536132812, 0.026325225830078125, 0.03226280212402344, 0.03820037841796875, 0.04413795471191406, 0.050075531005859375, 0.05601310729980469, 0.06195068359375, 0.06788825988769531, 0.07382583618164062, 0.07976341247558594, 0.08570098876953125, 0.09163856506347656, 0.09757614135742188, 0.10351371765136719, 0.1094512939453125, 0.11538887023925781, 0.12132644653320312, 0.12726402282714844, 0.13320159912109375, 0.13913917541503906, 0.14507675170898438, 0.1510143280029297, 0.156951904296875, 0.1628894805908203, 0.16882705688476562, 0.17476463317871094, 0.18070220947265625, 0.18663978576660156, 0.19257736206054688, 0.1985149383544922, 0.2044525146484375, 0.2103900909423828, 0.21632766723632812, 0.22226524353027344, 0.22820281982421875, 0.23414039611816406, 0.24007797241210938, 0.2460155487060547, 0.251953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 3.0, 6.0, 5.0, 9.0, 15.0, 18.0, 20.0, 21.0, 20.0, 47.0, 56.0, 76.0, 96.0, 183.0, 355.0, 1676.0, 3465489.0, 723890.0, 1417.0, 319.0, 174.0, 107.0, 76.0, 52.0, 44.0, 22.0, 21.0, 8.0, 9.0, 12.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.244140625, -3.156402587890625, -3.06866455078125, -2.980926513671875, -2.8931884765625, -2.805450439453125, -2.71771240234375, -2.629974365234375, -2.542236328125, -2.454498291015625, -2.36676025390625, -2.279022216796875, -2.1912841796875, -2.103546142578125, -2.01580810546875, -1.928070068359375, -1.84033203125, -1.752593994140625, -1.66485595703125, -1.577117919921875, -1.4893798828125, -1.401641845703125, -1.31390380859375, -1.226165771484375, -1.138427734375, -1.050689697265625, -0.96295166015625, -0.875213623046875, -0.7874755859375, -0.699737548828125, -0.61199951171875, -0.524261474609375, -0.4365234375, -0.348785400390625, -0.26104736328125, -0.173309326171875, -0.0855712890625, 0.002166748046875, 0.08990478515625, 0.177642822265625, 0.265380859375, 0.353118896484375, 0.44085693359375, 0.528594970703125, 0.6163330078125, 0.704071044921875, 0.79180908203125, 0.879547119140625, 0.96728515625, 1.055023193359375, 1.14276123046875, 1.230499267578125, 1.3182373046875, 1.405975341796875, 1.49371337890625, 1.581451416015625, 1.669189453125, 1.756927490234375, 1.84466552734375, 1.932403564453125, 2.0201416015625, 2.107879638671875, 2.19561767578125, 2.283355712890625, 2.37109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 16.0, 44.0, 151.0, 3057.0, 671.0, 92.0, 31.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64306640625, -0.6273002624511719, -0.6115341186523438, -0.5957679748535156, -0.5800018310546875, -0.5642356872558594, -0.5484695434570312, -0.5327033996582031, -0.516937255859375, -0.5011711120605469, -0.48540496826171875, -0.4696388244628906, -0.4538726806640625, -0.4381065368652344, -0.42234039306640625, -0.4065742492675781, -0.39080810546875, -0.3750419616699219, -0.35927581787109375, -0.3435096740722656, -0.3277435302734375, -0.3119773864746094, -0.29621124267578125, -0.2804450988769531, -0.264678955078125, -0.24891281127929688, -0.23314666748046875, -0.21738052368164062, -0.2016143798828125, -0.18584823608398438, -0.17008209228515625, -0.15431594848632812, -0.1385498046875, -0.12278366088867188, -0.10701751708984375, -0.09125137329101562, -0.0754852294921875, -0.059719085693359375, -0.04395294189453125, -0.028186798095703125, -0.012420654296875, 0.003345489501953125, 0.01911163330078125, 0.034877777099609375, 0.0506439208984375, 0.06641006469726562, 0.08217620849609375, 0.09794235229492188, 0.11370849609375, 0.12947463989257812, 0.14524078369140625, 0.16100692749023438, 0.1767730712890625, 0.19253921508789062, 0.20830535888671875, 0.22407150268554688, 0.239837646484375, 0.2556037902832031, 0.27136993408203125, 0.2871360778808594, 0.3029022216796875, 0.3186683654785156, 0.33443450927734375, 0.3502006530761719, 0.365966796875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 51.0, 877.0, 69.0, 5.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.579231262207031, -9.342940330505371, -9.106649398803711, -8.870357513427734, -8.634066581726074, -8.397775650024414, -8.161483764648438, -7.925192832946777, -7.688901901245117, -7.452610969543457, -7.216319561004639, -6.98002815246582, -6.74373722076416, -6.5074462890625, -6.271154880523682, -6.034863471984863, -5.798572540283203, -5.562281608581543, -5.325990200042725, -5.089698791503906, -4.853407859802246, -4.617116928100586, -4.380825519561768, -4.144534111022949, -3.908243179321289, -3.67195200920105, -3.4356608390808105, -3.1993696689605713, -2.963078498840332, -2.7267873287200928, -2.4904961585998535, -2.2542049884796143, -2.017913818359375, -1.7816226482391357, -1.5453314781188965, -1.3090403079986572, -1.072749137878418, -0.8364579677581787, -0.6001667976379395, -0.3638756275177002, -0.12758445739746094, 0.10870671272277832, 0.3449978828430176, 0.5812890529632568, 0.8175802230834961, 1.0538713932037354, 1.2901625633239746, 1.5264537334442139, 1.7627449035644531, 1.9990360736846924, 2.2353272438049316, 2.471618413925171, 2.70790958404541, 2.9442007541656494, 3.1804919242858887, 3.416783094406128, 3.653074264526367, 3.8893654346466064, 4.125656604766846, 4.361948013305664, 4.598238945007324, 4.834529876708984, 5.070821285247803, 5.307112693786621, 5.543403625488281]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 11.0, 16.0, 22.0, 31.0, 42.0, 67.0, 77.0, 72.0, 80.0, 80.0, 87.0, 79.0, 77.0, 69.0, 54.0, 36.0, 38.0, 27.0, 16.0, 9.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7951920628547668, -0.7656492590904236, -0.7361063957214355, -0.7065635919570923, -0.677020788192749, -0.6474779844284058, -0.6179351806640625, -0.5883923172950745, -0.5588495135307312, -0.5293067097663879, -0.4997638761997223, -0.47022104263305664, -0.4406782388687134, -0.4111354351043701, -0.38159260153770447, -0.3520497679710388, -0.32250696420669556, -0.2929641604423523, -0.26342132687568665, -0.2338785082101822, -0.20433568954467773, -0.17479287087917328, -0.14525005221366882, -0.11570723354816437, -0.08616441488265991, -0.05662159621715546, -0.027078777551651, 0.0024640411138534546, 0.03200685977935791, 0.061549678444862366, 0.09109249711036682, 0.12063531577587128, 0.1501781940460205, 0.17972101271152496, 0.20926383137702942, 0.23880665004253387, 0.26834946870803833, 0.2978922724723816, 0.32743510603904724, 0.3569779396057129, 0.38652074337005615, 0.4160635471343994, 0.44560638070106506, 0.4751492142677307, 0.504692018032074, 0.5342348217964172, 0.5637776851654053, 0.5933204889297485, 0.6228632926940918, 0.6524060964584351, 0.6819489002227783, 0.7114917635917664, 0.7410345673561096, 0.7705773711204529, 0.8001202344894409, 0.8296630382537842, 0.8592058420181274, 0.8887486457824707, 0.918291449546814, 0.947834312915802, 0.9773771166801453, 1.0069199800491333, 1.0364627838134766, 1.0660055875778198, 1.095548391342163]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 16.0, 15.0, 18.0, 37.0, 36.0, 42.0, 65.0, 89.0, 149.0, 238.0, 390.0, 655.0, 1145.0, 2503.0, 7058.0, 23284.0, 100318.0, 575891.0, 268951.0, 46848.0, 12754.0, 4262.0, 1685.0, 801.0, 487.0, 279.0, 173.0, 102.0, 92.0, 39.0, 35.0, 28.0, 20.0, 12.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.472900390625, -0.4545402526855469, -0.43618011474609375, -0.4178199768066406, -0.3994598388671875, -0.3810997009277344, -0.36273956298828125, -0.3443794250488281, -0.326019287109375, -0.3076591491699219, -0.28929901123046875, -0.2709388732910156, -0.2525787353515625, -0.23421859741210938, -0.21585845947265625, -0.19749832153320312, -0.17913818359375, -0.16077804565429688, -0.14241790771484375, -0.12405776977539062, -0.1056976318359375, -0.08733749389648438, -0.06897735595703125, -0.050617218017578125, -0.032257080078125, -0.013896942138671875, 0.00446319580078125, 0.022823333740234375, 0.0411834716796875, 0.059543609619140625, 0.07790374755859375, 0.09626388549804688, 0.1146240234375, 0.13298416137695312, 0.15134429931640625, 0.16970443725585938, 0.1880645751953125, 0.20642471313476562, 0.22478485107421875, 0.24314498901367188, 0.261505126953125, 0.2798652648925781, 0.29822540283203125, 0.3165855407714844, 0.3349456787109375, 0.3533058166503906, 0.37166595458984375, 0.3900260925292969, 0.40838623046875, 0.4267463684082031, 0.44510650634765625, 0.4634666442871094, 0.4818267822265625, 0.5001869201660156, 0.5185470581054688, 0.5369071960449219, 0.555267333984375, 0.5736274719238281, 0.5919876098632812, 0.6103477478027344, 0.6287078857421875, 0.6470680236816406, 0.6654281616210938, 0.6837882995605469, 0.7021484375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 8.0, 6.0, 13.0, 27.0, 22.0, 25.0, 50.0, 57.0, 54.0, 60.0, 82.0, 85.0, 92.0, 80.0, 65.0, 55.0, 55.0, 45.0, 28.0, 32.0, 25.0, 5.0, 16.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10821533203125, -0.10307979583740234, -0.09794425964355469, -0.09280872344970703, -0.08767318725585938, -0.08253765106201172, -0.07740211486816406, -0.0722665786743164, -0.06713104248046875, -0.061995506286621094, -0.05685997009277344, -0.05172443389892578, -0.046588897705078125, -0.04145336151123047, -0.03631782531738281, -0.031182289123535156, -0.0260467529296875, -0.020911216735839844, -0.015775680541992188, -0.010640144348144531, -0.005504608154296875, -0.00036907196044921875, 0.0047664642333984375, 0.009902000427246094, 0.01503753662109375, 0.020173072814941406, 0.025308609008789062, 0.03044414520263672, 0.035579681396484375, 0.04071521759033203, 0.04585075378417969, 0.050986289978027344, 0.056121826171875, 0.061257362365722656, 0.06639289855957031, 0.07152843475341797, 0.07666397094726562, 0.08179950714111328, 0.08693504333496094, 0.0920705795288086, 0.09720611572265625, 0.1023416519165039, 0.10747718811035156, 0.11261272430419922, 0.11774826049804688, 0.12288379669189453, 0.1280193328857422, 0.13315486907958984, 0.1382904052734375, 0.14342594146728516, 0.1485614776611328, 0.15369701385498047, 0.15883255004882812, 0.16396808624267578, 0.16910362243652344, 0.1742391586303711, 0.17937469482421875, 0.1845102310180664, 0.18964576721191406, 0.19478130340576172, 0.19991683959960938, 0.20505237579345703, 0.2101879119873047, 0.21532344818115234, 0.220458984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 6.0, 14.0, 17.0, 22.0, 29.0, 56.0, 80.0, 107.0, 237.0, 431.0, 982.0, 2425.0, 7258.0, 28649.0, 207456.0, 686674.0, 89642.0, 16478.0, 4666.0, 1689.0, 760.0, 352.0, 188.0, 109.0, 64.0, 35.0, 29.0, 25.0, 14.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67333984375, -0.6495590209960938, -0.6257781982421875, -0.6019973754882812, -0.578216552734375, -0.5544357299804688, -0.5306549072265625, -0.5068740844726562, -0.48309326171875, -0.45931243896484375, -0.4355316162109375, -0.41175079345703125, -0.387969970703125, -0.36418914794921875, -0.3404083251953125, -0.31662750244140625, -0.2928466796875, -0.26906585693359375, -0.2452850341796875, -0.22150421142578125, -0.197723388671875, -0.17394256591796875, -0.1501617431640625, -0.12638092041015625, -0.10260009765625, -0.07881927490234375, -0.0550384521484375, -0.03125762939453125, -0.007476806640625, 0.01630401611328125, 0.0400848388671875, 0.06386566162109375, 0.087646484375, 0.11142730712890625, 0.1352081298828125, 0.15898895263671875, 0.182769775390625, 0.20655059814453125, 0.2303314208984375, 0.25411224365234375, 0.27789306640625, 0.30167388916015625, 0.3254547119140625, 0.34923553466796875, 0.373016357421875, 0.39679718017578125, 0.4205780029296875, 0.44435882568359375, 0.4681396484375, 0.49192047119140625, 0.5157012939453125, 0.5394821166992188, 0.563262939453125, 0.5870437622070312, 0.6108245849609375, 0.6346054077148438, 0.65838623046875, 0.6821670532226562, 0.7059478759765625, 0.7297286987304688, 0.753509521484375, 0.7772903442382812, 0.8010711669921875, 0.8248519897460938, 0.8486328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 9.0, 8.0, 15.0, 14.0, 19.0, 31.0, 30.0, 43.0, 49.0, 49.0, 55.0, 59.0, 78.0, 76.0, 60.0, 75.0, 51.0, 55.0, 43.0, 31.0, 22.0, 27.0, 16.0, 17.0, 9.0, 9.0, 4.0, 10.0, 6.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57421875, -0.5531234741210938, -0.5320281982421875, -0.5109329223632812, -0.489837646484375, -0.46874237060546875, -0.4476470947265625, -0.42655181884765625, -0.40545654296875, -0.38436126708984375, -0.3632659912109375, -0.34217071533203125, -0.321075439453125, -0.29998016357421875, -0.2788848876953125, -0.25778961181640625, -0.2366943359375, -0.21559906005859375, -0.1945037841796875, -0.17340850830078125, -0.152313232421875, -0.13121795654296875, -0.1101226806640625, -0.08902740478515625, -0.06793212890625, -0.04683685302734375, -0.0257415771484375, -0.00464630126953125, 0.016448974609375, 0.03754425048828125, 0.0586395263671875, 0.07973480224609375, 0.100830078125, 0.12192535400390625, 0.1430206298828125, 0.16411590576171875, 0.185211181640625, 0.20630645751953125, 0.2274017333984375, 0.24849700927734375, 0.26959228515625, 0.29068756103515625, 0.3117828369140625, 0.33287811279296875, 0.353973388671875, 0.37506866455078125, 0.3961639404296875, 0.41725921630859375, 0.4383544921875, 0.45944976806640625, 0.4805450439453125, 0.5016403198242188, 0.522735595703125, 0.5438308715820312, 0.5649261474609375, 0.5860214233398438, 0.60711669921875, 0.6282119750976562, 0.6493072509765625, 0.6704025268554688, 0.691497802734375, 0.7125930786132812, 0.7336883544921875, 0.7547836303710938, 0.77587890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 11.0, 9.0, 23.0, 33.0, 60.0, 104.0, 154.0, 311.0, 792.0, 2363.0, 12536.0, 424421.0, 588699.0, 14799.0, 2571.0, 818.0, 383.0, 168.0, 109.0, 60.0, 39.0, 21.0, 17.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.398193359375, -0.3853645324707031, -0.37253570556640625, -0.3597068786621094, -0.3468780517578125, -0.3340492248535156, -0.32122039794921875, -0.3083915710449219, -0.295562744140625, -0.2827339172363281, -0.26990509033203125, -0.2570762634277344, -0.2442474365234375, -0.23141860961914062, -0.21858978271484375, -0.20576095581054688, -0.19293212890625, -0.18010330200195312, -0.16727447509765625, -0.15444564819335938, -0.1416168212890625, -0.12878799438476562, -0.11595916748046875, -0.10313034057617188, -0.090301513671875, -0.07747268676757812, -0.06464385986328125, -0.051815032958984375, -0.0389862060546875, -0.026157379150390625, -0.01332855224609375, -0.000499725341796875, 0.0123291015625, 0.025157928466796875, 0.03798675537109375, 0.050815582275390625, 0.0636444091796875, 0.07647323608398438, 0.08930206298828125, 0.10213088989257812, 0.114959716796875, 0.12778854370117188, 0.14061737060546875, 0.15344619750976562, 0.1662750244140625, 0.17910385131835938, 0.19193267822265625, 0.20476150512695312, 0.21759033203125, 0.23041915893554688, 0.24324798583984375, 0.2560768127441406, 0.2689056396484375, 0.2817344665527344, 0.29456329345703125, 0.3073921203613281, 0.320220947265625, 0.3330497741699219, 0.34587860107421875, 0.3587074279785156, 0.3715362548828125, 0.3843650817871094, 0.39719390869140625, 0.4100227355957031, 0.4228515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 14.0, 15.0, 30.0, 44.0, 73.0, 121.0, 157.0, 150.0, 111.0, 92.0, 72.0, 43.0, 24.0, 14.0, 9.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.89354133605957e-05, -4.780478775501251e-05, -4.667416214942932e-05, -4.554353654384613e-05, -4.441291093826294e-05, -4.328228533267975e-05, -4.215165972709656e-05, -4.102103412151337e-05, -3.9890408515930176e-05, -3.8759782910346985e-05, -3.7629157304763794e-05, -3.64985316991806e-05, -3.536790609359741e-05, -3.423728048801422e-05, -3.310665488243103e-05, -3.197602927684784e-05, -3.084540367126465e-05, -2.9714778065681458e-05, -2.8584152460098267e-05, -2.7453526854515076e-05, -2.6322901248931885e-05, -2.5192275643348694e-05, -2.4061650037765503e-05, -2.2931024432182312e-05, -2.180039882659912e-05, -2.066977322101593e-05, -1.953914761543274e-05, -1.840852200984955e-05, -1.7277896404266357e-05, -1.6147270798683167e-05, -1.5016645193099976e-05, -1.3886019587516785e-05, -1.2755393981933594e-05, -1.1624768376350403e-05, -1.0494142770767212e-05, -9.363517165184021e-06, -8.23289155960083e-06, -7.102265954017639e-06, -5.971640348434448e-06, -4.841014742851257e-06, -3.7103891372680664e-06, -2.5797635316848755e-06, -1.4491379261016846e-06, -3.1851232051849365e-07, 8.121132850646973e-07, 1.942738890647888e-06, 3.073364496231079e-06, 4.20399010181427e-06, 5.334615707397461e-06, 6.465241312980652e-06, 7.595866918563843e-06, 8.726492524147034e-06, 9.857118129730225e-06, 1.0987743735313416e-05, 1.2118369340896606e-05, 1.3248994946479797e-05, 1.4379620552062988e-05, 1.551024615764618e-05, 1.664087176322937e-05, 1.777149736881256e-05, 1.8902122974395752e-05, 2.0032748579978943e-05, 2.1163374185562134e-05, 2.2293999791145325e-05, 2.3424625396728516e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 15.0, 20.0, 18.0, 42.0, 73.0, 129.0, 311.0, 815.0, 3148.0, 28623.0, 914507.0, 93365.0, 5518.0, 1178.0, 412.0, 179.0, 77.0, 42.0, 24.0, 16.0, 15.0, 5.0, 7.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.484130859375, -0.471923828125, -0.459716796875, -0.447509765625, -0.435302734375, -0.423095703125, -0.410888671875, -0.398681640625, -0.386474609375, -0.374267578125, -0.362060546875, -0.349853515625, -0.337646484375, -0.325439453125, -0.313232421875, -0.301025390625, -0.288818359375, -0.276611328125, -0.264404296875, -0.252197265625, -0.239990234375, -0.227783203125, -0.215576171875, -0.203369140625, -0.191162109375, -0.178955078125, -0.166748046875, -0.154541015625, -0.142333984375, -0.130126953125, -0.117919921875, -0.105712890625, -0.093505859375, -0.081298828125, -0.069091796875, -0.056884765625, -0.044677734375, -0.032470703125, -0.020263671875, -0.008056640625, 0.004150390625, 0.016357421875, 0.028564453125, 0.040771484375, 0.052978515625, 0.065185546875, 0.077392578125, 0.089599609375, 0.101806640625, 0.114013671875, 0.126220703125, 0.138427734375, 0.150634765625, 0.162841796875, 0.175048828125, 0.187255859375, 0.199462890625, 0.211669921875, 0.223876953125, 0.236083984375, 0.248291015625, 0.260498046875, 0.272705078125, 0.284912109375, 0.297119140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 12.0, 13.0, 27.0, 34.0, 55.0, 116.0, 193.0, 206.0, 145.0, 89.0, 46.0, 23.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.413818359375, -0.4048786163330078, -0.3959388732910156, -0.38699913024902344, -0.37805938720703125, -0.36911964416503906, -0.3601799011230469, -0.3512401580810547, -0.3423004150390625, -0.3333606719970703, -0.3244209289550781, -0.31548118591308594, -0.30654144287109375, -0.29760169982910156, -0.2886619567871094, -0.2797222137451172, -0.270782470703125, -0.2618427276611328, -0.2529029846191406, -0.24396324157714844, -0.23502349853515625, -0.22608375549316406, -0.21714401245117188, -0.2082042694091797, -0.1992645263671875, -0.1903247833251953, -0.18138504028320312, -0.17244529724121094, -0.16350555419921875, -0.15456581115722656, -0.14562606811523438, -0.1366863250732422, -0.12774658203125, -0.11880683898925781, -0.10986709594726562, -0.10092735290527344, -0.09198760986328125, -0.08304786682128906, -0.07410812377929688, -0.06516838073730469, -0.0562286376953125, -0.04728889465332031, -0.038349151611328125, -0.029409408569335938, -0.02046966552734375, -0.011529922485351562, -0.002590179443359375, 0.0063495635986328125, 0.015289306640625, 0.024229049682617188, 0.033168792724609375, 0.04210853576660156, 0.05104827880859375, 0.05998802185058594, 0.06892776489257812, 0.07786750793457031, 0.0868072509765625, 0.09574699401855469, 0.10468673706054688, 0.11362648010253906, 0.12256622314453125, 0.13150596618652344, 0.14044570922851562, 0.1493854522705078, 0.1583251953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 17.0, 47.0, 176.0, 471.0, 203.0, 56.0, 17.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7482404708862305, -3.4502804279327393, -3.152320384979248, -2.854360342025757, -2.5564002990722656, -2.2584402561187744, -1.9604802131652832, -1.662520170211792, -1.3645601272583008, -1.0666000843048096, -0.7686400413513184, -0.47067999839782715, -0.17271995544433594, 0.12524008750915527, 0.4232001304626465, 0.7211601734161377, 1.019120216369629, 1.3170802593231201, 1.6150403022766113, 1.9130003452301025, 2.2109603881835938, 2.508920431137085, 2.806880474090576, 3.1048405170440674, 3.4028005599975586, 3.70076060295105, 3.998720645904541, 4.296680450439453, 4.594640731811523, 4.892601013183594, 5.190560817718506, 5.488520622253418, 5.786481857299805, 6.084442138671875, 6.382401943206787, 6.680361747741699, 6.9783220291137695, 7.27628231048584, 7.574242115020752, 7.872201919555664, 8.170162200927734, 8.468122482299805, 8.766082763671875, 9.064042091369629, 9.3620023727417, 9.65996265411377, 9.957921981811523, 10.255882263183594, 10.553842544555664, 10.851802825927734, 11.149763107299805, 11.447722434997559, 11.745682716369629, 12.0436429977417, 12.341602325439453, 12.639562606811523, 12.937522888183594, 13.235483169555664, 13.533443450927734, 13.831402778625488, 14.129363059997559, 14.427323341369629, 14.725282669067383, 15.023242950439453, 15.321203231811523]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 7.0, 10.0, 13.0, 6.0, 11.0, 10.0, 24.0, 22.0, 26.0, 23.0, 31.0, 27.0, 37.0, 45.0, 54.0, 44.0, 47.0, 53.0, 47.0, 52.0, 53.0, 54.0, 41.0, 29.0, 41.0, 26.0, 31.0, 24.0, 12.0, 14.0, 19.0, 13.0, 5.0, 8.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0459728240966797, -2.943551778793335, -2.8411309719085693, -2.7387099266052246, -2.636289119720459, -2.5338680744171143, -2.4314470291137695, -2.329026222229004, -2.226605176925659, -2.1241841316223145, -2.021763324737549, -1.919342279434204, -1.816921353340149, -1.7145004272460938, -1.6120795011520386, -1.5096585750579834, -1.4072376489639282, -1.304816722869873, -1.2023957967758179, -1.0999748706817627, -0.997553825378418, -0.8951328992843628, -0.7927119731903076, -0.6902909874916077, -0.5878700613975525, -0.4854491055011749, -0.38302814960479736, -0.2806072235107422, -0.17818626761436462, -0.07576531171798706, 0.026655614376068115, 0.12907660007476807, 0.23149752616882324, 0.3339184820652008, 0.43633943796157837, 0.5387603640556335, 0.6411813497543335, 0.7436022758483887, 0.8460232019424438, 0.9484441876411438, 1.0508651733398438, 1.153286099433899, 1.255707025527954, 1.3581280708312988, 1.460548996925354, 1.5629699230194092, 1.6653908491134644, 1.7678117752075195, 1.8702327013015747, 1.9726536273956299, 2.0750746726989746, 2.1774954795837402, 2.279916524887085, 2.3823375701904297, 2.4847583770751953, 2.58717942237854, 2.6896002292633057, 2.7920212745666504, 2.894442081451416, 2.9968631267547607, 3.0992839336395264, 3.201704978942871, 3.3041257858276367, 3.4065468311309814, 3.508967876434326]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 14.0, 11.0, 28.0, 38.0, 60.0, 89.0, 152.0, 271.0, 512.0, 956.0, 2053.0, 4815.0, 14754.0, 74741.0, 3726191.0, 325265.0, 29724.0, 8209.0, 3077.0, 1470.0, 754.0, 416.0, 208.0, 139.0, 101.0, 60.0, 44.0, 29.0, 26.0, 18.0, 10.0, 5.0, 6.0, 7.0, 1.0, 6.0, 8.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6582183837890625, -0.627960205078125, -0.5977020263671875, -0.56744384765625, -0.5371856689453125, -0.506927490234375, -0.4766693115234375, -0.4464111328125, -0.4161529541015625, -0.385894775390625, -0.3556365966796875, -0.32537841796875, -0.2951202392578125, -0.264862060546875, -0.2346038818359375, -0.204345703125, -0.1740875244140625, -0.143829345703125, -0.1135711669921875, -0.08331298828125, -0.0530548095703125, -0.022796630859375, 0.0074615478515625, 0.0377197265625, 0.0679779052734375, 0.098236083984375, 0.1284942626953125, 0.15875244140625, 0.1890106201171875, 0.219268798828125, 0.2495269775390625, 0.27978515625, 0.3100433349609375, 0.340301513671875, 0.3705596923828125, 0.40081787109375, 0.4310760498046875, 0.461334228515625, 0.4915924072265625, 0.5218505859375, 0.5521087646484375, 0.582366943359375, 0.6126251220703125, 0.64288330078125, 0.6731414794921875, 0.703399658203125, 0.7336578369140625, 0.763916015625, 0.7941741943359375, 0.824432373046875, 0.8546905517578125, 0.88494873046875, 0.9152069091796875, 0.945465087890625, 0.9757232666015625, 1.0059814453125, 1.0362396240234375, 1.066497802734375, 1.0967559814453125, 1.12701416015625, 1.1572723388671875, 1.187530517578125, 1.2177886962890625, 1.248046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 13.0, 11.0, 23.0, 21.0, 24.0, 45.0, 53.0, 61.0, 53.0, 80.0, 88.0, 75.0, 84.0, 62.0, 56.0, 50.0, 44.0, 44.0, 30.0, 28.0, 19.0, 8.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11968994140625, -0.11406803131103516, -0.10844612121582031, -0.10282421112060547, -0.09720230102539062, -0.09158039093017578, -0.08595848083496094, -0.0803365707397461, -0.07471466064453125, -0.0690927505493164, -0.06347084045410156, -0.05784893035888672, -0.052227020263671875, -0.04660511016845703, -0.04098320007324219, -0.035361289978027344, -0.0297393798828125, -0.024117469787597656, -0.018495559692382812, -0.012873649597167969, -0.007251739501953125, -0.0016298294067382812, 0.0039920806884765625, 0.009613990783691406, 0.01523590087890625, 0.020857810974121094, 0.026479721069335938, 0.03210163116455078, 0.037723541259765625, 0.04334545135498047, 0.04896736145019531, 0.054589271545410156, 0.060211181640625, 0.06583309173583984, 0.07145500183105469, 0.07707691192626953, 0.08269882202148438, 0.08832073211669922, 0.09394264221191406, 0.0995645523071289, 0.10518646240234375, 0.1108083724975586, 0.11643028259277344, 0.12205219268798828, 0.12767410278320312, 0.13329601287841797, 0.1389179229736328, 0.14453983306884766, 0.1501617431640625, 0.15578365325927734, 0.1614055633544922, 0.16702747344970703, 0.17264938354492188, 0.17827129364013672, 0.18389320373535156, 0.1895151138305664, 0.19513702392578125, 0.2007589340209961, 0.20638084411621094, 0.21200275421142578, 0.21762466430664062, 0.22324657440185547, 0.2288684844970703, 0.23449039459228516, 0.2401123046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 6.0, 15.0, 28.0, 19.0, 45.0, 91.0, 232.0, 569.0, 2152.0, 15763.0, 4073019.0, 94952.0, 5309.0, 1204.0, 423.0, 175.0, 85.0, 62.0, 47.0, 31.0, 17.0, 10.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.242279052734375, -1.17596435546875, -1.109649658203125, -1.0433349609375, -0.977020263671875, -0.91070556640625, -0.844390869140625, -0.778076171875, -0.711761474609375, -0.64544677734375, -0.579132080078125, -0.5128173828125, -0.446502685546875, -0.38018798828125, -0.313873291015625, -0.24755859375, -0.181243896484375, -0.11492919921875, -0.048614501953125, 0.0177001953125, 0.084014892578125, 0.15032958984375, 0.216644287109375, 0.282958984375, 0.349273681640625, 0.41558837890625, 0.481903076171875, 0.5482177734375, 0.614532470703125, 0.68084716796875, 0.747161865234375, 0.8134765625, 0.879791259765625, 0.94610595703125, 1.012420654296875, 1.0787353515625, 1.145050048828125, 1.21136474609375, 1.277679443359375, 1.343994140625, 1.410308837890625, 1.47662353515625, 1.542938232421875, 1.6092529296875, 1.675567626953125, 1.74188232421875, 1.808197021484375, 1.87451171875, 1.940826416015625, 2.00714111328125, 2.073455810546875, 2.1397705078125, 2.206085205078125, 2.27239990234375, 2.338714599609375, 2.405029296875, 2.471343994140625, 2.53765869140625, 2.603973388671875, 2.6702880859375, 2.736602783203125, 2.80291748046875, 2.869232177734375, 2.935546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 17.0, 27.0, 79.0, 230.0, 2730.0, 723.0, 126.0, 58.0, 21.0, 15.0, 12.0, 10.0, 7.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298828125, -0.27716064453125, -0.2554931640625, -0.23382568359375, -0.212158203125, -0.19049072265625, -0.1688232421875, -0.14715576171875, -0.12548828125, -0.10382080078125, -0.0821533203125, -0.06048583984375, -0.038818359375, -0.01715087890625, 0.0045166015625, 0.02618408203125, 0.0478515625, 0.06951904296875, 0.0911865234375, 0.11285400390625, 0.134521484375, 0.15618896484375, 0.1778564453125, 0.19952392578125, 0.22119140625, 0.24285888671875, 0.2645263671875, 0.28619384765625, 0.307861328125, 0.32952880859375, 0.3511962890625, 0.37286376953125, 0.39453125, 0.41619873046875, 0.4378662109375, 0.45953369140625, 0.481201171875, 0.50286865234375, 0.5245361328125, 0.54620361328125, 0.56787109375, 0.58953857421875, 0.6112060546875, 0.63287353515625, 0.654541015625, 0.67620849609375, 0.6978759765625, 0.71954345703125, 0.7412109375, 0.76287841796875, 0.7845458984375, 0.80621337890625, 0.827880859375, 0.84954833984375, 0.8712158203125, 0.89288330078125, 0.91455078125, 0.93621826171875, 0.9578857421875, 0.97955322265625, 1.001220703125, 1.02288818359375, 1.0445556640625, 1.06622314453125, 1.087890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 37.0, 74.0, 187.0, 335.0, 206.0, 79.0, 38.0, 16.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.143627882003784, -2.0527660846710205, -1.9619044065475464, -1.8710427284240723, -1.7801809310913086, -1.689319133758545, -1.5984574556350708, -1.5075957775115967, -1.416733980178833, -1.3258721828460693, -1.2350105047225952, -1.144148826599121, -1.0532870292663574, -0.9624252915382385, -0.8715635538101196, -0.7807018160820007, -0.6898400783538818, -0.5989783406257629, -0.508116602897644, -0.41725486516952515, -0.32639312744140625, -0.23553138971328735, -0.14466965198516846, -0.05380791425704956, 0.037053823471069336, 0.12791556119918823, 0.21877729892730713, 0.309639036655426, 0.4005007743835449, 0.4913625121116638, 0.5822242498397827, 0.6730859875679016, 0.7639479637145996, 0.8548097014427185, 0.9456714391708374, 1.0365331172943115, 1.1273949146270752, 1.2182567119598389, 1.309118390083313, 1.399980068206787, 1.4908418655395508, 1.5817036628723145, 1.6725653409957886, 1.7634270191192627, 1.8542888164520264, 1.94515061378479, 2.0360121726989746, 2.1268739700317383, 2.217735767364502, 2.3085975646972656, 2.3994593620300293, 2.490320920944214, 2.5811827182769775, 2.672044515609741, 2.762906074523926, 2.8537678718566895, 2.944629669189453, 3.035491466522217, 3.1263532638549805, 3.217214822769165, 3.3080766201019287, 3.3989384174346924, 3.489799976348877, 3.5806617736816406, 3.6715235710144043]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 20.0, 35.0, 39.0, 64.0, 90.0, 96.0, 104.0, 104.0, 111.0, 107.0, 72.0, 49.0, 48.0, 20.0, 5.0, 10.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.661919593811035, -2.5783746242523193, -2.4948296546936035, -2.4112846851348877, -2.327739715576172, -2.244194746017456, -2.1606497764587402, -2.0771048069000244, -1.9935598373413086, -1.9100148677825928, -1.826469898223877, -1.7429249286651611, -1.6593799591064453, -1.5758349895477295, -1.4922900199890137, -1.4087450504302979, -1.3252002000808716, -1.2416552305221558, -1.15811026096344, -1.0745652914047241, -0.9910203218460083, -0.9074753522872925, -0.8239304423332214, -0.7403854727745056, -0.6568405032157898, -0.573295533657074, -0.48975056409835815, -0.4062056243419647, -0.3226606547832489, -0.23911568522453308, -0.15557074546813965, -0.07202577590942383, 0.011519193649291992, 0.09506415575742722, 0.17860911786556244, 0.26215407252311707, 0.3456990420818329, 0.4292440116405487, 0.5127889513969421, 0.596333920955658, 0.6798788905143738, 0.7634238600730896, 0.8469688296318054, 0.9305137395858765, 1.0140587091445923, 1.097603678703308, 1.181148648262024, 1.2646936178207397, 1.3482385873794556, 1.4317835569381714, 1.5153285264968872, 1.598873496055603, 1.6824184656143188, 1.7659634351730347, 1.849508285522461, 1.9330532550811768, 2.0165982246398926, 2.1001431941986084, 2.183688163757324, 2.26723313331604, 2.350778102874756, 2.4343230724334717, 2.5178680419921875, 2.6014130115509033, 2.684957981109619]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 9.0, 5.0, 9.0, 17.0, 17.0, 13.0, 25.0, 41.0, 41.0, 70.0, 111.0, 166.0, 288.0, 526.0, 959.0, 2240.0, 6322.0, 23412.0, 119175.0, 641237.0, 204378.0, 35157.0, 8615.0, 2933.0, 1269.0, 615.0, 335.0, 183.0, 122.0, 68.0, 42.0, 38.0, 25.0, 33.0, 20.0, 15.0, 4.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7980499267578125, -0.774322509765625, -0.7505950927734375, -0.72686767578125, -0.7031402587890625, -0.679412841796875, -0.6556854248046875, -0.6319580078125, -0.6082305908203125, -0.584503173828125, -0.5607757568359375, -0.53704833984375, -0.5133209228515625, -0.489593505859375, -0.4658660888671875, -0.442138671875, -0.4184112548828125, -0.394683837890625, -0.3709564208984375, -0.34722900390625, -0.3235015869140625, -0.299774169921875, -0.2760467529296875, -0.2523193359375, -0.2285919189453125, -0.204864501953125, -0.1811370849609375, -0.15740966796875, -0.1336822509765625, -0.109954833984375, -0.0862274169921875, -0.0625, -0.0387725830078125, -0.015045166015625, 0.0086822509765625, 0.03240966796875, 0.0561370849609375, 0.079864501953125, 0.1035919189453125, 0.1273193359375, 0.1510467529296875, 0.174774169921875, 0.1985015869140625, 0.22222900390625, 0.2459564208984375, 0.269683837890625, 0.2934112548828125, 0.317138671875, 0.3408660888671875, 0.364593505859375, 0.3883209228515625, 0.41204833984375, 0.4357757568359375, 0.459503173828125, 0.4832305908203125, 0.5069580078125, 0.5306854248046875, 0.554412841796875, 0.5781402587890625, 0.60186767578125, 0.6255950927734375, 0.649322509765625, 0.6730499267578125, 0.69677734375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 8.0, 24.0, 20.0, 43.0, 54.0, 68.0, 93.0, 98.0, 119.0, 95.0, 88.0, 78.0, 55.0, 58.0, 42.0, 21.0, 10.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14321517944335938, -0.13555145263671875, -0.12788772583007812, -0.1202239990234375, -0.11256027221679688, -0.10489654541015625, -0.09723281860351562, -0.089569091796875, -0.08190536499023438, -0.07424163818359375, -0.06657791137695312, -0.0589141845703125, -0.051250457763671875, -0.04358673095703125, -0.035923004150390625, -0.02825927734375, -0.020595550537109375, -0.01293182373046875, -0.005268096923828125, 0.0023956298828125, 0.010059356689453125, 0.01772308349609375, 0.025386810302734375, 0.033050537109375, 0.040714263916015625, 0.04837799072265625, 0.056041717529296875, 0.0637054443359375, 0.07136917114257812, 0.07903289794921875, 0.08669662475585938, 0.0943603515625, 0.10202407836914062, 0.10968780517578125, 0.11735153198242188, 0.1250152587890625, 0.13267898559570312, 0.14034271240234375, 0.14800643920898438, 0.155670166015625, 0.16333389282226562, 0.17099761962890625, 0.17866134643554688, 0.1863250732421875, 0.19398880004882812, 0.20165252685546875, 0.20931625366210938, 0.21697998046875, 0.22464370727539062, 0.23230743408203125, 0.23997116088867188, 0.2476348876953125, 0.2552986145019531, 0.26296234130859375, 0.2706260681152344, 0.278289794921875, 0.2859535217285156, 0.29361724853515625, 0.3012809753417969, 0.3089447021484375, 0.3166084289550781, 0.32427215576171875, 0.3319358825683594, 0.339599609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 17.0, 10.0, 38.0, 43.0, 51.0, 71.0, 127.0, 176.0, 294.0, 515.0, 945.0, 1918.0, 3986.0, 9265.0, 22677.0, 63959.0, 230935.0, 471991.0, 160876.0, 48394.0, 18034.0, 7456.0, 3210.0, 1578.0, 822.0, 422.0, 258.0, 154.0, 123.0, 60.0, 44.0, 31.0, 15.0, 9.0, 9.0, 8.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38623046875, -0.3726158142089844, -0.35900115966796875, -0.3453865051269531, -0.3317718505859375, -0.3181571960449219, -0.30454254150390625, -0.2909278869628906, -0.277313232421875, -0.2636985778808594, -0.25008392333984375, -0.23646926879882812, -0.2228546142578125, -0.20923995971679688, -0.19562530517578125, -0.18201065063476562, -0.16839599609375, -0.15478134155273438, -0.14116668701171875, -0.12755203247070312, -0.1139373779296875, -0.10032272338867188, -0.08670806884765625, -0.07309341430664062, -0.059478759765625, -0.045864105224609375, -0.03224945068359375, -0.018634796142578125, -0.0050201416015625, 0.008594512939453125, 0.02220916748046875, 0.035823822021484375, 0.0494384765625, 0.06305313110351562, 0.07666778564453125, 0.09028244018554688, 0.1038970947265625, 0.11751174926757812, 0.13112640380859375, 0.14474105834960938, 0.158355712890625, 0.17197036743164062, 0.18558502197265625, 0.19919967651367188, 0.2128143310546875, 0.22642898559570312, 0.24004364013671875, 0.2536582946777344, 0.26727294921875, 0.2808876037597656, 0.29450225830078125, 0.3081169128417969, 0.3217315673828125, 0.3353462219238281, 0.34896087646484375, 0.3625755310058594, 0.376190185546875, 0.3898048400878906, 0.40341949462890625, 0.4170341491699219, 0.4306488037109375, 0.4442634582519531, 0.45787811279296875, 0.4714927673339844, 0.485107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 9.0, 9.0, 11.0, 14.0, 12.0, 15.0, 19.0, 19.0, 26.0, 35.0, 42.0, 33.0, 50.0, 46.0, 54.0, 36.0, 49.0, 52.0, 40.0, 58.0, 46.0, 61.0, 35.0, 30.0, 25.0, 16.0, 28.0, 23.0, 27.0, 14.0, 14.0, 10.0, 5.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.474853515625, -0.4575767517089844, -0.44029998779296875, -0.4230232238769531, -0.4057464599609375, -0.3884696960449219, -0.37119293212890625, -0.3539161682128906, -0.336639404296875, -0.3193626403808594, -0.30208587646484375, -0.2848091125488281, -0.2675323486328125, -0.2502555847167969, -0.23297882080078125, -0.21570205688476562, -0.19842529296875, -0.18114852905273438, -0.16387176513671875, -0.14659500122070312, -0.1293182373046875, -0.11204147338867188, -0.09476470947265625, -0.07748794555664062, -0.060211181640625, -0.042934417724609375, -0.02565765380859375, -0.008380889892578125, 0.0088958740234375, 0.026172637939453125, 0.04344940185546875, 0.060726165771484375, 0.0780029296875, 0.09527969360351562, 0.11255645751953125, 0.12983322143554688, 0.1471099853515625, 0.16438674926757812, 0.18166351318359375, 0.19894027709960938, 0.216217041015625, 0.23349380493164062, 0.25077056884765625, 0.2680473327636719, 0.2853240966796875, 0.3026008605957031, 0.31987762451171875, 0.3371543884277344, 0.35443115234375, 0.3717079162597656, 0.38898468017578125, 0.4062614440917969, 0.4235382080078125, 0.4408149719238281, 0.45809173583984375, 0.4753684997558594, 0.492645263671875, 0.5099220275878906, 0.5271987915039062, 0.5444755554199219, 0.5617523193359375, 0.5790290832519531, 0.5963058471679688, 0.6135826110839844, 0.630859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 12.0, 15.0, 19.0, 25.0, 41.0, 36.0, 63.0, 107.0, 143.0, 283.0, 431.0, 858.0, 1700.0, 3952.0, 12598.0, 72772.0, 540012.0, 359060.0, 41346.0, 8915.0, 3100.0, 1346.0, 727.0, 371.0, 197.0, 147.0, 76.0, 50.0, 32.0, 13.0, 20.0, 18.0, 11.0, 13.0, 7.0, 5.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158203125, -0.1520862579345703, -0.14596939086914062, -0.13985252380371094, -0.13373565673828125, -0.12761878967285156, -0.12150192260742188, -0.11538505554199219, -0.1092681884765625, -0.10315132141113281, -0.09703445434570312, -0.09091758728027344, -0.08480072021484375, -0.07868385314941406, -0.07256698608398438, -0.06645011901855469, -0.060333251953125, -0.05421638488769531, -0.048099517822265625, -0.04198265075683594, -0.03586578369140625, -0.029748916625976562, -0.023632049560546875, -0.017515182495117188, -0.0113983154296875, -0.0052814483642578125, 0.000835418701171875, 0.0069522857666015625, 0.01306915283203125, 0.019186019897460938, 0.025302886962890625, 0.03141975402832031, 0.03753662109375, 0.04365348815917969, 0.049770355224609375, 0.05588722229003906, 0.06200408935546875, 0.06812095642089844, 0.07423782348632812, 0.08035469055175781, 0.0864715576171875, 0.09258842468261719, 0.09870529174804688, 0.10482215881347656, 0.11093902587890625, 0.11705589294433594, 0.12317276000976562, 0.1292896270751953, 0.135406494140625, 0.1415233612060547, 0.14764022827148438, 0.15375709533691406, 0.15987396240234375, 0.16599082946777344, 0.17210769653320312, 0.1782245635986328, 0.1843414306640625, 0.1904582977294922, 0.19657516479492188, 0.20269203186035156, 0.20880889892578125, 0.21492576599121094, 0.22104263305664062, 0.2271595001220703, 0.2332763671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 6.0, 8.0, 11.0, 17.0, 18.0, 29.0, 39.0, 49.0, 47.0, 53.0, 58.0, 83.0, 77.0, 66.0, 79.0, 59.0, 60.0, 48.0, 47.0, 25.0, 30.0, 19.0, 15.0, 12.0, 9.0, 10.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.4705583453178406e-05, -1.4092773199081421e-05, -1.3479962944984436e-05, -1.2867152690887451e-05, -1.2254342436790466e-05, -1.1641532182693481e-05, -1.1028721928596497e-05, -1.0415911674499512e-05, -9.803101420402527e-06, -9.190291166305542e-06, -8.577480912208557e-06, -7.964670658111572e-06, -7.351860404014587e-06, -6.7390501499176025e-06, -6.126239895820618e-06, -5.513429641723633e-06, -4.900619387626648e-06, -4.287809133529663e-06, -3.6749988794326782e-06, -3.0621886253356934e-06, -2.4493783712387085e-06, -1.8365681171417236e-06, -1.2237578630447388e-06, -6.109476089477539e-07, 1.862645149230957e-09, 6.146728992462158e-07, 1.2274831533432007e-06, 1.8402934074401855e-06, 2.4531036615371704e-06, 3.0659139156341553e-06, 3.67872416973114e-06, 4.291534423828125e-06, 4.90434467792511e-06, 5.517154932022095e-06, 6.12996518611908e-06, 6.7427754402160645e-06, 7.355585694313049e-06, 7.968395948410034e-06, 8.581206202507019e-06, 9.194016456604004e-06, 9.806826710700989e-06, 1.0419636964797974e-05, 1.1032447218894958e-05, 1.1645257472991943e-05, 1.2258067727088928e-05, 1.2870877981185913e-05, 1.3483688235282898e-05, 1.4096498489379883e-05, 1.4709308743476868e-05, 1.5322118997573853e-05, 1.5934929251670837e-05, 1.6547739505767822e-05, 1.7160549759864807e-05, 1.7773360013961792e-05, 1.8386170268058777e-05, 1.8998980522155762e-05, 1.9611790776252747e-05, 2.022460103034973e-05, 2.0837411284446716e-05, 2.14502215385437e-05, 2.2063031792640686e-05, 2.267584204673767e-05, 2.3288652300834656e-05, 2.390146255493164e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 14.0, 13.0, 19.0, 36.0, 45.0, 68.0, 127.0, 234.0, 473.0, 1032.0, 2690.0, 8247.0, 34322.0, 235640.0, 598235.0, 135681.0, 22117.0, 5816.0, 1946.0, 852.0, 408.0, 214.0, 108.0, 68.0, 41.0, 35.0, 15.0, 8.0, 16.0, 5.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1793212890625, -0.17394638061523438, -0.16857147216796875, -0.16319656372070312, -0.1578216552734375, -0.15244674682617188, -0.14707183837890625, -0.14169692993164062, -0.136322021484375, -0.13094711303710938, -0.12557220458984375, -0.12019729614257812, -0.1148223876953125, -0.10944747924804688, -0.10407257080078125, -0.09869766235351562, -0.09332275390625, -0.08794784545898438, -0.08257293701171875, -0.07719802856445312, -0.0718231201171875, -0.06644821166992188, -0.06107330322265625, -0.055698394775390625, -0.050323486328125, -0.044948577880859375, -0.03957366943359375, -0.034198760986328125, -0.0288238525390625, -0.023448944091796875, -0.01807403564453125, -0.012699127197265625, -0.00732421875, -0.001949310302734375, 0.00342559814453125, 0.008800506591796875, 0.0141754150390625, 0.019550323486328125, 0.02492523193359375, 0.030300140380859375, 0.035675048828125, 0.041049957275390625, 0.04642486572265625, 0.051799774169921875, 0.0571746826171875, 0.06254959106445312, 0.06792449951171875, 0.07329940795898438, 0.07867431640625, 0.08404922485351562, 0.08942413330078125, 0.09479904174804688, 0.1001739501953125, 0.10554885864257812, 0.11092376708984375, 0.11629867553710938, 0.121673583984375, 0.12704849243164062, 0.13242340087890625, 0.13779830932617188, 0.1431732177734375, 0.14854812622070312, 0.15392303466796875, 0.15929794311523438, 0.1646728515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 7.0, 8.0, 5.0, 13.0, 16.0, 28.0, 34.0, 41.0, 67.0, 92.0, 91.0, 113.0, 110.0, 88.0, 87.0, 45.0, 46.0, 29.0, 20.0, 12.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.211181640625, -0.2049388885498047, -0.19869613647460938, -0.19245338439941406, -0.18621063232421875, -0.17996788024902344, -0.17372512817382812, -0.1674823760986328, -0.1612396240234375, -0.1549968719482422, -0.14875411987304688, -0.14251136779785156, -0.13626861572265625, -0.13002586364746094, -0.12378311157226562, -0.11754035949707031, -0.111297607421875, -0.10505485534667969, -0.09881210327148438, -0.09256935119628906, -0.08632659912109375, -0.08008384704589844, -0.07384109497070312, -0.06759834289550781, -0.0613555908203125, -0.05511283874511719, -0.048870086669921875, -0.04262733459472656, -0.03638458251953125, -0.030141830444335938, -0.023899078369140625, -0.017656326293945312, -0.01141357421875, -0.0051708221435546875, 0.001071929931640625, 0.0073146820068359375, 0.01355743408203125, 0.019800186157226562, 0.026042938232421875, 0.03228569030761719, 0.0385284423828125, 0.04477119445800781, 0.051013946533203125, 0.05725669860839844, 0.06349945068359375, 0.06974220275878906, 0.07598495483398438, 0.08222770690917969, 0.088470458984375, 0.09471321105957031, 0.10095596313476562, 0.10719871520996094, 0.11344146728515625, 0.11968421936035156, 0.12592697143554688, 0.1321697235107422, 0.1384124755859375, 0.1446552276611328, 0.15089797973632812, 0.15714073181152344, 0.16338348388671875, 0.16962623596191406, 0.17586898803710938, 0.1821117401123047, 0.1883544921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 8.0, 17.0, 37.0, 78.0, 187.0, 347.0, 207.0, 78.0, 16.0, 18.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.164790153503418, -6.9453654289245605, -6.725940704345703, -6.506516456604004, -6.2870917320251465, -6.067667007446289, -5.848242282867432, -5.628817558288574, -5.409393310546875, -5.189968585968018, -4.97054386138916, -4.751119613647461, -4.5316948890686035, -4.312270164489746, -4.092845439910889, -3.8734207153320312, -3.653995990753174, -3.4345712661743164, -3.215146780014038, -2.9957220554351807, -2.7762975692749023, -2.556872844696045, -2.3374481201171875, -2.11802339553833, -1.8985989093780518, -1.6791743040084839, -1.459749698638916, -1.2403249740600586, -1.0209003686904907, -0.8014757633209229, -0.5820510387420654, -0.36262643337249756, -0.1432023048400879, 0.07622233033180237, 0.2956469655036926, 0.5150716304779053, 0.7344962358474731, 0.953920841217041, 1.1733455657958984, 1.3927701711654663, 1.6121947765350342, 1.831619381904602, 2.05104398727417, 2.2704687118530273, 2.4898934364318848, 2.709317922592163, 2.9287426471710205, 3.148167133331299, 3.3675918579101562, 3.5870165824890137, 3.806441068649292, 4.02586555480957, 4.245290279388428, 4.464715003967285, 4.684139728546143, 4.903564453125, 5.122988700866699, 5.342413425445557, 5.561838150024414, 5.781262397766113, 6.000687122344971, 6.220111846923828, 6.4395365715026855, 6.658961296081543, 6.8783860206604]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 11.0, 7.0, 11.0, 13.0, 20.0, 30.0, 26.0, 30.0, 46.0, 54.0, 58.0, 55.0, 53.0, 59.0, 67.0, 52.0, 56.0, 53.0, 51.0, 36.0, 50.0, 36.0, 26.0, 24.0, 15.0, 17.0, 11.0, 10.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.710875988006592, -3.5751142501831055, -3.43935227394104, -3.3035905361175537, -3.1678285598754883, -3.032066822052002, -2.8963050842285156, -2.7605433464050293, -2.624781370162964, -2.4890196323394775, -2.353257656097412, -2.217495918273926, -2.0817341804504395, -1.945972204208374, -1.8102104663848877, -1.6744486093521118, -1.538686752319336, -1.40292489528656, -1.2671630382537842, -1.1314013004302979, -0.995639443397522, -0.8598775863647461, -0.724115788936615, -0.5883539915084839, -0.452592134475708, -0.3168303072452545, -0.18106848001480103, -0.045306652784347534, 0.09045517444610596, 0.22621703147888184, 0.36197882890701294, 0.49774062633514404, 0.6335020065307617, 0.7692638635635376, 0.9050256609916687, 1.0407874584197998, 1.1765493154525757, 1.3123111724853516, 1.448072910308838, 1.5838347673416138, 1.7195966243743896, 1.8553584814071655, 1.9911203384399414, 2.1268820762634277, 2.262643814086914, 2.3984057903289795, 2.534167528152466, 2.6699295043945312, 2.8056912422180176, 2.941452980041504, 3.0772149562835693, 3.2129766941070557, 3.348738670349121, 3.4845004081726074, 3.6202621459960938, 3.75602388381958, 3.8917858600616455, 4.027547836303711, 4.163309574127197, 4.299071311950684, 4.43483304977417, 4.570594787597656, 4.706357002258301, 4.842118740081787, 4.977880477905273]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 10.0, 11.0, 16.0, 10.0, 21.0, 29.0, 71.0, 116.0, 221.0, 474.0, 950.0, 2753.0, 10563.0, 88091.0, 3967664.0, 106046.0, 12001.0, 2939.0, 1120.0, 490.0, 260.0, 151.0, 82.0, 53.0, 41.0, 33.0, 21.0, 14.0, 7.0, 3.0, 11.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5185546875, -0.494476318359375, -0.47039794921875, -0.446319580078125, -0.4222412109375, -0.398162841796875, -0.37408447265625, -0.350006103515625, -0.325927734375, -0.301849365234375, -0.27777099609375, -0.253692626953125, -0.2296142578125, -0.205535888671875, -0.18145751953125, -0.157379150390625, -0.13330078125, -0.109222412109375, -0.08514404296875, -0.061065673828125, -0.0369873046875, -0.012908935546875, 0.01116943359375, 0.035247802734375, 0.059326171875, 0.083404541015625, 0.10748291015625, 0.131561279296875, 0.1556396484375, 0.179718017578125, 0.20379638671875, 0.227874755859375, 0.251953125, 0.276031494140625, 0.30010986328125, 0.324188232421875, 0.3482666015625, 0.372344970703125, 0.39642333984375, 0.420501708984375, 0.444580078125, 0.468658447265625, 0.49273681640625, 0.516815185546875, 0.5408935546875, 0.564971923828125, 0.58905029296875, 0.613128662109375, 0.63720703125, 0.661285400390625, 0.68536376953125, 0.709442138671875, 0.7335205078125, 0.757598876953125, 0.78167724609375, 0.805755615234375, 0.829833984375, 0.853912353515625, 0.87799072265625, 0.902069091796875, 0.9261474609375, 0.950225830078125, 0.97430419921875, 0.998382568359375, 1.0224609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 7.0, 3.0, 16.0, 25.0, 33.0, 37.0, 78.0, 64.0, 84.0, 101.0, 93.0, 96.0, 79.0, 72.0, 65.0, 48.0, 39.0, 25.0, 13.0, 9.0, 6.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146484375, -0.13861465454101562, -0.13074493408203125, -0.12287521362304688, -0.1150054931640625, -0.10713577270507812, -0.09926605224609375, -0.09139633178710938, -0.083526611328125, -0.07565689086914062, -0.06778717041015625, -0.059917449951171875, -0.0520477294921875, -0.044178009033203125, -0.03630828857421875, -0.028438568115234375, -0.02056884765625, -0.012699127197265625, -0.00482940673828125, 0.003040313720703125, 0.0109100341796875, 0.018779754638671875, 0.02664947509765625, 0.034519195556640625, 0.042388916015625, 0.050258636474609375, 0.05812835693359375, 0.06599807739257812, 0.0738677978515625, 0.08173751831054688, 0.08960723876953125, 0.09747695922851562, 0.1053466796875, 0.11321640014648438, 0.12108612060546875, 0.12895584106445312, 0.1368255615234375, 0.14469528198242188, 0.15256500244140625, 0.16043472290039062, 0.168304443359375, 0.17617416381835938, 0.18404388427734375, 0.19191360473632812, 0.1997833251953125, 0.20765304565429688, 0.21552276611328125, 0.22339248657226562, 0.23126220703125, 0.23913192749023438, 0.24700164794921875, 0.2548713684082031, 0.2627410888671875, 0.2706108093261719, 0.27848052978515625, 0.2863502502441406, 0.294219970703125, 0.3020896911621094, 0.30995941162109375, 0.3178291320800781, 0.3256988525390625, 0.3335685729980469, 0.34143829345703125, 0.3493080139160156, 0.357177734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 7.0, 19.0, 46.0, 85.0, 132.0, 213.0, 378.0, 736.0, 1646.0, 5044.0, 32228.0, 3855073.0, 280317.0, 13150.0, 2823.0, 1136.0, 520.0, 287.0, 159.0, 92.0, 55.0, 46.0, 25.0, 23.0, 12.0, 10.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0390625, -1.0115737915039062, -0.9840850830078125, -0.9565963745117188, -0.929107666015625, -0.9016189575195312, -0.8741302490234375, -0.8466415405273438, -0.81915283203125, -0.7916641235351562, -0.7641754150390625, -0.7366867065429688, -0.709197998046875, -0.6817092895507812, -0.6542205810546875, -0.6267318725585938, -0.5992431640625, -0.5717544555664062, -0.5442657470703125, -0.5167770385742188, -0.489288330078125, -0.46179962158203125, -0.4343109130859375, -0.40682220458984375, -0.37933349609375, -0.35184478759765625, -0.3243560791015625, -0.29686737060546875, -0.269378662109375, -0.24188995361328125, -0.2144012451171875, -0.18691253662109375, -0.159423828125, -0.13193511962890625, -0.1044464111328125, -0.07695770263671875, -0.049468994140625, -0.02198028564453125, 0.0055084228515625, 0.03299713134765625, 0.06048583984375, 0.08797454833984375, 0.1154632568359375, 0.14295196533203125, 0.170440673828125, 0.19792938232421875, 0.2254180908203125, 0.25290679931640625, 0.2803955078125, 0.30788421630859375, 0.3353729248046875, 0.36286163330078125, 0.390350341796875, 0.41783905029296875, 0.4453277587890625, 0.47281646728515625, 0.50030517578125, 0.5277938842773438, 0.5552825927734375, 0.5827713012695312, 0.610260009765625, 0.6377487182617188, 0.6652374267578125, 0.6927261352539062, 0.72021484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 6.0, 4.0, 4.0, 5.0, 10.0, 13.0, 28.0, 45.0, 100.0, 346.0, 2676.0, 595.0, 117.0, 58.0, 21.0, 23.0, 10.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.294921875, -0.2842674255371094, -0.27361297607421875, -0.2629585266113281, -0.2523040771484375, -0.24164962768554688, -0.23099517822265625, -0.22034072875976562, -0.209686279296875, -0.19903182983398438, -0.18837738037109375, -0.17772293090820312, -0.1670684814453125, -0.15641403198242188, -0.14575958251953125, -0.13510513305664062, -0.12445068359375, -0.11379623413085938, -0.10314178466796875, -0.09248733520507812, -0.0818328857421875, -0.07117843627929688, -0.06052398681640625, -0.049869537353515625, -0.039215087890625, -0.028560638427734375, -0.01790618896484375, -0.007251739501953125, 0.0034027099609375, 0.014057159423828125, 0.02471160888671875, 0.035366058349609375, 0.0460205078125, 0.056674957275390625, 0.06732940673828125, 0.07798385620117188, 0.0886383056640625, 0.09929275512695312, 0.10994720458984375, 0.12060165405273438, 0.131256103515625, 0.14191055297851562, 0.15256500244140625, 0.16321945190429688, 0.1738739013671875, 0.18452835083007812, 0.19518280029296875, 0.20583724975585938, 0.21649169921875, 0.22714614868164062, 0.23780059814453125, 0.24845504760742188, 0.2591094970703125, 0.2697639465332031, 0.28041839599609375, 0.2910728454589844, 0.301727294921875, 0.3123817443847656, 0.32303619384765625, 0.3336906433105469, 0.3443450927734375, 0.3549995422363281, 0.36565399169921875, 0.3763084411621094, 0.386962890625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 23.0, 48.0, 141.0, 278.0, 293.0, 140.0, 37.0, 15.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8432812690734863, -2.777459144592285, -2.711637020111084, -2.645815134048462, -2.5799930095672607, -2.5141708850860596, -2.4483487606048584, -2.3825266361236572, -2.316704750061035, -2.250882625579834, -2.185060501098633, -2.1192386150360107, -2.0534164905548096, -1.9875943660736084, -1.9217722415924072, -1.855950117111206, -1.7901279926300049, -1.7243058681488037, -1.658483862876892, -1.592661738395691, -1.5268397331237793, -1.4610176086425781, -1.395195484161377, -1.3293733596801758, -1.2635513544082642, -1.197729229927063, -1.1319072246551514, -1.0660851001739502, -1.000262975692749, -0.9344409704208374, -0.8686188459396362, -0.8027967810630798, -0.7369744777679443, -0.6711524128913879, -0.6053303480148315, -0.5395082235336304, -0.473686158657074, -0.4078640937805176, -0.3420419991016388, -0.27621990442276, -0.2103978395462036, -0.14457575976848602, -0.07875367999076843, -0.012931600213050842, 0.05289047956466675, 0.11871254444122314, 0.18453463912010193, 0.2503567337989807, 0.3161787986755371, 0.3820008635520935, 0.4478229582309723, 0.5136450529098511, 0.5794671177864075, 0.6452891826629639, 0.711111307144165, 0.7769333720207214, 0.8427554368972778, 0.9085775017738342, 0.9743995666503906, 1.0402216911315918, 1.106043815612793, 1.1718658208847046, 1.2376879453659058, 1.3035099506378174, 1.3693320751190186]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 11.0, 17.0, 20.0, 26.0, 26.0, 34.0, 59.0, 71.0, 70.0, 109.0, 75.0, 83.0, 85.0, 82.0, 60.0, 59.0, 36.0, 23.0, 21.0, 11.0, 13.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1679142713546753, -1.1222763061523438, -1.0766383409500122, -1.0310003757476807, -0.9853624105453491, -0.9397244453430176, -0.8940865397453308, -0.8484485745429993, -0.8028106093406677, -0.7571726441383362, -0.7115346789360046, -0.6658967733383179, -0.6202588081359863, -0.5746208429336548, -0.5289828777313232, -0.4833449125289917, -0.43770694732666016, -0.3920689821243286, -0.34643101692199707, -0.3007930815219879, -0.25515511631965637, -0.20951715111732483, -0.16387921571731567, -0.11824125051498413, -0.07260328531265259, -0.026965327560901642, 0.018672630190849304, 0.06431058049201965, 0.1099485456943512, 0.15558651089668274, 0.2012244462966919, 0.24686241149902344, 0.29250025749206543, 0.338138222694397, 0.3837761878967285, 0.42941412329673767, 0.4750520884990692, 0.5206900835037231, 0.5663279891014099, 0.6119659543037415, 0.657603919506073, 0.7032418847084045, 0.7488798499107361, 0.7945177555084229, 0.8401557207107544, 0.8857936859130859, 0.9314316511154175, 0.977069616317749, 1.0227075815200806, 1.068345546722412, 1.1139835119247437, 1.1596214771270752, 1.2052594423294067, 1.2508974075317383, 1.2965352535247803, 1.3421733379364014, 1.3878111839294434, 1.433449149131775, 1.4790871143341064, 1.524725079536438, 1.5703630447387695, 1.616001009941101, 1.6616389751434326, 1.7072768211364746, 1.7529149055480957]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 9.0, 15.0, 20.0, 24.0, 35.0, 42.0, 72.0, 111.0, 183.0, 312.0, 636.0, 1369.0, 3224.0, 8501.0, 26132.0, 97755.0, 446157.0, 354888.0, 75699.0, 20943.0, 7089.0, 2803.0, 1172.0, 522.0, 308.0, 170.0, 104.0, 66.0, 48.0, 31.0, 23.0, 9.0, 18.0, 4.0, 5.0, 5.0, 6.0, 3.0, 5.0, 4.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.626953125, -0.6079025268554688, -0.5888519287109375, -0.5698013305664062, -0.550750732421875, -0.5317001342773438, -0.5126495361328125, -0.49359893798828125, -0.47454833984375, -0.45549774169921875, -0.4364471435546875, -0.41739654541015625, -0.398345947265625, -0.37929534912109375, -0.3602447509765625, -0.34119415283203125, -0.3221435546875, -0.30309295654296875, -0.2840423583984375, -0.26499176025390625, -0.245941162109375, -0.22689056396484375, -0.2078399658203125, -0.18878936767578125, -0.16973876953125, -0.15068817138671875, -0.1316375732421875, -0.11258697509765625, -0.093536376953125, -0.07448577880859375, -0.0554351806640625, -0.03638458251953125, -0.017333984375, 0.00171661376953125, 0.0207672119140625, 0.03981781005859375, 0.058868408203125, 0.07791900634765625, 0.0969696044921875, 0.11602020263671875, 0.13507080078125, 0.15412139892578125, 0.1731719970703125, 0.19222259521484375, 0.211273193359375, 0.23032379150390625, 0.2493743896484375, 0.26842498779296875, 0.2874755859375, 0.30652618408203125, 0.3255767822265625, 0.34462738037109375, 0.363677978515625, 0.38272857666015625, 0.4017791748046875, 0.42082977294921875, 0.43988037109375, 0.45893096923828125, 0.4779815673828125, 0.49703216552734375, 0.516082763671875, 0.5351333618164062, 0.5541839599609375, 0.5732345581054688, 0.59228515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 2.0, 10.0, 10.0, 10.0, 39.0, 44.0, 64.0, 63.0, 56.0, 80.0, 109.0, 82.0, 99.0, 71.0, 65.0, 51.0, 39.0, 37.0, 26.0, 13.0, 12.0, 7.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14599609375, -0.13876724243164062, -0.13153839111328125, -0.12430953979492188, -0.1170806884765625, -0.10985183715820312, -0.10262298583984375, -0.09539413452148438, -0.088165283203125, -0.08093643188476562, -0.07370758056640625, -0.06647872924804688, -0.0592498779296875, -0.052021026611328125, -0.04479217529296875, -0.037563323974609375, -0.03033447265625, -0.023105621337890625, -0.01587677001953125, -0.008647918701171875, -0.0014190673828125, 0.005809783935546875, 0.01303863525390625, 0.020267486572265625, 0.027496337890625, 0.034725189208984375, 0.04195404052734375, 0.049182891845703125, 0.0564117431640625, 0.06364059448242188, 0.07086944580078125, 0.07809829711914062, 0.0853271484375, 0.09255599975585938, 0.09978485107421875, 0.10701370239257812, 0.1142425537109375, 0.12147140502929688, 0.12870025634765625, 0.13592910766601562, 0.143157958984375, 0.15038681030273438, 0.15761566162109375, 0.16484451293945312, 0.1720733642578125, 0.17930221557617188, 0.18653106689453125, 0.19375991821289062, 0.20098876953125, 0.20821762084960938, 0.21544647216796875, 0.22267532348632812, 0.2299041748046875, 0.23713302612304688, 0.24436187744140625, 0.2515907287597656, 0.258819580078125, 0.2660484313964844, 0.27327728271484375, 0.2805061340332031, 0.2877349853515625, 0.2949638366699219, 0.30219268798828125, 0.3094215393066406, 0.316650390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 8.0, 5.0, 13.0, 24.0, 26.0, 41.0, 67.0, 106.0, 124.0, 237.0, 290.0, 578.0, 901.0, 1601.0, 2987.0, 5597.0, 11595.0, 25743.0, 63298.0, 180797.0, 404174.0, 218566.0, 74688.0, 29811.0, 13179.0, 6362.0, 3307.0, 1827.0, 952.0, 584.0, 355.0, 248.0, 120.0, 100.0, 70.0, 57.0, 40.0, 15.0, 9.0, 9.0, 10.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.345703125, -0.3344001770019531, -0.32309722900390625, -0.3117942810058594, -0.3004913330078125, -0.2891883850097656, -0.27788543701171875, -0.2665824890136719, -0.255279541015625, -0.24397659301757812, -0.23267364501953125, -0.22137069702148438, -0.2100677490234375, -0.19876480102539062, -0.18746185302734375, -0.17615890502929688, -0.16485595703125, -0.15355300903320312, -0.14225006103515625, -0.13094711303710938, -0.1196441650390625, -0.10834121704101562, -0.09703826904296875, -0.08573532104492188, -0.074432373046875, -0.06312942504882812, -0.05182647705078125, -0.040523529052734375, -0.0292205810546875, -0.017917633056640625, -0.00661468505859375, 0.004688262939453125, 0.0159912109375, 0.027294158935546875, 0.03859710693359375, 0.049900054931640625, 0.0612030029296875, 0.07250595092773438, 0.08380889892578125, 0.09511184692382812, 0.106414794921875, 0.11771774291992188, 0.12902069091796875, 0.14032363891601562, 0.1516265869140625, 0.16292953491210938, 0.17423248291015625, 0.18553543090820312, 0.19683837890625, 0.20814132690429688, 0.21944427490234375, 0.23074722290039062, 0.2420501708984375, 0.2533531188964844, 0.26465606689453125, 0.2759590148925781, 0.287261962890625, 0.2985649108886719, 0.30986785888671875, 0.3211708068847656, 0.3324737548828125, 0.3437767028808594, 0.35507965087890625, 0.3663825988769531, 0.377685546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 5.0, 8.0, 12.0, 5.0, 16.0, 17.0, 17.0, 19.0, 28.0, 28.0, 36.0, 39.0, 32.0, 35.0, 46.0, 46.0, 52.0, 48.0, 42.0, 47.0, 57.0, 43.0, 45.0, 39.0, 26.0, 36.0, 28.0, 32.0, 25.0, 17.0, 20.0, 17.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.542205810546875, -0.52386474609375, -0.505523681640625, -0.4871826171875, -0.468841552734375, -0.45050048828125, -0.432159423828125, -0.413818359375, -0.395477294921875, -0.37713623046875, -0.358795166015625, -0.3404541015625, -0.322113037109375, -0.30377197265625, -0.285430908203125, -0.26708984375, -0.248748779296875, -0.23040771484375, -0.212066650390625, -0.1937255859375, -0.175384521484375, -0.15704345703125, -0.138702392578125, -0.120361328125, -0.102020263671875, -0.08367919921875, -0.065338134765625, -0.0469970703125, -0.028656005859375, -0.01031494140625, 0.008026123046875, 0.0263671875, 0.044708251953125, 0.06304931640625, 0.081390380859375, 0.0997314453125, 0.118072509765625, 0.13641357421875, 0.154754638671875, 0.173095703125, 0.191436767578125, 0.20977783203125, 0.228118896484375, 0.2464599609375, 0.264801025390625, 0.28314208984375, 0.301483154296875, 0.31982421875, 0.338165283203125, 0.35650634765625, 0.374847412109375, 0.3931884765625, 0.411529541015625, 0.42987060546875, 0.448211669921875, 0.466552734375, 0.484893798828125, 0.50323486328125, 0.521575927734375, 0.5399169921875, 0.558258056640625, 0.57659912109375, 0.594940185546875, 0.61328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 12.0, 7.0, 15.0, 24.0, 51.0, 67.0, 139.0, 276.0, 575.0, 1470.0, 4763.0, 27533.0, 357622.0, 594042.0, 51391.0, 7161.0, 1968.0, 750.0, 306.0, 184.0, 74.0, 49.0, 27.0, 19.0, 9.0, 9.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2093505859375, -0.20163536071777344, -0.19392013549804688, -0.1862049102783203, -0.17848968505859375, -0.1707744598388672, -0.16305923461914062, -0.15534400939941406, -0.1476287841796875, -0.13991355895996094, -0.13219833374023438, -0.12448310852050781, -0.11676788330078125, -0.10905265808105469, -0.10133743286132812, -0.09362220764160156, -0.085906982421875, -0.07819175720214844, -0.07047653198242188, -0.06276130676269531, -0.05504608154296875, -0.04733085632324219, -0.039615631103515625, -0.03190040588378906, -0.0241851806640625, -0.016469955444335938, -0.008754730224609375, -0.0010395050048828125, 0.00667572021484375, 0.014390945434570312, 0.022106170654296875, 0.029821395874023438, 0.03753662109375, 0.04525184631347656, 0.052967071533203125, 0.06068229675292969, 0.06839752197265625, 0.07611274719238281, 0.08382797241210938, 0.09154319763183594, 0.0992584228515625, 0.10697364807128906, 0.11468887329101562, 0.12240409851074219, 0.13011932373046875, 0.1378345489501953, 0.14554977416992188, 0.15326499938964844, 0.160980224609375, 0.16869544982910156, 0.17641067504882812, 0.1841259002685547, 0.19184112548828125, 0.1995563507080078, 0.20727157592773438, 0.21498680114746094, 0.2227020263671875, 0.23041725158691406, 0.23813247680664062, 0.2458477020263672, 0.25356292724609375, 0.2612781524658203, 0.2689933776855469, 0.27670860290527344, 0.284423828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 21.0, 38.0, 53.0, 135.0, 178.0, 202.0, 160.0, 114.0, 54.0, 26.0, 14.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849102020263672e-05, -2.675037831068039e-05, -2.500973641872406e-05, -2.326909452676773e-05, -2.15284526348114e-05, -1.9787810742855072e-05, -1.8047168850898743e-05, -1.6306526958942413e-05, -1.4565885066986084e-05, -1.2825243175029755e-05, -1.1084601283073425e-05, -9.343959391117096e-06, -7.603317499160767e-06, -5.862675607204437e-06, -4.122033715248108e-06, -2.3813918232917786e-06, -6.407499313354492e-07, 1.0998919606208801e-06, 2.8405338525772095e-06, 4.581175744533539e-06, 6.321817636489868e-06, 8.062459528446198e-06, 9.803101420402527e-06, 1.1543743312358856e-05, 1.3284385204315186e-05, 1.5025027096271515e-05, 1.6765668988227844e-05, 1.8506310880184174e-05, 2.0246952772140503e-05, 2.1987594664096832e-05, 2.372823655605316e-05, 2.546887844800949e-05, 2.720952033996582e-05, 2.895016223192215e-05, 3.069080412387848e-05, 3.243144601583481e-05, 3.417208790779114e-05, 3.591272979974747e-05, 3.7653371691703796e-05, 3.9394013583660126e-05, 4.1134655475616455e-05, 4.2875297367572784e-05, 4.4615939259529114e-05, 4.635658115148544e-05, 4.809722304344177e-05, 4.98378649353981e-05, 5.157850682735443e-05, 5.331914871931076e-05, 5.505979061126709e-05, 5.680043250322342e-05, 5.854107439517975e-05, 6.028171628713608e-05, 6.202235817909241e-05, 6.376300007104874e-05, 6.550364196300507e-05, 6.72442838549614e-05, 6.898492574691772e-05, 7.072556763887405e-05, 7.246620953083038e-05, 7.420685142278671e-05, 7.594749331474304e-05, 7.768813520669937e-05, 7.94287770986557e-05, 8.116941899061203e-05, 8.291006088256836e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 18.0, 15.0, 48.0, 59.0, 91.0, 214.0, 527.0, 1468.0, 5365.0, 30572.0, 386623.0, 565807.0, 47647.0, 7081.0, 1790.0, 606.0, 249.0, 143.0, 68.0, 41.0, 32.0, 18.0, 17.0, 13.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2769584655761719, -0.26949310302734375, -0.2620277404785156, -0.2545623779296875, -0.24709701538085938, -0.23963165283203125, -0.23216629028320312, -0.224700927734375, -0.21723556518554688, -0.20977020263671875, -0.20230484008789062, -0.1948394775390625, -0.18737411499023438, -0.17990875244140625, -0.17244338989257812, -0.16497802734375, -0.15751266479492188, -0.15004730224609375, -0.14258193969726562, -0.1351165771484375, -0.12765121459960938, -0.12018585205078125, -0.11272048950195312, -0.105255126953125, -0.09778976440429688, -0.09032440185546875, -0.08285903930664062, -0.0753936767578125, -0.06792831420898438, -0.06046295166015625, -0.052997589111328125, -0.0455322265625, -0.038066864013671875, -0.03060150146484375, -0.023136138916015625, -0.0156707763671875, -0.008205413818359375, -0.00074005126953125, 0.006725311279296875, 0.014190673828125, 0.021656036376953125, 0.02912139892578125, 0.036586761474609375, 0.0440521240234375, 0.051517486572265625, 0.05898284912109375, 0.06644821166992188, 0.07391357421875, 0.08137893676757812, 0.08884429931640625, 0.09630966186523438, 0.1037750244140625, 0.11124038696289062, 0.11870574951171875, 0.12617111206054688, 0.133636474609375, 0.14110183715820312, 0.14856719970703125, 0.15603256225585938, 0.1634979248046875, 0.17096328735351562, 0.17842864990234375, 0.18589401245117188, 0.193359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 10.0, 17.0, 22.0, 36.0, 45.0, 74.0, 85.0, 88.0, 110.0, 118.0, 86.0, 69.0, 75.0, 28.0, 30.0, 21.0, 25.0, 15.0, 9.0, 5.0, 5.0, 3.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1976318359375, -0.19101715087890625, -0.1844024658203125, -0.17778778076171875, -0.171173095703125, -0.16455841064453125, -0.1579437255859375, -0.15132904052734375, -0.14471435546875, -0.13809967041015625, -0.1314849853515625, -0.12487030029296875, -0.118255615234375, -0.11164093017578125, -0.1050262451171875, -0.09841156005859375, -0.091796875, -0.08518218994140625, -0.0785675048828125, -0.07195281982421875, -0.065338134765625, -0.05872344970703125, -0.0521087646484375, -0.04549407958984375, -0.03887939453125, -0.03226470947265625, -0.0256500244140625, -0.01903533935546875, -0.012420654296875, -0.00580596923828125, 0.0008087158203125, 0.00742340087890625, 0.0140380859375, 0.02065277099609375, 0.0272674560546875, 0.03388214111328125, 0.040496826171875, 0.04711151123046875, 0.0537261962890625, 0.06034088134765625, 0.06695556640625, 0.07357025146484375, 0.0801849365234375, 0.08679962158203125, 0.093414306640625, 0.10002899169921875, 0.1066436767578125, 0.11325836181640625, 0.119873046875, 0.12648773193359375, 0.1331024169921875, 0.13971710205078125, 0.146331787109375, 0.15294647216796875, 0.1595611572265625, 0.16617584228515625, 0.17279052734375, 0.17940521240234375, 0.1860198974609375, 0.19263458251953125, 0.199249267578125, 0.20586395263671875, 0.2124786376953125, 0.21909332275390625, 0.2257080078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 21.0, 80.0, 295.0, 459.0, 107.0, 32.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.836428642272949, -6.480191707611084, -6.123955249786377, -5.767718315124512, -5.411481857299805, -5.0552449226379395, -4.699007987976074, -4.342771530151367, -3.986534833908081, -3.630298137664795, -3.274061441421509, -2.9178247451782227, -2.5615878105163574, -2.2053513526916504, -1.8491144180297852, -1.492877721786499, -1.136641025543213, -0.7804043292999268, -0.42416757345199585, -0.06793081760406494, 0.2883058786392212, 0.6445425748825073, 1.000779390335083, 1.3570160865783691, 1.7132527828216553, 2.0694894790649414, 2.4257261753082275, 2.7819628715515137, 3.138199806213379, 3.494436264038086, 3.850673198699951, 4.206910133361816, 4.563146591186523, 4.919383525848389, 5.275619983673096, 5.631856918334961, 5.988093376159668, 6.344330310821533, 6.700567245483398, 7.0568037033081055, 7.4130401611328125, 7.769277095794678, 8.125514030456543, 8.48175048828125, 8.837986946105957, 9.194223403930664, 9.550460815429688, 9.906697273254395, 10.262933731079102, 10.619170188903809, 10.975407600402832, 11.331644058227539, 11.687880516052246, 12.044116973876953, 12.400354385375977, 12.756590843200684, 13.112828254699707, 13.469064712524414, 13.825302124023438, 14.181538581848145, 14.537775039672852, 14.894011497497559, 15.250248908996582, 15.606485366821289, 15.962721824645996]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 12.0, 17.0, 16.0, 24.0, 14.0, 30.0, 28.0, 29.0, 42.0, 32.0, 44.0, 47.0, 51.0, 66.0, 37.0, 42.0, 59.0, 48.0, 54.0, 36.0, 42.0, 33.0, 28.0, 24.0, 20.0, 22.0, 18.0, 18.0, 9.0, 9.0, 8.0, 6.0, 7.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7749481201171875, -3.656970500946045, -3.5389928817749023, -3.421015501022339, -3.3030378818511963, -3.1850602626800537, -3.067082643508911, -2.9491052627563477, -2.831127643585205, -2.7131500244140625, -2.59517240524292, -2.4771950244903564, -2.359217405319214, -2.2412397861480713, -2.1232621669769287, -2.0052847862243652, -1.887307047843933, -1.7693294286727905, -1.6513519287109375, -1.533374309539795, -1.415396809577942, -1.2974191904067993, -1.1794416904449463, -1.0614640712738037, -0.9434865117073059, -0.8255089521408081, -0.7075313925743103, -0.5895538330078125, -0.4715762436389923, -0.3535986542701721, -0.23562109470367432, -0.11764353513717651, 0.00033402442932128906, 0.11831159144639969, 0.2362891584634781, 0.3542667329311371, 0.4722442924976349, 0.5902218818664551, 0.7081994414329529, 0.8261770009994507, 0.9441545605659485, 1.0621321201324463, 1.1801097393035889, 1.298087239265442, 1.4160648584365845, 1.5340423583984375, 1.65201997756958, 1.7699975967407227, 1.8879750967025757, 2.0059525966644287, 2.1239302158355713, 2.241907835006714, 2.3598854541778564, 2.47786283493042, 2.5958404541015625, 2.713818073272705, 2.8317956924438477, 2.9497733116149902, 3.067750930786133, 3.1857283115386963, 3.303705930709839, 3.4216835498809814, 3.539661169052124, 3.6576385498046875, 3.77561616897583]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 17.0, 18.0, 43.0, 59.0, 100.0, 165.0, 368.0, 945.0, 2746.0, 15327.0, 3808720.0, 351967.0, 9937.0, 2220.0, 823.0, 362.0, 176.0, 100.0, 65.0, 31.0, 25.0, 14.0, 15.0, 9.0, 8.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88134765625, -0.8370437622070312, -0.7927398681640625, -0.7484359741210938, -0.704132080078125, -0.6598281860351562, -0.6155242919921875, -0.5712203979492188, -0.52691650390625, -0.48261260986328125, -0.4383087158203125, -0.39400482177734375, -0.349700927734375, -0.30539703369140625, -0.2610931396484375, -0.21678924560546875, -0.1724853515625, -0.12818145751953125, -0.0838775634765625, -0.03957366943359375, 0.004730224609375, 0.04903411865234375, 0.0933380126953125, 0.13764190673828125, 0.18194580078125, 0.22624969482421875, 0.2705535888671875, 0.31485748291015625, 0.359161376953125, 0.40346527099609375, 0.4477691650390625, 0.49207305908203125, 0.536376953125, 0.5806808471679688, 0.6249847412109375, 0.6692886352539062, 0.713592529296875, 0.7578964233398438, 0.8022003173828125, 0.8465042114257812, 0.89080810546875, 0.9351119995117188, 0.9794158935546875, 1.0237197875976562, 1.068023681640625, 1.1123275756835938, 1.1566314697265625, 1.2009353637695312, 1.2452392578125, 1.2895431518554688, 1.3338470458984375, 1.3781509399414062, 1.422454833984375, 1.4667587280273438, 1.5110626220703125, 1.5553665161132812, 1.59967041015625, 1.6439743041992188, 1.6882781982421875, 1.7325820922851562, 1.776885986328125, 1.8211898803710938, 1.8654937744140625, 1.9097976684570312, 1.9541015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 10.0, 9.0, 16.0, 29.0, 28.0, 37.0, 44.0, 50.0, 62.0, 67.0, 73.0, 85.0, 63.0, 61.0, 63.0, 67.0, 59.0, 32.0, 32.0, 24.0, 24.0, 23.0, 14.0, 10.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.14116477966308594, -0.13376998901367188, -0.1263751983642578, -0.11898040771484375, -0.11158561706542969, -0.10419082641601562, -0.09679603576660156, -0.0894012451171875, -0.08200645446777344, -0.07461166381835938, -0.06721687316894531, -0.05982208251953125, -0.05242729187011719, -0.045032501220703125, -0.03763771057128906, -0.030242919921875, -0.022848129272460938, -0.015453338623046875, -0.008058547973632812, -0.00066375732421875, 0.0067310333251953125, 0.014125823974609375, 0.021520614624023438, 0.0289154052734375, 0.03631019592285156, 0.043704986572265625, 0.05109977722167969, 0.05849456787109375, 0.06588935852050781, 0.07328414916992188, 0.08067893981933594, 0.08807373046875, 0.09546852111816406, 0.10286331176757812, 0.11025810241699219, 0.11765289306640625, 0.1250476837158203, 0.13244247436523438, 0.13983726501464844, 0.1472320556640625, 0.15462684631347656, 0.16202163696289062, 0.1694164276123047, 0.17681121826171875, 0.1842060089111328, 0.19160079956054688, 0.19899559020996094, 0.206390380859375, 0.21378517150878906, 0.22117996215820312, 0.2285747528076172, 0.23596954345703125, 0.2433643341064453, 0.2507591247558594, 0.25815391540527344, 0.2655487060546875, 0.27294349670410156, 0.2803382873535156, 0.2877330780029297, 0.29512786865234375, 0.3025226593017578, 0.3099174499511719, 0.31731224060058594, 0.32470703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 13.0, 20.0, 46.0, 102.0, 197.0, 383.0, 929.0, 3065.0, 20925.0, 3953860.0, 203971.0, 7952.0, 1615.0, 599.0, 272.0, 150.0, 75.0, 58.0, 26.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0278778076171875, -0.986419677734375, -0.9449615478515625, -0.90350341796875, -0.8620452880859375, -0.820587158203125, -0.7791290283203125, -0.7376708984375, -0.6962127685546875, -0.654754638671875, -0.6132965087890625, -0.57183837890625, -0.5303802490234375, -0.488922119140625, -0.4474639892578125, -0.406005859375, -0.3645477294921875, -0.323089599609375, -0.2816314697265625, -0.24017333984375, -0.1987152099609375, -0.157257080078125, -0.1157989501953125, -0.0743408203125, -0.0328826904296875, 0.008575439453125, 0.0500335693359375, 0.09149169921875, 0.1329498291015625, 0.174407958984375, 0.2158660888671875, 0.25732421875, 0.2987823486328125, 0.340240478515625, 0.3816986083984375, 0.42315673828125, 0.4646148681640625, 0.506072998046875, 0.5475311279296875, 0.5889892578125, 0.6304473876953125, 0.671905517578125, 0.7133636474609375, 0.75482177734375, 0.7962799072265625, 0.837738037109375, 0.8791961669921875, 0.920654296875, 0.9621124267578125, 1.003570556640625, 1.0450286865234375, 1.08648681640625, 1.1279449462890625, 1.169403076171875, 1.2108612060546875, 1.2523193359375, 1.2937774658203125, 1.335235595703125, 1.3766937255859375, 1.41815185546875, 1.4596099853515625, 1.501068115234375, 1.5425262451171875, 1.583984375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 13.0, 22.0, 26.0, 65.0, 203.0, 2129.0, 1280.0, 172.0, 58.0, 36.0, 23.0, 14.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5027847290039062, -0.4865264892578125, -0.47026824951171875, -0.454010009765625, -0.43775177001953125, -0.4214935302734375, -0.40523529052734375, -0.38897705078125, -0.37271881103515625, -0.3564605712890625, -0.34020233154296875, -0.323944091796875, -0.30768585205078125, -0.2914276123046875, -0.27516937255859375, -0.2589111328125, -0.24265289306640625, -0.2263946533203125, -0.21013641357421875, -0.193878173828125, -0.17761993408203125, -0.1613616943359375, -0.14510345458984375, -0.12884521484375, -0.11258697509765625, -0.0963287353515625, -0.08007049560546875, -0.063812255859375, -0.04755401611328125, -0.0312957763671875, -0.01503753662109375, 0.001220703125, 0.01747894287109375, 0.0337371826171875, 0.04999542236328125, 0.066253662109375, 0.08251190185546875, 0.0987701416015625, 0.11502838134765625, 0.13128662109375, 0.14754486083984375, 0.1638031005859375, 0.18006134033203125, 0.196319580078125, 0.21257781982421875, 0.2288360595703125, 0.24509429931640625, 0.2613525390625, 0.27761077880859375, 0.2938690185546875, 0.31012725830078125, 0.326385498046875, 0.34264373779296875, 0.3589019775390625, 0.37516021728515625, 0.39141845703125, 0.40767669677734375, 0.4239349365234375, 0.44019317626953125, 0.456451416015625, 0.47270965576171875, 0.4889678955078125, 0.5052261352539062, 0.521484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 28.0, 201.0, 637.0, 116.0, 16.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-11.237338066101074, -11.038126945495605, -10.838916778564453, -10.639705657958984, -10.440495491027832, -10.241284370422363, -10.042074203491211, -9.842863082885742, -9.643651962280273, -9.444440841674805, -9.245230674743652, -9.046019554138184, -8.846809387207031, -8.647598266601562, -8.44838809967041, -8.249176979064941, -8.049966812133789, -7.8507561683654785, -7.651545524597168, -7.452334880828857, -7.253124237060547, -7.053913116455078, -6.854702472686768, -6.655491828918457, -6.4562811851501465, -6.257070541381836, -6.057859897613525, -5.858649253845215, -5.659438133239746, -5.4602274894714355, -5.261016845703125, -5.0618062019348145, -4.862595081329346, -4.663384437561035, -4.464173793792725, -4.264963150024414, -4.065752029418945, -3.866541624069214, -3.667330741882324, -3.4681200981140137, -3.268909454345703, -3.0696988105773926, -2.870488166809082, -2.6712772846221924, -2.472066640853882, -2.2728559970855713, -2.0736451148986816, -1.874434471130371, -1.6752238273620605, -1.47601318359375, -1.27680242061615, -1.0775916576385498, -0.8783810138702393, -0.6791703104972839, -0.4799596071243286, -0.2807488441467285, -0.08153820037841797, 0.11767250299453735, 0.3168832063674927, 0.516093909740448, 0.7153046131134033, 0.9145153164863586, 1.113726019859314, 1.312936782836914, 1.5121474266052246]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 10.0, 6.0, 23.0, 21.0, 24.0, 34.0, 24.0, 31.0, 42.0, 51.0, 46.0, 64.0, 52.0, 60.0, 58.0, 50.0, 56.0, 50.0, 51.0, 46.0, 32.0, 28.0, 26.0, 27.0, 17.0, 18.0, 9.0, 8.0, 10.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.520456075668335, -1.4812712669372559, -1.4420864582061768, -1.4029016494750977, -1.3637168407440186, -1.3245320320129395, -1.2853472232818604, -1.2461625337600708, -1.2069777250289917, -1.1677929162979126, -1.1286081075668335, -1.0894232988357544, -1.0502384901046753, -1.0110538005828857, -0.9718689322471619, -0.9326841831207275, -0.8934993147850037, -0.8543145060539246, -0.8151296973228455, -0.7759449481964111, -0.736760139465332, -0.6975753307342529, -0.6583905220031738, -0.6192057132720947, -0.5800209045410156, -0.5408360958099365, -0.5016512870788574, -0.4624665081501007, -0.423281729221344, -0.3840969204902649, -0.3449121117591858, -0.3057273328304291, -0.26654261350631714, -0.22735781967639923, -0.18817302584648132, -0.14898821711540222, -0.10980342328548431, -0.0706186294555664, -0.031433820724487305, 0.007750958204269409, 0.04693576693534851, 0.08612056076526642, 0.12530535459518433, 0.16449016332626343, 0.20367495715618134, 0.24285975098609924, 0.28204455971717834, 0.32122933864593506, 0.36041414737701416, 0.39959895610809326, 0.43878373503685, 0.4779685437679291, 0.5171533226966858, 0.5563381314277649, 0.595522940158844, 0.6347076892852783, 0.6738924980163574, 0.7130773067474365, 0.7522621154785156, 0.7914469242095947, 0.830631673336029, 0.8698164820671082, 0.9090012907981873, 0.9481860399246216, 0.9873709082603455]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 11.0, 11.0, 23.0, 27.0, 44.0, 84.0, 115.0, 179.0, 251.0, 468.0, 890.0, 1895.0, 4348.0, 10882.0, 33016.0, 120173.0, 529693.0, 258169.0, 58105.0, 18112.0, 6599.0, 2611.0, 1290.0, 661.0, 347.0, 207.0, 106.0, 74.0, 42.0, 34.0, 35.0, 14.0, 12.0, 13.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5654296875, -0.54345703125, -0.521484375, -0.49951171875, -0.4775390625, -0.45556640625, -0.43359375, -0.41162109375, -0.3896484375, -0.36767578125, -0.345703125, -0.32373046875, -0.3017578125, -0.27978515625, -0.2578125, -0.23583984375, -0.2138671875, -0.19189453125, -0.169921875, -0.14794921875, -0.1259765625, -0.10400390625, -0.08203125, -0.06005859375, -0.0380859375, -0.01611328125, 0.005859375, 0.02783203125, 0.0498046875, 0.07177734375, 0.09375, 0.11572265625, 0.1376953125, 0.15966796875, 0.181640625, 0.20361328125, 0.2255859375, 0.24755859375, 0.26953125, 0.29150390625, 0.3134765625, 0.33544921875, 0.357421875, 0.37939453125, 0.4013671875, 0.42333984375, 0.4453125, 0.46728515625, 0.4892578125, 0.51123046875, 0.533203125, 0.55517578125, 0.5771484375, 0.59912109375, 0.62109375, 0.64306640625, 0.6650390625, 0.68701171875, 0.708984375, 0.73095703125, 0.7529296875, 0.77490234375, 0.796875, 0.81884765625, 0.8408203125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 14.0, 22.0, 34.0, 25.0, 23.0, 28.0, 35.0, 35.0, 40.0, 59.0, 52.0, 55.0, 55.0, 62.0, 56.0, 58.0, 57.0, 39.0, 35.0, 45.0, 29.0, 32.0, 17.0, 13.0, 20.0, 9.0, 13.0, 8.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.151611328125, -0.14554595947265625, -0.1394805908203125, -0.13341522216796875, -0.127349853515625, -0.12128448486328125, -0.1152191162109375, -0.10915374755859375, -0.10308837890625, -0.09702301025390625, -0.0909576416015625, -0.08489227294921875, -0.078826904296875, -0.07276153564453125, -0.0666961669921875, -0.06063079833984375, -0.0545654296875, -0.04850006103515625, -0.0424346923828125, -0.03636932373046875, -0.030303955078125, -0.02423858642578125, -0.0181732177734375, -0.01210784912109375, -0.00604248046875, 2.288818359375e-05, 0.0060882568359375, 0.01215362548828125, 0.018218994140625, 0.02428436279296875, 0.0303497314453125, 0.03641510009765625, 0.04248046875, 0.04854583740234375, 0.0546112060546875, 0.06067657470703125, 0.066741943359375, 0.07280731201171875, 0.0788726806640625, 0.08493804931640625, 0.09100341796875, 0.09706878662109375, 0.1031341552734375, 0.10919952392578125, 0.115264892578125, 0.12133026123046875, 0.1273956298828125, 0.13346099853515625, 0.1395263671875, 0.14559173583984375, 0.1516571044921875, 0.15772247314453125, 0.163787841796875, 0.16985321044921875, 0.1759185791015625, 0.18198394775390625, 0.18804931640625, 0.19411468505859375, 0.2001800537109375, 0.20624542236328125, 0.212310791015625, 0.21837615966796875, 0.2244415283203125, 0.23050689697265625, 0.236572265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 3.0, 7.0, 7.0, 7.0, 14.0, 7.0, 12.0, 23.0, 30.0, 40.0, 58.0, 77.0, 118.0, 255.0, 414.0, 785.0, 1736.0, 4224.0, 12335.0, 43323.0, 217363.0, 600549.0, 124059.0, 28368.0, 8643.0, 3155.0, 1398.0, 639.0, 317.0, 207.0, 135.0, 76.0, 40.0, 34.0, 15.0, 14.0, 14.0, 13.0, 8.0, 7.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67578125, -0.6535110473632812, -0.6312408447265625, -0.6089706420898438, -0.586700439453125, -0.5644302368164062, -0.5421600341796875, -0.5198898315429688, -0.49761962890625, -0.47534942626953125, -0.4530792236328125, -0.43080902099609375, -0.408538818359375, -0.38626861572265625, -0.3639984130859375, -0.34172821044921875, -0.3194580078125, -0.29718780517578125, -0.2749176025390625, -0.25264739990234375, -0.230377197265625, -0.20810699462890625, -0.1858367919921875, -0.16356658935546875, -0.14129638671875, -0.11902618408203125, -0.0967559814453125, -0.07448577880859375, -0.052215576171875, -0.02994537353515625, -0.0076751708984375, 0.01459503173828125, 0.036865234375, 0.05913543701171875, 0.0814056396484375, 0.10367584228515625, 0.125946044921875, 0.14821624755859375, 0.1704864501953125, 0.19275665283203125, 0.21502685546875, 0.23729705810546875, 0.2595672607421875, 0.28183746337890625, 0.304107666015625, 0.32637786865234375, 0.3486480712890625, 0.37091827392578125, 0.3931884765625, 0.41545867919921875, 0.4377288818359375, 0.45999908447265625, 0.482269287109375, 0.5045394897460938, 0.5268096923828125, 0.5490798950195312, 0.57135009765625, 0.5936203002929688, 0.6158905029296875, 0.6381607055664062, 0.660430908203125, 0.6827011108398438, 0.7049713134765625, 0.7272415161132812, 0.74951171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 10.0, 11.0, 13.0, 18.0, 24.0, 16.0, 25.0, 28.0, 37.0, 41.0, 43.0, 59.0, 39.0, 48.0, 57.0, 55.0, 51.0, 51.0, 40.0, 40.0, 38.0, 45.0, 33.0, 31.0, 22.0, 18.0, 24.0, 12.0, 8.0, 7.0, 10.0, 9.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.78955078125, -0.7642898559570312, -0.7390289306640625, -0.7137680053710938, -0.688507080078125, -0.6632461547851562, -0.6379852294921875, -0.6127243041992188, -0.58746337890625, -0.5622024536132812, -0.5369415283203125, -0.5116806030273438, -0.486419677734375, -0.46115875244140625, -0.4358978271484375, -0.41063690185546875, -0.3853759765625, -0.36011505126953125, -0.3348541259765625, -0.30959320068359375, -0.284332275390625, -0.25907135009765625, -0.2338104248046875, -0.20854949951171875, -0.18328857421875, -0.15802764892578125, -0.1327667236328125, -0.10750579833984375, -0.082244873046875, -0.05698394775390625, -0.0317230224609375, -0.00646209716796875, 0.018798828125, 0.04405975341796875, 0.0693206787109375, 0.09458160400390625, 0.119842529296875, 0.14510345458984375, 0.1703643798828125, 0.19562530517578125, 0.22088623046875, 0.24614715576171875, 0.2714080810546875, 0.29666900634765625, 0.321929931640625, 0.34719085693359375, 0.3724517822265625, 0.39771270751953125, 0.4229736328125, 0.44823455810546875, 0.4734954833984375, 0.49875640869140625, 0.524017333984375, 0.5492782592773438, 0.5745391845703125, 0.5998001098632812, 0.62506103515625, 0.6503219604492188, 0.6755828857421875, 0.7008438110351562, 0.726104736328125, 0.7513656616210938, 0.7766265869140625, 0.8018875122070312, 0.8271484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 5.0, 12.0, 13.0, 45.0, 145.0, 375.0, 1438.0, 20299.0, 1013143.0, 11538.0, 1061.0, 278.0, 120.0, 43.0, 14.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.230377197265625, -1.19122314453125, -1.152069091796875, -1.1129150390625, -1.073760986328125, -1.03460693359375, -0.995452880859375, -0.956298828125, -0.917144775390625, -0.87799072265625, -0.838836669921875, -0.7996826171875, -0.760528564453125, -0.72137451171875, -0.682220458984375, -0.64306640625, -0.603912353515625, -0.56475830078125, -0.525604248046875, -0.4864501953125, -0.447296142578125, -0.40814208984375, -0.368988037109375, -0.329833984375, -0.290679931640625, -0.25152587890625, -0.212371826171875, -0.1732177734375, -0.134063720703125, -0.09490966796875, -0.055755615234375, -0.0166015625, 0.022552490234375, 0.06170654296875, 0.100860595703125, 0.1400146484375, 0.179168701171875, 0.21832275390625, 0.257476806640625, 0.296630859375, 0.335784912109375, 0.37493896484375, 0.414093017578125, 0.4532470703125, 0.492401123046875, 0.53155517578125, 0.570709228515625, 0.60986328125, 0.649017333984375, 0.68817138671875, 0.727325439453125, 0.7664794921875, 0.805633544921875, 0.84478759765625, 0.883941650390625, 0.923095703125, 0.962249755859375, 1.00140380859375, 1.040557861328125, 1.0797119140625, 1.118865966796875, 1.15802001953125, 1.197174072265625, 1.236328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 8.0, 26.0, 37.0, 48.0, 88.0, 135.0, 168.0, 166.0, 104.0, 78.0, 51.0, 20.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1975250244140625e-05, -5.034264177083969e-05, -4.871003329753876e-05, -4.7077424824237823e-05, -4.544481635093689e-05, -4.3812207877635956e-05, -4.217959940433502e-05, -4.054699093103409e-05, -3.8914382457733154e-05, -3.728177398443222e-05, -3.564916551113129e-05, -3.401655703783035e-05, -3.238394856452942e-05, -3.0751340091228485e-05, -2.911873161792755e-05, -2.7486123144626617e-05, -2.5853514671325684e-05, -2.422090619802475e-05, -2.2588297724723816e-05, -2.0955689251422882e-05, -1.9323080778121948e-05, -1.7690472304821014e-05, -1.605786383152008e-05, -1.4425255358219147e-05, -1.2792646884918213e-05, -1.1160038411617279e-05, -9.527429938316345e-06, -7.894821465015411e-06, -6.2622129917144775e-06, -4.629604518413544e-06, -2.99699604511261e-06, -1.364387571811676e-06, 2.682209014892578e-07, 1.9008293747901917e-06, 3.5334378480911255e-06, 5.166046321392059e-06, 6.798654794692993e-06, 8.431263267993927e-06, 1.006387174129486e-05, 1.1696480214595795e-05, 1.3329088687896729e-05, 1.4961697161197662e-05, 1.6594305634498596e-05, 1.822691410779953e-05, 1.9859522581100464e-05, 2.1492131054401398e-05, 2.312473952770233e-05, 2.4757348001003265e-05, 2.63899564743042e-05, 2.8022564947605133e-05, 2.9655173420906067e-05, 3.1287781894207e-05, 3.2920390367507935e-05, 3.455299884080887e-05, 3.61856073141098e-05, 3.7818215787410736e-05, 3.945082426071167e-05, 4.1083432734012604e-05, 4.271604120731354e-05, 4.434864968061447e-05, 4.5981258153915405e-05, 4.761386662721634e-05, 4.924647510051727e-05, 5.087908357381821e-05, 5.251169204711914e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 19.0, 35.0, 60.0, 94.0, 159.0, 282.0, 1059.0, 31374.0, 1009323.0, 5096.0, 505.0, 211.0, 117.0, 86.0, 41.0, 24.0, 23.0, 11.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.115234375, -1.0758209228515625, -1.036407470703125, -0.9969940185546875, -0.95758056640625, -0.9181671142578125, -0.878753662109375, -0.8393402099609375, -0.7999267578125, -0.7605133056640625, -0.721099853515625, -0.6816864013671875, -0.64227294921875, -0.6028594970703125, -0.563446044921875, -0.5240325927734375, -0.484619140625, -0.4452056884765625, -0.405792236328125, -0.3663787841796875, -0.32696533203125, -0.2875518798828125, -0.248138427734375, -0.2087249755859375, -0.1693115234375, -0.1298980712890625, -0.090484619140625, -0.0510711669921875, -0.01165771484375, 0.0277557373046875, 0.067169189453125, 0.1065826416015625, 0.14599609375, 0.1854095458984375, 0.224822998046875, 0.2642364501953125, 0.30364990234375, 0.3430633544921875, 0.382476806640625, 0.4218902587890625, 0.4613037109375, 0.5007171630859375, 0.540130615234375, 0.5795440673828125, 0.61895751953125, 0.6583709716796875, 0.697784423828125, 0.7371978759765625, 0.776611328125, 0.8160247802734375, 0.855438232421875, 0.8948516845703125, 0.93426513671875, 0.9736785888671875, 1.013092041015625, 1.0525054931640625, 1.0919189453125, 1.1313323974609375, 1.170745849609375, 1.2101593017578125, 1.24957275390625, 1.2889862060546875, 1.328399658203125, 1.3678131103515625, 1.4072265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 35.0, 212.0, 530.0, 171.0, 35.0, 8.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.172760009765625, -1.12677001953125, -1.080780029296875, -1.0347900390625, -0.988800048828125, -0.94281005859375, -0.896820068359375, -0.850830078125, -0.804840087890625, -0.75885009765625, -0.712860107421875, -0.6668701171875, -0.620880126953125, -0.57489013671875, -0.528900146484375, -0.48291015625, -0.436920166015625, -0.39093017578125, -0.344940185546875, -0.2989501953125, -0.252960205078125, -0.20697021484375, -0.160980224609375, -0.114990234375, -0.069000244140625, -0.02301025390625, 0.022979736328125, 0.0689697265625, 0.114959716796875, 0.16094970703125, 0.206939697265625, 0.2529296875, 0.298919677734375, 0.34490966796875, 0.390899658203125, 0.4368896484375, 0.482879638671875, 0.52886962890625, 0.574859619140625, 0.620849609375, 0.666839599609375, 0.71282958984375, 0.758819580078125, 0.8048095703125, 0.850799560546875, 0.89678955078125, 0.942779541015625, 0.98876953125, 1.034759521484375, 1.08074951171875, 1.126739501953125, 1.1727294921875, 1.218719482421875, 1.26470947265625, 1.310699462890625, 1.356689453125, 1.402679443359375, 1.44866943359375, 1.494659423828125, 1.5406494140625, 1.586639404296875, 1.63262939453125, 1.678619384765625, 1.724609375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 19.0, 39.0, 93.0, 336.0, 335.0, 134.0, 33.0, 10.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6794753074645996, -3.3204543590545654, -2.9614334106445312, -2.602412223815918, -2.243391275405884, -1.8843703269958496, -1.5253491401672363, -1.1663281917572021, -0.807307243347168, -0.448286235332489, -0.08926522731781006, 0.26975584030151367, 0.6287767887115479, 0.987797737121582, 1.3468189239501953, 1.7058398723602295, 2.0648608207702637, 2.423881769180298, 2.782902717590332, 3.1419239044189453, 3.5009448528289795, 3.8599658012390137, 4.218986988067627, 4.578007698059082, 4.937028884887695, 5.296050071716309, 5.655070781707764, 6.014091968536377, 6.373112678527832, 6.732133865356445, 7.091155052185059, 7.450176239013672, 7.809196472167969, 8.168217658996582, 8.527238845825195, 8.886259078979492, 9.245280265808105, 9.604301452636719, 9.963322639465332, 10.322343826293945, 10.681364059448242, 11.040385246276855, 11.399406433105469, 11.758426666259766, 12.117447853088379, 12.476469039916992, 12.835490226745605, 13.194511413574219, 13.553532600402832, 13.912553787231445, 14.271574974060059, 14.630596160888672, 14.989616394042969, 15.348637580871582, 15.707658767700195, 16.066679000854492, 16.425701141357422, 16.78472137451172, 17.14374351501465, 17.502763748168945, 17.861785888671875, 18.220806121826172, 18.57982635498047, 18.9388484954834, 19.297868728637695]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 3.0, 9.0, 9.0, 11.0, 13.0, 15.0, 13.0, 14.0, 20.0, 36.0, 33.0, 41.0, 39.0, 32.0, 43.0, 37.0, 57.0, 46.0, 47.0, 42.0, 39.0, 41.0, 50.0, 30.0, 33.0, 28.0, 21.0, 39.0, 25.0, 25.0, 17.0, 21.0, 13.0, 10.0, 3.0, 8.0, 3.0, 2.0, 6.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.138191223144531, -4.019832134246826, -3.901472806930542, -3.783113479614258, -3.6647541522979736, -3.5463948249816895, -3.4280357360839844, -3.3096764087677, -3.191317081451416, -3.072957754135132, -2.9545986652374268, -2.8362393379211426, -2.7178800106048584, -2.599520683288574, -2.481161594390869, -2.362802267074585, -2.24444317817688, -2.1260838508605957, -2.0077247619628906, -1.8893654346466064, -1.7710061073303223, -1.6526468992233276, -1.534287691116333, -1.4159283638000488, -1.2975691556930542, -1.1792099475860596, -1.0608506202697754, -0.9424914121627808, -0.8241321444511414, -0.705772876739502, -0.5874136686325073, -0.4690544009208679, -0.3506953716278076, -0.2323361188173294, -0.1139768660068512, 0.00438237190246582, 0.12274163961410522, 0.24110090732574463, 0.35946011543273926, 0.47781938314437866, 0.5961786508560181, 0.7145379185676575, 0.8328971862792969, 0.9512563943862915, 1.0696156024932861, 1.1879749298095703, 1.306334137916565, 1.4246933460235596, 1.5430526733398438, 1.6614118814468384, 1.7797712087631226, 1.8981304168701172, 2.0164897441864014, 2.1348490715026855, 2.2532081604003906, 2.371567487716675, 2.489926815032959, 2.608286142349243, 2.7266452312469482, 2.8450045585632324, 2.9633638858795166, 3.081723213195801, 3.200082302093506, 3.31844162940979, 3.436800718307495]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 10.0, 8.0, 16.0, 19.0, 35.0, 56.0, 56.0, 78.0, 132.0, 169.0, 290.0, 436.0, 732.0, 1358.0, 2491.0, 5211.0, 13318.0, 43272.0, 374223.0, 3620227.0, 93592.0, 22271.0, 8065.0, 3622.0, 1888.0, 1034.0, 554.0, 347.0, 247.0, 159.0, 107.0, 67.0, 59.0, 34.0, 24.0, 19.0, 15.0, 11.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.5380859375, -0.5228157043457031, -0.5075454711914062, -0.4922752380371094, -0.4770050048828125, -0.4617347717285156, -0.44646453857421875, -0.4311943054199219, -0.415924072265625, -0.4006538391113281, -0.38538360595703125, -0.3701133728027344, -0.3548431396484375, -0.3395729064941406, -0.32430267333984375, -0.3090324401855469, -0.29376220703125, -0.2784919738769531, -0.26322174072265625, -0.24795150756835938, -0.2326812744140625, -0.21741104125976562, -0.20214080810546875, -0.18687057495117188, -0.171600341796875, -0.15633010864257812, -0.14105987548828125, -0.12578964233398438, -0.1105194091796875, -0.09524917602539062, -0.07997894287109375, -0.06470870971679688, -0.0494384765625, -0.034168243408203125, -0.01889801025390625, -0.003627777099609375, 0.0116424560546875, 0.026912689208984375, 0.04218292236328125, 0.057453155517578125, 0.072723388671875, 0.08799362182617188, 0.10326385498046875, 0.11853408813476562, 0.1338043212890625, 0.14907455444335938, 0.16434478759765625, 0.17961502075195312, 0.19488525390625, 0.21015548706054688, 0.22542572021484375, 0.24069595336914062, 0.2559661865234375, 0.2712364196777344, 0.28650665283203125, 0.3017768859863281, 0.317047119140625, 0.3323173522949219, 0.34758758544921875, 0.3628578186035156, 0.3781280517578125, 0.3933982849121094, 0.40866851806640625, 0.4239387512207031, 0.439208984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 6.0, 11.0, 14.0, 22.0, 24.0, 29.0, 36.0, 36.0, 42.0, 62.0, 55.0, 45.0, 48.0, 56.0, 39.0, 62.0, 51.0, 34.0, 43.0, 36.0, 33.0, 42.0, 32.0, 25.0, 15.0, 17.0, 14.0, 15.0, 7.0, 11.0, 14.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.15790748596191406, -0.15114212036132812, -0.1443767547607422, -0.13761138916015625, -0.1308460235595703, -0.12408065795898438, -0.11731529235839844, -0.1105499267578125, -0.10378456115722656, -0.09701919555664062, -0.09025382995605469, -0.08348846435546875, -0.07672309875488281, -0.06995773315429688, -0.06319236755371094, -0.056427001953125, -0.04966163635253906, -0.042896270751953125, -0.03613090515136719, -0.02936553955078125, -0.022600173950195312, -0.015834808349609375, -0.009069442749023438, -0.0023040771484375, 0.0044612884521484375, 0.011226654052734375, 0.017992019653320312, 0.02475738525390625, 0.03152275085449219, 0.038288116455078125, 0.04505348205566406, 0.05181884765625, 0.05858421325683594, 0.06534957885742188, 0.07211494445800781, 0.07888031005859375, 0.08564567565917969, 0.09241104125976562, 0.09917640686035156, 0.1059417724609375, 0.11270713806152344, 0.11947250366210938, 0.1262378692626953, 0.13300323486328125, 0.1397686004638672, 0.14653396606445312, 0.15329933166503906, 0.160064697265625, 0.16683006286621094, 0.17359542846679688, 0.1803607940673828, 0.18712615966796875, 0.1938915252685547, 0.20065689086914062, 0.20742225646972656, 0.2141876220703125, 0.22095298767089844, 0.22771835327148438, 0.2344837188720703, 0.24124908447265625, 0.2480144500732422, 0.2547798156738281, 0.26154518127441406, 0.268310546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 11.0, 22.0, 17.0, 27.0, 35.0, 62.0, 76.0, 122.0, 235.0, 391.0, 962.0, 3668.0, 30723.0, 4049555.0, 99334.0, 6509.0, 1340.0, 474.0, 242.0, 145.0, 83.0, 75.0, 63.0, 38.0, 23.0, 14.0, 7.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0830078125, -1.039093017578125, -0.99517822265625, -0.951263427734375, -0.9073486328125, -0.863433837890625, -0.81951904296875, -0.775604248046875, -0.731689453125, -0.687774658203125, -0.64385986328125, -0.599945068359375, -0.5560302734375, -0.512115478515625, -0.46820068359375, -0.424285888671875, -0.38037109375, -0.336456298828125, -0.29254150390625, -0.248626708984375, -0.2047119140625, -0.160797119140625, -0.11688232421875, -0.072967529296875, -0.029052734375, 0.014862060546875, 0.05877685546875, 0.102691650390625, 0.1466064453125, 0.190521240234375, 0.23443603515625, 0.278350830078125, 0.322265625, 0.366180419921875, 0.41009521484375, 0.454010009765625, 0.4979248046875, 0.541839599609375, 0.58575439453125, 0.629669189453125, 0.673583984375, 0.717498779296875, 0.76141357421875, 0.805328369140625, 0.8492431640625, 0.893157958984375, 0.93707275390625, 0.980987548828125, 1.02490234375, 1.068817138671875, 1.11273193359375, 1.156646728515625, 1.2005615234375, 1.244476318359375, 1.28839111328125, 1.332305908203125, 1.376220703125, 1.420135498046875, 1.46405029296875, 1.507965087890625, 1.5518798828125, 1.595794677734375, 1.63970947265625, 1.683624267578125, 1.7275390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 15.0, 26.0, 64.0, 430.0, 3240.0, 198.0, 52.0, 18.0, 12.0, 9.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5309219360351562, -0.5071563720703125, -0.48339080810546875, -0.459625244140625, -0.43585968017578125, -0.4120941162109375, -0.38832855224609375, -0.36456298828125, -0.34079742431640625, -0.3170318603515625, -0.29326629638671875, -0.269500732421875, -0.24573516845703125, -0.2219696044921875, -0.19820404052734375, -0.1744384765625, -0.15067291259765625, -0.1269073486328125, -0.10314178466796875, -0.079376220703125, -0.05561065673828125, -0.0318450927734375, -0.00807952880859375, 0.01568603515625, 0.03945159912109375, 0.0632171630859375, 0.08698272705078125, 0.110748291015625, 0.13451385498046875, 0.1582794189453125, 0.18204498291015625, 0.205810546875, 0.22957611083984375, 0.2533416748046875, 0.27710723876953125, 0.300872802734375, 0.32463836669921875, 0.3484039306640625, 0.37216949462890625, 0.39593505859375, 0.41970062255859375, 0.4434661865234375, 0.46723175048828125, 0.490997314453125, 0.5147628784179688, 0.5385284423828125, 0.5622940063476562, 0.5860595703125, 0.6098251342773438, 0.6335906982421875, 0.6573562622070312, 0.681121826171875, 0.7048873901367188, 0.7286529541015625, 0.7524185180664062, 0.77618408203125, 0.7999496459960938, 0.8237152099609375, 0.8474807739257812, 0.871246337890625, 0.8950119018554688, 0.9187774658203125, 0.9425430297851562, 0.96630859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 27.0, 138.0, 365.0, 346.0, 84.0, 18.0, 10.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.105861186981201, -5.992343425750732, -5.8788251876831055, -5.765307426452637, -5.651789665222168, -5.538271903991699, -5.424753665924072, -5.3112359046936035, -5.197718143463135, -5.084200382232666, -4.970682144165039, -4.85716438293457, -4.743646621704102, -4.630128860473633, -4.516610622406006, -4.403092861175537, -4.28957462310791, -4.176056861877441, -4.0625386238098145, -3.9490208625793457, -3.835503101348877, -3.721985101699829, -3.6084671020507812, -3.4949493408203125, -3.3814315795898438, -3.267913579940796, -3.154395818710327, -3.0408778190612793, -2.9273600578308105, -2.8138420581817627, -2.700324058532715, -2.586806297302246, -2.4732885360717773, -2.3597705364227295, -2.2462527751922607, -2.132734775543213, -2.019217014312744, -1.9056990146636963, -1.792181134223938, -1.6786632537841797, -1.5651453733444214, -1.451627492904663, -1.3381096124649048, -1.2245917320251465, -1.1110737323760986, -0.9975559115409851, -0.884037971496582, -0.7705200910568237, -0.6570022106170654, -0.5434843301773071, -0.42996641993522644, -0.31644850969314575, -0.20293062925338745, -0.08941274881362915, 0.024105191230773926, 0.13762307167053223, 0.2511409521102905, 0.36465883255004883, 0.4781767427921295, 0.5916946530342102, 0.7052125334739685, 0.8187304139137268, 0.9322483539581299, 1.0457662343978882, 1.1592841148376465]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 2.0, 2.0, 6.0, 8.0, 11.0, 9.0, 19.0, 23.0, 22.0, 27.0, 37.0, 41.0, 40.0, 48.0, 52.0, 51.0, 64.0, 62.0, 51.0, 73.0, 43.0, 43.0, 43.0, 43.0, 50.0, 21.0, 22.0, 20.0, 17.0, 10.0, 10.0, 7.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.045449137687683, -1.0140300989151, -0.9826111197471619, -0.9511920809745789, -0.9197731018066406, -0.8883540630340576, -0.8569350242614746, -0.8255160450935364, -0.7940970659255981, -0.7626780271530151, -0.7312590479850769, -0.6998400092124939, -0.6684210300445557, -0.6370019912719727, -0.6055829524993896, -0.5741639733314514, -0.5427449345588684, -0.5113258957862854, -0.47990691661834717, -0.44848787784576416, -0.4170688986778259, -0.3856498599052429, -0.3542308509349823, -0.3228118419647217, -0.29139283299446106, -0.25997382402420044, -0.22855481505393982, -0.197135791182518, -0.16571678221225739, -0.13429777324199677, -0.10287874937057495, -0.07145974040031433, -0.040040671825408936, -0.008621659129858017, 0.0227973535656929, 0.05421636998653412, 0.08563537895679474, 0.11705438792705536, 0.14847341179847717, 0.1798924207687378, 0.2113114297389984, 0.24273043870925903, 0.27414944767951965, 0.3055684566497803, 0.3369874954223633, 0.3684064745903015, 0.3998255133628845, 0.43124452233314514, 0.46266353130340576, 0.4940825402736664, 0.525501549243927, 0.55692058801651, 0.5883395671844482, 0.6197586059570312, 0.6511776447296143, 0.6825966238975525, 0.7140156030654907, 0.7454346418380737, 0.776853621006012, 0.808272659778595, 0.8396916389465332, 0.8711106777191162, 0.9025297164916992, 0.9339486956596375, 0.9653677344322205]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 12.0, 9.0, 12.0, 18.0, 21.0, 41.0, 49.0, 94.0, 158.0, 271.0, 465.0, 913.0, 1873.0, 4215.0, 10009.0, 26018.0, 80193.0, 301120.0, 435571.0, 125442.0, 37700.0, 13792.0, 5429.0, 2516.0, 1142.0, 614.0, 327.0, 170.0, 116.0, 70.0, 45.0, 40.0, 16.0, 19.0, 11.0, 17.0, 3.0, 12.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6953125, -0.6755447387695312, -0.6557769775390625, -0.6360092163085938, -0.616241455078125, -0.5964736938476562, -0.5767059326171875, -0.5569381713867188, -0.53717041015625, -0.5174026489257812, -0.4976348876953125, -0.47786712646484375, -0.458099365234375, -0.43833160400390625, -0.4185638427734375, -0.39879608154296875, -0.3790283203125, -0.35926055908203125, -0.3394927978515625, -0.31972503662109375, -0.299957275390625, -0.28018951416015625, -0.2604217529296875, -0.24065399169921875, -0.22088623046875, -0.20111846923828125, -0.1813507080078125, -0.16158294677734375, -0.141815185546875, -0.12204742431640625, -0.1022796630859375, -0.08251190185546875, -0.062744140625, -0.04297637939453125, -0.0232086181640625, -0.00344085693359375, 0.016326904296875, 0.03609466552734375, 0.0558624267578125, 0.07563018798828125, 0.09539794921875, 0.11516571044921875, 0.1349334716796875, 0.15470123291015625, 0.174468994140625, 0.19423675537109375, 0.2140045166015625, 0.23377227783203125, 0.2535400390625, 0.27330780029296875, 0.2930755615234375, 0.31284332275390625, 0.332611083984375, 0.35237884521484375, 0.3721466064453125, 0.39191436767578125, 0.41168212890625, 0.43144989013671875, 0.4512176513671875, 0.47098541259765625, 0.490753173828125, 0.5105209350585938, 0.5302886962890625, 0.5500564575195312, 0.56982421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 1.0, 5.0, 2.0, 3.0, 9.0, 11.0, 18.0, 18.0, 30.0, 32.0, 32.0, 37.0, 52.0, 49.0, 50.0, 54.0, 49.0, 49.0, 43.0, 51.0, 47.0, 36.0, 49.0, 37.0, 32.0, 29.0, 31.0, 28.0, 18.0, 26.0, 9.0, 11.0, 12.0, 11.0, 8.0, 5.0, 9.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1771240234375, -0.17061233520507812, -0.16410064697265625, -0.15758895874023438, -0.1510772705078125, -0.14456558227539062, -0.13805389404296875, -0.13154220581054688, -0.125030517578125, -0.11851882934570312, -0.11200714111328125, -0.10549545288085938, -0.0989837646484375, -0.09247207641601562, -0.08596038818359375, -0.07944869995117188, -0.07293701171875, -0.06642532348632812, -0.05991363525390625, -0.053401947021484375, -0.0468902587890625, -0.040378570556640625, -0.03386688232421875, -0.027355194091796875, -0.020843505859375, -0.014331817626953125, -0.00782012939453125, -0.001308441162109375, 0.0052032470703125, 0.011714935302734375, 0.01822662353515625, 0.024738311767578125, 0.03125, 0.037761688232421875, 0.04427337646484375, 0.050785064697265625, 0.0572967529296875, 0.06380844116210938, 0.07032012939453125, 0.07683181762695312, 0.083343505859375, 0.08985519409179688, 0.09636688232421875, 0.10287857055664062, 0.1093902587890625, 0.11590194702148438, 0.12241363525390625, 0.12892532348632812, 0.13543701171875, 0.14194869995117188, 0.14846038818359375, 0.15497207641601562, 0.1614837646484375, 0.16799545288085938, 0.17450714111328125, 0.18101882934570312, 0.187530517578125, 0.19404220581054688, 0.20055389404296875, 0.20706558227539062, 0.2135772705078125, 0.22008895874023438, 0.22660064697265625, 0.23311233520507812, 0.2396240234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 8.0, 12.0, 17.0, 31.0, 23.0, 41.0, 69.0, 79.0, 148.0, 246.0, 484.0, 1146.0, 2982.0, 9075.0, 32433.0, 147508.0, 574759.0, 216300.0, 44788.0, 11868.0, 3782.0, 1422.0, 596.0, 289.0, 142.0, 95.0, 45.0, 40.0, 37.0, 17.0, 14.0, 13.0, 8.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.693359375, -0.6699447631835938, -0.6465301513671875, -0.6231155395507812, -0.599700927734375, -0.5762863159179688, -0.5528717041015625, -0.5294570922851562, -0.50604248046875, -0.48262786865234375, -0.4592132568359375, -0.43579864501953125, -0.412384033203125, -0.38896942138671875, -0.3655548095703125, -0.34214019775390625, -0.3187255859375, -0.29531097412109375, -0.2718963623046875, -0.24848175048828125, -0.225067138671875, -0.20165252685546875, -0.1782379150390625, -0.15482330322265625, -0.13140869140625, -0.10799407958984375, -0.0845794677734375, -0.06116485595703125, -0.037750244140625, -0.01433563232421875, 0.0090789794921875, 0.03249359130859375, 0.055908203125, 0.07932281494140625, 0.1027374267578125, 0.12615203857421875, 0.149566650390625, 0.17298126220703125, 0.1963958740234375, 0.21981048583984375, 0.24322509765625, 0.26663970947265625, 0.2900543212890625, 0.31346893310546875, 0.336883544921875, 0.36029815673828125, 0.3837127685546875, 0.40712738037109375, 0.4305419921875, 0.45395660400390625, 0.4773712158203125, 0.5007858276367188, 0.524200439453125, 0.5476150512695312, 0.5710296630859375, 0.5944442749023438, 0.61785888671875, 0.6412734985351562, 0.6646881103515625, 0.6881027221679688, 0.711517333984375, 0.7349319458007812, 0.7583465576171875, 0.7817611694335938, 0.80517578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 10.0, 8.0, 17.0, 15.0, 28.0, 20.0, 27.0, 31.0, 34.0, 31.0, 31.0, 44.0, 54.0, 47.0, 46.0, 46.0, 38.0, 45.0, 40.0, 44.0, 37.0, 34.0, 31.0, 30.0, 31.0, 29.0, 21.0, 15.0, 15.0, 16.0, 23.0, 7.0, 5.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7900390625, -0.7654495239257812, -0.7408599853515625, -0.7162704467773438, -0.691680908203125, -0.6670913696289062, -0.6425018310546875, -0.6179122924804688, -0.59332275390625, -0.5687332153320312, -0.5441436767578125, -0.5195541381835938, -0.494964599609375, -0.47037506103515625, -0.4457855224609375, -0.42119598388671875, -0.3966064453125, -0.37201690673828125, -0.3474273681640625, -0.32283782958984375, -0.298248291015625, -0.27365875244140625, -0.2490692138671875, -0.22447967529296875, -0.19989013671875, -0.17530059814453125, -0.1507110595703125, -0.12612152099609375, -0.101531982421875, -0.07694244384765625, -0.0523529052734375, -0.02776336669921875, -0.003173828125, 0.02141571044921875, 0.0460052490234375, 0.07059478759765625, 0.095184326171875, 0.11977386474609375, 0.1443634033203125, 0.16895294189453125, 0.19354248046875, 0.21813201904296875, 0.2427215576171875, 0.26731109619140625, 0.291900634765625, 0.31649017333984375, 0.3410797119140625, 0.36566925048828125, 0.3902587890625, 0.41484832763671875, 0.4394378662109375, 0.46402740478515625, 0.488616943359375, 0.5132064819335938, 0.5377960205078125, 0.5623855590820312, 0.58697509765625, 0.6115646362304688, 0.6361541748046875, 0.6607437133789062, 0.685333251953125, 0.7099227905273438, 0.7345123291015625, 0.7591018676757812, 0.78369140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 6.0, 17.0, 17.0, 28.0, 32.0, 47.0, 106.0, 176.0, 266.0, 601.0, 1358.0, 3752.0, 14470.0, 92496.0, 581781.0, 303688.0, 37969.0, 7517.0, 2215.0, 943.0, 408.0, 247.0, 125.0, 91.0, 51.0, 40.0, 22.0, 23.0, 12.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23232078552246094, -0.22330856323242188, -0.2142963409423828, -0.20528411865234375, -0.1962718963623047, -0.18725967407226562, -0.17824745178222656, -0.1692352294921875, -0.16022300720214844, -0.15121078491210938, -0.1421985626220703, -0.13318634033203125, -0.12417411804199219, -0.11516189575195312, -0.10614967346191406, -0.097137451171875, -0.08812522888183594, -0.07911300659179688, -0.07010078430175781, -0.06108856201171875, -0.05207633972167969, -0.043064117431640625, -0.03405189514160156, -0.0250396728515625, -0.016027450561523438, -0.007015228271484375, 0.0019969940185546875, 0.01100921630859375, 0.020021438598632812, 0.029033660888671875, 0.03804588317871094, 0.04705810546875, 0.05607032775878906, 0.06508255004882812, 0.07409477233886719, 0.08310699462890625, 0.09211921691894531, 0.10113143920898438, 0.11014366149902344, 0.1191558837890625, 0.12816810607910156, 0.13718032836914062, 0.1461925506591797, 0.15520477294921875, 0.1642169952392578, 0.17322921752929688, 0.18224143981933594, 0.191253662109375, 0.20026588439941406, 0.20927810668945312, 0.2182903289794922, 0.22730255126953125, 0.2363147735595703, 0.24532699584960938, 0.25433921813964844, 0.2633514404296875, 0.27236366271972656, 0.2813758850097656, 0.2903881072998047, 0.29940032958984375, 0.3084125518798828, 0.3174247741699219, 0.32643699645996094, 0.33544921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 7.0, 20.0, 17.0, 22.0, 42.0, 59.0, 100.0, 124.0, 123.0, 129.0, 111.0, 69.0, 60.0, 32.0, 22.0, 14.0, 8.0, 15.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849102020263672e-05, -2.6963651180267334e-05, -2.543628215789795e-05, -2.3908913135528564e-05, -2.238154411315918e-05, -2.0854175090789795e-05, -1.932680606842041e-05, -1.7799437046051025e-05, -1.627206802368164e-05, -1.4744699001312256e-05, -1.3217329978942871e-05, -1.1689960956573486e-05, -1.0162591934204102e-05, -8.635222911834717e-06, -7.107853889465332e-06, -5.580484867095947e-06, -4.0531158447265625e-06, -2.5257468223571777e-06, -9.98377799987793e-07, 5.289912223815918e-07, 2.0563602447509766e-06, 3.5837292671203613e-06, 5.111098289489746e-06, 6.638467311859131e-06, 8.165836334228516e-06, 9.6932053565979e-06, 1.1220574378967285e-05, 1.274794340133667e-05, 1.4275312423706055e-05, 1.580268144607544e-05, 1.7330050468444824e-05, 1.885741949081421e-05, 2.0384788513183594e-05, 2.191215753555298e-05, 2.3439526557922363e-05, 2.4966895580291748e-05, 2.6494264602661133e-05, 2.8021633625030518e-05, 2.9549002647399902e-05, 3.107637166976929e-05, 3.260374069213867e-05, 3.413110971450806e-05, 3.565847873687744e-05, 3.7185847759246826e-05, 3.871321678161621e-05, 4.0240585803985596e-05, 4.176795482635498e-05, 4.3295323848724365e-05, 4.482269287109375e-05, 4.6350061893463135e-05, 4.787743091583252e-05, 4.9404799938201904e-05, 5.093216896057129e-05, 5.2459537982940674e-05, 5.398690700531006e-05, 5.551427602767944e-05, 5.704164505004883e-05, 5.856901407241821e-05, 6.00963830947876e-05, 6.162375211715698e-05, 6.315112113952637e-05, 6.467849016189575e-05, 6.620585918426514e-05, 6.773322820663452e-05, 6.92605972290039e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 6.0, 13.0, 21.0, 21.0, 40.0, 71.0, 138.0, 332.0, 910.0, 3882.0, 27952.0, 410564.0, 558445.0, 39473.0, 4929.0, 1028.0, 346.0, 187.0, 91.0, 42.0, 26.0, 12.0, 11.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.442626953125, -0.43068695068359375, -0.4187469482421875, -0.40680694580078125, -0.394866943359375, -0.38292694091796875, -0.3709869384765625, -0.35904693603515625, -0.34710693359375, -0.33516693115234375, -0.3232269287109375, -0.31128692626953125, -0.299346923828125, -0.28740692138671875, -0.2754669189453125, -0.26352691650390625, -0.2515869140625, -0.23964691162109375, -0.2277069091796875, -0.21576690673828125, -0.203826904296875, -0.19188690185546875, -0.1799468994140625, -0.16800689697265625, -0.15606689453125, -0.14412689208984375, -0.1321868896484375, -0.12024688720703125, -0.108306884765625, -0.09636688232421875, -0.0844268798828125, -0.07248687744140625, -0.060546875, -0.04860687255859375, -0.0366668701171875, -0.02472686767578125, -0.012786865234375, -0.00084686279296875, 0.0110931396484375, 0.02303314208984375, 0.03497314453125, 0.04691314697265625, 0.0588531494140625, 0.07079315185546875, 0.082733154296875, 0.09467315673828125, 0.1066131591796875, 0.11855316162109375, 0.1304931640625, 0.14243316650390625, 0.1543731689453125, 0.16631317138671875, 0.178253173828125, 0.19019317626953125, 0.2021331787109375, 0.21407318115234375, 0.22601318359375, 0.23795318603515625, 0.2498931884765625, 0.26183319091796875, 0.273773193359375, 0.28571319580078125, 0.2976531982421875, 0.30959320068359375, 0.321533203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 14.0, 15.0, 25.0, 38.0, 49.0, 63.0, 95.0, 115.0, 122.0, 120.0, 92.0, 76.0, 68.0, 31.0, 29.0, 18.0, 11.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4931640625, -0.4816303253173828, -0.4700965881347656, -0.45856285095214844, -0.44702911376953125, -0.43549537658691406, -0.4239616394042969, -0.4124279022216797, -0.4008941650390625, -0.3893604278564453, -0.3778266906738281, -0.36629295349121094, -0.35475921630859375, -0.34322547912597656, -0.3316917419433594, -0.3201580047607422, -0.308624267578125, -0.2970905303955078, -0.2855567932128906, -0.27402305603027344, -0.26248931884765625, -0.25095558166503906, -0.23942184448242188, -0.2278881072998047, -0.2163543701171875, -0.2048206329345703, -0.19328689575195312, -0.18175315856933594, -0.17021942138671875, -0.15868568420410156, -0.14715194702148438, -0.1356182098388672, -0.12408447265625, -0.11255073547363281, -0.10101699829101562, -0.08948326110839844, -0.07794952392578125, -0.06641578674316406, -0.054882049560546875, -0.04334831237792969, -0.0318145751953125, -0.020280838012695312, -0.008747100830078125, 0.0027866363525390625, 0.01432037353515625, 0.025854110717773438, 0.037387847900390625, 0.04892158508300781, 0.060455322265625, 0.07198905944824219, 0.08352279663085938, 0.09505653381347656, 0.10659027099609375, 0.11812400817871094, 0.12965774536132812, 0.1411914825439453, 0.1527252197265625, 0.1642589569091797, 0.17579269409179688, 0.18732643127441406, 0.19886016845703125, 0.21039390563964844, 0.22192764282226562, 0.2334613800048828, 0.2449951171875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 14.0, 14.0, 29.0, 64.0, 135.0, 270.0, 237.0, 146.0, 51.0, 23.0, 13.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.018630027770996, -11.787850379943848, -11.557071685791016, -11.326292037963867, -11.095513343811035, -10.864733695983887, -10.633955001831055, -10.403175354003906, -10.172395706176758, -9.94161605834961, -9.710837364196777, -9.480057716369629, -9.249279022216797, -9.018499374389648, -8.787720680236816, -8.556941032409668, -8.326162338256836, -8.095382690429688, -7.8646039962768555, -7.633824825286865, -7.403045654296875, -7.172266006469727, -6.941486835479736, -6.710707664489746, -6.479928493499756, -6.249149322509766, -6.018370151519775, -5.787590980529785, -5.556811332702637, -5.326032638549805, -5.095252990722656, -4.864473819732666, -4.633694171905518, -4.402915000915527, -4.172135829925537, -3.9413564205169678, -3.7105772495269775, -3.4797980785369873, -3.249018669128418, -3.0182394981384277, -2.7874603271484375, -2.5566811561584473, -2.325901985168457, -2.0951225757598877, -1.8643434047698975, -1.6335642337799072, -1.4027849435806274, -1.1720056533813477, -0.9412264823913574, -0.7104472517967224, -0.4796680212020874, -0.2488887906074524, -0.018109560012817383, 0.21266961097717285, 0.44344890117645264, 0.6742281913757324, 0.9050073623657227, 1.135786533355713, 1.3665658235549927, 1.5973451137542725, 1.8281242847442627, 2.058903455734253, 2.2896828651428223, 2.5204620361328125, 2.7512412071228027]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 9.0, 11.0, 11.0, 15.0, 13.0, 21.0, 15.0, 25.0, 28.0, 30.0, 31.0, 39.0, 45.0, 48.0, 50.0, 52.0, 51.0, 36.0, 45.0, 60.0, 47.0, 44.0, 38.0, 41.0, 42.0, 27.0, 21.0, 26.0, 9.0, 15.0, 13.0, 8.0, 4.0, 3.0, 7.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.715194225311279, -4.5851969718933105, -4.455199241638184, -4.325201988220215, -4.195204734802246, -4.065207481384277, -3.9352097511291504, -3.8052124977111816, -3.675215005874634, -3.545217514038086, -3.415220260620117, -3.2852227687835693, -3.1552252769470215, -3.0252280235290527, -2.895230531692505, -2.765233039855957, -2.6352357864379883, -2.5052382946014404, -2.3752410411834717, -2.245243549346924, -2.115246295928955, -1.9852488040924072, -1.8552513122558594, -1.725253939628601, -1.5952565670013428, -1.4652591943740845, -1.3352618217468262, -1.2052643299102783, -1.07526695728302, -0.9452695846557617, -0.8152721524238586, -0.6852747201919556, -0.5552773475646973, -0.4252799451351166, -0.2952825427055359, -0.1652851402759552, -0.03528773784637451, 0.09470963478088379, 0.22470706701278687, 0.35470449924468994, 0.48470187187194824, 0.6146992444992065, 0.7446966767311096, 0.8746941089630127, 1.004691481590271, 1.1346888542175293, 1.2646863460540771, 1.3946837186813354, 1.5246810913085938, 1.654678463935852, 1.7846758365631104, 1.9146733283996582, 2.044670581817627, 2.174668073654175, 2.3046655654907227, 2.4346628189086914, 2.5646603107452393, 2.694657802581787, 2.824655055999756, 2.9546525478363037, 3.0846500396728516, 3.2146472930908203, 3.344644784927368, 3.474642276763916, 3.6046395301818848]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 9.0, 9.0, 8.0, 16.0, 17.0, 32.0, 35.0, 52.0, 73.0, 110.0, 165.0, 235.0, 349.0, 517.0, 868.0, 1490.0, 2905.0, 6534.0, 18435.0, 131393.0, 3931024.0, 74163.0, 14468.0, 5376.0, 2470.0, 1404.0, 776.0, 438.0, 290.0, 206.0, 134.0, 81.0, 45.0, 45.0, 34.0, 19.0, 20.0, 12.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.0478515625, -1.0198287963867188, -0.9918060302734375, -0.9637832641601562, -0.935760498046875, -0.9077377319335938, -0.8797149658203125, -0.8516921997070312, -0.82366943359375, -0.7956466674804688, -0.7676239013671875, -0.7396011352539062, -0.711578369140625, -0.6835556030273438, -0.6555328369140625, -0.6275100708007812, -0.5994873046875, -0.5714645385742188, -0.5434417724609375, -0.5154190063476562, -0.487396240234375, -0.45937347412109375, -0.4313507080078125, -0.40332794189453125, -0.37530517578125, -0.34728240966796875, -0.3192596435546875, -0.29123687744140625, -0.263214111328125, -0.23519134521484375, -0.2071685791015625, -0.17914581298828125, -0.151123046875, -0.12310028076171875, -0.0950775146484375, -0.06705474853515625, -0.039031982421875, -0.01100921630859375, 0.0170135498046875, 0.04503631591796875, 0.07305908203125, 0.10108184814453125, 0.1291046142578125, 0.15712738037109375, 0.185150146484375, 0.21317291259765625, 0.2411956787109375, 0.26921844482421875, 0.2972412109375, 0.32526397705078125, 0.3532867431640625, 0.38130950927734375, 0.409332275390625, 0.43735504150390625, 0.4653778076171875, 0.49340057373046875, 0.52142333984375, 0.5494461059570312, 0.5774688720703125, 0.6054916381835938, 0.633514404296875, 0.6615371704101562, 0.6895599365234375, 0.7175827026367188, 0.74560546875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 9.0, 1.0, 4.0, 12.0, 11.0, 10.0, 20.0, 17.0, 24.0, 34.0, 33.0, 36.0, 39.0, 40.0, 48.0, 34.0, 47.0, 46.0, 53.0, 47.0, 48.0, 46.0, 42.0, 35.0, 42.0, 32.0, 24.0, 39.0, 24.0, 27.0, 15.0, 14.0, 11.0, 9.0, 7.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.246337890625, -0.23920059204101562, -0.23206329345703125, -0.22492599487304688, -0.2177886962890625, -0.21065139770507812, -0.20351409912109375, -0.19637680053710938, -0.189239501953125, -0.18210220336914062, -0.17496490478515625, -0.16782760620117188, -0.1606903076171875, -0.15355300903320312, -0.14641571044921875, -0.13927841186523438, -0.13214111328125, -0.12500381469726562, -0.11786651611328125, -0.11072921752929688, -0.1035919189453125, -0.09645462036132812, -0.08931732177734375, -0.08218002319335938, -0.075042724609375, -0.06790542602539062, -0.06076812744140625, -0.053630828857421875, -0.0464935302734375, -0.039356231689453125, -0.03221893310546875, -0.025081634521484375, -0.0179443359375, -0.010807037353515625, -0.00366973876953125, 0.003467559814453125, 0.0106048583984375, 0.017742156982421875, 0.02487945556640625, 0.032016754150390625, 0.039154052734375, 0.046291351318359375, 0.05342864990234375, 0.060565948486328125, 0.0677032470703125, 0.07484054565429688, 0.08197784423828125, 0.08911514282226562, 0.09625244140625, 0.10338973999023438, 0.11052703857421875, 0.11766433715820312, 0.1248016357421875, 0.13193893432617188, 0.13907623291015625, 0.14621353149414062, 0.153350830078125, 0.16048812866210938, 0.16762542724609375, 0.17476272583007812, 0.1819000244140625, 0.18903732299804688, 0.19617462158203125, 0.20331192016601562, 0.21044921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 13.0, 18.0, 20.0, 37.0, 43.0, 46.0, 73.0, 114.0, 164.0, 297.0, 1068.0, 8642.0, 4046995.0, 131870.0, 3483.0, 718.0, 259.0, 120.0, 62.0, 69.0, 47.0, 30.0, 34.0, 24.0, 11.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.0960235595703125, -3.016265869140625, -2.9365081787109375, -2.85675048828125, -2.7769927978515625, -2.697235107421875, -2.6174774169921875, -2.5377197265625, -2.4579620361328125, -2.378204345703125, -2.2984466552734375, -2.21868896484375, -2.1389312744140625, -2.059173583984375, -1.9794158935546875, -1.899658203125, -1.8199005126953125, -1.740142822265625, -1.6603851318359375, -1.58062744140625, -1.5008697509765625, -1.421112060546875, -1.3413543701171875, -1.2615966796875, -1.1818389892578125, -1.102081298828125, -1.0223236083984375, -0.94256591796875, -0.8628082275390625, -0.783050537109375, -0.7032928466796875, -0.62353515625, -0.5437774658203125, -0.464019775390625, -0.3842620849609375, -0.30450439453125, -0.2247467041015625, -0.144989013671875, -0.0652313232421875, 0.0145263671875, 0.0942840576171875, 0.174041748046875, 0.2537994384765625, 0.33355712890625, 0.4133148193359375, 0.493072509765625, 0.5728302001953125, 0.652587890625, 0.7323455810546875, 0.812103271484375, 0.8918609619140625, 0.97161865234375, 1.0513763427734375, 1.131134033203125, 1.2108917236328125, 1.2906494140625, 1.3704071044921875, 1.450164794921875, 1.5299224853515625, 1.60968017578125, 1.6894378662109375, 1.769195556640625, 1.8489532470703125, 1.9287109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 14.0, 29.0, 170.0, 3608.0, 197.0, 36.0, 10.0, 9.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.7155685424804688, -1.6743011474609375, -1.6330337524414062, -1.591766357421875, -1.5504989624023438, -1.5092315673828125, -1.4679641723632812, -1.42669677734375, -1.3854293823242188, -1.3441619873046875, -1.3028945922851562, -1.261627197265625, -1.2203598022460938, -1.1790924072265625, -1.1378250122070312, -1.0965576171875, -1.0552902221679688, -1.0140228271484375, -0.9727554321289062, -0.931488037109375, -0.8902206420898438, -0.8489532470703125, -0.8076858520507812, -0.76641845703125, -0.7251510620117188, -0.6838836669921875, -0.6426162719726562, -0.601348876953125, -0.5600814819335938, -0.5188140869140625, -0.47754669189453125, -0.436279296875, -0.39501190185546875, -0.3537445068359375, -0.31247711181640625, -0.271209716796875, -0.22994232177734375, -0.1886749267578125, -0.14740753173828125, -0.10614013671875, -0.06487274169921875, -0.0236053466796875, 0.01766204833984375, 0.058929443359375, 0.10019683837890625, 0.1414642333984375, 0.18273162841796875, 0.2239990234375, 0.26526641845703125, 0.3065338134765625, 0.34780120849609375, 0.389068603515625, 0.43033599853515625, 0.4716033935546875, 0.5128707885742188, 0.55413818359375, 0.5954055786132812, 0.6366729736328125, 0.6779403686523438, 0.719207763671875, 0.7604751586914062, 0.8017425537109375, 0.8430099487304688, 0.88427734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 14.0, 25.0, 81.0, 233.0, 374.0, 184.0, 51.0, 18.0, 13.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.567192077636719, -5.452269077301025, -5.33734655380249, -5.222423553466797, -5.1075005531311035, -4.99257755279541, -4.877655029296875, -4.762732028961182, -4.647809028625488, -4.532886028289795, -4.41796350479126, -4.303040504455566, -4.188117504119873, -4.07319450378418, -3.9582719802856445, -3.843348979949951, -3.728426218032837, -3.6135034561157227, -3.4985804557800293, -3.383657693862915, -3.2687346935272217, -3.1538119316101074, -3.038888931274414, -2.9239661693573, -2.8090434074401855, -2.6941206455230713, -2.579197645187378, -2.4642748832702637, -2.3493518829345703, -2.234429121017456, -2.119506359100342, -2.0045833587646484, -1.8896605968475342, -1.7747377157211304, -1.6598148345947266, -1.5448920726776123, -1.429969072341919, -1.3150463104248047, -1.2001234292984009, -1.085200548171997, -0.9702776670455933, -0.8553547859191895, -0.7404319047927856, -0.6255090832710266, -0.5105862021446228, -0.395663321018219, -0.28074049949645996, -0.16581761837005615, -0.050894737243652344, 0.06402812898159027, 0.17895099520683289, 0.2938738465309143, 0.4087967276573181, 0.5237196087837219, 0.638642430305481, 0.7535653114318848, 0.8684881925582886, 0.9834110736846924, 1.0983339548110962, 1.2132568359375, 1.3281795978546143, 1.4431025981903076, 1.5580253601074219, 1.6729482412338257, 1.7878711223602295]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 5.0, 13.0, 18.0, 16.0, 22.0, 27.0, 33.0, 49.0, 43.0, 42.0, 53.0, 53.0, 59.0, 61.0, 68.0, 65.0, 46.0, 55.0, 44.0, 39.0, 34.0, 34.0, 25.0, 22.0, 16.0, 11.0, 9.0, 12.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7369763851165771, -1.688307523727417, -1.6396386623382568, -1.5909698009490967, -1.542301058769226, -1.493632197380066, -1.4449633359909058, -1.3962944746017456, -1.347625732421875, -1.2989568710327148, -1.2502880096435547, -1.2016191482543945, -1.152950406074524, -1.1042815446853638, -1.0556126832962036, -1.0069438219070435, -0.9582749605178833, -0.9096060991287231, -0.8609372973442078, -0.8122684359550476, -0.7635996341705322, -0.7149307727813721, -0.6662619113922119, -0.6175930500030518, -0.5689242482185364, -0.5202553868293762, -0.47158658504486084, -0.4229177236557007, -0.3742488920688629, -0.32558006048202515, -0.276911199092865, -0.22824236750602722, -0.17957353591918945, -0.13090470433235168, -0.08223585784435272, -0.03356701135635376, 0.015101820230484009, 0.06377065181732178, 0.11243951320648193, 0.1611083447933197, 0.20977717638015747, 0.25844600796699524, 0.307114839553833, 0.35578370094299316, 0.40445253252983093, 0.4531213641166687, 0.5017902255058289, 0.5504590272903442, 0.5991278886795044, 0.6477967500686646, 0.6964655518531799, 0.7451344132423401, 0.7938032150268555, 0.8424720764160156, 0.8911409378051758, 0.9398097991943359, 0.9884786009788513, 1.0371474027633667, 1.0858162641525269, 1.134485125541687, 1.1831539869308472, 1.2318227291107178, 1.280491590499878, 1.329160451889038, 1.3778293132781982]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 8.0, 6.0, 5.0, 14.0, 25.0, 27.0, 42.0, 62.0, 101.0, 157.0, 198.0, 305.0, 469.0, 749.0, 1106.0, 1860.0, 3004.0, 5051.0, 8424.0, 14055.0, 24676.0, 45371.0, 88630.0, 182522.0, 278690.0, 190445.0, 93278.0, 46930.0, 25539.0, 14580.0, 8642.0, 5055.0, 3179.0, 1929.0, 1154.0, 824.0, 490.0, 310.0, 213.0, 143.0, 103.0, 58.0, 35.0, 29.0, 22.0, 11.0, 11.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4019508361816406, -0.38959503173828125, -0.3772392272949219, -0.3648834228515625, -0.3525276184082031, -0.34017181396484375, -0.3278160095214844, -0.315460205078125, -0.3031044006347656, -0.29074859619140625, -0.2783927917480469, -0.2660369873046875, -0.2536811828613281, -0.24132537841796875, -0.22896957397460938, -0.21661376953125, -0.20425796508789062, -0.19190216064453125, -0.17954635620117188, -0.1671905517578125, -0.15483474731445312, -0.14247894287109375, -0.13012313842773438, -0.117767333984375, -0.10541152954101562, -0.09305572509765625, -0.08069992065429688, -0.0683441162109375, -0.055988311767578125, -0.04363250732421875, -0.031276702880859375, -0.0189208984375, -0.006565093994140625, 0.00579071044921875, 0.018146514892578125, 0.0305023193359375, 0.042858123779296875, 0.05521392822265625, 0.06756973266601562, 0.079925537109375, 0.09228134155273438, 0.10463714599609375, 0.11699295043945312, 0.1293487548828125, 0.14170455932617188, 0.15406036376953125, 0.16641616821289062, 0.17877197265625, 0.19112777709960938, 0.20348358154296875, 0.21583938598632812, 0.2281951904296875, 0.24055099487304688, 0.25290679931640625, 0.2652626037597656, 0.277618408203125, 0.2899742126464844, 0.30233001708984375, 0.3146858215332031, 0.3270416259765625, 0.3393974304199219, 0.35175323486328125, 0.3641090393066406, 0.37646484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 11.0, 5.0, 9.0, 4.0, 14.0, 18.0, 12.0, 16.0, 16.0, 23.0, 28.0, 35.0, 25.0, 26.0, 53.0, 56.0, 55.0, 52.0, 42.0, 37.0, 47.0, 43.0, 40.0, 57.0, 36.0, 40.0, 24.0, 27.0, 28.0, 26.0, 22.0, 15.0, 17.0, 15.0, 11.0, 3.0, 7.0, 5.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.26850128173828125, -0.2608795166015625, -0.25325775146484375, -0.245635986328125, -0.23801422119140625, -0.2303924560546875, -0.22277069091796875, -0.21514892578125, -0.20752716064453125, -0.1999053955078125, -0.19228363037109375, -0.184661865234375, -0.17704010009765625, -0.1694183349609375, -0.16179656982421875, -0.1541748046875, -0.14655303955078125, -0.1389312744140625, -0.13130950927734375, -0.123687744140625, -0.11606597900390625, -0.1084442138671875, -0.10082244873046875, -0.09320068359375, -0.08557891845703125, -0.0779571533203125, -0.07033538818359375, -0.062713623046875, -0.05509185791015625, -0.0474700927734375, -0.03984832763671875, -0.0322265625, -0.02460479736328125, -0.0169830322265625, -0.00936126708984375, -0.001739501953125, 0.00588226318359375, 0.0135040283203125, 0.02112579345703125, 0.02874755859375, 0.03636932373046875, 0.0439910888671875, 0.05161285400390625, 0.059234619140625, 0.06685638427734375, 0.0744781494140625, 0.08209991455078125, 0.0897216796875, 0.09734344482421875, 0.1049652099609375, 0.11258697509765625, 0.120208740234375, 0.12783050537109375, 0.1354522705078125, 0.14307403564453125, 0.15069580078125, 0.15831756591796875, 0.1659393310546875, 0.17356109619140625, 0.181182861328125, 0.18880462646484375, 0.1964263916015625, 0.20404815673828125, 0.211669921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 11.0, 28.0, 27.0, 54.0, 56.0, 113.0, 168.0, 231.0, 400.0, 689.0, 1268.0, 2467.0, 5210.0, 12077.0, 32922.0, 112516.0, 426444.0, 328512.0, 81379.0, 25347.0, 9715.0, 4175.0, 2035.0, 1103.0, 582.0, 392.0, 225.0, 137.0, 92.0, 47.0, 31.0, 25.0, 20.0, 10.0, 5.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.6753921508789062, -0.6535186767578125, -0.6316452026367188, -0.609771728515625, -0.5878982543945312, -0.5660247802734375, -0.5441513061523438, -0.52227783203125, -0.5004043579101562, -0.4785308837890625, -0.45665740966796875, -0.434783935546875, -0.41291046142578125, -0.3910369873046875, -0.36916351318359375, -0.3472900390625, -0.32541656494140625, -0.3035430908203125, -0.28166961669921875, -0.259796142578125, -0.23792266845703125, -0.2160491943359375, -0.19417572021484375, -0.17230224609375, -0.15042877197265625, -0.1285552978515625, -0.10668182373046875, -0.084808349609375, -0.06293487548828125, -0.0410614013671875, -0.01918792724609375, 0.002685546875, 0.02455902099609375, 0.0464324951171875, 0.06830596923828125, 0.090179443359375, 0.11205291748046875, 0.1339263916015625, 0.15579986572265625, 0.17767333984375, 0.19954681396484375, 0.2214202880859375, 0.24329376220703125, 0.265167236328125, 0.28704071044921875, 0.3089141845703125, 0.33078765869140625, 0.3526611328125, 0.37453460693359375, 0.3964080810546875, 0.41828155517578125, 0.440155029296875, 0.46202850341796875, 0.4839019775390625, 0.5057754516601562, 0.52764892578125, 0.5495223999023438, 0.5713958740234375, 0.5932693481445312, 0.615142822265625, 0.6370162963867188, 0.6588897705078125, 0.6807632446289062, 0.70263671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 7.0, 15.0, 8.0, 10.0, 14.0, 19.0, 19.0, 34.0, 45.0, 47.0, 50.0, 52.0, 51.0, 56.0, 54.0, 60.0, 56.0, 60.0, 71.0, 47.0, 37.0, 43.0, 25.0, 26.0, 19.0, 18.0, 18.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4541015625, -1.409881591796875, -1.36566162109375, -1.321441650390625, -1.2772216796875, -1.233001708984375, -1.18878173828125, -1.144561767578125, -1.100341796875, -1.056121826171875, -1.01190185546875, -0.967681884765625, -0.9234619140625, -0.879241943359375, -0.83502197265625, -0.790802001953125, -0.74658203125, -0.702362060546875, -0.65814208984375, -0.613922119140625, -0.5697021484375, -0.525482177734375, -0.48126220703125, -0.437042236328125, -0.392822265625, -0.348602294921875, -0.30438232421875, -0.260162353515625, -0.2159423828125, -0.171722412109375, -0.12750244140625, -0.083282470703125, -0.0390625, 0.005157470703125, 0.04937744140625, 0.093597412109375, 0.1378173828125, 0.182037353515625, 0.22625732421875, 0.270477294921875, 0.314697265625, 0.358917236328125, 0.40313720703125, 0.447357177734375, 0.4915771484375, 0.535797119140625, 0.58001708984375, 0.624237060546875, 0.66845703125, 0.712677001953125, 0.75689697265625, 0.801116943359375, 0.8453369140625, 0.889556884765625, 0.93377685546875, 0.977996826171875, 1.022216796875, 1.066436767578125, 1.11065673828125, 1.154876708984375, 1.1990966796875, 1.243316650390625, 1.28753662109375, 1.331756591796875, 1.3759765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 10.0, 14.0, 20.0, 36.0, 58.0, 123.0, 224.0, 537.0, 1238.0, 3678.0, 17622.0, 189456.0, 722939.0, 96710.0, 11240.0, 2732.0, 1005.0, 442.0, 220.0, 101.0, 60.0, 32.0, 18.0, 14.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4705238342285156, -0.45886993408203125, -0.4472160339355469, -0.4355621337890625, -0.4239082336425781, -0.41225433349609375, -0.4006004333496094, -0.388946533203125, -0.3772926330566406, -0.36563873291015625, -0.3539848327636719, -0.3423309326171875, -0.3306770324707031, -0.31902313232421875, -0.3073692321777344, -0.29571533203125, -0.2840614318847656, -0.27240753173828125, -0.2607536315917969, -0.2490997314453125, -0.23744583129882812, -0.22579193115234375, -0.21413803100585938, -0.202484130859375, -0.19083023071289062, -0.17917633056640625, -0.16752243041992188, -0.1558685302734375, -0.14421463012695312, -0.13256072998046875, -0.12090682983398438, -0.1092529296875, -0.09759902954101562, -0.08594512939453125, -0.07429122924804688, -0.0626373291015625, -0.050983428955078125, -0.03932952880859375, -0.027675628662109375, -0.016021728515625, -0.004367828369140625, 0.00728607177734375, 0.018939971923828125, 0.0305938720703125, 0.042247772216796875, 0.05390167236328125, 0.06555557250976562, 0.07720947265625, 0.08886337280273438, 0.10051727294921875, 0.11217117309570312, 0.1238250732421875, 0.13547897338867188, 0.14713287353515625, 0.15878677368164062, 0.170440673828125, 0.18209457397460938, 0.19374847412109375, 0.20540237426757812, 0.2170562744140625, 0.22871017456054688, 0.24036407470703125, 0.2520179748535156, 0.263671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 6.0, 5.0, 12.0, 18.0, 15.0, 28.0, 58.0, 57.0, 83.0, 115.0, 109.0, 122.0, 93.0, 79.0, 53.0, 41.0, 33.0, 15.0, 15.0, 11.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.023313522338867e-05, -3.877934068441391e-05, -3.732554614543915e-05, -3.5871751606464386e-05, -3.4417957067489624e-05, -3.296416252851486e-05, -3.15103679895401e-05, -3.0056573450565338e-05, -2.8602778911590576e-05, -2.7148984372615814e-05, -2.5695189833641052e-05, -2.424139529466629e-05, -2.278760075569153e-05, -2.1333806216716766e-05, -1.9880011677742004e-05, -1.8426217138767242e-05, -1.697242259979248e-05, -1.551862806081772e-05, -1.4064833521842957e-05, -1.2611038982868195e-05, -1.1157244443893433e-05, -9.70344990491867e-06, -8.249655365943909e-06, -6.795860826969147e-06, -5.342066287994385e-06, -3.888271749019623e-06, -2.434477210044861e-06, -9.806826710700989e-07, 4.731118679046631e-07, 1.926906406879425e-06, 3.380700945854187e-06, 4.834495484828949e-06, 6.288290023803711e-06, 7.742084562778473e-06, 9.195879101753235e-06, 1.0649673640727997e-05, 1.2103468179702759e-05, 1.355726271867752e-05, 1.5011057257652283e-05, 1.6464851796627045e-05, 1.7918646335601807e-05, 1.937244087457657e-05, 2.082623541355133e-05, 2.2280029952526093e-05, 2.3733824491500854e-05, 2.5187619030475616e-05, 2.664141356945038e-05, 2.809520810842514e-05, 2.9549002647399902e-05, 3.1002797186374664e-05, 3.2456591725349426e-05, 3.391038626432419e-05, 3.536418080329895e-05, 3.681797534227371e-05, 3.8271769881248474e-05, 3.9725564420223236e-05, 4.1179358959198e-05, 4.263315349817276e-05, 4.408694803714752e-05, 4.5540742576122284e-05, 4.6994537115097046e-05, 4.844833165407181e-05, 4.990212619304657e-05, 5.135592073202133e-05, 5.2809715270996094e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 11.0, 23.0, 27.0, 46.0, 59.0, 99.0, 142.0, 283.0, 477.0, 943.0, 2229.0, 6490.0, 25430.0, 131253.0, 491219.0, 309384.0, 60746.0, 12963.0, 3784.0, 1384.0, 638.0, 363.0, 214.0, 126.0, 72.0, 44.0, 27.0, 19.0, 9.0, 8.0, 11.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2508888244628906, -0.24323272705078125, -0.23557662963867188, -0.2279205322265625, -0.22026443481445312, -0.21260833740234375, -0.20495223999023438, -0.197296142578125, -0.18964004516601562, -0.18198394775390625, -0.17432785034179688, -0.1666717529296875, -0.15901565551757812, -0.15135955810546875, -0.14370346069335938, -0.13604736328125, -0.12839126586914062, -0.12073516845703125, -0.11307907104492188, -0.1054229736328125, -0.09776687622070312, -0.09011077880859375, -0.08245468139648438, -0.074798583984375, -0.06714248657226562, -0.05948638916015625, -0.051830291748046875, -0.0441741943359375, -0.036518096923828125, -0.02886199951171875, -0.021205902099609375, -0.0135498046875, -0.005893707275390625, 0.00176239013671875, 0.009418487548828125, 0.0170745849609375, 0.024730682373046875, 0.03238677978515625, 0.040042877197265625, 0.047698974609375, 0.055355072021484375, 0.06301116943359375, 0.07066726684570312, 0.0783233642578125, 0.08597946166992188, 0.09363555908203125, 0.10129165649414062, 0.10894775390625, 0.11660385131835938, 0.12425994873046875, 0.13191604614257812, 0.1395721435546875, 0.14722824096679688, 0.15488433837890625, 0.16254043579101562, 0.170196533203125, 0.17785263061523438, 0.18550872802734375, 0.19316482543945312, 0.2008209228515625, 0.20847702026367188, 0.21613311767578125, 0.22378921508789062, 0.2314453125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 5.0, 13.0, 15.0, 23.0, 36.0, 58.0, 54.0, 84.0, 99.0, 93.0, 104.0, 98.0, 79.0, 69.0, 44.0, 37.0, 24.0, 16.0, 12.0, 11.0, 8.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.449951171875, -0.43747711181640625, -0.4250030517578125, -0.41252899169921875, -0.400054931640625, -0.38758087158203125, -0.3751068115234375, -0.36263275146484375, -0.35015869140625, -0.33768463134765625, -0.3252105712890625, -0.31273651123046875, -0.300262451171875, -0.28778839111328125, -0.2753143310546875, -0.26284027099609375, -0.2503662109375, -0.23789215087890625, -0.2254180908203125, -0.21294403076171875, -0.200469970703125, -0.18799591064453125, -0.1755218505859375, -0.16304779052734375, -0.15057373046875, -0.13809967041015625, -0.1256256103515625, -0.11315155029296875, -0.100677490234375, -0.08820343017578125, -0.0757293701171875, -0.06325531005859375, -0.05078125, -0.03830718994140625, -0.0258331298828125, -0.01335906982421875, -0.000885009765625, 0.01158905029296875, 0.0240631103515625, 0.03653717041015625, 0.04901123046875, 0.06148529052734375, 0.0739593505859375, 0.08643341064453125, 0.098907470703125, 0.11138153076171875, 0.1238555908203125, 0.13632965087890625, 0.1488037109375, 0.16127777099609375, 0.1737518310546875, 0.18622589111328125, 0.198699951171875, 0.21117401123046875, 0.2236480712890625, 0.23612213134765625, 0.24859619140625, 0.26107025146484375, 0.2735443115234375, 0.28601837158203125, 0.298492431640625, 0.31096649169921875, 0.3234405517578125, 0.33591461181640625, 0.348388671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 17.0, 29.0, 61.0, 134.0, 216.0, 278.0, 161.0, 50.0, 28.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.122644901275635, -6.786108493804932, -6.449572563171387, -6.113036155700684, -5.776500225067139, -5.4399638175964355, -5.103427886962891, -4.7668914794921875, -4.430355072021484, -4.093818664550781, -3.7572827339172363, -3.420746326446533, -3.0842103958129883, -2.747673988342285, -2.411137819290161, -2.074601650238037, -1.7380657196044922, -1.4015295505523682, -1.0649933815002441, -0.7284570932388306, -0.39192092418670654, -0.05538475513458252, 0.28115153312683105, 0.6176877021789551, 0.9542238712310791, 1.2907600402832031, 1.6272962093353271, 1.9638324975967407, 2.3003687858581543, 2.636904716491699, 2.9734411239624023, 3.3099772930145264, 3.646512985229492, 3.983049154281616, 4.31958532333374, 4.656121730804443, 4.992657661437988, 5.329194068908691, 5.6657304763793945, 6.0022664070129395, 6.338802337646484, 6.6753387451171875, 7.011874675750732, 7.3484110832214355, 7.6849470138549805, 8.021483421325684, 8.358019828796387, 8.694555282592773, 9.031091690063477, 9.36762809753418, 9.704164505004883, 10.04069995880127, 10.377236366271973, 10.713772773742676, 11.050309181213379, 11.386844635009766, 11.723381996154785, 12.059918403625488, 12.396454811096191, 12.732990264892578, 13.069526672363281, 13.406063079833984, 13.742599487304688, 14.07913589477539, 14.415671348571777]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 14.0, 5.0, 8.0, 17.0, 29.0, 13.0, 23.0, 22.0, 17.0, 25.0, 29.0, 39.0, 22.0, 41.0, 39.0, 51.0, 38.0, 39.0, 34.0, 49.0, 31.0, 34.0, 44.0, 37.0, 31.0, 35.0, 25.0, 12.0, 23.0, 23.0, 10.0, 19.0, 18.0, 14.0, 8.0, 10.0, 7.0, 11.0, 8.0, 1.0, 8.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0], "bins": [-5.70883321762085, -5.541421413421631, -5.374009132385254, -5.206597328186035, -5.039185047149658, -4.8717732429504395, -4.7043609619140625, -4.536949157714844, -4.369537353515625, -4.202125549316406, -4.034713268280029, -3.8673014640808105, -3.6998894214630127, -3.532477378845215, -3.365065336227417, -3.197653293609619, -3.0302412509918213, -2.8628292083740234, -2.6954171657562256, -2.5280051231384277, -2.360593318939209, -2.193181276321411, -2.0257692337036133, -1.858357310295105, -1.6909452676773071, -1.5235332250595093, -1.356121301651001, -1.1887092590332031, -1.0212972164154053, -0.853885293006897, -0.6864732503890991, -0.5190613269805908, -0.35164928436279297, -0.1842372864484787, -0.01682528853416443, 0.15058672428131104, 0.3179987072944641, 0.4854106903076172, 0.652822732925415, 0.8202346563339233, 0.9876466989517212, 1.155058741569519, 1.3224706649780273, 1.4898827075958252, 1.657294750213623, 1.8247066736221313, 1.9921187162399292, 2.1595306396484375, 2.3269426822662354, 2.494354724884033, 2.661766767501831, 2.829178810119629, 2.9965906143188477, 3.1640026569366455, 3.3314146995544434, 3.498826503753662, 3.666238784790039, 3.833650827407837, 4.001062870025635, 4.1684746742248535, 4.3358869552612305, 4.503298759460449, 4.670710563659668, 4.838122844696045, 5.005534648895264]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 3.0, 7.0, 6.0, 8.0, 7.0, 12.0, 28.0, 44.0, 31.0, 58.0, 82.0, 105.0, 132.0, 215.0, 317.0, 431.0, 599.0, 985.0, 1446.0, 2431.0, 4020.0, 7956.0, 18302.0, 68608.0, 3794607.0, 236065.0, 31690.0, 11480.0, 5830.0, 3123.0, 1941.0, 1229.0, 804.0, 536.0, 351.0, 238.0, 178.0, 109.0, 85.0, 63.0, 30.0, 30.0, 21.0, 14.0, 7.0, 5.0, 9.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8818359375, -0.8557052612304688, -0.8295745849609375, -0.8034439086914062, -0.777313232421875, -0.7511825561523438, -0.7250518798828125, -0.6989212036132812, -0.67279052734375, -0.6466598510742188, -0.6205291748046875, -0.5943984985351562, -0.568267822265625, -0.5421371459960938, -0.5160064697265625, -0.48987579345703125, -0.4637451171875, -0.43761444091796875, -0.4114837646484375, -0.38535308837890625, -0.359222412109375, -0.33309173583984375, -0.3069610595703125, -0.28083038330078125, -0.25469970703125, -0.22856903076171875, -0.2024383544921875, -0.17630767822265625, -0.150177001953125, -0.12404632568359375, -0.0979156494140625, -0.07178497314453125, -0.045654296875, -0.01952362060546875, 0.0066070556640625, 0.03273773193359375, 0.058868408203125, 0.08499908447265625, 0.1111297607421875, 0.13726043701171875, 0.16339111328125, 0.18952178955078125, 0.2156524658203125, 0.24178314208984375, 0.267913818359375, 0.29404449462890625, 0.3201751708984375, 0.34630584716796875, 0.3724365234375, 0.39856719970703125, 0.4246978759765625, 0.45082855224609375, 0.476959228515625, 0.5030899047851562, 0.5292205810546875, 0.5553512573242188, 0.58148193359375, 0.6076126098632812, 0.6337432861328125, 0.6598739624023438, 0.686004638671875, 0.7121353149414062, 0.7382659912109375, 0.7643966674804688, 0.79052734375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 4.0, 8.0, 13.0, 9.0, 16.0, 23.0, 23.0, 29.0, 24.0, 37.0, 39.0, 38.0, 35.0, 52.0, 48.0, 52.0, 54.0, 47.0, 38.0, 41.0, 50.0, 38.0, 36.0, 29.0, 32.0, 35.0, 25.0, 26.0, 11.0, 12.0, 14.0, 20.0, 8.0, 7.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3349609375, -0.32505035400390625, -0.3151397705078125, -0.30522918701171875, -0.295318603515625, -0.28540802001953125, -0.2754974365234375, -0.26558685302734375, -0.25567626953125, -0.24576568603515625, -0.2358551025390625, -0.22594451904296875, -0.216033935546875, -0.20612335205078125, -0.1962127685546875, -0.18630218505859375, -0.1763916015625, -0.16648101806640625, -0.1565704345703125, -0.14665985107421875, -0.136749267578125, -0.12683868408203125, -0.1169281005859375, -0.10701751708984375, -0.09710693359375, -0.08719635009765625, -0.0772857666015625, -0.06737518310546875, -0.057464599609375, -0.04755401611328125, -0.0376434326171875, -0.02773284912109375, -0.017822265625, -0.00791168212890625, 0.0019989013671875, 0.01190948486328125, 0.021820068359375, 0.03173065185546875, 0.0416412353515625, 0.05155181884765625, 0.06146240234375, 0.07137298583984375, 0.0812835693359375, 0.09119415283203125, 0.101104736328125, 0.11101531982421875, 0.1209259033203125, 0.13083648681640625, 0.1407470703125, 0.15065765380859375, 0.1605682373046875, 0.17047882080078125, 0.180389404296875, 0.19029998779296875, 0.2002105712890625, 0.21012115478515625, 0.22003173828125, 0.22994232177734375, 0.2398529052734375, 0.24976348876953125, 0.259674072265625, 0.26958465576171875, 0.2794952392578125, 0.28940582275390625, 0.29931640625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 8.0, 12.0, 23.0, 20.0, 23.0, 39.0, 43.0, 79.0, 95.0, 156.0, 252.0, 436.0, 944.0, 2410.0, 7841.0, 34619.0, 821932.0, 3270736.0, 40730.0, 8878.0, 2709.0, 1062.0, 477.0, 233.0, 138.0, 109.0, 59.0, 46.0, 35.0, 35.0, 16.0, 22.0, 17.0, 11.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.359375, -1.320587158203125, -1.28179931640625, -1.243011474609375, -1.2042236328125, -1.165435791015625, -1.12664794921875, -1.087860107421875, -1.049072265625, -1.010284423828125, -0.97149658203125, -0.932708740234375, -0.8939208984375, -0.855133056640625, -0.81634521484375, -0.777557373046875, -0.73876953125, -0.699981689453125, -0.66119384765625, -0.622406005859375, -0.5836181640625, -0.544830322265625, -0.50604248046875, -0.467254638671875, -0.428466796875, -0.389678955078125, -0.35089111328125, -0.312103271484375, -0.2733154296875, -0.234527587890625, -0.19573974609375, -0.156951904296875, -0.1181640625, -0.079376220703125, -0.04058837890625, -0.001800537109375, 0.0369873046875, 0.075775146484375, 0.11456298828125, 0.153350830078125, 0.192138671875, 0.230926513671875, 0.26971435546875, 0.308502197265625, 0.3472900390625, 0.386077880859375, 0.42486572265625, 0.463653564453125, 0.50244140625, 0.541229248046875, 0.58001708984375, 0.618804931640625, 0.6575927734375, 0.696380615234375, 0.73516845703125, 0.773956298828125, 0.812744140625, 0.851531982421875, 0.89031982421875, 0.929107666015625, 0.9678955078125, 1.006683349609375, 1.04547119140625, 1.084259033203125, 1.123046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 13.0, 20.0, 29.0, 44.0, 108.0, 681.0, 2889.0, 135.0, 60.0, 37.0, 23.0, 8.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2293243408203125, -1.197906494140625, -1.1664886474609375, -1.13507080078125, -1.1036529541015625, -1.072235107421875, -1.0408172607421875, -1.0093994140625, -0.9779815673828125, -0.946563720703125, -0.9151458740234375, -0.88372802734375, -0.8523101806640625, -0.820892333984375, -0.7894744873046875, -0.758056640625, -0.7266387939453125, -0.695220947265625, -0.6638031005859375, -0.63238525390625, -0.6009674072265625, -0.569549560546875, -0.5381317138671875, -0.5067138671875, -0.4752960205078125, -0.443878173828125, -0.4124603271484375, -0.38104248046875, -0.3496246337890625, -0.318206787109375, -0.2867889404296875, -0.25537109375, -0.2239532470703125, -0.192535400390625, -0.1611175537109375, -0.12969970703125, -0.0982818603515625, -0.066864013671875, -0.0354461669921875, -0.0040283203125, 0.0273895263671875, 0.058807373046875, 0.0902252197265625, 0.12164306640625, 0.1530609130859375, 0.184478759765625, 0.2158966064453125, 0.247314453125, 0.2787322998046875, 0.310150146484375, 0.3415679931640625, 0.37298583984375, 0.4044036865234375, 0.435821533203125, 0.4672393798828125, 0.4986572265625, 0.5300750732421875, 0.561492919921875, 0.5929107666015625, 0.62432861328125, 0.6557464599609375, 0.687164306640625, 0.7185821533203125, 0.75]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 23.0, 48.0, 131.0, 276.0, 283.0, 148.0, 50.0, 15.0, 11.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9765621423721313, -1.8348950147628784, -1.693228006362915, -1.551560878753662, -1.4098937511444092, -1.2682267427444458, -1.1265596151351929, -0.9848925471305847, -0.8432254791259766, -0.7015584111213684, -0.5598913431167603, -0.4182242155075073, -0.27655714750289917, -0.13489007949829102, 0.006777048110961914, 0.14844411611557007, 0.2901111841201782, 0.4317782521247864, 0.5734453201293945, 0.7151124477386475, 0.8567795157432556, 0.9984465837478638, 1.1401137113571167, 1.28178071975708, 1.423447847366333, 1.565114974975586, 1.7067819833755493, 1.8484491109848022, 1.9901161193847656, 2.1317832469940186, 2.2734503746032715, 2.4151175022125244, 2.5567846298217773, 2.6984517574310303, 2.840118885040283, 2.981785774230957, 3.12345290184021, 3.265120029449463, 3.406787157058716, 3.5484542846679688, 3.6901211738586426, 3.8317883014678955, 3.9734554290771484, 4.115122318267822, 4.256789684295654, 4.398456573486328, 4.54012393951416, 4.681790828704834, 4.823457717895508, 4.965124607086182, 5.106791973114014, 5.2484588623046875, 5.3901262283325195, 5.531793117523193, 5.673460006713867, 5.815127372741699, 5.956794738769531, 6.098461627960205, 6.240128993988037, 6.381795883178711, 6.523463249206543, 6.665130138397217, 6.806797027587891, 6.948464393615723, 7.0901312828063965]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 11.0, 14.0, 16.0, 17.0, 23.0, 14.0, 25.0, 29.0, 39.0, 46.0, 49.0, 40.0, 53.0, 48.0, 40.0, 51.0, 47.0, 60.0, 46.0, 49.0, 41.0, 37.0, 41.0, 22.0, 16.0, 20.0, 18.0, 17.0, 12.0, 7.0, 6.0, 13.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4657471179962158, -1.4160938262939453, -1.3664405345916748, -1.3167871236801147, -1.2671338319778442, -1.2174805402755737, -1.1678271293640137, -1.1181738376617432, -1.0685205459594727, -1.0188672542572021, -0.9692139029502869, -0.9195605516433716, -0.8699072599411011, -0.8202539682388306, -0.7706006169319153, -0.720947265625, -0.6712939739227295, -0.621640682220459, -0.5719873309135437, -0.5223339796066284, -0.4726806879043579, -0.423027366399765, -0.3733740448951721, -0.3237207233905792, -0.27406740188598633, -0.22441408038139343, -0.17476075887680054, -0.12510743737220764, -0.07545411586761475, -0.02580079436302185, 0.023852527141571045, 0.07350584864616394, 0.12315917015075684, 0.17281249165534973, 0.22246581315994263, 0.2721191346645355, 0.3217724561691284, 0.3714257776737213, 0.4210790991783142, 0.4707324206829071, 0.5203857421875, 0.5700390338897705, 0.6196923851966858, 0.6693457365036011, 0.7189990282058716, 0.7686523199081421, 0.8183056712150574, 0.8679590225219727, 0.9176123142242432, 0.9672656059265137, 1.0169188976287842, 1.0665723085403442, 1.1162256002426147, 1.1658788919448853, 1.2155323028564453, 1.2651855945587158, 1.3148388862609863, 1.3644921779632568, 1.4141454696655273, 1.4637988805770874, 1.513452172279358, 1.5631054639816284, 1.6127588748931885, 1.662412166595459, 1.7120654582977295]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 5.0, 11.0, 9.0, 12.0, 20.0, 30.0, 36.0, 47.0, 66.0, 72.0, 120.0, 187.0, 307.0, 477.0, 855.0, 1560.0, 3109.0, 6440.0, 13781.0, 32801.0, 91299.0, 312042.0, 392365.0, 119401.0, 41268.0, 16610.0, 7623.0, 3635.0, 1806.0, 982.0, 547.0, 325.0, 206.0, 147.0, 93.0, 64.0, 46.0, 35.0, 32.0, 16.0, 18.0, 14.0, 8.0, 8.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.9971389770507812, -0.9679107666015625, -0.9386825561523438, -0.909454345703125, -0.8802261352539062, -0.8509979248046875, -0.8217697143554688, -0.79254150390625, -0.7633132934570312, -0.7340850830078125, -0.7048568725585938, -0.675628662109375, -0.6464004516601562, -0.6171722412109375, -0.5879440307617188, -0.5587158203125, -0.5294876098632812, -0.5002593994140625, -0.47103118896484375, -0.441802978515625, -0.41257476806640625, -0.3833465576171875, -0.35411834716796875, -0.32489013671875, -0.29566192626953125, -0.2664337158203125, -0.23720550537109375, -0.207977294921875, -0.17874908447265625, -0.1495208740234375, -0.12029266357421875, -0.091064453125, -0.06183624267578125, -0.0326080322265625, -0.00337982177734375, 0.025848388671875, 0.05507659912109375, 0.0843048095703125, 0.11353302001953125, 0.14276123046875, 0.17198944091796875, 0.2012176513671875, 0.23044586181640625, 0.259674072265625, 0.28890228271484375, 0.3181304931640625, 0.34735870361328125, 0.3765869140625, 0.40581512451171875, 0.4350433349609375, 0.46427154541015625, 0.493499755859375, 0.5227279663085938, 0.5519561767578125, 0.5811843872070312, 0.61041259765625, 0.6396408081054688, 0.6688690185546875, 0.6980972290039062, 0.727325439453125, 0.7565536499023438, 0.7857818603515625, 0.8150100708007812, 0.84423828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 6.0, 8.0, 6.0, 5.0, 13.0, 15.0, 18.0, 18.0, 25.0, 19.0, 35.0, 27.0, 34.0, 44.0, 41.0, 49.0, 45.0, 45.0, 51.0, 48.0, 54.0, 49.0, 32.0, 47.0, 38.0, 37.0, 38.0, 27.0, 29.0, 20.0, 12.0, 12.0, 8.0, 17.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3818359375, -0.37113189697265625, -0.3604278564453125, -0.34972381591796875, -0.339019775390625, -0.32831573486328125, -0.3176116943359375, -0.30690765380859375, -0.29620361328125, -0.28549957275390625, -0.2747955322265625, -0.26409149169921875, -0.253387451171875, -0.24268341064453125, -0.2319793701171875, -0.22127532958984375, -0.2105712890625, -0.19986724853515625, -0.1891632080078125, -0.17845916748046875, -0.167755126953125, -0.15705108642578125, -0.1463470458984375, -0.13564300537109375, -0.12493896484375, -0.11423492431640625, -0.1035308837890625, -0.09282684326171875, -0.082122802734375, -0.07141876220703125, -0.0607147216796875, -0.05001068115234375, -0.039306640625, -0.02860260009765625, -0.0178985595703125, -0.00719451904296875, 0.003509521484375, 0.01421356201171875, 0.0249176025390625, 0.03562164306640625, 0.04632568359375, 0.05702972412109375, 0.0677337646484375, 0.07843780517578125, 0.089141845703125, 0.09984588623046875, 0.1105499267578125, 0.12125396728515625, 0.1319580078125, 0.14266204833984375, 0.1533660888671875, 0.16407012939453125, 0.174774169921875, 0.18547821044921875, 0.1961822509765625, 0.20688629150390625, 0.21759033203125, 0.22829437255859375, 0.2389984130859375, 0.24970245361328125, 0.260406494140625, 0.27111053466796875, 0.2818145751953125, 0.29251861572265625, 0.30322265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 16.0, 21.0, 28.0, 32.0, 82.0, 166.0, 295.0, 630.0, 1471.0, 3809.0, 11562.0, 43396.0, 300229.0, 585061.0, 75343.0, 17160.0, 5560.0, 1979.0, 867.0, 390.0, 196.0, 93.0, 56.0, 30.0, 24.0, 13.0, 15.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.73828125, -1.6915130615234375, -1.644744873046875, -1.5979766845703125, -1.55120849609375, -1.5044403076171875, -1.457672119140625, -1.4109039306640625, -1.3641357421875, -1.3173675537109375, -1.270599365234375, -1.2238311767578125, -1.17706298828125, -1.1302947998046875, -1.083526611328125, -1.0367584228515625, -0.989990234375, -0.9432220458984375, -0.896453857421875, -0.8496856689453125, -0.80291748046875, -0.7561492919921875, -0.709381103515625, -0.6626129150390625, -0.6158447265625, -0.5690765380859375, -0.522308349609375, -0.4755401611328125, -0.42877197265625, -0.3820037841796875, -0.335235595703125, -0.2884674072265625, -0.24169921875, -0.1949310302734375, -0.148162841796875, -0.1013946533203125, -0.05462646484375, -0.0078582763671875, 0.038909912109375, 0.0856781005859375, 0.1324462890625, 0.1792144775390625, 0.225982666015625, 0.2727508544921875, 0.31951904296875, 0.3662872314453125, 0.413055419921875, 0.4598236083984375, 0.506591796875, 0.5533599853515625, 0.600128173828125, 0.6468963623046875, 0.69366455078125, 0.7404327392578125, 0.787200927734375, 0.8339691162109375, 0.8807373046875, 0.9275054931640625, 0.974273681640625, 1.0210418701171875, 1.06781005859375, 1.1145782470703125, 1.161346435546875, 1.2081146240234375, 1.2548828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 8.0, 6.0, 10.0, 18.0, 17.0, 29.0, 30.0, 30.0, 27.0, 32.0, 40.0, 50.0, 55.0, 46.0, 53.0, 55.0, 68.0, 55.0, 45.0, 55.0, 42.0, 39.0, 29.0, 27.0, 30.0, 21.0, 17.0, 16.0, 16.0, 9.0, 3.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.86328125, -1.802642822265625, -1.74200439453125, -1.681365966796875, -1.6207275390625, -1.560089111328125, -1.49945068359375, -1.438812255859375, -1.378173828125, -1.317535400390625, -1.25689697265625, -1.196258544921875, -1.1356201171875, -1.074981689453125, -1.01434326171875, -0.953704833984375, -0.89306640625, -0.832427978515625, -0.77178955078125, -0.711151123046875, -0.6505126953125, -0.589874267578125, -0.52923583984375, -0.468597412109375, -0.407958984375, -0.347320556640625, -0.28668212890625, -0.226043701171875, -0.1654052734375, -0.104766845703125, -0.04412841796875, 0.016510009765625, 0.0771484375, 0.137786865234375, 0.19842529296875, 0.259063720703125, 0.3197021484375, 0.380340576171875, 0.44097900390625, 0.501617431640625, 0.562255859375, 0.622894287109375, 0.68353271484375, 0.744171142578125, 0.8048095703125, 0.865447998046875, 0.92608642578125, 0.986724853515625, 1.04736328125, 1.108001708984375, 1.16864013671875, 1.229278564453125, 1.2899169921875, 1.350555419921875, 1.41119384765625, 1.471832275390625, 1.532470703125, 1.593109130859375, 1.65374755859375, 1.714385986328125, 1.7750244140625, 1.835662841796875, 1.89630126953125, 1.956939697265625, 2.017578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 14.0, 23.0, 26.0, 32.0, 46.0, 72.0, 124.0, 172.0, 256.0, 546.0, 926.0, 1984.0, 5488.0, 29126.0, 722163.0, 264476.0, 15608.0, 3946.0, 1615.0, 764.0, 393.0, 264.0, 161.0, 96.0, 59.0, 51.0, 30.0, 18.0, 15.0, 12.0, 9.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9462890625, -0.9191360473632812, -0.8919830322265625, -0.8648300170898438, -0.837677001953125, -0.8105239868164062, -0.7833709716796875, -0.7562179565429688, -0.72906494140625, -0.7019119262695312, -0.6747589111328125, -0.6476058959960938, -0.620452880859375, -0.5932998657226562, -0.5661468505859375, -0.5389938354492188, -0.5118408203125, -0.48468780517578125, -0.4575347900390625, -0.43038177490234375, -0.403228759765625, -0.37607574462890625, -0.3489227294921875, -0.32176971435546875, -0.29461669921875, -0.26746368408203125, -0.2403106689453125, -0.21315765380859375, -0.186004638671875, -0.15885162353515625, -0.1316986083984375, -0.10454559326171875, -0.077392578125, -0.05023956298828125, -0.0230865478515625, 0.00406646728515625, 0.031219482421875, 0.05837249755859375, 0.0855255126953125, 0.11267852783203125, 0.13983154296875, 0.16698455810546875, 0.1941375732421875, 0.22129058837890625, 0.248443603515625, 0.27559661865234375, 0.3027496337890625, 0.32990264892578125, 0.3570556640625, 0.38420867919921875, 0.4113616943359375, 0.43851470947265625, 0.465667724609375, 0.49282073974609375, 0.5199737548828125, 0.5471267700195312, 0.57427978515625, 0.6014328002929688, 0.6285858154296875, 0.6557388305664062, 0.682891845703125, 0.7100448608398438, 0.7371978759765625, 0.7643508911132812, 0.79150390625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 9.0, 9.0, 13.0, 24.0, 58.0, 124.0, 259.0, 247.0, 143.0, 58.0, 28.0, 15.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.249243885278702e-05, -8.765049278736115e-05, -8.280854672193527e-05, -7.79666006565094e-05, -7.312465459108353e-05, -6.828270852565765e-05, -6.344076246023178e-05, -5.859881639480591e-05, -5.3756870329380035e-05, -4.891492426395416e-05, -4.407297819852829e-05, -3.923103213310242e-05, -3.4389086067676544e-05, -2.954714000225067e-05, -2.47051939368248e-05, -1.9863247871398926e-05, -1.5021301805973053e-05, -1.017935574054718e-05, -5.337409675121307e-06, -4.954636096954346e-07, 4.346482455730438e-06, 9.188428521156311e-06, 1.4030374586582184e-05, 1.8872320652008057e-05, 2.371426671743393e-05, 2.8556212782859802e-05, 3.3398158848285675e-05, 3.824010491371155e-05, 4.308205097913742e-05, 4.7923997044563293e-05, 5.2765943109989166e-05, 5.760788917541504e-05, 6.244983524084091e-05, 6.729178130626678e-05, 7.213372737169266e-05, 7.697567343711853e-05, 8.18176195025444e-05, 8.665956556797028e-05, 9.150151163339615e-05, 9.634345769882202e-05, 0.0001011854037642479, 0.00010602734982967377, 0.00011086929589509964, 0.00011571124196052551, 0.00012055318802595139, 0.00012539513409137726, 0.00013023708015680313, 0.000135079026222229, 0.00013992097228765488, 0.00014476291835308075, 0.00014960486441850662, 0.0001544468104839325, 0.00015928875654935837, 0.00016413070261478424, 0.0001689726486802101, 0.00017381459474563599, 0.00017865654081106186, 0.00018349848687648773, 0.0001883404329419136, 0.00019318237900733948, 0.00019802432507276535, 0.00020286627113819122, 0.0002077082172036171, 0.00021255016326904297]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 16.0, 21.0, 22.0, 31.0, 51.0, 77.0, 132.0, 209.0, 415.0, 727.0, 1610.0, 4331.0, 26443.0, 823529.0, 176325.0, 9458.0, 2589.0, 1141.0, 599.0, 329.0, 181.0, 113.0, 61.0, 50.0, 25.0, 18.0, 14.0, 14.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.884765625, -0.85504150390625, -0.8253173828125, -0.79559326171875, -0.765869140625, -0.73614501953125, -0.7064208984375, -0.67669677734375, -0.64697265625, -0.61724853515625, -0.5875244140625, -0.55780029296875, -0.528076171875, -0.49835205078125, -0.4686279296875, -0.43890380859375, -0.4091796875, -0.37945556640625, -0.3497314453125, -0.32000732421875, -0.290283203125, -0.26055908203125, -0.2308349609375, -0.20111083984375, -0.17138671875, -0.14166259765625, -0.1119384765625, -0.08221435546875, -0.052490234375, -0.02276611328125, 0.0069580078125, 0.03668212890625, 0.06640625, 0.09613037109375, 0.1258544921875, 0.15557861328125, 0.185302734375, 0.21502685546875, 0.2447509765625, 0.27447509765625, 0.30419921875, 0.33392333984375, 0.3636474609375, 0.39337158203125, 0.423095703125, 0.45281982421875, 0.4825439453125, 0.51226806640625, 0.5419921875, 0.57171630859375, 0.6014404296875, 0.63116455078125, 0.660888671875, 0.69061279296875, 0.7203369140625, 0.75006103515625, 0.77978515625, 0.80950927734375, 0.8392333984375, 0.86895751953125, 0.898681640625, 0.92840576171875, 0.9581298828125, 0.98785400390625, 1.017578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 8.0, 13.0, 15.0, 32.0, 94.0, 213.0, 281.0, 176.0, 88.0, 34.0, 15.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.8074569702148438, -0.7609100341796875, -0.7143630981445312, -0.667816162109375, -0.6212692260742188, -0.5747222900390625, -0.5281753540039062, -0.48162841796875, -0.43508148193359375, -0.3885345458984375, -0.34198760986328125, -0.295440673828125, -0.24889373779296875, -0.2023468017578125, -0.15579986572265625, -0.1092529296875, -0.06270599365234375, -0.0161590576171875, 0.03038787841796875, 0.076934814453125, 0.12348175048828125, 0.1700286865234375, 0.21657562255859375, 0.26312255859375, 0.30966949462890625, 0.3562164306640625, 0.40276336669921875, 0.449310302734375, 0.49585723876953125, 0.5424041748046875, 0.5889511108398438, 0.635498046875, 0.6820449829101562, 0.7285919189453125, 0.7751388549804688, 0.821685791015625, 0.8682327270507812, 0.9147796630859375, 0.9613265991210938, 1.00787353515625, 1.0544204711914062, 1.1009674072265625, 1.1475143432617188, 1.194061279296875, 1.2406082153320312, 1.2871551513671875, 1.3337020874023438, 1.3802490234375, 1.4267959594726562, 1.4733428955078125, 1.5198898315429688, 1.566436767578125, 1.6129837036132812, 1.6595306396484375, 1.7060775756835938, 1.75262451171875, 1.7991714477539062, 1.8457183837890625, 1.8922653198242188, 1.938812255859375, 1.9853591918945312, 2.0319061279296875, 2.0784530639648438, 2.125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 19.0, 45.0, 88.0, 215.0, 259.0, 172.0, 112.0, 47.0, 10.0, 13.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.22579574584961, -17.72553062438965, -17.225263595581055, -16.724998474121094, -16.224733352661133, -15.724466323852539, -15.224201202392578, -14.7239351272583, -14.223669052124023, -13.723402976989746, -13.223137855529785, -12.722871780395508, -12.22260570526123, -11.722339630126953, -11.222074508666992, -10.721808433532715, -10.221543312072754, -9.721277236938477, -9.221012115478516, -8.720746040344238, -8.220479965209961, -7.720214366912842, -7.219948768615723, -6.719682693481445, -6.219417095184326, -5.719151496887207, -5.21888542175293, -4.7186198234558105, -4.218354225158691, -3.718088150024414, -3.217822551727295, -2.7175567150115967, -2.2172908782958984, -1.7170250415802002, -1.2167593240737915, -0.7164936065673828, -0.21622776985168457, 0.28403806686401367, 0.7843036651611328, 1.284569501876831, 1.7848353385925293, 2.2851011753082275, 2.785367012023926, 3.285632610321045, 3.785898447036743, 4.286164283752441, 4.7864298820495605, 5.28669548034668, 5.786961555480957, 6.287227153778076, 6.7874932289123535, 7.287758827209473, 7.78802490234375, 8.288290023803711, 8.788556098937988, 9.288822174072266, 9.789087295532227, 10.289353370666504, 10.789618492126465, 11.289884567260742, 11.79015064239502, 12.290416717529297, 12.790681838989258, 13.290947914123535, 13.791213989257812]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 10.0, 10.0, 10.0, 14.0, 10.0, 11.0, 18.0, 20.0, 28.0, 29.0, 36.0, 28.0, 37.0, 55.0, 51.0, 51.0, 40.0, 33.0, 51.0, 38.0, 37.0, 44.0, 47.0, 38.0, 30.0, 26.0, 29.0, 34.0, 16.0, 26.0, 20.0, 16.0, 17.0, 6.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0], "bins": [-10.728023529052734, -10.451824188232422, -10.17562484741211, -9.899425506591797, -9.6232271194458, -9.347027778625488, -9.070828437805176, -8.794629096984863, -8.51842975616455, -8.242230415344238, -7.966031551361084, -7.6898322105407715, -7.413632869720459, -7.137434005737305, -6.861234664916992, -6.58503532409668, -6.308836460113525, -6.032637119293213, -5.756438255310059, -5.480238914489746, -5.204039573669434, -4.927840232849121, -4.651641368865967, -4.375442028045654, -4.0992431640625, -3.8230440616607666, -3.546844720840454, -3.2706456184387207, -2.994446277618408, -2.718247175216675, -2.4420480728149414, -2.165848731994629, -1.8896493911743164, -1.6134501695632935, -1.3372509479522705, -1.061051845550537, -0.7848526239395142, -0.5086534023284912, -0.2324542999267578, 0.04374492168426514, 0.3199441432952881, 0.596143364906311, 0.8723425269126892, 1.1485416889190674, 1.4247409105300903, 1.7009401321411133, 1.9771392345428467, 2.25333833694458, 2.5295376777648926, 2.805736780166626, 3.0819361209869385, 3.358135223388672, 3.6343345642089844, 3.9105336666107178, 4.186732769012451, 4.462932109832764, 4.739130973815918, 5.0153303146362305, 5.291529178619385, 5.567728519439697, 5.84392786026001, 6.120126724243164, 6.396326065063477, 6.672525405883789, 6.948724746704102]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 3.0, 5.0, 7.0, 7.0, 12.0, 14.0, 12.0, 20.0, 22.0, 36.0, 42.0, 48.0, 54.0, 83.0, 97.0, 137.0, 141.0, 195.0, 297.0, 425.0, 669.0, 1185.0, 2582.0, 14315.0, 4146562.0, 20518.0, 3103.0, 1244.0, 710.0, 431.0, 345.0, 239.0, 161.0, 102.0, 106.0, 83.0, 72.0, 41.0, 34.0, 27.0, 21.0, 25.0, 7.0, 10.0, 13.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.52734375, -2.4542236328125, -2.381103515625, -2.3079833984375, -2.23486328125, -2.1617431640625, -2.088623046875, -2.0155029296875, -1.9423828125, -1.8692626953125, -1.796142578125, -1.7230224609375, -1.64990234375, -1.5767822265625, -1.503662109375, -1.4305419921875, -1.357421875, -1.2843017578125, -1.211181640625, -1.1380615234375, -1.06494140625, -0.9918212890625, -0.918701171875, -0.8455810546875, -0.7724609375, -0.6993408203125, -0.626220703125, -0.5531005859375, -0.47998046875, -0.4068603515625, -0.333740234375, -0.2606201171875, -0.1875, -0.1143798828125, -0.041259765625, 0.0318603515625, 0.10498046875, 0.1781005859375, 0.251220703125, 0.3243408203125, 0.3974609375, 0.4705810546875, 0.543701171875, 0.6168212890625, 0.68994140625, 0.7630615234375, 0.836181640625, 0.9093017578125, 0.982421875, 1.0555419921875, 1.128662109375, 1.2017822265625, 1.27490234375, 1.3480224609375, 1.421142578125, 1.4942626953125, 1.5673828125, 1.6405029296875, 1.713623046875, 1.7867431640625, 1.85986328125, 1.9329833984375, 2.006103515625, 2.0792236328125, 2.15234375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 13.0, 13.0, 14.0, 15.0, 20.0, 14.0, 23.0, 21.0, 33.0, 36.0, 27.0, 38.0, 42.0, 45.0, 44.0, 51.0, 39.0, 41.0, 42.0, 53.0, 23.0, 44.0, 24.0, 33.0, 32.0, 30.0, 21.0, 29.0, 18.0, 20.0, 16.0, 9.0, 9.0, 10.0, 7.0, 5.0, 6.0, 3.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.431640625, -0.4192352294921875, -0.406829833984375, -0.3944244384765625, -0.38201904296875, -0.3696136474609375, -0.357208251953125, -0.3448028564453125, -0.3323974609375, -0.3199920654296875, -0.307586669921875, -0.2951812744140625, -0.28277587890625, -0.2703704833984375, -0.257965087890625, -0.2455596923828125, -0.233154296875, -0.2207489013671875, -0.208343505859375, -0.1959381103515625, -0.18353271484375, -0.1711273193359375, -0.158721923828125, -0.1463165283203125, -0.1339111328125, -0.1215057373046875, -0.109100341796875, -0.0966949462890625, -0.08428955078125, -0.0718841552734375, -0.059478759765625, -0.0470733642578125, -0.03466796875, -0.0222625732421875, -0.009857177734375, 0.0025482177734375, 0.01495361328125, 0.0273590087890625, 0.039764404296875, 0.0521697998046875, 0.0645751953125, 0.0769805908203125, 0.089385986328125, 0.1017913818359375, 0.11419677734375, 0.1266021728515625, 0.139007568359375, 0.1514129638671875, 0.163818359375, 0.1762237548828125, 0.188629150390625, 0.2010345458984375, 0.21343994140625, 0.2258453369140625, 0.238250732421875, 0.2506561279296875, 0.2630615234375, 0.2754669189453125, 0.287872314453125, 0.3002777099609375, 0.31268310546875, 0.3250885009765625, 0.337493896484375, 0.3498992919921875, 0.3623046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 7.0, 11.0, 13.0, 10.0, 15.0, 20.0, 32.0, 34.0, 53.0, 60.0, 107.0, 120.0, 142.0, 211.0, 279.0, 377.0, 561.0, 828.0, 1255.0, 2232.0, 5159.0, 17769.0, 4053889.0, 92173.0, 10007.0, 3560.0, 1786.0, 1064.0, 734.0, 453.0, 339.0, 254.0, 181.0, 148.0, 104.0, 67.0, 62.0, 39.0, 39.0, 23.0, 18.0, 10.0, 13.0, 11.0, 12.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.857421875, -1.7990264892578125, -1.740631103515625, -1.6822357177734375, -1.62384033203125, -1.5654449462890625, -1.507049560546875, -1.4486541748046875, -1.3902587890625, -1.3318634033203125, -1.273468017578125, -1.2150726318359375, -1.15667724609375, -1.0982818603515625, -1.039886474609375, -0.9814910888671875, -0.923095703125, -0.8647003173828125, -0.806304931640625, -0.7479095458984375, -0.68951416015625, -0.6311187744140625, -0.572723388671875, -0.5143280029296875, -0.4559326171875, -0.3975372314453125, -0.339141845703125, -0.2807464599609375, -0.22235107421875, -0.1639556884765625, -0.105560302734375, -0.0471649169921875, 0.01123046875, 0.0696258544921875, 0.128021240234375, 0.1864166259765625, 0.24481201171875, 0.3032073974609375, 0.361602783203125, 0.4199981689453125, 0.4783935546875, 0.5367889404296875, 0.595184326171875, 0.6535797119140625, 0.71197509765625, 0.7703704833984375, 0.828765869140625, 0.8871612548828125, 0.945556640625, 1.0039520263671875, 1.062347412109375, 1.1207427978515625, 1.17913818359375, 1.2375335693359375, 1.295928955078125, 1.3543243408203125, 1.4127197265625, 1.4711151123046875, 1.529510498046875, 1.5879058837890625, 1.64630126953125, 1.7046966552734375, 1.763092041015625, 1.8214874267578125, 1.8798828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 22.0, 141.0, 3818.0, 41.0, 16.0, 12.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7828445434570312, -0.7585601806640625, -0.7342758178710938, -0.709991455078125, -0.6857070922851562, -0.6614227294921875, -0.6371383666992188, -0.61285400390625, -0.5885696411132812, -0.5642852783203125, -0.5400009155273438, -0.515716552734375, -0.49143218994140625, -0.4671478271484375, -0.44286346435546875, -0.4185791015625, -0.39429473876953125, -0.3700103759765625, -0.34572601318359375, -0.321441650390625, -0.29715728759765625, -0.2728729248046875, -0.24858856201171875, -0.22430419921875, -0.20001983642578125, -0.1757354736328125, -0.15145111083984375, -0.127166748046875, -0.10288238525390625, -0.0785980224609375, -0.05431365966796875, -0.030029296875, -0.00574493408203125, 0.0185394287109375, 0.04282379150390625, 0.067108154296875, 0.09139251708984375, 0.1156768798828125, 0.13996124267578125, 0.16424560546875, 0.18852996826171875, 0.2128143310546875, 0.23709869384765625, 0.261383056640625, 0.28566741943359375, 0.3099517822265625, 0.33423614501953125, 0.3585205078125, 0.38280487060546875, 0.4070892333984375, 0.43137359619140625, 0.455657958984375, 0.47994232177734375, 0.5042266845703125, 0.5285110473632812, 0.55279541015625, 0.5770797729492188, 0.6013641357421875, 0.6256484985351562, 0.649932861328125, 0.6742172241210938, 0.6985015869140625, 0.7227859497070312, 0.7470703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 23.0, 18.0, 38.0, 64.0, 81.0, 121.0, 162.0, 160.0, 126.0, 73.0, 51.0, 25.0, 14.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1238667964935303, -1.0766856670379639, -1.029504418373108, -0.9823232889175415, -0.9351420998573303, -0.8879609107971191, -0.8407797813415527, -0.7935985922813416, -0.7464174032211304, -0.6992362141609192, -0.652055025100708, -0.6048738956451416, -0.5576927065849304, -0.5105115175247192, -0.46333035826683044, -0.41614919900894165, -0.36896800994873047, -0.3217868208885193, -0.2746056616306305, -0.2274244874715805, -0.18024331331253052, -0.13306213915348053, -0.08588096499443054, -0.03869980573654175, 0.008481383323669434, 0.05566255748271942, 0.10284373164176941, 0.1500249058008194, 0.19720607995986938, 0.24438725411891937, 0.29156842827796936, 0.33874958753585815, 0.3859308958053589, 0.43311208486557007, 0.48029324412345886, 0.5274744033813477, 0.5746555924415588, 0.62183678150177, 0.6690179109573364, 0.7161991000175476, 0.7633802890777588, 0.81056147813797, 0.8577426671981812, 0.9049237966537476, 0.9521049857139587, 0.9992861747741699, 1.0464673042297363, 1.0936484336853027, 1.1408296823501587, 1.188010811805725, 1.235192060470581, 1.2823731899261475, 1.3295543193817139, 1.3767355680465698, 1.4239166975021362, 1.4710979461669922, 1.5182790756225586, 1.565460205078125, 1.612641453742981, 1.6598225831985474, 1.7070038318634033, 1.7541849613189697, 1.8013660907745361, 1.8485472202301025, 1.8957284688949585]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 8.0, 12.0, 10.0, 21.0, 19.0, 21.0, 22.0, 30.0, 43.0, 45.0, 39.0, 38.0, 57.0, 48.0, 51.0, 62.0, 51.0, 42.0, 47.0, 39.0, 33.0, 43.0, 33.0, 35.0, 25.0, 27.0, 22.0, 16.0, 11.0, 10.0, 12.0, 4.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0886290073394775, -1.0520042181015015, -1.0153794288635254, -0.9787546396255493, -0.9421297907829285, -0.9055050015449524, -0.8688802123069763, -0.8322553634643555, -0.7956305742263794, -0.7590057849884033, -0.7223809957504272, -0.6857562065124512, -0.6491313576698303, -0.6125065684318542, -0.5758817791938782, -0.5392569303512573, -0.502632200717926, -0.46600741147994995, -0.4293825924396515, -0.3927578032016754, -0.35613298416137695, -0.3195081949234009, -0.2828834056854248, -0.24625858664512634, -0.20963379740715027, -0.173008993268013, -0.13638418912887573, -0.09975939989089966, -0.06313459575176239, -0.026509791612625122, 0.010114997625350952, 0.046739816665649414, 0.08336460590362549, 0.11998941004276276, 0.15661421418190002, 0.1932390034198761, 0.22986380755901337, 0.26648861169815063, 0.3031134009361267, 0.33973821997642517, 0.37636300921440125, 0.4129877984523773, 0.4496126174926758, 0.48623740673065186, 0.5228621959686279, 0.559486985206604, 0.5961117744445801, 0.6327366232872009, 0.669361412525177, 0.7059862017631531, 0.7426109910011292, 0.77923583984375, 0.8158606290817261, 0.8524854183197021, 0.8891102075576782, 0.9257349967956543, 0.9623597860336304, 0.9989845752716064, 1.0356093645095825, 1.0722341537475586, 1.1088589429855347, 1.1454837322235107, 1.1821086406707764, 1.2187334299087524, 1.2553582191467285]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 10.0, 4.0, 12.0, 8.0, 18.0, 30.0, 32.0, 63.0, 84.0, 102.0, 171.0, 203.0, 369.0, 525.0, 864.0, 1235.0, 1960.0, 3221.0, 5181.0, 8589.0, 14497.0, 25269.0, 46626.0, 92741.0, 202872.0, 298189.0, 170851.0, 78779.0, 40597.0, 22292.0, 12845.0, 7558.0, 4728.0, 2787.0, 1804.0, 1145.0, 756.0, 509.0, 334.0, 211.0, 145.0, 100.0, 72.0, 54.0, 31.0, 24.0, 20.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 3.0], "bins": [-0.70458984375, -0.6834869384765625, -0.662384033203125, -0.6412811279296875, -0.62017822265625, -0.5990753173828125, -0.577972412109375, -0.5568695068359375, -0.5357666015625, -0.5146636962890625, -0.493560791015625, -0.4724578857421875, -0.45135498046875, -0.4302520751953125, -0.409149169921875, -0.3880462646484375, -0.366943359375, -0.3458404541015625, -0.324737548828125, -0.3036346435546875, -0.28253173828125, -0.2614288330078125, -0.240325927734375, -0.2192230224609375, -0.1981201171875, -0.1770172119140625, -0.155914306640625, -0.1348114013671875, -0.11370849609375, -0.0926055908203125, -0.071502685546875, -0.0503997802734375, -0.029296875, -0.0081939697265625, 0.012908935546875, 0.0340118408203125, 0.05511474609375, 0.0762176513671875, 0.097320556640625, 0.1184234619140625, 0.1395263671875, 0.1606292724609375, 0.181732177734375, 0.2028350830078125, 0.22393798828125, 0.2450408935546875, 0.266143798828125, 0.2872467041015625, 0.308349609375, 0.3294525146484375, 0.350555419921875, 0.3716583251953125, 0.39276123046875, 0.4138641357421875, 0.434967041015625, 0.4560699462890625, 0.4771728515625, 0.4982757568359375, 0.519378662109375, 0.5404815673828125, 0.56158447265625, 0.5826873779296875, 0.603790283203125, 0.6248931884765625, 0.64599609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 7.0, 5.0, 7.0, 9.0, 14.0, 16.0, 12.0, 17.0, 20.0, 15.0, 35.0, 35.0, 30.0, 31.0, 45.0, 37.0, 52.0, 44.0, 55.0, 50.0, 34.0, 32.0, 44.0, 40.0, 34.0, 36.0, 24.0, 28.0, 30.0, 23.0, 17.0, 21.0, 20.0, 16.0, 8.0, 12.0, 9.0, 5.0, 7.0, 3.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5107421875, -0.495849609375, -0.48095703125, -0.466064453125, -0.451171875, -0.436279296875, -0.42138671875, -0.406494140625, -0.3916015625, -0.376708984375, -0.36181640625, -0.346923828125, -0.33203125, -0.317138671875, -0.30224609375, -0.287353515625, -0.2724609375, -0.257568359375, -0.24267578125, -0.227783203125, -0.212890625, -0.197998046875, -0.18310546875, -0.168212890625, -0.1533203125, -0.138427734375, -0.12353515625, -0.108642578125, -0.09375, -0.078857421875, -0.06396484375, -0.049072265625, -0.0341796875, -0.019287109375, -0.00439453125, 0.010498046875, 0.025390625, 0.040283203125, 0.05517578125, 0.070068359375, 0.0849609375, 0.099853515625, 0.11474609375, 0.129638671875, 0.14453125, 0.159423828125, 0.17431640625, 0.189208984375, 0.2041015625, 0.218994140625, 0.23388671875, 0.248779296875, 0.263671875, 0.278564453125, 0.29345703125, 0.308349609375, 0.3232421875, 0.338134765625, 0.35302734375, 0.367919921875, 0.3828125, 0.397705078125, 0.41259765625, 0.427490234375, 0.4423828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 13.0, 13.0, 20.0, 35.0, 37.0, 39.0, 58.0, 125.0, 212.0, 409.0, 917.0, 2196.0, 6318.0, 21465.0, 91138.0, 546609.0, 304387.0, 53108.0, 14038.0, 4383.0, 1544.0, 684.0, 318.0, 174.0, 82.0, 61.0, 47.0, 26.0, 28.0, 18.0, 8.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.001953125, -1.946075439453125, -1.89019775390625, -1.834320068359375, -1.7784423828125, -1.722564697265625, -1.66668701171875, -1.610809326171875, -1.554931640625, -1.499053955078125, -1.44317626953125, -1.387298583984375, -1.3314208984375, -1.275543212890625, -1.21966552734375, -1.163787841796875, -1.10791015625, -1.052032470703125, -0.99615478515625, -0.940277099609375, -0.8843994140625, -0.828521728515625, -0.77264404296875, -0.716766357421875, -0.660888671875, -0.605010986328125, -0.54913330078125, -0.493255615234375, -0.4373779296875, -0.381500244140625, -0.32562255859375, -0.269744873046875, -0.2138671875, -0.157989501953125, -0.10211181640625, -0.046234130859375, 0.0096435546875, 0.065521240234375, 0.12139892578125, 0.177276611328125, 0.233154296875, 0.289031982421875, 0.34490966796875, 0.400787353515625, 0.4566650390625, 0.512542724609375, 0.56842041015625, 0.624298095703125, 0.68017578125, 0.736053466796875, 0.79193115234375, 0.847808837890625, 0.9036865234375, 0.959564208984375, 1.01544189453125, 1.071319580078125, 1.127197265625, 1.183074951171875, 1.23895263671875, 1.294830322265625, 1.3507080078125, 1.406585693359375, 1.46246337890625, 1.518341064453125, 1.57421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 4.0, 9.0, 11.0, 18.0, 17.0, 23.0, 23.0, 29.0, 23.0, 30.0, 47.0, 40.0, 49.0, 39.0, 57.0, 45.0, 45.0, 31.0, 52.0, 48.0, 54.0, 46.0, 41.0, 37.0, 33.0, 23.0, 19.0, 16.0, 18.0, 12.0, 9.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.103515625, -3.010284423828125, -2.91705322265625, -2.823822021484375, -2.7305908203125, -2.637359619140625, -2.54412841796875, -2.450897216796875, -2.357666015625, -2.264434814453125, -2.17120361328125, -2.077972412109375, -1.9847412109375, -1.891510009765625, -1.79827880859375, -1.705047607421875, -1.61181640625, -1.518585205078125, -1.42535400390625, -1.332122802734375, -1.2388916015625, -1.145660400390625, -1.05242919921875, -0.959197998046875, -0.865966796875, -0.772735595703125, -0.67950439453125, -0.586273193359375, -0.4930419921875, -0.399810791015625, -0.30657958984375, -0.213348388671875, -0.1201171875, -0.026885986328125, 0.06634521484375, 0.159576416015625, 0.2528076171875, 0.346038818359375, 0.43927001953125, 0.532501220703125, 0.625732421875, 0.718963623046875, 0.81219482421875, 0.905426025390625, 0.9986572265625, 1.091888427734375, 1.18511962890625, 1.278350830078125, 1.37158203125, 1.464813232421875, 1.55804443359375, 1.651275634765625, 1.7445068359375, 1.837738037109375, 1.93096923828125, 2.024200439453125, 2.117431640625, 2.210662841796875, 2.30389404296875, 2.397125244140625, 2.4903564453125, 2.583587646484375, 2.67681884765625, 2.770050048828125, 2.86328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 12.0, 14.0, 19.0, 46.0, 85.0, 265.0, 720.0, 2837.0, 24508.0, 737815.0, 268202.0, 11408.0, 1827.0, 451.0, 155.0, 78.0, 41.0, 21.0, 14.0, 13.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8729629516601562, -0.8391876220703125, -0.8054122924804688, -0.771636962890625, -0.7378616333007812, -0.7040863037109375, -0.6703109741210938, -0.63653564453125, -0.6027603149414062, -0.5689849853515625, -0.5352096557617188, -0.501434326171875, -0.46765899658203125, -0.4338836669921875, -0.40010833740234375, -0.3663330078125, -0.33255767822265625, -0.2987823486328125, -0.26500701904296875, -0.231231689453125, -0.19745635986328125, -0.1636810302734375, -0.12990570068359375, -0.09613037109375, -0.06235504150390625, -0.0285797119140625, 0.00519561767578125, 0.038970947265625, 0.07274627685546875, 0.1065216064453125, 0.14029693603515625, 0.174072265625, 0.20784759521484375, 0.2416229248046875, 0.27539825439453125, 0.309173583984375, 0.34294891357421875, 0.3767242431640625, 0.41049957275390625, 0.44427490234375, 0.47805023193359375, 0.5118255615234375, 0.5456008911132812, 0.579376220703125, 0.6131515502929688, 0.6469268798828125, 0.6807022094726562, 0.7144775390625, 0.7482528686523438, 0.7820281982421875, 0.8158035278320312, 0.849578857421875, 0.8833541870117188, 0.9171295166015625, 0.9509048461914062, 0.98468017578125, 1.0184555053710938, 1.0522308349609375, 1.0860061645507812, 1.119781494140625, 1.1535568237304688, 1.1873321533203125, 1.2211074829101562, 1.2548828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 6.0, 9.0, 26.0, 26.0, 63.0, 95.0, 117.0, 146.0, 155.0, 118.0, 89.0, 57.0, 33.0, 24.0, 13.0, 9.0, 8.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010907649993896484, -0.0001053251326084137, -0.00010157376527786255, -9.78223979473114e-05, -9.407103061676025e-05, -9.03196632862091e-05, -8.656829595565796e-05, -8.281692862510681e-05, -7.906556129455566e-05, -7.531419396400452e-05, -7.156282663345337e-05, -6.781145930290222e-05, -6.406009197235107e-05, -6.030872464179993e-05, -5.655735731124878e-05, -5.280598998069763e-05, -4.9054622650146484e-05, -4.530325531959534e-05, -4.155188798904419e-05, -3.780052065849304e-05, -3.4049153327941895e-05, -3.0297785997390747e-05, -2.65464186668396e-05, -2.2795051336288452e-05, -1.9043684005737305e-05, -1.5292316675186157e-05, -1.154094934463501e-05, -7.789582014083862e-06, -4.038214683532715e-06, -2.868473529815674e-07, 3.46451997756958e-06, 7.2158873081207275e-06, 1.0967254638671875e-05, 1.4718621969223022e-05, 1.846998929977417e-05, 2.2221356630325317e-05, 2.5972723960876465e-05, 2.9724091291427612e-05, 3.347545862197876e-05, 3.722682595252991e-05, 4.0978193283081055e-05, 4.47295606136322e-05, 4.848092794418335e-05, 5.22322952747345e-05, 5.5983662605285645e-05, 5.973502993583679e-05, 6.348639726638794e-05, 6.723776459693909e-05, 7.098913192749023e-05, 7.474049925804138e-05, 7.849186658859253e-05, 8.224323391914368e-05, 8.599460124969482e-05, 8.974596858024597e-05, 9.349733591079712e-05, 9.724870324134827e-05, 0.00010100007057189941, 0.00010475143790245056, 0.00010850280523300171, 0.00011225417256355286, 0.000116005539894104, 0.00011975690722465515, 0.0001235082745552063, 0.00012725964188575745, 0.0001310110092163086]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 10.0, 7.0, 9.0, 27.0, 43.0, 54.0, 122.0, 304.0, 904.0, 4352.0, 37119.0, 608022.0, 370969.0, 22481.0, 2976.0, 685.0, 231.0, 101.0, 57.0, 36.0, 23.0, 9.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45458984375, -0.43053436279296875, -0.4064788818359375, -0.38242340087890625, -0.358367919921875, -0.33431243896484375, -0.3102569580078125, -0.28620147705078125, -0.26214599609375, -0.23809051513671875, -0.2140350341796875, -0.18997955322265625, -0.165924072265625, -0.14186859130859375, -0.1178131103515625, -0.09375762939453125, -0.0697021484375, -0.04564666748046875, -0.0215911865234375, 0.00246429443359375, 0.026519775390625, 0.05057525634765625, 0.0746307373046875, 0.09868621826171875, 0.12274169921875, 0.14679718017578125, 0.1708526611328125, 0.19490814208984375, 0.218963623046875, 0.24301910400390625, 0.2670745849609375, 0.29113006591796875, 0.315185546875, 0.33924102783203125, 0.3632965087890625, 0.38735198974609375, 0.411407470703125, 0.43546295166015625, 0.4595184326171875, 0.48357391357421875, 0.50762939453125, 0.5316848754882812, 0.5557403564453125, 0.5797958374023438, 0.603851318359375, 0.6279067993164062, 0.6519622802734375, 0.6760177612304688, 0.7000732421875, 0.7241287231445312, 0.7481842041015625, 0.7722396850585938, 0.796295166015625, 0.8203506469726562, 0.8444061279296875, 0.8684616088867188, 0.89251708984375, 0.9165725708007812, 0.9406280517578125, 0.9646835327148438, 0.988739013671875, 1.0127944946289062, 1.0368499755859375, 1.0609054565429688, 1.0849609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 8.0, 22.0, 26.0, 38.0, 43.0, 50.0, 73.0, 89.0, 91.0, 105.0, 80.0, 97.0, 59.0, 44.0, 38.0, 39.0, 19.0, 10.0, 9.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.462646484375, -0.4397773742675781, -0.41690826416015625, -0.3940391540527344, -0.3711700439453125, -0.3483009338378906, -0.32543182373046875, -0.3025627136230469, -0.279693603515625, -0.2568244934082031, -0.23395538330078125, -0.21108627319335938, -0.1882171630859375, -0.16534805297851562, -0.14247894287109375, -0.11960983276367188, -0.09674072265625, -0.07387161254882812, -0.05100250244140625, -0.028133392333984375, -0.0052642822265625, 0.017604827880859375, 0.04047393798828125, 0.06334304809570312, 0.086212158203125, 0.10908126831054688, 0.13195037841796875, 0.15481948852539062, 0.1776885986328125, 0.20055770874023438, 0.22342681884765625, 0.24629592895507812, 0.2691650390625, 0.2920341491699219, 0.31490325927734375, 0.3377723693847656, 0.3606414794921875, 0.3835105895996094, 0.40637969970703125, 0.4292488098144531, 0.452117919921875, 0.4749870300292969, 0.49785614013671875, 0.5207252502441406, 0.5435943603515625, 0.5664634704589844, 0.5893325805664062, 0.6122016906738281, 0.63507080078125, 0.6579399108886719, 0.6808090209960938, 0.7036781311035156, 0.7265472412109375, 0.7494163513183594, 0.7722854614257812, 0.7951545715332031, 0.818023681640625, 0.8408927917480469, 0.8637619018554688, 0.8866310119628906, 0.9095001220703125, 0.9323692321777344, 0.9552383422851562, 0.9781074523925781, 1.0009765625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 10.0, 18.0, 34.0, 65.0, 179.0, 327.0, 221.0, 77.0, 49.0, 18.0, 9.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.836753845214844, -6.047939777374268, -5.259125709533691, -4.470311164855957, -3.68149733543396, -2.892683267593384, -2.1038689613342285, -1.3150548934936523, -0.5262408256530762, 0.2625733017921448, 1.0513874292373657, 1.8402016162872314, 2.6290156841278076, 3.417829751968384, 4.206644058227539, 4.995458126068115, 5.784272193908691, 6.573086261749268, 7.361900329589844, 8.150714874267578, 8.939528465270996, 9.72834300994873, 10.517156600952148, 11.305971145629883, 12.094785690307617, 12.883600234985352, 13.67241382598877, 14.461228370666504, 15.250041961669922, 16.038856506347656, 16.82767105102539, 17.616485595703125, 18.405298233032227, 19.19411277770996, 19.982927322387695, 20.771739959716797, 21.56055450439453, 22.349369049072266, 23.13818359375, 23.926998138427734, 24.715810775756836, 25.50462532043457, 26.293439865112305, 27.082252502441406, 27.87106704711914, 28.659881591796875, 29.44869613647461, 30.237510681152344, 31.026325225830078, 31.815139770507812, 32.60395431518555, 33.39276885986328, 34.181583404541016, 34.970394134521484, 35.75920867919922, 36.54802322387695, 37.33683776855469, 38.12565231323242, 38.914466857910156, 39.70328140258789, 40.492095947265625, 41.280906677246094, 42.06972122192383, 42.85853576660156, 43.6473503112793]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 6.0, 7.0, 11.0, 15.0, 21.0, 18.0, 16.0, 28.0, 30.0, 54.0, 42.0, 36.0, 54.0, 71.0, 65.0, 62.0, 62.0, 56.0, 43.0, 35.0, 44.0, 34.0, 22.0, 20.0, 28.0, 24.0, 18.0, 19.0, 5.0, 11.0, 5.0, 5.0, 11.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.14488983154297, -15.629015922546387, -15.113142967224121, -14.597269058227539, -14.081395149230957, -13.565521240234375, -13.04964828491211, -12.533774375915527, -12.017900466918945, -11.502026557922363, -10.986153602600098, -10.470279693603516, -9.954405784606934, -9.438531875610352, -8.922658920288086, -8.406785011291504, -7.890912055969238, -7.3750386238098145, -6.859164714813232, -6.343291282653809, -5.827417373657227, -5.311543941497803, -4.795670509338379, -4.279796600341797, -3.763923168182373, -3.24804949760437, -2.732175827026367, -2.2163023948669434, -1.7004287242889404, -1.1845550537109375, -0.6686816215515137, -0.15280795097351074, 0.3630657196044922, 0.8789393305778503, 1.3948129415512085, 1.9106864929199219, 2.426560163497925, 2.9424338340759277, 3.4583072662353516, 3.9741809368133545, 4.490054607391357, 5.005928039550781, 5.521801948547363, 6.037675380706787, 6.553548812866211, 7.069422721862793, 7.585296154022217, 8.10116958618164, 8.617043495178223, 9.132917404174805, 9.64879035949707, 10.164664268493652, 10.680538177490234, 11.1964111328125, 11.712285041809082, 12.228158950805664, 12.74403190612793, 13.259905815124512, 13.775778770446777, 14.29165267944336, 14.807526588439941, 15.323400497436523, 15.839273452758789, 16.355146408081055, 16.871021270751953]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 12.0, 11.0, 16.0, 32.0, 26.0, 36.0, 48.0, 75.0, 110.0, 151.0, 248.0, 346.0, 570.0, 943.0, 1746.0, 3912.0, 11646.0, 264044.0, 3888578.0, 13006.0, 3973.0, 1892.0, 1013.0, 594.0, 407.0, 225.0, 189.0, 112.0, 87.0, 51.0, 34.0, 31.0, 19.0, 19.0, 15.0, 23.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.3076171875, -1.2667999267578125, -1.225982666015625, -1.1851654052734375, -1.14434814453125, -1.1035308837890625, -1.062713623046875, -1.0218963623046875, -0.9810791015625, -0.9402618408203125, -0.899444580078125, -0.8586273193359375, -0.81781005859375, -0.7769927978515625, -0.736175537109375, -0.6953582763671875, -0.654541015625, -0.6137237548828125, -0.572906494140625, -0.5320892333984375, -0.49127197265625, -0.4504547119140625, -0.409637451171875, -0.3688201904296875, -0.3280029296875, -0.2871856689453125, -0.246368408203125, -0.2055511474609375, -0.16473388671875, -0.1239166259765625, -0.083099365234375, -0.0422821044921875, -0.00146484375, 0.0393524169921875, 0.080169677734375, 0.1209869384765625, 0.16180419921875, 0.2026214599609375, 0.243438720703125, 0.2842559814453125, 0.3250732421875, 0.3658905029296875, 0.406707763671875, 0.4475250244140625, 0.48834228515625, 0.5291595458984375, 0.569976806640625, 0.6107940673828125, 0.651611328125, 0.6924285888671875, 0.733245849609375, 0.7740631103515625, 0.81488037109375, 0.8556976318359375, 0.896514892578125, 0.9373321533203125, 0.9781494140625, 1.0189666748046875, 1.059783935546875, 1.1006011962890625, 1.14141845703125, 1.1822357177734375, 1.223052978515625, 1.2638702392578125, 1.3046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 9.0, 11.0, 16.0, 11.0, 12.0, 15.0, 32.0, 21.0, 27.0, 51.0, 37.0, 38.0, 49.0, 56.0, 59.0, 57.0, 66.0, 66.0, 57.0, 47.0, 33.0, 34.0, 39.0, 31.0, 19.0, 20.0, 9.0, 10.0, 20.0, 5.0, 6.0, 7.0, 8.0, 6.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7090606689453125, -0.685211181640625, -0.6613616943359375, -0.63751220703125, -0.6136627197265625, -0.589813232421875, -0.5659637451171875, -0.5421142578125, -0.5182647705078125, -0.494415283203125, -0.4705657958984375, -0.44671630859375, -0.4228668212890625, -0.399017333984375, -0.3751678466796875, -0.351318359375, -0.3274688720703125, -0.303619384765625, -0.2797698974609375, -0.25592041015625, -0.2320709228515625, -0.208221435546875, -0.1843719482421875, -0.1605224609375, -0.1366729736328125, -0.112823486328125, -0.0889739990234375, -0.06512451171875, -0.0412750244140625, -0.017425537109375, 0.0064239501953125, 0.0302734375, 0.0541229248046875, 0.077972412109375, 0.1018218994140625, 0.12567138671875, 0.1495208740234375, 0.173370361328125, 0.1972198486328125, 0.2210693359375, 0.2449188232421875, 0.268768310546875, 0.2926177978515625, 0.31646728515625, 0.3403167724609375, 0.364166259765625, 0.3880157470703125, 0.411865234375, 0.4357147216796875, 0.459564208984375, 0.4834136962890625, 0.50726318359375, 0.5311126708984375, 0.554962158203125, 0.5788116455078125, 0.6026611328125, 0.6265106201171875, 0.650360107421875, 0.6742095947265625, 0.69805908203125, 0.7219085693359375, 0.745758056640625, 0.7696075439453125, 0.79345703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 10.0, 5.0, 5.0, 7.0, 17.0, 13.0, 23.0, 34.0, 41.0, 45.0, 69.0, 97.0, 130.0, 145.0, 207.0, 319.0, 408.0, 590.0, 1049.0, 1736.0, 3353.0, 8608.0, 36344.0, 4031026.0, 86530.0, 13033.0, 4525.0, 2129.0, 1183.0, 777.0, 530.0, 326.0, 254.0, 194.0, 123.0, 105.0, 77.0, 66.0, 41.0, 33.0, 25.0, 17.0, 10.0, 7.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2587890625, -1.2148895263671875, -1.170989990234375, -1.1270904541015625, -1.08319091796875, -1.0392913818359375, -0.995391845703125, -0.9514923095703125, -0.9075927734375, -0.8636932373046875, -0.819793701171875, -0.7758941650390625, -0.73199462890625, -0.6880950927734375, -0.644195556640625, -0.6002960205078125, -0.556396484375, -0.5124969482421875, -0.468597412109375, -0.4246978759765625, -0.38079833984375, -0.3368988037109375, -0.292999267578125, -0.2490997314453125, -0.2052001953125, -0.1613006591796875, -0.117401123046875, -0.0735015869140625, -0.02960205078125, 0.0142974853515625, 0.058197021484375, 0.1020965576171875, 0.14599609375, 0.1898956298828125, 0.233795166015625, 0.2776947021484375, 0.32159423828125, 0.3654937744140625, 0.409393310546875, 0.4532928466796875, 0.4971923828125, 0.5410919189453125, 0.584991455078125, 0.6288909912109375, 0.67279052734375, 0.7166900634765625, 0.760589599609375, 0.8044891357421875, 0.848388671875, 0.8922882080078125, 0.936187744140625, 0.9800872802734375, 1.02398681640625, 1.0678863525390625, 1.111785888671875, 1.1556854248046875, 1.1995849609375, 1.2434844970703125, 1.287384033203125, 1.3312835693359375, 1.37518310546875, 1.4190826416015625, 1.462982177734375, 1.5068817138671875, 1.55078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 20.0, 62.0, 3318.0, 530.0, 58.0, 21.0, 21.0, 9.0, 1.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5976524353027344, -0.5805587768554688, -0.5634651184082031, -0.5463714599609375, -0.5292778015136719, -0.5121841430664062, -0.4950904846191406, -0.477996826171875, -0.4609031677246094, -0.44380950927734375, -0.4267158508300781, -0.4096221923828125, -0.3925285339355469, -0.37543487548828125, -0.3583412170410156, -0.34124755859375, -0.3241539001464844, -0.30706024169921875, -0.2899665832519531, -0.2728729248046875, -0.2557792663574219, -0.23868560791015625, -0.22159194946289062, -0.204498291015625, -0.18740463256835938, -0.17031097412109375, -0.15321731567382812, -0.1361236572265625, -0.11902999877929688, -0.10193634033203125, -0.08484268188476562, -0.0677490234375, -0.050655364990234375, -0.03356170654296875, -0.016468048095703125, 0.0006256103515625, 0.017719268798828125, 0.03481292724609375, 0.051906585693359375, 0.069000244140625, 0.08609390258789062, 0.10318756103515625, 0.12028121948242188, 0.1373748779296875, 0.15446853637695312, 0.17156219482421875, 0.18865585327148438, 0.20574951171875, 0.22284317016601562, 0.23993682861328125, 0.2570304870605469, 0.2741241455078125, 0.2912178039550781, 0.30831146240234375, 0.3254051208496094, 0.342498779296875, 0.3595924377441406, 0.37668609619140625, 0.3937797546386719, 0.4108734130859375, 0.4279670715332031, 0.44506072998046875, 0.4621543884277344, 0.479248046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 8.0, 33.0, 87.0, 179.0, 280.0, 242.0, 105.0, 42.0, 18.0, 13.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7683079242706299, -1.677186131477356, -1.586064338684082, -1.4949424266815186, -1.4038207530975342, -1.3126988410949707, -1.2215770483016968, -1.1304552555084229, -1.039333462715149, -0.948211669921875, -0.8570898771286011, -0.7659680247306824, -0.6748462319374084, -0.5837244391441345, -0.4926025867462158, -0.4014807939529419, -0.31035900115966797, -0.21923719346523285, -0.12811538577079773, -0.036993563175201416, 0.05412822961807251, 0.14525002241134644, 0.23637187480926514, 0.32749366760253906, 0.418615460395813, 0.5097372531890869, 0.6008590459823608, 0.6919808983802795, 0.7831026911735535, 0.8742244839668274, 0.9653463363647461, 1.05646812915802, 1.147590160369873, 1.238711953163147, 1.329833745956421, 1.4209556579589844, 1.5120773315429688, 1.6031992435455322, 1.6943210363388062, 1.78544282913208, 1.876564621925354, 1.967686414718628, 2.0588083267211914, 2.149930000305176, 2.2410519123077393, 2.3321735858917236, 2.423295497894287, 2.5144171714782715, 2.605539083480835, 2.6966609954833984, 2.787782669067383, 2.8789045810699463, 2.9700262546539307, 3.061148166656494, 3.1522698402404785, 3.243391752243042, 3.3345136642456055, 3.425635576248169, 3.5167572498321533, 3.607879161834717, 3.699000835418701, 3.7901227474212646, 3.881244659423828, 3.9723663330078125, 4.063488006591797]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 15.0, 3.0, 12.0, 10.0, 13.0, 15.0, 22.0, 21.0, 40.0, 23.0, 31.0, 41.0, 40.0, 35.0, 54.0, 39.0, 56.0, 55.0, 53.0, 52.0, 38.0, 51.0, 41.0, 31.0, 35.0, 31.0, 22.0, 22.0, 15.0, 16.0, 16.0, 10.0, 10.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8254018425941467, -0.7982668876647949, -0.7711318731307983, -0.7439968585968018, -0.71686190366745, -0.6897269487380981, -0.6625919342041016, -0.635456919670105, -0.6083219647407532, -0.5811870098114014, -0.5540519952774048, -0.5269169807434082, -0.4997820258140564, -0.4726470410823822, -0.445512056350708, -0.4183770716190338, -0.3912420868873596, -0.3641071021556854, -0.33697211742401123, -0.30983713269233704, -0.28270214796066284, -0.25556716322898865, -0.22843217849731445, -0.20129719376564026, -0.17416220903396606, -0.14702722430229187, -0.11989223957061768, -0.09275725483894348, -0.06562227010726929, -0.03848728537559509, -0.011352300643920898, 0.015782684087753296, 0.042917728424072266, 0.07005271315574646, 0.09718769788742065, 0.12432268261909485, 0.15145766735076904, 0.17859265208244324, 0.20572763681411743, 0.23286262154579163, 0.2599976062774658, 0.28713259100914, 0.3142675757408142, 0.3414025604724884, 0.3685375452041626, 0.3956725299358368, 0.422807514667511, 0.4499424993991852, 0.4770774841308594, 0.504212498664856, 0.5313474535942078, 0.5584824085235596, 0.5856174230575562, 0.6127524375915527, 0.6398873925209045, 0.6670223474502563, 0.6941573619842529, 0.7212923765182495, 0.7484273314476013, 0.7755622863769531, 0.8026973009109497, 0.8298323154449463, 0.8569672703742981, 0.8841022253036499, 0.9112372398376465]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 8.0, 8.0, 6.0, 6.0, 16.0, 18.0, 29.0, 45.0, 58.0, 63.0, 130.0, 157.0, 195.0, 363.0, 551.0, 836.0, 1379.0, 2377.0, 4430.0, 8048.0, 16741.0, 37775.0, 101033.0, 321511.0, 357503.0, 114955.0, 41939.0, 18208.0, 8847.0, 4687.0, 2511.0, 1451.0, 905.0, 576.0, 378.0, 246.0, 158.0, 117.0, 83.0, 58.0, 42.0, 37.0, 18.0, 16.0, 11.0, 6.0, 8.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.0625, -1.028289794921875, -0.99407958984375, -0.959869384765625, -0.9256591796875, -0.891448974609375, -0.85723876953125, -0.823028564453125, -0.788818359375, -0.754608154296875, -0.72039794921875, -0.686187744140625, -0.6519775390625, -0.617767333984375, -0.58355712890625, -0.549346923828125, -0.51513671875, -0.480926513671875, -0.44671630859375, -0.412506103515625, -0.3782958984375, -0.344085693359375, -0.30987548828125, -0.275665283203125, -0.241455078125, -0.207244873046875, -0.17303466796875, -0.138824462890625, -0.1046142578125, -0.070404052734375, -0.03619384765625, -0.001983642578125, 0.0322265625, 0.066436767578125, 0.10064697265625, 0.134857177734375, 0.1690673828125, 0.203277587890625, 0.23748779296875, 0.271697998046875, 0.305908203125, 0.340118408203125, 0.37432861328125, 0.408538818359375, 0.4427490234375, 0.476959228515625, 0.51116943359375, 0.545379638671875, 0.57958984375, 0.613800048828125, 0.64801025390625, 0.682220458984375, 0.7164306640625, 0.750640869140625, 0.78485107421875, 0.819061279296875, 0.853271484375, 0.887481689453125, 0.92169189453125, 0.955902099609375, 0.9901123046875, 1.024322509765625, 1.05853271484375, 1.092742919921875, 1.126953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 8.0, 6.0, 12.0, 13.0, 7.0, 15.0, 25.0, 23.0, 29.0, 29.0, 36.0, 35.0, 33.0, 49.0, 63.0, 56.0, 51.0, 63.0, 71.0, 50.0, 53.0, 46.0, 28.0, 42.0, 29.0, 14.0, 18.0, 17.0, 11.0, 10.0, 14.0, 9.0, 4.0, 5.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.763671875, -0.739715576171875, -0.71575927734375, -0.691802978515625, -0.6678466796875, -0.643890380859375, -0.61993408203125, -0.595977783203125, -0.572021484375, -0.548065185546875, -0.52410888671875, -0.500152587890625, -0.4761962890625, -0.452239990234375, -0.42828369140625, -0.404327392578125, -0.38037109375, -0.356414794921875, -0.33245849609375, -0.308502197265625, -0.2845458984375, -0.260589599609375, -0.23663330078125, -0.212677001953125, -0.188720703125, -0.164764404296875, -0.14080810546875, -0.116851806640625, -0.0928955078125, -0.068939208984375, -0.04498291015625, -0.021026611328125, 0.0029296875, 0.026885986328125, 0.05084228515625, 0.074798583984375, 0.0987548828125, 0.122711181640625, 0.14666748046875, 0.170623779296875, 0.194580078125, 0.218536376953125, 0.24249267578125, 0.266448974609375, 0.2904052734375, 0.314361572265625, 0.33831787109375, 0.362274169921875, 0.38623046875, 0.410186767578125, 0.43414306640625, 0.458099365234375, 0.4820556640625, 0.506011962890625, 0.52996826171875, 0.553924560546875, 0.577880859375, 0.601837158203125, 0.62579345703125, 0.649749755859375, 0.6737060546875, 0.697662353515625, 0.72161865234375, 0.745574951171875, 0.76953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 7.0, 10.0, 16.0, 16.0, 38.0, 52.0, 77.0, 148.0, 259.0, 515.0, 1262.0, 3791.0, 17940.0, 218053.0, 747979.0, 47726.0, 7227.0, 1891.0, 750.0, 352.0, 179.0, 110.0, 48.0, 42.0, 24.0, 14.0, 8.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.2064208984375, -3.100341796875, -2.9942626953125, -2.88818359375, -2.7821044921875, -2.676025390625, -2.5699462890625, -2.4638671875, -2.3577880859375, -2.251708984375, -2.1456298828125, -2.03955078125, -1.9334716796875, -1.827392578125, -1.7213134765625, -1.615234375, -1.5091552734375, -1.403076171875, -1.2969970703125, -1.19091796875, -1.0848388671875, -0.978759765625, -0.8726806640625, -0.7666015625, -0.6605224609375, -0.554443359375, -0.4483642578125, -0.34228515625, -0.2362060546875, -0.130126953125, -0.0240478515625, 0.08203125, 0.1881103515625, 0.294189453125, 0.4002685546875, 0.50634765625, 0.6124267578125, 0.718505859375, 0.8245849609375, 0.9306640625, 1.0367431640625, 1.142822265625, 1.2489013671875, 1.35498046875, 1.4610595703125, 1.567138671875, 1.6732177734375, 1.779296875, 1.8853759765625, 1.991455078125, 2.0975341796875, 2.20361328125, 2.3096923828125, 2.415771484375, 2.5218505859375, 2.6279296875, 2.7340087890625, 2.840087890625, 2.9461669921875, 3.05224609375, 3.1583251953125, 3.264404296875, 3.3704833984375, 3.4765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 13.0, 22.0, 39.0, 48.0, 64.0, 65.0, 82.0, 76.0, 81.0, 98.0, 71.0, 71.0, 59.0, 58.0, 38.0, 24.0, 22.0, 11.0, 11.0, 11.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.258544921875, -5.07177734375, -4.885009765625, -4.6982421875, -4.511474609375, -4.32470703125, -4.137939453125, -3.951171875, -3.764404296875, -3.57763671875, -3.390869140625, -3.2041015625, -3.017333984375, -2.83056640625, -2.643798828125, -2.45703125, -2.270263671875, -2.08349609375, -1.896728515625, -1.7099609375, -1.523193359375, -1.33642578125, -1.149658203125, -0.962890625, -0.776123046875, -0.58935546875, -0.402587890625, -0.2158203125, -0.029052734375, 0.15771484375, 0.344482421875, 0.53125, 0.718017578125, 0.90478515625, 1.091552734375, 1.2783203125, 1.465087890625, 1.65185546875, 1.838623046875, 2.025390625, 2.212158203125, 2.39892578125, 2.585693359375, 2.7724609375, 2.959228515625, 3.14599609375, 3.332763671875, 3.51953125, 3.706298828125, 3.89306640625, 4.079833984375, 4.2666015625, 4.453369140625, 4.64013671875, 4.826904296875, 5.013671875, 5.200439453125, 5.38720703125, 5.573974609375, 5.7607421875, 5.947509765625, 6.13427734375, 6.321044921875, 6.5078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 3.0, 7.0, 14.0, 15.0, 23.0, 37.0, 65.0, 162.0, 365.0, 1022.0, 3618.0, 31385.0, 991660.0, 15999.0, 2682.0, 858.0, 320.0, 149.0, 67.0, 36.0, 22.0, 17.0, 11.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8115234375, -1.7268524169921875, -1.642181396484375, -1.5575103759765625, -1.47283935546875, -1.3881683349609375, -1.303497314453125, -1.2188262939453125, -1.1341552734375, -1.0494842529296875, -0.964813232421875, -0.8801422119140625, -0.79547119140625, -0.7108001708984375, -0.626129150390625, -0.5414581298828125, -0.456787109375, -0.3721160888671875, -0.287445068359375, -0.2027740478515625, -0.11810302734375, -0.0334320068359375, 0.051239013671875, 0.1359100341796875, 0.2205810546875, 0.3052520751953125, 0.389923095703125, 0.4745941162109375, 0.55926513671875, 0.6439361572265625, 0.728607177734375, 0.8132781982421875, 0.89794921875, 0.9826202392578125, 1.067291259765625, 1.1519622802734375, 1.23663330078125, 1.3213043212890625, 1.405975341796875, 1.4906463623046875, 1.5753173828125, 1.6599884033203125, 1.744659423828125, 1.8293304443359375, 1.91400146484375, 1.9986724853515625, 2.083343505859375, 2.1680145263671875, 2.252685546875, 2.3373565673828125, 2.422027587890625, 2.5066986083984375, 2.59136962890625, 2.6760406494140625, 2.760711669921875, 2.8453826904296875, 2.9300537109375, 3.0147247314453125, 3.099395751953125, 3.1840667724609375, 3.26873779296875, 3.3534088134765625, 3.438079833984375, 3.5227508544921875, 3.607421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 11.0, 9.0, 21.0, 29.0, 29.0, 32.0, 76.0, 138.0, 190.0, 148.0, 112.0, 63.0, 45.0, 23.0, 14.0, 11.0, 9.0, 3.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001690387725830078, -0.00016478542238473892, -0.00016053207218647003, -0.00015627872198820114, -0.00015202537178993225, -0.00014777202159166336, -0.00014351867139339447, -0.00013926532119512558, -0.0001350119709968567, -0.0001307586207985878, -0.0001265052706003189, -0.00012225192040205002, -0.00011799857020378113, -0.00011374522000551224, -0.00010949186980724335, -0.00010523851960897446, -0.00010098516941070557, -9.673181921243668e-05, -9.247846901416779e-05, -8.82251188158989e-05, -8.397176861763e-05, -7.971841841936111e-05, -7.546506822109222e-05, -7.121171802282333e-05, -6.695836782455444e-05, -6.270501762628555e-05, -5.845166742801666e-05, -5.419831722974777e-05, -4.994496703147888e-05, -4.569161683320999e-05, -4.14382666349411e-05, -3.718491643667221e-05, -3.293156623840332e-05, -2.867821604013443e-05, -2.442486584186554e-05, -2.017151564359665e-05, -1.591816544532776e-05, -1.1664815247058868e-05, -7.411465048789978e-06, -3.1581148505210876e-06, 1.0952353477478027e-06, 5.348585546016693e-06, 9.601935744285583e-06, 1.3855285942554474e-05, 1.8108636140823364e-05, 2.2361986339092255e-05, 2.6615336537361145e-05, 3.0868686735630035e-05, 3.5122036933898926e-05, 3.9375387132167816e-05, 4.3628737330436707e-05, 4.78820875287056e-05, 5.213543772697449e-05, 5.638878792524338e-05, 6.064213812351227e-05, 6.489548832178116e-05, 6.914883852005005e-05, 7.340218871831894e-05, 7.765553891658783e-05, 8.190888911485672e-05, 8.616223931312561e-05, 9.04155895113945e-05, 9.466893970966339e-05, 9.892228990793228e-05, 0.00010317564010620117]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 9.0, 6.0, 12.0, 18.0, 43.0, 48.0, 78.0, 141.0, 392.0, 1563.0, 16920.0, 1017246.0, 10140.0, 1238.0, 336.0, 148.0, 72.0, 40.0, 34.0, 18.0, 13.0, 11.0, 10.0, 5.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.224884033203125, -4.11773681640625, -4.010589599609375, -3.9034423828125, -3.796295166015625, -3.68914794921875, -3.582000732421875, -3.474853515625, -3.367706298828125, -3.26055908203125, -3.153411865234375, -3.0462646484375, -2.939117431640625, -2.83197021484375, -2.724822998046875, -2.61767578125, -2.510528564453125, -2.40338134765625, -2.296234130859375, -2.1890869140625, -2.081939697265625, -1.97479248046875, -1.867645263671875, -1.760498046875, -1.653350830078125, -1.54620361328125, -1.439056396484375, -1.3319091796875, -1.224761962890625, -1.11761474609375, -1.010467529296875, -0.9033203125, -0.796173095703125, -0.68902587890625, -0.581878662109375, -0.4747314453125, -0.367584228515625, -0.26043701171875, -0.153289794921875, -0.046142578125, 0.061004638671875, 0.16815185546875, 0.275299072265625, 0.3824462890625, 0.489593505859375, 0.59674072265625, 0.703887939453125, 0.81103515625, 0.918182373046875, 1.02532958984375, 1.132476806640625, 1.2396240234375, 1.346771240234375, 1.45391845703125, 1.561065673828125, 1.668212890625, 1.775360107421875, 1.88250732421875, 1.989654541015625, 2.0968017578125, 2.203948974609375, 2.31109619140625, 2.418243408203125, 2.525390625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 43.0, 271.0, 569.0, 77.0, 21.0, 10.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4453125, -9.260955810546875, -9.07659912109375, -8.892242431640625, -8.7078857421875, -8.523529052734375, -8.33917236328125, -8.154815673828125, -7.970458984375, -7.786102294921875, -7.60174560546875, -7.417388916015625, -7.2330322265625, -7.048675537109375, -6.86431884765625, -6.679962158203125, -6.49560546875, -6.311248779296875, -6.12689208984375, -5.942535400390625, -5.7581787109375, -5.573822021484375, -5.38946533203125, -5.205108642578125, -5.020751953125, -4.836395263671875, -4.65203857421875, -4.467681884765625, -4.2833251953125, -4.098968505859375, -3.91461181640625, -3.730255126953125, -3.5458984375, -3.361541748046875, -3.17718505859375, -2.992828369140625, -2.8084716796875, -2.624114990234375, -2.43975830078125, -2.255401611328125, -2.071044921875, -1.886688232421875, -1.70233154296875, -1.517974853515625, -1.3336181640625, -1.149261474609375, -0.96490478515625, -0.780548095703125, -0.59619140625, -0.411834716796875, -0.22747802734375, -0.043121337890625, 0.1412353515625, 0.325592041015625, 0.50994873046875, 0.694305419921875, 0.878662109375, 1.063018798828125, 1.24737548828125, 1.431732177734375, 1.6160888671875, 1.800445556640625, 1.98480224609375, 2.169158935546875, 2.353515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 29.0, 51.0, 123.0, 256.0, 279.0, 156.0, 55.0, 23.0, 7.0, 5.0, 5.0, 0.0, 0.0, 1.0], "bins": [-61.468017578125, -60.33716583251953, -59.2063102722168, -58.07545852661133, -56.944602966308594, -55.813751220703125, -54.68289566040039, -53.55204391479492, -52.42118835449219, -51.29033660888672, -50.159481048583984, -49.028629302978516, -47.89777374267578, -46.76692199707031, -45.63606643676758, -44.50521469116211, -43.37436294555664, -42.24351119995117, -41.11265563964844, -39.98180389404297, -38.850948333740234, -37.720096588134766, -36.58924102783203, -35.45838928222656, -34.327537536621094, -33.196685791015625, -32.06583023071289, -30.93497657775879, -29.804122924804688, -28.67327117919922, -27.542417526245117, -26.411563873291016, -25.280712127685547, -24.149858474731445, -23.019004821777344, -21.888151168823242, -20.75729751586914, -19.626445770263672, -18.49559211730957, -17.36473846435547, -16.233882904052734, -15.103029251098633, -13.972175598144531, -12.841322898864746, -11.710469245910645, -10.579615592956543, -9.448762893676758, -8.317909240722656, -7.187056541442871, -6.0562028884887695, -4.925349712371826, -3.7944962978363037, -2.6636428833007812, -1.5327892303466797, -0.40193605422973633, 0.728917121887207, 1.8597707748413086, 2.990624189376831, 4.1214776039123535, 5.252330780029297, 6.383184432983398, 7.5140380859375, 8.644891738891602, 9.775744438171387, 10.906598091125488]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 9.0, 7.0, 8.0, 12.0, 20.0, 8.0, 14.0, 21.0, 23.0, 29.0, 32.0, 36.0, 49.0, 42.0, 52.0, 43.0, 54.0, 59.0, 59.0, 47.0, 37.0, 42.0, 36.0, 45.0, 35.0, 30.0, 29.0, 19.0, 26.0, 23.0, 14.0, 6.0, 9.0, 3.0, 2.0, 5.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.26739501953125, -16.66203498840332, -16.056676864624023, -15.451316833496094, -14.84595775604248, -14.240598678588867, -13.635239601135254, -13.02988052368164, -12.424520492553711, -11.819161415100098, -11.213802337646484, -10.608442306518555, -10.003083229064941, -9.397724151611328, -8.792365074157715, -8.187005996704102, -7.581646919250488, -6.976287841796875, -6.3709282875061035, -5.76556921005249, -5.160209655761719, -4.5548505783081055, -3.949491500854492, -3.3441319465637207, -2.7387728691101074, -2.133413553237915, -1.5280543565750122, -0.9226951599121094, -0.317335844039917, 0.2880234718322754, 0.8933825492858887, 1.4987421035766602, 2.1041011810302734, 2.709460496902466, 3.314819812774658, 3.9201788902282715, 4.525538444519043, 5.130897521972656, 5.7362565994262695, 6.341616153717041, 6.946975231170654, 7.552334308624268, 8.157693862915039, 8.763052940368652, 9.368412017822266, 9.973772048950195, 10.579130172729492, 11.184490203857422, 11.789849281311035, 12.395208358764648, 13.000567436218262, 13.605926513671875, 14.211286544799805, 14.816645622253418, 15.422004699707031, 16.02736473083496, 16.632722854614258, 17.238082885742188, 17.843441009521484, 18.448801040649414, 19.05415916442871, 19.65951919555664, 20.264877319335938, 20.870237350463867, 21.475597381591797]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 14.0, 13.0, 22.0, 31.0, 44.0, 66.0, 85.0, 111.0, 196.0, 312.0, 620.0, 1389.0, 5572.0, 4092387.0, 86698.0, 4083.0, 1232.0, 497.0, 293.0, 169.0, 124.0, 85.0, 63.0, 38.0, 39.0, 23.0, 18.0, 7.0, 15.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3671875, -3.27838134765625, -3.1895751953125, -3.10076904296875, -3.011962890625, -2.92315673828125, -2.8343505859375, -2.74554443359375, -2.65673828125, -2.56793212890625, -2.4791259765625, -2.39031982421875, -2.301513671875, -2.21270751953125, -2.1239013671875, -2.03509521484375, -1.9462890625, -1.85748291015625, -1.7686767578125, -1.67987060546875, -1.591064453125, -1.50225830078125, -1.4134521484375, -1.32464599609375, -1.23583984375, -1.14703369140625, -1.0582275390625, -0.96942138671875, -0.880615234375, -0.79180908203125, -0.7030029296875, -0.61419677734375, -0.525390625, -0.43658447265625, -0.3477783203125, -0.25897216796875, -0.170166015625, -0.08135986328125, 0.0074462890625, 0.09625244140625, 0.18505859375, 0.27386474609375, 0.3626708984375, 0.45147705078125, 0.540283203125, 0.62908935546875, 0.7178955078125, 0.80670166015625, 0.8955078125, 0.98431396484375, 1.0731201171875, 1.16192626953125, 1.250732421875, 1.33953857421875, 1.4283447265625, 1.51715087890625, 1.60595703125, 1.69476318359375, 1.7835693359375, 1.87237548828125, 1.961181640625, 2.04998779296875, 2.1387939453125, 2.22760009765625, 2.31640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 8.0, 7.0, 7.0, 16.0, 6.0, 19.0, 24.0, 39.0, 34.0, 57.0, 55.0, 82.0, 70.0, 87.0, 71.0, 74.0, 55.0, 68.0, 49.0, 34.0, 16.0, 22.0, 25.0, 11.0, 16.0, 13.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2237472534179688, -1.1887054443359375, -1.1536636352539062, -1.118621826171875, -1.0835800170898438, -1.0485382080078125, -1.0134963989257812, -0.97845458984375, -0.9434127807617188, -0.9083709716796875, -0.8733291625976562, -0.838287353515625, -0.8032455444335938, -0.7682037353515625, -0.7331619262695312, -0.6981201171875, -0.6630783081054688, -0.6280364990234375, -0.5929946899414062, -0.557952880859375, -0.5229110717773438, -0.4878692626953125, -0.45282745361328125, -0.41778564453125, -0.38274383544921875, -0.3477020263671875, -0.31266021728515625, -0.277618408203125, -0.24257659912109375, -0.2075347900390625, -0.17249298095703125, -0.137451171875, -0.10240936279296875, -0.0673675537109375, -0.03232574462890625, 0.002716064453125, 0.03775787353515625, 0.0727996826171875, 0.10784149169921875, 0.14288330078125, 0.17792510986328125, 0.2129669189453125, 0.24800872802734375, 0.283050537109375, 0.31809234619140625, 0.3531341552734375, 0.38817596435546875, 0.4232177734375, 0.45825958251953125, 0.4933013916015625, 0.5283432006835938, 0.563385009765625, 0.5984268188476562, 0.6334686279296875, 0.6685104370117188, 0.70355224609375, 0.7385940551757812, 0.7736358642578125, 0.8086776733398438, 0.843719482421875, 0.8787612915039062, 0.9138031005859375, 0.9488449096679688, 0.98388671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 13.0, 13.0, 32.0, 26.0, 34.0, 52.0, 88.0, 92.0, 133.0, 203.0, 357.0, 586.0, 1422.0, 3668.0, 14786.0, 4081463.0, 78034.0, 8327.0, 2480.0, 1009.0, 461.0, 272.0, 185.0, 143.0, 100.0, 78.0, 67.0, 42.0, 28.0, 23.0, 16.0, 8.0, 5.0, 5.0, 5.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.07159423828125, -2.0064697265625, -1.94134521484375, -1.876220703125, -1.81109619140625, -1.7459716796875, -1.68084716796875, -1.61572265625, -1.55059814453125, -1.4854736328125, -1.42034912109375, -1.355224609375, -1.29010009765625, -1.2249755859375, -1.15985107421875, -1.0947265625, -1.02960205078125, -0.9644775390625, -0.89935302734375, -0.834228515625, -0.76910400390625, -0.7039794921875, -0.63885498046875, -0.57373046875, -0.50860595703125, -0.4434814453125, -0.37835693359375, -0.313232421875, -0.24810791015625, -0.1829833984375, -0.11785888671875, -0.052734375, 0.01239013671875, 0.0775146484375, 0.14263916015625, 0.207763671875, 0.27288818359375, 0.3380126953125, 0.40313720703125, 0.46826171875, 0.53338623046875, 0.5985107421875, 0.66363525390625, 0.728759765625, 0.79388427734375, 0.8590087890625, 0.92413330078125, 0.9892578125, 1.05438232421875, 1.1195068359375, 1.18463134765625, 1.249755859375, 1.31488037109375, 1.3800048828125, 1.44512939453125, 1.51025390625, 1.57537841796875, 1.6405029296875, 1.70562744140625, 1.770751953125, 1.83587646484375, 1.9010009765625, 1.96612548828125, 2.03125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 23.0, 77.0, 3817.0, 85.0, 27.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23583984375, -0.2169342041015625, -0.198028564453125, -0.1791229248046875, -0.16021728515625, -0.1413116455078125, -0.122406005859375, -0.1035003662109375, -0.0845947265625, -0.0656890869140625, -0.046783447265625, -0.0278778076171875, -0.00897216796875, 0.0099334716796875, 0.028839111328125, 0.0477447509765625, 0.066650390625, 0.0855560302734375, 0.104461669921875, 0.1233673095703125, 0.14227294921875, 0.1611785888671875, 0.180084228515625, 0.1989898681640625, 0.2178955078125, 0.2368011474609375, 0.255706787109375, 0.2746124267578125, 0.29351806640625, 0.3124237060546875, 0.331329345703125, 0.3502349853515625, 0.369140625, 0.3880462646484375, 0.406951904296875, 0.4258575439453125, 0.44476318359375, 0.4636688232421875, 0.482574462890625, 0.5014801025390625, 0.5203857421875, 0.5392913818359375, 0.558197021484375, 0.5771026611328125, 0.59600830078125, 0.6149139404296875, 0.633819580078125, 0.6527252197265625, 0.671630859375, 0.6905364990234375, 0.709442138671875, 0.7283477783203125, 0.74725341796875, 0.7661590576171875, 0.785064697265625, 0.8039703369140625, 0.8228759765625, 0.8417816162109375, 0.860687255859375, 0.8795928955078125, 0.89849853515625, 0.9174041748046875, 0.936309814453125, 0.9552154541015625, 0.97412109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 130.0, 745.0, 118.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.236989974975586, -9.93779468536377, -9.638599395751953, -9.339405059814453, -9.040209770202637, -8.74101448059082, -8.441819190979004, -8.142623901367188, -7.843428611755371, -7.544233322143555, -7.2450385093688965, -6.94584321975708, -6.646647930145264, -6.3474531173706055, -6.048257827758789, -5.749062538146973, -5.4498677253723145, -5.150672435760498, -4.85147762298584, -4.552282333374023, -4.253087043762207, -3.9538919925689697, -3.6546969413757324, -3.355501651763916, -3.0563066005706787, -2.7571115493774414, -2.457916259765625, -2.1587212085723877, -1.8595260381698608, -1.560330867767334, -1.2611358165740967, -0.9619405269622803, -0.662745475769043, -0.3635503351688385, -0.06435519456863403, 0.23483991622924805, 0.5340350866317749, 0.8332302570343018, 1.132425308227539, 1.4316205978393555, 1.7308156490325928, 2.03001070022583, 2.3292059898376465, 2.628401041030884, 2.927596092224121, 3.2267913818359375, 3.525986433029175, 3.825181722640991, 4.1243767738342285, 4.423572063446045, 4.722766876220703, 5.0219621658325195, 5.321157455444336, 5.620352745056152, 5.9195475578308105, 6.218742847442627, 6.517937660217285, 6.817132949829102, 7.11632776260376, 7.415523052215576, 7.714718341827393, 8.01391315460205, 8.313108444213867, 8.612303733825684, 8.9114990234375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 9.0, 5.0, 8.0, 11.0, 18.0, 16.0, 21.0, 27.0, 25.0, 30.0, 37.0, 36.0, 43.0, 40.0, 44.0, 54.0, 49.0, 54.0, 57.0, 51.0, 39.0, 40.0, 34.0, 35.0, 28.0, 35.0, 25.0, 26.0, 20.0, 11.0, 26.0, 14.0, 16.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9321097731590271, -0.8937767744064331, -0.8554438352584839, -0.8171108365058899, -0.7787778973579407, -0.7404448986053467, -0.7021119594573975, -0.6637789607048035, -0.6254459619522095, -0.5871129631996155, -0.5487800240516663, -0.5104470252990723, -0.47211408615112305, -0.43378108739852905, -0.39544811844825745, -0.35711514949798584, -0.3187822103500366, -0.280449241399765, -0.2421162724494934, -0.2037832885980606, -0.165450319647789, -0.1271173506975174, -0.0887843668460846, -0.05045139789581299, -0.012118428945541382, 0.026214543730020523, 0.06454751640558243, 0.10288049280643463, 0.14121346175670624, 0.17954643070697784, 0.21787941455841064, 0.25621238350868225, 0.29454541206359863, 0.33287838101387024, 0.37121134996414185, 0.40954434871673584, 0.44787728786468506, 0.48621028661727905, 0.524543285369873, 0.5628762245178223, 0.6012091636657715, 0.6395421624183655, 0.6778751015663147, 0.7162081003189087, 0.7545410394668579, 0.7928740382194519, 0.8312070369720459, 0.8695399761199951, 0.9078729748725891, 0.9462059736251831, 0.9845389127731323, 1.0228718519210815, 1.0612049102783203, 1.0995378494262695, 1.1378707885742188, 1.176203727722168, 1.2145367860794067, 1.252869725227356, 1.2912027835845947, 1.329535722732544, 1.3678686618804932, 1.4062016010284424, 1.4445346593856812, 1.4828675985336304, 1.5212005376815796]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 7.0, 6.0, 13.0, 19.0, 30.0, 40.0, 59.0, 67.0, 132.0, 199.0, 289.0, 474.0, 860.0, 1676.0, 3304.0, 7881.0, 21945.0, 83774.0, 503186.0, 337929.0, 57257.0, 16906.0, 6379.0, 2828.0, 1319.0, 749.0, 454.0, 254.0, 160.0, 101.0, 76.0, 62.0, 34.0, 19.0, 22.0, 10.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.16796875, -2.103973388671875, -2.03997802734375, -1.975982666015625, -1.9119873046875, -1.847991943359375, -1.78399658203125, -1.720001220703125, -1.656005859375, -1.592010498046875, -1.52801513671875, -1.464019775390625, -1.4000244140625, -1.336029052734375, -1.27203369140625, -1.208038330078125, -1.14404296875, -1.080047607421875, -1.01605224609375, -0.952056884765625, -0.8880615234375, -0.824066162109375, -0.76007080078125, -0.696075439453125, -0.632080078125, -0.568084716796875, -0.50408935546875, -0.440093994140625, -0.3760986328125, -0.312103271484375, -0.24810791015625, -0.184112548828125, -0.1201171875, -0.056121826171875, 0.00787353515625, 0.071868896484375, 0.1358642578125, 0.199859619140625, 0.26385498046875, 0.327850341796875, 0.391845703125, 0.455841064453125, 0.51983642578125, 0.583831787109375, 0.6478271484375, 0.711822509765625, 0.77581787109375, 0.839813232421875, 0.90380859375, 0.967803955078125, 1.03179931640625, 1.095794677734375, 1.1597900390625, 1.223785400390625, 1.28778076171875, 1.351776123046875, 1.415771484375, 1.479766845703125, 1.54376220703125, 1.607757568359375, 1.6717529296875, 1.735748291015625, 1.79974365234375, 1.863739013671875, 1.927734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 10.0, 7.0, 5.0, 20.0, 18.0, 27.0, 26.0, 30.0, 52.0, 55.0, 67.0, 72.0, 77.0, 73.0, 67.0, 68.0, 60.0, 55.0, 44.0, 30.0, 21.0, 25.0, 14.0, 19.0, 11.0, 13.0, 10.0, 2.0, 2.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2147293090820312, -1.1804351806640625, -1.1461410522460938, -1.111846923828125, -1.0775527954101562, -1.0432586669921875, -1.0089645385742188, -0.97467041015625, -0.9403762817382812, -0.9060821533203125, -0.8717880249023438, -0.837493896484375, -0.8031997680664062, -0.7689056396484375, -0.7346115112304688, -0.7003173828125, -0.6660232543945312, -0.6317291259765625, -0.5974349975585938, -0.563140869140625, -0.5288467407226562, -0.4945526123046875, -0.46025848388671875, -0.42596435546875, -0.39167022705078125, -0.3573760986328125, -0.32308197021484375, -0.288787841796875, -0.25449371337890625, -0.2201995849609375, -0.18590545654296875, -0.151611328125, -0.11731719970703125, -0.0830230712890625, -0.04872894287109375, -0.014434814453125, 0.01985931396484375, 0.0541534423828125, 0.08844757080078125, 0.12274169921875, 0.15703582763671875, 0.1913299560546875, 0.22562408447265625, 0.259918212890625, 0.29421234130859375, 0.3285064697265625, 0.36280059814453125, 0.3970947265625, 0.43138885498046875, 0.4656829833984375, 0.49997711181640625, 0.534271240234375, 0.5685653686523438, 0.6028594970703125, 0.6371536254882812, 0.67144775390625, 0.7057418823242188, 0.7400360107421875, 0.7743301391601562, 0.808624267578125, 0.8429183959960938, 0.8772125244140625, 0.9115066528320312, 0.94580078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 15.0, 27.0, 38.0, 70.0, 124.0, 235.0, 432.0, 789.0, 1716.0, 4406.0, 19612.0, 333780.0, 649232.0, 28537.0, 5559.0, 1958.0, 901.0, 470.0, 247.0, 133.0, 86.0, 64.0, 37.0, 16.0, 13.0, 9.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.619903564453125, -3.50347900390625, -3.387054443359375, -3.2706298828125, -3.154205322265625, -3.03778076171875, -2.921356201171875, -2.804931640625, -2.688507080078125, -2.57208251953125, -2.455657958984375, -2.3392333984375, -2.222808837890625, -2.10638427734375, -1.989959716796875, -1.87353515625, -1.757110595703125, -1.64068603515625, -1.524261474609375, -1.4078369140625, -1.291412353515625, -1.17498779296875, -1.058563232421875, -0.942138671875, -0.825714111328125, -0.70928955078125, -0.592864990234375, -0.4764404296875, -0.360015869140625, -0.24359130859375, -0.127166748046875, -0.0107421875, 0.105682373046875, 0.22210693359375, 0.338531494140625, 0.4549560546875, 0.571380615234375, 0.68780517578125, 0.804229736328125, 0.920654296875, 1.037078857421875, 1.15350341796875, 1.269927978515625, 1.3863525390625, 1.502777099609375, 1.61920166015625, 1.735626220703125, 1.85205078125, 1.968475341796875, 2.08489990234375, 2.201324462890625, 2.3177490234375, 2.434173583984375, 2.55059814453125, 2.667022705078125, 2.783447265625, 2.899871826171875, 3.01629638671875, 3.132720947265625, 3.2491455078125, 3.365570068359375, 3.48199462890625, 3.598419189453125, 3.71484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 5.0, 10.0, 7.0, 15.0, 18.0, 23.0, 32.0, 38.0, 41.0, 62.0, 57.0, 53.0, 64.0, 63.0, 79.0, 63.0, 62.0, 62.0, 44.0, 49.0, 36.0, 35.0, 20.0, 16.0, 12.0, 6.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.62005615234375, -4.4471435546875, -4.27423095703125, -4.101318359375, -3.92840576171875, -3.7554931640625, -3.58258056640625, -3.40966796875, -3.23675537109375, -3.0638427734375, -2.89093017578125, -2.718017578125, -2.54510498046875, -2.3721923828125, -2.19927978515625, -2.0263671875, -1.85345458984375, -1.6805419921875, -1.50762939453125, -1.334716796875, -1.16180419921875, -0.9888916015625, -0.81597900390625, -0.64306640625, -0.47015380859375, -0.2972412109375, -0.12432861328125, 0.048583984375, 0.22149658203125, 0.3944091796875, 0.56732177734375, 0.740234375, 0.91314697265625, 1.0860595703125, 1.25897216796875, 1.431884765625, 1.60479736328125, 1.7777099609375, 1.95062255859375, 2.12353515625, 2.29644775390625, 2.4693603515625, 2.64227294921875, 2.815185546875, 2.98809814453125, 3.1610107421875, 3.33392333984375, 3.5068359375, 3.67974853515625, 3.8526611328125, 4.02557373046875, 4.198486328125, 4.37139892578125, 4.5443115234375, 4.71722412109375, 4.89013671875, 5.06304931640625, 5.2359619140625, 5.40887451171875, 5.581787109375, 5.75469970703125, 5.9276123046875, 6.10052490234375, 6.2734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 11.0, 14.0, 32.0, 102.0, 341.0, 1446.0, 13347.0, 1020230.0, 11188.0, 1394.0, 271.0, 92.0, 50.0, 13.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.53125, -6.36578369140625, -6.2003173828125, -6.03485107421875, -5.869384765625, -5.70391845703125, -5.5384521484375, -5.37298583984375, -5.20751953125, -5.04205322265625, -4.8765869140625, -4.71112060546875, -4.545654296875, -4.38018798828125, -4.2147216796875, -4.04925537109375, -3.8837890625, -3.71832275390625, -3.5528564453125, -3.38739013671875, -3.221923828125, -3.05645751953125, -2.8909912109375, -2.72552490234375, -2.56005859375, -2.39459228515625, -2.2291259765625, -2.06365966796875, -1.898193359375, -1.73272705078125, -1.5672607421875, -1.40179443359375, -1.236328125, -1.07086181640625, -0.9053955078125, -0.73992919921875, -0.574462890625, -0.40899658203125, -0.2435302734375, -0.07806396484375, 0.08740234375, 0.25286865234375, 0.4183349609375, 0.58380126953125, 0.749267578125, 0.91473388671875, 1.0802001953125, 1.24566650390625, 1.4111328125, 1.57659912109375, 1.7420654296875, 1.90753173828125, 2.072998046875, 2.23846435546875, 2.4039306640625, 2.56939697265625, 2.73486328125, 2.90032958984375, 3.0657958984375, 3.23126220703125, 3.396728515625, 3.56219482421875, 3.7276611328125, 3.89312744140625, 4.05859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 9.0, 7.0, 16.0, 33.0, 70.0, 189.0, 274.0, 205.0, 112.0, 45.0, 12.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022149085998535156, -0.0002125091850757599, -0.0002035275101661682, -0.00019454583525657654, -0.00018556416034698486, -0.0001765824854373932, -0.00016760081052780151, -0.00015861913561820984, -0.00014963746070861816, -0.0001406557857990265, -0.00013167411088943481, -0.00012269243597984314, -0.00011371076107025146, -0.00010472908616065979, -9.574741125106812e-05, -8.676573634147644e-05, -7.778406143188477e-05, -6.880238652229309e-05, -5.9820711612701416e-05, -5.083903670310974e-05, -4.1857361793518066e-05, -3.287568688392639e-05, -2.3894011974334717e-05, -1.4912337064743042e-05, -5.930662155151367e-06, 3.0510127544403076e-06, 1.2032687664031982e-05, 2.1014362573623657e-05, 2.9996037483215332e-05, 3.897771239280701e-05, 4.795938730239868e-05, 5.6941062211990356e-05, 6.592273712158203e-05, 7.49044120311737e-05, 8.388608694076538e-05, 9.286776185035706e-05, 0.00010184943675994873, 0.0001108311116695404, 0.00011981278657913208, 0.00012879446148872375, 0.00013777613639831543, 0.0001467578113079071, 0.00015573948621749878, 0.00016472116112709045, 0.00017370283603668213, 0.0001826845109462738, 0.00019166618585586548, 0.00020064786076545715, 0.00020962953567504883, 0.0002186112105846405, 0.00022759288549423218, 0.00023657456040382385, 0.00024555623531341553, 0.0002545379102230072, 0.0002635195851325989, 0.00027250126004219055, 0.0002814829349517822, 0.0002904646098613739, 0.0002994462847709656, 0.00030842795968055725, 0.0003174096345901489, 0.0003263913094997406, 0.0003353729844093323, 0.00034435465931892395, 0.0003533363342285156]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 11.0, 4.0, 13.0, 12.0, 16.0, 39.0, 46.0, 73.0, 144.0, 279.0, 543.0, 1326.0, 3478.0, 12171.0, 778799.0, 237282.0, 9244.0, 2793.0, 1156.0, 551.0, 234.0, 128.0, 63.0, 59.0, 27.0, 21.0, 13.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.9482421875, -1.873046875, -1.7978515625, -1.72265625, -1.6474609375, -1.572265625, -1.4970703125, -1.421875, -1.3466796875, -1.271484375, -1.1962890625, -1.12109375, -1.0458984375, -0.970703125, -0.8955078125, -0.8203125, -0.7451171875, -0.669921875, -0.5947265625, -0.51953125, -0.4443359375, -0.369140625, -0.2939453125, -0.21875, -0.1435546875, -0.068359375, 0.0068359375, 0.08203125, 0.1572265625, 0.232421875, 0.3076171875, 0.3828125, 0.4580078125, 0.533203125, 0.6083984375, 0.68359375, 0.7587890625, 0.833984375, 0.9091796875, 0.984375, 1.0595703125, 1.134765625, 1.2099609375, 1.28515625, 1.3603515625, 1.435546875, 1.5107421875, 1.5859375, 1.6611328125, 1.736328125, 1.8115234375, 1.88671875, 1.9619140625, 2.037109375, 2.1123046875, 2.1875, 2.2626953125, 2.337890625, 2.4130859375, 2.48828125, 2.5634765625, 2.638671875, 2.7138671875, 2.7890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 9.0, 23.0, 92.0, 354.0, 331.0, 94.0, 19.0, 12.0, 9.0, 5.0, 3.0, 2.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.859222412109375, -2.70867919921875, -2.558135986328125, -2.4075927734375, -2.257049560546875, -2.10650634765625, -1.955963134765625, -1.805419921875, -1.654876708984375, -1.50433349609375, -1.353790283203125, -1.2032470703125, -1.052703857421875, -0.90216064453125, -0.751617431640625, -0.60107421875, -0.450531005859375, -0.29998779296875, -0.149444580078125, 0.0010986328125, 0.151641845703125, 0.30218505859375, 0.452728271484375, 0.603271484375, 0.753814697265625, 0.90435791015625, 1.054901123046875, 1.2054443359375, 1.355987548828125, 1.50653076171875, 1.657073974609375, 1.8076171875, 1.958160400390625, 2.10870361328125, 2.259246826171875, 2.4097900390625, 2.560333251953125, 2.71087646484375, 2.861419677734375, 3.011962890625, 3.162506103515625, 3.31304931640625, 3.463592529296875, 3.6141357421875, 3.764678955078125, 3.91522216796875, 4.065765380859375, 4.21630859375, 4.366851806640625, 4.51739501953125, 4.667938232421875, 4.8184814453125, 4.969024658203125, 5.11956787109375, 5.270111083984375, 5.420654296875, 5.571197509765625, 5.72174072265625, 5.872283935546875, 6.0228271484375, 6.173370361328125, 6.32391357421875, 6.474456787109375, 6.625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 12.0, 41.0, 132.0, 289.0, 278.0, 128.0, 70.0, 29.0, 19.0, 9.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.160404205322266, -25.91027069091797, -24.660137176513672, -23.410003662109375, -22.159870147705078, -20.90973663330078, -19.659605026245117, -18.40947151184082, -17.159337997436523, -15.909204483032227, -14.65907096862793, -13.40893840789795, -12.158804893493652, -10.908671379089355, -9.658538818359375, -8.408405303955078, -7.158271789550781, -5.908138275146484, -4.658005237579346, -3.407871961593628, -2.15773868560791, -0.9076051712036133, 0.3425278663635254, 1.592660903930664, 2.842794418334961, 4.092927932739258, 5.3430609703063965, 6.593194007873535, 7.843327522277832, 9.093461036682129, 10.34359359741211, 11.593727111816406, 12.843864440917969, 14.093997955322266, 15.344131469726562, 16.59426498413086, 17.844398498535156, 19.094532012939453, 20.344663619995117, 21.594797134399414, 22.84493064880371, 24.095064163208008, 25.345197677612305, 26.5953311920166, 27.845462799072266, 29.095596313476562, 30.34572982788086, 31.595863342285156, 32.84599685668945, 34.09613037109375, 35.34626388549805, 36.596397399902344, 37.84653091430664, 39.09666442871094, 40.346797943115234, 41.59693145751953, 42.84706115722656, 44.09719467163086, 45.347328186035156, 46.59746170043945, 47.84759521484375, 49.09772872924805, 50.347862243652344, 51.597991943359375, 52.84812927246094]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 7.0, 6.0, 12.0, 10.0, 17.0, 8.0, 17.0, 12.0, 19.0, 18.0, 24.0, 24.0, 21.0, 31.0, 22.0, 50.0, 42.0, 45.0, 40.0, 42.0, 30.0, 44.0, 47.0, 45.0, 40.0, 44.0, 37.0, 31.0, 30.0, 28.0, 31.0, 13.0, 16.0, 21.0, 18.0, 18.0, 10.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.617327690124512, -15.052301406860352, -14.487274169921875, -13.922247886657715, -13.357221603393555, -12.792194366455078, -12.227168083190918, -11.662141799926758, -11.097114562988281, -10.532088279724121, -9.967061042785645, -9.402034759521484, -8.837007522583008, -8.271981239318848, -7.7069549560546875, -7.141928195953369, -6.576901435852051, -6.011874675750732, -5.446847915649414, -4.881821632385254, -4.3167948722839355, -3.751768112182617, -3.186741590499878, -2.6217150688171387, -2.0566883087158203, -1.4916616678237915, -0.9266350269317627, -0.3616083860397339, 0.20341825485229492, 0.7684450149536133, 1.3334715366363525, 1.8984980583190918, 2.4635257720947266, 3.028552532196045, 3.593579053878784, 4.158605575561523, 4.723632335662842, 5.28865909576416, 5.85368537902832, 6.418712139129639, 6.983738899230957, 7.548765659332275, 8.113792419433594, 8.678818702697754, 9.243844985961914, 9.80887222290039, 10.37389850616455, 10.938924789428711, 11.503952026367188, 12.068978309631348, 12.634005546569824, 13.199031829833984, 13.764059066772461, 14.329085350036621, 14.894111633300781, 15.459138870239258, 16.024166107177734, 16.58919334411621, 17.154218673706055, 17.71924591064453, 18.284273147583008, 18.849300384521484, 19.414325714111328, 19.979352951049805, 20.54437828063965]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 9.0, 6.0, 4.0, 9.0, 13.0, 10.0, 18.0, 26.0, 39.0, 54.0, 81.0, 136.0, 233.0, 425.0, 1018.0, 3183.0, 28463.0, 4143983.0, 12394.0, 2365.0, 814.0, 367.0, 212.0, 131.0, 86.0, 55.0, 25.0, 21.0, 18.0, 19.0, 17.0, 6.0, 15.0, 10.0, 3.0, 4.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.88714599609375, -3.7547607421875, -3.62237548828125, -3.489990234375, -3.35760498046875, -3.2252197265625, -3.09283447265625, -2.96044921875, -2.82806396484375, -2.6956787109375, -2.56329345703125, -2.430908203125, -2.29852294921875, -2.1661376953125, -2.03375244140625, -1.9013671875, -1.76898193359375, -1.6365966796875, -1.50421142578125, -1.371826171875, -1.23944091796875, -1.1070556640625, -0.97467041015625, -0.84228515625, -0.70989990234375, -0.5775146484375, -0.44512939453125, -0.312744140625, -0.18035888671875, -0.0479736328125, 0.08441162109375, 0.216796875, 0.34918212890625, 0.4815673828125, 0.61395263671875, 0.746337890625, 0.87872314453125, 1.0111083984375, 1.14349365234375, 1.27587890625, 1.40826416015625, 1.5406494140625, 1.67303466796875, 1.805419921875, 1.93780517578125, 2.0701904296875, 2.20257568359375, 2.3349609375, 2.46734619140625, 2.5997314453125, 2.73211669921875, 2.864501953125, 2.99688720703125, 3.1292724609375, 3.26165771484375, 3.39404296875, 3.52642822265625, 3.6588134765625, 3.79119873046875, 3.923583984375, 4.05596923828125, 4.1883544921875, 4.32073974609375, 4.453125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 8.0, 14.0, 16.0, 27.0, 34.0, 34.0, 51.0, 48.0, 59.0, 78.0, 67.0, 70.0, 81.0, 73.0, 63.0, 54.0, 42.0, 34.0, 30.0, 22.0, 12.0, 16.0, 11.0, 9.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8544921875, -0.81842041015625, -0.7823486328125, -0.74627685546875, -0.710205078125, -0.67413330078125, -0.6380615234375, -0.60198974609375, -0.56591796875, -0.52984619140625, -0.4937744140625, -0.45770263671875, -0.421630859375, -0.38555908203125, -0.3494873046875, -0.31341552734375, -0.27734375, -0.24127197265625, -0.2052001953125, -0.16912841796875, -0.133056640625, -0.09698486328125, -0.0609130859375, -0.02484130859375, 0.01123046875, 0.04730224609375, 0.0833740234375, 0.11944580078125, 0.155517578125, 0.19158935546875, 0.2276611328125, 0.26373291015625, 0.2998046875, 0.33587646484375, 0.3719482421875, 0.40802001953125, 0.444091796875, 0.48016357421875, 0.5162353515625, 0.55230712890625, 0.58837890625, 0.62445068359375, 0.6605224609375, 0.69659423828125, 0.732666015625, 0.76873779296875, 0.8048095703125, 0.84088134765625, 0.876953125, 0.91302490234375, 0.9490966796875, 0.98516845703125, 1.021240234375, 1.05731201171875, 1.0933837890625, 1.12945556640625, 1.16552734375, 1.20159912109375, 1.2376708984375, 1.27374267578125, 1.309814453125, 1.34588623046875, 1.3819580078125, 1.41802978515625, 1.4541015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 9.0, 7.0, 15.0, 18.0, 17.0, 37.0, 34.0, 38.0, 60.0, 69.0, 105.0, 117.0, 191.0, 247.0, 299.0, 385.0, 897.0, 10436.0, 4175136.0, 4050.0, 650.0, 328.0, 256.0, 181.0, 184.0, 106.0, 87.0, 80.0, 60.0, 39.0, 28.0, 22.0, 22.0, 18.0, 10.0, 11.0, 11.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.63671875, -11.265625, -10.89453125, -10.5234375, -10.15234375, -9.78125, -9.41015625, -9.0390625, -8.66796875, -8.296875, -7.92578125, -7.5546875, -7.18359375, -6.8125, -6.44140625, -6.0703125, -5.69921875, -5.328125, -4.95703125, -4.5859375, -4.21484375, -3.84375, -3.47265625, -3.1015625, -2.73046875, -2.359375, -1.98828125, -1.6171875, -1.24609375, -0.875, -0.50390625, -0.1328125, 0.23828125, 0.609375, 0.98046875, 1.3515625, 1.72265625, 2.09375, 2.46484375, 2.8359375, 3.20703125, 3.578125, 3.94921875, 4.3203125, 4.69140625, 5.0625, 5.43359375, 5.8046875, 6.17578125, 6.546875, 6.91796875, 7.2890625, 7.66015625, 8.03125, 8.40234375, 8.7734375, 9.14453125, 9.515625, 9.88671875, 10.2578125, 10.62890625, 11.0, 11.37109375, 11.7421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 25.0, 4003.0, 40.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.640625, -13.37078857421875, -13.1009521484375, -12.83111572265625, -12.561279296875, -12.29144287109375, -12.0216064453125, -11.75177001953125, -11.48193359375, -11.21209716796875, -10.9422607421875, -10.67242431640625, -10.402587890625, -10.13275146484375, -9.8629150390625, -9.59307861328125, -9.3232421875, -9.05340576171875, -8.7835693359375, -8.51373291015625, -8.243896484375, -7.97406005859375, -7.7042236328125, -7.43438720703125, -7.16455078125, -6.89471435546875, -6.6248779296875, -6.35504150390625, -6.085205078125, -5.81536865234375, -5.5455322265625, -5.27569580078125, -5.005859375, -4.73602294921875, -4.4661865234375, -4.19635009765625, -3.926513671875, -3.65667724609375, -3.3868408203125, -3.11700439453125, -2.84716796875, -2.57733154296875, -2.3074951171875, -2.03765869140625, -1.767822265625, -1.49798583984375, -1.2281494140625, -0.95831298828125, -0.6884765625, -0.41864013671875, -0.1488037109375, 0.12103271484375, 0.390869140625, 0.66070556640625, 0.9305419921875, 1.20037841796875, 1.47021484375, 1.74005126953125, 2.0098876953125, 2.27972412109375, 2.549560546875, 2.81939697265625, 3.0892333984375, 3.35906982421875, 3.62890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 24.0, 55.0, 184.0, 438.0, 212.0, 62.0, 12.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.379966735839844, -33.69788360595703, -33.01579666137695, -32.33371353149414, -31.651628494262695, -30.96954345703125, -30.287460327148438, -29.605375289916992, -28.923290252685547, -28.2412052154541, -27.55912208557129, -26.877037048339844, -26.1949520111084, -25.512866973876953, -24.83078384399414, -24.148698806762695, -23.466615676879883, -22.784530639648438, -22.102447509765625, -21.42036247253418, -20.738277435302734, -20.056194305419922, -19.374109268188477, -18.69202423095703, -18.00994110107422, -17.327856063842773, -16.64577293395996, -15.963687896728516, -15.28160285949707, -14.599518775939941, -13.917434692382812, -13.235349655151367, -12.553266525268555, -11.871182441711426, -11.18909740447998, -10.507013320922852, -9.824928283691406, -9.142844200134277, -8.460760116577148, -7.778675556182861, -7.096590995788574, -6.414506435394287, -5.732421875, -5.050337791442871, -4.368253231048584, -3.686168670654297, -3.004084587097168, -2.322000026702881, -1.6399154663085938, -0.9578310251235962, -0.27574658393859863, 0.4063377380371094, 1.0884222984313965, 1.7705068588256836, 2.4525909423828125, 3.1346755027770996, 3.8167600631713867, 4.498844623565674, 5.180929183959961, 5.86301326751709, 6.545097827911377, 7.227182388305664, 7.909266471862793, 8.591350555419922, 9.273435592651367]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 17.0, 20.0, 38.0, 64.0, 90.0, 123.0, 163.0, 140.0, 114.0, 69.0, 49.0, 41.0, 20.0, 17.0, 5.0, 9.0, 0.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28121566772461, -20.547666549682617, -19.814117431640625, -19.08056640625, -18.347017288208008, -17.613468170166016, -16.879919052124023, -16.14636993408203, -15.412819862365723, -14.67927074432373, -13.945720672607422, -13.21217155456543, -12.478622436523438, -11.745072364807129, -11.011523246765137, -10.277973175048828, -9.544424057006836, -8.810874938964844, -8.077324867248535, -7.343775749206543, -6.610226154327393, -5.876676559448242, -5.14312744140625, -4.4095778465271, -3.676028251647949, -2.942478656768799, -2.2089293003082275, -1.4753799438476562, -0.7418303489685059, -0.008280754089355469, 0.7252683639526367, 1.458817958831787, 2.1923694610595703, 2.9259190559387207, 3.659468412399292, 4.393017768859863, 5.126567363739014, 5.860116958618164, 6.593666076660156, 7.327215671539307, 8.060765266418457, 8.79431438446045, 9.527864456176758, 10.26141357421875, 10.994962692260742, 11.72851276397705, 12.462061882019043, 13.195611953735352, 13.929161071777344, 14.662710189819336, 15.396260261535645, 16.129810333251953, 16.863359451293945, 17.596908569335938, 18.33045768737793, 19.064006805419922, 19.797557830810547, 20.53110694885254, 21.26465606689453, 21.998207092285156, 22.73175621032715, 23.46530532836914, 24.198854446411133, 24.932403564453125, 25.665952682495117]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 18.0, 19.0, 40.0, 55.0, 107.0, 178.0, 336.0, 652.0, 1696.0, 5319.0, 22103.0, 151814.0, 714412.0, 124756.0, 19520.0, 4613.0, 1502.0, 676.0, 306.0, 157.0, 102.0, 62.0, 32.0, 22.0, 19.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.9449462890625, -2.844970703125, -2.7449951171875, -2.64501953125, -2.5450439453125, -2.445068359375, -2.3450927734375, -2.2451171875, -2.1451416015625, -2.045166015625, -1.9451904296875, -1.84521484375, -1.7452392578125, -1.645263671875, -1.5452880859375, -1.4453125, -1.3453369140625, -1.245361328125, -1.1453857421875, -1.04541015625, -0.9454345703125, -0.845458984375, -0.7454833984375, -0.6455078125, -0.5455322265625, -0.445556640625, -0.3455810546875, -0.24560546875, -0.1456298828125, -0.045654296875, 0.0543212890625, 0.154296875, 0.2542724609375, 0.354248046875, 0.4542236328125, 0.55419921875, 0.6541748046875, 0.754150390625, 0.8541259765625, 0.9541015625, 1.0540771484375, 1.154052734375, 1.2540283203125, 1.35400390625, 1.4539794921875, 1.553955078125, 1.6539306640625, 1.75390625, 1.8538818359375, 1.953857421875, 2.0538330078125, 2.15380859375, 2.2537841796875, 2.353759765625, 2.4537353515625, 2.5537109375, 2.6536865234375, 2.753662109375, 2.8536376953125, 2.95361328125, 3.0535888671875, 3.153564453125, 3.2535400390625, 3.353515625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 8.0, 18.0, 18.0, 21.0, 35.0, 39.0, 55.0, 66.0, 79.0, 100.0, 96.0, 97.0, 90.0, 75.0, 46.0, 45.0, 22.0, 16.0, 20.0, 12.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.876953125, -1.8171234130859375, -1.757293701171875, -1.6974639892578125, -1.63763427734375, -1.5778045654296875, -1.517974853515625, -1.4581451416015625, -1.3983154296875, -1.3384857177734375, -1.278656005859375, -1.2188262939453125, -1.15899658203125, -1.0991668701171875, -1.039337158203125, -0.9795074462890625, -0.919677734375, -0.8598480224609375, -0.800018310546875, -0.7401885986328125, -0.68035888671875, -0.6205291748046875, -0.560699462890625, -0.5008697509765625, -0.4410400390625, -0.3812103271484375, -0.321380615234375, -0.2615509033203125, -0.20172119140625, -0.1418914794921875, -0.082061767578125, -0.0222320556640625, 0.03759765625, 0.0974273681640625, 0.157257080078125, 0.2170867919921875, 0.27691650390625, 0.3367462158203125, 0.396575927734375, 0.4564056396484375, 0.5162353515625, 0.5760650634765625, 0.635894775390625, 0.6957244873046875, 0.75555419921875, 0.8153839111328125, 0.875213623046875, 0.9350433349609375, 0.994873046875, 1.0547027587890625, 1.114532470703125, 1.1743621826171875, 1.23419189453125, 1.2940216064453125, 1.353851318359375, 1.4136810302734375, 1.4735107421875, 1.5333404541015625, 1.593170166015625, 1.6529998779296875, 1.71282958984375, 1.7726593017578125, 1.832489013671875, 1.8923187255859375, 1.9521484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 14.0, 18.0, 20.0, 36.0, 48.0, 90.0, 147.0, 276.0, 717.0, 3284.0, 110577.0, 921293.0, 9946.0, 1177.0, 411.0, 192.0, 118.0, 78.0, 41.0, 23.0, 7.0, 11.0, 10.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69921875, -7.43572998046875, -7.1722412109375, -6.90875244140625, -6.645263671875, -6.38177490234375, -6.1182861328125, -5.85479736328125, -5.59130859375, -5.32781982421875, -5.0643310546875, -4.80084228515625, -4.537353515625, -4.27386474609375, -4.0103759765625, -3.74688720703125, -3.4833984375, -3.21990966796875, -2.9564208984375, -2.69293212890625, -2.429443359375, -2.16595458984375, -1.9024658203125, -1.63897705078125, -1.37548828125, -1.11199951171875, -0.8485107421875, -0.58502197265625, -0.321533203125, -0.05804443359375, 0.2054443359375, 0.46893310546875, 0.732421875, 0.99591064453125, 1.2593994140625, 1.52288818359375, 1.786376953125, 2.04986572265625, 2.3133544921875, 2.57684326171875, 2.84033203125, 3.10382080078125, 3.3673095703125, 3.63079833984375, 3.894287109375, 4.15777587890625, 4.4212646484375, 4.68475341796875, 4.9482421875, 5.21173095703125, 5.4752197265625, 5.73870849609375, 6.002197265625, 6.26568603515625, 6.5291748046875, 6.79266357421875, 7.05615234375, 7.31964111328125, 7.5831298828125, 7.84661865234375, 8.110107421875, 8.37359619140625, 8.6370849609375, 8.90057373046875, 9.1640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 39.0, 68.0, 112.0, 168.0, 184.0, 158.0, 122.0, 92.0, 30.0, 13.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.880859375, -21.35546875, -20.830078125, -20.3046875, -19.779296875, -19.25390625, -18.728515625, -18.203125, -17.677734375, -17.15234375, -16.626953125, -16.1015625, -15.576171875, -15.05078125, -14.525390625, -14.0, -13.474609375, -12.94921875, -12.423828125, -11.8984375, -11.373046875, -10.84765625, -10.322265625, -9.796875, -9.271484375, -8.74609375, -8.220703125, -7.6953125, -7.169921875, -6.64453125, -6.119140625, -5.59375, -5.068359375, -4.54296875, -4.017578125, -3.4921875, -2.966796875, -2.44140625, -1.916015625, -1.390625, -0.865234375, -0.33984375, 0.185546875, 0.7109375, 1.236328125, 1.76171875, 2.287109375, 2.8125, 3.337890625, 3.86328125, 4.388671875, 4.9140625, 5.439453125, 5.96484375, 6.490234375, 7.015625, 7.541015625, 8.06640625, 8.591796875, 9.1171875, 9.642578125, 10.16796875, 10.693359375, 11.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 13.0, 16.0, 20.0, 24.0, 45.0, 87.0, 169.0, 515.0, 1960.0, 13064.0, 646920.0, 372543.0, 10619.0, 1718.0, 463.0, 166.0, 68.0, 27.0, 39.0, 12.0, 9.0, 7.0, 12.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.173828125, -2.119415283203125, -2.06500244140625, -2.010589599609375, -1.9561767578125, -1.901763916015625, -1.84735107421875, -1.792938232421875, -1.738525390625, -1.684112548828125, -1.62969970703125, -1.575286865234375, -1.5208740234375, -1.466461181640625, -1.41204833984375, -1.357635498046875, -1.30322265625, -1.248809814453125, -1.19439697265625, -1.139984130859375, -1.0855712890625, -1.031158447265625, -0.97674560546875, -0.922332763671875, -0.867919921875, -0.813507080078125, -0.75909423828125, -0.704681396484375, -0.6502685546875, -0.595855712890625, -0.54144287109375, -0.487030029296875, -0.4326171875, -0.378204345703125, -0.32379150390625, -0.269378662109375, -0.2149658203125, -0.160552978515625, -0.10614013671875, -0.051727294921875, 0.002685546875, 0.057098388671875, 0.11151123046875, 0.165924072265625, 0.2203369140625, 0.274749755859375, 0.32916259765625, 0.383575439453125, 0.43798828125, 0.492401123046875, 0.54681396484375, 0.601226806640625, 0.6556396484375, 0.710052490234375, 0.76446533203125, 0.818878173828125, 0.873291015625, 0.927703857421875, 0.98211669921875, 1.036529541015625, 1.0909423828125, 1.145355224609375, 1.19976806640625, 1.254180908203125, 1.30859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 8.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 16.0, 12.0, 25.0, 49.0, 57.0, 72.0, 117.0, 127.0, 124.0, 101.0, 77.0, 46.0, 30.0, 24.0, 18.0, 15.0, 11.0, 10.0, 6.0, 5.0, 7.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011783838272094727, -0.0001134360209107399, -0.00010903365910053253, -0.00010463129729032516, -0.0001002289354801178, -9.582657366991043e-05, -9.142421185970306e-05, -8.70218500494957e-05, -8.261948823928833e-05, -7.821712642908096e-05, -7.38147646188736e-05, -6.941240280866623e-05, -6.501004099845886e-05, -6.0607679188251495e-05, -5.620531737804413e-05, -5.180295556783676e-05, -4.7400593757629395e-05, -4.299823194742203e-05, -3.859587013721466e-05, -3.4193508327007294e-05, -2.9791146516799927e-05, -2.538878470659256e-05, -2.0986422896385193e-05, -1.6584061086177826e-05, -1.2181699275970459e-05, -7.779337465763092e-06, -3.376975655555725e-06, 1.0253861546516418e-06, 5.427747964859009e-06, 9.830109775066376e-06, 1.4232471585273743e-05, 1.863483339548111e-05, 2.3037195205688477e-05, 2.7439557015895844e-05, 3.184191882610321e-05, 3.624428063631058e-05, 4.0646642446517944e-05, 4.504900425672531e-05, 4.945136606693268e-05, 5.3853727877140045e-05, 5.825608968734741e-05, 6.265845149755478e-05, 6.706081330776215e-05, 7.146317511796951e-05, 7.586553692817688e-05, 8.026789873838425e-05, 8.467026054859161e-05, 8.907262235879898e-05, 9.347498416900635e-05, 9.787734597921371e-05, 0.00010227970778942108, 0.00010668206959962845, 0.00011108443140983582, 0.00011548679322004318, 0.00011988915503025055, 0.00012429151684045792, 0.00012869387865066528, 0.00013309624046087265, 0.00013749860227108002, 0.00014190096408128738, 0.00014630332589149475, 0.00015070568770170212, 0.00015510804951190948, 0.00015951041132211685, 0.00016391277313232422]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 9.0, 12.0, 8.0, 32.0, 62.0, 117.0, 240.0, 650.0, 2354.0, 21714.0, 986760.0, 32660.0, 2666.0, 732.0, 275.0, 105.0, 59.0, 36.0, 19.0, 11.0, 8.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -2.007232666015625, -1.93438720703125, -1.861541748046875, -1.7886962890625, -1.715850830078125, -1.64300537109375, -1.570159912109375, -1.497314453125, -1.424468994140625, -1.35162353515625, -1.278778076171875, -1.2059326171875, -1.133087158203125, -1.06024169921875, -0.987396240234375, -0.91455078125, -0.841705322265625, -0.76885986328125, -0.696014404296875, -0.6231689453125, -0.550323486328125, -0.47747802734375, -0.404632568359375, -0.331787109375, -0.258941650390625, -0.18609619140625, -0.113250732421875, -0.0404052734375, 0.032440185546875, 0.10528564453125, 0.178131103515625, 0.2509765625, 0.323822021484375, 0.39666748046875, 0.469512939453125, 0.5423583984375, 0.615203857421875, 0.68804931640625, 0.760894775390625, 0.833740234375, 0.906585693359375, 0.97943115234375, 1.052276611328125, 1.1251220703125, 1.197967529296875, 1.27081298828125, 1.343658447265625, 1.41650390625, 1.489349365234375, 1.56219482421875, 1.635040283203125, 1.7078857421875, 1.780731201171875, 1.85357666015625, 1.926422119140625, 1.999267578125, 2.072113037109375, 2.14495849609375, 2.217803955078125, 2.2906494140625, 2.363494873046875, 2.43634033203125, 2.509185791015625, 2.58203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 12.0, 8.0, 14.0, 19.0, 44.0, 88.0, 133.0, 160.0, 184.0, 136.0, 78.0, 44.0, 26.0, 15.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33203125, -1.278717041015625, -1.22540283203125, -1.172088623046875, -1.1187744140625, -1.065460205078125, -1.01214599609375, -0.958831787109375, -0.905517578125, -0.852203369140625, -0.79888916015625, -0.745574951171875, -0.6922607421875, -0.638946533203125, -0.58563232421875, -0.532318115234375, -0.47900390625, -0.425689697265625, -0.37237548828125, -0.319061279296875, -0.2657470703125, -0.212432861328125, -0.15911865234375, -0.105804443359375, -0.052490234375, 0.000823974609375, 0.05413818359375, 0.107452392578125, 0.1607666015625, 0.214080810546875, 0.26739501953125, 0.320709228515625, 0.3740234375, 0.427337646484375, 0.48065185546875, 0.533966064453125, 0.5872802734375, 0.640594482421875, 0.69390869140625, 0.747222900390625, 0.800537109375, 0.853851318359375, 0.90716552734375, 0.960479736328125, 1.0137939453125, 1.067108154296875, 1.12042236328125, 1.173736572265625, 1.22705078125, 1.280364990234375, 1.33367919921875, 1.386993408203125, 1.4403076171875, 1.493621826171875, 1.54693603515625, 1.600250244140625, 1.653564453125, 1.706878662109375, 1.76019287109375, 1.813507080078125, 1.8668212890625, 1.920135498046875, 1.97344970703125, 2.026763916015625, 2.080078125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 17.0, 122.0, 653.0, 203.0, 16.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.2798309326172, -128.9432373046875, -124.60664367675781, -120.27005004882812, -115.93345642089844, -111.59686279296875, -107.26026916503906, -102.92367553710938, -98.58708190917969, -94.25048828125, -89.91389465332031, -85.57730102539062, -81.24070739746094, -76.90411376953125, -72.56752014160156, -68.23092651367188, -63.89433288574219, -59.5577392578125, -55.22114562988281, -50.884552001953125, -46.54795837402344, -42.21136474609375, -37.87477111816406, -33.538177490234375, -29.201583862304688, -24.864990234375, -20.528396606445312, -16.191802978515625, -11.855209350585938, -7.51861572265625, -3.1820220947265625, 1.154571533203125, 5.49114990234375, 9.827743530273438, 14.164337158203125, 18.500930786132812, 22.8375244140625, 27.174118041992188, 31.510711669921875, 35.84730529785156, 40.18389892578125, 44.52049255371094, 48.857086181640625, 53.19367980957031, 57.5302734375, 61.86686706542969, 66.20346069335938, 70.54005432128906, 74.87664794921875, 79.21324157714844, 83.54983520507812, 87.88642883300781, 92.2230224609375, 96.55961608886719, 100.89620971679688, 105.23280334472656, 109.56939697265625, 113.90599060058594, 118.24258422851562, 122.57917785644531, 126.915771484375, 131.2523651123047, 135.58895874023438, 139.92555236816406, 144.26214599609375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 16.0, 16.0, 17.0, 21.0, 30.0, 23.0, 43.0, 29.0, 37.0, 58.0, 54.0, 59.0, 60.0, 67.0, 60.0, 55.0, 52.0, 47.0, 38.0, 43.0, 27.0, 32.0, 23.0, 18.0, 7.0, 12.0, 20.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.70851135253906, -40.5550422668457, -39.401573181152344, -38.248104095458984, -37.094635009765625, -35.941165924072266, -34.787696838378906, -33.63422775268555, -32.48075866699219, -31.327289581298828, -30.17382049560547, -29.02035140991211, -27.86688232421875, -26.71341323852539, -25.55994415283203, -24.406475067138672, -23.253005981445312, -22.099536895751953, -20.946067810058594, -19.792598724365234, -18.639129638671875, -17.485660552978516, -16.332191467285156, -15.178722381591797, -14.025253295898438, -12.871784210205078, -11.718315124511719, -10.56484603881836, -9.411376953125, -8.25790786743164, -7.104438781738281, -5.950969696044922, -4.797496795654297, -3.6440277099609375, -2.490558624267578, -1.3370895385742188, -0.18362045288085938, 0.9698486328125, 2.1233177185058594, 3.2767868041992188, 4.430255889892578, 5.5837249755859375, 6.737194061279297, 7.890663146972656, 9.044132232666016, 10.197601318359375, 11.351070404052734, 12.504539489746094, 13.658008575439453, 14.811477661132812, 15.964946746826172, 17.11841583251953, 18.27188491821289, 19.42535400390625, 20.57882308959961, 21.73229217529297, 22.885761260986328, 24.039230346679688, 25.192699432373047, 26.346168518066406, 27.499637603759766, 28.653106689453125, 29.806575775146484, 30.960044860839844, 32.1135139465332]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 12.0, 9.0, 20.0, 26.0, 33.0, 55.0, 58.0, 114.0, 123.0, 205.0, 270.0, 402.0, 620.0, 1033.0, 1720.0, 2806.0, 4930.0, 10407.0, 26163.0, 109223.0, 1439583.0, 2415902.0, 128950.0, 26415.0, 10630.0, 5546.0, 3159.0, 1944.0, 1219.0, 788.0, 575.0, 376.0, 267.0, 202.0, 146.0, 92.0, 62.0, 55.0, 40.0, 28.0, 17.0, 14.0, 11.0, 6.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9634246826171875, -0.927825927734375, -0.8922271728515625, -0.85662841796875, -0.8210296630859375, -0.785430908203125, -0.7498321533203125, -0.7142333984375, -0.6786346435546875, -0.643035888671875, -0.6074371337890625, -0.57183837890625, -0.5362396240234375, -0.500640869140625, -0.4650421142578125, -0.429443359375, -0.3938446044921875, -0.358245849609375, -0.3226470947265625, -0.28704833984375, -0.2514495849609375, -0.215850830078125, -0.1802520751953125, -0.1446533203125, -0.1090545654296875, -0.073455810546875, -0.0378570556640625, -0.00225830078125, 0.0333404541015625, 0.068939208984375, 0.1045379638671875, 0.14013671875, 0.1757354736328125, 0.211334228515625, 0.2469329833984375, 0.28253173828125, 0.3181304931640625, 0.353729248046875, 0.3893280029296875, 0.4249267578125, 0.4605255126953125, 0.496124267578125, 0.5317230224609375, 0.56732177734375, 0.6029205322265625, 0.638519287109375, 0.6741180419921875, 0.709716796875, 0.7453155517578125, 0.780914306640625, 0.8165130615234375, 0.85211181640625, 0.8877105712890625, 0.923309326171875, 0.9589080810546875, 0.9945068359375, 1.0301055908203125, 1.065704345703125, 1.1013031005859375, 1.13690185546875, 1.1725006103515625, 1.208099365234375, 1.2436981201171875, 1.279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 7.0, 16.0, 10.0, 15.0, 26.0, 26.0, 24.0, 27.0, 36.0, 44.0, 58.0, 57.0, 53.0, 56.0, 58.0, 61.0, 56.0, 60.0, 42.0, 37.0, 41.0, 35.0, 26.0, 17.0, 18.0, 23.0, 13.0, 9.0, 5.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9189453125, -0.8869171142578125, -0.854888916015625, -0.8228607177734375, -0.79083251953125, -0.7588043212890625, -0.726776123046875, -0.6947479248046875, -0.6627197265625, -0.6306915283203125, -0.598663330078125, -0.5666351318359375, -0.53460693359375, -0.5025787353515625, -0.470550537109375, -0.4385223388671875, -0.406494140625, -0.3744659423828125, -0.342437744140625, -0.3104095458984375, -0.27838134765625, -0.2463531494140625, -0.214324951171875, -0.1822967529296875, -0.1502685546875, -0.1182403564453125, -0.086212158203125, -0.0541839599609375, -0.02215576171875, 0.0098724365234375, 0.041900634765625, 0.0739288330078125, 0.10595703125, 0.1379852294921875, 0.170013427734375, 0.2020416259765625, 0.23406982421875, 0.2660980224609375, 0.298126220703125, 0.3301544189453125, 0.3621826171875, 0.3942108154296875, 0.426239013671875, 0.4582672119140625, 0.49029541015625, 0.5223236083984375, 0.554351806640625, 0.5863800048828125, 0.618408203125, 0.6504364013671875, 0.682464599609375, 0.7144927978515625, 0.74652099609375, 0.7785491943359375, 0.810577392578125, 0.8426055908203125, 0.8746337890625, 0.9066619873046875, 0.938690185546875, 0.9707183837890625, 1.00274658203125, 1.0347747802734375, 1.066802978515625, 1.0988311767578125, 1.130859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 5.0, 9.0, 19.0, 16.0, 31.0, 50.0, 103.0, 221.0, 395.0, 999.0, 3259.0, 18390.0, 611125.0, 3525401.0, 27485.0, 4352.0, 1245.0, 490.0, 266.0, 141.0, 88.0, 36.0, 28.0, 17.0, 17.0, 13.0, 7.0, 3.0, 6.0, 7.0, 2.0, 4.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.7000732421875, -3.591552734375, -3.4830322265625, -3.37451171875, -3.2659912109375, -3.157470703125, -3.0489501953125, -2.9404296875, -2.8319091796875, -2.723388671875, -2.6148681640625, -2.50634765625, -2.3978271484375, -2.289306640625, -2.1807861328125, -2.072265625, -1.9637451171875, -1.855224609375, -1.7467041015625, -1.63818359375, -1.5296630859375, -1.421142578125, -1.3126220703125, -1.2041015625, -1.0955810546875, -0.987060546875, -0.8785400390625, -0.77001953125, -0.6614990234375, -0.552978515625, -0.4444580078125, -0.3359375, -0.2274169921875, -0.118896484375, -0.0103759765625, 0.09814453125, 0.2066650390625, 0.315185546875, 0.4237060546875, 0.5322265625, 0.6407470703125, 0.749267578125, 0.8577880859375, 0.96630859375, 1.0748291015625, 1.183349609375, 1.2918701171875, 1.400390625, 1.5089111328125, 1.617431640625, 1.7259521484375, 1.83447265625, 1.9429931640625, 2.051513671875, 2.1600341796875, 2.2685546875, 2.3770751953125, 2.485595703125, 2.5941162109375, 2.70263671875, 2.8111572265625, 2.919677734375, 3.0281982421875, 3.13671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 8.0, 10.0, 10.0, 14.0, 24.0, 23.0, 32.0, 58.0, 183.0, 784.0, 1964.0, 623.0, 140.0, 61.0, 35.0, 21.0, 26.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.044921875, -1.949798583984375, -1.85467529296875, -1.759552001953125, -1.6644287109375, -1.569305419921875, -1.47418212890625, -1.379058837890625, -1.283935546875, -1.188812255859375, -1.09368896484375, -0.998565673828125, -0.9034423828125, -0.808319091796875, -0.71319580078125, -0.618072509765625, -0.52294921875, -0.427825927734375, -0.33270263671875, -0.237579345703125, -0.1424560546875, -0.047332763671875, 0.04779052734375, 0.142913818359375, 0.238037109375, 0.333160400390625, 0.42828369140625, 0.523406982421875, 0.6185302734375, 0.713653564453125, 0.80877685546875, 0.903900146484375, 0.9990234375, 1.094146728515625, 1.18927001953125, 1.284393310546875, 1.3795166015625, 1.474639892578125, 1.56976318359375, 1.664886474609375, 1.760009765625, 1.855133056640625, 1.95025634765625, 2.045379638671875, 2.1405029296875, 2.235626220703125, 2.33074951171875, 2.425872802734375, 2.52099609375, 2.616119384765625, 2.71124267578125, 2.806365966796875, 2.9014892578125, 2.996612548828125, 3.09173583984375, 3.186859130859375, 3.281982421875, 3.377105712890625, 3.47222900390625, 3.567352294921875, 3.6624755859375, 3.757598876953125, 3.85272216796875, 3.947845458984375, 4.04296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 4.0, 18.0, 19.0, 26.0, 47.0, 91.0, 129.0, 140.0, 154.0, 119.0, 90.0, 56.0, 31.0, 12.0, 18.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.957306861877441, -12.5669584274292, -12.176609992980957, -11.786261558532715, -11.395913124084473, -11.00556468963623, -10.615216255187988, -10.224867820739746, -9.834519386291504, -9.444170951843262, -9.05382251739502, -8.663474082946777, -8.273125648498535, -7.882777214050293, -7.492428779602051, -7.102080345153809, -6.711731910705566, -6.321383476257324, -5.931035041809082, -5.54068660736084, -5.150338172912598, -4.7599897384643555, -4.369641304016113, -3.979292869567871, -3.588944435119629, -3.1985960006713867, -2.8082475662231445, -2.4178991317749023, -2.02755069732666, -1.637202262878418, -1.2468538284301758, -0.8565053939819336, -0.466156005859375, -0.07580757141113281, 0.3145408630371094, 0.7048892974853516, 1.0952377319335938, 1.485586166381836, 1.8759346008300781, 2.2662830352783203, 2.6566314697265625, 3.0469799041748047, 3.437328338623047, 3.827676773071289, 4.218025207519531, 4.608373641967773, 4.998722076416016, 5.389070510864258, 5.7794189453125, 6.169767379760742, 6.560115814208984, 6.950464248657227, 7.340812683105469, 7.731161117553711, 8.121509552001953, 8.511857986450195, 8.902206420898438, 9.29255485534668, 9.682903289794922, 10.073251724243164, 10.463600158691406, 10.853948593139648, 11.24429702758789, 11.634645462036133, 12.024993896484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 12.0, 9.0, 19.0, 29.0, 20.0, 21.0, 28.0, 33.0, 40.0, 45.0, 41.0, 52.0, 54.0, 82.0, 64.0, 71.0, 52.0, 34.0, 57.0, 39.0, 31.0, 38.0, 26.0, 23.0, 14.0, 17.0, 13.0, 7.0, 4.0, 5.0, 1.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.359330177307129, -9.958972930908203, -9.558615684509277, -9.158258438110352, -8.757902145385742, -8.3575439453125, -7.957187652587891, -7.556830406188965, -7.156473159790039, -6.756115913391113, -6.3557586669921875, -5.95540189743042, -5.555044651031494, -5.154687404632568, -4.754330635070801, -4.353973388671875, -3.953616142272949, -3.5532588958740234, -3.1529018878936768, -2.75254487991333, -2.3521876335144043, -1.9518303871154785, -1.5514733791351318, -1.1511163711547852, -0.7507591247558594, -0.35040199756622314, 0.049955129623413086, 0.4503122568130493, 0.8506693840026855, 1.2510266304016113, 1.651383638381958, 2.0517406463623047, 2.4520978927612305, 2.8524551391601562, 3.252812147140503, 3.6531691551208496, 4.053526401519775, 4.453883647918701, 4.854240417480469, 5.2545976638793945, 5.65495491027832, 6.055312156677246, 6.455669403076172, 6.8560261726379395, 7.256383419036865, 7.656740665435791, 8.057097434997559, 8.457454681396484, 8.85781192779541, 9.258169174194336, 9.658526420593262, 10.058883666992188, 10.459239959716797, 10.859598159790039, 11.259954452514648, 11.660311698913574, 12.0606689453125, 12.461026191711426, 12.861383438110352, 13.261740684509277, 13.662097930908203, 14.062454223632812, 14.462811470031738, 14.863168716430664, 15.26352596282959]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 17.0, 22.0, 24.0, 52.0, 63.0, 91.0, 136.0, 194.0, 291.0, 446.0, 683.0, 1125.0, 1674.0, 2910.0, 4910.0, 8425.0, 15237.0, 28004.0, 54273.0, 111025.0, 217306.0, 271049.0, 162404.0, 79597.0, 39851.0, 20718.0, 11697.0, 6468.0, 3677.0, 2260.0, 1412.0, 881.0, 577.0, 377.0, 232.0, 142.0, 94.0, 64.0, 47.0, 34.0, 20.0, 13.0, 11.0, 11.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.6571121215820312, -0.6320953369140625, -0.6070785522460938, -0.582061767578125, -0.5570449829101562, -0.5320281982421875, -0.5070114135742188, -0.48199462890625, -0.45697784423828125, -0.4319610595703125, -0.40694427490234375, -0.381927490234375, -0.35691070556640625, -0.3318939208984375, -0.30687713623046875, -0.2818603515625, -0.25684356689453125, -0.2318267822265625, -0.20680999755859375, -0.181793212890625, -0.15677642822265625, -0.1317596435546875, -0.10674285888671875, -0.08172607421875, -0.05670928955078125, -0.0316925048828125, -0.00667572021484375, 0.018341064453125, 0.04335784912109375, 0.0683746337890625, 0.09339141845703125, 0.118408203125, 0.14342498779296875, 0.1684417724609375, 0.19345855712890625, 0.218475341796875, 0.24349212646484375, 0.2685089111328125, 0.29352569580078125, 0.31854248046875, 0.34355926513671875, 0.3685760498046875, 0.39359283447265625, 0.418609619140625, 0.44362640380859375, 0.4686431884765625, 0.49365997314453125, 0.5186767578125, 0.5436935424804688, 0.5687103271484375, 0.5937271118164062, 0.618743896484375, 0.6437606811523438, 0.6687774658203125, 0.6937942504882812, 0.71881103515625, 0.7438278198242188, 0.7688446044921875, 0.7938613891601562, 0.818878173828125, 0.8438949584960938, 0.8689117431640625, 0.8939285278320312, 0.9189453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 22.0, 18.0, 13.0, 19.0, 20.0, 29.0, 27.0, 42.0, 32.0, 38.0, 51.0, 46.0, 53.0, 47.0, 70.0, 59.0, 54.0, 60.0, 39.0, 36.0, 29.0, 22.0, 33.0, 31.0, 25.0, 15.0, 11.0, 10.0, 10.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.7779388427734375, -0.748260498046875, -0.7185821533203125, -0.68890380859375, -0.6592254638671875, -0.629547119140625, -0.5998687744140625, -0.5701904296875, -0.5405120849609375, -0.510833740234375, -0.4811553955078125, -0.45147705078125, -0.4217987060546875, -0.392120361328125, -0.3624420166015625, -0.332763671875, -0.3030853271484375, -0.273406982421875, -0.2437286376953125, -0.21405029296875, -0.1843719482421875, -0.154693603515625, -0.1250152587890625, -0.0953369140625, -0.0656585693359375, -0.035980224609375, -0.0063018798828125, 0.02337646484375, 0.0530548095703125, 0.082733154296875, 0.1124114990234375, 0.14208984375, 0.1717681884765625, 0.201446533203125, 0.2311248779296875, 0.26080322265625, 0.2904815673828125, 0.320159912109375, 0.3498382568359375, 0.3795166015625, 0.4091949462890625, 0.438873291015625, 0.4685516357421875, 0.49822998046875, 0.5279083251953125, 0.557586669921875, 0.5872650146484375, 0.616943359375, 0.6466217041015625, 0.676300048828125, 0.7059783935546875, 0.73565673828125, 0.7653350830078125, 0.795013427734375, 0.8246917724609375, 0.8543701171875, 0.8840484619140625, 0.913726806640625, 0.9434051513671875, 0.97308349609375, 1.0027618408203125, 1.032440185546875, 1.0621185302734375, 1.091796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 7.0, 12.0, 16.0, 22.0, 51.0, 71.0, 121.0, 180.0, 301.0, 573.0, 1171.0, 3068.0, 13614.0, 165124.0, 796046.0, 57059.0, 7296.0, 2016.0, 791.0, 419.0, 221.0, 122.0, 86.0, 51.0, 35.0, 24.0, 16.0, 8.0, 4.0, 6.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.784820556640625, -2.67901611328125, -2.573211669921875, -2.4674072265625, -2.361602783203125, -2.25579833984375, -2.149993896484375, -2.044189453125, -1.938385009765625, -1.83258056640625, -1.726776123046875, -1.6209716796875, -1.515167236328125, -1.40936279296875, -1.303558349609375, -1.19775390625, -1.091949462890625, -0.98614501953125, -0.880340576171875, -0.7745361328125, -0.668731689453125, -0.56292724609375, -0.457122802734375, -0.351318359375, -0.245513916015625, -0.13970947265625, -0.033905029296875, 0.0718994140625, 0.177703857421875, 0.28350830078125, 0.389312744140625, 0.4951171875, 0.600921630859375, 0.70672607421875, 0.812530517578125, 0.9183349609375, 1.024139404296875, 1.12994384765625, 1.235748291015625, 1.341552734375, 1.447357177734375, 1.55316162109375, 1.658966064453125, 1.7647705078125, 1.870574951171875, 1.97637939453125, 2.082183837890625, 2.18798828125, 2.293792724609375, 2.39959716796875, 2.505401611328125, 2.6112060546875, 2.717010498046875, 2.82281494140625, 2.928619384765625, 3.034423828125, 3.140228271484375, 3.24603271484375, 3.351837158203125, 3.4576416015625, 3.563446044921875, 3.66925048828125, 3.775054931640625, 3.880859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 10.0, 7.0, 12.0, 15.0, 27.0, 24.0, 22.0, 32.0, 43.0, 36.0, 45.0, 46.0, 49.0, 57.0, 50.0, 45.0, 40.0, 76.0, 47.0, 39.0, 36.0, 37.0, 33.0, 32.0, 27.0, 15.0, 16.0, 13.0, 9.0, 11.0, 6.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.767578125, -3.635955810546875, -3.50433349609375, -3.372711181640625, -3.2410888671875, -3.109466552734375, -2.97784423828125, -2.846221923828125, -2.714599609375, -2.582977294921875, -2.45135498046875, -2.319732666015625, -2.1881103515625, -2.056488037109375, -1.92486572265625, -1.793243408203125, -1.66162109375, -1.529998779296875, -1.39837646484375, -1.266754150390625, -1.1351318359375, -1.003509521484375, -0.87188720703125, -0.740264892578125, -0.608642578125, -0.477020263671875, -0.34539794921875, -0.213775634765625, -0.0821533203125, 0.049468994140625, 0.18109130859375, 0.312713623046875, 0.4443359375, 0.575958251953125, 0.70758056640625, 0.839202880859375, 0.9708251953125, 1.102447509765625, 1.23406982421875, 1.365692138671875, 1.497314453125, 1.628936767578125, 1.76055908203125, 1.892181396484375, 2.0238037109375, 2.155426025390625, 2.28704833984375, 2.418670654296875, 2.55029296875, 2.681915283203125, 2.81353759765625, 2.945159912109375, 3.0767822265625, 3.208404541015625, 3.34002685546875, 3.471649169921875, 3.603271484375, 3.734893798828125, 3.86651611328125, 3.998138427734375, 4.1297607421875, 4.261383056640625, 4.39300537109375, 4.524627685546875, 4.65625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 15.0, 19.0, 23.0, 35.0, 55.0, 98.0, 169.0, 299.0, 577.0, 1441.0, 3695.0, 16382.0, 423640.0, 576819.0, 18406.0, 3983.0, 1438.0, 650.0, 297.0, 172.0, 112.0, 56.0, 44.0, 23.0, 14.0, 8.0, 9.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1591796875, -1.120574951171875, -1.08197021484375, -1.043365478515625, -1.0047607421875, -0.966156005859375, -0.92755126953125, -0.888946533203125, -0.850341796875, -0.811737060546875, -0.77313232421875, -0.734527587890625, -0.6959228515625, -0.657318115234375, -0.61871337890625, -0.580108642578125, -0.54150390625, -0.502899169921875, -0.46429443359375, -0.425689697265625, -0.3870849609375, -0.348480224609375, -0.30987548828125, -0.271270751953125, -0.232666015625, -0.194061279296875, -0.15545654296875, -0.116851806640625, -0.0782470703125, -0.039642333984375, -0.00103759765625, 0.037567138671875, 0.076171875, 0.114776611328125, 0.15338134765625, 0.191986083984375, 0.2305908203125, 0.269195556640625, 0.30780029296875, 0.346405029296875, 0.385009765625, 0.423614501953125, 0.46221923828125, 0.500823974609375, 0.5394287109375, 0.578033447265625, 0.61663818359375, 0.655242919921875, 0.69384765625, 0.732452392578125, 0.77105712890625, 0.809661865234375, 0.8482666015625, 0.886871337890625, 0.92547607421875, 0.964080810546875, 1.002685546875, 1.041290283203125, 1.07989501953125, 1.118499755859375, 1.1571044921875, 1.195709228515625, 1.23431396484375, 1.272918701171875, 1.3115234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 9.0, 6.0, 13.0, 14.0, 31.0, 53.0, 88.0, 131.0, 184.0, 183.0, 108.0, 69.0, 37.0, 31.0, 11.0, 14.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00027108192443847656, -0.00026389583945274353, -0.0002567097544670105, -0.00024952366948127747, -0.00024233758449554443, -0.0002351514995098114, -0.00022796541452407837, -0.00022077932953834534, -0.0002135932445526123, -0.00020640715956687927, -0.00019922107458114624, -0.0001920349895954132, -0.00018484890460968018, -0.00017766281962394714, -0.0001704767346382141, -0.00016329064965248108, -0.00015610456466674805, -0.00014891847968101501, -0.00014173239469528198, -0.00013454630970954895, -0.00012736022472381592, -0.00012017413973808289, -0.00011298805475234985, -0.00010580196976661682, -9.861588478088379e-05, -9.142979979515076e-05, -8.424371480941772e-05, -7.705762982368469e-05, -6.987154483795166e-05, -6.268545985221863e-05, -5.5499374866485596e-05, -4.8313289880752563e-05, -4.112720489501953e-05, -3.39411199092865e-05, -2.6755034923553467e-05, -1.9568949937820435e-05, -1.2382864952087402e-05, -5.19677996635437e-06, 1.989305019378662e-06, 9.175390005111694e-06, 1.6361474990844727e-05, 2.354755997657776e-05, 3.073364496231079e-05, 3.791972994804382e-05, 4.5105814933776855e-05, 5.229189991950989e-05, 5.947798490524292e-05, 6.666406989097595e-05, 7.385015487670898e-05, 8.103623986244202e-05, 8.822232484817505e-05, 9.540840983390808e-05, 0.00010259449481964111, 0.00010978057980537415, 0.00011696666479110718, 0.0001241527497768402, 0.00013133883476257324, 0.00013852491974830627, 0.0001457110047340393, 0.00015289708971977234, 0.00016008317470550537, 0.0001672692596912384, 0.00017445534467697144, 0.00018164142966270447, 0.0001888275146484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 3.0, 5.0, 13.0, 12.0, 13.0, 28.0, 30.0, 48.0, 71.0, 107.0, 194.0, 387.0, 904.0, 2658.0, 11446.0, 250725.0, 754746.0, 21049.0, 3770.0, 1238.0, 476.0, 216.0, 123.0, 87.0, 57.0, 29.0, 26.0, 17.0, 11.0, 7.0, 10.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3076171875, -1.266937255859375, -1.22625732421875, -1.185577392578125, -1.1448974609375, -1.104217529296875, -1.06353759765625, -1.022857666015625, -0.982177734375, -0.941497802734375, -0.90081787109375, -0.860137939453125, -0.8194580078125, -0.778778076171875, -0.73809814453125, -0.697418212890625, -0.65673828125, -0.616058349609375, -0.57537841796875, -0.534698486328125, -0.4940185546875, -0.453338623046875, -0.41265869140625, -0.371978759765625, -0.331298828125, -0.290618896484375, -0.24993896484375, -0.209259033203125, -0.1685791015625, -0.127899169921875, -0.08721923828125, -0.046539306640625, -0.005859375, 0.034820556640625, 0.07550048828125, 0.116180419921875, 0.1568603515625, 0.197540283203125, 0.23822021484375, 0.278900146484375, 0.319580078125, 0.360260009765625, 0.40093994140625, 0.441619873046875, 0.4822998046875, 0.522979736328125, 0.56365966796875, 0.604339599609375, 0.64501953125, 0.685699462890625, 0.72637939453125, 0.767059326171875, 0.8077392578125, 0.848419189453125, 0.88909912109375, 0.929779052734375, 0.970458984375, 1.011138916015625, 1.05181884765625, 1.092498779296875, 1.1331787109375, 1.173858642578125, 1.21453857421875, 1.255218505859375, 1.2958984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 14.0, 12.0, 21.0, 38.0, 49.0, 60.0, 88.0, 116.0, 117.0, 107.0, 82.0, 73.0, 64.0, 39.0, 31.0, 26.0, 10.0, 6.0, 4.0, 5.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.173828125, -1.1358489990234375, -1.097869873046875, -1.0598907470703125, -1.02191162109375, -0.9839324951171875, -0.945953369140625, -0.9079742431640625, -0.8699951171875, -0.8320159912109375, -0.794036865234375, -0.7560577392578125, -0.71807861328125, -0.6800994873046875, -0.642120361328125, -0.6041412353515625, -0.566162109375, -0.5281829833984375, -0.490203857421875, -0.4522247314453125, -0.41424560546875, -0.3762664794921875, -0.338287353515625, -0.3003082275390625, -0.2623291015625, -0.2243499755859375, -0.186370849609375, -0.1483917236328125, -0.11041259765625, -0.0724334716796875, -0.034454345703125, 0.0035247802734375, 0.04150390625, 0.0794830322265625, 0.117462158203125, 0.1554412841796875, 0.19342041015625, 0.2313995361328125, 0.269378662109375, 0.3073577880859375, 0.3453369140625, 0.3833160400390625, 0.421295166015625, 0.4592742919921875, 0.49725341796875, 0.5352325439453125, 0.573211669921875, 0.6111907958984375, 0.649169921875, 0.6871490478515625, 0.725128173828125, 0.7631072998046875, 0.80108642578125, 0.8390655517578125, 0.877044677734375, 0.9150238037109375, 0.9530029296875, 0.9909820556640625, 1.028961181640625, 1.0669403076171875, 1.10491943359375, 1.1428985595703125, 1.180877685546875, 1.2188568115234375, 1.2568359375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 21.0, 230.0, 561.0, 145.0, 23.0, 8.0, 10.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-101.09318542480469, -99.19454956054688, -97.2959213256836, -95.39728546142578, -93.4986572265625, -91.60002136230469, -89.7013931274414, -87.8027572631836, -85.90412902832031, -84.0054931640625, -82.10686492919922, -80.2082290649414, -78.30960083007812, -76.41096496582031, -74.51233673095703, -72.61370086669922, -70.71507263183594, -68.81643676757812, -66.91780853271484, -65.01917266845703, -63.12054443359375, -61.2219123840332, -59.323280334472656, -57.424644470214844, -55.52600860595703, -53.627376556396484, -51.72874450683594, -49.83011245727539, -47.931480407714844, -46.0328483581543, -44.13421630859375, -42.23558044433594, -40.336952209472656, -38.43832015991211, -36.53968811035156, -34.641056060791016, -32.74242401123047, -30.843791961669922, -28.945158004760742, -27.046525955200195, -25.14789581298828, -23.249263763427734, -21.350631713867188, -19.45199966430664, -17.553367614746094, -15.65473461151123, -13.756101608276367, -11.85746955871582, -9.958837509155273, -8.060205459594727, -6.1615729331970215, -4.262940406799316, -2.3643083572387695, -0.46567630767822266, 1.4329566955566406, 3.3315887451171875, 5.230220794677734, 7.128852844238281, 9.027484893798828, 10.926117897033691, 12.824749946594238, 14.723381996154785, 16.62201499938965, 18.520647048950195, 20.419279098510742]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 3.0, 8.0, 18.0, 22.0, 11.0, 18.0, 17.0, 32.0, 24.0, 34.0, 35.0, 35.0, 40.0, 47.0, 56.0, 54.0, 66.0, 48.0, 51.0, 44.0, 41.0, 28.0, 34.0, 28.0, 32.0, 30.0, 21.0, 21.0, 28.0, 19.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.727006912231445, -15.239923477172852, -14.752840042114258, -14.265755653381348, -13.778672218322754, -13.29158878326416, -12.804505348205566, -12.317420959472656, -11.830337524414062, -11.343254089355469, -10.856170654296875, -10.369086265563965, -9.882002830505371, -9.394919395446777, -8.907835960388184, -8.420751571655273, -7.933668613433838, -7.446585178375244, -6.959501266479492, -6.472417831420898, -5.9853339195251465, -5.498250484466553, -5.011166572570801, -4.524083137512207, -4.036999702453613, -3.5499160289764404, -3.0628323554992676, -2.575748920440674, -2.088665008544922, -1.6015815734863281, -1.1144979000091553, -0.6274142265319824, -0.14033031463623047, 0.34675332903862, 0.8338369727134705, 1.3209205865859985, 1.8080042600631714, 2.2950878143310547, 2.7821714878082275, 3.2692551612854004, 3.7563388347625732, 4.243422508239746, 4.73050594329834, 5.217589855194092, 5.7046732902526855, 6.1917572021484375, 6.678840637207031, 7.165924072265625, 7.653007984161377, 8.140091896057129, 8.627175331115723, 9.114258766174316, 9.60134220123291, 10.08842658996582, 10.575510025024414, 11.062593460083008, 11.549676895141602, 12.036760330200195, 12.523843765258789, 13.0109281539917, 13.498011589050293, 13.985095024108887, 14.47217845916748, 14.95926284790039, 15.446346282958984]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 4.0, 10.0, 12.0, 19.0, 36.0, 51.0, 87.0, 179.0, 413.0, 1385.0, 6620.0, 79166.0, 4022893.0, 75163.0, 5772.0, 1374.0, 500.0, 220.0, 129.0, 72.0, 42.0, 39.0, 20.0, 16.0, 12.0, 12.0, 10.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.412109375, -3.32989501953125, -3.2476806640625, -3.16546630859375, -3.083251953125, -3.00103759765625, -2.9188232421875, -2.83660888671875, -2.75439453125, -2.67218017578125, -2.5899658203125, -2.50775146484375, -2.425537109375, -2.34332275390625, -2.2611083984375, -2.17889404296875, -2.0966796875, -2.01446533203125, -1.9322509765625, -1.85003662109375, -1.767822265625, -1.68560791015625, -1.6033935546875, -1.52117919921875, -1.43896484375, -1.35675048828125, -1.2745361328125, -1.19232177734375, -1.110107421875, -1.02789306640625, -0.9456787109375, -0.86346435546875, -0.78125, -0.69903564453125, -0.6168212890625, -0.53460693359375, -0.452392578125, -0.37017822265625, -0.2879638671875, -0.20574951171875, -0.12353515625, -0.04132080078125, 0.0408935546875, 0.12310791015625, 0.205322265625, 0.28753662109375, 0.3697509765625, 0.45196533203125, 0.5341796875, 0.61639404296875, 0.6986083984375, 0.78082275390625, 0.863037109375, 0.94525146484375, 1.0274658203125, 1.10968017578125, 1.19189453125, 1.27410888671875, 1.3563232421875, 1.43853759765625, 1.520751953125, 1.60296630859375, 1.6851806640625, 1.76739501953125, 1.849609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 7.0, 9.0, 15.0, 15.0, 18.0, 33.0, 44.0, 46.0, 60.0, 67.0, 76.0, 70.0, 81.0, 84.0, 88.0, 68.0, 62.0, 35.0, 34.0, 27.0, 21.0, 9.0, 12.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8896484375, -0.847930908203125, -0.80621337890625, -0.764495849609375, -0.7227783203125, -0.681060791015625, -0.63934326171875, -0.597625732421875, -0.555908203125, -0.514190673828125, -0.47247314453125, -0.430755615234375, -0.3890380859375, -0.347320556640625, -0.30560302734375, -0.263885498046875, -0.22216796875, -0.180450439453125, -0.13873291015625, -0.097015380859375, -0.0552978515625, -0.013580322265625, 0.02813720703125, 0.069854736328125, 0.111572265625, 0.153289794921875, 0.19500732421875, 0.236724853515625, 0.2784423828125, 0.320159912109375, 0.36187744140625, 0.403594970703125, 0.4453125, 0.487030029296875, 0.52874755859375, 0.570465087890625, 0.6121826171875, 0.653900146484375, 0.69561767578125, 0.737335205078125, 0.779052734375, 0.820770263671875, 0.86248779296875, 0.904205322265625, 0.9459228515625, 0.987640380859375, 1.02935791015625, 1.071075439453125, 1.11279296875, 1.154510498046875, 1.19622802734375, 1.237945556640625, 1.2796630859375, 1.321380615234375, 1.36309814453125, 1.404815673828125, 1.446533203125, 1.488250732421875, 1.52996826171875, 1.571685791015625, 1.6134033203125, 1.655120849609375, 1.69683837890625, 1.738555908203125, 1.7802734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 13.0, 19.0, 44.0, 102.0, 165.0, 414.0, 1618.0, 12416.0, 1715599.0, 2449847.0, 11654.0, 1506.0, 418.0, 215.0, 112.0, 60.0, 38.0, 18.0, 15.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.29595947265625, -3.1739501953125, -3.05194091796875, -2.929931640625, -2.80792236328125, -2.6859130859375, -2.56390380859375, -2.44189453125, -2.31988525390625, -2.1978759765625, -2.07586669921875, -1.953857421875, -1.83184814453125, -1.7098388671875, -1.58782958984375, -1.4658203125, -1.34381103515625, -1.2218017578125, -1.09979248046875, -0.977783203125, -0.85577392578125, -0.7337646484375, -0.61175537109375, -0.48974609375, -0.36773681640625, -0.2457275390625, -0.12371826171875, -0.001708984375, 0.12030029296875, 0.2423095703125, 0.36431884765625, 0.486328125, 0.60833740234375, 0.7303466796875, 0.85235595703125, 0.974365234375, 1.09637451171875, 1.2183837890625, 1.34039306640625, 1.46240234375, 1.58441162109375, 1.7064208984375, 1.82843017578125, 1.950439453125, 2.07244873046875, 2.1944580078125, 2.31646728515625, 2.4384765625, 2.56048583984375, 2.6824951171875, 2.80450439453125, 2.926513671875, 3.04852294921875, 3.1705322265625, 3.29254150390625, 3.41455078125, 3.53656005859375, 3.6585693359375, 3.78057861328125, 3.902587890625, 4.02459716796875, 4.1466064453125, 4.26861572265625, 4.390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 8.0, 8.0, 10.0, 13.0, 24.0, 45.0, 60.0, 181.0, 851.0, 1971.0, 612.0, 156.0, 59.0, 34.0, 17.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.283203125, -2.19342041015625, -2.1036376953125, -2.01385498046875, -1.924072265625, -1.83428955078125, -1.7445068359375, -1.65472412109375, -1.56494140625, -1.47515869140625, -1.3853759765625, -1.29559326171875, -1.205810546875, -1.11602783203125, -1.0262451171875, -0.93646240234375, -0.8466796875, -0.75689697265625, -0.6671142578125, -0.57733154296875, -0.487548828125, -0.39776611328125, -0.3079833984375, -0.21820068359375, -0.12841796875, -0.03863525390625, 0.0511474609375, 0.14093017578125, 0.230712890625, 0.32049560546875, 0.4102783203125, 0.50006103515625, 0.58984375, 0.67962646484375, 0.7694091796875, 0.85919189453125, 0.948974609375, 1.03875732421875, 1.1285400390625, 1.21832275390625, 1.30810546875, 1.39788818359375, 1.4876708984375, 1.57745361328125, 1.667236328125, 1.75701904296875, 1.8468017578125, 1.93658447265625, 2.0263671875, 2.11614990234375, 2.2059326171875, 2.29571533203125, 2.385498046875, 2.47528076171875, 2.5650634765625, 2.65484619140625, 2.74462890625, 2.83441162109375, 2.9241943359375, 3.01397705078125, 3.103759765625, 3.19354248046875, 3.2833251953125, 3.37310791015625, 3.462890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 10.0, 33.0, 105.0, 238.0, 272.0, 160.0, 85.0, 30.0, 24.0, 9.0, 12.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.11816120147705, -12.63796615600586, -12.157770156860352, -11.67757511138916, -11.197380065917969, -10.717184066772461, -10.23698902130127, -9.756793975830078, -9.27659797668457, -8.796402931213379, -8.316206932067871, -7.83601188659668, -7.35581636428833, -6.8756208419799805, -6.395425796508789, -5.9152302742004395, -5.43503475189209, -4.95483922958374, -4.474643707275391, -3.994448661804199, -3.5142531394958496, -3.0340576171875, -2.5538623332977295, -2.073667049407959, -1.5934715270996094, -1.1132761240005493, -0.6330807209014893, -0.1528853178024292, 0.32731008529663086, 0.8075056076049805, 1.287700891494751, 1.7678961753845215, 2.2480926513671875, 2.728288173675537, 3.2084834575653076, 3.688678741455078, 4.168874263763428, 4.649069786071777, 5.129264831542969, 5.609460353851318, 6.089655876159668, 6.569851398468018, 7.050046920776367, 7.530241966247559, 8.01043701171875, 8.490633010864258, 8.97082805633545, 9.45102310180664, 9.931219100952148, 10.41141414642334, 10.891610145568848, 11.371805191040039, 11.852001190185547, 12.332196235656738, 12.81239128112793, 13.292587280273438, 13.772782325744629, 14.25297737121582, 14.733173370361328, 15.21336841583252, 15.693563461303711, 16.17375946044922, 16.653955459594727, 17.1341495513916, 17.61434555053711]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 5.0, 10.0, 8.0, 14.0, 13.0, 24.0, 17.0, 30.0, 27.0, 26.0, 42.0, 44.0, 50.0, 48.0, 62.0, 59.0, 58.0, 59.0, 53.0, 70.0, 50.0, 47.0, 38.0, 28.0, 24.0, 27.0, 14.0, 16.0, 5.0, 6.0, 3.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.063533782958984, -7.807955265045166, -7.552376747131348, -7.2967987060546875, -7.041220188140869, -6.785641670227051, -6.530063629150391, -6.274485111236572, -6.018906593322754, -5.7633280754089355, -5.507749557495117, -5.252171516418457, -4.996592998504639, -4.74101448059082, -4.48543643951416, -4.229857921600342, -3.9742794036865234, -3.718700885772705, -3.463122606277466, -3.2075443267822266, -2.951965808868408, -2.69638729095459, -2.4408090114593506, -2.1852307319641113, -1.929652214050293, -1.6740738153457642, -1.4184954166412354, -1.1629170179367065, -0.9073386192321777, -0.6517602205276489, -0.3961818218231201, -0.1406034231185913, 0.1149740219116211, 0.3705524206161499, 0.6261308193206787, 0.8817092180252075, 1.1372876167297363, 1.3928660154342651, 1.648444414138794, 1.9040228128433228, 2.1596012115478516, 2.41517972946167, 2.670758008956909, 2.9263362884521484, 3.181914806365967, 3.437493324279785, 3.6930716037750244, 3.9486498832702637, 4.204228401184082, 4.4598069190979, 4.715385437011719, 4.970963478088379, 5.226541996002197, 5.482120513916016, 5.737698554992676, 5.993277072906494, 6.2488555908203125, 6.504434108734131, 6.760012626647949, 7.015590667724609, 7.271169185638428, 7.526747703552246, 7.782325744628906, 8.037904739379883, 8.293482780456543]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 6.0, 20.0, 29.0, 49.0, 60.0, 98.0, 170.0, 331.0, 548.0, 1008.0, 2010.0, 4301.0, 9109.0, 21604.0, 53445.0, 143826.0, 334642.0, 288602.0, 113434.0, 42865.0, 17406.0, 7700.0, 3463.0, 1763.0, 883.0, 485.0, 254.0, 150.0, 82.0, 71.0, 57.0, 19.0, 17.0, 7.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96875, -0.9340057373046875, -0.899261474609375, -0.8645172119140625, -0.82977294921875, -0.7950286865234375, -0.760284423828125, -0.7255401611328125, -0.6907958984375, -0.6560516357421875, -0.621307373046875, -0.5865631103515625, -0.55181884765625, -0.5170745849609375, -0.482330322265625, -0.4475860595703125, -0.412841796875, -0.3780975341796875, -0.343353271484375, -0.3086090087890625, -0.27386474609375, -0.2391204833984375, -0.204376220703125, -0.1696319580078125, -0.1348876953125, -0.1001434326171875, -0.065399169921875, -0.0306549072265625, 0.00408935546875, 0.0388336181640625, 0.073577880859375, 0.1083221435546875, 0.14306640625, 0.1778106689453125, 0.212554931640625, 0.2472991943359375, 0.28204345703125, 0.3167877197265625, 0.351531982421875, 0.3862762451171875, 0.4210205078125, 0.4557647705078125, 0.490509033203125, 0.5252532958984375, 0.55999755859375, 0.5947418212890625, 0.629486083984375, 0.6642303466796875, 0.698974609375, 0.7337188720703125, 0.768463134765625, 0.8032073974609375, 0.83795166015625, 0.8726959228515625, 0.907440185546875, 0.9421844482421875, 0.9769287109375, 1.0116729736328125, 1.046417236328125, 1.0811614990234375, 1.11590576171875, 1.1506500244140625, 1.185394287109375, 1.2201385498046875, 1.2548828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 0.0, 2.0, 4.0, 8.0, 4.0, 15.0, 6.0, 12.0, 13.0, 16.0, 14.0, 15.0, 29.0, 25.0, 36.0, 33.0, 42.0, 48.0, 46.0, 46.0, 40.0, 45.0, 34.0, 48.0, 60.0, 49.0, 56.0, 38.0, 27.0, 33.0, 27.0, 34.0, 17.0, 9.0, 14.0, 17.0, 8.0, 15.0, 2.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6422576904296875, -0.616546630859375, -0.5908355712890625, -0.56512451171875, -0.5394134521484375, -0.513702392578125, -0.4879913330078125, -0.4622802734375, -0.4365692138671875, -0.410858154296875, -0.3851470947265625, -0.35943603515625, -0.3337249755859375, -0.308013916015625, -0.2823028564453125, -0.256591796875, -0.2308807373046875, -0.205169677734375, -0.1794586181640625, -0.15374755859375, -0.1280364990234375, -0.102325439453125, -0.0766143798828125, -0.0509033203125, -0.0251922607421875, 0.000518798828125, 0.0262298583984375, 0.05194091796875, 0.0776519775390625, 0.103363037109375, 0.1290740966796875, 0.15478515625, 0.1804962158203125, 0.206207275390625, 0.2319183349609375, 0.25762939453125, 0.2833404541015625, 0.309051513671875, 0.3347625732421875, 0.3604736328125, 0.3861846923828125, 0.411895751953125, 0.4376068115234375, 0.46331787109375, 0.4890289306640625, 0.514739990234375, 0.5404510498046875, 0.566162109375, 0.5918731689453125, 0.617584228515625, 0.6432952880859375, 0.66900634765625, 0.6947174072265625, 0.720428466796875, 0.7461395263671875, 0.7718505859375, 0.7975616455078125, 0.823272705078125, 0.8489837646484375, 0.87469482421875, 0.9004058837890625, 0.926116943359375, 0.9518280029296875, 0.9775390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 8.0, 12.0, 16.0, 18.0, 24.0, 39.0, 70.0, 95.0, 131.0, 243.0, 399.0, 853.0, 2248.0, 9028.0, 80321.0, 789538.0, 146809.0, 13571.0, 2859.0, 1005.0, 481.0, 273.0, 161.0, 103.0, 60.0, 50.0, 34.0, 26.0, 22.0, 16.0, 9.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.62109375, -3.524810791015625, -3.42852783203125, -3.332244873046875, -3.2359619140625, -3.139678955078125, -3.04339599609375, -2.947113037109375, -2.850830078125, -2.754547119140625, -2.65826416015625, -2.561981201171875, -2.4656982421875, -2.369415283203125, -2.27313232421875, -2.176849365234375, -2.08056640625, -1.984283447265625, -1.88800048828125, -1.791717529296875, -1.6954345703125, -1.599151611328125, -1.50286865234375, -1.406585693359375, -1.310302734375, -1.214019775390625, -1.11773681640625, -1.021453857421875, -0.9251708984375, -0.828887939453125, -0.73260498046875, -0.636322021484375, -0.5400390625, -0.443756103515625, -0.34747314453125, -0.251190185546875, -0.1549072265625, -0.058624267578125, 0.03765869140625, 0.133941650390625, 0.230224609375, 0.326507568359375, 0.42279052734375, 0.519073486328125, 0.6153564453125, 0.711639404296875, 0.80792236328125, 0.904205322265625, 1.00048828125, 1.096771240234375, 1.19305419921875, 1.289337158203125, 1.3856201171875, 1.481903076171875, 1.57818603515625, 1.674468994140625, 1.770751953125, 1.867034912109375, 1.96331787109375, 2.059600830078125, 2.1558837890625, 2.252166748046875, 2.34844970703125, 2.444732666015625, 2.541015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 13.0, 12.0, 16.0, 26.0, 34.0, 54.0, 40.0, 68.0, 53.0, 76.0, 81.0, 93.0, 79.0, 65.0, 51.0, 55.0, 44.0, 43.0, 23.0, 19.0, 15.0, 6.0, 7.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.5625, -6.40203857421875, -6.2415771484375, -6.08111572265625, -5.920654296875, -5.76019287109375, -5.5997314453125, -5.43927001953125, -5.27880859375, -5.11834716796875, -4.9578857421875, -4.79742431640625, -4.636962890625, -4.47650146484375, -4.3160400390625, -4.15557861328125, -3.9951171875, -3.83465576171875, -3.6741943359375, -3.51373291015625, -3.353271484375, -3.19281005859375, -3.0323486328125, -2.87188720703125, -2.71142578125, -2.55096435546875, -2.3905029296875, -2.23004150390625, -2.069580078125, -1.90911865234375, -1.7486572265625, -1.58819580078125, -1.427734375, -1.26727294921875, -1.1068115234375, -0.94635009765625, -0.785888671875, -0.62542724609375, -0.4649658203125, -0.30450439453125, -0.14404296875, 0.01641845703125, 0.1768798828125, 0.33734130859375, 0.497802734375, 0.65826416015625, 0.8187255859375, 0.97918701171875, 1.1396484375, 1.30010986328125, 1.4605712890625, 1.62103271484375, 1.781494140625, 1.94195556640625, 2.1024169921875, 2.26287841796875, 2.42333984375, 2.58380126953125, 2.7442626953125, 2.90472412109375, 3.065185546875, 3.22564697265625, 3.3861083984375, 3.54656982421875, 3.70703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 1.0, 6.0, 17.0, 19.0, 44.0, 62.0, 104.0, 231.0, 492.0, 1541.0, 8684.0, 251693.0, 766552.0, 15680.0, 2248.0, 617.0, 276.0, 119.0, 70.0, 32.0, 24.0, 14.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.064453125, -2.0039520263671875, -1.943450927734375, -1.8829498291015625, -1.82244873046875, -1.7619476318359375, -1.701446533203125, -1.6409454345703125, -1.5804443359375, -1.5199432373046875, -1.459442138671875, -1.3989410400390625, -1.33843994140625, -1.2779388427734375, -1.217437744140625, -1.1569366455078125, -1.096435546875, -1.0359344482421875, -0.975433349609375, -0.9149322509765625, -0.85443115234375, -0.7939300537109375, -0.733428955078125, -0.6729278564453125, -0.6124267578125, -0.5519256591796875, -0.491424560546875, -0.4309234619140625, -0.37042236328125, -0.3099212646484375, -0.249420166015625, -0.1889190673828125, -0.12841796875, -0.0679168701171875, -0.007415771484375, 0.0530853271484375, 0.11358642578125, 0.1740875244140625, 0.234588623046875, 0.2950897216796875, 0.3555908203125, 0.4160919189453125, 0.476593017578125, 0.5370941162109375, 0.59759521484375, 0.6580963134765625, 0.718597412109375, 0.7790985107421875, 0.839599609375, 0.9001007080078125, 0.960601806640625, 1.0211029052734375, 1.08160400390625, 1.1421051025390625, 1.202606201171875, 1.2631072998046875, 1.3236083984375, 1.3841094970703125, 1.444610595703125, 1.5051116943359375, 1.56561279296875, 1.6261138916015625, 1.686614990234375, 1.7471160888671875, 1.8076171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 31.0, 70.0, 133.0, 208.0, 244.0, 140.0, 64.0, 47.0, 21.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033402442932128906, -0.00032171234488487244, -0.0003094002604484558, -0.0002970881760120392, -0.00028477609157562256, -0.00027246400713920593, -0.0002601519227027893, -0.0002478398382663727, -0.00023552775382995605, -0.00022321566939353943, -0.0002109035849571228, -0.00019859150052070618, -0.00018627941608428955, -0.00017396733164787292, -0.0001616552472114563, -0.00014934316277503967, -0.00013703107833862305, -0.00012471899390220642, -0.0001124069094657898, -0.00010009482502937317, -8.778274059295654e-05, -7.547065615653992e-05, -6.315857172012329e-05, -5.0846487283706665e-05, -3.853440284729004e-05, -2.6222318410873413e-05, -1.3910233974456787e-05, -1.5981495380401611e-06, 1.0713934898376465e-05, 2.302601933479309e-05, 3.533810377120972e-05, 4.765018820762634e-05, 5.996227264404297e-05, 7.22743570804596e-05, 8.458644151687622e-05, 9.689852595329285e-05, 0.00010921061038970947, 0.0001215226948261261, 0.00013383477926254272, 0.00014614686369895935, 0.00015845894813537598, 0.0001707710325717926, 0.00018308311700820923, 0.00019539520144462585, 0.00020770728588104248, 0.0002200193703174591, 0.00023233145475387573, 0.00024464353919029236, 0.000256955623626709, 0.0002692677080631256, 0.00028157979249954224, 0.00029389187693595886, 0.0003062039613723755, 0.0003185160458087921, 0.00033082813024520874, 0.00034314021468162537, 0.000355452299118042, 0.0003677643835544586, 0.00038007646799087524, 0.00039238855242729187, 0.0004047006368637085, 0.0004170127213001251, 0.00042932480573654175, 0.0004416368901729584, 0.000453948974609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 13.0, 11.0, 17.0, 28.0, 27.0, 42.0, 79.0, 118.0, 161.0, 265.0, 513.0, 1096.0, 2633.0, 9249.0, 52057.0, 595036.0, 341491.0, 34315.0, 6984.0, 2249.0, 931.0, 454.0, 258.0, 148.0, 94.0, 73.0, 40.0, 41.0, 27.0, 15.0, 12.0, 13.0, 9.0, 9.0, 9.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.95849609375, -0.9310302734375, -0.903564453125, -0.8760986328125, -0.8486328125, -0.8211669921875, -0.793701171875, -0.7662353515625, -0.73876953125, -0.7113037109375, -0.683837890625, -0.6563720703125, -0.62890625, -0.6014404296875, -0.573974609375, -0.5465087890625, -0.51904296875, -0.4915771484375, -0.464111328125, -0.4366455078125, -0.4091796875, -0.3817138671875, -0.354248046875, -0.3267822265625, -0.29931640625, -0.2718505859375, -0.244384765625, -0.2169189453125, -0.189453125, -0.1619873046875, -0.134521484375, -0.1070556640625, -0.07958984375, -0.0521240234375, -0.024658203125, 0.0028076171875, 0.0302734375, 0.0577392578125, 0.085205078125, 0.1126708984375, 0.14013671875, 0.1676025390625, 0.195068359375, 0.2225341796875, 0.25, 0.2774658203125, 0.304931640625, 0.3323974609375, 0.35986328125, 0.3873291015625, 0.414794921875, 0.4422607421875, 0.4697265625, 0.4971923828125, 0.524658203125, 0.5521240234375, 0.57958984375, 0.6070556640625, 0.634521484375, 0.6619873046875, 0.689453125, 0.7169189453125, 0.744384765625, 0.7718505859375, 0.79931640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 4.0, 8.0, 15.0, 12.0, 17.0, 29.0, 41.0, 46.0, 57.0, 64.0, 82.0, 72.0, 87.0, 86.0, 68.0, 56.0, 54.0, 44.0, 38.0, 28.0, 20.0, 8.0, 13.0, 13.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.738555908203125, -0.71148681640625, -0.684417724609375, -0.6573486328125, -0.630279541015625, -0.60321044921875, -0.576141357421875, -0.549072265625, -0.522003173828125, -0.49493408203125, -0.467864990234375, -0.4407958984375, -0.413726806640625, -0.38665771484375, -0.359588623046875, -0.33251953125, -0.305450439453125, -0.27838134765625, -0.251312255859375, -0.2242431640625, -0.197174072265625, -0.17010498046875, -0.143035888671875, -0.115966796875, -0.088897705078125, -0.06182861328125, -0.034759521484375, -0.0076904296875, 0.019378662109375, 0.04644775390625, 0.073516845703125, 0.1005859375, 0.127655029296875, 0.15472412109375, 0.181793212890625, 0.2088623046875, 0.235931396484375, 0.26300048828125, 0.290069580078125, 0.317138671875, 0.344207763671875, 0.37127685546875, 0.398345947265625, 0.4254150390625, 0.452484130859375, 0.47955322265625, 0.506622314453125, 0.53369140625, 0.560760498046875, 0.58782958984375, 0.614898681640625, 0.6419677734375, 0.669036865234375, 0.69610595703125, 0.723175048828125, 0.750244140625, 0.777313232421875, 0.80438232421875, 0.831451416015625, 0.8585205078125, 0.885589599609375, 0.91265869140625, 0.939727783203125, 0.966796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 25.0, 71.0, 310.0, 467.0, 104.0, 9.0, 11.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.674224853515625, -58.15066909790039, -56.62711715698242, -55.10356140136719, -53.58000946044922, -52.056453704833984, -50.53289794921875, -49.00934600830078, -47.48579025268555, -45.96223449707031, -44.438682556152344, -42.91512680053711, -41.391571044921875, -39.868019104003906, -38.34446334838867, -36.82090759277344, -35.29735565185547, -33.773799896240234, -32.250247955322266, -30.72669219970703, -29.20313835144043, -27.679584503173828, -26.156028747558594, -24.632474899291992, -23.10892105102539, -21.58536720275879, -20.061813354492188, -18.538257598876953, -17.01470375061035, -15.49114990234375, -13.967595100402832, -12.444040298461914, -10.920482635498047, -9.396928787231445, -7.873373985290527, -6.349819660186768, -4.826265335083008, -3.302711009979248, -1.7791566848754883, -0.2556018829345703, 1.2679519653320312, 2.791506290435791, 4.315060615539551, 5.8386149406433105, 7.36216926574707, 8.885723114013672, 10.40927791595459, 11.932832717895508, 13.45638656616211, 14.979940414428711, 16.503494262695312, 18.027050018310547, 19.55060386657715, 21.07415771484375, 22.597713470458984, 24.121267318725586, 25.644821166992188, 27.16837501525879, 28.69192886352539, 30.215484619140625, 31.739038467407227, 33.26259231567383, 34.78614807128906, 36.30970001220703, 37.833255767822266]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 5.0, 12.0, 13.0, 14.0, 20.0, 20.0, 29.0, 29.0, 37.0, 49.0, 65.0, 55.0, 65.0, 66.0, 76.0, 65.0, 60.0, 44.0, 34.0, 46.0, 31.0, 30.0, 29.0, 20.0, 15.0, 10.0, 18.0, 15.0, 4.0, 3.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.69677734375, -13.10966682434082, -12.522557258605957, -11.935446739196777, -11.348337173461914, -10.761226654052734, -10.174116134643555, -9.587005615234375, -8.999896049499512, -8.412785530090332, -7.825675964355469, -7.238565444946289, -6.651455402374268, -6.064345359802246, -5.477234840393066, -4.890124797821045, -4.303014755249023, -3.715904712677002, -3.1287944316864014, -2.541684150695801, -1.9545741081237793, -1.3674640655517578, -0.7803537845611572, -0.19324350357055664, 0.39386653900146484, 0.9809767007827759, 1.568086862564087, 2.1551971435546875, 2.742307186126709, 3.3294172286987305, 3.916527509689331, 4.503637790679932, 5.090749740600586, 5.677859783172607, 6.264969825744629, 6.852080345153809, 7.43919038772583, 8.026300430297852, 8.613410949707031, 9.200521469116211, 9.787631034851074, 10.374741554260254, 10.961851119995117, 11.548961639404297, 12.136072158813477, 12.72318172454834, 13.31029224395752, 13.897401809692383, 14.484512329101562, 15.071622848510742, 15.658732414245605, 16.24584197998047, 16.83295249938965, 17.420063018798828, 18.007173538208008, 18.594284057617188, 19.181392669677734, 19.768503189086914, 20.355613708496094, 20.94272232055664, 21.52983283996582, 22.116943359375, 22.70405387878418, 23.29116439819336, 23.87827491760254]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 12.0, 7.0, 19.0, 43.0, 74.0, 84.0, 154.0, 288.0, 501.0, 992.0, 2029.0, 4975.0, 14202.0, 50340.0, 423179.0, 2995062.0, 617424.0, 61539.0, 13585.0, 4993.0, 2175.0, 1099.0, 600.0, 366.0, 185.0, 102.0, 87.0, 53.0, 29.0, 20.0, 16.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7802734375, -0.747161865234375, -0.71405029296875, -0.680938720703125, -0.6478271484375, -0.614715576171875, -0.58160400390625, -0.548492431640625, -0.515380859375, -0.482269287109375, -0.44915771484375, -0.416046142578125, -0.3829345703125, -0.349822998046875, -0.31671142578125, -0.283599853515625, -0.25048828125, -0.217376708984375, -0.18426513671875, -0.151153564453125, -0.1180419921875, -0.084930419921875, -0.05181884765625, -0.018707275390625, 0.014404296875, 0.047515869140625, 0.08062744140625, 0.113739013671875, 0.1468505859375, 0.179962158203125, 0.21307373046875, 0.246185302734375, 0.279296875, 0.312408447265625, 0.34552001953125, 0.378631591796875, 0.4117431640625, 0.444854736328125, 0.47796630859375, 0.511077880859375, 0.544189453125, 0.577301025390625, 0.61041259765625, 0.643524169921875, 0.6766357421875, 0.709747314453125, 0.74285888671875, 0.775970458984375, 0.80908203125, 0.842193603515625, 0.87530517578125, 0.908416748046875, 0.9415283203125, 0.974639892578125, 1.00775146484375, 1.040863037109375, 1.073974609375, 1.107086181640625, 1.14019775390625, 1.173309326171875, 1.2064208984375, 1.239532470703125, 1.27264404296875, 1.305755615234375, 1.3388671875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 3.0, 9.0, 4.0, 8.0, 12.0, 10.0, 14.0, 15.0, 17.0, 18.0, 30.0, 24.0, 28.0, 41.0, 48.0, 41.0, 49.0, 63.0, 57.0, 68.0, 41.0, 64.0, 54.0, 53.0, 40.0, 39.0, 35.0, 31.0, 18.0, 19.0, 14.0, 6.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.60888671875, -0.5812759399414062, -0.5536651611328125, -0.5260543823242188, -0.498443603515625, -0.47083282470703125, -0.4432220458984375, -0.41561126708984375, -0.38800048828125, -0.36038970947265625, -0.3327789306640625, -0.30516815185546875, -0.277557373046875, -0.24994659423828125, -0.2223358154296875, -0.19472503662109375, -0.1671142578125, -0.13950347900390625, -0.1118927001953125, -0.08428192138671875, -0.056671142578125, -0.02906036376953125, -0.0014495849609375, 0.02616119384765625, 0.05377197265625, 0.08138275146484375, 0.1089935302734375, 0.13660430908203125, 0.164215087890625, 0.19182586669921875, 0.2194366455078125, 0.24704742431640625, 0.274658203125, 0.30226898193359375, 0.3298797607421875, 0.35749053955078125, 0.385101318359375, 0.41271209716796875, 0.4403228759765625, 0.46793365478515625, 0.49554443359375, 0.5231552124023438, 0.5507659912109375, 0.5783767700195312, 0.605987548828125, 0.6335983276367188, 0.6612091064453125, 0.6888198852539062, 0.7164306640625, 0.7440414428710938, 0.7716522216796875, 0.7992630004882812, 0.826873779296875, 0.8544845581054688, 0.8820953369140625, 0.9097061157226562, 0.93731689453125, 0.9649276733398438, 0.9925384521484375, 1.0201492309570312, 1.047760009765625, 1.0753707885742188, 1.1029815673828125, 1.1305923461914062, 1.158203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 11.0, 22.0, 35.0, 43.0, 57.0, 124.0, 237.0, 514.0, 1250.0, 5052.0, 31882.0, 948313.0, 3146846.0, 49956.0, 7245.0, 1637.0, 533.0, 212.0, 107.0, 45.0, 35.0, 34.0, 25.0, 16.0, 10.0, 12.0, 8.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7578125, -2.687286376953125, -2.61676025390625, -2.546234130859375, -2.4757080078125, -2.405181884765625, -2.33465576171875, -2.264129638671875, -2.193603515625, -2.123077392578125, -2.05255126953125, -1.982025146484375, -1.9114990234375, -1.840972900390625, -1.77044677734375, -1.699920654296875, -1.62939453125, -1.558868408203125, -1.48834228515625, -1.417816162109375, -1.3472900390625, -1.276763916015625, -1.20623779296875, -1.135711669921875, -1.065185546875, -0.994659423828125, -0.92413330078125, -0.853607177734375, -0.7830810546875, -0.712554931640625, -0.64202880859375, -0.571502685546875, -0.5009765625, -0.430450439453125, -0.35992431640625, -0.289398193359375, -0.2188720703125, -0.148345947265625, -0.07781982421875, -0.007293701171875, 0.063232421875, 0.133758544921875, 0.20428466796875, 0.274810791015625, 0.3453369140625, 0.415863037109375, 0.48638916015625, 0.556915283203125, 0.62744140625, 0.697967529296875, 0.76849365234375, 0.839019775390625, 0.9095458984375, 0.980072021484375, 1.05059814453125, 1.121124267578125, 1.191650390625, 1.262176513671875, 1.33270263671875, 1.403228759765625, 1.4737548828125, 1.544281005859375, 1.61480712890625, 1.685333251953125, 1.755859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 6.0, 10.0, 4.0, 8.0, 12.0, 15.0, 27.0, 27.0, 36.0, 59.0, 101.0, 157.0, 317.0, 712.0, 1028.0, 753.0, 350.0, 157.0, 88.0, 44.0, 43.0, 18.0, 18.0, 13.0, 11.0, 15.0, 8.0, 6.0, 5.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.16796875, -2.1130828857421875, -2.058197021484375, -2.0033111572265625, -1.94842529296875, -1.8935394287109375, -1.838653564453125, -1.7837677001953125, -1.7288818359375, -1.6739959716796875, -1.619110107421875, -1.5642242431640625, -1.50933837890625, -1.4544525146484375, -1.399566650390625, -1.3446807861328125, -1.289794921875, -1.2349090576171875, -1.180023193359375, -1.1251373291015625, -1.07025146484375, -1.0153656005859375, -0.960479736328125, -0.9055938720703125, -0.8507080078125, -0.7958221435546875, -0.740936279296875, -0.6860504150390625, -0.63116455078125, -0.5762786865234375, -0.521392822265625, -0.4665069580078125, -0.41162109375, -0.3567352294921875, -0.301849365234375, -0.2469635009765625, -0.19207763671875, -0.1371917724609375, -0.082305908203125, -0.0274200439453125, 0.0274658203125, 0.0823516845703125, 0.137237548828125, 0.1921234130859375, 0.24700927734375, 0.3018951416015625, 0.356781005859375, 0.4116668701171875, 0.466552734375, 0.5214385986328125, 0.576324462890625, 0.6312103271484375, 0.68609619140625, 0.7409820556640625, 0.795867919921875, 0.8507537841796875, 0.9056396484375, 0.9605255126953125, 1.015411376953125, 1.0702972412109375, 1.12518310546875, 1.1800689697265625, 1.234954833984375, 1.2898406982421875, 1.3447265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 16.0, 56.0, 116.0, 241.0, 269.0, 175.0, 63.0, 18.0, 12.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4849853515625, -19.87091636657715, -19.256847381591797, -18.642778396606445, -18.028709411621094, -17.414640426635742, -16.80057144165039, -16.18650245666504, -15.572433471679688, -14.958364486694336, -14.344295501708984, -13.730226516723633, -13.116157531738281, -12.50208854675293, -11.888019561767578, -11.273950576782227, -10.659881591796875, -10.045812606811523, -9.431743621826172, -8.81767463684082, -8.203605651855469, -7.589536666870117, -6.975467681884766, -6.361398696899414, -5.7473297119140625, -5.133260726928711, -4.519191741943359, -3.905122756958008, -3.2910537719726562, -2.6769847869873047, -2.062915802001953, -1.4488468170166016, -0.8347797393798828, -0.22071075439453125, 0.3933582305908203, 1.0074272155761719, 1.6214962005615234, 2.235565185546875, 2.8496341705322266, 3.463703155517578, 4.07777214050293, 4.691841125488281, 5.305910110473633, 5.919979095458984, 6.534048080444336, 7.1481170654296875, 7.762186050415039, 8.37625503540039, 8.990324020385742, 9.604393005371094, 10.218461990356445, 10.832530975341797, 11.446599960327148, 12.0606689453125, 12.674737930297852, 13.288806915283203, 13.902875900268555, 14.516944885253906, 15.131013870239258, 15.74508285522461, 16.35915184020996, 16.973220825195312, 17.587289810180664, 18.201358795166016, 18.815427780151367]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 19.0, 11.0, 5.0, 19.0, 14.0, 24.0, 23.0, 23.0, 22.0, 31.0, 40.0, 39.0, 37.0, 61.0, 47.0, 59.0, 46.0, 47.0, 58.0, 47.0, 65.0, 40.0, 43.0, 31.0, 28.0, 20.0, 22.0, 14.0, 15.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.67354965209961, -8.42505931854248, -8.176568031311035, -7.928077220916748, -7.679586410522461, -7.431096076965332, -7.182604789733887, -6.934114456176758, -6.685623645782471, -6.437132835388184, -6.1886420249938965, -5.940151214599609, -5.691660404205322, -5.443169593811035, -5.194679260253906, -4.946188449859619, -4.697697639465332, -4.449206829071045, -4.200716018676758, -3.9522252082824707, -3.7037346363067627, -3.4552438259124756, -3.2067530155181885, -2.9582624435424805, -2.709771156311035, -2.461280345916748, -2.212789535522461, -1.9642988443374634, -1.7158081531524658, -1.4673173427581787, -1.2188265323638916, -0.970335841178894, -0.7218451499938965, -0.47335439920425415, -0.22486361861228943, 0.023627161979675293, 0.2721179127693176, 0.52060866355896, 0.7690994739532471, 1.0175901651382446, 1.2660809755325317, 1.5145717859268188, 1.7630624771118164, 2.0115532875061035, 2.2600440979003906, 2.5085349082946777, 2.757025718688965, 3.005516290664673, 3.25400710105896, 3.502497911453247, 3.750988721847534, 3.999479293823242, 4.247970104217529, 4.496460914611816, 4.7449517250061035, 4.993442535400391, 5.241933345794678, 5.490424156188965, 5.738914966583252, 5.987405776977539, 6.235896587371826, 6.484387397766113, 6.732877731323242, 6.981368541717529, 7.229859352111816]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 20.0, 26.0, 40.0, 62.0, 86.0, 160.0, 266.0, 414.0, 659.0, 1326.0, 2510.0, 5295.0, 11824.0, 29277.0, 75233.0, 192931.0, 340281.0, 231265.0, 93445.0, 36044.0, 14661.0, 6303.0, 2845.0, 1547.0, 811.0, 493.0, 276.0, 169.0, 89.0, 59.0, 44.0, 26.0, 27.0, 8.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8629074096679688, -0.8327484130859375, -0.8025894165039062, -0.772430419921875, -0.7422714233398438, -0.7121124267578125, -0.6819534301757812, -0.65179443359375, -0.6216354370117188, -0.5914764404296875, -0.5613174438476562, -0.531158447265625, -0.5009994506835938, -0.4708404541015625, -0.44068145751953125, -0.4105224609375, -0.38036346435546875, -0.3502044677734375, -0.32004547119140625, -0.289886474609375, -0.25972747802734375, -0.2295684814453125, -0.19940948486328125, -0.16925048828125, -0.13909149169921875, -0.1089324951171875, -0.07877349853515625, -0.048614501953125, -0.01845550537109375, 0.0117034912109375, 0.04186248779296875, 0.072021484375, 0.10218048095703125, 0.1323394775390625, 0.16249847412109375, 0.192657470703125, 0.22281646728515625, 0.2529754638671875, 0.28313446044921875, 0.31329345703125, 0.34345245361328125, 0.3736114501953125, 0.40377044677734375, 0.433929443359375, 0.46408843994140625, 0.4942474365234375, 0.5244064331054688, 0.5545654296875, 0.5847244262695312, 0.6148834228515625, 0.6450424194335938, 0.675201416015625, 0.7053604125976562, 0.7355194091796875, 0.7656784057617188, 0.79583740234375, 0.8259963989257812, 0.8561553955078125, 0.8863143920898438, 0.916473388671875, 0.9466323852539062, 0.9767913818359375, 1.0069503784179688, 1.037109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 11.0, 4.0, 9.0, 6.0, 15.0, 17.0, 15.0, 20.0, 31.0, 23.0, 38.0, 27.0, 41.0, 62.0, 58.0, 60.0, 54.0, 51.0, 63.0, 57.0, 66.0, 40.0, 43.0, 41.0, 33.0, 25.0, 26.0, 17.0, 17.0, 10.0, 9.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68359375, -0.65625, -0.62890625, -0.6015625, -0.57421875, -0.546875, -0.51953125, -0.4921875, -0.46484375, -0.4375, -0.41015625, -0.3828125, -0.35546875, -0.328125, -0.30078125, -0.2734375, -0.24609375, -0.21875, -0.19140625, -0.1640625, -0.13671875, -0.109375, -0.08203125, -0.0546875, -0.02734375, 0.0, 0.02734375, 0.0546875, 0.08203125, 0.109375, 0.13671875, 0.1640625, 0.19140625, 0.21875, 0.24609375, 0.2734375, 0.30078125, 0.328125, 0.35546875, 0.3828125, 0.41015625, 0.4375, 0.46484375, 0.4921875, 0.51953125, 0.546875, 0.57421875, 0.6015625, 0.62890625, 0.65625, 0.68359375, 0.7109375, 0.73828125, 0.765625, 0.79296875, 0.8203125, 0.84765625, 0.875, 0.90234375, 0.9296875, 0.95703125, 0.984375, 1.01171875, 1.0390625, 1.06640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 0.0, 4.0, 6.0, 11.0, 7.0, 11.0, 24.0, 17.0, 28.0, 46.0, 40.0, 52.0, 63.0, 87.0, 132.0, 159.0, 183.0, 278.0, 398.0, 608.0, 904.0, 1759.0, 4255.0, 15313.0, 91048.0, 660537.0, 228063.0, 31364.0, 7044.0, 2453.0, 1149.0, 703.0, 454.0, 335.0, 237.0, 179.0, 147.0, 93.0, 85.0, 58.0, 40.0, 39.0, 33.0, 28.0, 22.0, 18.0, 10.0, 12.0, 4.0, 4.0, 4.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-1.978515625, -1.9180450439453125, -1.857574462890625, -1.7971038818359375, -1.73663330078125, -1.6761627197265625, -1.615692138671875, -1.5552215576171875, -1.4947509765625, -1.4342803955078125, -1.373809814453125, -1.3133392333984375, -1.25286865234375, -1.1923980712890625, -1.131927490234375, -1.0714569091796875, -1.010986328125, -0.9505157470703125, -0.890045166015625, -0.8295745849609375, -0.76910400390625, -0.7086334228515625, -0.648162841796875, -0.5876922607421875, -0.5272216796875, -0.4667510986328125, -0.406280517578125, -0.3458099365234375, -0.28533935546875, -0.2248687744140625, -0.164398193359375, -0.1039276123046875, -0.04345703125, 0.0170135498046875, 0.077484130859375, 0.1379547119140625, 0.19842529296875, 0.2588958740234375, 0.319366455078125, 0.3798370361328125, 0.4403076171875, 0.5007781982421875, 0.561248779296875, 0.6217193603515625, 0.68218994140625, 0.7426605224609375, 0.803131103515625, 0.8636016845703125, 0.924072265625, 0.9845428466796875, 1.045013427734375, 1.1054840087890625, 1.16595458984375, 1.2264251708984375, 1.286895751953125, 1.3473663330078125, 1.4078369140625, 1.4683074951171875, 1.528778076171875, 1.5892486572265625, 1.64971923828125, 1.7101898193359375, 1.770660400390625, 1.8311309814453125, 1.8916015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 9.0, 5.0, 8.0, 4.0, 8.0, 12.0, 11.0, 6.0, 19.0, 15.0, 21.0, 23.0, 27.0, 26.0, 51.0, 44.0, 36.0, 41.0, 47.0, 51.0, 61.0, 46.0, 34.0, 44.0, 49.0, 36.0, 43.0, 33.0, 27.0, 25.0, 26.0, 23.0, 12.0, 15.0, 9.0, 18.0, 4.0, 7.0, 12.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.83203125, -2.734161376953125, -2.63629150390625, -2.538421630859375, -2.4405517578125, -2.342681884765625, -2.24481201171875, -2.146942138671875, -2.049072265625, -1.951202392578125, -1.85333251953125, -1.755462646484375, -1.6575927734375, -1.559722900390625, -1.46185302734375, -1.363983154296875, -1.26611328125, -1.168243408203125, -1.07037353515625, -0.972503662109375, -0.8746337890625, -0.776763916015625, -0.67889404296875, -0.581024169921875, -0.483154296875, -0.385284423828125, -0.28741455078125, -0.189544677734375, -0.0916748046875, 0.006195068359375, 0.10406494140625, 0.201934814453125, 0.2998046875, 0.397674560546875, 0.49554443359375, 0.593414306640625, 0.6912841796875, 0.789154052734375, 0.88702392578125, 0.984893798828125, 1.082763671875, 1.180633544921875, 1.27850341796875, 1.376373291015625, 1.4742431640625, 1.572113037109375, 1.66998291015625, 1.767852783203125, 1.86572265625, 1.963592529296875, 2.06146240234375, 2.159332275390625, 2.2572021484375, 2.355072021484375, 2.45294189453125, 2.550811767578125, 2.648681640625, 2.746551513671875, 2.84442138671875, 2.942291259765625, 3.0401611328125, 3.138031005859375, 3.23590087890625, 3.333770751953125, 3.431640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 17.0, 24.0, 29.0, 53.0, 70.0, 151.0, 365.0, 1019.0, 4580.0, 48778.0, 956226.0, 31871.0, 3793.0, 870.0, 302.0, 155.0, 68.0, 52.0, 36.0, 11.0, 16.0, 14.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.46484375, -1.416717529296875, -1.36859130859375, -1.320465087890625, -1.2723388671875, -1.224212646484375, -1.17608642578125, -1.127960205078125, -1.079833984375, -1.031707763671875, -0.98358154296875, -0.935455322265625, -0.8873291015625, -0.839202880859375, -0.79107666015625, -0.742950439453125, -0.69482421875, -0.646697998046875, -0.59857177734375, -0.550445556640625, -0.5023193359375, -0.454193115234375, -0.40606689453125, -0.357940673828125, -0.309814453125, -0.261688232421875, -0.21356201171875, -0.165435791015625, -0.1173095703125, -0.069183349609375, -0.02105712890625, 0.027069091796875, 0.0751953125, 0.123321533203125, 0.17144775390625, 0.219573974609375, 0.2677001953125, 0.315826416015625, 0.36395263671875, 0.412078857421875, 0.460205078125, 0.508331298828125, 0.55645751953125, 0.604583740234375, 0.6527099609375, 0.700836181640625, 0.74896240234375, 0.797088623046875, 0.84521484375, 0.893341064453125, 0.94146728515625, 0.989593505859375, 1.0377197265625, 1.085845947265625, 1.13397216796875, 1.182098388671875, 1.230224609375, 1.278350830078125, 1.32647705078125, 1.374603271484375, 1.4227294921875, 1.470855712890625, 1.51898193359375, 1.567108154296875, 1.615234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 5.0, 7.0, 23.0, 20.0, 36.0, 56.0, 109.0, 158.0, 200.0, 124.0, 88.0, 63.0, 30.0, 22.0, 10.0, 8.0, 9.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024127960205078125, -0.00023337453603744507, -0.0002254694700241089, -0.0002175644040107727, -0.00020965933799743652, -0.00020175427198410034, -0.00019384920597076416, -0.00018594413995742798, -0.0001780390739440918, -0.00017013400793075562, -0.00016222894191741943, -0.00015432387590408325, -0.00014641880989074707, -0.0001385137438774109, -0.0001306086778640747, -0.00012270361185073853, -0.00011479854583740234, -0.00010689347982406616, -9.898841381072998e-05, -9.10833477973938e-05, -8.317828178405762e-05, -7.527321577072144e-05, -6.736814975738525e-05, -5.946308374404907e-05, -5.155801773071289e-05, -4.365295171737671e-05, -3.574788570404053e-05, -2.7842819690704346e-05, -1.9937753677368164e-05, -1.2032687664031982e-05, -4.127621650695801e-06, 3.777444362640381e-06, 1.1682510375976562e-05, 1.9587576389312744e-05, 2.7492642402648926e-05, 3.539770841598511e-05, 4.330277442932129e-05, 5.120784044265747e-05, 5.911290645599365e-05, 6.701797246932983e-05, 7.492303848266602e-05, 8.28281044960022e-05, 9.073317050933838e-05, 9.863823652267456e-05, 0.00010654330253601074, 0.00011444836854934692, 0.0001223534345626831, 0.0001302585005760193, 0.00013816356658935547, 0.00014606863260269165, 0.00015397369861602783, 0.00016187876462936401, 0.0001697838306427002, 0.00017768889665603638, 0.00018559396266937256, 0.00019349902868270874, 0.00020140409469604492, 0.0002093091607093811, 0.00021721422672271729, 0.00022511929273605347, 0.00023302435874938965, 0.00024092942476272583, 0.000248834490776062, 0.0002567395567893982, 0.0002646446228027344]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 14.0, 21.0, 23.0, 43.0, 60.0, 83.0, 138.0, 339.0, 906.0, 3032.0, 17444.0, 789835.0, 222703.0, 10377.0, 2173.0, 684.0, 299.0, 121.0, 75.0, 51.0, 24.0, 24.0, 16.0, 14.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3416900634765625, -1.299591064453125, -1.2574920654296875, -1.21539306640625, -1.1732940673828125, -1.131195068359375, -1.0890960693359375, -1.0469970703125, -1.0048980712890625, -0.962799072265625, -0.9207000732421875, -0.87860107421875, -0.8365020751953125, -0.794403076171875, -0.7523040771484375, -0.710205078125, -0.6681060791015625, -0.626007080078125, -0.5839080810546875, -0.54180908203125, -0.4997100830078125, -0.457611083984375, -0.4155120849609375, -0.3734130859375, -0.3313140869140625, -0.289215087890625, -0.2471160888671875, -0.20501708984375, -0.1629180908203125, -0.120819091796875, -0.0787200927734375, -0.03662109375, 0.0054779052734375, 0.047576904296875, 0.0896759033203125, 0.13177490234375, 0.1738739013671875, 0.215972900390625, 0.2580718994140625, 0.3001708984375, 0.3422698974609375, 0.384368896484375, 0.4264678955078125, 0.46856689453125, 0.5106658935546875, 0.552764892578125, 0.5948638916015625, 0.636962890625, 0.6790618896484375, 0.721160888671875, 0.7632598876953125, 0.80535888671875, 0.8474578857421875, 0.889556884765625, 0.9316558837890625, 0.9737548828125, 1.0158538818359375, 1.057952880859375, 1.1000518798828125, 1.14215087890625, 1.1842498779296875, 1.226348876953125, 1.2684478759765625, 1.310546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 8.0, 8.0, 9.0, 16.0, 19.0, 19.0, 26.0, 40.0, 49.0, 61.0, 76.0, 94.0, 131.0, 90.0, 83.0, 59.0, 53.0, 38.0, 29.0, 15.0, 17.0, 11.0, 11.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7275390625, -0.705535888671875, -0.68353271484375, -0.661529541015625, -0.6395263671875, -0.617523193359375, -0.59552001953125, -0.573516845703125, -0.551513671875, -0.529510498046875, -0.50750732421875, -0.485504150390625, -0.4635009765625, -0.441497802734375, -0.41949462890625, -0.397491455078125, -0.37548828125, -0.353485107421875, -0.33148193359375, -0.309478759765625, -0.2874755859375, -0.265472412109375, -0.24346923828125, -0.221466064453125, -0.199462890625, -0.177459716796875, -0.15545654296875, -0.133453369140625, -0.1114501953125, -0.089447021484375, -0.06744384765625, -0.045440673828125, -0.0234375, -0.001434326171875, 0.02056884765625, 0.042572021484375, 0.0645751953125, 0.086578369140625, 0.10858154296875, 0.130584716796875, 0.152587890625, 0.174591064453125, 0.19659423828125, 0.218597412109375, 0.2406005859375, 0.262603759765625, 0.28460693359375, 0.306610107421875, 0.32861328125, 0.350616455078125, 0.37261962890625, 0.394622802734375, 0.4166259765625, 0.438629150390625, 0.46063232421875, 0.482635498046875, 0.504638671875, 0.526641845703125, 0.54864501953125, 0.570648193359375, 0.5926513671875, 0.614654541015625, 0.63665771484375, 0.658660888671875, 0.6806640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 13.0, 9.0, 40.0, 83.0, 142.0, 272.0, 244.0, 95.0, 55.0, 23.0, 12.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.1849308013916, -23.5288028717041, -22.8726749420166, -22.216548919677734, -21.560420989990234, -20.904293060302734, -20.248165130615234, -19.592037200927734, -18.935909271240234, -18.279781341552734, -17.623653411865234, -16.967527389526367, -16.311399459838867, -15.655271530151367, -14.999143600463867, -14.343015670776367, -13.6868896484375, -13.03076171875, -12.374634742736816, -11.718506813049316, -11.062379837036133, -10.406251907348633, -9.750123977661133, -9.093996047973633, -8.43786907196045, -7.781741619110107, -7.125614166259766, -6.469486236572266, -5.813358783721924, -5.157231330871582, -4.501103401184082, -3.8449759483337402, -3.1888465881347656, -2.532719135284424, -1.876591444015503, -1.2204638719558716, -0.5643362998962402, 0.09179115295410156, 0.7479188442230225, 1.4040465354919434, 2.060173988342285, 2.716301441192627, 3.372429132461548, 4.028556823730469, 4.6846842765808105, 5.340811729431152, 5.996939659118652, 6.653067111968994, 7.309194564819336, 7.965322017669678, 8.62144947052002, 9.27757740020752, 9.933704376220703, 10.589832305908203, 11.245960235595703, 11.902088165283203, 12.558215141296387, 13.214343070983887, 13.87047004699707, 14.52659797668457, 15.18272590637207, 15.838852882385254, 16.494979858398438, 17.151107788085938, 17.807235717773438]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 11.0, 22.0, 13.0, 14.0, 21.0, 22.0, 22.0, 20.0, 28.0, 34.0, 19.0, 35.0, 57.0, 55.0, 57.0, 75.0, 77.0, 51.0, 35.0, 38.0, 43.0, 36.0, 24.0, 32.0, 27.0, 16.0, 14.0, 17.0, 17.0, 13.0, 9.0, 12.0, 4.0, 6.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0], "bins": [-16.52168083190918, -16.101119995117188, -15.680558204650879, -15.259997367858887, -14.839435577392578, -14.418874740600586, -13.998313903808594, -13.577753067016602, -13.157191276550293, -12.7366304397583, -12.316068649291992, -11.8955078125, -11.474946975708008, -11.0543851852417, -10.633824348449707, -10.213262557983398, -9.792701721191406, -9.372140884399414, -8.951579093933105, -8.531018257141113, -8.110456466674805, -7.6898956298828125, -7.26933479309082, -6.84877347946167, -6.4282121658325195, -6.007650852203369, -5.587089538574219, -5.166528701782227, -4.745967388153076, -4.325406074523926, -3.9048449993133545, -3.484283924102783, -3.0637216567993164, -2.643160343170166, -2.2225992679595947, -1.8020380735397339, -1.381476879119873, -0.9609155654907227, -0.5403544902801514, -0.11979341506958008, 0.3007678985595703, 0.7213290929794312, 1.141890287399292, 1.5624514818191528, 1.9830126762390137, 2.403573989868164, 2.8241350650787354, 3.2446961402893066, 3.665257453918457, 4.085818767547607, 4.506380081176758, 4.92694091796875, 5.3475022315979, 5.768063545227051, 6.188624382019043, 6.609185695648193, 7.029747009277344, 7.450308322906494, 7.8708696365356445, 8.291430473327637, 8.711992263793945, 9.132553100585938, 9.55311393737793, 9.973674774169922, 10.39423656463623]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 11.0, 14.0, 10.0, 12.0, 27.0, 37.0, 43.0, 56.0, 70.0, 124.0, 182.0, 340.0, 611.0, 1235.0, 2556.0, 6729.0, 23107.0, 123401.0, 867678.0, 2411322.0, 636301.0, 89584.0, 18707.0, 6430.0, 2833.0, 1294.0, 632.0, 349.0, 184.0, 146.0, 66.0, 45.0, 48.0, 28.0, 23.0, 12.0, 12.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6026763916015625, -0.579864501953125, -0.5570526123046875, -0.53424072265625, -0.5114288330078125, -0.488616943359375, -0.4658050537109375, -0.4429931640625, -0.4201812744140625, -0.397369384765625, -0.3745574951171875, -0.35174560546875, -0.3289337158203125, -0.306121826171875, -0.2833099365234375, -0.260498046875, -0.2376861572265625, -0.214874267578125, -0.1920623779296875, -0.16925048828125, -0.1464385986328125, -0.123626708984375, -0.1008148193359375, -0.0780029296875, -0.0551910400390625, -0.032379150390625, -0.0095672607421875, 0.01324462890625, 0.0360565185546875, 0.058868408203125, 0.0816802978515625, 0.1044921875, 0.1273040771484375, 0.150115966796875, 0.1729278564453125, 0.19573974609375, 0.2185516357421875, 0.241363525390625, 0.2641754150390625, 0.2869873046875, 0.3097991943359375, 0.332611083984375, 0.3554229736328125, 0.37823486328125, 0.4010467529296875, 0.423858642578125, 0.4466705322265625, 0.469482421875, 0.4922943115234375, 0.515106201171875, 0.5379180908203125, 0.56072998046875, 0.5835418701171875, 0.606353759765625, 0.6291656494140625, 0.6519775390625, 0.6747894287109375, 0.697601318359375, 0.7204132080078125, 0.74322509765625, 0.7660369873046875, 0.788848876953125, 0.8116607666015625, 0.83447265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 5.0, 7.0, 12.0, 21.0, 26.0, 24.0, 27.0, 36.0, 60.0, 41.0, 63.0, 62.0, 80.0, 73.0, 66.0, 62.0, 59.0, 56.0, 46.0, 38.0, 34.0, 32.0, 23.0, 12.0, 10.0, 8.0, 6.0, 10.0, 6.0, 2.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3820114135742188, -1.3509368896484375, -1.3198623657226562, -1.288787841796875, -1.2577133178710938, -1.2266387939453125, -1.1955642700195312, -1.16448974609375, -1.1334152221679688, -1.1023406982421875, -1.0712661743164062, -1.040191650390625, -1.0091171264648438, -0.9780426025390625, -0.9469680786132812, -0.9158935546875, -0.8848190307617188, -0.8537445068359375, -0.8226699829101562, -0.791595458984375, -0.7605209350585938, -0.7294464111328125, -0.6983718872070312, -0.66729736328125, -0.6362228393554688, -0.6051483154296875, -0.5740737915039062, -0.542999267578125, -0.5119247436523438, -0.4808502197265625, -0.44977569580078125, -0.418701171875, -0.38762664794921875, -0.3565521240234375, -0.32547760009765625, -0.294403076171875, -0.26332855224609375, -0.2322540283203125, -0.20117950439453125, -0.17010498046875, -0.13903045654296875, -0.1079559326171875, -0.07688140869140625, -0.045806884765625, -0.01473236083984375, 0.0163421630859375, 0.04741668701171875, 0.0784912109375, 0.10956573486328125, 0.1406402587890625, 0.17171478271484375, 0.202789306640625, 0.23386383056640625, 0.2649383544921875, 0.29601287841796875, 0.32708740234375, 0.35816192626953125, 0.3892364501953125, 0.42031097412109375, 0.451385498046875, 0.48246002197265625, 0.5135345458984375, 0.5446090698242188, 0.57568359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 9.0, 4.0, 15.0, 15.0, 20.0, 42.0, 62.0, 112.0, 213.0, 342.0, 678.0, 1551.0, 4548.0, 18603.0, 148192.0, 3584400.0, 390295.0, 33145.0, 7320.0, 2482.0, 1028.0, 524.0, 263.0, 167.0, 74.0, 70.0, 28.0, 21.0, 12.0, 8.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.5927734375, -1.5467987060546875, -1.500823974609375, -1.4548492431640625, -1.40887451171875, -1.3628997802734375, -1.316925048828125, -1.2709503173828125, -1.2249755859375, -1.1790008544921875, -1.133026123046875, -1.0870513916015625, -1.04107666015625, -0.9951019287109375, -0.949127197265625, -0.9031524658203125, -0.857177734375, -0.8112030029296875, -0.765228271484375, -0.7192535400390625, -0.67327880859375, -0.6273040771484375, -0.581329345703125, -0.5353546142578125, -0.4893798828125, -0.4434051513671875, -0.397430419921875, -0.3514556884765625, -0.30548095703125, -0.2595062255859375, -0.213531494140625, -0.1675567626953125, -0.12158203125, -0.0756072998046875, -0.029632568359375, 0.0163421630859375, 0.06231689453125, 0.1082916259765625, 0.154266357421875, 0.2002410888671875, 0.2462158203125, 0.2921905517578125, 0.338165283203125, 0.3841400146484375, 0.43011474609375, 0.4760894775390625, 0.522064208984375, 0.5680389404296875, 0.614013671875, 0.6599884033203125, 0.705963134765625, 0.7519378662109375, 0.79791259765625, 0.8438873291015625, 0.889862060546875, 0.9358367919921875, 0.9818115234375, 1.0277862548828125, 1.073760986328125, 1.1197357177734375, 1.16571044921875, 1.2116851806640625, 1.257659912109375, 1.3036346435546875, 1.349609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 6.0, 2.0, 18.0, 26.0, 61.0, 69.0, 149.0, 355.0, 709.0, 1054.0, 851.0, 361.0, 160.0, 81.0, 44.0, 32.0, 22.0, 16.0, 12.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.342803955078125, -1.28326416015625, -1.223724365234375, -1.1641845703125, -1.104644775390625, -1.04510498046875, -0.985565185546875, -0.926025390625, -0.866485595703125, -0.80694580078125, -0.747406005859375, -0.6878662109375, -0.628326416015625, -0.56878662109375, -0.509246826171875, -0.44970703125, -0.390167236328125, -0.33062744140625, -0.271087646484375, -0.2115478515625, -0.152008056640625, -0.09246826171875, -0.032928466796875, 0.026611328125, 0.086151123046875, 0.14569091796875, 0.205230712890625, 0.2647705078125, 0.324310302734375, 0.38385009765625, 0.443389892578125, 0.5029296875, 0.562469482421875, 0.62200927734375, 0.681549072265625, 0.7410888671875, 0.800628662109375, 0.86016845703125, 0.919708251953125, 0.979248046875, 1.038787841796875, 1.09832763671875, 1.157867431640625, 1.2174072265625, 1.276947021484375, 1.33648681640625, 1.396026611328125, 1.45556640625, 1.515106201171875, 1.57464599609375, 1.634185791015625, 1.6937255859375, 1.753265380859375, 1.81280517578125, 1.872344970703125, 1.931884765625, 1.991424560546875, 2.05096435546875, 2.110504150390625, 2.1700439453125, 2.229583740234375, 2.28912353515625, 2.348663330078125, 2.408203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 9.0, 17.0, 59.0, 124.0, 255.0, 280.0, 147.0, 59.0, 17.0, 13.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.396169662475586, -11.836724281311035, -11.277278900146484, -10.71783447265625, -10.1583890914917, -9.598943710327148, -9.039499282836914, -8.480053901672363, -7.9206085205078125, -7.361163139343262, -6.801718235015869, -6.242273330688477, -5.682827949523926, -5.123382568359375, -4.563937664031982, -4.00449275970459, -3.445047378540039, -2.8856022357940674, -2.3261570930480957, -1.766711950302124, -1.2072668075561523, -0.6478216648101807, -0.08837652206420898, 0.4710686206817627, 1.0305137634277344, 1.589958906173706, 2.1494040489196777, 2.7088491916656494, 3.268294334411621, 3.8277394771575928, 4.3871846199035645, 4.946629524230957, 5.506076812744141, 6.065522193908691, 6.624967098236084, 7.184412002563477, 7.743857383728027, 8.303302764892578, 8.862747192382812, 9.422192573547363, 9.981637954711914, 10.541083335876465, 11.100528717041016, 11.65997314453125, 12.2194185256958, 12.778863906860352, 13.338308334350586, 13.897753715515137, 14.457199096679688, 15.016644477844238, 15.576089859008789, 16.135534286499023, 16.69498062133789, 17.254425048828125, 17.81386947631836, 18.373315811157227, 18.93276023864746, 19.492204666137695, 20.051651000976562, 20.611095428466797, 21.17053985595703, 21.7299861907959, 22.289430618286133, 22.848876953125, 23.408321380615234]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 6.0, 5.0, 2.0, 9.0, 14.0, 20.0, 25.0, 33.0, 38.0, 52.0, 59.0, 70.0, 84.0, 85.0, 79.0, 80.0, 69.0, 58.0, 64.0, 35.0, 33.0, 26.0, 15.0, 16.0, 9.0, 5.0, 9.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.438441753387451, -6.079217433929443, -5.7199931144714355, -5.360769271850586, -5.001544952392578, -4.64232063293457, -4.2830963134765625, -3.9238719940185547, -3.564647674560547, -3.205423355102539, -2.8461990356445312, -2.4869749546051025, -2.1277506351470947, -1.768526315689087, -1.4093022346496582, -1.0500779151916504, -0.6908535957336426, -0.33162933588027954, 0.027594923973083496, 0.38681912422180176, 0.7460434436798096, 1.1052677631378174, 1.464491844177246, 1.823716163635254, 2.1829404830932617, 2.5421648025512695, 2.9013891220092773, 3.260613203048706, 3.619837522506714, 3.9790618419647217, 4.33828592300415, 4.697510242462158, 5.056734085083008, 5.415958404541016, 5.775182723999023, 6.134407043457031, 6.493631362915039, 6.852855682373047, 7.2120795249938965, 7.571303844451904, 7.930528163909912, 8.289752006530762, 8.64897632598877, 9.008200645446777, 9.367424964904785, 9.726649284362793, 10.0858736038208, 10.445097923278809, 10.804322242736816, 11.163546562194824, 11.522770881652832, 11.88199520111084, 12.241219520568848, 12.600443840026855, 12.959667205810547, 13.318891525268555, 13.678115844726562, 14.03734016418457, 14.396564483642578, 14.755788803100586, 15.115013122558594, 15.474237442016602, 15.83346176147461, 16.192686080932617, 16.551910400390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 1.0, 5.0, 13.0, 20.0, 25.0, 40.0, 73.0, 91.0, 181.0, 366.0, 595.0, 1205.0, 2368.0, 5045.0, 11011.0, 26206.0, 63823.0, 157310.0, 320730.0, 264593.0, 114039.0, 45595.0, 19181.0, 8205.0, 3842.0, 1857.0, 951.0, 491.0, 293.0, 186.0, 80.0, 48.0, 25.0, 17.0, 10.0, 9.0, 11.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98974609375, -0.960479736328125, -0.93121337890625, -0.901947021484375, -0.8726806640625, -0.843414306640625, -0.81414794921875, -0.784881591796875, -0.755615234375, -0.726348876953125, -0.69708251953125, -0.667816162109375, -0.6385498046875, -0.609283447265625, -0.58001708984375, -0.550750732421875, -0.521484375, -0.492218017578125, -0.46295166015625, -0.433685302734375, -0.4044189453125, -0.375152587890625, -0.34588623046875, -0.316619873046875, -0.287353515625, -0.258087158203125, -0.22882080078125, -0.199554443359375, -0.1702880859375, -0.141021728515625, -0.11175537109375, -0.082489013671875, -0.05322265625, -0.023956298828125, 0.00531005859375, 0.034576416015625, 0.0638427734375, 0.093109130859375, 0.12237548828125, 0.151641845703125, 0.180908203125, 0.210174560546875, 0.23944091796875, 0.268707275390625, 0.2979736328125, 0.327239990234375, 0.35650634765625, 0.385772705078125, 0.4150390625, 0.444305419921875, 0.47357177734375, 0.502838134765625, 0.5321044921875, 0.561370849609375, 0.59063720703125, 0.619903564453125, 0.649169921875, 0.678436279296875, 0.70770263671875, 0.736968994140625, 0.7662353515625, 0.795501708984375, 0.82476806640625, 0.854034423828125, 0.88330078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 8.0, 5.0, 10.0, 17.0, 12.0, 13.0, 11.0, 10.0, 21.0, 27.0, 18.0, 26.0, 35.0, 32.0, 38.0, 56.0, 41.0, 37.0, 33.0, 38.0, 39.0, 43.0, 35.0, 40.0, 36.0, 44.0, 36.0, 29.0, 27.0, 27.0, 17.0, 25.0, 21.0, 19.0, 15.0, 16.0, 4.0, 11.0, 9.0, 5.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.630859375, -0.6124343872070312, -0.5940093994140625, -0.5755844116210938, -0.557159423828125, -0.5387344360351562, -0.5203094482421875, -0.5018844604492188, -0.48345947265625, -0.46503448486328125, -0.4466094970703125, -0.42818450927734375, -0.409759521484375, -0.39133453369140625, -0.3729095458984375, -0.35448455810546875, -0.3360595703125, -0.31763458251953125, -0.2992095947265625, -0.28078460693359375, -0.262359619140625, -0.24393463134765625, -0.2255096435546875, -0.20708465576171875, -0.18865966796875, -0.17023468017578125, -0.1518096923828125, -0.13338470458984375, -0.114959716796875, -0.09653472900390625, -0.0781097412109375, -0.05968475341796875, -0.041259765625, -0.02283477783203125, -0.0044097900390625, 0.01401519775390625, 0.032440185546875, 0.05086517333984375, 0.0692901611328125, 0.08771514892578125, 0.10614013671875, 0.12456512451171875, 0.1429901123046875, 0.16141510009765625, 0.179840087890625, 0.19826507568359375, 0.2166900634765625, 0.23511505126953125, 0.2535400390625, 0.27196502685546875, 0.2903900146484375, 0.30881500244140625, 0.327239990234375, 0.34566497802734375, 0.3640899658203125, 0.38251495361328125, 0.40093994140625, 0.41936492919921875, 0.4377899169921875, 0.45621490478515625, 0.474639892578125, 0.49306488037109375, 0.5114898681640625, 0.5299148559570312, 0.54833984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 11.0, 24.0, 27.0, 49.0, 48.0, 47.0, 71.0, 113.0, 169.0, 235.0, 297.0, 473.0, 709.0, 1247.0, 2608.0, 8269.0, 42291.0, 324050.0, 589704.0, 60451.0, 10541.0, 3255.0, 1362.0, 770.0, 510.0, 347.0, 228.0, 178.0, 118.0, 92.0, 60.0, 50.0, 47.0, 23.0, 22.0, 17.0, 5.0, 2.0, 8.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.216796875, -2.15362548828125, -2.0904541015625, -2.02728271484375, -1.964111328125, -1.90093994140625, -1.8377685546875, -1.77459716796875, -1.71142578125, -1.64825439453125, -1.5850830078125, -1.52191162109375, -1.458740234375, -1.39556884765625, -1.3323974609375, -1.26922607421875, -1.2060546875, -1.14288330078125, -1.0797119140625, -1.01654052734375, -0.953369140625, -0.89019775390625, -0.8270263671875, -0.76385498046875, -0.70068359375, -0.63751220703125, -0.5743408203125, -0.51116943359375, -0.447998046875, -0.38482666015625, -0.3216552734375, -0.25848388671875, -0.1953125, -0.13214111328125, -0.0689697265625, -0.00579833984375, 0.057373046875, 0.12054443359375, 0.1837158203125, 0.24688720703125, 0.31005859375, 0.37322998046875, 0.4364013671875, 0.49957275390625, 0.562744140625, 0.62591552734375, 0.6890869140625, 0.75225830078125, 0.8154296875, 0.87860107421875, 0.9417724609375, 1.00494384765625, 1.068115234375, 1.13128662109375, 1.1944580078125, 1.25762939453125, 1.32080078125, 1.38397216796875, 1.4471435546875, 1.51031494140625, 1.573486328125, 1.63665771484375, 1.6998291015625, 1.76300048828125, 1.826171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 9.0, 11.0, 14.0, 20.0, 12.0, 22.0, 28.0, 27.0, 26.0, 35.0, 47.0, 47.0, 54.0, 50.0, 53.0, 51.0, 43.0, 54.0, 47.0, 35.0, 45.0, 34.0, 30.0, 29.0, 22.0, 21.0, 15.0, 18.0, 20.0, 12.0, 6.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.572265625, -2.49383544921875, -2.4154052734375, -2.33697509765625, -2.258544921875, -2.18011474609375, -2.1016845703125, -2.02325439453125, -1.94482421875, -1.86639404296875, -1.7879638671875, -1.70953369140625, -1.631103515625, -1.55267333984375, -1.4742431640625, -1.39581298828125, -1.3173828125, -1.23895263671875, -1.1605224609375, -1.08209228515625, -1.003662109375, -0.92523193359375, -0.8468017578125, -0.76837158203125, -0.68994140625, -0.61151123046875, -0.5330810546875, -0.45465087890625, -0.376220703125, -0.29779052734375, -0.2193603515625, -0.14093017578125, -0.0625, 0.01593017578125, 0.0943603515625, 0.17279052734375, 0.251220703125, 0.32965087890625, 0.4080810546875, 0.48651123046875, 0.56494140625, 0.64337158203125, 0.7218017578125, 0.80023193359375, 0.878662109375, 0.95709228515625, 1.0355224609375, 1.11395263671875, 1.1923828125, 1.27081298828125, 1.3492431640625, 1.42767333984375, 1.506103515625, 1.58453369140625, 1.6629638671875, 1.74139404296875, 1.81982421875, 1.89825439453125, 1.9766845703125, 2.05511474609375, 2.133544921875, 2.21197509765625, 2.2904052734375, 2.36883544921875, 2.447265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 8.0, 7.0, 11.0, 13.0, 16.0, 33.0, 52.0, 67.0, 114.0, 170.0, 251.0, 474.0, 772.0, 1543.0, 3033.0, 6460.0, 18591.0, 86268.0, 694176.0, 188944.0, 29762.0, 9516.0, 3901.0, 1900.0, 970.0, 557.0, 340.0, 206.0, 124.0, 87.0, 53.0, 42.0, 24.0, 18.0, 14.0, 10.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7421875, -0.72015380859375, -0.6981201171875, -0.67608642578125, -0.654052734375, -0.63201904296875, -0.6099853515625, -0.58795166015625, -0.56591796875, -0.54388427734375, -0.5218505859375, -0.49981689453125, -0.477783203125, -0.45574951171875, -0.4337158203125, -0.41168212890625, -0.3896484375, -0.36761474609375, -0.3455810546875, -0.32354736328125, -0.301513671875, -0.27947998046875, -0.2574462890625, -0.23541259765625, -0.21337890625, -0.19134521484375, -0.1693115234375, -0.14727783203125, -0.125244140625, -0.10321044921875, -0.0811767578125, -0.05914306640625, -0.037109375, -0.01507568359375, 0.0069580078125, 0.02899169921875, 0.051025390625, 0.07305908203125, 0.0950927734375, 0.11712646484375, 0.13916015625, 0.16119384765625, 0.1832275390625, 0.20526123046875, 0.227294921875, 0.24932861328125, 0.2713623046875, 0.29339599609375, 0.3154296875, 0.33746337890625, 0.3594970703125, 0.38153076171875, 0.403564453125, 0.42559814453125, 0.4476318359375, 0.46966552734375, 0.49169921875, 0.51373291015625, 0.5357666015625, 0.55780029296875, 0.579833984375, 0.60186767578125, 0.6239013671875, 0.64593505859375, 0.66796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 6.0, 8.0, 21.0, 42.0, 164.0, 401.0, 203.0, 64.0, 25.0, 16.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004868507385253906, -0.00046428292989730835, -0.0004417151212692261, -0.0004191473126411438, -0.0003965795040130615, -0.00037401169538497925, -0.00035144388675689697, -0.0003288760781288147, -0.0003063082695007324, -0.00028374046087265015, -0.00026117265224456787, -0.0002386048436164856, -0.00021603703498840332, -0.00019346922636032104, -0.00017090141773223877, -0.0001483336091041565, -0.00012576580047607422, -0.00010319799184799194, -8.063018321990967e-05, -5.806237459182739e-05, -3.549456596374512e-05, -1.2926757335662842e-05, 9.641051292419434e-06, 3.220885992050171e-05, 5.4776668548583984e-05, 7.734447717666626e-05, 9.991228580474854e-05, 0.0001224800944328308, 0.00014504790306091309, 0.00016761571168899536, 0.00019018352031707764, 0.0002127513289451599, 0.0002353191375732422, 0.00025788694620132446, 0.00028045475482940674, 0.000303022563457489, 0.0003255903720855713, 0.00034815818071365356, 0.00037072598934173584, 0.0003932937979698181, 0.0004158616065979004, 0.00043842941522598267, 0.00046099722385406494, 0.0004835650324821472, 0.0005061328411102295, 0.0005287006497383118, 0.000551268458366394, 0.0005738362669944763, 0.0005964040756225586, 0.0006189718842506409, 0.0006415396928787231, 0.0006641075015068054, 0.0006866753101348877, 0.00070924311876297, 0.0007318109273910522, 0.0007543787360191345, 0.0007769465446472168, 0.0007995143532752991, 0.0008220821619033813, 0.0008446499705314636, 0.0008672177791595459, 0.0008897855877876282, 0.0009123533964157104, 0.0009349212050437927, 0.000957489013671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 8.0, 10.0, 26.0, 27.0, 65.0, 105.0, 247.0, 504.0, 1648.0, 8827.0, 237929.0, 779079.0, 16374.0, 2425.0, 699.0, 284.0, 121.0, 74.0, 42.0, 20.0, 8.0, 13.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.7332763671875, -1.685302734375, -1.6373291015625, -1.58935546875, -1.5413818359375, -1.493408203125, -1.4454345703125, -1.3974609375, -1.3494873046875, -1.301513671875, -1.2535400390625, -1.20556640625, -1.1575927734375, -1.109619140625, -1.0616455078125, -1.013671875, -0.9656982421875, -0.917724609375, -0.8697509765625, -0.82177734375, -0.7738037109375, -0.725830078125, -0.6778564453125, -0.6298828125, -0.5819091796875, -0.533935546875, -0.4859619140625, -0.43798828125, -0.3900146484375, -0.342041015625, -0.2940673828125, -0.24609375, -0.1981201171875, -0.150146484375, -0.1021728515625, -0.05419921875, -0.0062255859375, 0.041748046875, 0.0897216796875, 0.1376953125, 0.1856689453125, 0.233642578125, 0.2816162109375, 0.32958984375, 0.3775634765625, 0.425537109375, 0.4735107421875, 0.521484375, 0.5694580078125, 0.617431640625, 0.6654052734375, 0.71337890625, 0.7613525390625, 0.809326171875, 0.8572998046875, 0.9052734375, 0.9532470703125, 1.001220703125, 1.0491943359375, 1.09716796875, 1.1451416015625, 1.193115234375, 1.2410888671875, 1.2890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 9.0, 3.0, 6.0, 7.0, 11.0, 13.0, 21.0, 20.0, 22.0, 31.0, 36.0, 47.0, 62.0, 44.0, 60.0, 63.0, 71.0, 75.0, 60.0, 52.0, 45.0, 34.0, 28.0, 21.0, 37.0, 17.0, 11.0, 13.0, 13.0, 11.0, 8.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.494384765625, -0.47887420654296875, -0.4633636474609375, -0.44785308837890625, -0.432342529296875, -0.41683197021484375, -0.4013214111328125, -0.38581085205078125, -0.37030029296875, -0.35478973388671875, -0.3392791748046875, -0.32376861572265625, -0.308258056640625, -0.29274749755859375, -0.2772369384765625, -0.26172637939453125, -0.2462158203125, -0.23070526123046875, -0.2151947021484375, -0.19968414306640625, -0.184173583984375, -0.16866302490234375, -0.1531524658203125, -0.13764190673828125, -0.12213134765625, -0.10662078857421875, -0.0911102294921875, -0.07559967041015625, -0.060089111328125, -0.04457855224609375, -0.0290679931640625, -0.01355743408203125, 0.001953125, 0.01746368408203125, 0.0329742431640625, 0.04848480224609375, 0.063995361328125, 0.07950592041015625, 0.0950164794921875, 0.11052703857421875, 0.12603759765625, 0.14154815673828125, 0.1570587158203125, 0.17256927490234375, 0.188079833984375, 0.20359039306640625, 0.2191009521484375, 0.23461151123046875, 0.2501220703125, 0.26563262939453125, 0.2811431884765625, 0.29665374755859375, 0.312164306640625, 0.32767486572265625, 0.3431854248046875, 0.35869598388671875, 0.37420654296875, 0.38971710205078125, 0.4052276611328125, 0.42073822021484375, 0.436248779296875, 0.45175933837890625, 0.4672698974609375, 0.48278045654296875, 0.498291015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 20.0, 51.0, 155.0, 334.0, 275.0, 102.0, 32.0, 8.0, 12.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.361270904541016, -33.52109146118164, -32.680908203125, -31.840726852416992, -31.000545501708984, -30.160364151000977, -29.32018280029297, -28.480003356933594, -27.639820098876953, -26.799638748168945, -25.959457397460938, -25.11927604675293, -24.279094696044922, -23.438913345336914, -22.598731994628906, -21.75855255126953, -20.918371200561523, -20.078189849853516, -19.238008499145508, -18.3978271484375, -17.557645797729492, -16.717464447021484, -15.877284049987793, -15.037102699279785, -14.196921348571777, -13.35673999786377, -12.516558647155762, -11.67637825012207, -10.836196899414062, -9.996015548706055, -9.155834197998047, -8.315652847290039, -7.475473403930664, -6.635292053222656, -5.795110702514648, -4.954929828643799, -4.114748477935791, -3.274567127227783, -2.4343862533569336, -1.5942049026489258, -0.754023551940918, 0.08615767955780029, 0.9263389110565186, 1.7665200233459473, 2.606701374053955, 3.446882724761963, 4.2870635986328125, 5.12724494934082, 5.967426300048828, 6.807607650756836, 7.647789001464844, 8.487970352172852, 9.32815170288086, 10.168333053588867, 11.008513450622559, 11.848694801330566, 12.688876152038574, 13.529057502746582, 14.36923885345459, 15.209419250488281, 16.04960060119629, 16.889781951904297, 17.729963302612305, 18.570144653320312, 19.41032600402832]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 8.0, 9.0, 16.0, 16.0, 12.0, 20.0, 14.0, 34.0, 34.0, 25.0, 31.0, 32.0, 34.0, 40.0, 47.0, 72.0, 82.0, 57.0, 49.0, 58.0, 26.0, 32.0, 28.0, 28.0, 25.0, 18.0, 27.0, 19.0, 21.0, 13.0, 10.0, 15.0, 8.0, 6.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.247876167297363, -7.950588703155518, -7.65330171585083, -7.356014251708984, -7.058727264404297, -6.761439800262451, -6.4641523361206055, -6.166865348815918, -5.869577884674072, -5.572290420532227, -5.275003433227539, -4.977715969085693, -4.680428504943848, -4.38314151763916, -4.0858540534973145, -3.788566827774048, -3.4912796020507812, -3.1939923763275146, -2.896705150604248, -2.5994176864624023, -2.3021304607391357, -2.004843235015869, -1.707555890083313, -1.4102685451507568, -1.1129813194274902, -0.8156940340995789, -0.5184067487716675, -0.2211194634437561, 0.07616782188415527, 0.3734550476074219, 0.670742392539978, 0.9680297374725342, 1.2653179168701172, 1.5626051425933838, 1.85989248752594, 2.157179832458496, 2.4544670581817627, 2.7517542839050293, 3.049041748046875, 3.3463289737701416, 3.643616199493408, 3.940903425216675, 4.238190650939941, 4.535478115081787, 4.832765579223633, 5.13005256652832, 5.427340030670166, 5.724627494812012, 6.021914482116699, 6.319201946258545, 6.616488933563232, 6.913776397705078, 7.211063385009766, 7.508350849151611, 7.805638313293457, 8.102925300598145, 8.400213241577148, 8.697500228881836, 8.99478816986084, 9.292075157165527, 9.589362144470215, 9.886650085449219, 10.183937072753906, 10.481224060058594, 10.778511047363281]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 14.0, 12.0, 16.0, 24.0, 27.0, 46.0, 48.0, 100.0, 146.0, 217.0, 409.0, 763.0, 1796.0, 5694.0, 27704.0, 366074.0, 2889491.0, 834415.0, 54204.0, 8441.0, 2437.0, 992.0, 457.0, 256.0, 164.0, 105.0, 75.0, 45.0, 33.0, 24.0, 18.0, 13.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84375, -0.813232421875, -0.78271484375, -0.752197265625, -0.7216796875, -0.691162109375, -0.66064453125, -0.630126953125, -0.599609375, -0.569091796875, -0.53857421875, -0.508056640625, -0.4775390625, -0.447021484375, -0.41650390625, -0.385986328125, -0.35546875, -0.324951171875, -0.29443359375, -0.263916015625, -0.2333984375, -0.202880859375, -0.17236328125, -0.141845703125, -0.111328125, -0.080810546875, -0.05029296875, -0.019775390625, 0.0107421875, 0.041259765625, 0.07177734375, 0.102294921875, 0.1328125, 0.163330078125, 0.19384765625, 0.224365234375, 0.2548828125, 0.285400390625, 0.31591796875, 0.346435546875, 0.376953125, 0.407470703125, 0.43798828125, 0.468505859375, 0.4990234375, 0.529541015625, 0.56005859375, 0.590576171875, 0.62109375, 0.651611328125, 0.68212890625, 0.712646484375, 0.7431640625, 0.773681640625, 0.80419921875, 0.834716796875, 0.865234375, 0.895751953125, 0.92626953125, 0.956787109375, 0.9873046875, 1.017822265625, 1.04833984375, 1.078857421875, 1.109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 7.0, 12.0, 9.0, 15.0, 18.0, 17.0, 11.0, 24.0, 29.0, 27.0, 26.0, 29.0, 46.0, 34.0, 47.0, 37.0, 49.0, 48.0, 46.0, 43.0, 51.0, 30.0, 38.0, 35.0, 38.0, 24.0, 27.0, 22.0, 23.0, 32.0, 20.0, 18.0, 12.0, 8.0, 6.0, 3.0, 9.0, 6.0, 10.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58984375, -0.5720291137695312, -0.5542144775390625, -0.5363998413085938, -0.518585205078125, -0.5007705688476562, -0.4829559326171875, -0.46514129638671875, -0.44732666015625, -0.42951202392578125, -0.4116973876953125, -0.39388275146484375, -0.376068115234375, -0.35825347900390625, -0.3404388427734375, -0.32262420654296875, -0.3048095703125, -0.28699493408203125, -0.2691802978515625, -0.25136566162109375, -0.233551025390625, -0.21573638916015625, -0.1979217529296875, -0.18010711669921875, -0.16229248046875, -0.14447784423828125, -0.1266632080078125, -0.10884857177734375, -0.091033935546875, -0.07321929931640625, -0.0554046630859375, -0.03759002685546875, -0.019775390625, -0.00196075439453125, 0.0158538818359375, 0.03366851806640625, 0.051483154296875, 0.06929779052734375, 0.0871124267578125, 0.10492706298828125, 0.12274169921875, 0.14055633544921875, 0.1583709716796875, 0.17618560791015625, 0.194000244140625, 0.21181488037109375, 0.2296295166015625, 0.24744415283203125, 0.2652587890625, 0.28307342529296875, 0.3008880615234375, 0.31870269775390625, 0.336517333984375, 0.35433197021484375, 0.3721466064453125, 0.38996124267578125, 0.40777587890625, 0.42559051513671875, 0.4434051513671875, 0.46121978759765625, 0.479034423828125, 0.49684906005859375, 0.5146636962890625, 0.5324783325195312, 0.55029296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 17.0, 26.0, 52.0, 85.0, 145.0, 341.0, 941.0, 3757.0, 330410.0, 3849428.0, 7079.0, 1142.0, 441.0, 209.0, 91.0, 44.0, 28.0, 14.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.243072509765625, -4.11505126953125, -3.987030029296875, -3.8590087890625, -3.730987548828125, -3.60296630859375, -3.474945068359375, -3.346923828125, -3.218902587890625, -3.09088134765625, -2.962860107421875, -2.8348388671875, -2.706817626953125, -2.57879638671875, -2.450775146484375, -2.32275390625, -2.194732666015625, -2.06671142578125, -1.938690185546875, -1.8106689453125, -1.682647705078125, -1.55462646484375, -1.426605224609375, -1.298583984375, -1.170562744140625, -1.04254150390625, -0.914520263671875, -0.7864990234375, -0.658477783203125, -0.53045654296875, -0.402435302734375, -0.2744140625, -0.146392822265625, -0.01837158203125, 0.109649658203125, 0.2376708984375, 0.365692138671875, 0.49371337890625, 0.621734619140625, 0.749755859375, 0.877777099609375, 1.00579833984375, 1.133819580078125, 1.2618408203125, 1.389862060546875, 1.51788330078125, 1.645904541015625, 1.77392578125, 1.901947021484375, 2.02996826171875, 2.157989501953125, 2.2860107421875, 2.414031982421875, 2.54205322265625, 2.670074462890625, 2.798095703125, 2.926116943359375, 3.05413818359375, 3.182159423828125, 3.3101806640625, 3.438201904296875, 3.56622314453125, 3.694244384765625, 3.822265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 20.0, 62.0, 179.0, 843.0, 2180.0, 595.0, 120.0, 42.0, 19.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.204864501953125, -3.08355712890625, -2.962249755859375, -2.8409423828125, -2.719635009765625, -2.59832763671875, -2.477020263671875, -2.355712890625, -2.234405517578125, -2.11309814453125, -1.991790771484375, -1.8704833984375, -1.749176025390625, -1.62786865234375, -1.506561279296875, -1.38525390625, -1.263946533203125, -1.14263916015625, -1.021331787109375, -0.9000244140625, -0.778717041015625, -0.65740966796875, -0.536102294921875, -0.414794921875, -0.293487548828125, -0.17218017578125, -0.050872802734375, 0.0704345703125, 0.191741943359375, 0.31304931640625, 0.434356689453125, 0.5556640625, 0.676971435546875, 0.79827880859375, 0.919586181640625, 1.0408935546875, 1.162200927734375, 1.28350830078125, 1.404815673828125, 1.526123046875, 1.647430419921875, 1.76873779296875, 1.890045166015625, 2.0113525390625, 2.132659912109375, 2.25396728515625, 2.375274658203125, 2.49658203125, 2.617889404296875, 2.73919677734375, 2.860504150390625, 2.9818115234375, 3.103118896484375, 3.22442626953125, 3.345733642578125, 3.467041015625, 3.588348388671875, 3.70965576171875, 3.830963134765625, 3.9522705078125, 4.073577880859375, 4.19488525390625, 4.316192626953125, 4.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 19.0, 76.0, 518.0, 316.0, 50.0, 13.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8726806640625, -36.564170837402344, -35.25566482543945, -33.9471549987793, -32.63864517211914, -31.33013916015625, -30.021629333496094, -28.71312141418457, -27.404613494873047, -26.096105575561523, -24.787595748901367, -23.479087829589844, -22.17057991027832, -20.862071990966797, -19.55356216430664, -18.245054244995117, -16.93654441833496, -15.628035545349121, -14.319527626037598, -13.011018753051758, -11.702510833740234, -10.394001960754395, -9.085493087768555, -7.776985168457031, -6.468476295471191, -5.15996789932251, -3.851459264755249, -2.5429506301879883, -1.2344422340393066, 0.074066162109375, 1.3825750350952148, 2.6910829544067383, 3.999591827392578, 5.30810022354126, 6.616608619689941, 7.925117492675781, 9.233625411987305, 10.542134284973145, 11.850643157958984, 13.159151077270508, 14.467659950256348, 15.776168823242188, 17.08467674255371, 18.393184661865234, 19.70169448852539, 21.010202407836914, 22.318710327148438, 23.627220153808594, 24.935728073120117, 26.24423599243164, 27.552745819091797, 28.86125373840332, 30.169761657714844, 31.478271484375, 32.786781311035156, 34.09528732299805, 35.4037971496582, 36.71230697631836, 38.02081298828125, 39.329322814941406, 40.63783264160156, 41.94633865356445, 43.25484848022461, 44.5633544921875, 45.871864318847656]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 8.0, 5.0, 10.0, 15.0, 19.0, 15.0, 30.0, 53.0, 58.0, 54.0, 69.0, 71.0, 66.0, 88.0, 82.0, 72.0, 72.0, 40.0, 53.0, 37.0, 24.0, 25.0, 13.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.154629707336426, -11.825424194335938, -11.496219635009766, -11.167014122009277, -10.837809562683105, -10.508604049682617, -10.179399490356445, -9.850193977355957, -9.520989418029785, -9.191783905029297, -8.862579345703125, -8.533373832702637, -8.204169273376465, -7.874964237213135, -7.545759201049805, -7.216553688049316, -6.887348651885986, -6.558143615722656, -6.228938579559326, -5.899733543395996, -5.570528507232666, -5.241323471069336, -4.912117958068848, -4.582913398742676, -4.2537078857421875, -3.9245028495788574, -3.5952978134155273, -3.2660927772521973, -2.936887741088867, -2.607682704925537, -2.278477430343628, -1.9492723941802979, -1.6200675964355469, -1.2908625602722168, -0.9616574645042419, -0.6324523687362671, -0.303247332572937, 0.025957703590393066, 0.3551628589630127, 0.6843678951263428, 1.0135729312896729, 1.342777967453003, 1.671983003616333, 2.001188278198242, 2.3303933143615723, 2.6595983505249023, 2.9888033866882324, 3.3180084228515625, 3.6472134590148926, 3.9764184951782227, 4.305623531341553, 4.634828567504883, 4.964033603668213, 5.293238639831543, 5.622444152832031, 5.951648712158203, 6.280854225158691, 6.6100592613220215, 6.939264297485352, 7.268469333648682, 7.597674369812012, 7.926879405975342, 8.256084442138672, 8.58528995513916, 8.914494514465332]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 14.0, 17.0, 33.0, 47.0, 69.0, 99.0, 133.0, 204.0, 324.0, 540.0, 807.0, 1376.0, 2203.0, 3802.0, 6388.0, 11755.0, 21255.0, 39957.0, 73637.0, 132276.0, 205250.0, 215048.0, 148445.0, 83963.0, 44925.0, 24604.0, 13351.0, 7380.0, 4181.0, 2481.0, 1449.0, 875.0, 561.0, 374.0, 273.0, 148.0, 96.0, 69.0, 45.0, 33.0, 14.0, 9.0, 12.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5776214599609375, -0.559051513671875, -0.5404815673828125, -0.52191162109375, -0.5033416748046875, -0.484771728515625, -0.4662017822265625, -0.4476318359375, -0.4290618896484375, -0.410491943359375, -0.3919219970703125, -0.37335205078125, -0.3547821044921875, -0.336212158203125, -0.3176422119140625, -0.299072265625, -0.2805023193359375, -0.261932373046875, -0.2433624267578125, -0.22479248046875, -0.2062225341796875, -0.187652587890625, -0.1690826416015625, -0.1505126953125, -0.1319427490234375, -0.113372802734375, -0.0948028564453125, -0.07623291015625, -0.0576629638671875, -0.039093017578125, -0.0205230712890625, -0.001953125, 0.0166168212890625, 0.035186767578125, 0.0537567138671875, 0.07232666015625, 0.0908966064453125, 0.109466552734375, 0.1280364990234375, 0.1466064453125, 0.1651763916015625, 0.183746337890625, 0.2023162841796875, 0.22088623046875, 0.2394561767578125, 0.258026123046875, 0.2765960693359375, 0.295166015625, 0.3137359619140625, 0.332305908203125, 0.3508758544921875, 0.36944580078125, 0.3880157470703125, 0.406585693359375, 0.4251556396484375, 0.4437255859375, 0.4622955322265625, 0.480865478515625, 0.4994354248046875, 0.51800537109375, 0.5365753173828125, 0.555145263671875, 0.5737152099609375, 0.59228515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 23.0, 26.0, 25.0, 33.0, 36.0, 39.0, 35.0, 50.0, 49.0, 49.0, 69.0, 33.0, 47.0, 51.0, 38.0, 42.0, 37.0, 37.0, 27.0, 30.0, 35.0, 25.0, 21.0, 14.0, 16.0, 15.0, 9.0, 4.0, 8.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5880661010742188, -0.5667572021484375, -0.5454483032226562, -0.524139404296875, -0.5028305053710938, -0.4815216064453125, -0.46021270751953125, -0.43890380859375, -0.41759490966796875, -0.3962860107421875, -0.37497711181640625, -0.353668212890625, -0.33235931396484375, -0.3110504150390625, -0.28974151611328125, -0.2684326171875, -0.24712371826171875, -0.2258148193359375, -0.20450592041015625, -0.183197021484375, -0.16188812255859375, -0.1405792236328125, -0.11927032470703125, -0.09796142578125, -0.07665252685546875, -0.0553436279296875, -0.03403472900390625, -0.012725830078125, 0.00858306884765625, 0.0298919677734375, 0.05120086669921875, 0.072509765625, 0.09381866455078125, 0.1151275634765625, 0.13643646240234375, 0.157745361328125, 0.17905426025390625, 0.2003631591796875, 0.22167205810546875, 0.24298095703125, 0.26428985595703125, 0.2855987548828125, 0.30690765380859375, 0.328216552734375, 0.34952545166015625, 0.3708343505859375, 0.39214324951171875, 0.4134521484375, 0.43476104736328125, 0.4560699462890625, 0.47737884521484375, 0.498687744140625, 0.5199966430664062, 0.5413055419921875, 0.5626144409179688, 0.58392333984375, 0.6052322387695312, 0.6265411376953125, 0.6478500366210938, 0.669158935546875, 0.6904678344726562, 0.7117767333984375, 0.7330856323242188, 0.75439453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 13.0, 4.0, 16.0, 15.0, 21.0, 25.0, 19.0, 51.0, 44.0, 76.0, 100.0, 151.0, 210.0, 346.0, 595.0, 1274.0, 3341.0, 10992.0, 44089.0, 203993.0, 601373.0, 138409.0, 30312.0, 7985.0, 2550.0, 1047.0, 490.0, 305.0, 204.0, 123.0, 121.0, 58.0, 40.0, 40.0, 25.0, 28.0, 23.0, 17.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.61328125, -1.56634521484375, -1.5194091796875, -1.47247314453125, -1.425537109375, -1.37860107421875, -1.3316650390625, -1.28472900390625, -1.23779296875, -1.19085693359375, -1.1439208984375, -1.09698486328125, -1.050048828125, -1.00311279296875, -0.9561767578125, -0.90924072265625, -0.8623046875, -0.81536865234375, -0.7684326171875, -0.72149658203125, -0.674560546875, -0.62762451171875, -0.5806884765625, -0.53375244140625, -0.48681640625, -0.43988037109375, -0.3929443359375, -0.34600830078125, -0.299072265625, -0.25213623046875, -0.2052001953125, -0.15826416015625, -0.111328125, -0.06439208984375, -0.0174560546875, 0.02947998046875, 0.076416015625, 0.12335205078125, 0.1702880859375, 0.21722412109375, 0.26416015625, 0.31109619140625, 0.3580322265625, 0.40496826171875, 0.451904296875, 0.49884033203125, 0.5457763671875, 0.59271240234375, 0.6396484375, 0.68658447265625, 0.7335205078125, 0.78045654296875, 0.827392578125, 0.87432861328125, 0.9212646484375, 0.96820068359375, 1.01513671875, 1.06207275390625, 1.1090087890625, 1.15594482421875, 1.202880859375, 1.24981689453125, 1.2967529296875, 1.34368896484375, 1.390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 7.0, 6.0, 4.0, 7.0, 9.0, 17.0, 15.0, 17.0, 22.0, 19.0, 31.0, 27.0, 35.0, 48.0, 44.0, 38.0, 39.0, 44.0, 44.0, 62.0, 50.0, 54.0, 44.0, 49.0, 42.0, 52.0, 31.0, 34.0, 19.0, 25.0, 15.0, 15.0, 12.0, 4.0, 7.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.338134765625, -2.26025390625, -2.182373046875, -2.1044921875, -2.026611328125, -1.94873046875, -1.870849609375, -1.79296875, -1.715087890625, -1.63720703125, -1.559326171875, -1.4814453125, -1.403564453125, -1.32568359375, -1.247802734375, -1.169921875, -1.092041015625, -1.01416015625, -0.936279296875, -0.8583984375, -0.780517578125, -0.70263671875, -0.624755859375, -0.546875, -0.468994140625, -0.39111328125, -0.313232421875, -0.2353515625, -0.157470703125, -0.07958984375, -0.001708984375, 0.076171875, 0.154052734375, 0.23193359375, 0.309814453125, 0.3876953125, 0.465576171875, 0.54345703125, 0.621337890625, 0.69921875, 0.777099609375, 0.85498046875, 0.932861328125, 1.0107421875, 1.088623046875, 1.16650390625, 1.244384765625, 1.322265625, 1.400146484375, 1.47802734375, 1.555908203125, 1.6337890625, 1.711669921875, 1.78955078125, 1.867431640625, 1.9453125, 2.023193359375, 2.10107421875, 2.178955078125, 2.2568359375, 2.334716796875, 2.41259765625, 2.490478515625, 2.568359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 6.0, 13.0, 18.0, 39.0, 77.0, 103.0, 164.0, 349.0, 659.0, 1552.0, 3636.0, 11490.0, 40641.0, 177124.0, 623349.0, 140857.0, 32800.0, 9559.0, 3360.0, 1372.0, 621.0, 343.0, 171.0, 106.0, 46.0, 32.0, 24.0, 8.0, 8.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52099609375, -0.5054092407226562, -0.4898223876953125, -0.47423553466796875, -0.458648681640625, -0.44306182861328125, -0.4274749755859375, -0.41188812255859375, -0.39630126953125, -0.38071441650390625, -0.3651275634765625, -0.34954071044921875, -0.333953857421875, -0.31836700439453125, -0.3027801513671875, -0.28719329833984375, -0.2716064453125, -0.25601959228515625, -0.2404327392578125, -0.22484588623046875, -0.209259033203125, -0.19367218017578125, -0.1780853271484375, -0.16249847412109375, -0.14691162109375, -0.13132476806640625, -0.1157379150390625, -0.10015106201171875, -0.084564208984375, -0.06897735595703125, -0.0533905029296875, -0.03780364990234375, -0.022216796875, -0.00662994384765625, 0.0089569091796875, 0.02454376220703125, 0.040130615234375, 0.05571746826171875, 0.0713043212890625, 0.08689117431640625, 0.10247802734375, 0.11806488037109375, 0.1336517333984375, 0.14923858642578125, 0.164825439453125, 0.18041229248046875, 0.1959991455078125, 0.21158599853515625, 0.2271728515625, 0.24275970458984375, 0.2583465576171875, 0.27393341064453125, 0.289520263671875, 0.30510711669921875, 0.3206939697265625, 0.33628082275390625, 0.35186767578125, 0.36745452880859375, 0.3830413818359375, 0.39862823486328125, 0.414215087890625, 0.42980194091796875, 0.4453887939453125, 0.46097564697265625, 0.4765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 13.0, 20.0, 35.0, 34.0, 55.0, 77.0, 120.0, 145.0, 131.0, 109.0, 89.0, 38.0, 31.0, 18.0, 19.0, 7.0, 9.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015581771731376648, -0.00014831870794296265, -0.0001408196985721588, -0.00013332068920135498, -0.00012582167983055115, -0.00011832267045974731, -0.00011082366108894348, -0.00010332465171813965, -9.582564234733582e-05, -8.832663297653198e-05, -8.082762360572815e-05, -7.332861423492432e-05, -6.582960486412048e-05, -5.833059549331665e-05, -5.083158612251282e-05, -4.3332576751708984e-05, -3.583356738090515e-05, -2.833455801010132e-05, -2.0835548639297485e-05, -1.3336539268493652e-05, -5.837529897689819e-06, 1.6614794731140137e-06, 9.160488843917847e-06, 1.665949821472168e-05, 2.4158507585525513e-05, 3.1657516956329346e-05, 3.915652632713318e-05, 4.665553569793701e-05, 5.4154545068740845e-05, 6.165355443954468e-05, 6.915256381034851e-05, 7.665157318115234e-05, 8.415058255195618e-05, 9.164959192276001e-05, 9.914860129356384e-05, 0.00010664761066436768, 0.00011414662003517151, 0.00012164562940597534, 0.00012914463877677917, 0.000136643648147583, 0.00014414265751838684, 0.00015164166688919067, 0.0001591406762599945, 0.00016663968563079834, 0.00017413869500160217, 0.000181637704372406, 0.00018913671374320984, 0.00019663572311401367, 0.0002041347324848175, 0.00021163374185562134, 0.00021913275122642517, 0.000226631760597229, 0.00023413076996803284, 0.00024162977933883667, 0.0002491287887096405, 0.00025662779808044434, 0.00026412680745124817, 0.000271625816822052, 0.00027912482619285583, 0.00028662383556365967, 0.0002941228449344635, 0.00030162185430526733, 0.00030912086367607117, 0.000316619873046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 14.0, 19.0, 33.0, 46.0, 78.0, 111.0, 223.0, 502.0, 1108.0, 3182.0, 11661.0, 58034.0, 343031.0, 543389.0, 68014.0, 13261.0, 3539.0, 1196.0, 495.0, 238.0, 132.0, 78.0, 52.0, 28.0, 21.0, 22.0, 13.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5162582397460938, -0.4978485107421875, -0.47943878173828125, -0.461029052734375, -0.44261932373046875, -0.4242095947265625, -0.40579986572265625, -0.38739013671875, -0.36898040771484375, -0.3505706787109375, -0.33216094970703125, -0.313751220703125, -0.29534149169921875, -0.2769317626953125, -0.25852203369140625, -0.2401123046875, -0.22170257568359375, -0.2032928466796875, -0.18488311767578125, -0.166473388671875, -0.14806365966796875, -0.1296539306640625, -0.11124420166015625, -0.09283447265625, -0.07442474365234375, -0.0560150146484375, -0.03760528564453125, -0.019195556640625, -0.00078582763671875, 0.0176239013671875, 0.03603363037109375, 0.054443359375, 0.07285308837890625, 0.0912628173828125, 0.10967254638671875, 0.128082275390625, 0.14649200439453125, 0.1649017333984375, 0.18331146240234375, 0.20172119140625, 0.22013092041015625, 0.2385406494140625, 0.25695037841796875, 0.275360107421875, 0.29376983642578125, 0.3121795654296875, 0.33058929443359375, 0.3489990234375, 0.36740875244140625, 0.3858184814453125, 0.40422821044921875, 0.422637939453125, 0.44104766845703125, 0.4594573974609375, 0.47786712646484375, 0.49627685546875, 0.5146865844726562, 0.5330963134765625, 0.5515060424804688, 0.569915771484375, 0.5883255004882812, 0.6067352294921875, 0.6251449584960938, 0.6435546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 11.0, 11.0, 15.0, 29.0, 27.0, 29.0, 42.0, 39.0, 73.0, 83.0, 91.0, 91.0, 80.0, 77.0, 53.0, 66.0, 41.0, 29.0, 27.0, 19.0, 18.0, 12.0, 9.0, 4.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.6296157836914062, -0.6107940673828125, -0.5919723510742188, -0.573150634765625, -0.5543289184570312, -0.5355072021484375, -0.5166854858398438, -0.49786376953125, -0.47904205322265625, -0.4602203369140625, -0.44139862060546875, -0.422576904296875, -0.40375518798828125, -0.3849334716796875, -0.36611175537109375, -0.3472900390625, -0.32846832275390625, -0.3096466064453125, -0.29082489013671875, -0.272003173828125, -0.25318145751953125, -0.2343597412109375, -0.21553802490234375, -0.19671630859375, -0.17789459228515625, -0.1590728759765625, -0.14025115966796875, -0.121429443359375, -0.10260772705078125, -0.0837860107421875, -0.06496429443359375, -0.046142578125, -0.02732086181640625, -0.0084991455078125, 0.01032257080078125, 0.029144287109375, 0.04796600341796875, 0.0667877197265625, 0.08560943603515625, 0.10443115234375, 0.12325286865234375, 0.1420745849609375, 0.16089630126953125, 0.179718017578125, 0.19853973388671875, 0.2173614501953125, 0.23618316650390625, 0.2550048828125, 0.27382659912109375, 0.2926483154296875, 0.31147003173828125, 0.330291748046875, 0.34911346435546875, 0.3679351806640625, 0.38675689697265625, 0.40557861328125, 0.42440032958984375, 0.4432220458984375, 0.46204376220703125, 0.480865478515625, 0.49968719482421875, 0.5185089111328125, 0.5373306274414062, 0.55615234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 19.0, 33.0, 74.0, 159.0, 325.0, 200.0, 103.0, 39.0, 21.0, 11.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.74115753173828, -17.211669921875, -16.68218421936035, -16.15269660949707, -15.623208999633789, -15.093722343444824, -14.56423568725586, -14.034748077392578, -13.505261421203613, -12.975774765014648, -12.446287155151367, -11.916800498962402, -11.387313842773438, -10.857826232910156, -10.328339576721191, -9.798852920532227, -9.269365310668945, -8.73987865447998, -8.2103910446167, -7.680904388427734, -7.151417255401611, -6.621930122375488, -6.092443466186523, -5.5629563331604, -5.033469200134277, -4.503982067108154, -3.9744951725006104, -3.4450082778930664, -2.9155211448669434, -2.3860340118408203, -1.8565471172332764, -1.3270602226257324, -0.7975730895996094, -0.2680860757827759, 0.2614009380340576, 0.7908879518508911, 1.3203749656677246, 1.8498620986938477, 2.3793489933013916, 2.9088358879089355, 3.4383230209350586, 3.9678101539611816, 4.497297286987305, 5.0267839431762695, 5.556271076202393, 6.085758209228516, 6.6152448654174805, 7.1447319984436035, 7.674219131469727, 8.203705787658691, 8.733193397521973, 9.262680053710938, 9.792167663574219, 10.321654319763184, 10.851140975952148, 11.38062858581543, 11.910115242004395, 12.43960189819336, 12.96908950805664, 13.498576164245605, 14.02806282043457, 14.557550430297852, 15.087037086486816, 15.616523742675781, 16.146011352539062]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 5.0, 9.0, 8.0, 17.0, 12.0, 13.0, 16.0, 19.0, 22.0, 28.0, 30.0, 29.0, 30.0, 29.0, 35.0, 50.0, 55.0, 88.0, 76.0, 61.0, 37.0, 31.0, 34.0, 22.0, 33.0, 30.0, 16.0, 18.0, 31.0, 19.0, 15.0, 10.0, 7.0, 8.0, 9.0, 4.0, 7.0, 8.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-8.921832084655762, -8.66435432434082, -8.406875610351562, -8.149396896362305, -7.891919136047363, -7.634440898895264, -7.376962661743164, -7.1194844245910645, -6.862006187438965, -6.604527950286865, -6.347049713134766, -6.089571475982666, -5.832093238830566, -5.574615001678467, -5.317136764526367, -5.059658527374268, -4.802180290222168, -4.544702053070068, -4.287223815917969, -4.029745578765869, -3.7722673416137695, -3.51478910446167, -3.2573108673095703, -2.9998326301574707, -2.742354393005371, -2.4848761558532715, -2.227397918701172, -1.9699196815490723, -1.7124414443969727, -1.454963207244873, -1.1974849700927734, -0.9400067329406738, -0.6825294494628906, -0.425051212310791, -0.1675729751586914, 0.0899052619934082, 0.3473834991455078, 0.6048617362976074, 0.862339973449707, 1.1198182106018066, 1.3772964477539062, 1.6347746849060059, 1.8922529220581055, 2.149731159210205, 2.4072093963623047, 2.6646876335144043, 2.922165870666504, 3.1796441078186035, 3.437122344970703, 3.6946005821228027, 3.9520788192749023, 4.209557056427002, 4.467035293579102, 4.724513530731201, 4.981991767883301, 5.2394700050354, 5.4969482421875, 5.7544264793396, 6.011904716491699, 6.269382953643799, 6.526861190795898, 6.784339427947998, 7.041817665100098, 7.299295902252197, 7.556774139404297]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 12.0, 12.0, 9.0, 18.0, 31.0, 51.0, 46.0, 80.0, 109.0, 163.0, 259.0, 390.0, 568.0, 889.0, 1470.0, 2514.0, 4951.0, 11363.0, 37048.0, 169603.0, 830838.0, 2041584.0, 870289.0, 163108.0, 35892.0, 11395.0, 4943.0, 2540.0, 1415.0, 875.0, 558.0, 388.0, 253.0, 177.0, 130.0, 101.0, 63.0, 45.0, 28.0, 19.0, 14.0, 13.0, 5.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5108871459960938, -0.4929656982421875, -0.47504425048828125, -0.457122802734375, -0.43920135498046875, -0.4212799072265625, -0.40335845947265625, -0.38543701171875, -0.36751556396484375, -0.3495941162109375, -0.33167266845703125, -0.313751220703125, -0.29582977294921875, -0.2779083251953125, -0.25998687744140625, -0.2420654296875, -0.22414398193359375, -0.2062225341796875, -0.18830108642578125, -0.170379638671875, -0.15245819091796875, -0.1345367431640625, -0.11661529541015625, -0.09869384765625, -0.08077239990234375, -0.0628509521484375, -0.04492950439453125, -0.027008056640625, -0.00908660888671875, 0.0088348388671875, 0.02675628662109375, 0.044677734375, 0.06259918212890625, 0.0805206298828125, 0.09844207763671875, 0.116363525390625, 0.13428497314453125, 0.1522064208984375, 0.17012786865234375, 0.18804931640625, 0.20597076416015625, 0.2238922119140625, 0.24181365966796875, 0.259735107421875, 0.27765655517578125, 0.2955780029296875, 0.31349945068359375, 0.3314208984375, 0.34934234619140625, 0.3672637939453125, 0.38518524169921875, 0.403106689453125, 0.42102813720703125, 0.4389495849609375, 0.45687103271484375, 0.47479248046875, 0.49271392822265625, 0.5106353759765625, 0.5285568237304688, 0.546478271484375, 0.5643997192382812, 0.5823211669921875, 0.6002426147460938, 0.6181640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 1.0, 4.0, 8.0, 10.0, 10.0, 7.0, 15.0, 29.0, 23.0, 30.0, 40.0, 31.0, 42.0, 35.0, 47.0, 45.0, 50.0, 58.0, 49.0, 42.0, 47.0, 44.0, 37.0, 42.0, 21.0, 35.0, 32.0, 25.0, 19.0, 20.0, 26.0, 24.0, 15.0, 4.0, 12.0, 7.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61376953125, -0.5949630737304688, -0.5761566162109375, -0.5573501586914062, -0.538543701171875, -0.5197372436523438, -0.5009307861328125, -0.48212432861328125, -0.46331787109375, -0.44451141357421875, -0.4257049560546875, -0.40689849853515625, -0.388092041015625, -0.36928558349609375, -0.3504791259765625, -0.33167266845703125, -0.3128662109375, -0.29405975341796875, -0.2752532958984375, -0.25644683837890625, -0.237640380859375, -0.21883392333984375, -0.2000274658203125, -0.18122100830078125, -0.16241455078125, -0.14360809326171875, -0.1248016357421875, -0.10599517822265625, -0.087188720703125, -0.06838226318359375, -0.0495758056640625, -0.03076934814453125, -0.011962890625, 0.00684356689453125, 0.0256500244140625, 0.04445648193359375, 0.063262939453125, 0.08206939697265625, 0.1008758544921875, 0.11968231201171875, 0.13848876953125, 0.15729522705078125, 0.1761016845703125, 0.19490814208984375, 0.213714599609375, 0.23252105712890625, 0.2513275146484375, 0.27013397216796875, 0.2889404296875, 0.30774688720703125, 0.3265533447265625, 0.34535980224609375, 0.364166259765625, 0.38297271728515625, 0.4017791748046875, 0.42058563232421875, 0.43939208984375, 0.45819854736328125, 0.4770050048828125, 0.49581146240234375, 0.514617919921875, 0.5334243774414062, 0.5522308349609375, 0.5710372924804688, 0.58984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 16.0, 25.0, 52.0, 162.0, 404.0, 2203.0, 317807.0, 3867955.0, 4624.0, 654.0, 209.0, 86.0, 41.0, 24.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.658935546875, -4.50927734375, -4.359619140625, -4.2099609375, -4.060302734375, -3.91064453125, -3.760986328125, -3.611328125, -3.461669921875, -3.31201171875, -3.162353515625, -3.0126953125, -2.863037109375, -2.71337890625, -2.563720703125, -2.4140625, -2.264404296875, -2.11474609375, -1.965087890625, -1.8154296875, -1.665771484375, -1.51611328125, -1.366455078125, -1.216796875, -1.067138671875, -0.91748046875, -0.767822265625, -0.6181640625, -0.468505859375, -0.31884765625, -0.169189453125, -0.01953125, 0.130126953125, 0.27978515625, 0.429443359375, 0.5791015625, 0.728759765625, 0.87841796875, 1.028076171875, 1.177734375, 1.327392578125, 1.47705078125, 1.626708984375, 1.7763671875, 1.926025390625, 2.07568359375, 2.225341796875, 2.375, 2.524658203125, 2.67431640625, 2.823974609375, 2.9736328125, 3.123291015625, 3.27294921875, 3.422607421875, 3.572265625, 3.721923828125, 3.87158203125, 4.021240234375, 4.1708984375, 4.320556640625, 4.47021484375, 4.619873046875, 4.76953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 10.0, 24.0, 14.0, 40.0, 84.0, 145.0, 339.0, 804.0, 1085.0, 787.0, 364.0, 182.0, 78.0, 44.0, 31.0, 15.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1865234375, -1.1287078857421875, -1.070892333984375, -1.0130767822265625, -0.95526123046875, -0.8974456787109375, -0.839630126953125, -0.7818145751953125, -0.7239990234375, -0.6661834716796875, -0.608367919921875, -0.5505523681640625, -0.49273681640625, -0.4349212646484375, -0.377105712890625, -0.3192901611328125, -0.261474609375, -0.2036590576171875, -0.145843505859375, -0.0880279541015625, -0.03021240234375, 0.0276031494140625, 0.085418701171875, 0.1432342529296875, 0.2010498046875, 0.2588653564453125, 0.316680908203125, 0.3744964599609375, 0.43231201171875, 0.4901275634765625, 0.547943115234375, 0.6057586669921875, 0.66357421875, 0.7213897705078125, 0.779205322265625, 0.8370208740234375, 0.89483642578125, 0.9526519775390625, 1.010467529296875, 1.0682830810546875, 1.1260986328125, 1.1839141845703125, 1.241729736328125, 1.2995452880859375, 1.35736083984375, 1.4151763916015625, 1.472991943359375, 1.5308074951171875, 1.588623046875, 1.6464385986328125, 1.704254150390625, 1.7620697021484375, 1.81988525390625, 1.8777008056640625, 1.935516357421875, 1.9933319091796875, 2.0511474609375, 2.1089630126953125, 2.166778564453125, 2.2245941162109375, 2.28240966796875, 2.3402252197265625, 2.398040771484375, 2.4558563232421875, 2.513671875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 13.0, 22.0, 55.0, 204.0, 299.0, 256.0, 99.0, 28.0, 16.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.188379287719727, -12.54666519165039, -11.904952049255371, -11.263237953186035, -10.6215238571167, -9.97981071472168, -9.338096618652344, -8.696382522583008, -8.054668426513672, -7.412954807281494, -6.771240711212158, -6.1295270919799805, -5.4878129959106445, -4.846099376678467, -4.204385757446289, -3.562671661376953, -2.9209585189819336, -2.2792446613311768, -1.6375309228897095, -0.9958171844482422, -0.35410332679748535, 0.2876105308532715, 0.9293241500854492, 1.5710382461547852, 2.212751865386963, 2.8544657230377197, 3.4961795806884766, 4.137893199920654, 4.779606819152832, 5.421320915222168, 6.063034534454346, 6.704748630523682, 7.346462249755859, 7.988175868988037, 8.629889488220215, 9.27160358428955, 9.913317680358887, 10.555030822753906, 11.196744918823242, 11.838459014892578, 12.480173110961914, 13.12188720703125, 13.76360034942627, 14.405314445495605, 15.047028541564941, 15.688741683959961, 16.330455780029297, 16.972169876098633, 17.61388397216797, 18.255598068237305, 18.89731216430664, 19.539024353027344, 20.18073844909668, 20.822452545166016, 21.46416664123535, 22.105880737304688, 22.74759292602539, 23.389307022094727, 24.031021118164062, 24.672733306884766, 25.3144474029541, 25.956161499023438, 26.597875595092773, 27.23958969116211, 27.881303787231445]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 6.0, 10.0, 7.0, 10.0, 12.0, 20.0, 21.0, 20.0, 22.0, 51.0, 38.0, 39.0, 51.0, 56.0, 56.0, 49.0, 50.0, 43.0, 66.0, 53.0, 41.0, 31.0, 55.0, 38.0, 38.0, 21.0, 20.0, 17.0, 12.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.450509548187256, -7.235997200012207, -7.021484851837158, -6.806972503662109, -6.592460632324219, -6.377947807312012, -6.163435935974121, -5.948923587799072, -5.734411239624023, -5.519898891448975, -5.305386543273926, -5.090874195098877, -4.876361846923828, -4.6618499755859375, -4.447337627410889, -4.23282527923584, -4.018312931060791, -3.803800582885742, -3.5892882347106934, -3.3747761249542236, -3.160263776779175, -2.945751428604126, -2.7312393188476562, -2.5167269706726074, -2.3022146224975586, -2.0877022743225098, -1.8731900453567505, -1.6586778163909912, -1.4441654682159424, -1.2296531200408936, -1.0151408910751343, -0.800628662109375, -0.5861167907714844, -0.3716045022010803, -0.15709221363067627, 0.05742007493972778, 0.27193236351013184, 0.48644471168518066, 0.7009569406509399, 0.9154691696166992, 1.129981517791748, 1.3444938659667969, 1.5590060949325562, 1.7735183238983154, 1.9880306720733643, 2.202543020248413, 2.417055130004883, 2.6315674781799316, 2.8460798263549805, 3.0605921745300293, 3.275104522705078, 3.489616632461548, 3.7041289806365967, 3.9186413288116455, 4.133153438568115, 4.347665786743164, 4.562178134918213, 4.776690483093262, 4.9912028312683105, 5.205715179443359, 5.42022705078125, 5.634739875793457, 5.849251747131348, 6.0637640953063965, 6.278276443481445]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 14.0, 20.0, 35.0, 38.0, 70.0, 72.0, 154.0, 213.0, 291.0, 508.0, 725.0, 1230.0, 2042.0, 3146.0, 5205.0, 9251.0, 15775.0, 27693.0, 49693.0, 89325.0, 156435.0, 223943.0, 193733.0, 117800.0, 65269.0, 36076.0, 20480.0, 11829.0, 6909.0, 4027.0, 2445.0, 1504.0, 929.0, 568.0, 369.0, 233.0, 164.0, 88.0, 79.0, 64.0, 27.0, 31.0, 13.0, 12.0, 4.0, 10.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.467041015625, -0.4507865905761719, -0.43453216552734375, -0.4182777404785156, -0.4020233154296875, -0.3857688903808594, -0.36951446533203125, -0.3532600402832031, -0.337005615234375, -0.3207511901855469, -0.30449676513671875, -0.2882423400878906, -0.2719879150390625, -0.2557334899902344, -0.23947906494140625, -0.22322463989257812, -0.20697021484375, -0.19071578979492188, -0.17446136474609375, -0.15820693969726562, -0.1419525146484375, -0.12569808959960938, -0.10944366455078125, -0.09318923950195312, -0.076934814453125, -0.060680389404296875, -0.04442596435546875, -0.028171539306640625, -0.0119171142578125, 0.004337310791015625, 0.02059173583984375, 0.036846160888671875, 0.0531005859375, 0.06935501098632812, 0.08560943603515625, 0.10186386108398438, 0.1181182861328125, 0.13437271118164062, 0.15062713623046875, 0.16688156127929688, 0.183135986328125, 0.19939041137695312, 0.21564483642578125, 0.23189926147460938, 0.2481536865234375, 0.2644081115722656, 0.28066253662109375, 0.2969169616699219, 0.31317138671875, 0.3294258117675781, 0.34568023681640625, 0.3619346618652344, 0.3781890869140625, 0.3944435119628906, 0.41069793701171875, 0.4269523620605469, 0.443206787109375, 0.4594612121582031, 0.47571563720703125, 0.4919700622558594, 0.5082244873046875, 0.5244789123535156, 0.5407333374023438, 0.5569877624511719, 0.5732421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 7.0, 5.0, 9.0, 10.0, 8.0, 19.0, 25.0, 18.0, 17.0, 26.0, 41.0, 36.0, 47.0, 40.0, 44.0, 52.0, 46.0, 45.0, 37.0, 54.0, 36.0, 48.0, 48.0, 24.0, 26.0, 38.0, 28.0, 29.0, 20.0, 24.0, 15.0, 19.0, 14.0, 6.0, 4.0, 7.0, 6.0, 3.0, 7.0, 0.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5100021362304688, -0.4911956787109375, -0.47238922119140625, -0.453582763671875, -0.43477630615234375, -0.4159698486328125, -0.39716339111328125, -0.37835693359375, -0.35955047607421875, -0.3407440185546875, -0.32193756103515625, -0.303131103515625, -0.28432464599609375, -0.2655181884765625, -0.24671173095703125, -0.2279052734375, -0.20909881591796875, -0.1902923583984375, -0.17148590087890625, -0.152679443359375, -0.13387298583984375, -0.1150665283203125, -0.09626007080078125, -0.07745361328125, -0.05864715576171875, -0.0398406982421875, -0.02103424072265625, -0.002227783203125, 0.01657867431640625, 0.0353851318359375, 0.05419158935546875, 0.072998046875, 0.09180450439453125, 0.1106109619140625, 0.12941741943359375, 0.148223876953125, 0.16703033447265625, 0.1858367919921875, 0.20464324951171875, 0.22344970703125, 0.24225616455078125, 0.2610626220703125, 0.27986907958984375, 0.298675537109375, 0.31748199462890625, 0.3362884521484375, 0.35509490966796875, 0.3739013671875, 0.39270782470703125, 0.4115142822265625, 0.43032073974609375, 0.449127197265625, 0.46793365478515625, 0.4867401123046875, 0.5055465698242188, 0.52435302734375, 0.5431594848632812, 0.5619659423828125, 0.5807723999023438, 0.599578857421875, 0.6183853149414062, 0.6371917724609375, 0.6559982299804688, 0.6748046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 9.0, 8.0, 11.0, 18.0, 22.0, 25.0, 69.0, 73.0, 127.0, 205.0, 378.0, 770.0, 2221.0, 11783.0, 132598.0, 821244.0, 68295.0, 7373.0, 1735.0, 688.0, 357.0, 178.0, 129.0, 80.0, 47.0, 32.0, 27.0, 16.0, 14.0, 3.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.589935302734375, -2.50994873046875, -2.429962158203125, -2.3499755859375, -2.269989013671875, -2.19000244140625, -2.110015869140625, -2.030029296875, -1.950042724609375, -1.87005615234375, -1.790069580078125, -1.7100830078125, -1.630096435546875, -1.55010986328125, -1.470123291015625, -1.39013671875, -1.310150146484375, -1.23016357421875, -1.150177001953125, -1.0701904296875, -0.990203857421875, -0.91021728515625, -0.830230712890625, -0.750244140625, -0.670257568359375, -0.59027099609375, -0.510284423828125, -0.4302978515625, -0.350311279296875, -0.27032470703125, -0.190338134765625, -0.1103515625, -0.030364990234375, 0.04962158203125, 0.129608154296875, 0.2095947265625, 0.289581298828125, 0.36956787109375, 0.449554443359375, 0.529541015625, 0.609527587890625, 0.68951416015625, 0.769500732421875, 0.8494873046875, 0.929473876953125, 1.00946044921875, 1.089447021484375, 1.16943359375, 1.249420166015625, 1.32940673828125, 1.409393310546875, 1.4893798828125, 1.569366455078125, 1.64935302734375, 1.729339599609375, 1.809326171875, 1.889312744140625, 1.96929931640625, 2.049285888671875, 2.1292724609375, 2.209259033203125, 2.28924560546875, 2.369232177734375, 2.44921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 13.0, 9.0, 11.0, 17.0, 21.0, 18.0, 26.0, 29.0, 31.0, 33.0, 38.0, 45.0, 37.0, 57.0, 50.0, 66.0, 52.0, 57.0, 36.0, 44.0, 36.0, 35.0, 29.0, 26.0, 37.0, 21.0, 20.0, 15.0, 11.0, 4.0, 18.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.171875, -2.10394287109375, -2.0360107421875, -1.96807861328125, -1.900146484375, -1.83221435546875, -1.7642822265625, -1.69635009765625, -1.62841796875, -1.56048583984375, -1.4925537109375, -1.42462158203125, -1.356689453125, -1.28875732421875, -1.2208251953125, -1.15289306640625, -1.0849609375, -1.01702880859375, -0.9490966796875, -0.88116455078125, -0.813232421875, -0.74530029296875, -0.6773681640625, -0.60943603515625, -0.54150390625, -0.47357177734375, -0.4056396484375, -0.33770751953125, -0.269775390625, -0.20184326171875, -0.1339111328125, -0.06597900390625, 0.001953125, 0.06988525390625, 0.1378173828125, 0.20574951171875, 0.273681640625, 0.34161376953125, 0.4095458984375, 0.47747802734375, 0.54541015625, 0.61334228515625, 0.6812744140625, 0.74920654296875, 0.817138671875, 0.88507080078125, 0.9530029296875, 1.02093505859375, 1.0888671875, 1.15679931640625, 1.2247314453125, 1.29266357421875, 1.360595703125, 1.42852783203125, 1.4964599609375, 1.56439208984375, 1.63232421875, 1.70025634765625, 1.7681884765625, 1.83612060546875, 1.904052734375, 1.97198486328125, 2.0399169921875, 2.10784912109375, 2.17578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 14.0, 13.0, 30.0, 45.0, 77.0, 109.0, 245.0, 671.0, 2086.0, 8020.0, 54119.0, 796102.0, 164318.0, 17108.0, 3666.0, 1099.0, 415.0, 149.0, 92.0, 51.0, 31.0, 18.0, 23.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.77880859375, -0.7534561157226562, -0.7281036376953125, -0.7027511596679688, -0.677398681640625, -0.6520462036132812, -0.6266937255859375, -0.6013412475585938, -0.57598876953125, -0.5506362915039062, -0.5252838134765625, -0.49993133544921875, -0.474578857421875, -0.44922637939453125, -0.4238739013671875, -0.39852142333984375, -0.3731689453125, -0.34781646728515625, -0.3224639892578125, -0.29711151123046875, -0.271759033203125, -0.24640655517578125, -0.2210540771484375, -0.19570159912109375, -0.17034912109375, -0.14499664306640625, -0.1196441650390625, -0.09429168701171875, -0.068939208984375, -0.04358673095703125, -0.0182342529296875, 0.00711822509765625, 0.032470703125, 0.05782318115234375, 0.0831756591796875, 0.10852813720703125, 0.133880615234375, 0.15923309326171875, 0.1845855712890625, 0.20993804931640625, 0.23529052734375, 0.26064300537109375, 0.2859954833984375, 0.31134796142578125, 0.336700439453125, 0.36205291748046875, 0.3874053955078125, 0.41275787353515625, 0.4381103515625, 0.46346282958984375, 0.4888153076171875, 0.5141677856445312, 0.539520263671875, 0.5648727416992188, 0.5902252197265625, 0.6155776977539062, 0.64093017578125, 0.6662826538085938, 0.6916351318359375, 0.7169876098632812, 0.742340087890625, 0.7676925659179688, 0.7930450439453125, 0.8183975219726562, 0.84375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 30.0, 37.0, 52.0, 85.0, 148.0, 177.0, 166.0, 118.0, 65.0, 39.0, 23.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003266334533691406, -0.000317256897687912, -0.00030788034200668335, -0.0002985037863254547, -0.0002891272306442261, -0.00027975067496299744, -0.0002703741192817688, -0.00026099756360054016, -0.0002516210079193115, -0.00024224445223808289, -0.00023286789655685425, -0.0002234913408756256, -0.00021411478519439697, -0.00020473822951316833, -0.0001953616738319397, -0.00018598511815071106, -0.00017660856246948242, -0.00016723200678825378, -0.00015785545110702515, -0.0001484788954257965, -0.00013910233974456787, -0.00012972578406333923, -0.0001203492283821106, -0.00011097267270088196, -0.00010159611701965332, -9.221956133842468e-05, -8.284300565719604e-05, -7.346644997596741e-05, -6.408989429473877e-05, -5.471333861351013e-05, -4.5336782932281494e-05, -3.5960227251052856e-05, -2.658367156982422e-05, -1.720711588859558e-05, -7.830560207366943e-06, 1.5459954738616943e-06, 1.0922551155090332e-05, 2.029910683631897e-05, 2.9675662517547607e-05, 3.9052218198776245e-05, 4.842877388000488e-05, 5.780532956123352e-05, 6.718188524246216e-05, 7.65584409236908e-05, 8.593499660491943e-05, 9.531155228614807e-05, 0.00010468810796737671, 0.00011406466364860535, 0.00012344121932983398, 0.00013281777501106262, 0.00014219433069229126, 0.0001515708863735199, 0.00016094744205474854, 0.00017032399773597717, 0.0001797005534172058, 0.00018907710909843445, 0.00019845366477966309, 0.00020783022046089172, 0.00021720677614212036, 0.000226583331823349, 0.00023595988750457764, 0.0002453364431858063, 0.0002547129988670349, 0.00026408955454826355, 0.0002734661102294922]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 5.0, 8.0, 10.0, 34.0, 44.0, 100.0, 327.0, 1349.0, 26678.0, 1004701.0, 13735.0, 1089.0, 284.0, 93.0, 36.0, 33.0, 8.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.247100830078125, -2.17779541015625, -2.108489990234375, -2.0391845703125, -1.969879150390625, -1.90057373046875, -1.831268310546875, -1.761962890625, -1.692657470703125, -1.62335205078125, -1.554046630859375, -1.4847412109375, -1.415435791015625, -1.34613037109375, -1.276824951171875, -1.20751953125, -1.138214111328125, -1.06890869140625, -0.999603271484375, -0.9302978515625, -0.860992431640625, -0.79168701171875, -0.722381591796875, -0.653076171875, -0.583770751953125, -0.51446533203125, -0.445159912109375, -0.3758544921875, -0.306549072265625, -0.23724365234375, -0.167938232421875, -0.0986328125, -0.029327392578125, 0.03997802734375, 0.109283447265625, 0.1785888671875, 0.247894287109375, 0.31719970703125, 0.386505126953125, 0.455810546875, 0.525115966796875, 0.59442138671875, 0.663726806640625, 0.7330322265625, 0.802337646484375, 0.87164306640625, 0.940948486328125, 1.01025390625, 1.079559326171875, 1.14886474609375, 1.218170166015625, 1.2874755859375, 1.356781005859375, 1.42608642578125, 1.495391845703125, 1.564697265625, 1.634002685546875, 1.70330810546875, 1.772613525390625, 1.8419189453125, 1.911224365234375, 1.98052978515625, 2.049835205078125, 2.119140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 13.0, 27.0, 90.0, 186.0, 266.0, 195.0, 119.0, 50.0, 17.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6279296875, -1.579620361328125, -1.53131103515625, -1.483001708984375, -1.4346923828125, -1.386383056640625, -1.33807373046875, -1.289764404296875, -1.241455078125, -1.193145751953125, -1.14483642578125, -1.096527099609375, -1.0482177734375, -0.999908447265625, -0.95159912109375, -0.903289794921875, -0.85498046875, -0.806671142578125, -0.75836181640625, -0.710052490234375, -0.6617431640625, -0.613433837890625, -0.56512451171875, -0.516815185546875, -0.468505859375, -0.420196533203125, -0.37188720703125, -0.323577880859375, -0.2752685546875, -0.226959228515625, -0.17864990234375, -0.130340576171875, -0.08203125, -0.033721923828125, 0.01458740234375, 0.062896728515625, 0.1112060546875, 0.159515380859375, 0.20782470703125, 0.256134033203125, 0.304443359375, 0.352752685546875, 0.40106201171875, 0.449371337890625, 0.4976806640625, 0.545989990234375, 0.59429931640625, 0.642608642578125, 0.69091796875, 0.739227294921875, 0.78753662109375, 0.835845947265625, 0.8841552734375, 0.932464599609375, 0.98077392578125, 1.029083251953125, 1.077392578125, 1.125701904296875, 1.17401123046875, 1.222320556640625, 1.2706298828125, 1.318939208984375, 1.36724853515625, 1.415557861328125, 1.4638671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 12.0, 27.0, 72.0, 119.0, 317.0, 283.0, 101.0, 43.0, 15.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.00189971923828, -29.363317489624023, -28.724735260009766, -28.086153030395508, -27.44757080078125, -26.80898666381836, -26.1704044342041, -25.531822204589844, -24.893239974975586, -24.254657745361328, -23.61607551574707, -22.977493286132812, -22.338909149169922, -21.700326919555664, -21.061744689941406, -20.42316246032715, -19.78458023071289, -19.145998001098633, -18.507415771484375, -17.868833541870117, -17.23025131225586, -16.59166717529297, -15.953084945678711, -15.314502716064453, -14.675920486450195, -14.037338256835938, -13.39875602722168, -12.760172843933105, -12.121590614318848, -11.48300838470459, -10.844425201416016, -10.205842971801758, -9.5672607421875, -8.928678512573242, -8.290096282958984, -7.65151309967041, -7.012930870056152, -6.3743486404418945, -5.7357659339904785, -5.0971832275390625, -4.458600997924805, -3.8200185298919678, -3.181436061859131, -2.542853593826294, -1.904271125793457, -1.2656886577606201, -0.6271061897277832, 0.011476516723632812, 0.6500587463378906, 1.2886412143707275, 1.9272236824035645, 2.5658061504364014, 3.2043886184692383, 3.842971086502075, 4.481553554534912, 5.120136260986328, 5.758718490600586, 6.397300720214844, 7.03588342666626, 7.674466133117676, 8.313048362731934, 8.951630592346191, 9.590213775634766, 10.228796005249023, 10.867378234863281]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 4.0, 13.0, 11.0, 7.0, 16.0, 17.0, 16.0, 17.0, 18.0, 18.0, 28.0, 37.0, 23.0, 26.0, 32.0, 42.0, 48.0, 103.0, 102.0, 66.0, 32.0, 27.0, 26.0, 32.0, 30.0, 33.0, 25.0, 14.0, 18.0, 7.0, 5.0, 10.0, 8.0, 12.0, 9.0, 6.0, 12.0, 2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.52434778213501, -7.28047513961792, -7.03660249710083, -6.79272985458374, -6.54885721206665, -6.3049845695495605, -6.0611114501953125, -5.817238807678223, -5.573366165161133, -5.329493522644043, -5.085620880126953, -4.841748237609863, -4.597875595092773, -4.354002952575684, -4.110130310058594, -3.866257429122925, -3.622385025024414, -3.378512382507324, -3.1346397399902344, -2.8907670974731445, -2.6468944549560547, -2.403021812438965, -2.159148931503296, -1.915276288986206, -1.6714036464691162, -1.4275310039520264, -1.1836583614349365, -0.9397855997085571, -0.6959129571914673, -0.45204031467437744, -0.20816755294799805, 0.0357050895690918, 0.27957820892333984, 0.5234508514404297, 0.7673235535621643, 1.011196255683899, 1.2550688982009888, 1.4989415407180786, 1.742814302444458, 1.9866869449615479, 2.2305595874786377, 2.4744322299957275, 2.7183048725128174, 2.9621777534484863, 3.206050395965576, 3.449923038482666, 3.693795680999756, 3.9376683235168457, 4.1815409660339355, 4.425413608551025, 4.669286251068115, 4.913158893585205, 5.157031536102295, 5.400904178619385, 5.644777297973633, 5.888649940490723, 6.1325225830078125, 6.376395225524902, 6.620267868041992, 6.864140510559082, 7.108013153076172, 7.351885795593262, 7.595758438110352, 7.839631080627441, 8.083503723144531]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 12.0, 14.0, 27.0, 30.0, 62.0, 68.0, 113.0, 152.0, 253.0, 453.0, 821.0, 1372.0, 2826.0, 6271.0, 17395.0, 64374.0, 282624.0, 1158681.0, 1865685.0, 612018.0, 130787.0, 31826.0, 9844.0, 4040.0, 1927.0, 1059.0, 554.0, 357.0, 215.0, 129.0, 93.0, 54.0, 40.0, 25.0, 20.0, 17.0, 7.0, 10.0, 5.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.60693359375, -0.58868408203125, -0.5704345703125, -0.55218505859375, -0.533935546875, -0.51568603515625, -0.4974365234375, -0.47918701171875, -0.4609375, -0.44268798828125, -0.4244384765625, -0.40618896484375, -0.387939453125, -0.36968994140625, -0.3514404296875, -0.33319091796875, -0.31494140625, -0.29669189453125, -0.2784423828125, -0.26019287109375, -0.241943359375, -0.22369384765625, -0.2054443359375, -0.18719482421875, -0.1689453125, -0.15069580078125, -0.1324462890625, -0.11419677734375, -0.095947265625, -0.07769775390625, -0.0594482421875, -0.04119873046875, -0.02294921875, -0.00469970703125, 0.0135498046875, 0.03179931640625, 0.050048828125, 0.06829833984375, 0.0865478515625, 0.10479736328125, 0.123046875, 0.14129638671875, 0.1595458984375, 0.17779541015625, 0.196044921875, 0.21429443359375, 0.2325439453125, 0.25079345703125, 0.26904296875, 0.28729248046875, 0.3055419921875, 0.32379150390625, 0.342041015625, 0.36029052734375, 0.3785400390625, 0.39678955078125, 0.4150390625, 0.43328857421875, 0.4515380859375, 0.46978759765625, 0.488037109375, 0.50628662109375, 0.5245361328125, 0.54278564453125, 0.56103515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 0.0, 9.0, 6.0, 10.0, 10.0, 9.0, 15.0, 12.0, 21.0, 22.0, 21.0, 25.0, 37.0, 33.0, 35.0, 31.0, 42.0, 34.0, 43.0, 41.0, 45.0, 34.0, 34.0, 58.0, 34.0, 34.0, 35.0, 22.0, 37.0, 30.0, 33.0, 21.0, 14.0, 13.0, 21.0, 15.0, 13.0, 10.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.52099609375, -0.504150390625, -0.4873046875, -0.470458984375, -0.45361328125, -0.436767578125, -0.419921875, -0.403076171875, -0.38623046875, -0.369384765625, -0.3525390625, -0.335693359375, -0.31884765625, -0.302001953125, -0.28515625, -0.268310546875, -0.25146484375, -0.234619140625, -0.2177734375, -0.200927734375, -0.18408203125, -0.167236328125, -0.150390625, -0.133544921875, -0.11669921875, -0.099853515625, -0.0830078125, -0.066162109375, -0.04931640625, -0.032470703125, -0.015625, 0.001220703125, 0.01806640625, 0.034912109375, 0.0517578125, 0.068603515625, 0.08544921875, 0.102294921875, 0.119140625, 0.135986328125, 0.15283203125, 0.169677734375, 0.1865234375, 0.203369140625, 0.22021484375, 0.237060546875, 0.25390625, 0.270751953125, 0.28759765625, 0.304443359375, 0.3212890625, 0.338134765625, 0.35498046875, 0.371826171875, 0.388671875, 0.405517578125, 0.42236328125, 0.439208984375, 0.4560546875, 0.472900390625, 0.48974609375, 0.506591796875, 0.5234375, 0.540283203125, 0.55712890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 17.0, 41.0, 117.0, 290.0, 1041.0, 19763.0, 4152367.0, 19013.0, 1106.0, 295.0, 116.0, 52.0, 27.0, 10.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.21209716796875, -4.0531005859375, -3.89410400390625, -3.735107421875, -3.57611083984375, -3.4171142578125, -3.25811767578125, -3.09912109375, -2.94012451171875, -2.7811279296875, -2.62213134765625, -2.463134765625, -2.30413818359375, -2.1451416015625, -1.98614501953125, -1.8271484375, -1.66815185546875, -1.5091552734375, -1.35015869140625, -1.191162109375, -1.03216552734375, -0.8731689453125, -0.71417236328125, -0.55517578125, -0.39617919921875, -0.2371826171875, -0.07818603515625, 0.080810546875, 0.23980712890625, 0.3988037109375, 0.55780029296875, 0.716796875, 0.87579345703125, 1.0347900390625, 1.19378662109375, 1.352783203125, 1.51177978515625, 1.6707763671875, 1.82977294921875, 1.98876953125, 2.14776611328125, 2.3067626953125, 2.46575927734375, 2.624755859375, 2.78375244140625, 2.9427490234375, 3.10174560546875, 3.2607421875, 3.41973876953125, 3.5787353515625, 3.73773193359375, 3.896728515625, 4.05572509765625, 4.2147216796875, 4.37371826171875, 4.53271484375, 4.69171142578125, 4.8507080078125, 5.00970458984375, 5.168701171875, 5.32769775390625, 5.4866943359375, 5.64569091796875, 5.8046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 5.0, 6.0, 3.0, 7.0, 14.0, 41.0, 88.0, 178.0, 383.0, 880.0, 1175.0, 710.0, 292.0, 142.0, 57.0, 44.0, 22.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.748046875, -1.678985595703125, -1.60992431640625, -1.540863037109375, -1.4718017578125, -1.402740478515625, -1.33367919921875, -1.264617919921875, -1.195556640625, -1.126495361328125, -1.05743408203125, -0.988372802734375, -0.9193115234375, -0.850250244140625, -0.78118896484375, -0.712127685546875, -0.64306640625, -0.574005126953125, -0.50494384765625, -0.435882568359375, -0.3668212890625, -0.297760009765625, -0.22869873046875, -0.159637451171875, -0.090576171875, -0.021514892578125, 0.04754638671875, 0.116607666015625, 0.1856689453125, 0.254730224609375, 0.32379150390625, 0.392852783203125, 0.4619140625, 0.530975341796875, 0.60003662109375, 0.669097900390625, 0.7381591796875, 0.807220458984375, 0.87628173828125, 0.945343017578125, 1.014404296875, 1.083465576171875, 1.15252685546875, 1.221588134765625, 1.2906494140625, 1.359710693359375, 1.42877197265625, 1.497833251953125, 1.56689453125, 1.635955810546875, 1.70501708984375, 1.774078369140625, 1.8431396484375, 1.912200927734375, 1.98126220703125, 2.050323486328125, 2.119384765625, 2.188446044921875, 2.25750732421875, 2.326568603515625, 2.3956298828125, 2.464691162109375, 2.53375244140625, 2.602813720703125, 2.671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 19.0, 45.0, 172.0, 361.0, 255.0, 85.0, 32.0, 20.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.079544067382812, -11.24988079071045, -10.420218467712402, -9.590555191040039, -8.760892868041992, -7.931229591369629, -7.101566314697266, -6.2719035148620605, -5.4422407150268555, -4.61257791519165, -3.782914876937866, -2.953251838684082, -2.123589038848877, -1.2939262390136719, -0.4642629623413086, 0.3653998374938965, 1.1950626373291016, 2.0247254371643066, 2.854388475418091, 3.684051513671875, 4.51371431350708, 5.343377113342285, 6.173040390014648, 7.0027031898498535, 7.832365989685059, 8.662029266357422, 9.491691589355469, 10.321354866027832, 11.151018142700195, 11.980680465698242, 12.810343742370605, 13.640007019042969, 14.469669342041016, 15.299332618713379, 16.128995895385742, 16.95865821838379, 17.788320541381836, 18.617984771728516, 19.447647094726562, 20.27730941772461, 21.106971740722656, 21.936634063720703, 22.766298294067383, 23.59596061706543, 24.425622940063477, 25.255287170410156, 26.084949493408203, 26.91461181640625, 27.74427604675293, 28.573938369750977, 29.403602600097656, 30.233264923095703, 31.06292724609375, 31.892589569091797, 32.722251892089844, 33.551918029785156, 34.3815803527832, 35.21124267578125, 36.0409049987793, 36.870567321777344, 37.700233459472656, 38.5298957824707, 39.35955810546875, 40.1892204284668, 41.018882751464844]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 10.0, 12.0, 11.0, 17.0, 23.0, 35.0, 37.0, 35.0, 39.0, 43.0, 65.0, 43.0, 46.0, 40.0, 47.0, 44.0, 50.0, 55.0, 38.0, 36.0, 30.0, 35.0, 31.0, 31.0, 29.0, 18.0, 18.0, 15.0, 8.0, 7.0, 13.0, 7.0, 4.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.137204170227051, -6.908017635345459, -6.678831100463867, -6.449645042419434, -6.220458507537842, -5.99127197265625, -5.762085437774658, -5.532898902893066, -5.303712368011475, -5.074525833129883, -4.845339298248291, -4.616152763366699, -4.386966705322266, -4.157780170440674, -3.928593635559082, -3.6994071006774902, -3.4702208042144775, -3.2410342693328857, -3.011847972869873, -2.7826614379882812, -2.5534749031066895, -2.3242883682250977, -2.095102071762085, -1.8659155368804932, -1.636729121208191, -1.4075427055358887, -1.1783561706542969, -0.9491697549819946, -0.7199832797050476, -0.4907968044281006, -0.26161038875579834, -0.03242385387420654, 0.1967625617980957, 0.4259490370750427, 0.6551355123519897, 0.884321928024292, 1.1135084629058838, 1.342694878578186, 1.5718812942504883, 1.80106782913208, 2.030254364013672, 2.2594408988952637, 2.4886271953582764, 2.717813730239868, 2.94700026512146, 3.1761865615844727, 3.4053730964660645, 3.6345596313476562, 3.863745927810669, 4.092932224273682, 4.322118759155273, 4.551305294036865, 4.780491828918457, 5.009678363800049, 5.238864898681641, 5.468050956726074, 5.697237491607666, 5.926424026489258, 6.15561056137085, 6.384797096252441, 6.613983154296875, 6.843169689178467, 7.072356224060059, 7.30154275894165, 7.530729293823242]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 9.0, 9.0, 7.0, 19.0, 34.0, 39.0, 44.0, 78.0, 128.0, 184.0, 286.0, 431.0, 670.0, 1104.0, 1641.0, 2820.0, 4775.0, 8109.0, 14518.0, 27257.0, 53189.0, 107500.0, 212368.0, 271908.0, 167528.0, 82562.0, 41531.0, 21577.0, 11780.0, 6430.0, 3757.0, 2294.0, 1444.0, 882.0, 521.0, 367.0, 258.0, 177.0, 111.0, 55.0, 51.0, 34.0, 30.0, 13.0, 16.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5922393798828125, -0.569732666015625, -0.5472259521484375, -0.52471923828125, -0.5022125244140625, -0.479705810546875, -0.4571990966796875, -0.4346923828125, -0.4121856689453125, -0.389678955078125, -0.3671722412109375, -0.34466552734375, -0.3221588134765625, -0.299652099609375, -0.2771453857421875, -0.254638671875, -0.2321319580078125, -0.209625244140625, -0.1871185302734375, -0.16461181640625, -0.1421051025390625, -0.119598388671875, -0.0970916748046875, -0.0745849609375, -0.0520782470703125, -0.029571533203125, -0.0070648193359375, 0.01544189453125, 0.0379486083984375, 0.060455322265625, 0.0829620361328125, 0.10546875, 0.1279754638671875, 0.150482177734375, 0.1729888916015625, 0.19549560546875, 0.2180023193359375, 0.240509033203125, 0.2630157470703125, 0.2855224609375, 0.3080291748046875, 0.330535888671875, 0.3530426025390625, 0.37554931640625, 0.3980560302734375, 0.420562744140625, 0.4430694580078125, 0.465576171875, 0.4880828857421875, 0.510589599609375, 0.5330963134765625, 0.55560302734375, 0.5781097412109375, 0.600616455078125, 0.6231231689453125, 0.6456298828125, 0.6681365966796875, 0.690643310546875, 0.7131500244140625, 0.73565673828125, 0.7581634521484375, 0.780670166015625, 0.8031768798828125, 0.82568359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 10.0, 5.0, 5.0, 4.0, 15.0, 14.0, 14.0, 15.0, 20.0, 23.0, 29.0, 32.0, 35.0, 32.0, 34.0, 56.0, 37.0, 41.0, 41.0, 44.0, 54.0, 51.0, 49.0, 31.0, 48.0, 37.0, 23.0, 26.0, 28.0, 24.0, 15.0, 16.0, 19.0, 13.0, 13.0, 5.0, 6.0, 7.0, 7.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.572265625, -0.5529861450195312, -0.5337066650390625, -0.5144271850585938, -0.495147705078125, -0.47586822509765625, -0.4565887451171875, -0.43730926513671875, -0.41802978515625, -0.39875030517578125, -0.3794708251953125, -0.36019134521484375, -0.340911865234375, -0.32163238525390625, -0.3023529052734375, -0.28307342529296875, -0.2637939453125, -0.24451446533203125, -0.2252349853515625, -0.20595550537109375, -0.186676025390625, -0.16739654541015625, -0.1481170654296875, -0.12883758544921875, -0.10955810546875, -0.09027862548828125, -0.0709991455078125, -0.05171966552734375, -0.032440185546875, -0.01316070556640625, 0.0061187744140625, 0.02539825439453125, 0.044677734375, 0.06395721435546875, 0.0832366943359375, 0.10251617431640625, 0.121795654296875, 0.14107513427734375, 0.1603546142578125, 0.17963409423828125, 0.19891357421875, 0.21819305419921875, 0.2374725341796875, 0.25675201416015625, 0.276031494140625, 0.29531097412109375, 0.3145904541015625, 0.33386993408203125, 0.3531494140625, 0.37242889404296875, 0.3917083740234375, 0.41098785400390625, 0.430267333984375, 0.44954681396484375, 0.4688262939453125, 0.48810577392578125, 0.50738525390625, 0.5266647338867188, 0.5459442138671875, 0.5652236938476562, 0.584503173828125, 0.6037826538085938, 0.6230621337890625, 0.6423416137695312, 0.66162109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 17.0, 16.0, 28.0, 32.0, 64.0, 98.0, 149.0, 243.0, 416.0, 883.0, 2438.0, 15990.0, 772546.0, 242044.0, 9895.0, 1924.0, 791.0, 396.0, 221.0, 123.0, 81.0, 38.0, 32.0, 23.0, 21.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.39453125, -4.275421142578125, -4.15631103515625, -4.037200927734375, -3.9180908203125, -3.798980712890625, -3.67987060546875, -3.560760498046875, -3.441650390625, -3.322540283203125, -3.20343017578125, -3.084320068359375, -2.9652099609375, -2.846099853515625, -2.72698974609375, -2.607879638671875, -2.48876953125, -2.369659423828125, -2.25054931640625, -2.131439208984375, -2.0123291015625, -1.893218994140625, -1.77410888671875, -1.654998779296875, -1.535888671875, -1.416778564453125, -1.29766845703125, -1.178558349609375, -1.0594482421875, -0.940338134765625, -0.82122802734375, -0.702117919921875, -0.5830078125, -0.463897705078125, -0.34478759765625, -0.225677490234375, -0.1065673828125, 0.012542724609375, 0.13165283203125, 0.250762939453125, 0.369873046875, 0.488983154296875, 0.60809326171875, 0.727203369140625, 0.8463134765625, 0.965423583984375, 1.08453369140625, 1.203643798828125, 1.32275390625, 1.441864013671875, 1.56097412109375, 1.680084228515625, 1.7991943359375, 1.918304443359375, 2.03741455078125, 2.156524658203125, 2.275634765625, 2.394744873046875, 2.51385498046875, 2.632965087890625, 2.7520751953125, 2.871185302734375, 2.99029541015625, 3.109405517578125, 3.228515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 7.0, 4.0, 2.0, 7.0, 9.0, 12.0, 8.0, 15.0, 18.0, 22.0, 19.0, 29.0, 29.0, 26.0, 44.0, 44.0, 42.0, 52.0, 57.0, 60.0, 57.0, 51.0, 54.0, 43.0, 53.0, 30.0, 32.0, 27.0, 29.0, 19.0, 16.0, 11.0, 19.0, 5.0, 7.0, 5.0, 8.0, 3.0, 1.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.322509765625, -2.24658203125, -2.170654296875, -2.0947265625, -2.018798828125, -1.94287109375, -1.866943359375, -1.791015625, -1.715087890625, -1.63916015625, -1.563232421875, -1.4873046875, -1.411376953125, -1.33544921875, -1.259521484375, -1.18359375, -1.107666015625, -1.03173828125, -0.955810546875, -0.8798828125, -0.803955078125, -0.72802734375, -0.652099609375, -0.576171875, -0.500244140625, -0.42431640625, -0.348388671875, -0.2724609375, -0.196533203125, -0.12060546875, -0.044677734375, 0.03125, 0.107177734375, 0.18310546875, 0.259033203125, 0.3349609375, 0.410888671875, 0.48681640625, 0.562744140625, 0.638671875, 0.714599609375, 0.79052734375, 0.866455078125, 0.9423828125, 1.018310546875, 1.09423828125, 1.170166015625, 1.24609375, 1.322021484375, 1.39794921875, 1.473876953125, 1.5498046875, 1.625732421875, 1.70166015625, 1.777587890625, 1.853515625, 1.929443359375, 2.00537109375, 2.081298828125, 2.1572265625, 2.233154296875, 2.30908203125, 2.385009765625, 2.4609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 1.0, 14.0, 9.0, 8.0, 5.0, 14.0, 27.0, 34.0, 52.0, 80.0, 117.0, 206.0, 437.0, 897.0, 2509.0, 9615.0, 55684.0, 760473.0, 188027.0, 22418.0, 4888.0, 1597.0, 635.0, 314.0, 189.0, 95.0, 60.0, 36.0, 29.0, 19.0, 9.0, 8.0, 6.0, 9.0, 2.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6648788452148438, -0.6451873779296875, -0.6254959106445312, -0.605804443359375, -0.5861129760742188, -0.5664215087890625, -0.5467300415039062, -0.52703857421875, -0.5073471069335938, -0.4876556396484375, -0.46796417236328125, -0.448272705078125, -0.42858123779296875, -0.4088897705078125, -0.38919830322265625, -0.3695068359375, -0.34981536865234375, -0.3301239013671875, -0.31043243408203125, -0.290740966796875, -0.27104949951171875, -0.2513580322265625, -0.23166656494140625, -0.21197509765625, -0.19228363037109375, -0.1725921630859375, -0.15290069580078125, -0.133209228515625, -0.11351776123046875, -0.0938262939453125, -0.07413482666015625, -0.054443359375, -0.03475189208984375, -0.0150604248046875, 0.00463104248046875, 0.024322509765625, 0.04401397705078125, 0.0637054443359375, 0.08339691162109375, 0.10308837890625, 0.12277984619140625, 0.1424713134765625, 0.16216278076171875, 0.181854248046875, 0.20154571533203125, 0.2212371826171875, 0.24092864990234375, 0.2606201171875, 0.28031158447265625, 0.3000030517578125, 0.31969451904296875, 0.339385986328125, 0.35907745361328125, 0.3787689208984375, 0.39846038818359375, 0.41815185546875, 0.43784332275390625, 0.4575347900390625, 0.47722625732421875, 0.496917724609375, 0.5166091918945312, 0.5363006591796875, 0.5559921264648438, 0.57568359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 13.0, 19.0, 22.0, 45.0, 83.0, 120.0, 190.0, 184.0, 98.0, 83.0, 38.0, 24.0, 22.0, 13.0, 10.0, 12.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003020763397216797, -0.0002916567027568817, -0.00028123706579208374, -0.00027081742882728577, -0.0002603977918624878, -0.0002499781548976898, -0.00023955851793289185, -0.00022913888096809387, -0.0002187192440032959, -0.00020829960703849792, -0.00019787997007369995, -0.00018746033310890198, -0.000177040696144104, -0.00016662105917930603, -0.00015620142221450806, -0.00014578178524971008, -0.0001353621482849121, -0.00012494251132011414, -0.00011452287435531616, -0.00010410323739051819, -9.368360042572021e-05, -8.326396346092224e-05, -7.284432649612427e-05, -6.24246895313263e-05, -5.200505256652832e-05, -4.158541560173035e-05, -3.116577863693237e-05, -2.07461416721344e-05, -1.0326504707336426e-05, 9.313225746154785e-08, 1.0512769222259521e-05, 2.0932406187057495e-05, 3.135204315185547e-05, 4.177168011665344e-05, 5.2191317081451416e-05, 6.261095404624939e-05, 7.303059101104736e-05, 8.345022797584534e-05, 9.386986494064331e-05, 0.00010428950190544128, 0.00011470913887023926, 0.00012512877583503723, 0.0001355484127998352, 0.00014596804976463318, 0.00015638768672943115, 0.00016680732369422913, 0.0001772269606590271, 0.00018764659762382507, 0.00019806623458862305, 0.00020848587155342102, 0.000218905508518219, 0.00022932514548301697, 0.00023974478244781494, 0.0002501644194126129, 0.0002605840563774109, 0.00027100369334220886, 0.00028142333030700684, 0.0002918429672718048, 0.0003022626042366028, 0.00031268224120140076, 0.00032310187816619873, 0.0003335215151309967, 0.0003439411520957947, 0.00035436078906059265, 0.0003647804260253906]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 1.0, 5.0, 8.0, 17.0, 23.0, 38.0, 46.0, 76.0, 107.0, 220.0, 445.0, 968.0, 3615.0, 22006.0, 671845.0, 325755.0, 18197.0, 3147.0, 1018.0, 442.0, 213.0, 115.0, 87.0, 44.0, 29.0, 17.0, 14.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.927734375, -0.9026336669921875, -0.877532958984375, -0.8524322509765625, -0.82733154296875, -0.8022308349609375, -0.777130126953125, -0.7520294189453125, -0.7269287109375, -0.7018280029296875, -0.676727294921875, -0.6516265869140625, -0.62652587890625, -0.6014251708984375, -0.576324462890625, -0.5512237548828125, -0.526123046875, -0.5010223388671875, -0.475921630859375, -0.4508209228515625, -0.42572021484375, -0.4006195068359375, -0.375518798828125, -0.3504180908203125, -0.3253173828125, -0.3002166748046875, -0.275115966796875, -0.2500152587890625, -0.22491455078125, -0.1998138427734375, -0.174713134765625, -0.1496124267578125, -0.12451171875, -0.0994110107421875, -0.074310302734375, -0.0492095947265625, -0.02410888671875, 0.0009918212890625, 0.026092529296875, 0.0511932373046875, 0.0762939453125, 0.1013946533203125, 0.126495361328125, 0.1515960693359375, 0.17669677734375, 0.2017974853515625, 0.226898193359375, 0.2519989013671875, 0.277099609375, 0.3022003173828125, 0.327301025390625, 0.3524017333984375, 0.37750244140625, 0.4026031494140625, 0.427703857421875, 0.4528045654296875, 0.4779052734375, 0.5030059814453125, 0.528106689453125, 0.5532073974609375, 0.57830810546875, 0.6034088134765625, 0.628509521484375, 0.6536102294921875, 0.6787109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 7.0, 10.0, 15.0, 14.0, 21.0, 42.0, 35.0, 61.0, 84.0, 105.0, 103.0, 121.0, 93.0, 86.0, 54.0, 39.0, 30.0, 16.0, 12.0, 12.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6493377685546875, -0.631195068359375, -0.6130523681640625, -0.59490966796875, -0.5767669677734375, -0.558624267578125, -0.5404815673828125, -0.5223388671875, -0.5041961669921875, -0.486053466796875, -0.4679107666015625, -0.44976806640625, -0.4316253662109375, -0.413482666015625, -0.3953399658203125, -0.377197265625, -0.3590545654296875, -0.340911865234375, -0.3227691650390625, -0.30462646484375, -0.2864837646484375, -0.268341064453125, -0.2501983642578125, -0.2320556640625, -0.2139129638671875, -0.195770263671875, -0.1776275634765625, -0.15948486328125, -0.1413421630859375, -0.123199462890625, -0.1050567626953125, -0.0869140625, -0.0687713623046875, -0.050628662109375, -0.0324859619140625, -0.01434326171875, 0.0037994384765625, 0.021942138671875, 0.0400848388671875, 0.0582275390625, 0.0763702392578125, 0.094512939453125, 0.1126556396484375, 0.13079833984375, 0.1489410400390625, 0.167083740234375, 0.1852264404296875, 0.203369140625, 0.2215118408203125, 0.239654541015625, 0.2577972412109375, 0.27593994140625, 0.2940826416015625, 0.312225341796875, 0.3303680419921875, 0.3485107421875, 0.3666534423828125, 0.384796142578125, 0.4029388427734375, 0.42108154296875, 0.4392242431640625, 0.457366943359375, 0.4755096435546875, 0.49365234375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 14.0, 62.0, 433.0, 398.0, 74.0, 16.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.4105110168457, -45.120765686035156, -43.83102035522461, -42.54127502441406, -41.251529693603516, -39.96178436279297, -38.67203903198242, -37.382293701171875, -36.09254455566406, -34.802799224853516, -33.51305389404297, -32.22330856323242, -30.933563232421875, -29.643817901611328, -28.35407066345215, -27.0643253326416, -25.774581909179688, -24.48483657836914, -23.195091247558594, -21.905345916748047, -20.6156005859375, -19.325855255126953, -18.036108016967773, -16.746362686157227, -15.45661735534668, -14.166872024536133, -12.877126693725586, -11.587380409240723, -10.297635078430176, -9.007889747619629, -7.718143939971924, -6.428398132324219, -5.1386566162109375, -3.8489110469818115, -2.5591654777526855, -1.2694199085235596, 0.020325660705566406, 1.3100709915161133, 2.5998167991638184, 3.8895626068115234, 5.17930793762207, 6.469053268432617, 7.758799076080322, 9.048544883728027, 10.338290214538574, 11.628035545349121, 12.917781829833984, 14.207527160644531, 15.497272491455078, 16.787017822265625, 18.076763153076172, 19.36650848388672, 20.656253814697266, 21.945999145507812, 23.235746383666992, 24.52549171447754, 25.815237045288086, 27.104982376098633, 28.39472770690918, 29.684473037719727, 30.974220275878906, 32.26396560668945, 33.5537109375, 34.84345626831055, 36.133201599121094]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 10.0, 10.0, 17.0, 18.0, 22.0, 18.0, 25.0, 44.0, 30.0, 20.0, 38.0, 53.0, 168.0, 168.0, 54.0, 44.0, 34.0, 24.0, 27.0, 18.0, 33.0, 17.0, 13.0, 11.0, 12.0, 15.0, 9.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53750991821289, -11.177508354187012, -10.81750774383545, -10.45750617980957, -10.097505569458008, -9.737504005432129, -9.37750244140625, -9.017501831054688, -8.657500267028809, -8.29749870300293, -7.937498092651367, -7.577496528625488, -7.217495441436768, -6.857494354248047, -6.497493267059326, -6.1374921798706055, -5.777491092681885, -5.417490005493164, -5.057488918304443, -4.697487831115723, -4.337486267089844, -3.977485179901123, -3.6174840927124023, -3.2574827671051025, -2.897481679916382, -2.537480592727661, -2.1774792671203613, -1.8174781799316406, -1.4574769735336304, -1.0974757671356201, -0.7374746799468994, -0.3774733543395996, -0.017472267150878906, 0.34252890944480896, 0.7025300860404968, 1.0625312328338623, 1.4225324392318726, 1.7825336456298828, 2.1425347328186035, 2.5025360584259033, 2.862537145614624, 3.2225382328033447, 3.5825395584106445, 3.9425406455993652, 4.302541732788086, 4.662543296813965, 5.022543907165527, 5.382545471191406, 5.742546558380127, 6.102547645568848, 6.462548732757568, 6.822549819946289, 7.182551383972168, 7.542552471160889, 7.902553558349609, 8.262555122375488, 8.62255573272705, 8.98255729675293, 9.342557907104492, 9.702559471130371, 10.062560081481934, 10.422561645507812, 10.782562255859375, 11.142563819885254, 11.502565383911133]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 12.0, 14.0, 29.0, 46.0, 101.0, 148.0, 320.0, 637.0, 1469.0, 3992.0, 13599.0, 77161.0, 894439.0, 2717211.0, 432710.0, 38969.0, 8289.0, 2832.0, 1146.0, 552.0, 260.0, 146.0, 79.0, 58.0, 31.0, 16.0, 11.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.904296875, -0.85986328125, -0.8154296875, -0.77099609375, -0.7265625, -0.68212890625, -0.6376953125, -0.59326171875, -0.548828125, -0.50439453125, -0.4599609375, -0.41552734375, -0.37109375, -0.32666015625, -0.2822265625, -0.23779296875, -0.193359375, -0.14892578125, -0.1044921875, -0.06005859375, -0.015625, 0.02880859375, 0.0732421875, 0.11767578125, 0.162109375, 0.20654296875, 0.2509765625, 0.29541015625, 0.33984375, 0.38427734375, 0.4287109375, 0.47314453125, 0.517578125, 0.56201171875, 0.6064453125, 0.65087890625, 0.6953125, 0.73974609375, 0.7841796875, 0.82861328125, 0.873046875, 0.91748046875, 0.9619140625, 1.00634765625, 1.05078125, 1.09521484375, 1.1396484375, 1.18408203125, 1.228515625, 1.27294921875, 1.3173828125, 1.36181640625, 1.40625, 1.45068359375, 1.4951171875, 1.53955078125, 1.583984375, 1.62841796875, 1.6728515625, 1.71728515625, 1.76171875, 1.80615234375, 1.8505859375, 1.89501953125, 1.939453125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 8.0, 12.0, 11.0, 22.0, 20.0, 32.0, 35.0, 41.0, 57.0, 55.0, 57.0, 53.0, 61.0, 62.0, 50.0, 76.0, 52.0, 44.0, 46.0, 47.0, 30.0, 21.0, 18.0, 21.0, 17.0, 13.0, 6.0, 6.0, 11.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.495880126953125, -0.47027587890625, -0.444671630859375, -0.4190673828125, -0.393463134765625, -0.36785888671875, -0.342254638671875, -0.316650390625, -0.291046142578125, -0.26544189453125, -0.239837646484375, -0.2142333984375, -0.188629150390625, -0.16302490234375, -0.137420654296875, -0.11181640625, -0.086212158203125, -0.06060791015625, -0.035003662109375, -0.0093994140625, 0.016204833984375, 0.04180908203125, 0.067413330078125, 0.093017578125, 0.118621826171875, 0.14422607421875, 0.169830322265625, 0.1954345703125, 0.221038818359375, 0.24664306640625, 0.272247314453125, 0.2978515625, 0.323455810546875, 0.34906005859375, 0.374664306640625, 0.4002685546875, 0.425872802734375, 0.45147705078125, 0.477081298828125, 0.502685546875, 0.528289794921875, 0.55389404296875, 0.579498291015625, 0.6051025390625, 0.630706787109375, 0.65631103515625, 0.681915283203125, 0.70751953125, 0.733123779296875, 0.75872802734375, 0.784332275390625, 0.8099365234375, 0.835540771484375, 0.86114501953125, 0.886749267578125, 0.912353515625, 0.937957763671875, 0.96356201171875, 0.989166259765625, 1.0147705078125, 1.040374755859375, 1.06597900390625, 1.091583251953125, 1.1171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 2.0, 2.0, 15.0, 45.0, 66.0, 127.0, 352.0, 868.0, 4737.0, 4020751.0, 163389.0, 2654.0, 691.0, 290.0, 143.0, 58.0, 34.0, 18.0, 12.0, 10.0, 4.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.07421875, -6.80047607421875, -6.5267333984375, -6.25299072265625, -5.979248046875, -5.70550537109375, -5.4317626953125, -5.15802001953125, -4.88427734375, -4.61053466796875, -4.3367919921875, -4.06304931640625, -3.789306640625, -3.51556396484375, -3.2418212890625, -2.96807861328125, -2.6943359375, -2.42059326171875, -2.1468505859375, -1.87310791015625, -1.599365234375, -1.32562255859375, -1.0518798828125, -0.77813720703125, -0.50439453125, -0.23065185546875, 0.0430908203125, 0.31683349609375, 0.590576171875, 0.86431884765625, 1.1380615234375, 1.41180419921875, 1.685546875, 1.95928955078125, 2.2330322265625, 2.50677490234375, 2.780517578125, 3.05426025390625, 3.3280029296875, 3.60174560546875, 3.87548828125, 4.14923095703125, 4.4229736328125, 4.69671630859375, 4.970458984375, 5.24420166015625, 5.5179443359375, 5.79168701171875, 6.0654296875, 6.33917236328125, 6.6129150390625, 6.88665771484375, 7.160400390625, 7.43414306640625, 7.7078857421875, 7.98162841796875, 8.25537109375, 8.52911376953125, 8.8028564453125, 9.07659912109375, 9.350341796875, 9.62408447265625, 9.8978271484375, 10.17156982421875, 10.4453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 21.0, 22.0, 49.0, 102.0, 199.0, 490.0, 1291.0, 1087.0, 430.0, 179.0, 99.0, 48.0, 25.0, 19.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.90557861328125, -1.7681884765625, -1.63079833984375, -1.493408203125, -1.35601806640625, -1.2186279296875, -1.08123779296875, -0.94384765625, -0.80645751953125, -0.6690673828125, -0.53167724609375, -0.394287109375, -0.25689697265625, -0.1195068359375, 0.01788330078125, 0.1552734375, 0.29266357421875, 0.4300537109375, 0.56744384765625, 0.704833984375, 0.84222412109375, 0.9796142578125, 1.11700439453125, 1.25439453125, 1.39178466796875, 1.5291748046875, 1.66656494140625, 1.803955078125, 1.94134521484375, 2.0787353515625, 2.21612548828125, 2.353515625, 2.49090576171875, 2.6282958984375, 2.76568603515625, 2.903076171875, 3.04046630859375, 3.1778564453125, 3.31524658203125, 3.45263671875, 3.59002685546875, 3.7274169921875, 3.86480712890625, 4.002197265625, 4.13958740234375, 4.2769775390625, 4.41436767578125, 4.5517578125, 4.68914794921875, 4.8265380859375, 4.96392822265625, 5.101318359375, 5.23870849609375, 5.3760986328125, 5.51348876953125, 5.65087890625, 5.78826904296875, 5.9256591796875, 6.06304931640625, 6.200439453125, 6.33782958984375, 6.4752197265625, 6.61260986328125, 6.75]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 6.0, 10.0, 10.0, 22.0, 54.0, 119.0, 240.0, 236.0, 150.0, 66.0, 34.0, 15.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.86121940612793, -14.803691864013672, -13.746164321899414, -12.68863582611084, -11.631108283996582, -10.573580741882324, -9.51605224609375, -8.458524703979492, -7.400997161865234, -6.343469619750977, -5.2859416007995605, -4.2284135818481445, -3.1708860397338867, -2.113358497619629, -1.055830478668213, 0.001697540283203125, 1.059225082397461, 2.116752862930298, 3.1742806434631348, 4.231808662414551, 5.289336204528809, 6.346863746643066, 7.404391765594482, 8.461919784545898, 9.519447326660156, 10.576974868774414, 11.634502410888672, 12.692030906677246, 13.749558448791504, 14.807085990905762, 15.864614486694336, 16.922142028808594, 17.97966766357422, 19.037195205688477, 20.094722747802734, 21.152250289916992, 22.20977783203125, 23.26730728149414, 24.3248348236084, 25.382362365722656, 26.439889907836914, 27.497417449951172, 28.55494499206543, 29.612472534179688, 30.670001983642578, 31.727527618408203, 32.785057067871094, 33.84258270263672, 34.90011215209961, 35.9576416015625, 37.015167236328125, 38.072696685791016, 39.13022232055664, 40.18775177001953, 41.245277404785156, 42.30280685424805, 43.36033630371094, 44.41786575317383, 45.47539138793945, 46.532920837402344, 47.59044647216797, 48.64797592163086, 49.705501556396484, 50.763031005859375, 51.820556640625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 8.0, 12.0, 9.0, 11.0, 18.0, 24.0, 25.0, 39.0, 27.0, 26.0, 28.0, 38.0, 38.0, 44.0, 55.0, 43.0, 59.0, 59.0, 68.0, 39.0, 54.0, 44.0, 32.0, 25.0, 31.0, 26.0, 22.0, 15.0, 12.0, 9.0, 7.0, 8.0, 6.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.595611572265625, -12.182685852050781, -11.769760131835938, -11.356834411621094, -10.94390869140625, -10.530982971191406, -10.118057250976562, -9.705131530761719, -9.292205810546875, -8.879280090332031, -8.466354370117188, -8.053428649902344, -7.6405029296875, -7.227577209472656, -6.814651966094971, -6.401726245880127, -5.988801002502441, -5.575875282287598, -5.162949562072754, -4.75002384185791, -4.337098121643066, -3.9241726398468018, -3.511247158050537, -3.0983214378356934, -2.6853957176208496, -2.272469997406006, -1.8595443964004517, -1.4466187953948975, -1.0336930751800537, -0.62076735496521, -0.2078418731689453, 0.20508384704589844, 0.6180095672607422, 1.030935287475586, 1.4438608884811401, 1.8567864894866943, 2.269712209701538, 2.682637929916382, 3.0955634117126465, 3.5084891319274902, 3.921414852142334, 4.334340572357178, 4.7472662925720215, 5.160191535949707, 5.573117256164551, 5.9860429763793945, 6.398968696594238, 6.811894416809082, 7.224820137023926, 7.6377458572387695, 8.050671577453613, 8.463597297668457, 8.8765230178833, 9.289448738098145, 9.702373504638672, 10.115299224853516, 10.52822494506836, 10.941150665283203, 11.354076385498047, 11.76700210571289, 12.179927825927734, 12.592853546142578, 13.005779266357422, 13.418704986572266, 13.83163070678711]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 5.0, 6.0, 15.0, 23.0, 27.0, 38.0, 64.0, 87.0, 155.0, 235.0, 459.0, 945.0, 1814.0, 4016.0, 9942.0, 29436.0, 120252.0, 633944.0, 185110.0, 39750.0, 12679.0, 4992.0, 2167.0, 1037.0, 572.0, 300.0, 187.0, 96.0, 60.0, 38.0, 33.0, 23.0, 15.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5228118896484375, -1.471405029296875, -1.4199981689453125, -1.36859130859375, -1.3171844482421875, -1.265777587890625, -1.2143707275390625, -1.1629638671875, -1.1115570068359375, -1.060150146484375, -1.0087432861328125, -0.95733642578125, -0.9059295654296875, -0.854522705078125, -0.8031158447265625, -0.751708984375, -0.7003021240234375, -0.648895263671875, -0.5974884033203125, -0.54608154296875, -0.4946746826171875, -0.443267822265625, -0.3918609619140625, -0.3404541015625, -0.2890472412109375, -0.237640380859375, -0.1862335205078125, -0.13482666015625, -0.0834197998046875, -0.032012939453125, 0.0193939208984375, 0.07080078125, 0.1222076416015625, 0.173614501953125, 0.2250213623046875, 0.27642822265625, 0.3278350830078125, 0.379241943359375, 0.4306488037109375, 0.4820556640625, 0.5334625244140625, 0.584869384765625, 0.6362762451171875, 0.68768310546875, 0.7390899658203125, 0.790496826171875, 0.8419036865234375, 0.893310546875, 0.9447174072265625, 0.996124267578125, 1.0475311279296875, 1.09893798828125, 1.1503448486328125, 1.201751708984375, 1.2531585693359375, 1.3045654296875, 1.3559722900390625, 1.407379150390625, 1.4587860107421875, 1.51019287109375, 1.5615997314453125, 1.613006591796875, 1.6644134521484375, 1.7158203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 19.0, 21.0, 17.0, 21.0, 18.0, 37.0, 27.0, 43.0, 53.0, 55.0, 70.0, 59.0, 69.0, 60.0, 60.0, 34.0, 50.0, 46.0, 49.0, 27.0, 23.0, 26.0, 19.0, 18.0, 12.0, 9.0, 8.0, 7.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.86669921875, -0.8351211547851562, -0.8035430908203125, -0.7719650268554688, -0.740386962890625, -0.7088088989257812, -0.6772308349609375, -0.6456527709960938, -0.61407470703125, -0.5824966430664062, -0.5509185791015625, -0.5193405151367188, -0.487762451171875, -0.45618438720703125, -0.4246063232421875, -0.39302825927734375, -0.3614501953125, -0.32987213134765625, -0.2982940673828125, -0.26671600341796875, -0.235137939453125, -0.20355987548828125, -0.1719818115234375, -0.14040374755859375, -0.10882568359375, -0.07724761962890625, -0.0456695556640625, -0.01409149169921875, 0.017486572265625, 0.04906463623046875, 0.0806427001953125, 0.11222076416015625, 0.143798828125, 0.17537689208984375, 0.2069549560546875, 0.23853302001953125, 0.270111083984375, 0.30168914794921875, 0.3332672119140625, 0.36484527587890625, 0.39642333984375, 0.42800140380859375, 0.4595794677734375, 0.49115753173828125, 0.522735595703125, 0.5543136596679688, 0.5858917236328125, 0.6174697875976562, 0.6490478515625, 0.6806259155273438, 0.7122039794921875, 0.7437820434570312, 0.775360107421875, 0.8069381713867188, 0.8385162353515625, 0.8700942993164062, 0.90167236328125, 0.9332504272460938, 0.9648284912109375, 0.9964065551757812, 1.027984619140625, 1.0595626831054688, 1.0911407470703125, 1.1227188110351562, 1.154296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 8.0, 7.0, 18.0, 27.0, 40.0, 55.0, 83.0, 134.0, 255.0, 495.0, 1294.0, 5068.0, 61670.0, 949746.0, 24940.0, 3000.0, 870.0, 351.0, 173.0, 93.0, 55.0, 38.0, 22.0, 20.0, 17.0, 12.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.45001220703125, -3.3433837890625, -3.23675537109375, -3.130126953125, -3.02349853515625, -2.9168701171875, -2.81024169921875, -2.70361328125, -2.59698486328125, -2.4903564453125, -2.38372802734375, -2.277099609375, -2.17047119140625, -2.0638427734375, -1.95721435546875, -1.8505859375, -1.74395751953125, -1.6373291015625, -1.53070068359375, -1.424072265625, -1.31744384765625, -1.2108154296875, -1.10418701171875, -0.99755859375, -0.89093017578125, -0.7843017578125, -0.67767333984375, -0.571044921875, -0.46441650390625, -0.3577880859375, -0.25115966796875, -0.14453125, -0.03790283203125, 0.0687255859375, 0.17535400390625, 0.281982421875, 0.38861083984375, 0.4952392578125, 0.60186767578125, 0.70849609375, 0.81512451171875, 0.9217529296875, 1.02838134765625, 1.135009765625, 1.24163818359375, 1.3482666015625, 1.45489501953125, 1.5615234375, 1.66815185546875, 1.7747802734375, 1.88140869140625, 1.988037109375, 2.09466552734375, 2.2012939453125, 2.30792236328125, 2.41455078125, 2.52117919921875, 2.6278076171875, 2.73443603515625, 2.841064453125, 2.94769287109375, 3.0543212890625, 3.16094970703125, 3.267578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 8.0, 6.0, 12.0, 5.0, 10.0, 15.0, 12.0, 12.0, 16.0, 24.0, 30.0, 33.0, 33.0, 32.0, 51.0, 46.0, 65.0, 63.0, 71.0, 76.0, 61.0, 50.0, 45.0, 36.0, 29.0, 24.0, 24.0, 14.0, 12.0, 15.0, 17.0, 8.0, 11.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.213348388671875, -3.10052490234375, -2.987701416015625, -2.8748779296875, -2.762054443359375, -2.64923095703125, -2.536407470703125, -2.423583984375, -2.310760498046875, -2.19793701171875, -2.085113525390625, -1.9722900390625, -1.859466552734375, -1.74664306640625, -1.633819580078125, -1.52099609375, -1.408172607421875, -1.29534912109375, -1.182525634765625, -1.0697021484375, -0.956878662109375, -0.84405517578125, -0.731231689453125, -0.618408203125, -0.505584716796875, -0.39276123046875, -0.279937744140625, -0.1671142578125, -0.054290771484375, 0.05853271484375, 0.171356201171875, 0.2841796875, 0.397003173828125, 0.50982666015625, 0.622650146484375, 0.7354736328125, 0.848297119140625, 0.96112060546875, 1.073944091796875, 1.186767578125, 1.299591064453125, 1.41241455078125, 1.525238037109375, 1.6380615234375, 1.750885009765625, 1.86370849609375, 1.976531982421875, 2.08935546875, 2.202178955078125, 2.31500244140625, 2.427825927734375, 2.5406494140625, 2.653472900390625, 2.76629638671875, 2.879119873046875, 2.991943359375, 3.104766845703125, 3.21759033203125, 3.330413818359375, 3.4432373046875, 3.556060791015625, 3.66888427734375, 3.781707763671875, 3.89453125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 13.0, 14.0, 21.0, 24.0, 37.0, 49.0, 96.0, 274.0, 692.0, 3021.0, 46940.0, 983604.0, 11363.0, 1563.0, 389.0, 189.0, 91.0, 61.0, 19.0, 19.0, 12.0, 11.0, 12.0, 3.0, 6.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.125, -1.085235595703125, -1.04547119140625, -1.005706787109375, -0.9659423828125, -0.926177978515625, -0.88641357421875, -0.846649169921875, -0.806884765625, -0.767120361328125, -0.72735595703125, -0.687591552734375, -0.6478271484375, -0.608062744140625, -0.56829833984375, -0.528533935546875, -0.48876953125, -0.449005126953125, -0.40924072265625, -0.369476318359375, -0.3297119140625, -0.289947509765625, -0.25018310546875, -0.210418701171875, -0.170654296875, -0.130889892578125, -0.09112548828125, -0.051361083984375, -0.0115966796875, 0.028167724609375, 0.06793212890625, 0.107696533203125, 0.1474609375, 0.187225341796875, 0.22698974609375, 0.266754150390625, 0.3065185546875, 0.346282958984375, 0.38604736328125, 0.425811767578125, 0.465576171875, 0.505340576171875, 0.54510498046875, 0.584869384765625, 0.6246337890625, 0.664398193359375, 0.70416259765625, 0.743927001953125, 0.78369140625, 0.823455810546875, 0.86322021484375, 0.902984619140625, 0.9427490234375, 0.982513427734375, 1.02227783203125, 1.062042236328125, 1.101806640625, 1.141571044921875, 1.18133544921875, 1.221099853515625, 1.2608642578125, 1.300628662109375, 1.34039306640625, 1.380157470703125, 1.419921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 14.0, 27.0, 24.0, 39.0, 74.0, 132.0, 185.0, 166.0, 105.0, 69.0, 41.0, 15.0, 21.0, 16.0, 14.0, 13.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000247955322265625, -0.00024062395095825195, -0.0002332925796508789, -0.00022596120834350586, -0.0002186298370361328, -0.00021129846572875977, -0.00020396709442138672, -0.00019663572311401367, -0.00018930435180664062, -0.00018197298049926758, -0.00017464160919189453, -0.00016731023788452148, -0.00015997886657714844, -0.0001526474952697754, -0.00014531612396240234, -0.0001379847526550293, -0.00013065338134765625, -0.0001233220100402832, -0.00011599063873291016, -0.00010865926742553711, -0.00010132789611816406, -9.399652481079102e-05, -8.666515350341797e-05, -7.933378219604492e-05, -7.200241088867188e-05, -6.467103958129883e-05, -5.733966827392578e-05, -5.0008296966552734e-05, -4.267692565917969e-05, -3.534555435180664e-05, -2.8014183044433594e-05, -2.0682811737060547e-05, -1.33514404296875e-05, -6.020069122314453e-06, 1.3113021850585938e-06, 8.64267349243164e-06, 1.5974044799804688e-05, 2.3305416107177734e-05, 3.063678741455078e-05, 3.796815872192383e-05, 4.5299530029296875e-05, 5.263090133666992e-05, 5.996227264404297e-05, 6.729364395141602e-05, 7.462501525878906e-05, 8.195638656616211e-05, 8.928775787353516e-05, 9.66191291809082e-05, 0.00010395050048828125, 0.0001112818717956543, 0.00011861324310302734, 0.0001259446144104004, 0.00013327598571777344, 0.00014060735702514648, 0.00014793872833251953, 0.00015527009963989258, 0.00016260147094726562, 0.00016993284225463867, 0.00017726421356201172, 0.00018459558486938477, 0.0001919269561767578, 0.00019925832748413086, 0.0002065896987915039, 0.00021392107009887695, 0.00022125244140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 9.0, 15.0, 34.0, 54.0, 81.0, 159.0, 427.0, 1240.0, 5265.0, 59267.0, 952863.0, 24311.0, 3284.0, 919.0, 297.0, 144.0, 64.0, 36.0, 25.0, 14.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6846847534179688, -0.6613616943359375, -0.6380386352539062, -0.614715576171875, -0.5913925170898438, -0.5680694580078125, -0.5447463989257812, -0.52142333984375, -0.49810028076171875, -0.4747772216796875, -0.45145416259765625, -0.428131103515625, -0.40480804443359375, -0.3814849853515625, -0.35816192626953125, -0.3348388671875, -0.31151580810546875, -0.2881927490234375, -0.26486968994140625, -0.241546630859375, -0.21822357177734375, -0.1949005126953125, -0.17157745361328125, -0.14825439453125, -0.12493133544921875, -0.1016082763671875, -0.07828521728515625, -0.054962158203125, -0.03163909912109375, -0.0083160400390625, 0.01500701904296875, 0.038330078125, 0.06165313720703125, 0.0849761962890625, 0.10829925537109375, 0.131622314453125, 0.15494537353515625, 0.1782684326171875, 0.20159149169921875, 0.22491455078125, 0.24823760986328125, 0.2715606689453125, 0.29488372802734375, 0.318206787109375, 0.34152984619140625, 0.3648529052734375, 0.38817596435546875, 0.4114990234375, 0.43482208251953125, 0.4581451416015625, 0.48146820068359375, 0.504791259765625, 0.5281143188476562, 0.5514373779296875, 0.5747604370117188, 0.59808349609375, 0.6214065551757812, 0.6447296142578125, 0.6680526733398438, 0.691375732421875, 0.7146987915039062, 0.7380218505859375, 0.7613449096679688, 0.78466796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 10.0, 7.0, 13.0, 16.0, 17.0, 35.0, 47.0, 67.0, 88.0, 110.0, 125.0, 131.0, 75.0, 74.0, 44.0, 27.0, 25.0, 19.0, 12.0, 9.0, 14.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.6201171875, -0.603668212890625, -0.58721923828125, -0.570770263671875, -0.5543212890625, -0.537872314453125, -0.52142333984375, -0.504974365234375, -0.488525390625, -0.472076416015625, -0.45562744140625, -0.439178466796875, -0.4227294921875, -0.406280517578125, -0.38983154296875, -0.373382568359375, -0.35693359375, -0.340484619140625, -0.32403564453125, -0.307586669921875, -0.2911376953125, -0.274688720703125, -0.25823974609375, -0.241790771484375, -0.225341796875, -0.208892822265625, -0.19244384765625, -0.175994873046875, -0.1595458984375, -0.143096923828125, -0.12664794921875, -0.110198974609375, -0.09375, -0.077301025390625, -0.06085205078125, -0.044403076171875, -0.0279541015625, -0.011505126953125, 0.00494384765625, 0.021392822265625, 0.037841796875, 0.054290771484375, 0.07073974609375, 0.087188720703125, 0.1036376953125, 0.120086669921875, 0.13653564453125, 0.152984619140625, 0.16943359375, 0.185882568359375, 0.20233154296875, 0.218780517578125, 0.2352294921875, 0.251678466796875, 0.26812744140625, 0.284576416015625, 0.301025390625, 0.317474365234375, 0.33392333984375, 0.350372314453125, 0.3668212890625, 0.383270263671875, 0.39971923828125, 0.416168212890625, 0.4326171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 12.0, 58.0, 683.0, 209.0, 31.0, 13.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.34331130981445, -45.75852584838867, -44.173736572265625, -42.588951110839844, -41.00416564941406, -39.41938018798828, -37.834590911865234, -36.24980545043945, -34.665016174316406, -33.080230712890625, -31.49544334411621, -29.910655975341797, -28.325870513916016, -26.7410831451416, -25.156295776367188, -23.571510314941406, -21.986724853515625, -20.40193748474121, -18.81715202331543, -17.232364654541016, -15.647578239440918, -14.06279182434082, -12.478004455566406, -10.893218040466309, -9.308431625366211, -7.723645210266113, -6.138858318328857, -4.554071426391602, -2.969285011291504, -1.3844985961914062, 0.2002887725830078, 1.7850751876831055, 3.369861602783203, 4.954648017883301, 6.539434909820557, 8.124221801757812, 9.70900821685791, 11.293794631958008, 12.878582000732422, 14.46336841583252, 16.048154830932617, 17.63294219970703, 19.217727661132812, 20.802515029907227, 22.38730239868164, 23.972087860107422, 25.556875228881836, 27.14166259765625, 28.72644805908203, 30.311235427856445, 31.896020889282227, 33.48080825805664, 35.06559371948242, 36.65038299560547, 38.23516845703125, 39.81995391845703, 41.40473937988281, 42.989524841308594, 44.57431411743164, 46.15909957885742, 47.7438850402832, 49.32867431640625, 50.91345977783203, 52.49824523925781, 54.08303451538086]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 17.0, 20.0, 23.0, 38.0, 57.0, 65.0, 378.0, 166.0, 66.0, 43.0, 37.0, 27.0, 15.0, 12.0, 10.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.040874481201172, -9.316638946533203, -8.59240436553955, -7.868168830871582, -7.143933296203613, -6.419698238372803, -5.695463180541992, -4.971227645874023, -4.246992588043213, -3.5227572917938232, -2.7985219955444336, -2.074286937713623, -1.3500516414642334, -0.6258163452148438, 0.0984187126159668, 0.8226542472839355, 1.546889305114746, 2.2711246013641357, 2.9953598976135254, 3.719594955444336, 4.443830490112305, 5.168065547943115, 5.892300605773926, 6.6165361404418945, 7.340771198272705, 8.065006256103516, 8.789241790771484, 9.513477325439453, 10.237711906433105, 10.961947441101074, 11.686182022094727, 12.410417556762695, 13.134653091430664, 13.858888626098633, 14.583123207092285, 15.307358741760254, 16.031593322753906, 16.755828857421875, 17.480064392089844, 18.204299926757812, 18.92853546142578, 19.65277099609375, 20.37700653076172, 21.101242065429688, 21.825475692749023, 22.549711227416992, 23.27394676208496, 23.99818229675293, 24.722415924072266, 25.446651458740234, 26.170886993408203, 26.895122528076172, 27.619356155395508, 28.343591690063477, 29.067827224731445, 29.792062759399414, 30.516298294067383, 31.24053382873535, 31.96476936340332, 32.689002990722656, 33.413238525390625, 34.137474060058594, 34.86170959472656, 35.58594512939453, 36.3101806640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 9.0, 9.0, 14.0, 21.0, 32.0, 30.0, 44.0, 54.0, 47.0, 100.0, 342.0, 99.0, 40.0, 43.0, 37.0, 19.0, 18.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8437728881835938, -0.7983856201171875, -0.7529983520507812, -0.707611083984375, -0.6622238159179688, -0.6168365478515625, -0.5714492797851562, -0.52606201171875, -0.48067474365234375, -0.4352874755859375, -0.38990020751953125, -0.344512939453125, -0.29912567138671875, -0.2537384033203125, -0.20835113525390625, -0.1629638671875, -0.11757659912109375, -0.0721893310546875, -0.02680206298828125, 0.018585205078125, 0.06397247314453125, 0.1093597412109375, 0.15474700927734375, 0.20013427734375, 0.24552154541015625, 0.2909088134765625, 0.33629608154296875, 0.381683349609375, 0.42707061767578125, 0.4724578857421875, 0.5178451538085938, 0.563232421875, 0.6086196899414062, 0.6540069580078125, 0.6993942260742188, 0.744781494140625, 0.7901687622070312, 0.8355560302734375, 0.8809432983398438, 0.92633056640625, 0.9717178344726562, 1.0171051025390625, 1.0624923706054688, 1.107879638671875, 1.1532669067382812, 1.1986541748046875, 1.2440414428710938, 1.2894287109375, 1.3348159790039062, 1.3802032470703125, 1.4255905151367188, 1.470977783203125, 1.5163650512695312, 1.5617523193359375, 1.6071395874023438, 1.65252685546875, 1.6979141235351562, 1.7433013916015625, 1.7886886596679688, 1.834075927734375, 1.8794631958007812, 1.9248504638671875, 1.9702377319335938, 2.015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 7.0, 7.0, 0.0, 5.0, 16.0, 10.0, 27.0, 28.0, 65.0, 159.0, 823.0, 46812.0, 8339089.0, 1119.0, 205.0, 84.0, 50.0, 28.0, 11.0, 8.0, 8.0, 3.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.296606063842773, -26.54012680053711, -25.783649444580078, -25.027170181274414, -24.270692825317383, -23.51421356201172, -22.757736206054688, -22.001256942749023, -21.24477767944336, -20.488298416137695, -19.731821060180664, -18.975341796875, -18.21886444091797, -17.462385177612305, -16.70590591430664, -15.94942855834961, -15.192951202392578, -14.43647289276123, -13.679994583129883, -12.923515319824219, -12.167037963867188, -11.410558700561523, -10.654080390930176, -9.897602081298828, -9.14112377166748, -8.384645462036133, -7.628167152404785, -6.871688365936279, -6.115210056304932, -5.358731746673584, -4.602252960205078, -3.8457746505737305, -3.08929443359375, -2.3328161239624023, -1.5763375759124756, -0.8198590278625488, -0.06338071823120117, 0.6930975914001465, 1.4495763778686523, 2.2060546875, 2.9625329971313477, 3.7190113067626953, 4.475489616394043, 5.231968402862549, 5.9884467124938965, 6.744925022125244, 7.50140380859375, 8.257882118225098, 9.014360427856445, 9.770838737487793, 10.52731704711914, 11.283796310424805, 12.040273666381836, 12.7967529296875, 13.553231239318848, 14.309709548950195, 15.066187858581543, 15.82266616821289, 16.579145431518555, 17.335622787475586, 18.09210205078125, 18.84857940673828, 19.605058670043945, 20.36153793334961, 21.11801528930664]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 6.0, 6.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.687347412109375, -26.179248809814453, -25.671152114868164, -25.163053512573242, -24.65495491027832, -24.14685821533203, -23.63875961303711, -23.130661010742188, -22.622562408447266, -22.114463806152344, -21.606367111206055, -21.098268508911133, -20.59016990661621, -20.082073211669922, -19.573974609375, -19.065876007080078, -18.55777931213379, -18.049680709838867, -17.541584014892578, -17.033485412597656, -16.525386810302734, -16.017288208007812, -15.509191513061523, -15.001092910766602, -14.492995262145996, -13.98489761352539, -13.476799011230469, -12.968701362609863, -12.460603713989258, -11.952505111694336, -11.44440746307373, -10.936309814453125, -10.428211212158203, -9.920113563537598, -9.412014961242676, -8.90391731262207, -8.395818710327148, -7.887721061706543, -7.3796234130859375, -6.871525287628174, -6.363426685333252, -5.855328559875488, -5.347230911254883, -4.839132785797119, -4.3310346603393555, -3.822936534881592, -3.3148386478424072, -2.8067407608032227, -2.298642635345459, -1.7905446290969849, -1.2824466228485107, -0.7743486166000366, -0.2662506103515625, 0.24184751510620117, 0.7499454021453857, 1.2580432891845703, 1.766141414642334, 2.2742395401000977, 2.7823374271392822, 3.290435314178467, 3.7985334396362305, 4.306631565093994, 4.814729690551758, 5.322827339172363, 5.830925464630127]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 12.0, 9.0, 22.0, 27.0, 30.0, 46.0, 79.0, 91.0, 166.0, 255.0, 445.0, 891.0, 1928.0, 4929.0, 15850.0, 62754.0, 236602.0, 146543.0, 35313.0, 10472.0, 4020.0, 1760.0, 887.0, 430.0, 266.0, 156.0, 83.0, 64.0, 46.0, 28.0, 20.0, 11.0, 8.0, 6.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.3984375, -9.15606689453125, -8.9136962890625, -8.67132568359375, -8.428955078125, -8.18658447265625, -7.9442138671875, -7.70184326171875, -7.45947265625, -7.21710205078125, -6.9747314453125, -6.73236083984375, -6.489990234375, -6.24761962890625, -6.0052490234375, -5.76287841796875, -5.5205078125, -5.27813720703125, -5.0357666015625, -4.79339599609375, -4.551025390625, -4.30865478515625, -4.0662841796875, -3.82391357421875, -3.58154296875, -3.33917236328125, -3.0968017578125, -2.85443115234375, -2.612060546875, -2.36968994140625, -2.1273193359375, -1.88494873046875, -1.642578125, -1.40020751953125, -1.1578369140625, -0.91546630859375, -0.673095703125, -0.43072509765625, -0.1883544921875, 0.05401611328125, 0.29638671875, 0.53875732421875, 0.7811279296875, 1.02349853515625, 1.265869140625, 1.50823974609375, 1.7506103515625, 1.99298095703125, 2.2353515625, 2.47772216796875, 2.7200927734375, 2.96246337890625, 3.204833984375, 3.44720458984375, 3.6895751953125, 3.93194580078125, 4.17431640625, 4.41668701171875, 4.6590576171875, 4.90142822265625, 5.143798828125, 5.38616943359375, 5.6285400390625, 5.87091064453125, 6.11328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 9.0, 5.0, 11.0, 29.0, 26.0, 49.0, 72.0, 97.0, 93.0, 139.0, 121.0, 109.0, 61.0, 44.0, 34.0, 27.0, 15.0, 15.0, 12.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.480316162109375, -1.42156982421875, -1.362823486328125, -1.3040771484375, -1.245330810546875, -1.18658447265625, -1.127838134765625, -1.069091796875, -1.010345458984375, -0.95159912109375, -0.892852783203125, -0.8341064453125, -0.775360107421875, -0.71661376953125, -0.657867431640625, -0.59912109375, -0.540374755859375, -0.48162841796875, -0.422882080078125, -0.3641357421875, -0.305389404296875, -0.24664306640625, -0.187896728515625, -0.129150390625, -0.070404052734375, -0.01165771484375, 0.047088623046875, 0.1058349609375, 0.164581298828125, 0.22332763671875, 0.282073974609375, 0.3408203125, 0.399566650390625, 0.45831298828125, 0.517059326171875, 0.5758056640625, 0.634552001953125, 0.69329833984375, 0.752044677734375, 0.810791015625, 0.869537353515625, 0.92828369140625, 0.987030029296875, 1.0457763671875, 1.104522705078125, 1.16326904296875, 1.222015380859375, 1.28076171875, 1.339508056640625, 1.39825439453125, 1.457000732421875, 1.5157470703125, 1.574493408203125, 1.63323974609375, 1.691986083984375, 1.750732421875, 1.809478759765625, 1.86822509765625, 1.926971435546875, 1.9857177734375, 2.044464111328125, 2.10321044921875, 2.161956787109375, 2.220703125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 7.0, 7.0, 10.0, 11.0, 15.0, 26.0, 65.0, 115.0, 104.0, 55.0, 28.0, 12.0, 11.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.74677848815918, -11.425983428955078, -11.105188369750977, -10.784393310546875, -10.463598251342773, -10.142803192138672, -9.82200813293457, -9.501213073730469, -9.180418014526367, -8.859622955322266, -8.538827896118164, -8.218032836914062, -7.897237777709961, -7.576442718505859, -7.255647659301758, -6.934852600097656, -6.614058017730713, -6.293262958526611, -5.97246789932251, -5.651672840118408, -5.330877780914307, -5.010082721710205, -4.689288139343262, -4.36849308013916, -4.047698020935059, -3.726902961730957, -3.4061079025268555, -3.085312843322754, -2.7645177841186523, -2.443722724914551, -2.1229279041290283, -1.8021328449249268, -1.481337547302246, -1.1605424880981445, -0.8397474884986877, -0.518952488899231, -0.1981574296951294, 0.12263762950897217, 0.4434325695037842, 0.7642276287078857, 1.0850226879119873, 1.4058177471160889, 1.7266128063201904, 2.047407627105713, 2.3682026863098145, 2.688997745513916, 3.0097928047180176, 3.330587863922119, 3.6513829231262207, 3.9721779823303223, 4.292973041534424, 4.613768100738525, 4.934563159942627, 5.2553582191467285, 5.576152801513672, 5.896947860717773, 6.217742919921875, 6.538537979125977, 6.859333038330078, 7.18012809753418, 7.500923156738281, 7.821718215942383, 8.142513275146484, 8.463308334350586, 8.784103393554688]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 4.0, 3.0, 11.0, 6.0, 6.0, 9.0, 14.0, 28.0, 63.0, 85.0, 102.0, 69.0, 34.0, 17.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.045466423034668, -6.832422256469727, -6.619378089904785, -6.406333923339844, -6.193289279937744, -5.980245113372803, -5.767200946807861, -5.55415678024292, -5.3411126136779785, -5.128068447113037, -4.915024280548096, -4.701979637145996, -4.488935470581055, -4.275891304016113, -4.062847137451172, -3.8498029708862305, -3.63675856590271, -3.4237143993377686, -3.210669994354248, -2.9976258277893066, -2.7845816612243652, -2.571537494659424, -2.3584930896759033, -2.145448923110962, -1.932404637336731, -1.7193603515625, -1.5063161849975586, -1.2932718992233276, -1.0802276134490967, -0.8671834468841553, -0.6541391611099243, -0.4410949945449829, -0.22805070877075195, -0.015006467700004578, 0.1980377733707428, 0.41108202934265137, 0.6241262555122375, 0.8371704816818237, 1.0502147674560547, 1.263258934020996, 1.476303219795227, 1.689347505569458, 1.9023916721343994, 2.11543607711792, 2.3284802436828613, 2.5415244102478027, 2.754568576812744, 2.9676127433776855, 3.180657148361206, 3.3937013149261475, 3.606745719909668, 3.8197898864746094, 4.032834053039551, 4.245878219604492, 4.458922386169434, 4.671966552734375, 4.885011196136475, 5.098055362701416, 5.311099529266357, 5.524144172668457, 5.737188339233398, 5.95023250579834, 6.163276672363281, 6.376320838928223, 6.589365005493164]}, "eval/loss": 4.16819953918457, "eval/wer": 1.9665807219357399, "eval/runtime": 794.4467, "eval/samples_per_second": 3.326, "eval/steps_per_second": 0.278, "train/train_runtime": 6757.0177, "train/train_samples_per_second": 4.223, "train/train_steps_per_second": 0.176, "train/total_flos": 0.0, "train/train_loss": 4.268135019066556} \ No newline at end of file +{"train/loss": 4.4211, "train/learning_rate": 5.805515239477504e-08, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 8059, "_timestamp": 1646074088, "_step": 1192, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 199.0, 773.0, 38.0, 3.0], "bins": [-638.4752197265625, -628.0576171875, -617.6399536132812, -607.2223510742188, -596.8046875, -586.3870849609375, -575.969482421875, -565.5518188476562, -555.1342163085938, -544.7166137695312, -534.2989501953125, -523.88134765625, -513.4636840820312, -503.04608154296875, -492.6284484863281, -482.2108154296875, -471.7931823730469, -461.37554931640625, -450.9579162597656, -440.5403137207031, -430.1226806640625, -419.7050476074219, -409.28741455078125, -398.8697814941406, -388.4521484375, -378.0345153808594, -367.61688232421875, -357.19927978515625, -346.7816467285156, -336.364013671875, -325.9463806152344, -315.52874755859375, -305.1111145019531, -294.6934814453125, -284.2758483886719, -273.8582458496094, -263.44061279296875, -253.02297973632812, -242.6053466796875, -232.18771362304688, -221.77011108398438, -211.35247802734375, -200.9348602294922, -190.51722717285156, -180.099609375, -169.68197631835938, -159.26434326171875, -148.84671020507812, -138.42909240722656, -128.01145935058594, -117.59384155273438, -107.17620849609375, -96.75858306884766, -86.34095764160156, -75.92332458496094, -65.50569915771484, -55.08807373046875, -44.670448303222656, -34.2528190612793, -23.83519172668457, -13.417564392089844, -2.99993896484375, 7.417690277099609, 17.83531951904297, 28.252946853637695]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 7.0, 4.0, 3.0, 2.0, 12.0, 7.0, 9.0, 10.0, 13.0, 26.0, 23.0, 22.0, 24.0, 29.0, 36.0, 37.0, 45.0, 33.0, 39.0, 37.0, 61.0, 51.0, 50.0, 48.0, 51.0, 46.0, 37.0, 24.0, 35.0, 21.0, 27.0, 20.0, 19.0, 14.0, 16.0, 12.0, 13.0, 11.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.6351318359375, -54.82221984863281, -53.009307861328125, -51.19639587402344, -49.383480072021484, -47.5705680847168, -45.75765609741211, -43.94474411010742, -42.13182830810547, -40.31891632080078, -38.506004333496094, -36.693092346191406, -34.88017654418945, -33.067264556884766, -31.254352569580078, -29.44144058227539, -27.628528594970703, -25.815616607666016, -24.002702713012695, -22.189790725708008, -20.376876831054688, -18.56396484375, -16.751052856445312, -14.938139915466309, -13.125226974487305, -11.3123140335083, -9.499401092529297, -7.686489105224609, -5.8735761642456055, -4.060663223266602, -2.247751235961914, -0.43483829498291016, 1.3780746459960938, 3.1909873485565186, 5.003900051116943, 6.816812515258789, 8.629725456237793, 10.442638397216797, 12.255550384521484, 14.068463325500488, 15.881376266479492, 17.69428825378418, 19.5072021484375, 21.320114135742188, 23.133026123046875, 24.945940017700195, 26.758852005004883, 28.571765899658203, 30.38467788696289, 32.19758987426758, 34.010501861572266, 35.82341766357422, 37.636329650878906, 39.449241638183594, 41.26215362548828, 43.07506561279297, 44.887977600097656, 46.700889587402344, 48.51380157470703, 50.32671356201172, 52.13962936401367, 53.95254135131836, 55.76545333862305, 57.578365325927734, 59.39128112792969]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 10.0, 12.0, 20.0, 15.0, 32.0, 45.0, 51.0, 46.0, 68.0, 78.0, 72.0, 86.0, 83.0, 89.0, 75.0, 51.0, 40.0, 31.0, 32.0, 19.0, 12.0, 10.0, 11.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.62652587890625, -9.3936767578125, -9.16082763671875, -8.927978515625, -8.69512939453125, -8.4622802734375, -8.22943115234375, -7.99658203125, -7.76373291015625, -7.5308837890625, -7.29803466796875, -7.065185546875, -6.83233642578125, -6.5994873046875, -6.36663818359375, -6.1337890625, -5.90093994140625, -5.6680908203125, -5.43524169921875, -5.202392578125, -4.96954345703125, -4.7366943359375, -4.50384521484375, -4.27099609375, -4.03814697265625, -3.8052978515625, -3.57244873046875, -3.339599609375, -3.10675048828125, -2.8739013671875, -2.64105224609375, -2.408203125, -2.17535400390625, -1.9425048828125, -1.70965576171875, -1.476806640625, -1.24395751953125, -1.0111083984375, -0.77825927734375, -0.54541015625, -0.31256103515625, -0.0797119140625, 0.15313720703125, 0.385986328125, 0.61883544921875, 0.8516845703125, 1.08453369140625, 1.3173828125, 1.55023193359375, 1.7830810546875, 2.01593017578125, 2.248779296875, 2.48162841796875, 2.7144775390625, 2.94732666015625, 3.18017578125, 3.41302490234375, 3.6458740234375, 3.87872314453125, 4.111572265625, 4.34442138671875, 4.5772705078125, 4.81011962890625, 5.04296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4.0, 8.0, 11.0, 13.0, 29.0, 34.0, 72.0, 89.0, 139.0, 212.0, 396.0, 735.0, 1454.0, 3154.0, 9650.0, 51280.0, 1266920.0, 2726149.0, 110410.0, 15390.0, 4333.0, 1812.0, 835.0, 446.0, 255.0, 145.0, 110.0, 66.0, 56.0, 31.0, 17.0, 14.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.0, -21.4381103515625, -20.876220703125, -20.3143310546875, -19.75244140625, -19.1905517578125, -18.628662109375, -18.0667724609375, -17.5048828125, -16.9429931640625, -16.381103515625, -15.8192138671875, -15.25732421875, -14.6954345703125, -14.133544921875, -13.5716552734375, -13.009765625, -12.4478759765625, -11.885986328125, -11.3240966796875, -10.76220703125, -10.2003173828125, -9.638427734375, -9.0765380859375, -8.5146484375, -7.9527587890625, -7.390869140625, -6.8289794921875, -6.26708984375, -5.7052001953125, -5.143310546875, -4.5814208984375, -4.01953125, -3.4576416015625, -2.895751953125, -2.3338623046875, -1.77197265625, -1.2100830078125, -0.648193359375, -0.0863037109375, 0.4755859375, 1.0374755859375, 1.599365234375, 2.1612548828125, 2.72314453125, 3.2850341796875, 3.846923828125, 4.4088134765625, 4.970703125, 5.5325927734375, 6.094482421875, 6.6563720703125, 7.21826171875, 7.7801513671875, 8.342041015625, 8.9039306640625, 9.4658203125, 10.0277099609375, 10.589599609375, 11.1514892578125, 11.71337890625, 12.2752685546875, 12.837158203125, 13.3990478515625, 13.9609375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 10.0, 13.0, 11.0, 32.0, 53.0, 49.0, 112.0, 172.0, 272.0, 472.0, 830.0, 815.0, 513.0, 268.0, 172.0, 85.0, 60.0, 42.0, 24.0, 20.0, 11.0, 11.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.671875, -27.97314453125, -27.2744140625, -26.57568359375, -25.876953125, -25.17822265625, -24.4794921875, -23.78076171875, -23.08203125, -22.38330078125, -21.6845703125, -20.98583984375, -20.287109375, -19.58837890625, -18.8896484375, -18.19091796875, -17.4921875, -16.79345703125, -16.0947265625, -15.39599609375, -14.697265625, -13.99853515625, -13.2998046875, -12.60107421875, -11.90234375, -11.20361328125, -10.5048828125, -9.80615234375, -9.107421875, -8.40869140625, -7.7099609375, -7.01123046875, -6.3125, -5.61376953125, -4.9150390625, -4.21630859375, -3.517578125, -2.81884765625, -2.1201171875, -1.42138671875, -0.72265625, -0.02392578125, 0.6748046875, 1.37353515625, 2.072265625, 2.77099609375, 3.4697265625, 4.16845703125, 4.8671875, 5.56591796875, 6.2646484375, 6.96337890625, 7.662109375, 8.36083984375, 9.0595703125, 9.75830078125, 10.45703125, 11.15576171875, 11.8544921875, 12.55322265625, 13.251953125, 13.95068359375, 14.6494140625, 15.34814453125, 16.046875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 13.0, 24.0, 31.0, 84.0, 145.0, 272.0, 602.0, 1688.0, 19694.0, 4153828.0, 15221.0, 1551.0, 584.0, 232.0, 132.0, 58.0, 40.0, 22.0, 19.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -84.2548828125, -81.072265625, -77.8896484375, -74.70703125, -71.5244140625, -68.341796875, -65.1591796875, -61.9765625, -58.7939453125, -55.611328125, -52.4287109375, -49.24609375, -46.0634765625, -42.880859375, -39.6982421875, -36.515625, -33.3330078125, -30.150390625, -26.9677734375, -23.78515625, -20.6025390625, -17.419921875, -14.2373046875, -11.0546875, -7.8720703125, -4.689453125, -1.5068359375, 1.67578125, 4.8583984375, 8.041015625, 11.2236328125, 14.40625, 17.5888671875, 20.771484375, 23.9541015625, 27.13671875, 30.3193359375, 33.501953125, 36.6845703125, 39.8671875, 43.0498046875, 46.232421875, 49.4150390625, 52.59765625, 55.7802734375, 58.962890625, 62.1455078125, 65.328125, 68.5107421875, 71.693359375, 74.8759765625, 78.05859375, 81.2412109375, 84.423828125, 87.6064453125, 90.7890625, 93.9716796875, 97.154296875, 100.3369140625, 103.51953125, 106.7021484375, 109.884765625, 113.0673828125, 116.25]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 106.0, 600.0, 285.0, 12.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.01038360595703, -31.39297103881836, -24.775558471679688, -18.15814781188965, -11.540735244750977, -4.9233245849609375, 1.6940879821777344, 8.311500549316406, 14.928913116455078, 21.54632568359375, 28.163738250732422, 34.781150817871094, 41.3985595703125, 48.01597213745117, 54.633384704589844, 61.250797271728516, 67.86820983886719, 74.4856185913086, 81.10303497314453, 87.72044372558594, 94.33786010742188, 100.95526885986328, 107.57267761230469, 114.19009399414062, 120.80751037597656, 127.42491912841797, 134.04232788085938, 140.6597442626953, 147.27716064453125, 153.89456176757812, 160.51197814941406, 167.12939453125, 173.74681091308594, 180.36422729492188, 186.98162841796875, 193.5990447998047, 200.21646118164062, 206.8338623046875, 213.45127868652344, 220.06869506835938, 226.6861114501953, 233.30352783203125, 239.92092895507812, 246.53834533691406, 253.15576171875, 259.7731628417969, 266.3905944824219, 273.00799560546875, 279.6253967285156, 286.2427978515625, 292.8602294921875, 299.4776306152344, 306.09503173828125, 312.71246337890625, 319.3298645019531, 325.947265625, 332.564697265625, 339.1820983886719, 345.7995300292969, 352.41693115234375, 359.0343322753906, 365.6517639160156, 372.2691650390625, 378.8865966796875, 385.5039978027344]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 2.0, 14.0, 16.0, 19.0, 20.0, 30.0, 27.0, 46.0, 38.0, 48.0, 50.0, 57.0, 59.0, 63.0, 59.0, 51.0, 66.0, 49.0, 45.0, 47.0, 40.0, 28.0, 24.0, 19.0, 17.0, 19.0, 6.0, 7.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.2113037109375, -70.05340576171875, -67.8955078125, -65.73760986328125, -63.579708099365234, -61.421810150146484, -59.26390838623047, -57.10601043701172, -54.94811248779297, -52.79021453857422, -50.63231658935547, -48.47441482543945, -46.3165168762207, -44.15861892700195, -42.00071716308594, -39.84281921386719, -37.68492126464844, -35.52702331542969, -33.36912536621094, -31.211223602294922, -29.053325653076172, -26.895427703857422, -24.73752784729004, -22.579627990722656, -20.421730041503906, -18.263832092285156, -16.105932235717773, -13.948033332824707, -11.79013442993164, -9.632235527038574, -7.474336624145508, -5.316437721252441, -3.158538818359375, -1.0006399154663086, 1.1572589874267578, 3.315157890319824, 5.473056793212891, 7.630955696105957, 9.788854598999023, 11.94675350189209, 14.104652404785156, 16.262550354003906, 18.42045021057129, 20.578350067138672, 22.736248016357422, 24.894145965576172, 27.052045822143555, 29.209945678710938, 31.367843627929688, 33.52574157714844, 35.68363952636719, 37.8415412902832, 39.99943923950195, 42.1573371887207, 44.31523895263672, 46.47313690185547, 48.63103485107422, 50.78893280029297, 52.94683074951172, 55.104732513427734, 57.262630462646484, 59.420528411865234, 61.57843017578125, 63.736328125, 65.89422607421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 16.0, 18.0, 17.0, 15.0, 31.0, 17.0, 24.0, 36.0, 34.0, 33.0, 48.0, 50.0, 50.0, 55.0, 52.0, 62.0, 58.0, 47.0, 54.0, 30.0, 44.0, 33.0, 31.0, 20.0, 15.0, 13.0, 17.0, 11.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.29296875, -6.13153076171875, -5.9700927734375, -5.80865478515625, -5.647216796875, -5.48577880859375, -5.3243408203125, -5.16290283203125, -5.00146484375, -4.84002685546875, -4.6785888671875, -4.51715087890625, -4.355712890625, -4.19427490234375, -4.0328369140625, -3.87139892578125, -3.7099609375, -3.54852294921875, -3.3870849609375, -3.22564697265625, -3.064208984375, -2.90277099609375, -2.7413330078125, -2.57989501953125, -2.41845703125, -2.25701904296875, -2.0955810546875, -1.93414306640625, -1.772705078125, -1.61126708984375, -1.4498291015625, -1.28839111328125, -1.126953125, -0.96551513671875, -0.8040771484375, -0.64263916015625, -0.481201171875, -0.31976318359375, -0.1583251953125, 0.00311279296875, 0.16455078125, 0.32598876953125, 0.4874267578125, 0.64886474609375, 0.810302734375, 0.97174072265625, 1.1331787109375, 1.29461669921875, 1.4560546875, 1.61749267578125, 1.7789306640625, 1.94036865234375, 2.101806640625, 2.26324462890625, 2.4246826171875, 2.58612060546875, 2.74755859375, 2.90899658203125, 3.0704345703125, 3.23187255859375, 3.393310546875, 3.55474853515625, 3.7161865234375, 3.87762451171875, 4.0390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 8.0, 13.0, 17.0, 22.0, 35.0, 42.0, 89.0, 102.0, 183.0, 302.0, 449.0, 704.0, 1127.0, 1783.0, 2727.0, 4546.0, 7419.0, 11690.0, 19468.0, 33639.0, 58963.0, 111802.0, 223293.0, 266057.0, 135739.0, 70513.0, 39252.0, 22660.0, 13811.0, 8325.0, 5118.0, 3155.0, 2007.0, 1254.0, 777.0, 550.0, 304.0, 215.0, 133.0, 87.0, 52.0, 37.0, 28.0, 10.0, 7.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 4.0], "bins": [-0.7763671875, -0.7522125244140625, -0.728057861328125, -0.7039031982421875, -0.67974853515625, -0.6555938720703125, -0.631439208984375, -0.6072845458984375, -0.5831298828125, -0.5589752197265625, -0.534820556640625, -0.5106658935546875, -0.48651123046875, -0.4623565673828125, -0.438201904296875, -0.4140472412109375, -0.389892578125, -0.3657379150390625, -0.341583251953125, -0.3174285888671875, -0.29327392578125, -0.2691192626953125, -0.244964599609375, -0.2208099365234375, -0.1966552734375, -0.1725006103515625, -0.148345947265625, -0.1241912841796875, -0.10003662109375, -0.0758819580078125, -0.051727294921875, -0.0275726318359375, -0.00341796875, 0.0207366943359375, 0.044891357421875, 0.0690460205078125, 0.09320068359375, 0.1173553466796875, 0.141510009765625, 0.1656646728515625, 0.1898193359375, 0.2139739990234375, 0.238128662109375, 0.2622833251953125, 0.28643798828125, 0.3105926513671875, 0.334747314453125, 0.3589019775390625, 0.383056640625, 0.4072113037109375, 0.431365966796875, 0.4555206298828125, 0.47967529296875, 0.5038299560546875, 0.527984619140625, 0.5521392822265625, 0.5762939453125, 0.6004486083984375, 0.624603271484375, 0.6487579345703125, 0.67291259765625, 0.6970672607421875, 0.721221923828125, 0.7453765869140625, 0.76953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 9.0, 10.0, 16.0, 18.0, 27.0, 23.0, 26.0, 26.0, 26.0, 27.0, 32.0, 36.0, 51.0, 36.0, 42.0, 42.0, 1063.0, 38.0, 38.0, 47.0, 41.0, 31.0, 43.0, 26.0, 35.0, 32.0, 23.0, 20.0, 14.0, 17.0, 12.0, 12.0, 15.0, 9.0, 11.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.446624755859375, -2.36199951171875, -2.277374267578125, -2.1927490234375, -2.108123779296875, -2.02349853515625, -1.938873291015625, -1.854248046875, -1.769622802734375, -1.68499755859375, -1.600372314453125, -1.5157470703125, -1.431121826171875, -1.34649658203125, -1.261871337890625, -1.17724609375, -1.092620849609375, -1.00799560546875, -0.923370361328125, -0.8387451171875, -0.754119873046875, -0.66949462890625, -0.584869384765625, -0.500244140625, -0.415618896484375, -0.33099365234375, -0.246368408203125, -0.1617431640625, -0.077117919921875, 0.00750732421875, 0.092132568359375, 0.1767578125, 0.261383056640625, 0.34600830078125, 0.430633544921875, 0.5152587890625, 0.599884033203125, 0.68450927734375, 0.769134521484375, 0.853759765625, 0.938385009765625, 1.02301025390625, 1.107635498046875, 1.1922607421875, 1.276885986328125, 1.36151123046875, 1.446136474609375, 1.53076171875, 1.615386962890625, 1.70001220703125, 1.784637451171875, 1.8692626953125, 1.953887939453125, 2.03851318359375, 2.123138427734375, 2.207763671875, 2.292388916015625, 2.37701416015625, 2.461639404296875, 2.5462646484375, 2.630889892578125, 2.71551513671875, 2.800140380859375, 2.884765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 14.0, 19.0, 26.0, 45.0, 60.0, 67.0, 143.0, 166.0, 315.0, 353.0, 595.0, 886.0, 1324.0, 1876.0, 2637.0, 3929.0, 5793.0, 8424.0, 12820.0, 18899.0, 28910.0, 44685.0, 71852.0, 116453.0, 200355.0, 1249274.0, 119444.0, 73563.0, 45799.0, 29574.0, 19114.0, 12771.0, 8515.0, 5815.0, 3943.0, 2773.0, 1862.0, 1309.0, 882.0, 584.0, 413.0, 287.0, 181.0, 118.0, 74.0, 65.0, 29.0, 32.0, 22.0, 11.0, 13.0, 8.0, 1.0, 4.0, 3.0, 2.0], "bins": [-0.56787109375, -0.5506744384765625, -0.533477783203125, -0.5162811279296875, -0.49908447265625, -0.4818878173828125, -0.464691162109375, -0.4474945068359375, -0.4302978515625, -0.4131011962890625, -0.395904541015625, -0.3787078857421875, -0.36151123046875, -0.3443145751953125, -0.327117919921875, -0.3099212646484375, -0.292724609375, -0.2755279541015625, -0.258331298828125, -0.2411346435546875, -0.22393798828125, -0.2067413330078125, -0.189544677734375, -0.1723480224609375, -0.1551513671875, -0.1379547119140625, -0.120758056640625, -0.1035614013671875, -0.08636474609375, -0.0691680908203125, -0.051971435546875, -0.0347747802734375, -0.017578125, -0.0003814697265625, 0.016815185546875, 0.0340118408203125, 0.05120849609375, 0.0684051513671875, 0.085601806640625, 0.1027984619140625, 0.1199951171875, 0.1371917724609375, 0.154388427734375, 0.1715850830078125, 0.18878173828125, 0.2059783935546875, 0.223175048828125, 0.2403717041015625, 0.257568359375, 0.2747650146484375, 0.291961669921875, 0.3091583251953125, 0.32635498046875, 0.3435516357421875, 0.360748291015625, 0.3779449462890625, 0.3951416015625, 0.4123382568359375, 0.429534912109375, 0.4467315673828125, 0.46392822265625, 0.4811248779296875, 0.498321533203125, 0.5155181884765625, 0.53271484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 2.0, 7.0, 9.0, 17.0, 16.0, 19.0, 22.0, 30.0, 41.0, 45.0, 47.0, 55.0, 71.0, 59.0, 62.0, 59.0, 76.0, 51.0, 52.0, 43.0, 27.0, 47.0, 26.0, 22.0, 16.0, 11.0, 14.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002894401550292969, -0.0002780109643936157, -0.00026658177375793457, -0.0002551525831222534, -0.00024372339248657227, -0.0002322942018508911, -0.00022086501121520996, -0.0002094358205795288, -0.00019800662994384766, -0.0001865774393081665, -0.00017514824867248535, -0.0001637190580368042, -0.00015228986740112305, -0.0001408606767654419, -0.00012943148612976074, -0.00011800229549407959, -0.00010657310485839844, -9.514391422271729e-05, -8.371472358703613e-05, -7.228553295135498e-05, -6.085634231567383e-05, -4.9427151679992676e-05, -3.7997961044311523e-05, -2.656877040863037e-05, -1.5139579772949219e-05, -3.7103891372680664e-06, 7.718801498413086e-06, 1.9147992134094238e-05, 3.057718276977539e-05, 4.200637340545654e-05, 5.3435564041137695e-05, 6.486475467681885e-05, 7.62939453125e-05, 8.772313594818115e-05, 9.91523265838623e-05, 0.00011058151721954346, 0.00012201070785522461, 0.00013343989849090576, 0.00014486908912658691, 0.00015629827976226807, 0.00016772747039794922, 0.00017915666103363037, 0.00019058585166931152, 0.00020201504230499268, 0.00021344423294067383, 0.00022487342357635498, 0.00023630261421203613, 0.0002477318048477173, 0.00025916099548339844, 0.0002705901861190796, 0.00028201937675476074, 0.0002934485673904419, 0.00030487775802612305, 0.0003163069486618042, 0.00032773613929748535, 0.0003391653299331665, 0.00035059452056884766, 0.0003620237112045288, 0.00037345290184020996, 0.0003848820924758911, 0.00039631128311157227, 0.0004077404737472534, 0.00041916966438293457, 0.0004305988550186157, 0.0004420280456542969]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 7.0, 6.0, 7.0, 12.0, 11.0, 23.0, 38.0, 45.0, 41.0, 73.0, 98.0, 144.0, 191.0, 244.0, 378.0, 696.0, 3017.0, 1039662.0, 1912.0, 616.0, 389.0, 241.0, 184.0, 125.0, 92.0, 75.0, 43.0, 57.0, 29.0, 18.0, 22.0, 8.0, 5.0, 10.0, 5.0, 10.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.00812530517578125, -0.00788944959640503, -0.007653594017028809, -0.007417738437652588, -0.007181882858276367, -0.0069460272789001465, -0.006710171699523926, -0.006474316120147705, -0.006238460540771484, -0.006002604961395264, -0.005766749382019043, -0.005530893802642822, -0.0052950382232666016, -0.005059182643890381, -0.00482332706451416, -0.0045874714851379395, -0.004351615905761719, -0.004115760326385498, -0.0038799047470092773, -0.0036440491676330566, -0.003408193588256836, -0.0031723380088806152, -0.0029364824295043945, -0.002700626850128174, -0.002464771270751953, -0.0022289156913757324, -0.0019930601119995117, -0.001757204532623291, -0.0015213489532470703, -0.0012854933738708496, -0.001049637794494629, -0.0008137822151184082, -0.0005779266357421875, -0.0003420710563659668, -0.0001062154769897461, 0.0001296401023864746, 0.0003654956817626953, 0.000601351261138916, 0.0008372068405151367, 0.0010730624198913574, 0.0013089179992675781, 0.0015447735786437988, 0.0017806291580200195, 0.0020164847373962402, 0.002252340316772461, 0.0024881958961486816, 0.0027240514755249023, 0.002959907054901123, 0.0031957626342773438, 0.0034316182136535645, 0.003667473793029785, 0.003903329372406006, 0.0041391849517822266, 0.004375040531158447, 0.004610896110534668, 0.004846751689910889, 0.005082607269287109, 0.00531846284866333, 0.005554318428039551, 0.0057901740074157715, 0.006026029586791992, 0.006261885166168213, 0.006497740745544434, 0.006733596324920654, 0.006969451904296875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 374.0, 640.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027660042978823185, -0.0027096248231828213, -0.002653245348483324, -0.002596865873783827, -0.002540486166253686, -0.0024841066915541887, -0.0024277272168546915, -0.0023713477421551943, -0.002314968267455697, -0.0022585887927562, -0.0022022093180567026, -0.0021458298433572054, -0.0020894501358270645, -0.0020330706611275673, -0.00197669118642807, -0.0019203117117285728, -0.0018639322370290756, -0.0018075527623295784, -0.0017511731712147593, -0.0016947936965152621, -0.001638414221815765, -0.0015820346307009459, -0.0015256551560014486, -0.0014692756813019514, -0.0014128960901871324, -0.0013565166154876351, -0.001300137024372816, -0.0012437575496733189, -0.0011873780749738216, -0.0011309986002743244, -0.0010746190091595054, -0.0010182395344600081, -0.0009618600597605109, -0.0009054805268533528, -0.0008491010521538556, -0.0007927215192466974, -0.0007363420445472002, -0.0006799625116400421, -0.0006235829787328839, -0.0005672035040333867, -0.0005108240293338895, -0.0004544445255305618, -0.0003980650217272341, -0.000341685488820076, -0.00028530601412057877, -0.00022892648121342063, -0.00017254697741009295, -0.00011616747360676527, -5.9787940699607134e-05, -3.408433258300647e-06, 5.297107418300584e-05, 0.00010935058526229113, 0.0001657300890656188, 0.00022210960742086172, 0.0002784891112241894, 0.0003348686150275171, 0.00039124811883084476, 0.00044762762263417244, 0.0005040071555413306, 0.0005603866302408278, 0.0006167661631479859, 0.0006731456378474832, 0.0007295251707546413, 0.0007859047036617994, 0.0008422841783612967]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 4.0, 8.0, 10.0, 7.0, 10.0, 11.0, 12.0, 10.0, 23.0, 9.0, 33.0, 21.0, 21.0, 39.0, 20.0, 48.0, 28.0, 32.0, 35.0, 42.0, 37.0, 52.0, 41.0, 32.0, 34.0, 35.0, 36.0, 28.0, 31.0, 28.0, 24.0, 30.0, 24.0, 24.0, 13.0, 21.0, 21.0, 13.0, 15.0, 6.0, 9.0, 4.0, 5.0, 5.0, 3.0, 7.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018829107284545898, -0.00018277112394571304, -0.0001772511750459671, -0.00017173122614622116, -0.00016621127724647522, -0.00016069132834672928, -0.00015517137944698334, -0.0001496514305472374, -0.00014413148164749146, -0.00013861153274774551, -0.00013309158384799957, -0.00012757163494825363, -0.00012205168604850769, -0.00011653173714876175, -0.00011101178824901581, -0.00010549183934926987, -9.997189044952393e-05, -9.445194154977798e-05, -8.893199265003204e-05, -8.34120437502861e-05, -7.789209485054016e-05, -7.237214595079422e-05, -6.685219705104828e-05, -6.133224815130234e-05, -5.5812299251556396e-05, -5.0292350351810455e-05, -4.4772401452064514e-05, -3.925245255231857e-05, -3.373250365257263e-05, -2.821255475282669e-05, -2.269260585308075e-05, -1.717265695333481e-05, -1.1652708053588867e-05, -6.132759153842926e-06, -6.128102540969849e-07, 4.907138645648956e-06, 1.0427087545394897e-05, 1.594703644514084e-05, 2.146698534488678e-05, 2.698693424463272e-05, 3.250688314437866e-05, 3.80268320441246e-05, 4.3546780943870544e-05, 4.9066729843616486e-05, 5.458667874336243e-05, 6.010662764310837e-05, 6.562657654285431e-05, 7.114652544260025e-05, 7.666647434234619e-05, 8.218642324209213e-05, 8.770637214183807e-05, 9.322632104158401e-05, 9.874626994132996e-05, 0.0001042662188410759, 0.00010978616774082184, 0.00011530611664056778, 0.00012082606554031372, 0.00012634601444005966, 0.0001318659633398056, 0.00013738591223955154, 0.00014290586113929749, 0.00014842581003904343, 0.00015394575893878937, 0.0001594657078385353, 0.00016498565673828125]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 16.0, 18.0, 17.0, 15.0, 31.0, 17.0, 24.0, 36.0, 34.0, 33.0, 48.0, 50.0, 50.0, 55.0, 52.0, 62.0, 58.0, 47.0, 54.0, 30.0, 44.0, 33.0, 31.0, 20.0, 15.0, 13.0, 17.0, 11.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.29296875, -6.13153076171875, -5.9700927734375, -5.80865478515625, -5.647216796875, -5.48577880859375, -5.3243408203125, -5.16290283203125, -5.00146484375, -4.84002685546875, -4.6785888671875, -4.51715087890625, -4.355712890625, -4.19427490234375, -4.0328369140625, -3.87139892578125, -3.7099609375, -3.54852294921875, -3.3870849609375, -3.22564697265625, -3.064208984375, -2.90277099609375, -2.7413330078125, -2.57989501953125, -2.41845703125, -2.25701904296875, -2.0955810546875, -1.93414306640625, -1.772705078125, -1.61126708984375, -1.4498291015625, -1.28839111328125, -1.126953125, -0.96551513671875, -0.8040771484375, -0.64263916015625, -0.481201171875, -0.31976318359375, -0.1583251953125, 0.00311279296875, 0.16455078125, 0.32598876953125, 0.4874267578125, 0.64886474609375, 0.810302734375, 0.97174072265625, 1.1331787109375, 1.29461669921875, 1.4560546875, 1.61749267578125, 1.7789306640625, 1.94036865234375, 2.101806640625, 2.26324462890625, 2.4246826171875, 2.58612060546875, 2.74755859375, 2.90899658203125, 3.0704345703125, 3.23187255859375, 3.393310546875, 3.55474853515625, 3.7161865234375, 3.87762451171875, 4.0390625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 9.0, 9.0, 19.0, 23.0, 20.0, 42.0, 44.0, 69.0, 103.0, 126.0, 182.0, 231.0, 321.0, 491.0, 635.0, 933.0, 1326.0, 1971.0, 3080.0, 5351.0, 10535.0, 30146.0, 756300.0, 195459.0, 19870.0, 8296.0, 4420.0, 2745.0, 1694.0, 1169.0, 828.0, 574.0, 425.0, 297.0, 223.0, 169.0, 111.0, 79.0, 67.0, 40.0, 35.0, 24.0, 19.0, 18.0, 11.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.515625, -29.58642578125, -28.6572265625, -27.72802734375, -26.798828125, -25.86962890625, -24.9404296875, -24.01123046875, -23.08203125, -22.15283203125, -21.2236328125, -20.29443359375, -19.365234375, -18.43603515625, -17.5068359375, -16.57763671875, -15.6484375, -14.71923828125, -13.7900390625, -12.86083984375, -11.931640625, -11.00244140625, -10.0732421875, -9.14404296875, -8.21484375, -7.28564453125, -6.3564453125, -5.42724609375, -4.498046875, -3.56884765625, -2.6396484375, -1.71044921875, -0.78125, 0.14794921875, 1.0771484375, 2.00634765625, 2.935546875, 3.86474609375, 4.7939453125, 5.72314453125, 6.65234375, 7.58154296875, 8.5107421875, 9.43994140625, 10.369140625, 11.29833984375, 12.2275390625, 13.15673828125, 14.0859375, 15.01513671875, 15.9443359375, 16.87353515625, 17.802734375, 18.73193359375, 19.6611328125, 20.59033203125, 21.51953125, 22.44873046875, 23.3779296875, 24.30712890625, 25.236328125, 26.16552734375, 27.0947265625, 28.02392578125, 28.953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 7.0, 8.0, 11.0, 12.0, 11.0, 14.0, 10.0, 19.0, 15.0, 22.0, 27.0, 22.0, 39.0, 30.0, 32.0, 43.0, 40.0, 55.0, 79.0, 204.0, 1642.0, 216.0, 84.0, 52.0, 37.0, 36.0, 35.0, 37.0, 29.0, 33.0, 25.0, 20.0, 19.0, 18.0, 14.0, 7.0, 10.0, 9.0, 1.0, 10.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.4609375, -12.0777587890625, -11.694580078125, -11.3114013671875, -10.92822265625, -10.5450439453125, -10.161865234375, -9.7786865234375, -9.3955078125, -9.0123291015625, -8.629150390625, -8.2459716796875, -7.86279296875, -7.4796142578125, -7.096435546875, -6.7132568359375, -6.330078125, -5.9468994140625, -5.563720703125, -5.1805419921875, -4.79736328125, -4.4141845703125, -4.031005859375, -3.6478271484375, -3.2646484375, -2.8814697265625, -2.498291015625, -2.1151123046875, -1.73193359375, -1.3487548828125, -0.965576171875, -0.5823974609375, -0.19921875, 0.1839599609375, 0.567138671875, 0.9503173828125, 1.33349609375, 1.7166748046875, 2.099853515625, 2.4830322265625, 2.8662109375, 3.2493896484375, 3.632568359375, 4.0157470703125, 4.39892578125, 4.7821044921875, 5.165283203125, 5.5484619140625, 5.931640625, 6.3148193359375, 6.697998046875, 7.0811767578125, 7.46435546875, 7.8475341796875, 8.230712890625, 8.6138916015625, 8.9970703125, 9.3802490234375, 9.763427734375, 10.1466064453125, 10.52978515625, 10.9129638671875, 11.296142578125, 11.6793212890625, 12.0625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 8.0, 13.0, 17.0, 15.0, 24.0, 21.0, 28.0, 37.0, 37.0, 38.0, 56.0, 69.0, 172.0, 551.0, 3187.0, 3109555.0, 30118.0, 925.0, 302.0, 127.0, 72.0, 35.0, 39.0, 31.0, 29.0, 22.0, 20.0, 30.0, 19.0, 7.0, 15.0, 10.0, 12.0, 11.0, 4.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-55.0625, -53.32568359375, -51.5888671875, -49.85205078125, -48.115234375, -46.37841796875, -44.6416015625, -42.90478515625, -41.16796875, -39.43115234375, -37.6943359375, -35.95751953125, -34.220703125, -32.48388671875, -30.7470703125, -29.01025390625, -27.2734375, -25.53662109375, -23.7998046875, -22.06298828125, -20.326171875, -18.58935546875, -16.8525390625, -15.11572265625, -13.37890625, -11.64208984375, -9.9052734375, -8.16845703125, -6.431640625, -4.69482421875, -2.9580078125, -1.22119140625, 0.515625, 2.25244140625, 3.9892578125, 5.72607421875, 7.462890625, 9.19970703125, 10.9365234375, 12.67333984375, 14.41015625, 16.14697265625, 17.8837890625, 19.62060546875, 21.357421875, 23.09423828125, 24.8310546875, 26.56787109375, 28.3046875, 30.04150390625, 31.7783203125, 33.51513671875, 35.251953125, 36.98876953125, 38.7255859375, 40.46240234375, 42.19921875, 43.93603515625, 45.6728515625, 47.40966796875, 49.146484375, 50.88330078125, 52.6201171875, 54.35693359375, 56.09375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 755.0, 243.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.55690002441406, -167.24212646484375, -162.92735290527344, -158.61257934570312, -154.2978057861328, -149.9830322265625, -145.6682586669922, -141.35348510742188, -137.0386962890625, -132.7239227294922, -128.40914916992188, -124.09437561035156, -119.77960205078125, -115.46482849121094, -111.1500473022461, -106.83527374267578, -102.5205078125, -98.20573425292969, -93.89096069335938, -89.57618713378906, -85.26141357421875, -80.94664001464844, -76.6318588256836, -72.31708526611328, -68.00231170654297, -63.687538146972656, -59.372764587402344, -55.057987213134766, -50.74321365356445, -46.42844009399414, -42.11366271972656, -37.79888916015625, -33.48411560058594, -29.169342041015625, -24.85456657409668, -20.539791107177734, -16.225017547607422, -11.91024398803711, -7.595468521118164, -3.2806930541992188, 1.0340805053710938, 5.348855018615723, 9.663629531860352, 13.97840404510498, 18.29317855834961, 22.607952117919922, 26.922727584838867, 31.237503051757812, 35.552276611328125, 39.86705017089844, 44.18182373046875, 48.49660110473633, 52.81137466430664, 57.12614822387695, 61.44092559814453, 65.75569915771484, 70.07047271728516, 74.38524627685547, 78.70001983642578, 83.0147933959961, 87.32957458496094, 91.64434814453125, 95.95912170410156, 100.27389526367188, 104.58866882324219]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 0.0, 3.0, 9.0, 5.0, 6.0, 19.0, 8.0, 7.0, 14.0, 20.0, 23.0, 27.0, 26.0, 23.0, 30.0, 32.0, 42.0, 28.0, 48.0, 43.0, 48.0, 45.0, 47.0, 38.0, 45.0, 46.0, 39.0, 35.0, 25.0, 42.0, 25.0, 28.0, 20.0, 21.0, 17.0, 11.0, 8.0, 16.0, 5.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.96411895751953, -35.4940071105957, -34.02389907836914, -32.55378723144531, -31.083677291870117, -29.613567352294922, -28.143457412719727, -26.67334747314453, -25.203235626220703, -23.733125686645508, -22.263015747070312, -20.792903900146484, -19.32279396057129, -17.852684020996094, -16.3825740814209, -14.912463188171387, -13.442354202270508, -11.972244262695312, -10.5021333694458, -9.032023429870605, -7.561913013458252, -6.091802597045898, -4.621692657470703, -3.1515817642211914, -1.681471824645996, -0.21136152744293213, 1.2587487697601318, 2.7288589477539062, 4.19896936416626, 5.669079780578613, 7.139189720153809, 8.60930061340332, 10.079410552978516, 11.549520492553711, 13.019631385803223, 14.489741325378418, 15.95985221862793, 17.429962158203125, 18.90007209777832, 20.370182037353516, 21.840293884277344, 23.31040382385254, 24.780513763427734, 26.250625610351562, 27.720735549926758, 29.190845489501953, 30.66095542907715, 32.131065368652344, 33.601173400878906, 35.071285247802734, 36.5413932800293, 38.011505126953125, 39.48161315917969, 40.951725006103516, 42.421836853027344, 43.891944885253906, 45.362056732177734, 46.83216857910156, 48.302276611328125, 49.77238845825195, 51.242496490478516, 52.712608337402344, 54.182716369628906, 55.652828216552734, 57.12294006347656]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 7.0, 11.0, 10.0, 14.0, 19.0, 20.0, 17.0, 25.0, 22.0, 28.0, 25.0, 39.0, 30.0, 45.0, 51.0, 54.0, 47.0, 58.0, 54.0, 61.0, 55.0, 38.0, 35.0, 39.0, 34.0, 29.0, 19.0, 23.0, 19.0, 15.0, 11.0, 7.0, 14.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1875, -6.020263671875, -5.85302734375, -5.685791015625, -5.5185546875, -5.351318359375, -5.18408203125, -5.016845703125, -4.849609375, -4.682373046875, -4.51513671875, -4.347900390625, -4.1806640625, -4.013427734375, -3.84619140625, -3.678955078125, -3.51171875, -3.344482421875, -3.17724609375, -3.010009765625, -2.8427734375, -2.675537109375, -2.50830078125, -2.341064453125, -2.173828125, -2.006591796875, -1.83935546875, -1.672119140625, -1.5048828125, -1.337646484375, -1.17041015625, -1.003173828125, -0.8359375, -0.668701171875, -0.50146484375, -0.334228515625, -0.1669921875, 0.000244140625, 0.16748046875, 0.334716796875, 0.501953125, 0.669189453125, 0.83642578125, 1.003662109375, 1.1708984375, 1.338134765625, 1.50537109375, 1.672607421875, 1.83984375, 2.007080078125, 2.17431640625, 2.341552734375, 2.5087890625, 2.676025390625, 2.84326171875, 3.010498046875, 3.177734375, 3.344970703125, 3.51220703125, 3.679443359375, 3.8466796875, 4.013916015625, 4.18115234375, 4.348388671875, 4.515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 8.0, 5.0, 7.0, 11.0, 21.0, 18.0, 26.0, 32.0, 53.0, 77.0, 111.0, 200.0, 319.0, 551.0, 1045.0, 2162.0, 4484.0, 10499.0, 30649.0, 201788.0, 3619767.0, 268429.0, 33329.0, 10871.0, 4800.0, 2275.0, 1155.0, 622.0, 325.0, 209.0, 129.0, 95.0, 58.0, 43.0, 24.0, 16.0, 16.0, 15.0, 7.0, 9.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.5087890625, -25.611328125, -24.7138671875, -23.81640625, -22.9189453125, -22.021484375, -21.1240234375, -20.2265625, -19.3291015625, -18.431640625, -17.5341796875, -16.63671875, -15.7392578125, -14.841796875, -13.9443359375, -13.046875, -12.1494140625, -11.251953125, -10.3544921875, -9.45703125, -8.5595703125, -7.662109375, -6.7646484375, -5.8671875, -4.9697265625, -4.072265625, -3.1748046875, -2.27734375, -1.3798828125, -0.482421875, 0.4150390625, 1.3125, 2.2099609375, 3.107421875, 4.0048828125, 4.90234375, 5.7998046875, 6.697265625, 7.5947265625, 8.4921875, 9.3896484375, 10.287109375, 11.1845703125, 12.08203125, 12.9794921875, 13.876953125, 14.7744140625, 15.671875, 16.5693359375, 17.466796875, 18.3642578125, 19.26171875, 20.1591796875, 21.056640625, 21.9541015625, 22.8515625, 23.7490234375, 24.646484375, 25.5439453125, 26.44140625, 27.3388671875, 28.236328125, 29.1337890625, 30.03125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 9.0, 16.0, 25.0, 40.0, 48.0, 56.0, 99.0, 129.0, 214.0, 346.0, 618.0, 771.0, 606.0, 346.0, 242.0, 148.0, 92.0, 73.0, 49.0, 29.0, 25.0, 33.0, 14.0, 11.0, 7.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.5703125, -26.75, -25.9296875, -25.109375, -24.2890625, -23.46875, -22.6484375, -21.828125, -21.0078125, -20.1875, -19.3671875, -18.546875, -17.7265625, -16.90625, -16.0859375, -15.265625, -14.4453125, -13.625, -12.8046875, -11.984375, -11.1640625, -10.34375, -9.5234375, -8.703125, -7.8828125, -7.0625, -6.2421875, -5.421875, -4.6015625, -3.78125, -2.9609375, -2.140625, -1.3203125, -0.5, 0.3203125, 1.140625, 1.9609375, 2.78125, 3.6015625, 4.421875, 5.2421875, 6.0625, 6.8828125, 7.703125, 8.5234375, 9.34375, 10.1640625, 10.984375, 11.8046875, 12.625, 13.4453125, 14.265625, 15.0859375, 15.90625, 16.7265625, 17.546875, 18.3671875, 19.1875, 20.0078125, 20.828125, 21.6484375, 22.46875, 23.2890625, 24.109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 7.0, 6.0, 11.0, 7.0, 21.0, 27.0, 36.0, 38.0, 54.0, 87.0, 123.0, 168.0, 334.0, 838.0, 13162.0, 4170489.0, 7280.0, 710.0, 339.0, 173.0, 118.0, 84.0, 49.0, 32.0, 30.0, 21.0, 16.0, 6.0, 2.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.25, -80.49609375, -76.7421875, -72.98828125, -69.234375, -65.48046875, -61.7265625, -57.97265625, -54.21875, -50.46484375, -46.7109375, -42.95703125, -39.203125, -35.44921875, -31.6953125, -27.94140625, -24.1875, -20.43359375, -16.6796875, -12.92578125, -9.171875, -5.41796875, -1.6640625, 2.08984375, 5.84375, 9.59765625, 13.3515625, 17.10546875, 20.859375, 24.61328125, 28.3671875, 32.12109375, 35.875, 39.62890625, 43.3828125, 47.13671875, 50.890625, 54.64453125, 58.3984375, 62.15234375, 65.90625, 69.66015625, 73.4140625, 77.16796875, 80.921875, 84.67578125, 88.4296875, 92.18359375, 95.9375, 99.69140625, 103.4453125, 107.19921875, 110.953125, 114.70703125, 118.4609375, 122.21484375, 125.96875, 129.72265625, 133.4765625, 137.23046875, 140.984375, 144.73828125, 148.4921875, 152.24609375, 156.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [4.0, 2.0, 134.0, 771.0, 107.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.26115798950195, -23.710105895996094, -14.159051895141602, -4.607997894287109, 4.94305419921875, 14.49410629272461, 24.045162200927734, 33.59621047973633, 43.14726638793945, 52.69831848144531, 62.24937438964844, 71.80043029785156, 81.35147857666016, 90.90252685546875, 100.45358276367188, 110.004638671875, 119.55569458007812, 129.10675048828125, 138.65780639648438, 148.2088623046875, 157.75990295410156, 167.3109588623047, 176.8620147705078, 186.41305541992188, 195.964111328125, 205.51516723632812, 215.06622314453125, 224.61727905273438, 234.16831970214844, 243.71937561035156, 253.2704315185547, 262.82147216796875, 272.3725280761719, 281.923583984375, 291.4746398925781, 301.02569580078125, 310.5767517089844, 320.1278076171875, 329.6788330078125, 339.2298889160156, 348.78094482421875, 358.3320007324219, 367.883056640625, 377.4341125488281, 386.98516845703125, 396.53619384765625, 406.0872802734375, 415.6383056640625, 425.18939208984375, 434.7404479980469, 444.29150390625, 453.8425598144531, 463.39361572265625, 472.94464111328125, 482.4957275390625, 492.0467529296875, 501.5978088378906, 511.14886474609375, 520.6998901367188, 530.2509765625, 539.802001953125, 549.3530883789062, 558.9041137695312, 568.4552001953125, 578.0062255859375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 9.0, 12.0, 9.0, 16.0, 16.0, 19.0, 17.0, 31.0, 25.0, 26.0, 40.0, 43.0, 33.0, 34.0, 38.0, 38.0, 52.0, 44.0, 50.0, 47.0, 35.0, 47.0, 26.0, 38.0, 34.0, 19.0, 27.0, 24.0, 23.0, 21.0, 20.0, 16.0, 15.0, 8.0, 10.0, 8.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-69.60829162597656, -67.6014404296875, -65.59459686279297, -63.587745666503906, -61.580894470214844, -59.57404708862305, -57.56719970703125, -55.56034851074219, -53.553497314453125, -51.54664993286133, -49.539798736572266, -47.53295135498047, -45.526100158691406, -43.51925277709961, -41.51240539550781, -39.50555419921875, -37.49870681762695, -35.491859436035156, -33.485008239746094, -31.478160858154297, -29.471309661865234, -27.464462280273438, -25.457612991333008, -23.450763702392578, -21.44391441345215, -19.43706512451172, -17.43021583557129, -15.423367500305176, -13.416518211364746, -11.409668922424316, -9.402820587158203, -7.395971298217773, -5.389122009277344, -3.382272958755493, -1.3754239082336426, 0.6314249038696289, 2.6382741928100586, 4.645123481750488, 6.651971817016602, 8.658821105957031, 10.665670394897461, 12.67251968383789, 14.67936897277832, 16.68621826171875, 18.693065643310547, 20.69991683959961, 22.706764221191406, 24.713613510131836, 26.720462799072266, 28.727312088012695, 30.734161376953125, 32.74100875854492, 34.747859954833984, 36.75470733642578, 38.761558532714844, 40.76840591430664, 42.77525329589844, 44.782100677490234, 46.7889518737793, 48.795799255371094, 50.802650451660156, 52.80949783325195, 54.81634521484375, 56.82319641113281, 58.830047607421875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 9.0, 13.0, 7.0, 14.0, 17.0, 22.0, 23.0, 35.0, 23.0, 35.0, 29.0, 33.0, 43.0, 40.0, 42.0, 50.0, 45.0, 59.0, 53.0, 40.0, 45.0, 43.0, 32.0, 40.0, 29.0, 27.0, 23.0, 19.0, 17.0, 14.0, 12.0, 7.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.7109375, -5.55352783203125, -5.3961181640625, -5.23870849609375, -5.081298828125, -4.92388916015625, -4.7664794921875, -4.60906982421875, -4.45166015625, -4.29425048828125, -4.1368408203125, -3.97943115234375, -3.822021484375, -3.66461181640625, -3.5072021484375, -3.34979248046875, -3.1923828125, -3.03497314453125, -2.8775634765625, -2.72015380859375, -2.562744140625, -2.40533447265625, -2.2479248046875, -2.09051513671875, -1.93310546875, -1.77569580078125, -1.6182861328125, -1.46087646484375, -1.303466796875, -1.14605712890625, -0.9886474609375, -0.83123779296875, -0.673828125, -0.51641845703125, -0.3590087890625, -0.20159912109375, -0.044189453125, 0.11322021484375, 0.2706298828125, 0.42803955078125, 0.58544921875, 0.74285888671875, 0.9002685546875, 1.05767822265625, 1.215087890625, 1.37249755859375, 1.5299072265625, 1.68731689453125, 1.8447265625, 2.00213623046875, 2.1595458984375, 2.31695556640625, 2.474365234375, 2.63177490234375, 2.7891845703125, 2.94659423828125, 3.10400390625, 3.26141357421875, 3.4188232421875, 3.57623291015625, 3.733642578125, 3.89105224609375, 4.0484619140625, 4.20587158203125, 4.36328125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 15.0, 19.0, 37.0, 54.0, 79.0, 118.0, 192.0, 310.0, 453.0, 686.0, 1059.0, 1833.0, 2942.0, 4715.0, 7616.0, 12326.0, 20740.0, 34448.0, 58052.0, 101939.0, 192597.0, 265304.0, 145790.0, 79400.0, 46776.0, 27820.0, 16736.0, 9980.0, 6300.0, 3768.0, 2378.0, 1466.0, 940.0, 607.0, 356.0, 216.0, 162.0, 100.0, 80.0, 54.0, 31.0, 17.0, 11.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.87060546875, -0.844451904296875, -0.81829833984375, -0.792144775390625, -0.7659912109375, -0.739837646484375, -0.71368408203125, -0.687530517578125, -0.661376953125, -0.635223388671875, -0.60906982421875, -0.582916259765625, -0.5567626953125, -0.530609130859375, -0.50445556640625, -0.478302001953125, -0.4521484375, -0.425994873046875, -0.39984130859375, -0.373687744140625, -0.3475341796875, -0.321380615234375, -0.29522705078125, -0.269073486328125, -0.242919921875, -0.216766357421875, -0.19061279296875, -0.164459228515625, -0.1383056640625, -0.112152099609375, -0.08599853515625, -0.059844970703125, -0.03369140625, -0.007537841796875, 0.01861572265625, 0.044769287109375, 0.0709228515625, 0.097076416015625, 0.12322998046875, 0.149383544921875, 0.175537109375, 0.201690673828125, 0.22784423828125, 0.253997802734375, 0.2801513671875, 0.306304931640625, 0.33245849609375, 0.358612060546875, 0.384765625, 0.410919189453125, 0.43707275390625, 0.463226318359375, 0.4893798828125, 0.515533447265625, 0.54168701171875, 0.567840576171875, 0.593994140625, 0.620147705078125, 0.64630126953125, 0.672454833984375, 0.6986083984375, 0.724761962890625, 0.75091552734375, 0.777069091796875, 0.80322265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 4.0, 2.0, 11.0, 14.0, 9.0, 12.0, 17.0, 11.0, 26.0, 29.0, 24.0, 22.0, 20.0, 30.0, 43.0, 33.0, 32.0, 41.0, 35.0, 45.0, 1059.0, 40.0, 44.0, 39.0, 34.0, 45.0, 34.0, 31.0, 29.0, 34.0, 30.0, 20.0, 26.0, 17.0, 9.0, 14.0, 11.0, 7.0, 12.0, 5.0, 5.0, 7.0, 0.0, 9.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.734375, -2.64202880859375, -2.5496826171875, -2.45733642578125, -2.364990234375, -2.27264404296875, -2.1802978515625, -2.08795166015625, -1.99560546875, -1.90325927734375, -1.8109130859375, -1.71856689453125, -1.626220703125, -1.53387451171875, -1.4415283203125, -1.34918212890625, -1.2568359375, -1.16448974609375, -1.0721435546875, -0.97979736328125, -0.887451171875, -0.79510498046875, -0.7027587890625, -0.61041259765625, -0.51806640625, -0.42572021484375, -0.3333740234375, -0.24102783203125, -0.148681640625, -0.05633544921875, 0.0360107421875, 0.12835693359375, 0.220703125, 0.31304931640625, 0.4053955078125, 0.49774169921875, 0.590087890625, 0.68243408203125, 0.7747802734375, 0.86712646484375, 0.95947265625, 1.05181884765625, 1.1441650390625, 1.23651123046875, 1.328857421875, 1.42120361328125, 1.5135498046875, 1.60589599609375, 1.6982421875, 1.79058837890625, 1.8829345703125, 1.97528076171875, 2.067626953125, 2.15997314453125, 2.2523193359375, 2.34466552734375, 2.43701171875, 2.52935791015625, 2.6217041015625, 2.71405029296875, 2.806396484375, 2.89874267578125, 2.9910888671875, 3.08343505859375, 3.17578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 7.0, 15.0, 18.0, 30.0, 45.0, 61.0, 101.0, 140.0, 202.0, 320.0, 486.0, 761.0, 1079.0, 1647.0, 2387.0, 3792.0, 5561.0, 8600.0, 13120.0, 20200.0, 31747.0, 52094.0, 85638.0, 150482.0, 1299043.0, 168678.0, 95309.0, 56819.0, 35211.0, 22080.0, 14080.0, 9200.0, 6152.0, 4050.0, 2662.0, 1785.0, 1138.0, 794.0, 530.0, 349.0, 258.0, 144.0, 98.0, 78.0, 45.0, 36.0, 21.0, 10.0, 10.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.69873046875, -0.6779327392578125, -0.657135009765625, -0.6363372802734375, -0.61553955078125, -0.5947418212890625, -0.573944091796875, -0.5531463623046875, -0.5323486328125, -0.5115509033203125, -0.490753173828125, -0.4699554443359375, -0.44915771484375, -0.4283599853515625, -0.407562255859375, -0.3867645263671875, -0.365966796875, -0.3451690673828125, -0.324371337890625, -0.3035736083984375, -0.28277587890625, -0.2619781494140625, -0.241180419921875, -0.2203826904296875, -0.1995849609375, -0.1787872314453125, -0.157989501953125, -0.1371917724609375, -0.11639404296875, -0.0955963134765625, -0.074798583984375, -0.0540008544921875, -0.033203125, -0.0124053955078125, 0.008392333984375, 0.0291900634765625, 0.04998779296875, 0.0707855224609375, 0.091583251953125, 0.1123809814453125, 0.1331787109375, 0.1539764404296875, 0.174774169921875, 0.1955718994140625, 0.21636962890625, 0.2371673583984375, 0.257965087890625, 0.2787628173828125, 0.299560546875, 0.3203582763671875, 0.341156005859375, 0.3619537353515625, 0.38275146484375, 0.4035491943359375, 0.424346923828125, 0.4451446533203125, 0.4659423828125, 0.4867401123046875, 0.507537841796875, 0.5283355712890625, 0.54913330078125, 0.5699310302734375, 0.590728759765625, 0.6115264892578125, 0.63232421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 9.0, 16.0, 8.0, 14.0, 21.0, 24.0, 35.0, 31.0, 32.0, 28.0, 41.0, 50.0, 54.0, 55.0, 66.0, 75.0, 42.0, 45.0, 49.0, 51.0, 38.0, 46.0, 18.0, 17.0, 18.0, 14.0, 15.0, 19.0, 12.0, 5.0, 9.0, 8.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.0005235671997070312, -0.00051068514585495, -0.0004978030920028687, -0.00048492103815078735, -0.00047203898429870605, -0.00045915693044662476, -0.00044627487659454346, -0.00043339282274246216, -0.00042051076889038086, -0.00040762871503829956, -0.00039474666118621826, -0.00038186460733413696, -0.00036898255348205566, -0.00035610049962997437, -0.00034321844577789307, -0.00033033639192581177, -0.00031745433807373047, -0.00030457228422164917, -0.00029169023036956787, -0.00027880817651748657, -0.0002659261226654053, -0.000253044068813324, -0.00024016201496124268, -0.00022727996110916138, -0.00021439790725708008, -0.00020151585340499878, -0.00018863379955291748, -0.00017575174570083618, -0.00016286969184875488, -0.00014998763799667358, -0.00013710558414459229, -0.00012422353029251099, -0.00011134147644042969, -9.845942258834839e-05, -8.557736873626709e-05, -7.269531488418579e-05, -5.981326103210449e-05, -4.693120718002319e-05, -3.4049153327941895e-05, -2.1167099475860596e-05, -8.285045623779297e-06, 4.597008228302002e-06, 1.74790620803833e-05, 3.03611159324646e-05, 4.32431697845459e-05, 5.61252236366272e-05, 6.90072774887085e-05, 8.18893313407898e-05, 9.47713851928711e-05, 0.00010765343904495239, 0.00012053549289703369, 0.000133417546749115, 0.0001462996006011963, 0.0001591816544532776, 0.0001720637083053589, 0.00018494576215744019, 0.00019782781600952148, 0.00021070986986160278, 0.00022359192371368408, 0.00023647397756576538, 0.0002493560314178467, 0.000262238085269928, 0.0002751201391220093, 0.0002880021929740906, 0.0003008842468261719]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 16.0, 11.0, 22.0, 21.0, 30.0, 39.0, 66.0, 66.0, 101.0, 144.0, 317.0, 602.0, 4301.0, 1040318.0, 1268.0, 426.0, 242.0, 148.0, 102.0, 70.0, 53.0, 32.0, 32.0, 18.0, 14.0, 20.0, 13.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00841522216796875, -0.008054494857788086, -0.007693767547607422, -0.007333040237426758, -0.006972312927246094, -0.00661158561706543, -0.006250858306884766, -0.0058901309967041016, -0.0055294036865234375, -0.0051686763763427734, -0.004807949066162109, -0.004447221755981445, -0.004086494445800781, -0.003725767135620117, -0.003365039825439453, -0.003004312515258789, -0.002643585205078125, -0.002282857894897461, -0.0019221305847167969, -0.0015614032745361328, -0.0012006759643554688, -0.0008399486541748047, -0.0004792213439941406, -0.00011849403381347656, 0.0002422332763671875, 0.0006029605865478516, 0.0009636878967285156, 0.0013244152069091797, 0.0016851425170898438, 0.002045869827270508, 0.002406597137451172, 0.002767324447631836, 0.0031280517578125, 0.003488779067993164, 0.003849506378173828, 0.004210233688354492, 0.004570960998535156, 0.00493168830871582, 0.005292415618896484, 0.0056531429290771484, 0.0060138702392578125, 0.0063745975494384766, 0.006735324859619141, 0.007096052169799805, 0.007456779479980469, 0.007817506790161133, 0.008178234100341797, 0.008538961410522461, 0.008899688720703125, 0.009260416030883789, 0.009621143341064453, 0.009981870651245117, 0.010342597961425781, 0.010703325271606445, 0.01106405258178711, 0.011424779891967773, 0.011785507202148438, 0.012146234512329102, 0.012506961822509766, 0.01286768913269043, 0.013228416442871094, 0.013589143753051758, 0.013949871063232422, 0.014310598373413086, 0.01467132568359375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 14.0, 57.0, 248.0, 461.0, 195.0, 31.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003618910850491375, -0.00034320427221246064, -0.00032451743027195334, -0.0003058306174352765, -0.0002871437754947692, -0.0002684569626580924, -0.0002497701207175851, -0.00023108330788090825, -0.00021239648049231619, -0.00019370965310372412, -0.00017502282571513206, -0.00015633599832654, -0.00013764918548986316, -0.00011896235082531348, -0.00010027553071267903, -8.158870332408696e-05, -6.29018759354949e-05, -4.4215048546902835e-05, -2.5528224796289578e-05, -6.841401045676321e-06, 1.1845426342915744e-05, 3.053225373150781e-05, 4.921907384414226e-05, 6.790590123273432e-05, 8.659272862132639e-05, 0.00010527955600991845, 0.00012396638339851052, 0.00014265321078710258, 0.00016134002362377942, 0.0001800268655642867, 0.00019871367840096354, 0.0002174005057895556, 0.00023608730407431722, 0.00025477411691099405, 0.00027346095885150135, 0.0002921477716881782, 0.0003108346136286855, 0.0003295214264653623, 0.00034820823930203915, 0.00036689508124254644, 0.00038558192318305373, 0.00040426873601973057, 0.00042295557796023786, 0.0004416423907969147, 0.000460329232737422, 0.0004790160455740988, 0.0004977028584107757, 0.0005163897294551134, 0.0005350764840841293, 0.0005537632969208062, 0.000572450109757483, 0.0005911369808018208, 0.0006098237936384976, 0.0006285106064751744, 0.0006471974193118513, 0.0006658842321485281, 0.0006845711031928658, 0.0007032579160295427, 0.0007219447288662195, 0.0007406315999105573, 0.0007593184127472341, 0.0007780052255839109, 0.0007966920384205878, 0.0008153788512572646, 0.0008340657223016024]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 8.0, 12.0, 21.0, 16.0, 25.0, 19.0, 28.0, 16.0, 24.0, 37.0, 27.0, 36.0, 27.0, 29.0, 37.0, 49.0, 42.0, 39.0, 49.0, 37.0, 37.0, 35.0, 36.0, 30.0, 33.0, 31.0, 26.0, 20.0, 19.0, 25.0, 19.0, 15.0, 9.0, 17.0, 7.0, 5.0, 7.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002194046974182129, -0.00021274667233228683, -0.00020608864724636078, -0.00019943062216043472, -0.00019277259707450867, -0.0001861145719885826, -0.00017945654690265656, -0.0001727985218167305, -0.00016614049673080444, -0.0001594824716448784, -0.00015282444655895233, -0.00014616642147302628, -0.00013950839638710022, -0.00013285037130117416, -0.0001261923462152481, -0.00011953432112932205, -0.000112876296043396, -0.00010621827095746994, -9.956024587154388e-05, -9.290222078561783e-05, -8.624419569969177e-05, -7.958617061376572e-05, -7.292814552783966e-05, -6.62701204419136e-05, -5.961209535598755e-05, -5.295407027006149e-05, -4.629604518413544e-05, -3.963802009820938e-05, -3.2979995012283325e-05, -2.632196992635727e-05, -1.9663944840431213e-05, -1.3005919754505157e-05, -6.3478946685791016e-06, 3.1013041734695435e-07, 6.96815550327301e-06, 1.3626180589199066e-05, 2.0284205675125122e-05, 2.6942230761051178e-05, 3.3600255846977234e-05, 4.025828093290329e-05, 4.6916306018829346e-05, 5.35743311047554e-05, 6.023235619068146e-05, 6.689038127660751e-05, 7.354840636253357e-05, 8.020643144845963e-05, 8.686445653438568e-05, 9.352248162031174e-05, 0.00010018050670623779, 0.00010683853179216385, 0.0001134965568780899, 0.00012015458196401596, 0.00012681260704994202, 0.00013347063213586807, 0.00014012865722179413, 0.00014678668230772018, 0.00015344470739364624, 0.0001601027324795723, 0.00016676075756549835, 0.0001734187826514244, 0.00018007680773735046, 0.00018673483282327652, 0.00019339285790920258, 0.00020005088299512863, 0.0002067089080810547]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 9.0, 13.0, 7.0, 14.0, 17.0, 22.0, 23.0, 35.0, 23.0, 35.0, 29.0, 33.0, 43.0, 40.0, 42.0, 50.0, 45.0, 59.0, 53.0, 40.0, 45.0, 43.0, 32.0, 40.0, 29.0, 27.0, 23.0, 19.0, 17.0, 14.0, 12.0, 7.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.7109375, -5.55352783203125, -5.3961181640625, -5.23870849609375, -5.081298828125, -4.92388916015625, -4.7664794921875, -4.60906982421875, -4.45166015625, -4.29425048828125, -4.1368408203125, -3.97943115234375, -3.822021484375, -3.66461181640625, -3.5072021484375, -3.34979248046875, -3.1923828125, -3.03497314453125, -2.8775634765625, -2.72015380859375, -2.562744140625, -2.40533447265625, -2.2479248046875, -2.09051513671875, -1.93310546875, -1.77569580078125, -1.6182861328125, -1.46087646484375, -1.303466796875, -1.14605712890625, -0.9886474609375, -0.83123779296875, -0.673828125, -0.51641845703125, -0.3590087890625, -0.20159912109375, -0.044189453125, 0.11322021484375, 0.2706298828125, 0.42803955078125, 0.58544921875, 0.74285888671875, 0.9002685546875, 1.05767822265625, 1.215087890625, 1.37249755859375, 1.5299072265625, 1.68731689453125, 1.8447265625, 2.00213623046875, 2.1595458984375, 2.31695556640625, 2.474365234375, 2.63177490234375, 2.7891845703125, 2.94659423828125, 3.10400390625, 3.26141357421875, 3.4188232421875, 3.57623291015625, 3.733642578125, 3.89105224609375, 4.0484619140625, 4.20587158203125, 4.36328125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 21.0, 23.0, 46.0, 48.0, 78.0, 91.0, 131.0, 225.0, 299.0, 563.0, 958.0, 1930.0, 4603.0, 13680.0, 46226.0, 193152.0, 543248.0, 178341.0, 43035.0, 12883.0, 4531.0, 1970.0, 919.0, 539.0, 304.0, 225.0, 130.0, 81.0, 70.0, 59.0, 31.0, 27.0, 15.0, 14.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.796875, -5.62872314453125, -5.4605712890625, -5.29241943359375, -5.124267578125, -4.95611572265625, -4.7879638671875, -4.61981201171875, -4.45166015625, -4.28350830078125, -4.1153564453125, -3.94720458984375, -3.779052734375, -3.61090087890625, -3.4427490234375, -3.27459716796875, -3.1064453125, -2.93829345703125, -2.7701416015625, -2.60198974609375, -2.433837890625, -2.26568603515625, -2.0975341796875, -1.92938232421875, -1.76123046875, -1.59307861328125, -1.4249267578125, -1.25677490234375, -1.088623046875, -0.92047119140625, -0.7523193359375, -0.58416748046875, -0.416015625, -0.24786376953125, -0.0797119140625, 0.08843994140625, 0.256591796875, 0.42474365234375, 0.5928955078125, 0.76104736328125, 0.92919921875, 1.09735107421875, 1.2655029296875, 1.43365478515625, 1.601806640625, 1.76995849609375, 1.9381103515625, 2.10626220703125, 2.2744140625, 2.44256591796875, 2.6107177734375, 2.77886962890625, 2.947021484375, 3.11517333984375, 3.2833251953125, 3.45147705078125, 3.61962890625, 3.78778076171875, 3.9559326171875, 4.12408447265625, 4.292236328125, 4.46038818359375, 4.6285400390625, 4.79669189453125, 4.96484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 9.0, 8.0, 16.0, 15.0, 17.0, 23.0, 26.0, 30.0, 25.0, 25.0, 30.0, 30.0, 40.0, 54.0, 40.0, 83.0, 437.0, 1607.0, 81.0, 38.0, 53.0, 42.0, 43.0, 42.0, 24.0, 28.0, 27.0, 17.0, 23.0, 21.0, 15.0, 19.0, 11.0, 7.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.53125, -16.0313720703125, -15.531494140625, -15.0316162109375, -14.53173828125, -14.0318603515625, -13.531982421875, -13.0321044921875, -12.5322265625, -12.0323486328125, -11.532470703125, -11.0325927734375, -10.53271484375, -10.0328369140625, -9.532958984375, -9.0330810546875, -8.533203125, -8.0333251953125, -7.533447265625, -7.0335693359375, -6.53369140625, -6.0338134765625, -5.533935546875, -5.0340576171875, -4.5341796875, -4.0343017578125, -3.534423828125, -3.0345458984375, -2.53466796875, -2.0347900390625, -1.534912109375, -1.0350341796875, -0.53515625, -0.0352783203125, 0.464599609375, 0.9644775390625, 1.46435546875, 1.9642333984375, 2.464111328125, 2.9639892578125, 3.4638671875, 3.9637451171875, 4.463623046875, 4.9635009765625, 5.46337890625, 5.9632568359375, 6.463134765625, 6.9630126953125, 7.462890625, 7.9627685546875, 8.462646484375, 8.9625244140625, 9.46240234375, 9.9622802734375, 10.462158203125, 10.9620361328125, 11.4619140625, 11.9617919921875, 12.461669921875, 12.9615478515625, 13.46142578125, 13.9613037109375, 14.461181640625, 14.9610595703125, 15.4609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 9.0, 7.0, 9.0, 15.0, 17.0, 28.0, 22.0, 18.0, 23.0, 38.0, 31.0, 61.0, 77.0, 139.0, 191.0, 545.0, 2388.0, 2961827.0, 178001.0, 1239.0, 395.0, 174.0, 97.0, 75.0, 42.0, 37.0, 30.0, 30.0, 29.0, 21.0, 16.0, 20.0, 10.0, 6.0, 11.0, 6.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.21875, -35.044921875, -33.87109375, -32.697265625, -31.5234375, -30.349609375, -29.17578125, -28.001953125, -26.828125, -25.654296875, -24.48046875, -23.306640625, -22.1328125, -20.958984375, -19.78515625, -18.611328125, -17.4375, -16.263671875, -15.08984375, -13.916015625, -12.7421875, -11.568359375, -10.39453125, -9.220703125, -8.046875, -6.873046875, -5.69921875, -4.525390625, -3.3515625, -2.177734375, -1.00390625, 0.169921875, 1.34375, 2.517578125, 3.69140625, 4.865234375, 6.0390625, 7.212890625, 8.38671875, 9.560546875, 10.734375, 11.908203125, 13.08203125, 14.255859375, 15.4296875, 16.603515625, 17.77734375, 18.951171875, 20.125, 21.298828125, 22.47265625, 23.646484375, 24.8203125, 25.994140625, 27.16796875, 28.341796875, 29.515625, 30.689453125, 31.86328125, 33.037109375, 34.2109375, 35.384765625, 36.55859375, 37.732421875, 38.90625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 8.0, 19.0, 75.0, 173.0, 236.0, 254.0, 154.0, 59.0, 29.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.962770938873291, -5.297201633453369, -4.631632328033447, -3.9660627841949463, -3.3004934787750244, -2.6349241733551025, -1.9693546295166016, -1.3037853240966797, -0.6382160186767578, 0.027353346347808838, 0.6929227113723755, 1.358492136001587, 2.024061441421509, 2.6896307468414307, 3.3552002906799316, 4.0207695960998535, 4.686338901519775, 5.351908206939697, 6.017477512359619, 6.683047294616699, 7.348616600036621, 8.014185905456543, 8.679755210876465, 9.345324516296387, 10.010893821716309, 10.67646312713623, 11.342032432556152, 12.007601737976074, 12.673171043395996, 13.338740348815918, 14.004310607910156, 14.669879913330078, 15.335447311401367, 16.00101661682129, 16.66658592224121, 17.332155227661133, 17.997724533081055, 18.663293838500977, 19.3288631439209, 19.99443244934082, 20.660001754760742, 21.325571060180664, 21.991140365600586, 22.656709671020508, 23.32227897644043, 23.98784828186035, 24.653417587280273, 25.318986892700195, 25.98455810546875, 26.650127410888672, 27.315696716308594, 27.981266021728516, 28.646835327148438, 29.31240463256836, 29.97797393798828, 30.643543243408203, 31.309112548828125, 31.974681854248047, 32.64025115966797, 33.30582046508789, 33.97138977050781, 34.636959075927734, 35.302528381347656, 35.96809768676758, 36.6336669921875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 12.0, 16.0, 10.0, 16.0, 11.0, 22.0, 22.0, 36.0, 37.0, 31.0, 47.0, 29.0, 32.0, 39.0, 44.0, 44.0, 43.0, 44.0, 56.0, 49.0, 50.0, 38.0, 27.0, 36.0, 26.0, 25.0, 22.0, 15.0, 29.0, 17.0, 8.0, 13.0, 6.0, 14.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.35805130004883, -52.647804260253906, -50.937557220458984, -49.22731018066406, -47.517066955566406, -45.806819915771484, -44.09657287597656, -42.38632583618164, -40.67607879638672, -38.9658317565918, -37.255584716796875, -35.54534149169922, -33.8350944519043, -32.124847412109375, -30.414600372314453, -28.70435333251953, -26.994110107421875, -25.283863067626953, -23.573617935180664, -21.863370895385742, -20.153125762939453, -18.44287872314453, -16.73263168334961, -15.022385597229004, -13.312139511108398, -11.601893424987793, -9.891647338867188, -8.181400299072266, -6.47115421295166, -4.760908126831055, -3.050661087036133, -1.3404150009155273, 0.36983489990234375, 2.0800812244415283, 3.790327548980713, 5.500574111938477, 7.210820198059082, 8.921066284179688, 10.63131332397461, 12.341559410095215, 14.05180549621582, 15.762051582336426, 17.47229766845703, 19.182544708251953, 20.892791748046875, 22.603036880493164, 24.313283920288086, 26.023529052734375, 27.733776092529297, 29.44402313232422, 31.154268264770508, 32.86451721191406, 34.57476043701172, 36.28500747680664, 37.99525451660156, 39.705501556396484, 41.415748596191406, 43.12599563598633, 44.83624267578125, 46.546485900878906, 48.25673294067383, 49.96697998046875, 51.67722702026367, 53.387474060058594, 55.09771728515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 3.0, 7.0, 9.0, 11.0, 11.0, 10.0, 18.0, 9.0, 23.0, 22.0, 28.0, 27.0, 26.0, 35.0, 36.0, 44.0, 35.0, 37.0, 46.0, 50.0, 50.0, 57.0, 55.0, 35.0, 50.0, 37.0, 38.0, 28.0, 25.0, 27.0, 21.0, 10.0, 20.0, 11.0, 12.0, 6.0, 9.0, 12.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.73046875, -5.56939697265625, -5.4083251953125, -5.24725341796875, -5.086181640625, -4.92510986328125, -4.7640380859375, -4.60296630859375, -4.44189453125, -4.28082275390625, -4.1197509765625, -3.95867919921875, -3.797607421875, -3.63653564453125, -3.4754638671875, -3.31439208984375, -3.1533203125, -2.99224853515625, -2.8311767578125, -2.67010498046875, -2.509033203125, -2.34796142578125, -2.1868896484375, -2.02581787109375, -1.86474609375, -1.70367431640625, -1.5426025390625, -1.38153076171875, -1.220458984375, -1.05938720703125, -0.8983154296875, -0.73724365234375, -0.576171875, -0.41510009765625, -0.2540283203125, -0.09295654296875, 0.068115234375, 0.22918701171875, 0.3902587890625, 0.55133056640625, 0.71240234375, 0.87347412109375, 1.0345458984375, 1.19561767578125, 1.356689453125, 1.51776123046875, 1.6788330078125, 1.83990478515625, 2.0009765625, 2.16204833984375, 2.3231201171875, 2.48419189453125, 2.645263671875, 2.80633544921875, 2.9674072265625, 3.12847900390625, 3.28955078125, 3.45062255859375, 3.6116943359375, 3.77276611328125, 3.933837890625, 4.09490966796875, 4.2559814453125, 4.41705322265625, 4.578125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 12.0, 10.0, 6.0, 18.0, 14.0, 15.0, 33.0, 35.0, 56.0, 74.0, 119.0, 176.0, 343.0, 772.0, 3004.0, 24010.0, 597422.0, 3239332.0, 310238.0, 14954.0, 2170.0, 671.0, 300.0, 162.0, 97.0, 61.0, 49.0, 32.0, 28.0, 14.0, 17.0, 12.0, 5.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.46875, -19.9215087890625, -19.374267578125, -18.8270263671875, -18.27978515625, -17.7325439453125, -17.185302734375, -16.6380615234375, -16.0908203125, -15.5435791015625, -14.996337890625, -14.4490966796875, -13.90185546875, -13.3546142578125, -12.807373046875, -12.2601318359375, -11.712890625, -11.1656494140625, -10.618408203125, -10.0711669921875, -9.52392578125, -8.9766845703125, -8.429443359375, -7.8822021484375, -7.3349609375, -6.7877197265625, -6.240478515625, -5.6932373046875, -5.14599609375, -4.5987548828125, -4.051513671875, -3.5042724609375, -2.95703125, -2.4097900390625, -1.862548828125, -1.3153076171875, -0.76806640625, -0.2208251953125, 0.326416015625, 0.8736572265625, 1.4208984375, 1.9681396484375, 2.515380859375, 3.0626220703125, 3.60986328125, 4.1571044921875, 4.704345703125, 5.2515869140625, 5.798828125, 6.3460693359375, 6.893310546875, 7.4405517578125, 7.98779296875, 8.5350341796875, 9.082275390625, 9.6295166015625, 10.1767578125, 10.7239990234375, 11.271240234375, 11.8184814453125, 12.36572265625, 12.9129638671875, 13.460205078125, 14.0074462890625, 14.5546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 16.0, 10.0, 29.0, 40.0, 58.0, 79.0, 116.0, 171.0, 280.0, 432.0, 653.0, 719.0, 492.0, 316.0, 200.0, 151.0, 94.0, 64.0, 47.0, 38.0, 17.0, 13.0, 14.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.078125, -28.335693359375, -27.59326171875, -26.850830078125, -26.1083984375, -25.365966796875, -24.62353515625, -23.881103515625, -23.138671875, -22.396240234375, -21.65380859375, -20.911376953125, -20.1689453125, -19.426513671875, -18.68408203125, -17.941650390625, -17.19921875, -16.456787109375, -15.71435546875, -14.971923828125, -14.2294921875, -13.487060546875, -12.74462890625, -12.002197265625, -11.259765625, -10.517333984375, -9.77490234375, -9.032470703125, -8.2900390625, -7.547607421875, -6.80517578125, -6.062744140625, -5.3203125, -4.577880859375, -3.83544921875, -3.093017578125, -2.3505859375, -1.608154296875, -0.86572265625, -0.123291015625, 0.619140625, 1.361572265625, 2.10400390625, 2.846435546875, 3.5888671875, 4.331298828125, 5.07373046875, 5.816162109375, 6.55859375, 7.301025390625, 8.04345703125, 8.785888671875, 9.5283203125, 10.270751953125, 11.01318359375, 11.755615234375, 12.498046875, 13.240478515625, 13.98291015625, 14.725341796875, 15.4677734375, 16.210205078125, 16.95263671875, 17.695068359375, 18.4375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 9.0, 18.0, 29.0, 28.0, 60.0, 76.0, 113.0, 180.0, 260.0, 464.0, 1192.0, 26659.0, 4112762.0, 49792.0, 1364.0, 474.0, 257.0, 162.0, 101.0, 82.0, 48.0, 43.0, 25.0, 22.0, 10.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.0625, -50.8095703125, -48.556640625, -46.3037109375, -44.05078125, -41.7978515625, -39.544921875, -37.2919921875, -35.0390625, -32.7861328125, -30.533203125, -28.2802734375, -26.02734375, -23.7744140625, -21.521484375, -19.2685546875, -17.015625, -14.7626953125, -12.509765625, -10.2568359375, -8.00390625, -5.7509765625, -3.498046875, -1.2451171875, 1.0078125, 3.2607421875, 5.513671875, 7.7666015625, 10.01953125, 12.2724609375, 14.525390625, 16.7783203125, 19.03125, 21.2841796875, 23.537109375, 25.7900390625, 28.04296875, 30.2958984375, 32.548828125, 34.8017578125, 37.0546875, 39.3076171875, 41.560546875, 43.8134765625, 46.06640625, 48.3193359375, 50.572265625, 52.8251953125, 55.078125, 57.3310546875, 59.583984375, 61.8369140625, 64.08984375, 66.3427734375, 68.595703125, 70.8486328125, 73.1015625, 75.3544921875, 77.607421875, 79.8603515625, 82.11328125, 84.3662109375, 86.619140625, 88.8720703125, 91.125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 92.0, 707.0, 211.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-588.1069946289062, -577.901123046875, -567.6953125, -557.4894409179688, -547.2836303710938, -537.0777587890625, -526.8719482421875, -516.6660766601562, -506.46026611328125, -496.2544250488281, -486.048583984375, -475.8427429199219, -465.63690185546875, -455.4310607910156, -445.2252197265625, -435.01934814453125, -424.8135070800781, -414.607666015625, -404.4018249511719, -394.19598388671875, -383.9901428222656, -373.7843017578125, -363.5784606933594, -353.37261962890625, -343.166748046875, -332.9609069824219, -322.75506591796875, -312.5492248535156, -302.3433837890625, -292.1375427246094, -281.93170166015625, -271.725830078125, -261.52001953125, -251.31417846679688, -241.10833740234375, -230.90249633789062, -220.6966552734375, -210.49081420898438, -200.2849578857422, -190.07911682128906, -179.873291015625, -169.66744995117188, -159.46160888671875, -149.25576782226562, -139.0499267578125, -128.84408569335938, -118.63822937011719, -108.43238830566406, -98.2265396118164, -88.02069854736328, -77.81484985351562, -67.6090087890625, -57.403167724609375, -47.19732666015625, -36.99148178100586, -26.78563690185547, -16.579795837402344, -6.373952865600586, 3.831890106201172, 14.03773307800293, 24.243576049804688, 34.44941711425781, 44.6552619934082, 54.861106872558594, 65.06694793701172]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 10.0, 3.0, 11.0, 8.0, 18.0, 12.0, 17.0, 26.0, 25.0, 21.0, 21.0, 30.0, 23.0, 40.0, 31.0, 27.0, 39.0, 46.0, 38.0, 45.0, 23.0, 46.0, 40.0, 34.0, 38.0, 27.0, 29.0, 35.0, 29.0, 24.0, 30.0, 26.0, 24.0, 23.0, 16.0, 8.0, 9.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.29388427734375, -52.568817138671875, -50.84375, -49.118682861328125, -47.39361572265625, -45.668548583984375, -43.9434814453125, -42.218414306640625, -40.49334716796875, -38.768280029296875, -37.043212890625, -35.318145751953125, -33.59307861328125, -31.868011474609375, -30.1429443359375, -28.417877197265625, -26.692811965942383, -24.967744827270508, -23.242677688598633, -21.517610549926758, -19.792543411254883, -18.06747817993164, -16.342411041259766, -14.617342948913574, -12.8922758102417, -11.167208671569824, -9.44214153289795, -7.717074871063232, -5.992007732391357, -4.266941070556641, -2.5418739318847656, -0.8168067932128906, 0.9082603454589844, 2.6333274841308594, 4.358394622802734, 6.083461284637451, 7.808528423309326, 9.533595085144043, 11.258662223815918, 12.983729362487793, 14.708796501159668, 16.433862686157227, 18.1589298248291, 19.883996963500977, 21.60906410217285, 23.334131240844727, 25.0591983795166, 26.784265518188477, 28.50933265686035, 30.234399795532227, 31.9594669342041, 33.684532165527344, 35.40959930419922, 37.134666442871094, 38.85973358154297, 40.584800720214844, 42.30986785888672, 44.034934997558594, 45.76000213623047, 47.485069274902344, 49.21013641357422, 50.935203552246094, 52.66027069091797, 54.385337829589844, 56.11040496826172]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 12.0, 8.0, 8.0, 14.0, 14.0, 10.0, 18.0, 21.0, 32.0, 27.0, 32.0, 32.0, 24.0, 36.0, 51.0, 29.0, 48.0, 37.0, 51.0, 43.0, 51.0, 49.0, 44.0, 49.0, 36.0, 34.0, 21.0, 31.0, 31.0, 20.0, 15.0, 11.0, 9.0, 8.0, 9.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2265625, -5.06439208984375, -4.9022216796875, -4.74005126953125, -4.577880859375, -4.41571044921875, -4.2535400390625, -4.09136962890625, -3.92919921875, -3.76702880859375, -3.6048583984375, -3.44268798828125, -3.280517578125, -3.11834716796875, -2.9561767578125, -2.79400634765625, -2.6318359375, -2.46966552734375, -2.3074951171875, -2.14532470703125, -1.983154296875, -1.82098388671875, -1.6588134765625, -1.49664306640625, -1.33447265625, -1.17230224609375, -1.0101318359375, -0.84796142578125, -0.685791015625, -0.52362060546875, -0.3614501953125, -0.19927978515625, -0.037109375, 0.12506103515625, 0.2872314453125, 0.44940185546875, 0.611572265625, 0.77374267578125, 0.9359130859375, 1.09808349609375, 1.26025390625, 1.42242431640625, 1.5845947265625, 1.74676513671875, 1.908935546875, 2.07110595703125, 2.2332763671875, 2.39544677734375, 2.5576171875, 2.71978759765625, 2.8819580078125, 3.04412841796875, 3.206298828125, 3.36846923828125, 3.5306396484375, 3.69281005859375, 3.85498046875, 4.01715087890625, 4.1793212890625, 4.34149169921875, 4.503662109375, 4.66583251953125, 4.8280029296875, 4.99017333984375, 5.15234375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 6.0, 10.0, 9.0, 18.0, 23.0, 32.0, 37.0, 52.0, 71.0, 101.0, 157.0, 256.0, 374.0, 472.0, 721.0, 1083.0, 1570.0, 2366.0, 3531.0, 5383.0, 8465.0, 13279.0, 21158.0, 33813.0, 57093.0, 98510.0, 172252.0, 244687.0, 156638.0, 88838.0, 51828.0, 31164.0, 19382.0, 12223.0, 7711.0, 4995.0, 3338.0, 2260.0, 1439.0, 1019.0, 713.0, 431.0, 324.0, 216.0, 150.0, 118.0, 73.0, 57.0, 40.0, 23.0, 15.0, 15.0, 10.0, 8.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.76806640625, -0.7436141967773438, -0.7191619873046875, -0.6947097778320312, -0.670257568359375, -0.6458053588867188, -0.6213531494140625, -0.5969009399414062, -0.57244873046875, -0.5479965209960938, -0.5235443115234375, -0.49909210205078125, -0.474639892578125, -0.45018768310546875, -0.4257354736328125, -0.40128326416015625, -0.3768310546875, -0.35237884521484375, -0.3279266357421875, -0.30347442626953125, -0.279022216796875, -0.25457000732421875, -0.2301177978515625, -0.20566558837890625, -0.18121337890625, -0.15676116943359375, -0.1323089599609375, -0.10785675048828125, -0.083404541015625, -0.05895233154296875, -0.0345001220703125, -0.01004791259765625, 0.014404296875, 0.03885650634765625, 0.0633087158203125, 0.08776092529296875, 0.112213134765625, 0.13666534423828125, 0.1611175537109375, 0.18556976318359375, 0.21002197265625, 0.23447418212890625, 0.2589263916015625, 0.28337860107421875, 0.307830810546875, 0.33228302001953125, 0.3567352294921875, 0.38118743896484375, 0.4056396484375, 0.43009185791015625, 0.4545440673828125, 0.47899627685546875, 0.503448486328125, 0.5279006958007812, 0.5523529052734375, 0.5768051147460938, 0.60125732421875, 0.6257095336914062, 0.6501617431640625, 0.6746139526367188, 0.699066162109375, 0.7235183715820312, 0.7479705810546875, 0.7724227905273438, 0.796875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 4.0, 5.0, 7.0, 11.0, 8.0, 12.0, 9.0, 16.0, 14.0, 23.0, 16.0, 21.0, 19.0, 28.0, 39.0, 21.0, 43.0, 45.0, 35.0, 42.0, 45.0, 1061.0, 42.0, 40.0, 37.0, 43.0, 37.0, 26.0, 32.0, 37.0, 23.0, 25.0, 22.0, 18.0, 15.0, 15.0, 13.0, 12.0, 13.0, 8.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.84765625, -2.75567626953125, -2.6636962890625, -2.57171630859375, -2.479736328125, -2.38775634765625, -2.2957763671875, -2.20379638671875, -2.11181640625, -2.01983642578125, -1.9278564453125, -1.83587646484375, -1.743896484375, -1.65191650390625, -1.5599365234375, -1.46795654296875, -1.3759765625, -1.28399658203125, -1.1920166015625, -1.10003662109375, -1.008056640625, -0.91607666015625, -0.8240966796875, -0.73211669921875, -0.64013671875, -0.54815673828125, -0.4561767578125, -0.36419677734375, -0.272216796875, -0.18023681640625, -0.0882568359375, 0.00372314453125, 0.095703125, 0.18768310546875, 0.2796630859375, 0.37164306640625, 0.463623046875, 0.55560302734375, 0.6475830078125, 0.73956298828125, 0.83154296875, 0.92352294921875, 1.0155029296875, 1.10748291015625, 1.199462890625, 1.29144287109375, 1.3834228515625, 1.47540283203125, 1.5673828125, 1.65936279296875, 1.7513427734375, 1.84332275390625, 1.935302734375, 2.02728271484375, 2.1192626953125, 2.21124267578125, 2.30322265625, 2.39520263671875, 2.4871826171875, 2.57916259765625, 2.671142578125, 2.76312255859375, 2.8551025390625, 2.94708251953125, 3.0390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 14.0, 15.0, 27.0, 47.0, 51.0, 112.0, 159.0, 238.0, 316.0, 522.0, 685.0, 997.0, 1476.0, 2131.0, 3245.0, 4675.0, 6797.0, 10387.0, 15530.0, 24333.0, 38678.0, 63029.0, 107734.0, 196292.0, 1284523.0, 131346.0, 75151.0, 45761.0, 28333.0, 18164.0, 11986.0, 7670.0, 5207.0, 3625.0, 2516.0, 1689.0, 1136.0, 815.0, 550.0, 364.0, 267.0, 161.0, 123.0, 84.0, 53.0, 38.0, 25.0, 18.0, 11.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6675491333007812, -0.6461334228515625, -0.6247177124023438, -0.603302001953125, -0.5818862915039062, -0.5604705810546875, -0.5390548706054688, -0.51763916015625, -0.49622344970703125, -0.4748077392578125, -0.45339202880859375, -0.431976318359375, -0.41056060791015625, -0.3891448974609375, -0.36772918701171875, -0.3463134765625, -0.32489776611328125, -0.3034820556640625, -0.28206634521484375, -0.260650634765625, -0.23923492431640625, -0.2178192138671875, -0.19640350341796875, -0.17498779296875, -0.15357208251953125, -0.1321563720703125, -0.11074066162109375, -0.089324951171875, -0.06790924072265625, -0.0464935302734375, -0.02507781982421875, -0.003662109375, 0.01775360107421875, 0.0391693115234375, 0.06058502197265625, 0.082000732421875, 0.10341644287109375, 0.1248321533203125, 0.14624786376953125, 0.16766357421875, 0.18907928466796875, 0.2104949951171875, 0.23191070556640625, 0.253326416015625, 0.27474212646484375, 0.2961578369140625, 0.31757354736328125, 0.3389892578125, 0.36040496826171875, 0.3818206787109375, 0.40323638916015625, 0.424652099609375, 0.44606781005859375, 0.4674835205078125, 0.48889923095703125, 0.51031494140625, 0.5317306518554688, 0.5531463623046875, 0.5745620727539062, 0.595977783203125, 0.6173934936523438, 0.6388092041015625, 0.6602249145507812, 0.681640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 14.0, 19.0, 16.0, 15.0, 20.0, 19.0, 31.0, 36.0, 54.0, 44.0, 66.0, 67.0, 69.0, 74.0, 60.0, 64.0, 60.0, 45.0, 40.0, 39.0, 21.0, 22.0, 20.0, 15.0, 8.0, 9.0, 10.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005450248718261719, -0.0005289986729621887, -0.0005129724740982056, -0.0004969462752342224, -0.00048092007637023926, -0.0004648938775062561, -0.00044886767864227295, -0.0004328414797782898, -0.00041681528091430664, -0.0004007890820503235, -0.00038476288318634033, -0.0003687366843223572, -0.000352710485458374, -0.00033668428659439087, -0.0003206580877304077, -0.00030463188886642456, -0.0002886056900024414, -0.00027257949113845825, -0.0002565532922744751, -0.00024052709341049194, -0.0002245008945465088, -0.00020847469568252563, -0.00019244849681854248, -0.00017642229795455933, -0.00016039609909057617, -0.00014436990022659302, -0.00012834370136260986, -0.00011231750249862671, -9.629130363464355e-05, -8.02651047706604e-05, -6.423890590667725e-05, -4.821270704269409e-05, -3.218650817871094e-05, -1.6160309314727783e-05, -1.341104507446289e-07, 1.5892088413238525e-05, 3.191828727722168e-05, 4.7944486141204834e-05, 6.397068500518799e-05, 7.999688386917114e-05, 9.60230827331543e-05, 0.00011204928159713745, 0.0001280754804611206, 0.00014410167932510376, 0.00016012787818908691, 0.00017615407705307007, 0.00019218027591705322, 0.00020820647478103638, 0.00022423267364501953, 0.00024025887250900269, 0.00025628507137298584, 0.000272311270236969, 0.00028833746910095215, 0.0003043636679649353, 0.00032038986682891846, 0.0003364160656929016, 0.00035244226455688477, 0.0003684684634208679, 0.0003844946622848511, 0.00040052086114883423, 0.0004165470600128174, 0.00043257325887680054, 0.0004485994577407837, 0.00046462565660476685, 0.00048065185546875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 4.0, 6.0, 7.0, 8.0, 13.0, 7.0, 17.0, 17.0, 21.0, 27.0, 30.0, 65.0, 88.0, 146.0, 205.0, 363.0, 1037.0, 1037134.0, 8085.0, 515.0, 269.0, 138.0, 94.0, 69.0, 45.0, 31.0, 20.0, 21.0, 11.0, 18.0, 9.0, 12.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0130615234375, -0.012662410736083984, -0.012263298034667969, -0.011864185333251953, -0.011465072631835938, -0.011065959930419922, -0.010666847229003906, -0.01026773452758789, -0.009868621826171875, -0.00946950912475586, -0.009070396423339844, -0.008671283721923828, -0.008272171020507812, -0.007873058319091797, -0.007473945617675781, -0.007074832916259766, -0.00667572021484375, -0.006276607513427734, -0.005877494812011719, -0.005478382110595703, -0.0050792694091796875, -0.004680156707763672, -0.004281044006347656, -0.0038819313049316406, -0.003482818603515625, -0.0030837059020996094, -0.0026845932006835938, -0.002285480499267578, -0.0018863677978515625, -0.0014872550964355469, -0.0010881423950195312, -0.0006890296936035156, -0.0002899169921875, 0.00010919570922851562, 0.0005083084106445312, 0.0009074211120605469, 0.0013065338134765625, 0.0017056465148925781, 0.0021047592163085938, 0.0025038719177246094, 0.002902984619140625, 0.0033020973205566406, 0.0037012100219726562, 0.004100322723388672, 0.0044994354248046875, 0.004898548126220703, 0.005297660827636719, 0.005696773529052734, 0.00609588623046875, 0.006494998931884766, 0.006894111633300781, 0.007293224334716797, 0.0076923370361328125, 0.008091449737548828, 0.008490562438964844, 0.00888967514038086, 0.009288787841796875, 0.00968790054321289, 0.010087013244628906, 0.010486125946044922, 0.010885238647460938, 0.011284351348876953, 0.011683464050292969, 0.012082576751708984, 0.012481689453125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 116.0, 707.0, 182.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023232121020555496, -0.002281415509060025, -0.0022396191488951445, -0.00219782255589962, -0.0021560261957347393, -0.002114229602739215, -0.0020724330097436905, -0.0020306366495788097, -0.0019888400565832853, -0.0019470435800030828, -0.0019052471034228802, -0.0018634505104273558, -0.0018216540338471532, -0.0017798575572669506, -0.0017380609642714262, -0.0016962644876912236, -0.001654468011111021, -0.0016126715345308185, -0.0015708750579506159, -0.0015290784649550915, -0.001487281988374889, -0.0014454855117946863, -0.001403688918799162, -0.0013618924422189593, -0.0013200959656387568, -0.0012782994890585542, -0.0012365030124783516, -0.0011947064194828272, -0.0011529099429026246, -0.001111113466322422, -0.0010693168733268976, -0.001027520396746695, -0.0009857239201664925, -0.0009439274435862899, -0.0009021309087984264, -0.0008603343740105629, -0.0008185378974303603, -0.0007767414208501577, -0.0007349448860622942, -0.0006931483512744308, -0.0006513518746942282, -0.0006095553981140256, -0.0005677588633261621, -0.0005259623285382986, -0.00048416585195809603, -0.000442369346274063, -0.00040057284059002995, -0.0003587763349059969, -0.0003169798292219639, -0.00027518332353793085, -0.0002333868178538978, -0.00019159031216986477, -0.00014979380648583174, -0.0001079973008017987, -6.620079511776567e-05, -2.440428943373263e-05, 1.7392216250300407e-05, 5.9188721934333444e-05, 0.00010098522761836648, 0.00014278173330239952, 0.00018457823898643255, 0.0002263747446704656, 0.0002681712503544986, 0.00030996775603853166, 0.0003517642617225647]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 8.0, 3.0, 6.0, 13.0, 12.0, 19.0, 19.0, 23.0, 19.0, 25.0, 34.0, 32.0, 33.0, 34.0, 31.0, 47.0, 50.0, 40.0, 36.0, 47.0, 47.0, 46.0, 28.0, 35.0, 34.0, 29.0, 32.0, 40.0, 23.0, 18.0, 16.0, 23.0, 17.0, 14.0, 11.0, 16.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00025641918182373047, -0.00024845823645591736, -0.00024049729108810425, -0.00023253634572029114, -0.00022457540035247803, -0.00021661445498466492, -0.0002086535096168518, -0.0002006925642490387, -0.00019273161888122559, -0.00018477067351341248, -0.00017680972814559937, -0.00016884878277778625, -0.00016088783740997314, -0.00015292689204216003, -0.00014496594667434692, -0.0001370050013065338, -0.0001290440559387207, -0.00012108311057090759, -0.00011312216520309448, -0.00010516121983528137, -9.720027446746826e-05, -8.923932909965515e-05, -8.127838373184204e-05, -7.331743836402893e-05, -6.535649299621582e-05, -5.739554762840271e-05, -4.94346022605896e-05, -4.147365689277649e-05, -3.351271152496338e-05, -2.555176615715027e-05, -1.7590820789337158e-05, -9.629875421524048e-06, -1.6689300537109375e-06, 6.292015314102173e-06, 1.4252960681915283e-05, 2.2213906049728394e-05, 3.0174851417541504e-05, 3.8135796785354614e-05, 4.6096742153167725e-05, 5.4057687520980835e-05, 6.201863288879395e-05, 6.997957825660706e-05, 7.794052362442017e-05, 8.590146899223328e-05, 9.386241436004639e-05, 0.0001018233597278595, 0.00010978430509567261, 0.00011774525046348572, 0.00012570619583129883, 0.00013366714119911194, 0.00014162808656692505, 0.00014958903193473816, 0.00015754997730255127, 0.00016551092267036438, 0.0001734718680381775, 0.0001814328134059906, 0.0001893937587738037, 0.00019735470414161682, 0.00020531564950942993, 0.00021327659487724304, 0.00022123754024505615, 0.00022919848561286926, 0.00023715943098068237, 0.0002451203763484955, 0.0002530813217163086]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 12.0, 8.0, 8.0, 14.0, 14.0, 10.0, 18.0, 21.0, 32.0, 27.0, 32.0, 32.0, 24.0, 36.0, 51.0, 29.0, 48.0, 37.0, 51.0, 43.0, 51.0, 49.0, 44.0, 49.0, 36.0, 34.0, 21.0, 31.0, 31.0, 20.0, 15.0, 11.0, 9.0, 8.0, 9.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2265625, -5.06439208984375, -4.9022216796875, -4.74005126953125, -4.577880859375, -4.41571044921875, -4.2535400390625, -4.09136962890625, -3.92919921875, -3.76702880859375, -3.6048583984375, -3.44268798828125, -3.280517578125, -3.11834716796875, -2.9561767578125, -2.79400634765625, -2.6318359375, -2.46966552734375, -2.3074951171875, -2.14532470703125, -1.983154296875, -1.82098388671875, -1.6588134765625, -1.49664306640625, -1.33447265625, -1.17230224609375, -1.0101318359375, -0.84796142578125, -0.685791015625, -0.52362060546875, -0.3614501953125, -0.19927978515625, -0.037109375, 0.12506103515625, 0.2872314453125, 0.44940185546875, 0.611572265625, 0.77374267578125, 0.9359130859375, 1.09808349609375, 1.26025390625, 1.42242431640625, 1.5845947265625, 1.74676513671875, 1.908935546875, 2.07110595703125, 2.2332763671875, 2.39544677734375, 2.5576171875, 2.71978759765625, 2.8819580078125, 3.04412841796875, 3.206298828125, 3.36846923828125, 3.5306396484375, 3.69281005859375, 3.85498046875, 4.01715087890625, 4.1793212890625, 4.34149169921875, 4.503662109375, 4.66583251953125, 4.8280029296875, 4.99017333984375, 5.15234375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 11.0, 14.0, 11.0, 10.0, 17.0, 28.0, 36.0, 59.0, 78.0, 91.0, 143.0, 215.0, 318.0, 503.0, 735.0, 1192.0, 2123.0, 3845.0, 7421.0, 15796.0, 37459.0, 99707.0, 328021.0, 364664.0, 110647.0, 40395.0, 17154.0, 8054.0, 4065.0, 2126.0, 1272.0, 815.0, 472.0, 328.0, 219.0, 161.0, 112.0, 64.0, 40.0, 37.0, 26.0, 21.0, 16.0, 11.0, 9.0, 5.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.48828125, -3.379425048828125, -3.27056884765625, -3.161712646484375, -3.0528564453125, -2.944000244140625, -2.83514404296875, -2.726287841796875, -2.617431640625, -2.508575439453125, -2.39971923828125, -2.290863037109375, -2.1820068359375, -2.073150634765625, -1.96429443359375, -1.855438232421875, -1.74658203125, -1.637725830078125, -1.52886962890625, -1.420013427734375, -1.3111572265625, -1.202301025390625, -1.09344482421875, -0.984588623046875, -0.875732421875, -0.766876220703125, -0.65802001953125, -0.549163818359375, -0.4403076171875, -0.331451416015625, -0.22259521484375, -0.113739013671875, -0.0048828125, 0.103973388671875, 0.21282958984375, 0.321685791015625, 0.4305419921875, 0.539398193359375, 0.64825439453125, 0.757110595703125, 0.865966796875, 0.974822998046875, 1.08367919921875, 1.192535400390625, 1.3013916015625, 1.410247802734375, 1.51910400390625, 1.627960205078125, 1.73681640625, 1.845672607421875, 1.95452880859375, 2.063385009765625, 2.1722412109375, 2.281097412109375, 2.38995361328125, 2.498809814453125, 2.607666015625, 2.716522216796875, 2.82537841796875, 2.934234619140625, 3.0430908203125, 3.151947021484375, 3.26080322265625, 3.369659423828125, 3.478515625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 4.0, 12.0, 11.0, 10.0, 17.0, 19.0, 16.0, 31.0, 36.0, 32.0, 32.0, 39.0, 42.0, 46.0, 57.0, 61.0, 223.0, 1786.0, 103.0, 57.0, 64.0, 44.0, 41.0, 47.0, 35.0, 30.0, 16.0, 28.0, 15.0, 16.0, 16.0, 9.0, 13.0, 9.0, 3.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -16.998291015625, -16.41845703125, -15.838623046875, -15.2587890625, -14.678955078125, -14.09912109375, -13.519287109375, -12.939453125, -12.359619140625, -11.77978515625, -11.199951171875, -10.6201171875, -10.040283203125, -9.46044921875, -8.880615234375, -8.30078125, -7.720947265625, -7.14111328125, -6.561279296875, -5.9814453125, -5.401611328125, -4.82177734375, -4.241943359375, -3.662109375, -3.082275390625, -2.50244140625, -1.922607421875, -1.3427734375, -0.762939453125, -0.18310546875, 0.396728515625, 0.9765625, 1.556396484375, 2.13623046875, 2.716064453125, 3.2958984375, 3.875732421875, 4.45556640625, 5.035400390625, 5.615234375, 6.195068359375, 6.77490234375, 7.354736328125, 7.9345703125, 8.514404296875, 9.09423828125, 9.674072265625, 10.25390625, 10.833740234375, 11.41357421875, 11.993408203125, 12.5732421875, 13.153076171875, 13.73291015625, 14.312744140625, 14.892578125, 15.472412109375, 16.05224609375, 16.632080078125, 17.2119140625, 17.791748046875, 18.37158203125, 18.951416015625, 19.53125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 10.0, 5.0, 15.0, 11.0, 11.0, 21.0, 21.0, 32.0, 30.0, 31.0, 64.0, 77.0, 109.0, 202.0, 386.0, 1099.0, 12272.0, 3060969.0, 67103.0, 1903.0, 560.0, 223.0, 145.0, 97.0, 61.0, 57.0, 39.0, 28.0, 24.0, 21.0, 18.0, 11.0, 10.0, 9.0, 5.0, 9.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.4375, -32.444580078125, -31.45166015625, -30.458740234375, -29.4658203125, -28.472900390625, -27.47998046875, -26.487060546875, -25.494140625, -24.501220703125, -23.50830078125, -22.515380859375, -21.5224609375, -20.529541015625, -19.53662109375, -18.543701171875, -17.55078125, -16.557861328125, -15.56494140625, -14.572021484375, -13.5791015625, -12.586181640625, -11.59326171875, -10.600341796875, -9.607421875, -8.614501953125, -7.62158203125, -6.628662109375, -5.6357421875, -4.642822265625, -3.64990234375, -2.656982421875, -1.6640625, -0.671142578125, 0.32177734375, 1.314697265625, 2.3076171875, 3.300537109375, 4.29345703125, 5.286376953125, 6.279296875, 7.272216796875, 8.26513671875, 9.258056640625, 10.2509765625, 11.243896484375, 12.23681640625, 13.229736328125, 14.22265625, 15.215576171875, 16.20849609375, 17.201416015625, 18.1943359375, 19.187255859375, 20.18017578125, 21.173095703125, 22.166015625, 23.158935546875, 24.15185546875, 25.144775390625, 26.1376953125, 27.130615234375, 28.12353515625, 29.116455078125, 30.109375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 14.0, 45.0, 127.0, 252.0, 296.0, 175.0, 63.0, 25.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61174201965332, -8.57434368133545, -7.536944389343262, -6.499546051025391, -5.462147235870361, -4.424748420715332, -3.387350082397461, -2.3499512672424316, -1.3125524520874023, -0.2751537561416626, 0.7622449398040771, 1.7996435165405273, 2.8370423316955566, 3.874441146850586, 4.911839485168457, 5.949238300323486, 6.986637115478516, 8.024035453796387, 9.061434745788574, 10.098833084106445, 11.136232376098633, 12.173630714416504, 13.211029052734375, 14.248428344726562, 15.285826683044434, 16.323225021362305, 17.360624313354492, 18.398021697998047, 19.435420989990234, 20.472820281982422, 21.51021957397461, 22.547616958618164, 23.58501434326172, 24.622413635253906, 25.65981101989746, 26.69721031188965, 27.734609603881836, 28.77200698852539, 29.809406280517578, 30.846805572509766, 31.884204864501953, 32.92160415649414, 33.95900344848633, 34.99639892578125, 36.03379821777344, 37.071197509765625, 38.10859680175781, 39.14599609375, 40.18339538574219, 41.220794677734375, 42.25819396972656, 43.29559326171875, 44.33298873901367, 45.37038803100586, 46.40778732299805, 47.445186614990234, 48.482582092285156, 49.519981384277344, 50.55738067626953, 51.59477996826172, 52.63217544555664, 53.66957473754883, 54.706974029541016, 55.7443733215332, 56.78177261352539]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 8.0, 5.0, 7.0, 6.0, 7.0, 3.0, 11.0, 8.0, 14.0, 14.0, 16.0, 25.0, 33.0, 28.0, 42.0, 40.0, 46.0, 44.0, 57.0, 44.0, 52.0, 38.0, 55.0, 36.0, 47.0, 33.0, 28.0, 36.0, 28.0, 35.0, 20.0, 24.0, 17.0, 17.0, 16.0, 15.0, 15.0, 9.0, 11.0, 6.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.94017028808594, -54.101715087890625, -52.26325988769531, -50.4248046875, -48.58634948730469, -46.747894287109375, -44.90943908691406, -43.07098388671875, -41.23252868652344, -39.394073486328125, -37.55561828613281, -35.7171630859375, -33.87870788574219, -32.040252685546875, -30.201799392700195, -28.363344192504883, -26.524890899658203, -24.68643569946289, -22.847980499267578, -21.009525299072266, -19.171070098876953, -17.33261489868164, -15.494161605834961, -13.655706405639648, -11.817251205444336, -9.978796005249023, -8.140340805053711, -6.301886558532715, -4.463431358337402, -2.62497615814209, -0.7865219116210938, 1.0519332885742188, 2.8903884887695312, 4.728843688964844, 6.567298412322998, 8.405753135681152, 10.244208335876465, 12.082663536071777, 13.921117782592773, 15.759572982788086, 17.5980281829834, 19.43648338317871, 21.274938583374023, 23.113391876220703, 24.951847076416016, 26.790302276611328, 28.62875747680664, 30.467212677001953, 32.305667877197266, 34.14412307739258, 35.98257827758789, 37.8210334777832, 39.659488677978516, 41.49794387817383, 43.336395263671875, 45.17485046386719, 47.0133056640625, 48.85176086425781, 50.690216064453125, 52.52867126464844, 54.36712646484375, 56.20558166503906, 58.044036865234375, 59.88249206542969, 61.720947265625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 8.0, 4.0, 11.0, 5.0, 10.0, 14.0, 12.0, 13.0, 12.0, 30.0, 22.0, 29.0, 29.0, 28.0, 32.0, 36.0, 43.0, 45.0, 30.0, 47.0, 45.0, 46.0, 49.0, 55.0, 45.0, 44.0, 35.0, 32.0, 27.0, 30.0, 26.0, 19.0, 28.0, 6.0, 10.0, 10.0, 6.0, 11.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.22265625, -5.05645751953125, -4.8902587890625, -4.72406005859375, -4.557861328125, -4.39166259765625, -4.2254638671875, -4.05926513671875, -3.89306640625, -3.72686767578125, -3.5606689453125, -3.39447021484375, -3.228271484375, -3.06207275390625, -2.8958740234375, -2.72967529296875, -2.5634765625, -2.39727783203125, -2.2310791015625, -2.06488037109375, -1.898681640625, -1.73248291015625, -1.5662841796875, -1.40008544921875, -1.23388671875, -1.06768798828125, -0.9014892578125, -0.73529052734375, -0.569091796875, -0.40289306640625, -0.2366943359375, -0.07049560546875, 0.095703125, 0.26190185546875, 0.4281005859375, 0.59429931640625, 0.760498046875, 0.92669677734375, 1.0928955078125, 1.25909423828125, 1.42529296875, 1.59149169921875, 1.7576904296875, 1.92388916015625, 2.090087890625, 2.25628662109375, 2.4224853515625, 2.58868408203125, 2.7548828125, 2.92108154296875, 3.0872802734375, 3.25347900390625, 3.419677734375, 3.58587646484375, 3.7520751953125, 3.91827392578125, 4.08447265625, 4.25067138671875, 4.4168701171875, 4.58306884765625, 4.749267578125, 4.91546630859375, 5.0816650390625, 5.24786376953125, 5.4140625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 10.0, 11.0, 9.0, 14.0, 14.0, 20.0, 19.0, 22.0, 18.0, 30.0, 24.0, 23.0, 31.0, 28.0, 58.0, 116.0, 824.0, 17305.0, 3149680.0, 1019371.0, 5782.0, 439.0, 90.0, 49.0, 39.0, 29.0, 28.0, 30.0, 19.0, 27.0, 23.0, 18.0, 13.0, 8.0, 15.0, 12.0, 11.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.953125, -28.949951171875, -27.94677734375, -26.943603515625, -25.9404296875, -24.937255859375, -23.93408203125, -22.930908203125, -21.927734375, -20.924560546875, -19.92138671875, -18.918212890625, -17.9150390625, -16.911865234375, -15.90869140625, -14.905517578125, -13.90234375, -12.899169921875, -11.89599609375, -10.892822265625, -9.8896484375, -8.886474609375, -7.88330078125, -6.880126953125, -5.876953125, -4.873779296875, -3.87060546875, -2.867431640625, -1.8642578125, -0.861083984375, 0.14208984375, 1.145263671875, 2.1484375, 3.151611328125, 4.15478515625, 5.157958984375, 6.1611328125, 7.164306640625, 8.16748046875, 9.170654296875, 10.173828125, 11.177001953125, 12.18017578125, 13.183349609375, 14.1865234375, 15.189697265625, 16.19287109375, 17.196044921875, 18.19921875, 19.202392578125, 20.20556640625, 21.208740234375, 22.2119140625, 23.215087890625, 24.21826171875, 25.221435546875, 26.224609375, 27.227783203125, 28.23095703125, 29.234130859375, 30.2373046875, 31.240478515625, 32.24365234375, 33.246826171875, 34.25]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 8.0, 17.0, 16.0, 37.0, 41.0, 79.0, 83.0, 151.0, 234.0, 338.0, 570.0, 741.0, 611.0, 402.0, 249.0, 159.0, 114.0, 79.0, 46.0, 28.0, 24.0, 13.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.546875, -26.8680419921875, -26.189208984375, -25.5103759765625, -24.83154296875, -24.1527099609375, -23.473876953125, -22.7950439453125, -22.1162109375, -21.4373779296875, -20.758544921875, -20.0797119140625, -19.40087890625, -18.7220458984375, -18.043212890625, -17.3643798828125, -16.685546875, -16.0067138671875, -15.327880859375, -14.6490478515625, -13.97021484375, -13.2913818359375, -12.612548828125, -11.9337158203125, -11.2548828125, -10.5760498046875, -9.897216796875, -9.2183837890625, -8.53955078125, -7.8607177734375, -7.181884765625, -6.5030517578125, -5.82421875, -5.1453857421875, -4.466552734375, -3.7877197265625, -3.10888671875, -2.4300537109375, -1.751220703125, -1.0723876953125, -0.3935546875, 0.2852783203125, 0.964111328125, 1.6429443359375, 2.32177734375, 3.0006103515625, 3.679443359375, 4.3582763671875, 5.037109375, 5.7159423828125, 6.394775390625, 7.0736083984375, 7.75244140625, 8.4312744140625, 9.110107421875, 9.7889404296875, 10.4677734375, 11.1466064453125, 11.825439453125, 12.5042724609375, 13.18310546875, 13.8619384765625, 14.540771484375, 15.2196044921875, 15.8984375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 13.0, 19.0, 33.0, 43.0, 77.0, 123.0, 213.0, 334.0, 795.0, 11502.0, 4165605.0, 13949.0, 714.0, 350.0, 193.0, 121.0, 69.0, 49.0, 27.0, 9.0, 12.0, 5.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.1875, -68.9814453125, -65.775390625, -62.5693359375, -59.36328125, -56.1572265625, -52.951171875, -49.7451171875, -46.5390625, -43.3330078125, -40.126953125, -36.9208984375, -33.71484375, -30.5087890625, -27.302734375, -24.0966796875, -20.890625, -17.6845703125, -14.478515625, -11.2724609375, -8.06640625, -4.8603515625, -1.654296875, 1.5517578125, 4.7578125, 7.9638671875, 11.169921875, 14.3759765625, 17.58203125, 20.7880859375, 23.994140625, 27.2001953125, 30.40625, 33.6123046875, 36.818359375, 40.0244140625, 43.23046875, 46.4365234375, 49.642578125, 52.8486328125, 56.0546875, 59.2607421875, 62.466796875, 65.6728515625, 68.87890625, 72.0849609375, 75.291015625, 78.4970703125, 81.703125, 84.9091796875, 88.115234375, 91.3212890625, 94.52734375, 97.7333984375, 100.939453125, 104.1455078125, 107.3515625, 110.5576171875, 113.763671875, 116.9697265625, 120.17578125, 123.3818359375, 126.587890625, 129.7939453125, 133.0]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 62.0, 208.0, 377.0, 253.0, 84.0, 14.0, 6.0, 0.0, 2.0, 2.0], "bins": [-271.8650207519531, -267.0650634765625, -262.26507568359375, -257.4651184082031, -252.6651611328125, -247.86520385742188, -243.0652313232422, -238.2652587890625, -233.46530151367188, -228.66534423828125, -223.86537170410156, -219.06539916992188, -214.26544189453125, -209.46548461914062, -204.66551208496094, -199.86553955078125, -195.06558227539062, -190.265625, -185.4656524658203, -180.66567993164062, -175.86572265625, -171.06576538085938, -166.2657928466797, -161.4658203125, -156.66586303710938, -151.86590576171875, -147.06593322753906, -142.26596069335938, -137.46600341796875, -132.66604614257812, -127.86607360839844, -123.06610870361328, -118.26615905761719, -113.46619415283203, -108.66622924804688, -103.86626434326172, -99.06629943847656, -94.2663345336914, -89.46636962890625, -84.6664047241211, -79.86643981933594, -75.06647491455078, -70.26651000976562, -65.46654510498047, -60.66658020019531, -55.866615295410156, -51.066650390625, -46.266685485839844, -41.46672058105469, -36.66675567626953, -31.866790771484375, -27.06682586669922, -22.266860961914062, -17.466896057128906, -12.66693115234375, -7.866966247558594, -3.0670013427734375, 1.7329635620117188, 6.532928466796875, 11.332893371582031, 16.132858276367188, 20.932823181152344, 25.7327880859375, 30.532752990722656, 35.33271789550781]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 7.0, 2.0, 2.0, 8.0, 4.0, 8.0, 11.0, 5.0, 11.0, 10.0, 11.0, 21.0, 20.0, 19.0, 22.0, 26.0, 32.0, 25.0, 38.0, 48.0, 45.0, 51.0, 33.0, 48.0, 47.0, 39.0, 45.0, 40.0, 40.0, 39.0, 34.0, 35.0, 27.0, 25.0, 24.0, 13.0, 16.0, 15.0, 14.0, 9.0, 11.0, 13.0, 10.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.365203857421875, -43.54517364501953, -41.72513961791992, -39.90510940551758, -38.085079193115234, -36.265045166015625, -34.44501495361328, -32.62498474121094, -30.804954528808594, -28.984922409057617, -27.164892196655273, -25.344860076904297, -23.524829864501953, -21.704797744750977, -19.884765625, -18.064735412597656, -16.24470329284668, -14.42467212677002, -12.60464096069336, -10.784608840942383, -8.964578628540039, -7.1445465087890625, -5.324515342712402, -3.504484176635742, -1.684453010559082, 0.13557827472686768, 1.9556095600128174, 3.7756409645080566, 5.595672130584717, 7.415703773498535, 9.235734939575195, 11.055766105651855, 12.875797271728516, 14.695828437805176, 16.515859603881836, 18.335891723632812, 20.155921936035156, 21.975954055786133, 23.79598617553711, 25.616016387939453, 27.436046600341797, 29.256078720092773, 31.076108932495117, 32.896141052246094, 34.71617126464844, 36.53620147705078, 38.35623550415039, 40.176265716552734, 41.996299743652344, 43.81632995605469, 45.6363639831543, 47.45639419555664, 49.276424407958984, 51.096458435058594, 52.91648864746094, 54.73651885986328, 56.556549072265625, 58.37657928466797, 60.19661331176758, 62.01664352416992, 63.836673736572266, 65.65670776367188, 67.47673797607422, 69.29676818847656, 71.1167984008789]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 7.0, 9.0, 15.0, 7.0, 13.0, 18.0, 14.0, 22.0, 27.0, 28.0, 21.0, 27.0, 28.0, 33.0, 46.0, 42.0, 37.0, 51.0, 50.0, 41.0, 50.0, 44.0, 49.0, 45.0, 37.0, 29.0, 29.0, 30.0, 23.0, 12.0, 18.0, 18.0, 17.0, 9.0, 17.0, 10.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.12890625, -4.96002197265625, -4.7911376953125, -4.62225341796875, -4.453369140625, -4.28448486328125, -4.1156005859375, -3.94671630859375, -3.77783203125, -3.60894775390625, -3.4400634765625, -3.27117919921875, -3.102294921875, -2.93341064453125, -2.7645263671875, -2.59564208984375, -2.4267578125, -2.25787353515625, -2.0889892578125, -1.92010498046875, -1.751220703125, -1.58233642578125, -1.4134521484375, -1.24456787109375, -1.07568359375, -0.90679931640625, -0.7379150390625, -0.56903076171875, -0.400146484375, -0.23126220703125, -0.0623779296875, 0.10650634765625, 0.275390625, 0.44427490234375, 0.6131591796875, 0.78204345703125, 0.950927734375, 1.11981201171875, 1.2886962890625, 1.45758056640625, 1.62646484375, 1.79534912109375, 1.9642333984375, 2.13311767578125, 2.302001953125, 2.47088623046875, 2.6397705078125, 2.80865478515625, 2.9775390625, 3.14642333984375, 3.3153076171875, 3.48419189453125, 3.653076171875, 3.82196044921875, 3.9908447265625, 4.15972900390625, 4.32861328125, 4.49749755859375, 4.6663818359375, 4.83526611328125, 5.004150390625, 5.17303466796875, 5.3419189453125, 5.51080322265625, 5.6796875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 10.0, 24.0, 25.0, 53.0, 63.0, 90.0, 126.0, 195.0, 275.0, 451.0, 725.0, 1186.0, 1822.0, 2953.0, 4668.0, 7752.0, 12854.0, 20597.0, 34828.0, 60651.0, 110730.0, 211067.0, 261287.0, 137905.0, 72931.0, 41731.0, 24748.0, 14848.0, 9035.0, 5655.0, 3444.0, 2189.0, 1291.0, 860.0, 544.0, 290.0, 221.0, 130.0, 81.0, 85.0, 40.0, 29.0, 20.0, 15.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.85107421875, -0.8228607177734375, -0.794647216796875, -0.7664337158203125, -0.73822021484375, -0.7100067138671875, -0.681793212890625, -0.6535797119140625, -0.6253662109375, -0.5971527099609375, -0.568939208984375, -0.5407257080078125, -0.51251220703125, -0.4842987060546875, -0.456085205078125, -0.4278717041015625, -0.399658203125, -0.3714447021484375, -0.343231201171875, -0.3150177001953125, -0.28680419921875, -0.2585906982421875, -0.230377197265625, -0.2021636962890625, -0.1739501953125, -0.1457366943359375, -0.117523193359375, -0.0893096923828125, -0.06109619140625, -0.0328826904296875, -0.004669189453125, 0.0235443115234375, 0.0517578125, 0.0799713134765625, 0.108184814453125, 0.1363983154296875, 0.16461181640625, 0.1928253173828125, 0.221038818359375, 0.2492523193359375, 0.2774658203125, 0.3056793212890625, 0.333892822265625, 0.3621063232421875, 0.39031982421875, 0.4185333251953125, 0.446746826171875, 0.4749603271484375, 0.503173828125, 0.5313873291015625, 0.559600830078125, 0.5878143310546875, 0.61602783203125, 0.6442413330078125, 0.672454833984375, 0.7006683349609375, 0.7288818359375, 0.7570953369140625, 0.785308837890625, 0.8135223388671875, 0.84173583984375, 0.8699493408203125, 0.898162841796875, 0.9263763427734375, 0.95458984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 1.0, 3.0, 5.0, 9.0, 9.0, 14.0, 12.0, 16.0, 23.0, 21.0, 22.0, 28.0, 30.0, 20.0, 32.0, 41.0, 21.0, 37.0, 41.0, 33.0, 36.0, 1051.0, 41.0, 38.0, 43.0, 44.0, 37.0, 33.0, 32.0, 31.0, 32.0, 21.0, 26.0, 22.0, 19.0, 17.0, 14.0, 10.0, 7.0, 14.0, 10.0, 7.0, 2.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.375, -3.274688720703125, -3.17437744140625, -3.074066162109375, -2.9737548828125, -2.873443603515625, -2.77313232421875, -2.672821044921875, -2.572509765625, -2.472198486328125, -2.37188720703125, -2.271575927734375, -2.1712646484375, -2.070953369140625, -1.97064208984375, -1.870330810546875, -1.77001953125, -1.669708251953125, -1.56939697265625, -1.469085693359375, -1.3687744140625, -1.268463134765625, -1.16815185546875, -1.067840576171875, -0.967529296875, -0.867218017578125, -0.76690673828125, -0.666595458984375, -0.5662841796875, -0.465972900390625, -0.36566162109375, -0.265350341796875, -0.1650390625, -0.064727783203125, 0.03558349609375, 0.135894775390625, 0.2362060546875, 0.336517333984375, 0.43682861328125, 0.537139892578125, 0.637451171875, 0.737762451171875, 0.83807373046875, 0.938385009765625, 1.0386962890625, 1.139007568359375, 1.23931884765625, 1.339630126953125, 1.43994140625, 1.540252685546875, 1.64056396484375, 1.740875244140625, 1.8411865234375, 1.941497802734375, 2.04180908203125, 2.142120361328125, 2.242431640625, 2.342742919921875, 2.44305419921875, 2.543365478515625, 2.6436767578125, 2.743988037109375, 2.84429931640625, 2.944610595703125, 3.044921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 17.0, 17.0, 21.0, 38.0, 57.0, 81.0, 105.0, 150.0, 246.0, 332.0, 478.0, 641.0, 929.0, 1311.0, 1725.0, 2507.0, 3548.0, 5109.0, 7005.0, 10326.0, 14945.0, 21992.0, 32681.0, 49468.0, 77491.0, 125528.0, 1253785.0, 175974.0, 106980.0, 67359.0, 43701.0, 28777.0, 19481.0, 13311.0, 8981.0, 6556.0, 4511.0, 3133.0, 2279.0, 1594.0, 1176.0, 807.0, 605.0, 419.0, 283.0, 182.0, 148.0, 101.0, 70.0, 49.0, 34.0, 29.0, 20.0, 15.0, 5.0, 6.0, 4.0, 3.0], "bins": [-0.65673828125, -0.6367416381835938, -0.6167449951171875, -0.5967483520507812, -0.576751708984375, -0.5567550659179688, -0.5367584228515625, -0.5167617797851562, -0.49676513671875, -0.47676849365234375, -0.4567718505859375, -0.43677520751953125, -0.416778564453125, -0.39678192138671875, -0.3767852783203125, -0.35678863525390625, -0.3367919921875, -0.31679534912109375, -0.2967987060546875, -0.27680206298828125, -0.256805419921875, -0.23680877685546875, -0.2168121337890625, -0.19681549072265625, -0.17681884765625, -0.15682220458984375, -0.1368255615234375, -0.11682891845703125, -0.096832275390625, -0.07683563232421875, -0.0568389892578125, -0.03684234619140625, -0.016845703125, 0.00315093994140625, 0.0231475830078125, 0.04314422607421875, 0.063140869140625, 0.08313751220703125, 0.1031341552734375, 0.12313079833984375, 0.14312744140625, 0.16312408447265625, 0.1831207275390625, 0.20311737060546875, 0.223114013671875, 0.24311065673828125, 0.2631072998046875, 0.28310394287109375, 0.3031005859375, 0.32309722900390625, 0.3430938720703125, 0.36309051513671875, 0.383087158203125, 0.40308380126953125, 0.4230804443359375, 0.44307708740234375, 0.46307373046875, 0.48307037353515625, 0.5030670166015625, 0.5230636596679688, 0.543060302734375, 0.5630569458007812, 0.5830535888671875, 0.6030502319335938, 0.623046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 5.0, 10.0, 14.0, 17.0, 28.0, 24.0, 27.0, 37.0, 58.0, 58.0, 75.0, 70.0, 75.0, 75.0, 78.0, 52.0, 61.0, 46.0, 32.0, 35.0, 24.0, 9.0, 8.0, 11.0, 9.0, 11.0, 8.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005273818969726562, -0.0005113109946250916, -0.0004952400922775269, -0.00047916918992996216, -0.00046309828758239746, -0.00044702738523483276, -0.00043095648288726807, -0.00041488558053970337, -0.00039881467819213867, -0.000382743775844574, -0.0003666728734970093, -0.0003506019711494446, -0.0003345310688018799, -0.0003184601664543152, -0.0003023892641067505, -0.0002863183617591858, -0.0002702474594116211, -0.0002541765570640564, -0.0002381056547164917, -0.000222034752368927, -0.0002059638500213623, -0.0001898929476737976, -0.0001738220453262329, -0.0001577511429786682, -0.00014168024063110352, -0.00012560933828353882, -0.00010953843593597412, -9.346753358840942e-05, -7.739663124084473e-05, -6.132572889328003e-05, -4.525482654571533e-05, -2.9183924198150635e-05, -1.3113021850585938e-05, 2.9578804969787598e-06, 1.9028782844543457e-05, 3.5099685192108154e-05, 5.117058753967285e-05, 6.724148988723755e-05, 8.331239223480225e-05, 9.938329458236694e-05, 0.00011545419692993164, 0.00013152509927749634, 0.00014759600162506104, 0.00016366690397262573, 0.00017973780632019043, 0.00019580870866775513, 0.00021187961101531982, 0.00022795051336288452, 0.00024402141571044922, 0.0002600923180580139, 0.0002761632204055786, 0.0002922341227531433, 0.000308305025100708, 0.0003243759274482727, 0.0003404468297958374, 0.0003565177321434021, 0.0003725886344909668, 0.0003886595368385315, 0.0004047304391860962, 0.0004208013415336609, 0.0004368722438812256, 0.0004529431462287903, 0.000469014048576355, 0.0004850849509239197, 0.0005011558532714844]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 8.0, 9.0, 12.0, 23.0, 24.0, 45.0, 69.0, 120.0, 163.0, 288.0, 509.0, 4461.0, 1039695.0, 1910.0, 485.0, 224.0, 146.0, 120.0, 67.0, 51.0, 38.0, 21.0, 24.0, 2.0, 8.0, 5.0, 3.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01320648193359375, -0.012786149978637695, -0.01236581802368164, -0.011945486068725586, -0.011525154113769531, -0.011104822158813477, -0.010684490203857422, -0.010264158248901367, -0.009843826293945312, -0.009423494338989258, -0.009003162384033203, -0.008582830429077148, -0.008162498474121094, -0.007742166519165039, -0.007321834564208984, -0.00690150260925293, -0.006481170654296875, -0.00606083869934082, -0.005640506744384766, -0.005220174789428711, -0.004799842834472656, -0.0043795108795166016, -0.003959178924560547, -0.003538846969604492, -0.0031185150146484375, -0.002698183059692383, -0.002277851104736328, -0.0018575191497802734, -0.0014371871948242188, -0.001016855239868164, -0.0005965232849121094, -0.0001761913299560547, 0.000244140625, 0.0006644725799560547, 0.0010848045349121094, 0.001505136489868164, 0.0019254684448242188, 0.0023458003997802734, 0.002766132354736328, 0.003186464309692383, 0.0036067962646484375, 0.004027128219604492, 0.004447460174560547, 0.0048677921295166016, 0.005288124084472656, 0.005708456039428711, 0.006128787994384766, 0.00654911994934082, 0.006969451904296875, 0.00738978385925293, 0.007810115814208984, 0.008230447769165039, 0.008650779724121094, 0.009071111679077148, 0.009491443634033203, 0.009911775588989258, 0.010332107543945312, 0.010752439498901367, 0.011172771453857422, 0.011593103408813477, 0.012013435363769531, 0.012433767318725586, 0.01285409927368164, 0.013274431228637695, 0.01369476318359375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 498.0, 463.0, 32.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.003202585969120264, -0.003145412774756551, -0.003088239813223481, -0.003031066618859768, -0.0029738936573266983, -0.002916720462962985, -0.0028595475014299154, -0.002802374307066202, -0.0027452013455331326, -0.0026880281511694193, -0.0026308551896363497, -0.0025736819952726364, -0.002516509033739567, -0.0024593358393758535, -0.002402162877842784, -0.0023449896834790707, -0.0022878164891153574, -0.002230643294751644, -0.0021734703332185745, -0.0021162971388548613, -0.0020591241773217916, -0.0020019509829580784, -0.0019447780214250088, -0.0018876048270612955, -0.001830431865528226, -0.0017732587875798345, -0.001716085709631443, -0.0016589126316830516, -0.0016017395537346601, -0.0015445663593709469, -0.0014873933978378773, -0.001430220203474164, -0.0013730472419410944, -0.001315874163992703, -0.0012587010860443115, -0.00120152800809592, -0.0011443549301475286, -0.0010871817357838154, -0.0010300087742507458, -0.0009728355798870325, -0.0009156625019386411, -0.0008584894239902496, -0.0008013163460418582, -0.0007441432680934668, -0.0006869701319374144, -0.000629797053989023, -0.0005726239760406315, -0.0005154508398845792, -0.0004582777910400182, -0.00040110471309162676, -0.00034393160603940487, -0.00028675852809101343, -0.00022958543559070677, -0.0001724123430904001, -0.00011523926514200866, -5.806615808978677e-05, -8.930801413953304e-07, 5.628000872093253e-05, 0.00011345309758326039, 0.00017062618280760944, 0.0002277992753079161, 0.00028497236780822277, 0.0003421454457566142, 0.0003993185528088361, 0.00045649163075722754]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 7.0, 14.0, 16.0, 5.0, 19.0, 21.0, 27.0, 17.0, 14.0, 35.0, 32.0, 37.0, 38.0, 40.0, 39.0, 36.0, 50.0, 50.0, 33.0, 47.0, 48.0, 38.0, 42.0, 42.0, 30.0, 28.0, 30.0, 23.0, 18.0, 15.0, 12.0, 17.0, 13.0, 15.0, 9.0, 11.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002529025077819824, -0.0002455078065395355, -0.00023811310529708862, -0.00023071840405464172, -0.00022332370281219482, -0.00021592900156974792, -0.00020853430032730103, -0.00020113959908485413, -0.00019374489784240723, -0.00018635019659996033, -0.00017895549535751343, -0.00017156079411506653, -0.00016416609287261963, -0.00015677139163017273, -0.00014937669038772583, -0.00014198198914527893, -0.00013458728790283203, -0.00012719258666038513, -0.00011979788541793823, -0.00011240318417549133, -0.00010500848293304443, -9.761378169059753e-05, -9.021908044815063e-05, -8.282437920570374e-05, -7.542967796325684e-05, -6.803497672080994e-05, -6.064027547836304e-05, -5.324557423591614e-05, -4.585087299346924e-05, -3.845617175102234e-05, -3.106147050857544e-05, -2.366676926612854e-05, -1.627206802368164e-05, -8.877366781234741e-06, -1.4826655387878418e-06, 5.912035703659058e-06, 1.3306736946105957e-05, 2.0701438188552856e-05, 2.8096139430999756e-05, 3.5490840673446655e-05, 4.2885541915893555e-05, 5.0280243158340454e-05, 5.7674944400787354e-05, 6.506964564323425e-05, 7.246434688568115e-05, 7.985904812812805e-05, 8.725374937057495e-05, 9.464845061302185e-05, 0.00010204315185546875, 0.00010943785309791565, 0.00011683255434036255, 0.00012422725558280945, 0.00013162195682525635, 0.00013901665806770325, 0.00014641135931015015, 0.00015380606055259705, 0.00016120076179504395, 0.00016859546303749084, 0.00017599016427993774, 0.00018338486552238464, 0.00019077956676483154, 0.00019817426800727844, 0.00020556896924972534, 0.00021296367049217224, 0.00022035837173461914]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 7.0, 9.0, 15.0, 7.0, 13.0, 18.0, 14.0, 22.0, 27.0, 28.0, 21.0, 27.0, 28.0, 33.0, 46.0, 42.0, 37.0, 51.0, 50.0, 41.0, 50.0, 44.0, 49.0, 45.0, 37.0, 29.0, 29.0, 30.0, 23.0, 12.0, 18.0, 18.0, 17.0, 9.0, 17.0, 10.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.12890625, -4.96002197265625, -4.7911376953125, -4.62225341796875, -4.453369140625, -4.28448486328125, -4.1156005859375, -3.94671630859375, -3.77783203125, -3.60894775390625, -3.4400634765625, -3.27117919921875, -3.102294921875, -2.93341064453125, -2.7645263671875, -2.59564208984375, -2.4267578125, -2.25787353515625, -2.0889892578125, -1.92010498046875, -1.751220703125, -1.58233642578125, -1.4134521484375, -1.24456787109375, -1.07568359375, -0.90679931640625, -0.7379150390625, -0.56903076171875, -0.400146484375, -0.23126220703125, -0.0623779296875, 0.10650634765625, 0.275390625, 0.44427490234375, 0.6131591796875, 0.78204345703125, 0.950927734375, 1.11981201171875, 1.2886962890625, 1.45758056640625, 1.62646484375, 1.79534912109375, 1.9642333984375, 2.13311767578125, 2.302001953125, 2.47088623046875, 2.6397705078125, 2.80865478515625, 2.9775390625, 3.14642333984375, 3.3153076171875, 3.48419189453125, 3.653076171875, 3.82196044921875, 3.9908447265625, 4.15972900390625, 4.32861328125, 4.49749755859375, 4.6663818359375, 4.83526611328125, 5.004150390625, 5.17303466796875, 5.3419189453125, 5.51080322265625, 5.6796875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 5.0, 10.0, 13.0, 11.0, 23.0, 44.0, 51.0, 54.0, 78.0, 112.0, 172.0, 215.0, 344.0, 566.0, 796.0, 1415.0, 2421.0, 5063.0, 11027.0, 30647.0, 106062.0, 481712.0, 300480.0, 67911.0, 21299.0, 8435.0, 4002.0, 2128.0, 1251.0, 738.0, 485.0, 289.0, 177.0, 153.0, 97.0, 85.0, 45.0, 39.0, 26.0, 20.0, 12.0, 6.0, 8.0, 5.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.140625, -4.0145263671875, -3.888427734375, -3.7623291015625, -3.63623046875, -3.5101318359375, -3.384033203125, -3.2579345703125, -3.1318359375, -3.0057373046875, -2.879638671875, -2.7535400390625, -2.62744140625, -2.5013427734375, -2.375244140625, -2.2491455078125, -2.123046875, -1.9969482421875, -1.870849609375, -1.7447509765625, -1.61865234375, -1.4925537109375, -1.366455078125, -1.2403564453125, -1.1142578125, -0.9881591796875, -0.862060546875, -0.7359619140625, -0.60986328125, -0.4837646484375, -0.357666015625, -0.2315673828125, -0.10546875, 0.0206298828125, 0.146728515625, 0.2728271484375, 0.39892578125, 0.5250244140625, 0.651123046875, 0.7772216796875, 0.9033203125, 1.0294189453125, 1.155517578125, 1.2816162109375, 1.40771484375, 1.5338134765625, 1.659912109375, 1.7860107421875, 1.912109375, 2.0382080078125, 2.164306640625, 2.2904052734375, 2.41650390625, 2.5426025390625, 2.668701171875, 2.7947998046875, 2.9208984375, 3.0469970703125, 3.173095703125, 3.2991943359375, 3.42529296875, 3.5513916015625, 3.677490234375, 3.8035888671875, 3.9296875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 6.0, 9.0, 20.0, 13.0, 20.0, 26.0, 18.0, 34.0, 40.0, 55.0, 46.0, 53.0, 61.0, 111.0, 1926.0, 173.0, 65.0, 39.0, 50.0, 56.0, 38.0, 39.0, 34.0, 24.0, 16.0, 15.0, 15.0, 6.0, 14.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-27.484375, -26.753173828125, -26.02197265625, -25.290771484375, -24.5595703125, -23.828369140625, -23.09716796875, -22.365966796875, -21.634765625, -20.903564453125, -20.17236328125, -19.441162109375, -18.7099609375, -17.978759765625, -17.24755859375, -16.516357421875, -15.78515625, -15.053955078125, -14.32275390625, -13.591552734375, -12.8603515625, -12.129150390625, -11.39794921875, -10.666748046875, -9.935546875, -9.204345703125, -8.47314453125, -7.741943359375, -7.0107421875, -6.279541015625, -5.54833984375, -4.817138671875, -4.0859375, -3.354736328125, -2.62353515625, -1.892333984375, -1.1611328125, -0.429931640625, 0.30126953125, 1.032470703125, 1.763671875, 2.494873046875, 3.22607421875, 3.957275390625, 4.6884765625, 5.419677734375, 6.15087890625, 6.882080078125, 7.61328125, 8.344482421875, 9.07568359375, 9.806884765625, 10.5380859375, 11.269287109375, 12.00048828125, 12.731689453125, 13.462890625, 14.194091796875, 14.92529296875, 15.656494140625, 16.3876953125, 17.118896484375, 17.85009765625, 18.581298828125, 19.3125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 9.0, 12.0, 5.0, 17.0, 18.0, 15.0, 25.0, 41.0, 46.0, 68.0, 104.0, 143.0, 245.0, 590.0, 3471.0, 3014078.0, 124255.0, 1494.0, 445.0, 202.0, 118.0, 71.0, 60.0, 39.0, 14.0, 31.0, 21.0, 11.0, 18.0, 9.0, 8.0, 2.0, 2.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.65625, -29.513671875, -28.37109375, -27.228515625, -26.0859375, -24.943359375, -23.80078125, -22.658203125, -21.515625, -20.373046875, -19.23046875, -18.087890625, -16.9453125, -15.802734375, -14.66015625, -13.517578125, -12.375, -11.232421875, -10.08984375, -8.947265625, -7.8046875, -6.662109375, -5.51953125, -4.376953125, -3.234375, -2.091796875, -0.94921875, 0.193359375, 1.3359375, 2.478515625, 3.62109375, 4.763671875, 5.90625, 7.048828125, 8.19140625, 9.333984375, 10.4765625, 11.619140625, 12.76171875, 13.904296875, 15.046875, 16.189453125, 17.33203125, 18.474609375, 19.6171875, 20.759765625, 21.90234375, 23.044921875, 24.1875, 25.330078125, 26.47265625, 27.615234375, 28.7578125, 29.900390625, 31.04296875, 32.185546875, 33.328125, 34.470703125, 35.61328125, 36.755859375, 37.8984375, 39.041015625, 40.18359375, 41.326171875, 42.46875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 171.0, 739.0, 103.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.85891723632812, -143.07476806640625, -140.2906036376953, -137.50645446777344, -134.7222900390625, -131.93814086914062, -129.15399169921875, -126.36983489990234, -123.58567810058594, -120.80152130126953, -118.01736450195312, -115.23321533203125, -112.44905853271484, -109.66490173339844, -106.88075256347656, -104.09659576416016, -101.31243896484375, -98.52828216552734, -95.74412536621094, -92.95997619628906, -90.17581939697266, -87.39166259765625, -84.60751342773438, -81.82335662841797, -79.03919982910156, -76.25504302978516, -73.47088623046875, -70.68673706054688, -67.90258026123047, -65.11842346191406, -62.33427047729492, -59.55011749267578, -56.76596450805664, -53.9818115234375, -51.197654724121094, -48.41349792480469, -45.62934494018555, -42.845191955566406, -40.06103515625, -37.276878356933594, -34.49272537231445, -31.70857048034668, -28.924415588378906, -26.140260696411133, -23.35610580444336, -20.571950912475586, -17.787796020507812, -15.003641128540039, -12.219486236572266, -9.435331344604492, -6.651176452636719, -3.8670215606689453, -1.0828666687011719, 1.7012882232666016, 4.485443115234375, 7.269598007202148, 10.053752899169922, 12.837907791137695, 15.622062683105469, 18.406217575073242, 21.190372467041016, 23.97452735900879, 26.758682250976562, 29.542837142944336, 32.32699203491211]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 7.0, 8.0, 7.0, 14.0, 13.0, 13.0, 21.0, 16.0, 25.0, 31.0, 28.0, 34.0, 33.0, 28.0, 46.0, 36.0, 34.0, 41.0, 45.0, 36.0, 34.0, 37.0, 30.0, 38.0, 30.0, 32.0, 25.0, 36.0, 18.0, 20.0, 27.0, 25.0, 16.0, 20.0, 16.0, 14.0, 10.0, 5.0, 10.0, 10.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.84174346923828, -51.20581817626953, -49.56989669799805, -47.93397521972656, -46.29804992675781, -44.66212463378906, -43.02620315551758, -41.390281677246094, -39.754356384277344, -38.118431091308594, -36.48250961303711, -34.846588134765625, -33.210662841796875, -31.574739456176758, -29.93881607055664, -28.302892684936523, -26.666969299316406, -25.03104591369629, -23.395122528076172, -21.759199142456055, -20.123275756835938, -18.48735237121582, -16.851428985595703, -15.215505599975586, -13.579582214355469, -11.943658828735352, -10.307735443115234, -8.671812057495117, -7.035888671875, -5.399965286254883, -3.7640419006347656, -2.1281185150146484, -0.49219512939453125, 1.143728256225586, 2.779651641845703, 4.41557502746582, 6.0514984130859375, 7.687421798706055, 9.323345184326172, 10.959268569946289, 12.595191955566406, 14.231115341186523, 15.86703872680664, 17.502962112426758, 19.138885498046875, 20.774808883666992, 22.41073226928711, 24.046655654907227, 25.682579040527344, 27.31850242614746, 28.954425811767578, 30.590349197387695, 32.22627258300781, 33.86219787597656, 35.49811935424805, 37.13404083251953, 38.76996612548828, 40.40589141845703, 42.041812896728516, 43.677734375, 45.31365966796875, 46.9495849609375, 48.585506439208984, 50.22142791748047, 51.85735321044922]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 8.0, 11.0, 6.0, 10.0, 9.0, 15.0, 10.0, 14.0, 18.0, 20.0, 25.0, 29.0, 23.0, 23.0, 35.0, 37.0, 41.0, 34.0, 40.0, 53.0, 43.0, 57.0, 35.0, 50.0, 44.0, 48.0, 32.0, 41.0, 29.0, 25.0, 22.0, 15.0, 19.0, 22.0, 6.0, 20.0, 15.0, 6.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.28515625, -5.1119384765625, -4.938720703125, -4.7655029296875, -4.59228515625, -4.4190673828125, -4.245849609375, -4.0726318359375, -3.8994140625, -3.7261962890625, -3.552978515625, -3.3797607421875, -3.20654296875, -3.0333251953125, -2.860107421875, -2.6868896484375, -2.513671875, -2.3404541015625, -2.167236328125, -1.9940185546875, -1.82080078125, -1.6475830078125, -1.474365234375, -1.3011474609375, -1.1279296875, -0.9547119140625, -0.781494140625, -0.6082763671875, -0.43505859375, -0.2618408203125, -0.088623046875, 0.0845947265625, 0.2578125, 0.4310302734375, 0.604248046875, 0.7774658203125, 0.95068359375, 1.1239013671875, 1.297119140625, 1.4703369140625, 1.6435546875, 1.8167724609375, 1.989990234375, 2.1632080078125, 2.33642578125, 2.5096435546875, 2.682861328125, 2.8560791015625, 3.029296875, 3.2025146484375, 3.375732421875, 3.5489501953125, 3.72216796875, 3.8953857421875, 4.068603515625, 4.2418212890625, 4.4150390625, 4.5882568359375, 4.761474609375, 4.9346923828125, 5.10791015625, 5.2811279296875, 5.454345703125, 5.6275634765625, 5.80078125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 9.0, 3.0, 10.0, 8.0, 18.0, 19.0, 26.0, 24.0, 30.0, 44.0, 71.0, 102.0, 195.0, 379.0, 1087.0, 3539.0, 14292.0, 80068.0, 662130.0, 2335069.0, 946128.0, 124343.0, 19600.0, 4553.0, 1378.0, 488.0, 230.0, 119.0, 86.0, 62.0, 31.0, 35.0, 18.0, 19.0, 14.0, 9.0, 11.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7890625, -9.4691162109375, -9.149169921875, -8.8292236328125, -8.50927734375, -8.1893310546875, -7.869384765625, -7.5494384765625, -7.2294921875, -6.9095458984375, -6.589599609375, -6.2696533203125, -5.94970703125, -5.6297607421875, -5.309814453125, -4.9898681640625, -4.669921875, -4.3499755859375, -4.030029296875, -3.7100830078125, -3.39013671875, -3.0701904296875, -2.750244140625, -2.4302978515625, -2.1103515625, -1.7904052734375, -1.470458984375, -1.1505126953125, -0.83056640625, -0.5106201171875, -0.190673828125, 0.1292724609375, 0.44921875, 0.7691650390625, 1.089111328125, 1.4090576171875, 1.72900390625, 2.0489501953125, 2.368896484375, 2.6888427734375, 3.0087890625, 3.3287353515625, 3.648681640625, 3.9686279296875, 4.28857421875, 4.6085205078125, 4.928466796875, 5.2484130859375, 5.568359375, 5.8883056640625, 6.208251953125, 6.5281982421875, 6.84814453125, 7.1680908203125, 7.488037109375, 7.8079833984375, 8.1279296875, 8.4478759765625, 8.767822265625, 9.0877685546875, 9.40771484375, 9.7276611328125, 10.047607421875, 10.3675537109375, 10.6875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 28.0, 25.0, 52.0, 65.0, 98.0, 144.0, 260.0, 413.0, 640.0, 723.0, 598.0, 374.0, 229.0, 143.0, 88.0, 53.0, 38.0, 27.0, 14.0, 21.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.966064453125, -26.24462890625, -25.523193359375, -24.8017578125, -24.080322265625, -23.35888671875, -22.637451171875, -21.916015625, -21.194580078125, -20.47314453125, -19.751708984375, -19.0302734375, -18.308837890625, -17.58740234375, -16.865966796875, -16.14453125, -15.423095703125, -14.70166015625, -13.980224609375, -13.2587890625, -12.537353515625, -11.81591796875, -11.094482421875, -10.373046875, -9.651611328125, -8.93017578125, -8.208740234375, -7.4873046875, -6.765869140625, -6.04443359375, -5.322998046875, -4.6015625, -3.880126953125, -3.15869140625, -2.437255859375, -1.7158203125, -0.994384765625, -0.27294921875, 0.448486328125, 1.169921875, 1.891357421875, 2.61279296875, 3.334228515625, 4.0556640625, 4.777099609375, 5.49853515625, 6.219970703125, 6.94140625, 7.662841796875, 8.38427734375, 9.105712890625, 9.8271484375, 10.548583984375, 11.27001953125, 11.991455078125, 12.712890625, 13.434326171875, 14.15576171875, 14.877197265625, 15.5986328125, 16.320068359375, 17.04150390625, 17.762939453125, 18.484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 6.0, 11.0, 10.0, 12.0, 19.0, 21.0, 38.0, 56.0, 93.0, 109.0, 168.0, 334.0, 988.0, 47984.0, 4132958.0, 10022.0, 659.0, 254.0, 177.0, 118.0, 85.0, 39.0, 35.0, 23.0, 19.0, 16.0, 8.0, 4.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.8125, -71.1162109375, -68.419921875, -65.7236328125, -63.02734375, -60.3310546875, -57.634765625, -54.9384765625, -52.2421875, -49.5458984375, -46.849609375, -44.1533203125, -41.45703125, -38.7607421875, -36.064453125, -33.3681640625, -30.671875, -27.9755859375, -25.279296875, -22.5830078125, -19.88671875, -17.1904296875, -14.494140625, -11.7978515625, -9.1015625, -6.4052734375, -3.708984375, -1.0126953125, 1.68359375, 4.3798828125, 7.076171875, 9.7724609375, 12.46875, 15.1650390625, 17.861328125, 20.5576171875, 23.25390625, 25.9501953125, 28.646484375, 31.3427734375, 34.0390625, 36.7353515625, 39.431640625, 42.1279296875, 44.82421875, 47.5205078125, 50.216796875, 52.9130859375, 55.609375, 58.3056640625, 61.001953125, 63.6982421875, 66.39453125, 69.0908203125, 71.787109375, 74.4833984375, 77.1796875, 79.8759765625, 82.572265625, 85.2685546875, 87.96484375, 90.6611328125, 93.357421875, 96.0537109375, 98.75]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 18.0, 73.0, 308.0, 369.0, 199.0, 36.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-124.89875030517578, -119.7562484741211, -114.61375427246094, -109.47125244140625, -104.32875061035156, -99.18624877929688, -94.04375457763672, -88.90125274658203, -83.75875854492188, -78.61625671386719, -73.47376251220703, -68.33126068115234, -63.188758850097656, -58.046260833740234, -52.90376281738281, -47.761260986328125, -42.61875915527344, -37.476261138916016, -32.33375930786133, -27.191261291503906, -22.04876136779785, -16.906261444091797, -11.763763427734375, -6.6212615966796875, -1.4787635803222656, 3.663735866546631, 8.806235313415527, 13.948734283447266, 19.09123420715332, 24.233734130859375, 29.376232147216797, 34.518733978271484, 39.66123962402344, 44.80373764038086, 49.94623947143555, 55.08873748779297, 60.231239318847656, 65.37373352050781, 70.5162353515625, 75.65873718261719, 80.80123901367188, 85.94374084472656, 91.08623504638672, 96.2287368774414, 101.3712387084961, 106.51373291015625, 111.65623474121094, 116.79873657226562, 121.94123077392578, 127.08373260498047, 132.22622680664062, 137.3687286376953, 142.51123046875, 147.6537322998047, 152.79623413085938, 157.938720703125, 163.0812225341797, 168.22372436523438, 173.36622619628906, 178.50872802734375, 183.65121459960938, 188.79371643066406, 193.93621826171875, 199.07872009277344, 204.22122192382812]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 9.0, 15.0, 15.0, 6.0, 15.0, 15.0, 23.0, 27.0, 27.0, 35.0, 38.0, 30.0, 38.0, 29.0, 42.0, 35.0, 43.0, 35.0, 51.0, 30.0, 42.0, 30.0, 29.0, 38.0, 39.0, 30.0, 40.0, 25.0, 22.0, 20.0, 19.0, 15.0, 9.0, 11.0, 14.0, 7.0, 8.0, 6.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.622406005859375, -50.974788665771484, -49.32716751098633, -47.67955017089844, -46.03193283081055, -44.384315490722656, -42.7366943359375, -41.08907699584961, -39.44145965576172, -37.79384231567383, -36.14622116088867, -34.49860382080078, -32.85098648071289, -31.203367233276367, -29.555747985839844, -27.908130645751953, -26.260509490966797, -24.612890243530273, -22.965272903442383, -21.31765365600586, -19.67003631591797, -18.022417068481445, -16.374797821044922, -14.727179527282715, -13.079561233520508, -11.4319429397583, -9.784324645996094, -8.13670539855957, -6.489087104797363, -4.841468811035156, -3.193849563598633, -1.5462312698364258, 0.10138702392578125, 1.7490055561065674, 3.3966240882873535, 5.044242858886719, 6.691861152648926, 8.339479446411133, 9.987098693847656, 11.634716987609863, 13.28233528137207, 14.929953575134277, 16.577571868896484, 18.225191116333008, 19.87281036376953, 21.520427703857422, 23.168046951293945, 24.81566619873047, 26.46328353881836, 28.110902786254883, 29.758520126342773, 31.406139373779297, 33.05375671386719, 34.701377868652344, 36.348995208740234, 37.996612548828125, 39.64423370361328, 41.29185104370117, 42.93947219848633, 44.58708953857422, 46.23470687866211, 47.88232421875, 49.529945373535156, 51.17756271362305, 52.82518005371094]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 11.0, 2.0, 5.0, 9.0, 5.0, 9.0, 13.0, 15.0, 16.0, 21.0, 23.0, 29.0, 35.0, 18.0, 26.0, 28.0, 49.0, 45.0, 31.0, 49.0, 43.0, 45.0, 50.0, 45.0, 38.0, 48.0, 38.0, 34.0, 34.0, 25.0, 25.0, 27.0, 21.0, 12.0, 15.0, 12.0, 13.0, 13.0, 9.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.00384521484375, -4.8319091796875, -4.65997314453125, -4.488037109375, -4.31610107421875, -4.1441650390625, -3.97222900390625, -3.80029296875, -3.62835693359375, -3.4564208984375, -3.28448486328125, -3.112548828125, -2.94061279296875, -2.7686767578125, -2.59674072265625, -2.4248046875, -2.25286865234375, -2.0809326171875, -1.90899658203125, -1.737060546875, -1.56512451171875, -1.3931884765625, -1.22125244140625, -1.04931640625, -0.87738037109375, -0.7054443359375, -0.53350830078125, -0.361572265625, -0.18963623046875, -0.0177001953125, 0.15423583984375, 0.326171875, 0.49810791015625, 0.6700439453125, 0.84197998046875, 1.013916015625, 1.18585205078125, 1.3577880859375, 1.52972412109375, 1.70166015625, 1.87359619140625, 2.0455322265625, 2.21746826171875, 2.389404296875, 2.56134033203125, 2.7332763671875, 2.90521240234375, 3.0771484375, 3.24908447265625, 3.4210205078125, 3.59295654296875, 3.764892578125, 3.93682861328125, 4.1087646484375, 4.28070068359375, 4.45263671875, 4.62457275390625, 4.7965087890625, 4.96844482421875, 5.140380859375, 5.31231689453125, 5.4842529296875, 5.65618896484375, 5.828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 11.0, 24.0, 27.0, 42.0, 66.0, 92.0, 113.0, 169.0, 271.0, 399.0, 625.0, 916.0, 1444.0, 2082.0, 3367.0, 5320.0, 8425.0, 13224.0, 21561.0, 35665.0, 61286.0, 111960.0, 218869.0, 256923.0, 130108.0, 70410.0, 40259.0, 24170.0, 14928.0, 9190.0, 5783.0, 3756.0, 2501.0, 1583.0, 1018.0, 644.0, 418.0, 311.0, 176.0, 153.0, 81.0, 55.0, 39.0, 39.0, 10.0, 9.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.86865234375, -0.8407363891601562, -0.8128204345703125, -0.7849044799804688, -0.756988525390625, -0.7290725708007812, -0.7011566162109375, -0.6732406616210938, -0.64532470703125, -0.6174087524414062, -0.5894927978515625, -0.5615768432617188, -0.533660888671875, -0.5057449340820312, -0.4778289794921875, -0.44991302490234375, -0.4219970703125, -0.39408111572265625, -0.3661651611328125, -0.33824920654296875, -0.310333251953125, -0.28241729736328125, -0.2545013427734375, -0.22658538818359375, -0.19866943359375, -0.17075347900390625, -0.1428375244140625, -0.11492156982421875, -0.087005615234375, -0.05908966064453125, -0.0311737060546875, -0.00325775146484375, 0.024658203125, 0.05257415771484375, 0.0804901123046875, 0.10840606689453125, 0.136322021484375, 0.16423797607421875, 0.1921539306640625, 0.22006988525390625, 0.24798583984375, 0.27590179443359375, 0.3038177490234375, 0.33173370361328125, 0.359649658203125, 0.38756561279296875, 0.4154815673828125, 0.44339752197265625, 0.4713134765625, 0.49922943115234375, 0.5271453857421875, 0.5550613403320312, 0.582977294921875, 0.6108932495117188, 0.6388092041015625, 0.6667251586914062, 0.69464111328125, 0.7225570678710938, 0.7504730224609375, 0.7783889770507812, 0.806304931640625, 0.8342208862304688, 0.8621368408203125, 0.8900527954101562, 0.91796875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 2.0, 6.0, 9.0, 7.0, 7.0, 15.0, 14.0, 11.0, 20.0, 13.0, 19.0, 24.0, 47.0, 31.0, 29.0, 30.0, 50.0, 51.0, 40.0, 49.0, 31.0, 1063.0, 36.0, 38.0, 41.0, 34.0, 39.0, 34.0, 23.0, 28.0, 18.0, 24.0, 18.0, 19.0, 16.0, 16.0, 15.0, 6.0, 9.0, 7.0, 10.0, 8.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.728302001953125, -2.62847900390625, -2.528656005859375, -2.4288330078125, -2.329010009765625, -2.22918701171875, -2.129364013671875, -2.029541015625, -1.929718017578125, -1.82989501953125, -1.730072021484375, -1.6302490234375, -1.530426025390625, -1.43060302734375, -1.330780029296875, -1.23095703125, -1.131134033203125, -1.03131103515625, -0.931488037109375, -0.8316650390625, -0.731842041015625, -0.63201904296875, -0.532196044921875, -0.432373046875, -0.332550048828125, -0.23272705078125, -0.132904052734375, -0.0330810546875, 0.066741943359375, 0.16656494140625, 0.266387939453125, 0.3662109375, 0.466033935546875, 0.56585693359375, 0.665679931640625, 0.7655029296875, 0.865325927734375, 0.96514892578125, 1.064971923828125, 1.164794921875, 1.264617919921875, 1.36444091796875, 1.464263916015625, 1.5640869140625, 1.663909912109375, 1.76373291015625, 1.863555908203125, 1.96337890625, 2.063201904296875, 2.16302490234375, 2.262847900390625, 2.3626708984375, 2.462493896484375, 2.56231689453125, 2.662139892578125, 2.761962890625, 2.861785888671875, 2.96160888671875, 3.061431884765625, 3.1612548828125, 3.261077880859375, 3.36090087890625, 3.460723876953125, 3.560546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 15.0, 13.0, 22.0, 32.0, 47.0, 67.0, 110.0, 176.0, 248.0, 352.0, 514.0, 729.0, 1040.0, 1557.0, 2174.0, 3126.0, 4583.0, 6768.0, 9845.0, 15197.0, 23305.0, 36507.0, 58957.0, 97970.0, 171060.0, 1290048.0, 144192.0, 84142.0, 50819.0, 31761.0, 20265.0, 13211.0, 9017.0, 6006.0, 3924.0, 2851.0, 2081.0, 1361.0, 924.0, 666.0, 479.0, 331.0, 200.0, 128.0, 105.0, 71.0, 49.0, 30.0, 12.0, 19.0, 7.0, 8.0, 2.0, 6.0, 0.0, 3.0], "bins": [-0.7353515625, -0.7133026123046875, -0.691253662109375, -0.6692047119140625, -0.64715576171875, -0.6251068115234375, -0.603057861328125, -0.5810089111328125, -0.5589599609375, -0.5369110107421875, -0.514862060546875, -0.4928131103515625, -0.47076416015625, -0.4487152099609375, -0.426666259765625, -0.4046173095703125, -0.382568359375, -0.3605194091796875, -0.338470458984375, -0.3164215087890625, -0.29437255859375, -0.2723236083984375, -0.250274658203125, -0.2282257080078125, -0.2061767578125, -0.1841278076171875, -0.162078857421875, -0.1400299072265625, -0.11798095703125, -0.0959320068359375, -0.073883056640625, -0.0518341064453125, -0.02978515625, -0.0077362060546875, 0.014312744140625, 0.0363616943359375, 0.05841064453125, 0.0804595947265625, 0.102508544921875, 0.1245574951171875, 0.1466064453125, 0.1686553955078125, 0.190704345703125, 0.2127532958984375, 0.23480224609375, 0.2568511962890625, 0.278900146484375, 0.3009490966796875, 0.322998046875, 0.3450469970703125, 0.367095947265625, 0.3891448974609375, 0.41119384765625, 0.4332427978515625, 0.455291748046875, 0.4773406982421875, 0.4993896484375, 0.5214385986328125, 0.543487548828125, 0.5655364990234375, 0.58758544921875, 0.6096343994140625, 0.631683349609375, 0.6537322998046875, 0.67578125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 10.0, 9.0, 11.0, 6.0, 7.0, 15.0, 16.0, 20.0, 16.0, 23.0, 20.0, 34.0, 43.0, 56.0, 49.0, 52.0, 58.0, 52.0, 69.0, 61.0, 55.0, 55.0, 37.0, 43.0, 35.0, 36.0, 25.0, 16.0, 15.0, 5.0, 8.0, 9.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.000400543212890625, -0.0003871545195579529, -0.00037376582622528076, -0.00036037713289260864, -0.0003469884395599365, -0.0003335997462272644, -0.0003202110528945923, -0.00030682235956192017, -0.00029343366622924805, -0.00028004497289657593, -0.0002666562795639038, -0.0002532675862312317, -0.00023987889289855957, -0.00022649019956588745, -0.00021310150623321533, -0.0001997128129005432, -0.0001863241195678711, -0.00017293542623519897, -0.00015954673290252686, -0.00014615803956985474, -0.00013276934623718262, -0.0001193806529045105, -0.00010599195957183838, -9.260326623916626e-05, -7.921457290649414e-05, -6.582587957382202e-05, -5.24371862411499e-05, -3.904849290847778e-05, -2.5659799575805664e-05, -1.2271106243133545e-05, 1.1175870895385742e-06, 1.4506280422210693e-05, 2.7894973754882812e-05, 4.128366708755493e-05, 5.467236042022705e-05, 6.806105375289917e-05, 8.144974708557129e-05, 9.483844041824341e-05, 0.00010822713375091553, 0.00012161582708358765, 0.00013500452041625977, 0.00014839321374893188, 0.000161781907081604, 0.00017517060041427612, 0.00018855929374694824, 0.00020194798707962036, 0.00021533668041229248, 0.0002287253737449646, 0.00024211406707763672, 0.00025550276041030884, 0.00026889145374298096, 0.0002822801470756531, 0.0002956688404083252, 0.0003090575337409973, 0.00032244622707366943, 0.00033583492040634155, 0.00034922361373901367, 0.0003626123070716858, 0.0003760010004043579, 0.00038938969373703003, 0.00040277838706970215, 0.00041616708040237427, 0.0004295557737350464, 0.0004429444670677185, 0.0004563331604003906]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 6.0, 5.0, 8.0, 16.0, 19.0, 35.0, 49.0, 65.0, 82.0, 165.0, 303.0, 532.0, 3075.0, 1039797.0, 3084.0, 553.0, 240.0, 143.0, 107.0, 68.0, 44.0, 38.0, 18.0, 12.0, 9.0, 13.0, 15.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0155487060546875, -0.015144824981689453, -0.014740943908691406, -0.01433706283569336, -0.013933181762695312, -0.013529300689697266, -0.013125419616699219, -0.012721538543701172, -0.012317657470703125, -0.011913776397705078, -0.011509895324707031, -0.011106014251708984, -0.010702133178710938, -0.01029825210571289, -0.009894371032714844, -0.009490489959716797, -0.00908660888671875, -0.008682727813720703, -0.008278846740722656, -0.00787496566772461, -0.0074710845947265625, -0.007067203521728516, -0.006663322448730469, -0.006259441375732422, -0.005855560302734375, -0.005451679229736328, -0.005047798156738281, -0.004643917083740234, -0.0042400360107421875, -0.0038361549377441406, -0.0034322738647460938, -0.003028392791748047, -0.00262451171875, -0.002220630645751953, -0.0018167495727539062, -0.0014128684997558594, -0.0010089874267578125, -0.0006051063537597656, -0.00020122528076171875, 0.00020265579223632812, 0.000606536865234375, 0.0010104179382324219, 0.0014142990112304688, 0.0018181800842285156, 0.0022220611572265625, 0.0026259422302246094, 0.0030298233032226562, 0.003433704376220703, 0.00383758544921875, 0.004241466522216797, 0.004645347595214844, 0.005049228668212891, 0.0054531097412109375, 0.005856990814208984, 0.006260871887207031, 0.006664752960205078, 0.007068634033203125, 0.007472515106201172, 0.007876396179199219, 0.008280277252197266, 0.008684158325195312, 0.00908803939819336, 0.009491920471191406, 0.009895801544189453, 0.0102996826171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 91.0, 730.0, 189.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023884994443506002, -0.002328182104974985, -0.0022678645327687263, -0.0022075471933931112, -0.002147229854017496, -0.002086912514641881, -0.002026595175266266, -0.001966277603060007, -0.001905960263684392, -0.0018456429243087769, -0.00178532546851784, -0.001725008012726903, -0.0016646906733512878, -0.0016043733339756727, -0.0015440558781847358, -0.0014837384223937988, -0.0014234210830181837, -0.0013631037436425686, -0.0013027862878516316, -0.0012424688320606947, -0.0011821514926850796, -0.0011218341533094645, -0.0010615166975185275, -0.0010011992417275906, -0.0009408819023519754, -0.0008805645047686994, -0.0008202471071854234, -0.0007599297096021473, -0.0006996123120188713, -0.0006392949144355953, -0.0005789775168523192, -0.0005186601192690432, -0.000458342838101089, -0.00039802544051781297, -0.00033770804293453693, -0.0002773906453512609, -0.00021707324776798487, -0.00015675585018470883, -9.64384526014328e-05, -3.612105501815677e-05, 2.4196342565119267e-05, 8.45137401483953e-05, 0.00014483113773167133, 0.00020514853531494737, 0.0002654659328982234, 0.00032578333048149943, 0.00038610072806477547, 0.0004464181256480515, 0.0005067355232313275, 0.0005670529208146036, 0.0006273703183978796, 0.0006876877159811556, 0.0007480051135644317, 0.0008083225111477077, 0.0008686399087309837, 0.0009289573063142598, 0.0009892747038975358, 0.0010495921596884727, 0.0011099094990640879, 0.001170226838439703, 0.00123054429423064, 0.0012908617500215769, 0.001351179089397192, 0.0014114964287728071, 0.001471813884563744]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 2.0, 6.0, 5.0, 8.0, 11.0, 8.0, 21.0, 17.0, 11.0, 10.0, 22.0, 25.0, 39.0, 40.0, 37.0, 26.0, 39.0, 32.0, 43.0, 40.0, 37.0, 31.0, 44.0, 37.0, 38.0, 31.0, 24.0, 23.0, 34.0, 33.0, 33.0, 22.0, 21.0, 26.0, 16.0, 20.0, 18.0, 9.0, 15.0, 8.0, 7.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00021779537200927734, -0.00021124351769685745, -0.00020469166338443756, -0.00019813980907201767, -0.00019158795475959778, -0.0001850361004471779, -0.000178484246134758, -0.0001719323918223381, -0.0001653805375099182, -0.00015882868319749832, -0.00015227682888507843, -0.00014572497457265854, -0.00013917312026023865, -0.00013262126594781876, -0.00012606941163539886, -0.00011951755732297897, -0.00011296570301055908, -0.00010641384869813919, -9.98619943857193e-05, -9.331014007329941e-05, -8.675828576087952e-05, -8.020643144845963e-05, -7.365457713603973e-05, -6.710272282361984e-05, -6.055086851119995e-05, -5.399901419878006e-05, -4.744715988636017e-05, -4.089530557394028e-05, -3.4343451261520386e-05, -2.7791596949100494e-05, -2.1239742636680603e-05, -1.4687888324260712e-05, -8.13603401184082e-06, -1.584179699420929e-06, 4.967674612998962e-06, 1.1519528925418854e-05, 1.8071383237838745e-05, 2.4623237550258636e-05, 3.117509186267853e-05, 3.772694617509842e-05, 4.427880048751831e-05, 5.08306547999382e-05, 5.738250911235809e-05, 6.393436342477798e-05, 7.048621773719788e-05, 7.703807204961777e-05, 8.358992636203766e-05, 9.014178067445755e-05, 9.669363498687744e-05, 0.00010324548929929733, 0.00010979734361171722, 0.00011634919792413712, 0.000122901052236557, 0.0001294529065489769, 0.0001360047608613968, 0.00014255661517381668, 0.00014910846948623657, 0.00015566032379865646, 0.00016221217811107635, 0.00016876403242349625, 0.00017531588673591614, 0.00018186774104833603, 0.00018841959536075592, 0.0001949714496731758, 0.0002015233039855957]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 11.0, 2.0, 5.0, 9.0, 5.0, 9.0, 13.0, 15.0, 16.0, 21.0, 23.0, 29.0, 35.0, 18.0, 26.0, 28.0, 49.0, 45.0, 31.0, 49.0, 43.0, 45.0, 50.0, 45.0, 38.0, 48.0, 38.0, 34.0, 34.0, 25.0, 25.0, 27.0, 21.0, 12.0, 15.0, 12.0, 13.0, 13.0, 9.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.00384521484375, -4.8319091796875, -4.65997314453125, -4.488037109375, -4.31610107421875, -4.1441650390625, -3.97222900390625, -3.80029296875, -3.62835693359375, -3.4564208984375, -3.28448486328125, -3.112548828125, -2.94061279296875, -2.7686767578125, -2.59674072265625, -2.4248046875, -2.25286865234375, -2.0809326171875, -1.90899658203125, -1.737060546875, -1.56512451171875, -1.3931884765625, -1.22125244140625, -1.04931640625, -0.87738037109375, -0.7054443359375, -0.53350830078125, -0.361572265625, -0.18963623046875, -0.0177001953125, 0.15423583984375, 0.326171875, 0.49810791015625, 0.6700439453125, 0.84197998046875, 1.013916015625, 1.18585205078125, 1.3577880859375, 1.52972412109375, 1.70166015625, 1.87359619140625, 2.0455322265625, 2.21746826171875, 2.389404296875, 2.56134033203125, 2.7332763671875, 2.90521240234375, 3.0771484375, 3.24908447265625, 3.4210205078125, 3.59295654296875, 3.764892578125, 3.93682861328125, 4.1087646484375, 4.28070068359375, 4.45263671875, 4.62457275390625, 4.7965087890625, 4.96844482421875, 5.140380859375, 5.31231689453125, 5.4842529296875, 5.65618896484375, 5.828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 10.0, 3.0, 8.0, 10.0, 7.0, 18.0, 18.0, 28.0, 40.0, 69.0, 101.0, 191.0, 335.0, 626.0, 1269.0, 2618.0, 5253.0, 11807.0, 28155.0, 79228.0, 252014.0, 419149.0, 158916.0, 52188.0, 19926.0, 8633.0, 3864.0, 1971.0, 922.0, 483.0, 268.0, 151.0, 83.0, 65.0, 28.0, 23.0, 23.0, 11.0, 14.0, 11.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.24609375, -3.13897705078125, -3.0318603515625, -2.92474365234375, -2.817626953125, -2.71051025390625, -2.6033935546875, -2.49627685546875, -2.38916015625, -2.28204345703125, -2.1749267578125, -2.06781005859375, -1.960693359375, -1.85357666015625, -1.7464599609375, -1.63934326171875, -1.5322265625, -1.42510986328125, -1.3179931640625, -1.21087646484375, -1.103759765625, -0.99664306640625, -0.8895263671875, -0.78240966796875, -0.67529296875, -0.56817626953125, -0.4610595703125, -0.35394287109375, -0.246826171875, -0.13970947265625, -0.0325927734375, 0.07452392578125, 0.181640625, 0.28875732421875, 0.3958740234375, 0.50299072265625, 0.610107421875, 0.71722412109375, 0.8243408203125, 0.93145751953125, 1.03857421875, 1.14569091796875, 1.2528076171875, 1.35992431640625, 1.467041015625, 1.57415771484375, 1.6812744140625, 1.78839111328125, 1.8955078125, 2.00262451171875, 2.1097412109375, 2.21685791015625, 2.323974609375, 2.43109130859375, 2.5382080078125, 2.64532470703125, 2.75244140625, 2.85955810546875, 2.9666748046875, 3.07379150390625, 3.180908203125, 3.28802490234375, 3.3951416015625, 3.50225830078125, 3.609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 6.0, 8.0, 10.0, 14.0, 17.0, 21.0, 27.0, 17.0, 28.0, 34.0, 30.0, 45.0, 33.0, 47.0, 52.0, 56.0, 86.0, 1532.0, 462.0, 83.0, 63.0, 51.0, 42.0, 38.0, 29.0, 27.0, 18.0, 19.0, 27.0, 8.0, 24.0, 22.0, 17.0, 9.0, 9.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.999755859375, -18.40576171875, -17.811767578125, -17.2177734375, -16.623779296875, -16.02978515625, -15.435791015625, -14.841796875, -14.247802734375, -13.65380859375, -13.059814453125, -12.4658203125, -11.871826171875, -11.27783203125, -10.683837890625, -10.08984375, -9.495849609375, -8.90185546875, -8.307861328125, -7.7138671875, -7.119873046875, -6.52587890625, -5.931884765625, -5.337890625, -4.743896484375, -4.14990234375, -3.555908203125, -2.9619140625, -2.367919921875, -1.77392578125, -1.179931640625, -0.5859375, 0.008056640625, 0.60205078125, 1.196044921875, 1.7900390625, 2.384033203125, 2.97802734375, 3.572021484375, 4.166015625, 4.760009765625, 5.35400390625, 5.947998046875, 6.5419921875, 7.135986328125, 7.72998046875, 8.323974609375, 8.91796875, 9.511962890625, 10.10595703125, 10.699951171875, 11.2939453125, 11.887939453125, 12.48193359375, 13.075927734375, 13.669921875, 14.263916015625, 14.85791015625, 15.451904296875, 16.0458984375, 16.639892578125, 17.23388671875, 17.827880859375, 18.421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 1.0, 10.0, 3.0, 8.0, 14.0, 15.0, 24.0, 20.0, 15.0, 30.0, 31.0, 47.0, 55.0, 98.0, 148.0, 215.0, 349.0, 1009.0, 12165.0, 3080595.0, 47790.0, 1687.0, 493.0, 275.0, 160.0, 98.0, 81.0, 40.0, 46.0, 31.0, 26.0, 29.0, 25.0, 10.0, 18.0, 7.0, 7.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.68603515625, -28.6845703125, -27.68310546875, -26.681640625, -25.68017578125, -24.6787109375, -23.67724609375, -22.67578125, -21.67431640625, -20.6728515625, -19.67138671875, -18.669921875, -17.66845703125, -16.6669921875, -15.66552734375, -14.6640625, -13.66259765625, -12.6611328125, -11.65966796875, -10.658203125, -9.65673828125, -8.6552734375, -7.65380859375, -6.65234375, -5.65087890625, -4.6494140625, -3.64794921875, -2.646484375, -1.64501953125, -0.6435546875, 0.35791015625, 1.359375, 2.36083984375, 3.3623046875, 4.36376953125, 5.365234375, 6.36669921875, 7.3681640625, 8.36962890625, 9.37109375, 10.37255859375, 11.3740234375, 12.37548828125, 13.376953125, 14.37841796875, 15.3798828125, 16.38134765625, 17.3828125, 18.38427734375, 19.3857421875, 20.38720703125, 21.388671875, 22.39013671875, 23.3916015625, 24.39306640625, 25.39453125, 26.39599609375, 27.3974609375, 28.39892578125, 29.400390625, 30.40185546875, 31.4033203125, 32.40478515625, 33.40625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [3.0, 48.0, 802.0, 160.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.05388069152832, -6.874826431274414, -2.695772171020508, 1.4832820892333984, 5.662336349487305, 9.841390609741211, 14.020444869995117, 18.199499130249023, 22.37855339050293, 26.557607650756836, 30.736661911010742, 34.91571807861328, 39.09477233886719, 43.273826599121094, 47.452880859375, 51.631935119628906, 55.81098937988281, 59.99004364013672, 64.16909790039062, 68.34815216064453, 72.52720642089844, 76.70626068115234, 80.88531494140625, 85.06436920166016, 89.24342346191406, 93.42247772216797, 97.60153198242188, 101.78058624267578, 105.95964050292969, 110.1386947631836, 114.3177490234375, 118.4968032836914, 122.67584228515625, 126.85489654541016, 131.03395080566406, 135.2130126953125, 139.39205932617188, 143.57110595703125, 147.7501678466797, 151.92922973632812, 156.1082763671875, 160.28732299804688, 164.4663848876953, 168.64544677734375, 172.82449340820312, 177.0035400390625, 181.18260192871094, 185.36166381835938, 189.54071044921875, 193.71975708007812, 197.89881896972656, 202.077880859375, 206.25692749023438, 210.43597412109375, 214.6150360107422, 218.79409790039062, 222.97314453125, 227.15219116210938, 231.3312530517578, 235.51031494140625, 239.68936157226562, 243.868408203125, 248.04747009277344, 252.22653198242188, 256.40557861328125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 10.0, 8.0, 12.0, 15.0, 6.0, 4.0, 18.0, 18.0, 17.0, 30.0, 28.0, 21.0, 19.0, 35.0, 35.0, 48.0, 38.0, 39.0, 34.0, 29.0, 42.0, 53.0, 37.0, 32.0, 38.0, 44.0, 36.0, 25.0, 28.0, 22.0, 23.0, 28.0, 14.0, 17.0, 15.0, 13.0, 10.0, 10.0, 14.0, 9.0, 9.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-63.37583923339844, -61.554351806640625, -59.73286437988281, -57.911380767822266, -56.08989334106445, -54.26840591430664, -52.446922302246094, -50.62543487548828, -48.80394744873047, -46.982460021972656, -45.160972595214844, -43.3394889831543, -41.518001556396484, -39.69651412963867, -37.875030517578125, -36.05354309082031, -34.2320556640625, -32.41056823730469, -30.589082717895508, -28.767597198486328, -26.946109771728516, -25.124622344970703, -23.303136825561523, -21.481651306152344, -19.66016387939453, -17.83867645263672, -16.01719093322754, -14.195704460144043, -12.374217987060547, -10.55273151397705, -8.731245040893555, -6.909758567810059, -5.0882720947265625, -3.2667856216430664, -1.4452991485595703, 0.3761873245239258, 2.197673797607422, 4.019160270690918, 5.840646743774414, 7.66213321685791, 9.483619689941406, 11.305106163024902, 13.126592636108398, 14.948079109191895, 16.76956558227539, 18.591053009033203, 20.412538528442383, 22.234024047851562, 24.055511474609375, 25.876998901367188, 27.698484420776367, 29.519969940185547, 31.34145736694336, 33.16294479370117, 34.98442840576172, 36.80591583251953, 38.627403259277344, 40.448890686035156, 42.27037811279297, 44.091861724853516, 45.91334915161133, 47.73483657836914, 49.55632019042969, 51.3778076171875, 53.19929504394531]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 5.0, 3.0, 7.0, 9.0, 4.0, 8.0, 9.0, 18.0, 13.0, 19.0, 22.0, 32.0, 17.0, 24.0, 36.0, 25.0, 43.0, 38.0, 40.0, 29.0, 41.0, 39.0, 47.0, 52.0, 37.0, 42.0, 37.0, 42.0, 37.0, 27.0, 22.0, 35.0, 24.0, 20.0, 17.0, 12.0, 13.0, 12.0, 9.0, 11.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.07421875, -4.904296875, -4.734375, -4.564453125, -4.39453125, -4.224609375, -4.0546875, -3.884765625, -3.71484375, -3.544921875, -3.375, -3.205078125, -3.03515625, -2.865234375, -2.6953125, -2.525390625, -2.35546875, -2.185546875, -2.015625, -1.845703125, -1.67578125, -1.505859375, -1.3359375, -1.166015625, -0.99609375, -0.826171875, -0.65625, -0.486328125, -0.31640625, -0.146484375, 0.0234375, 0.193359375, 0.36328125, 0.533203125, 0.703125, 0.873046875, 1.04296875, 1.212890625, 1.3828125, 1.552734375, 1.72265625, 1.892578125, 2.0625, 2.232421875, 2.40234375, 2.572265625, 2.7421875, 2.912109375, 3.08203125, 3.251953125, 3.421875, 3.591796875, 3.76171875, 3.931640625, 4.1015625, 4.271484375, 4.44140625, 4.611328125, 4.78125, 4.951171875, 5.12109375, 5.291015625, 5.4609375, 5.630859375, 5.80078125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 8.0, 7.0, 6.0, 10.0, 4.0, 13.0, 17.0, 22.0, 26.0, 31.0, 33.0, 38.0, 57.0, 96.0, 156.0, 331.0, 1098.0, 6321.0, 67677.0, 1612939.0, 2372440.0, 121022.0, 9339.0, 1561.0, 427.0, 201.0, 103.0, 53.0, 50.0, 45.0, 24.0, 27.0, 20.0, 14.0, 18.0, 10.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.9765625, -15.4456787109375, -14.914794921875, -14.3839111328125, -13.85302734375, -13.3221435546875, -12.791259765625, -12.2603759765625, -11.7294921875, -11.1986083984375, -10.667724609375, -10.1368408203125, -9.60595703125, -9.0750732421875, -8.544189453125, -8.0133056640625, -7.482421875, -6.9515380859375, -6.420654296875, -5.8897705078125, -5.35888671875, -4.8280029296875, -4.297119140625, -3.7662353515625, -3.2353515625, -2.7044677734375, -2.173583984375, -1.6427001953125, -1.11181640625, -0.5809326171875, -0.050048828125, 0.4808349609375, 1.01171875, 1.5426025390625, 2.073486328125, 2.6043701171875, 3.13525390625, 3.6661376953125, 4.197021484375, 4.7279052734375, 5.2587890625, 5.7896728515625, 6.320556640625, 6.8514404296875, 7.38232421875, 7.9132080078125, 8.444091796875, 8.9749755859375, 9.505859375, 10.0367431640625, 10.567626953125, 11.0985107421875, 11.62939453125, 12.1602783203125, 12.691162109375, 13.2220458984375, 13.7529296875, 14.2838134765625, 14.814697265625, 15.3455810546875, 15.87646484375, 16.4073486328125, 16.938232421875, 17.4691162109375, 18.0]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 3.0, 19.0, 16.0, 31.0, 34.0, 48.0, 88.0, 122.0, 192.0, 230.0, 360.0, 516.0, 609.0, 555.0, 402.0, 263.0, 195.0, 117.0, 74.0, 62.0, 40.0, 27.0, 27.0, 12.0, 8.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.25, -19.646240234375, -19.04248046875, -18.438720703125, -17.8349609375, -17.231201171875, -16.62744140625, -16.023681640625, -15.419921875, -14.816162109375, -14.21240234375, -13.608642578125, -13.0048828125, -12.401123046875, -11.79736328125, -11.193603515625, -10.58984375, -9.986083984375, -9.38232421875, -8.778564453125, -8.1748046875, -7.571044921875, -6.96728515625, -6.363525390625, -5.759765625, -5.156005859375, -4.55224609375, -3.948486328125, -3.3447265625, -2.740966796875, -2.13720703125, -1.533447265625, -0.9296875, -0.325927734375, 0.27783203125, 0.881591796875, 1.4853515625, 2.089111328125, 2.69287109375, 3.296630859375, 3.900390625, 4.504150390625, 5.10791015625, 5.711669921875, 6.3154296875, 6.919189453125, 7.52294921875, 8.126708984375, 8.73046875, 9.334228515625, 9.93798828125, 10.541748046875, 11.1455078125, 11.749267578125, 12.35302734375, 12.956787109375, 13.560546875, 14.164306640625, 14.76806640625, 15.371826171875, 15.9755859375, 16.579345703125, 17.18310546875, 17.786865234375, 18.390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 2.0, 7.0, 4.0, 11.0, 12.0, 18.0, 21.0, 28.0, 40.0, 49.0, 58.0, 93.0, 103.0, 157.0, 215.0, 330.0, 835.0, 7116.0, 3160006.0, 1019411.0, 3970.0, 681.0, 319.0, 208.0, 146.0, 116.0, 78.0, 65.0, 40.0, 37.0, 23.0, 27.0, 12.0, 13.0, 8.0, 4.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.59375, -56.63525390625, -54.6767578125, -52.71826171875, -50.759765625, -48.80126953125, -46.8427734375, -44.88427734375, -42.92578125, -40.96728515625, -39.0087890625, -37.05029296875, -35.091796875, -33.13330078125, -31.1748046875, -29.21630859375, -27.2578125, -25.29931640625, -23.3408203125, -21.38232421875, -19.423828125, -17.46533203125, -15.5068359375, -13.54833984375, -11.58984375, -9.63134765625, -7.6728515625, -5.71435546875, -3.755859375, -1.79736328125, 0.1611328125, 2.11962890625, 4.078125, 6.03662109375, 7.9951171875, 9.95361328125, 11.912109375, 13.87060546875, 15.8291015625, 17.78759765625, 19.74609375, 21.70458984375, 23.6630859375, 25.62158203125, 27.580078125, 29.53857421875, 31.4970703125, 33.45556640625, 35.4140625, 37.37255859375, 39.3310546875, 41.28955078125, 43.248046875, 45.20654296875, 47.1650390625, 49.12353515625, 51.08203125, 53.04052734375, 54.9990234375, 56.95751953125, 58.916015625, 60.87451171875, 62.8330078125, 64.79150390625, 66.75]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 15.0, 24.0, 68.0, 123.0, 210.0, 178.0, 146.0, 118.0, 61.0, 38.0, 16.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.94272232055664, -50.34061050415039, -47.73849868774414, -45.13638687133789, -42.534278869628906, -39.932167053222656, -37.330055236816406, -34.727943420410156, -32.125831604003906, -29.523719787597656, -26.921607971191406, -24.31949806213379, -21.71738624572754, -19.11527442932129, -16.513164520263672, -13.911052703857422, -11.308940887451172, -8.706829071044922, -6.104718208312988, -3.5026068687438965, -0.9004955291748047, 1.7016162872314453, 4.303727149963379, 6.9058380126953125, 9.507949829101562, 12.110061645507812, 14.712172508239746, 17.31428337097168, 19.91639518737793, 22.51850700378418, 25.120616912841797, 27.722728729248047, 30.32483673095703, 32.92694854736328, 35.52906036376953, 38.13117218017578, 40.73328399658203, 43.33539581298828, 45.937503814697266, 48.539615631103516, 51.141727447509766, 53.743839263916016, 56.345951080322266, 58.948062896728516, 61.5501708984375, 64.15228271484375, 66.75439453125, 69.35650634765625, 71.9586181640625, 74.56072998046875, 77.162841796875, 79.76495361328125, 82.3670654296875, 84.96917724609375, 87.5712890625, 90.17340087890625, 92.7755126953125, 95.37762451171875, 97.979736328125, 100.58184814453125, 103.1839599609375, 105.78607177734375, 108.38818359375, 110.99029541015625, 113.59239959716797]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 7.0, 8.0, 9.0, 8.0, 8.0, 12.0, 10.0, 14.0, 14.0, 25.0, 18.0, 34.0, 21.0, 38.0, 33.0, 38.0, 43.0, 43.0, 44.0, 40.0, 43.0, 48.0, 46.0, 38.0, 36.0, 35.0, 31.0, 35.0, 37.0, 21.0, 34.0, 21.0, 13.0, 16.0, 12.0, 18.0, 14.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.909263610839844, -48.3282585144043, -46.74725341796875, -45.16624450683594, -43.58523941040039, -42.004234313964844, -40.4232292175293, -38.84222412109375, -37.2612190246582, -35.680213928222656, -34.09920883178711, -32.51820373535156, -30.937196731567383, -29.356189727783203, -27.775184631347656, -26.19417953491211, -24.61317253112793, -23.032167434692383, -21.451160430908203, -19.870155334472656, -18.28915023803711, -16.708145141601562, -15.127138137817383, -13.546133041381836, -11.965126991271973, -10.38412094116211, -8.803115844726562, -7.222109794616699, -5.641104221343994, -4.060098648071289, -2.479092597961426, -0.8980875015258789, 0.6829185485839844, 2.2639241218566895, 3.8449299335479736, 5.425935745239258, 7.006941318511963, 8.587946891784668, 10.168952941894531, 11.749958038330078, 13.330964088439941, 14.911970138549805, 16.49297523498535, 18.07398223876953, 19.654987335205078, 21.235992431640625, 22.816997528076172, 24.39800262451172, 25.9790096282959, 27.560014724731445, 29.141021728515625, 30.722026824951172, 32.30303192138672, 33.884037017822266, 35.46504211425781, 37.046051025390625, 38.62705612182617, 40.20806121826172, 41.789066314697266, 43.37007141113281, 44.951080322265625, 46.53208541870117, 48.11309051513672, 49.694095611572266, 51.27510070800781]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 12.0, 11.0, 10.0, 8.0, 17.0, 22.0, 23.0, 27.0, 26.0, 29.0, 45.0, 36.0, 37.0, 39.0, 32.0, 51.0, 38.0, 44.0, 46.0, 43.0, 37.0, 39.0, 41.0, 37.0, 35.0, 31.0, 25.0, 22.0, 17.0, 18.0, 21.0, 14.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5546875, -5.3758544921875, -5.197021484375, -5.0181884765625, -4.83935546875, -4.6605224609375, -4.481689453125, -4.3028564453125, -4.1240234375, -3.9451904296875, -3.766357421875, -3.5875244140625, -3.40869140625, -3.2298583984375, -3.051025390625, -2.8721923828125, -2.693359375, -2.5145263671875, -2.335693359375, -2.1568603515625, -1.97802734375, -1.7991943359375, -1.620361328125, -1.4415283203125, -1.2626953125, -1.0838623046875, -0.905029296875, -0.7261962890625, -0.54736328125, -0.3685302734375, -0.189697265625, -0.0108642578125, 0.16796875, 0.3468017578125, 0.525634765625, 0.7044677734375, 0.88330078125, 1.0621337890625, 1.240966796875, 1.4197998046875, 1.5986328125, 1.7774658203125, 1.956298828125, 2.1351318359375, 2.31396484375, 2.4927978515625, 2.671630859375, 2.8504638671875, 3.029296875, 3.2081298828125, 3.386962890625, 3.5657958984375, 3.74462890625, 3.9234619140625, 4.102294921875, 4.2811279296875, 4.4599609375, 4.6387939453125, 4.817626953125, 4.9964599609375, 5.17529296875, 5.3541259765625, 5.532958984375, 5.7117919921875, 5.890625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 11.0, 19.0, 27.0, 52.0, 54.0, 94.0, 138.0, 217.0, 294.0, 463.0, 721.0, 1118.0, 1805.0, 2591.0, 4134.0, 6490.0, 10333.0, 17389.0, 29919.0, 53212.0, 97122.0, 184213.0, 270767.0, 163479.0, 87091.0, 47589.0, 26958.0, 15897.0, 9661.0, 5912.0, 3794.0, 2482.0, 1520.0, 967.0, 689.0, 449.0, 305.0, 189.0, 136.0, 79.0, 49.0, 42.0, 27.0, 19.0, 11.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9563674926757812, -0.9259185791015625, -0.8954696655273438, -0.865020751953125, -0.8345718383789062, -0.8041229248046875, -0.7736740112304688, -0.74322509765625, -0.7127761840820312, -0.6823272705078125, -0.6518783569335938, -0.621429443359375, -0.5909805297851562, -0.5605316162109375, -0.5300827026367188, -0.4996337890625, -0.46918487548828125, -0.4387359619140625, -0.40828704833984375, -0.377838134765625, -0.34738922119140625, -0.3169403076171875, -0.28649139404296875, -0.25604248046875, -0.22559356689453125, -0.1951446533203125, -0.16469573974609375, -0.134246826171875, -0.10379791259765625, -0.0733489990234375, -0.04290008544921875, -0.012451171875, 0.01799774169921875, 0.0484466552734375, 0.07889556884765625, 0.109344482421875, 0.13979339599609375, 0.1702423095703125, 0.20069122314453125, 0.23114013671875, 0.26158905029296875, 0.2920379638671875, 0.32248687744140625, 0.352935791015625, 0.38338470458984375, 0.4138336181640625, 0.44428253173828125, 0.4747314453125, 0.5051803588867188, 0.5356292724609375, 0.5660781860351562, 0.596527099609375, 0.6269760131835938, 0.6574249267578125, 0.6878738403320312, 0.71832275390625, 0.7487716674804688, 0.7792205810546875, 0.8096694946289062, 0.840118408203125, 0.8705673217773438, 0.9010162353515625, 0.9314651489257812, 0.9619140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 9.0, 6.0, 10.0, 10.0, 19.0, 18.0, 14.0, 26.0, 28.0, 45.0, 30.0, 46.0, 33.0, 37.0, 36.0, 28.0, 49.0, 1065.0, 43.0, 46.0, 38.0, 47.0, 39.0, 40.0, 26.0, 26.0, 30.0, 25.0, 30.0, 24.0, 14.0, 20.0, 14.0, 10.0, 4.0, 8.0, 6.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0], "bins": [-4.18359375, -4.06707763671875, -3.9505615234375, -3.83404541015625, -3.717529296875, -3.60101318359375, -3.4844970703125, -3.36798095703125, -3.25146484375, -3.13494873046875, -3.0184326171875, -2.90191650390625, -2.785400390625, -2.66888427734375, -2.5523681640625, -2.43585205078125, -2.3193359375, -2.20281982421875, -2.0863037109375, -1.96978759765625, -1.853271484375, -1.73675537109375, -1.6202392578125, -1.50372314453125, -1.38720703125, -1.27069091796875, -1.1541748046875, -1.03765869140625, -0.921142578125, -0.80462646484375, -0.6881103515625, -0.57159423828125, -0.455078125, -0.33856201171875, -0.2220458984375, -0.10552978515625, 0.010986328125, 0.12750244140625, 0.2440185546875, 0.36053466796875, 0.47705078125, 0.59356689453125, 0.7100830078125, 0.82659912109375, 0.943115234375, 1.05963134765625, 1.1761474609375, 1.29266357421875, 1.4091796875, 1.52569580078125, 1.6422119140625, 1.75872802734375, 1.875244140625, 1.99176025390625, 2.1082763671875, 2.22479248046875, 2.34130859375, 2.45782470703125, 2.5743408203125, 2.69085693359375, 2.807373046875, 2.92388916015625, 3.0404052734375, 3.15692138671875, 3.2734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 12.0, 23.0, 31.0, 24.0, 72.0, 81.0, 133.0, 193.0, 325.0, 476.0, 836.0, 1276.0, 1985.0, 3081.0, 5152.0, 8236.0, 13357.0, 22130.0, 37946.0, 65216.0, 117977.0, 225570.0, 1294953.0, 127456.0, 69846.0, 39582.0, 23720.0, 14155.0, 8701.0, 5368.0, 3379.0, 2170.0, 1346.0, 821.0, 560.0, 327.0, 218.0, 142.0, 83.0, 59.0, 55.0, 16.0, 12.0, 8.0, 10.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8340911865234375, -0.805389404296875, -0.7766876220703125, -0.74798583984375, -0.7192840576171875, -0.690582275390625, -0.6618804931640625, -0.6331787109375, -0.6044769287109375, -0.575775146484375, -0.5470733642578125, -0.51837158203125, -0.4896697998046875, -0.460968017578125, -0.4322662353515625, -0.403564453125, -0.3748626708984375, -0.346160888671875, -0.3174591064453125, -0.28875732421875, -0.2600555419921875, -0.231353759765625, -0.2026519775390625, -0.1739501953125, -0.1452484130859375, -0.116546630859375, -0.0878448486328125, -0.05914306640625, -0.0304412841796875, -0.001739501953125, 0.0269622802734375, 0.0556640625, 0.0843658447265625, 0.113067626953125, 0.1417694091796875, 0.17047119140625, 0.1991729736328125, 0.227874755859375, 0.2565765380859375, 0.2852783203125, 0.3139801025390625, 0.342681884765625, 0.3713836669921875, 0.40008544921875, 0.4287872314453125, 0.457489013671875, 0.4861907958984375, 0.514892578125, 0.5435943603515625, 0.572296142578125, 0.6009979248046875, 0.62969970703125, 0.6584014892578125, 0.687103271484375, 0.7158050537109375, 0.7445068359375, 0.7732086181640625, 0.801910400390625, 0.8306121826171875, 0.85931396484375, 0.8880157470703125, 0.916717529296875, 0.9454193115234375, 0.97412109375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 5.0, 6.0, 8.0, 3.0, 8.0, 12.0, 15.0, 6.0, 21.0, 25.0, 24.0, 32.0, 41.0, 57.0, 51.0, 60.0, 62.0, 71.0, 68.0, 58.0, 38.0, 60.0, 49.0, 43.0, 32.0, 33.0, 23.0, 10.0, 14.0, 11.0, 9.0, 15.0, 6.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004563331604003906, -0.00044209882616996765, -0.0004278644919395447, -0.0004136301577091217, -0.00039939582347869873, -0.00038516148924827576, -0.0003709271550178528, -0.0003566928207874298, -0.00034245848655700684, -0.00032822415232658386, -0.0003139898180961609, -0.0002997554838657379, -0.00028552114963531494, -0.00027128681540489197, -0.000257052481174469, -0.00024281814694404602, -0.00022858381271362305, -0.00021434947848320007, -0.0002001151442527771, -0.00018588081002235413, -0.00017164647579193115, -0.00015741214156150818, -0.0001431778073310852, -0.00012894347310066223, -0.00011470913887023926, -0.00010047480463981628, -8.624047040939331e-05, -7.200613617897034e-05, -5.777180194854736e-05, -4.353746771812439e-05, -2.9303133487701416e-05, -1.5068799257278442e-05, -8.344650268554688e-07, 1.3399869203567505e-05, 2.763420343399048e-05, 4.186853766441345e-05, 5.6102871894836426e-05, 7.03372061252594e-05, 8.457154035568237e-05, 9.880587458610535e-05, 0.00011304020881652832, 0.0001272745430469513, 0.00014150887727737427, 0.00015574321150779724, 0.00016997754573822021, 0.0001842118799686432, 0.00019844621419906616, 0.00021268054842948914, 0.0002269148826599121, 0.00024114921689033508, 0.00025538355112075806, 0.00026961788535118103, 0.000283852219581604, 0.000298086553812027, 0.00031232088804244995, 0.0003265552222728729, 0.0003407895565032959, 0.00035502389073371887, 0.00036925822496414185, 0.0003834925591945648, 0.0003977268934249878, 0.00041196122765541077, 0.00042619556188583374, 0.0004404298961162567, 0.0004546642303466797]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 8.0, 9.0, 13.0, 18.0, 33.0, 34.0, 53.0, 71.0, 118.0, 213.0, 330.0, 821.0, 244133.0, 800553.0, 1071.0, 421.0, 211.0, 136.0, 72.0, 46.0, 32.0, 25.0, 18.0, 18.0, 16.0, 12.0, 10.0, 8.0, 3.0, 4.0, 5.0, 3.0, 9.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01161956787109375, -0.01124560832977295, -0.010871648788452148, -0.010497689247131348, -0.010123729705810547, -0.009749770164489746, -0.009375810623168945, -0.009001851081848145, -0.008627891540527344, -0.008253931999206543, -0.007879972457885742, -0.007506012916564941, -0.007132053375244141, -0.00675809383392334, -0.006384134292602539, -0.006010174751281738, -0.0056362152099609375, -0.005262255668640137, -0.004888296127319336, -0.004514336585998535, -0.004140377044677734, -0.0037664175033569336, -0.003392457962036133, -0.003018498420715332, -0.0026445388793945312, -0.0022705793380737305, -0.0018966197967529297, -0.001522660255432129, -0.0011487007141113281, -0.0007747411727905273, -0.00040078163146972656, -2.682209014892578e-05, 0.000347137451171875, 0.0007210969924926758, 0.0010950565338134766, 0.0014690160751342773, 0.0018429756164550781, 0.002216935157775879, 0.0025908946990966797, 0.0029648542404174805, 0.0033388137817382812, 0.003712773323059082, 0.004086732864379883, 0.004460692405700684, 0.004834651947021484, 0.005208611488342285, 0.005582571029663086, 0.005956530570983887, 0.0063304901123046875, 0.006704449653625488, 0.007078409194946289, 0.00745236873626709, 0.00782632827758789, 0.008200287818908691, 0.008574247360229492, 0.008948206901550293, 0.009322166442871094, 0.009696125984191895, 0.010070085525512695, 0.010444045066833496, 0.010818004608154297, 0.011191964149475098, 0.011565923690795898, 0.0119398832321167, 0.0123138427734375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 76.0, 348.0, 413.0, 146.0, 23.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006749026360921562, -0.0006397803663276136, -0.0006046581547707319, -0.0005695358850061893, -0.0005344136152416468, -0.0004992913454771042, -0.00046416910481639206, -0.00042904686415567994, -0.00039392459439113736, -0.0003588023246265948, -0.00032368008396588266, -0.00028855784330517054, -0.00025343557354062796, -0.0002183133183280006, -0.00018319106311537325, -0.00014806882245466113, -0.00011294655269011855, -7.78242974774912e-05, -4.270204226486385e-05, -7.579787052236497e-06, 2.7542468160390854e-05, 6.26647233730182e-05, 9.778697858564556e-05, 0.00013290921924635768, 0.00016803148901090026, 0.0002031537442235276, 0.00023827599943615496, 0.0002733982400968671, 0.00030852050986140966, 0.00034364277962595224, 0.00037876502028666437, 0.0004138872609473765, 0.00044900947250425816, 0.00048413174226880074, 0.0005192540120333433, 0.000554376223590225, 0.0005894984933547676, 0.0006246207631193101, 0.0006597429746761918, 0.0006948652444407344, 0.000729987514205277, 0.0007651097839698195, 0.0008002320537343621, 0.0008353542652912438, 0.0008704765350557864, 0.000905598804820329, 0.0009407210163772106, 0.0009758432861417532, 0.0010109655559062958, 0.0010460878256708384, 0.001081210095435381, 0.0011163323651999235, 0.001151454634964466, 0.0011865767883136868, 0.0012216990580782294, 0.001256821327842772, 0.0012919435976073146, 0.0013270658673718572, 0.0013621881371363997, 0.0013973104069009423, 0.001432432560250163, 0.0014675548300147057, 0.0015026770997792482, 0.0015377993695437908, 0.0015729216393083334]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 3.0, 7.0, 4.0, 15.0, 13.0, 16.0, 16.0, 23.0, 21.0, 23.0, 34.0, 23.0, 33.0, 36.0, 37.0, 40.0, 38.0, 30.0, 35.0, 45.0, 53.0, 23.0, 45.0, 45.0, 34.0, 26.0, 33.0, 30.0, 37.0, 19.0, 28.0, 17.0, 16.0, 13.0, 11.0, 6.0, 18.0, 10.0, 4.0, 5.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00021910667419433594, -0.00021243561059236526, -0.0002057645469903946, -0.00019909348338842392, -0.00019242241978645325, -0.00018575135618448257, -0.0001790802925825119, -0.00017240922898054123, -0.00016573816537857056, -0.00015906710177659988, -0.0001523960381746292, -0.00014572497457265854, -0.00013905391097068787, -0.0001323828473687172, -0.00012571178376674652, -0.00011904072016477585, -0.00011236965656280518, -0.0001056985929608345, -9.902752935886383e-05, -9.235646575689316e-05, -8.568540215492249e-05, -7.901433855295181e-05, -7.234327495098114e-05, -6.567221134901047e-05, -5.9001147747039795e-05, -5.233008414506912e-05, -4.565902054309845e-05, -3.898795694112778e-05, -3.2316893339157104e-05, -2.5645829737186432e-05, -1.897476613521576e-05, -1.2303702533245087e-05, -5.632638931274414e-06, 1.0384246706962585e-06, 7.709488272666931e-06, 1.4380551874637604e-05, 2.1051615476608276e-05, 2.772267907857895e-05, 3.439374268054962e-05, 4.1064806282520294e-05, 4.773586988449097e-05, 5.440693348646164e-05, 6.107799708843231e-05, 6.774906069040298e-05, 7.442012429237366e-05, 8.109118789434433e-05, 8.7762251496315e-05, 9.443331509828568e-05, 0.00010110437870025635, 0.00010777544230222702, 0.00011444650590419769, 0.00012111756950616837, 0.00012778863310813904, 0.0001344596967101097, 0.00014113076031208038, 0.00014780182391405106, 0.00015447288751602173, 0.0001611439511179924, 0.00016781501471996307, 0.00017448607832193375, 0.00018115714192390442, 0.0001878282055258751, 0.00019449926912784576, 0.00020117033272981644, 0.0002078413963317871]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 12.0, 11.0, 10.0, 8.0, 17.0, 22.0, 23.0, 27.0, 26.0, 29.0, 45.0, 36.0, 37.0, 39.0, 32.0, 51.0, 38.0, 44.0, 46.0, 43.0, 37.0, 39.0, 41.0, 37.0, 35.0, 31.0, 25.0, 22.0, 17.0, 18.0, 21.0, 14.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5546875, -5.3758544921875, -5.197021484375, -5.0181884765625, -4.83935546875, -4.6605224609375, -4.481689453125, -4.3028564453125, -4.1240234375, -3.9451904296875, -3.766357421875, -3.5875244140625, -3.40869140625, -3.2298583984375, -3.051025390625, -2.8721923828125, -2.693359375, -2.5145263671875, -2.335693359375, -2.1568603515625, -1.97802734375, -1.7991943359375, -1.620361328125, -1.4415283203125, -1.2626953125, -1.0838623046875, -0.905029296875, -0.7261962890625, -0.54736328125, -0.3685302734375, -0.189697265625, -0.0108642578125, 0.16796875, 0.3468017578125, 0.525634765625, 0.7044677734375, 0.88330078125, 1.0621337890625, 1.240966796875, 1.4197998046875, 1.5986328125, 1.7774658203125, 1.956298828125, 2.1351318359375, 2.31396484375, 2.4927978515625, 2.671630859375, 2.8504638671875, 3.029296875, 3.2081298828125, 3.386962890625, 3.5657958984375, 3.74462890625, 3.9234619140625, 4.102294921875, 4.2811279296875, 4.4599609375, 4.6387939453125, 4.817626953125, 4.9964599609375, 5.17529296875, 5.3541259765625, 5.532958984375, 5.7117919921875, 5.890625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 34.0, 33.0, 53.0, 69.0, 108.0, 136.0, 194.0, 282.0, 391.0, 579.0, 907.0, 1337.0, 2202.0, 3598.0, 6162.0, 11728.0, 24533.0, 60251.0, 194739.0, 504320.0, 143932.0, 47955.0, 20478.0, 10027.0, 5499.0, 3094.0, 1955.0, 1216.0, 809.0, 546.0, 399.0, 291.0, 199.0, 116.0, 90.0, 77.0, 37.0, 37.0, 33.0, 21.0, 19.0, 11.0, 6.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.65234375, -4.51300048828125, -4.3736572265625, -4.23431396484375, -4.094970703125, -3.95562744140625, -3.8162841796875, -3.67694091796875, -3.53759765625, -3.39825439453125, -3.2589111328125, -3.11956787109375, -2.980224609375, -2.84088134765625, -2.7015380859375, -2.56219482421875, -2.4228515625, -2.28350830078125, -2.1441650390625, -2.00482177734375, -1.865478515625, -1.72613525390625, -1.5867919921875, -1.44744873046875, -1.30810546875, -1.16876220703125, -1.0294189453125, -0.89007568359375, -0.750732421875, -0.61138916015625, -0.4720458984375, -0.33270263671875, -0.193359375, -0.05401611328125, 0.0853271484375, 0.22467041015625, 0.364013671875, 0.50335693359375, 0.6427001953125, 0.78204345703125, 0.92138671875, 1.06072998046875, 1.2000732421875, 1.33941650390625, 1.478759765625, 1.61810302734375, 1.7574462890625, 1.89678955078125, 2.0361328125, 2.17547607421875, 2.3148193359375, 2.45416259765625, 2.593505859375, 2.73284912109375, 2.8721923828125, 3.01153564453125, 3.15087890625, 3.29022216796875, 3.4295654296875, 3.56890869140625, 3.708251953125, 3.84759521484375, 3.9869384765625, 4.12628173828125, 4.265625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 5.0, 7.0, 3.0, 8.0, 9.0, 11.0, 12.0, 14.0, 21.0, 27.0, 24.0, 25.0, 21.0, 32.0, 26.0, 29.0, 33.0, 29.0, 56.0, 83.0, 271.0, 1680.0, 123.0, 61.0, 55.0, 44.0, 31.0, 28.0, 32.0, 34.0, 27.0, 29.0, 16.0, 18.0, 20.0, 16.0, 8.0, 10.0, 10.0, 13.0, 8.0, 9.0, 8.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.533447265625, -16.00439453125, -15.475341796875, -14.9462890625, -14.417236328125, -13.88818359375, -13.359130859375, -12.830078125, -12.301025390625, -11.77197265625, -11.242919921875, -10.7138671875, -10.184814453125, -9.65576171875, -9.126708984375, -8.59765625, -8.068603515625, -7.53955078125, -7.010498046875, -6.4814453125, -5.952392578125, -5.42333984375, -4.894287109375, -4.365234375, -3.836181640625, -3.30712890625, -2.778076171875, -2.2490234375, -1.719970703125, -1.19091796875, -0.661865234375, -0.1328125, 0.396240234375, 0.92529296875, 1.454345703125, 1.9833984375, 2.512451171875, 3.04150390625, 3.570556640625, 4.099609375, 4.628662109375, 5.15771484375, 5.686767578125, 6.2158203125, 6.744873046875, 7.27392578125, 7.802978515625, 8.33203125, 8.861083984375, 9.39013671875, 9.919189453125, 10.4482421875, 10.977294921875, 11.50634765625, 12.035400390625, 12.564453125, 13.093505859375, 13.62255859375, 14.151611328125, 14.6806640625, 15.209716796875, 15.73876953125, 16.267822265625, 16.796875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 11.0, 16.0, 17.0, 23.0, 23.0, 25.0, 43.0, 41.0, 82.0, 132.0, 167.0, 283.0, 646.0, 3322.0, 609572.0, 2525340.0, 4324.0, 710.0, 313.0, 163.0, 113.0, 81.0, 62.0, 57.0, 28.0, 22.0, 14.0, 14.0, 9.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.15625, -35.78271484375, -34.4091796875, -33.03564453125, -31.662109375, -30.28857421875, -28.9150390625, -27.54150390625, -26.16796875, -24.79443359375, -23.4208984375, -22.04736328125, -20.673828125, -19.30029296875, -17.9267578125, -16.55322265625, -15.1796875, -13.80615234375, -12.4326171875, -11.05908203125, -9.685546875, -8.31201171875, -6.9384765625, -5.56494140625, -4.19140625, -2.81787109375, -1.4443359375, -0.07080078125, 1.302734375, 2.67626953125, 4.0498046875, 5.42333984375, 6.796875, 8.17041015625, 9.5439453125, 10.91748046875, 12.291015625, 13.66455078125, 15.0380859375, 16.41162109375, 17.78515625, 19.15869140625, 20.5322265625, 21.90576171875, 23.279296875, 24.65283203125, 26.0263671875, 27.39990234375, 28.7734375, 30.14697265625, 31.5205078125, 32.89404296875, 34.267578125, 35.64111328125, 37.0146484375, 38.38818359375, 39.76171875, 41.13525390625, 42.5087890625, 43.88232421875, 45.255859375, 46.62939453125, 48.0029296875, 49.37646484375, 50.75]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 10.0, 22.0, 55.0, 58.0, 100.0, 113.0, 176.0, 137.0, 101.0, 97.0, 55.0, 39.0, 13.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.346296310424805, -28.64324188232422, -27.940187454223633, -27.237133026123047, -26.534076690673828, -25.831022262573242, -25.127967834472656, -24.42491340637207, -23.721858978271484, -23.0188045501709, -22.315750122070312, -21.612693786621094, -20.909639358520508, -20.206584930419922, -19.503530502319336, -18.80047607421875, -18.09741973876953, -17.394365310668945, -16.69131088256836, -15.988255500793457, -15.285201072692871, -14.582145690917969, -13.879091262817383, -13.176036834716797, -12.472982406616211, -11.769927978515625, -11.066872596740723, -10.363818168640137, -9.66076374053955, -8.957708358764648, -8.254653930664062, -7.551599502563477, -6.848544120788574, -6.14548921585083, -5.442434787750244, -4.7393798828125, -4.036325454711914, -3.33327054977417, -2.630215644836426, -1.9271612167358398, -1.2241063117980957, -0.5210515856742859, 0.18200314044952393, 0.8850579261779785, 1.5881125926971436, 2.2911672592163086, 2.9942221641540527, 3.6972765922546387, 4.400331497192383, 5.103386402130127, 5.806440830230713, 6.509495735168457, 7.212550163269043, 7.915605068206787, 8.618659973144531, 9.321714401245117, 10.024768829345703, 10.727823257446289, 11.430878639221191, 12.133933067321777, 12.836987495422363, 13.540042877197266, 14.243097305297852, 14.946151733398438, 15.64920711517334]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 10.0, 7.0, 9.0, 16.0, 12.0, 14.0, 7.0, 13.0, 22.0, 15.0, 20.0, 38.0, 30.0, 28.0, 28.0, 37.0, 34.0, 40.0, 41.0, 40.0, 35.0, 54.0, 32.0, 37.0, 36.0, 33.0, 35.0, 27.0, 29.0, 25.0, 22.0, 28.0, 29.0, 14.0, 18.0, 19.0, 12.0, 6.0, 9.0, 7.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-57.35395812988281, -55.69116973876953, -54.028385162353516, -52.3656005859375, -50.70281219482422, -49.04002380371094, -47.37723922729492, -45.714454650878906, -44.051666259765625, -42.388877868652344, -40.72609329223633, -39.06330871582031, -37.40052032470703, -35.73773193359375, -34.074947357177734, -32.41216278076172, -30.749374389648438, -29.08658790588379, -27.42380142211914, -25.761014938354492, -24.098228454589844, -22.435441970825195, -20.772655487060547, -19.1098690032959, -17.44708251953125, -15.784296035766602, -14.121509552001953, -12.458723068237305, -10.795936584472656, -9.133150100708008, -7.470363616943359, -5.807577133178711, -4.1447906494140625, -2.482004165649414, -0.8192176818847656, 0.8435688018798828, 2.5063552856445312, 4.16914176940918, 5.831928253173828, 7.494714736938477, 9.157501220703125, 10.820287704467773, 12.483074188232422, 14.14586067199707, 15.808647155761719, 17.471433639526367, 19.134220123291016, 20.797006607055664, 22.459793090820312, 24.12257957458496, 25.78536605834961, 27.448152542114258, 29.110939025878906, 30.773725509643555, 32.4365119934082, 34.09929656982422, 35.7620849609375, 37.42487335205078, 39.0876579284668, 40.75044250488281, 42.413230895996094, 44.076019287109375, 45.73880386352539, 47.401588439941406, 49.06437683105469]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 6.0, 14.0, 11.0, 16.0, 15.0, 27.0, 19.0, 32.0, 25.0, 30.0, 43.0, 41.0, 31.0, 40.0, 49.0, 33.0, 43.0, 44.0, 46.0, 41.0, 35.0, 49.0, 42.0, 34.0, 37.0, 25.0, 16.0, 24.0, 18.0, 21.0, 18.0, 7.0, 10.0, 9.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.66796875, -5.4833984375, -5.298828125, -5.1142578125, -4.9296875, -4.7451171875, -4.560546875, -4.3759765625, -4.19140625, -4.0068359375, -3.822265625, -3.6376953125, -3.453125, -3.2685546875, -3.083984375, -2.8994140625, -2.71484375, -2.5302734375, -2.345703125, -2.1611328125, -1.9765625, -1.7919921875, -1.607421875, -1.4228515625, -1.23828125, -1.0537109375, -0.869140625, -0.6845703125, -0.5, -0.3154296875, -0.130859375, 0.0537109375, 0.23828125, 0.4228515625, 0.607421875, 0.7919921875, 0.9765625, 1.1611328125, 1.345703125, 1.5302734375, 1.71484375, 1.8994140625, 2.083984375, 2.2685546875, 2.453125, 2.6376953125, 2.822265625, 3.0068359375, 3.19140625, 3.3759765625, 3.560546875, 3.7451171875, 3.9296875, 4.1142578125, 4.298828125, 4.4833984375, 4.66796875, 4.8525390625, 5.037109375, 5.2216796875, 5.40625, 5.5908203125, 5.775390625, 5.9599609375, 6.14453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 8.0, 16.0, 22.0, 33.0, 62.0, 74.0, 120.0, 180.0, 310.0, 584.0, 1073.0, 2127.0, 4443.0, 10263.0, 27643.0, 88036.0, 324207.0, 1008811.0, 1525975.0, 835750.0, 254567.0, 70797.0, 22539.0, 8820.0, 3717.0, 1833.0, 930.0, 481.0, 310.0, 176.0, 111.0, 71.0, 46.0, 33.0, 25.0, 19.0, 11.0, 10.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.6412353515625, -5.442626953125, -5.2440185546875, -5.04541015625, -4.8468017578125, -4.648193359375, -4.4495849609375, -4.2509765625, -4.0523681640625, -3.853759765625, -3.6551513671875, -3.45654296875, -3.2579345703125, -3.059326171875, -2.8607177734375, -2.662109375, -2.4635009765625, -2.264892578125, -2.0662841796875, -1.86767578125, -1.6690673828125, -1.470458984375, -1.2718505859375, -1.0732421875, -0.8746337890625, -0.676025390625, -0.4774169921875, -0.27880859375, -0.0802001953125, 0.118408203125, 0.3170166015625, 0.515625, 0.7142333984375, 0.912841796875, 1.1114501953125, 1.31005859375, 1.5086669921875, 1.707275390625, 1.9058837890625, 2.1044921875, 2.3031005859375, 2.501708984375, 2.7003173828125, 2.89892578125, 3.0975341796875, 3.296142578125, 3.4947509765625, 3.693359375, 3.8919677734375, 4.090576171875, 4.2891845703125, 4.48779296875, 4.6864013671875, 4.885009765625, 5.0836181640625, 5.2822265625, 5.4808349609375, 5.679443359375, 5.8780517578125, 6.07666015625, 6.2752685546875, 6.473876953125, 6.6724853515625, 6.87109375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 12.0, 12.0, 10.0, 15.0, 28.0, 45.0, 61.0, 72.0, 101.0, 133.0, 168.0, 256.0, 316.0, 433.0, 507.0, 481.0, 396.0, 280.0, 209.0, 122.0, 133.0, 79.0, 54.0, 46.0, 34.0, 21.0, 17.0, 10.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.078125, -20.57275390625, -20.0673828125, -19.56201171875, -19.056640625, -18.55126953125, -18.0458984375, -17.54052734375, -17.03515625, -16.52978515625, -16.0244140625, -15.51904296875, -15.013671875, -14.50830078125, -14.0029296875, -13.49755859375, -12.9921875, -12.48681640625, -11.9814453125, -11.47607421875, -10.970703125, -10.46533203125, -9.9599609375, -9.45458984375, -8.94921875, -8.44384765625, -7.9384765625, -7.43310546875, -6.927734375, -6.42236328125, -5.9169921875, -5.41162109375, -4.90625, -4.40087890625, -3.8955078125, -3.39013671875, -2.884765625, -2.37939453125, -1.8740234375, -1.36865234375, -0.86328125, -0.35791015625, 0.1474609375, 0.65283203125, 1.158203125, 1.66357421875, 2.1689453125, 2.67431640625, 3.1796875, 3.68505859375, 4.1904296875, 4.69580078125, 5.201171875, 5.70654296875, 6.2119140625, 6.71728515625, 7.22265625, 7.72802734375, 8.2333984375, 8.73876953125, 9.244140625, 9.74951171875, 10.2548828125, 10.76025390625, 11.265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 5.0, 8.0, 8.0, 10.0, 15.0, 18.0, 30.0, 30.0, 54.0, 75.0, 86.0, 116.0, 154.0, 266.0, 477.0, 2098.0, 224599.0, 3953174.0, 11097.0, 861.0, 352.0, 218.0, 146.0, 77.0, 70.0, 59.0, 36.0, 43.0, 19.0, 14.0, 20.0, 13.0, 11.0, 9.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.1875, -48.1181640625, -46.048828125, -43.9794921875, -41.91015625, -39.8408203125, -37.771484375, -35.7021484375, -33.6328125, -31.5634765625, -29.494140625, -27.4248046875, -25.35546875, -23.2861328125, -21.216796875, -19.1474609375, -17.078125, -15.0087890625, -12.939453125, -10.8701171875, -8.80078125, -6.7314453125, -4.662109375, -2.5927734375, -0.5234375, 1.5458984375, 3.615234375, 5.6845703125, 7.75390625, 9.8232421875, 11.892578125, 13.9619140625, 16.03125, 18.1005859375, 20.169921875, 22.2392578125, 24.30859375, 26.3779296875, 28.447265625, 30.5166015625, 32.5859375, 34.6552734375, 36.724609375, 38.7939453125, 40.86328125, 42.9326171875, 45.001953125, 47.0712890625, 49.140625, 51.2099609375, 53.279296875, 55.3486328125, 57.41796875, 59.4873046875, 61.556640625, 63.6259765625, 65.6953125, 67.7646484375, 69.833984375, 71.9033203125, 73.97265625, 76.0419921875, 78.111328125, 80.1806640625, 82.25]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 10.0, 63.0, 173.0, 275.0, 268.0, 159.0, 45.0, 13.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-199.8118133544922, -195.46070861816406, -191.10958862304688, -186.75848388671875, -182.40737915039062, -178.0562744140625, -173.7051544189453, -169.3540496826172, -165.00294494628906, -160.65184020996094, -156.30072021484375, -151.94961547851562, -147.5985107421875, -143.24740600585938, -138.8962860107422, -134.54518127441406, -130.19406127929688, -125.84294891357422, -121.4918441772461, -117.14073181152344, -112.78962707519531, -108.43851470947266, -104.08740234375, -99.73629760742188, -95.38519287109375, -91.0340805053711, -86.68297576904297, -82.33186340332031, -77.98075866699219, -73.62964630126953, -69.27853393554688, -64.92742919921875, -60.576324462890625, -56.225215911865234, -51.874107360839844, -47.52299499511719, -43.17189025878906, -38.820777893066406, -34.469669342041016, -30.118560791015625, -25.767452239990234, -21.416343688964844, -17.065235137939453, -12.71412467956543, -8.363016128540039, -4.011907577514648, 0.339202880859375, 4.690311431884766, 9.041419982910156, 13.392528533935547, 17.743637084960938, 22.09474754333496, 26.44585609436035, 30.796964645385742, 35.148075103759766, 39.499183654785156, 43.85029220581055, 48.20140075683594, 52.55250930786133, 56.90361785888672, 61.254730224609375, 65.6058349609375, 69.95694732666016, 74.30805969238281, 78.65916442871094]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 3.0, 11.0, 7.0, 9.0, 7.0, 16.0, 18.0, 16.0, 22.0, 18.0, 20.0, 28.0, 28.0, 36.0, 36.0, 52.0, 49.0, 53.0, 38.0, 46.0, 36.0, 43.0, 33.0, 36.0, 40.0, 39.0, 34.0, 27.0, 33.0, 30.0, 19.0, 20.0, 14.0, 12.0, 13.0, 10.0, 13.0, 9.0, 6.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.4869384765625, -49.87363052368164, -48.260318756103516, -46.647010803222656, -45.03369903564453, -43.42039108276367, -41.80708312988281, -40.19377136230469, -38.58046340942383, -36.96715545654297, -35.353843688964844, -33.740535736083984, -32.12722396850586, -30.513916015625, -28.900606155395508, -27.287296295166016, -25.673986434936523, -24.06067657470703, -22.44736671447754, -20.834056854248047, -19.220748901367188, -17.607439041137695, -15.994129180908203, -14.380820274353027, -12.767510414123535, -11.154200553894043, -9.540891647338867, -7.927581787109375, -6.314272403717041, -4.700963020324707, -3.087653160095215, -1.474344253540039, 0.13896560668945312, 1.7522751092910767, 3.3655846118927, 4.978894233703613, 6.592203617095947, 8.205513000488281, 9.818822860717773, 11.43213176727295, 13.045441627502441, 14.658751487731934, 16.27206039428711, 17.8853702545166, 19.498680114746094, 21.111988067626953, 22.725299835205078, 24.338607788085938, 25.95191764831543, 27.565227508544922, 29.178537368774414, 30.791847229003906, 32.405155181884766, 34.018463134765625, 35.63177490234375, 37.24508285522461, 38.858394622802734, 40.471702575683594, 42.08501434326172, 43.69832229614258, 45.3116340637207, 46.92494201660156, 48.53825378417969, 50.15156173706055, 51.764869689941406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 6.0, 22.0, 22.0, 25.0, 17.0, 35.0, 36.0, 30.0, 36.0, 37.0, 50.0, 34.0, 48.0, 44.0, 42.0, 46.0, 53.0, 45.0, 36.0, 40.0, 32.0, 29.0, 23.0, 31.0, 29.0, 17.0, 14.0, 13.0, 20.0, 7.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.55078125, -6.3590087890625, -6.167236328125, -5.9754638671875, -5.78369140625, -5.5919189453125, -5.400146484375, -5.2083740234375, -5.0166015625, -4.8248291015625, -4.633056640625, -4.4412841796875, -4.24951171875, -4.0577392578125, -3.865966796875, -3.6741943359375, -3.482421875, -3.2906494140625, -3.098876953125, -2.9071044921875, -2.71533203125, -2.5235595703125, -2.331787109375, -2.1400146484375, -1.9482421875, -1.7564697265625, -1.564697265625, -1.3729248046875, -1.18115234375, -0.9893798828125, -0.797607421875, -0.6058349609375, -0.4140625, -0.2222900390625, -0.030517578125, 0.1612548828125, 0.35302734375, 0.5447998046875, 0.736572265625, 0.9283447265625, 1.1201171875, 1.3118896484375, 1.503662109375, 1.6954345703125, 1.88720703125, 2.0789794921875, 2.270751953125, 2.4625244140625, 2.654296875, 2.8460693359375, 3.037841796875, 3.2296142578125, 3.42138671875, 3.6131591796875, 3.804931640625, 3.9967041015625, 4.1884765625, 4.3802490234375, 4.572021484375, 4.7637939453125, 4.95556640625, 5.1473388671875, 5.339111328125, 5.5308837890625, 5.72265625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 9.0, 6.0, 6.0, 17.0, 22.0, 33.0, 43.0, 51.0, 95.0, 150.0, 201.0, 323.0, 468.0, 736.0, 1060.0, 1597.0, 2532.0, 3924.0, 6090.0, 9483.0, 15250.0, 24923.0, 40460.0, 69007.0, 119891.0, 215314.0, 225635.0, 126166.0, 72457.0, 43064.0, 25618.0, 15892.0, 9843.0, 6407.0, 4040.0, 2665.0, 1722.0, 1114.0, 765.0, 473.0, 331.0, 237.0, 139.0, 90.0, 76.0, 43.0, 32.0, 21.0, 17.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.86572265625, -0.8378372192382812, -0.8099517822265625, -0.7820663452148438, -0.754180908203125, -0.7262954711914062, -0.6984100341796875, -0.6705245971679688, -0.64263916015625, -0.6147537231445312, -0.5868682861328125, -0.5589828491210938, -0.531097412109375, -0.5032119750976562, -0.4753265380859375, -0.44744110107421875, -0.4195556640625, -0.39167022705078125, -0.3637847900390625, -0.33589935302734375, -0.308013916015625, -0.28012847900390625, -0.2522430419921875, -0.22435760498046875, -0.19647216796875, -0.16858673095703125, -0.1407012939453125, -0.11281585693359375, -0.084930419921875, -0.05704498291015625, -0.0291595458984375, -0.00127410888671875, 0.026611328125, 0.05449676513671875, 0.0823822021484375, 0.11026763916015625, 0.138153076171875, 0.16603851318359375, 0.1939239501953125, 0.22180938720703125, 0.24969482421875, 0.27758026123046875, 0.3054656982421875, 0.33335113525390625, 0.361236572265625, 0.38912200927734375, 0.4170074462890625, 0.44489288330078125, 0.4727783203125, 0.5006637573242188, 0.5285491943359375, 0.5564346313476562, 0.584320068359375, 0.6122055053710938, 0.6400909423828125, 0.6679763793945312, 0.69586181640625, 0.7237472534179688, 0.7516326904296875, 0.7795181274414062, 0.807403564453125, 0.8352890014648438, 0.8631744384765625, 0.8910598754882812, 0.9189453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 7.0, 2.0, 2.0, 3.0, 8.0, 10.0, 9.0, 10.0, 9.0, 18.0, 8.0, 11.0, 21.0, 25.0, 30.0, 26.0, 28.0, 33.0, 29.0, 33.0, 41.0, 39.0, 34.0, 27.0, 38.0, 1056.0, 27.0, 32.0, 43.0, 33.0, 33.0, 35.0, 36.0, 32.0, 19.0, 20.0, 20.0, 24.0, 17.0, 16.0, 19.0, 11.0, 12.0, 10.0, 8.0, 14.0, 9.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.55078125, -3.448150634765625, -3.34552001953125, -3.242889404296875, -3.1402587890625, -3.037628173828125, -2.93499755859375, -2.832366943359375, -2.729736328125, -2.627105712890625, -2.52447509765625, -2.421844482421875, -2.3192138671875, -2.216583251953125, -2.11395263671875, -2.011322021484375, -1.90869140625, -1.806060791015625, -1.70343017578125, -1.600799560546875, -1.4981689453125, -1.395538330078125, -1.29290771484375, -1.190277099609375, -1.087646484375, -0.985015869140625, -0.88238525390625, -0.779754638671875, -0.6771240234375, -0.574493408203125, -0.47186279296875, -0.369232177734375, -0.2666015625, -0.163970947265625, -0.06134033203125, 0.041290283203125, 0.1439208984375, 0.246551513671875, 0.34918212890625, 0.451812744140625, 0.554443359375, 0.657073974609375, 0.75970458984375, 0.862335205078125, 0.9649658203125, 1.067596435546875, 1.17022705078125, 1.272857666015625, 1.37548828125, 1.478118896484375, 1.58074951171875, 1.683380126953125, 1.7860107421875, 1.888641357421875, 1.99127197265625, 2.093902587890625, 2.196533203125, 2.299163818359375, 2.40179443359375, 2.504425048828125, 2.6070556640625, 2.709686279296875, 2.81231689453125, 2.914947509765625, 3.017578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 8.0, 14.0, 23.0, 25.0, 38.0, 48.0, 73.0, 126.0, 177.0, 260.0, 375.0, 544.0, 819.0, 1209.0, 1762.0, 2443.0, 3634.0, 5305.0, 7798.0, 11428.0, 17042.0, 26258.0, 39833.0, 62694.0, 100271.0, 174079.0, 1278231.0, 132673.0, 80289.0, 51215.0, 32617.0, 21592.0, 14070.0, 9557.0, 6579.0, 4383.0, 3038.0, 2099.0, 1363.0, 994.0, 697.0, 493.0, 327.0, 199.0, 161.0, 90.0, 66.0, 41.0, 24.0, 14.0, 15.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.71240234375, -0.6888656616210938, -0.6653289794921875, -0.6417922973632812, -0.618255615234375, -0.5947189331054688, -0.5711822509765625, -0.5476455688476562, -0.52410888671875, -0.5005722045898438, -0.4770355224609375, -0.45349884033203125, -0.429962158203125, -0.40642547607421875, -0.3828887939453125, -0.35935211181640625, -0.3358154296875, -0.31227874755859375, -0.2887420654296875, -0.26520538330078125, -0.241668701171875, -0.21813201904296875, -0.1945953369140625, -0.17105865478515625, -0.14752197265625, -0.12398529052734375, -0.1004486083984375, -0.07691192626953125, -0.053375244140625, -0.02983856201171875, -0.0063018798828125, 0.01723480224609375, 0.040771484375, 0.06430816650390625, 0.0878448486328125, 0.11138153076171875, 0.134918212890625, 0.15845489501953125, 0.1819915771484375, 0.20552825927734375, 0.22906494140625, 0.25260162353515625, 0.2761383056640625, 0.29967498779296875, 0.323211669921875, 0.34674835205078125, 0.3702850341796875, 0.39382171630859375, 0.4173583984375, 0.44089508056640625, 0.4644317626953125, 0.48796844482421875, 0.511505126953125, 0.5350418090820312, 0.5585784912109375, 0.5821151733398438, 0.60565185546875, 0.6291885375976562, 0.6527252197265625, 0.6762619018554688, 0.699798583984375, 0.7233352661132812, 0.7468719482421875, 0.7704086303710938, 0.7939453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 10.0, 8.0, 10.0, 13.0, 17.0, 14.0, 17.0, 19.0, 24.0, 30.0, 32.0, 36.0, 48.0, 42.0, 53.0, 60.0, 47.0, 53.0, 52.0, 50.0, 55.0, 49.0, 33.0, 38.0, 24.0, 21.0, 15.0, 11.0, 20.0, 15.0, 12.0, 13.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004000663757324219, -0.0003859996795654297, -0.0003719329833984375, -0.0003578662872314453, -0.0003437995910644531, -0.00032973289489746094, -0.00031566619873046875, -0.00030159950256347656, -0.0002875328063964844, -0.0002734661102294922, -0.0002593994140625, -0.0002453327178955078, -0.00023126602172851562, -0.00021719932556152344, -0.00020313262939453125, -0.00018906593322753906, -0.00017499923706054688, -0.0001609325408935547, -0.0001468658447265625, -0.0001327991485595703, -0.00011873245239257812, -0.00010466575622558594, -9.059906005859375e-05, -7.653236389160156e-05, -6.246566772460938e-05, -4.839897155761719e-05, -3.4332275390625e-05, -2.0265579223632812e-05, -6.198883056640625e-06, 7.867813110351562e-06, 2.193450927734375e-05, 3.600120544433594e-05, 5.0067901611328125e-05, 6.413459777832031e-05, 7.82012939453125e-05, 9.226799011230469e-05, 0.00010633468627929688, 0.00012040138244628906, 0.00013446807861328125, 0.00014853477478027344, 0.00016260147094726562, 0.0001766681671142578, 0.00019073486328125, 0.0002048015594482422, 0.00021886825561523438, 0.00023293495178222656, 0.00024700164794921875, 0.00026106834411621094, 0.0002751350402832031, 0.0002892017364501953, 0.0003032684326171875, 0.0003173351287841797, 0.0003314018249511719, 0.00034546852111816406, 0.00035953521728515625, 0.00037360191345214844, 0.0003876686096191406, 0.0004017353057861328, 0.000415802001953125, 0.0004298686981201172, 0.0004439353942871094, 0.00045800209045410156, 0.00047206878662109375, 0.00048613548278808594, 0.0005002021789550781]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 9.0, 13.0, 15.0, 14.0, 15.0, 20.0, 43.0, 45.0, 64.0, 107.0, 143.0, 267.0, 495.0, 1038.0, 107731.0, 935202.0, 1854.0, 543.0, 284.0, 201.0, 112.0, 71.0, 64.0, 30.0, 32.0, 23.0, 23.0, 15.0, 11.0, 7.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.012176513671875, -0.01179802417755127, -0.011419534683227539, -0.011041045188903809, -0.010662555694580078, -0.010284066200256348, -0.009905576705932617, -0.009527087211608887, -0.009148597717285156, -0.008770108222961426, -0.008391618728637695, -0.008013129234313965, -0.007634639739990234, -0.007256150245666504, -0.0068776607513427734, -0.006499171257019043, -0.0061206817626953125, -0.005742192268371582, -0.0053637027740478516, -0.004985213279724121, -0.004606723785400391, -0.00422823429107666, -0.0038497447967529297, -0.0034712553024291992, -0.0030927658081054688, -0.0027142763137817383, -0.002335786819458008, -0.0019572973251342773, -0.0015788078308105469, -0.0012003183364868164, -0.0008218288421630859, -0.00044333934783935547, -6.4849853515625e-05, 0.00031363964080810547, 0.0006921291351318359, 0.0010706186294555664, 0.0014491081237792969, 0.0018275976181030273, 0.002206087112426758, 0.0025845766067504883, 0.0029630661010742188, 0.0033415555953979492, 0.0037200450897216797, 0.00409853458404541, 0.004477024078369141, 0.004855513572692871, 0.0052340030670166016, 0.005612492561340332, 0.0059909820556640625, 0.006369471549987793, 0.0067479610443115234, 0.007126450538635254, 0.007504940032958984, 0.007883429527282715, 0.008261919021606445, 0.008640408515930176, 0.009018898010253906, 0.009397387504577637, 0.009775876998901367, 0.010154366493225098, 0.010532855987548828, 0.010911345481872559, 0.011289834976196289, 0.01166832447052002, 0.01204681396484375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 34.0, 180.0, 417.0, 275.0, 79.0, 19.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006863728631287813, -0.0006496244459412992, -0.0006128760287538171, -0.000576127611566335, -0.0005393791943788528, -0.0005026307189837098, -0.0004658823017962277, -0.0004291338846087456, -0.00039238546742126346, -0.00035563705023378134, -0.0003188886330462992, -0.00028214018675498664, -0.0002453917695675045, -0.0002086433523800224, -0.00017189492064062506, -0.0001351464889012277, -9.83980717137456e-05, -6.164964725030586e-05, -2.490122278686613e-05, 1.1847201676573604e-05, 4.859562614001334e-05, 8.534404332749546e-05, 0.0001220924750668928, 0.00015884090680629015, 0.00019558932399377227, 0.0002323377411812544, 0.0002690861583687365, 0.0003058346046600491, 0.0003425830218475312, 0.0003793314390350133, 0.0004160798853263259, 0.000452828302513808, 0.0004895767197012901, 0.0005263251368887722, 0.0005630735540762544, 0.0005998219712637365, 0.0006365703884512186, 0.0006733188638463616, 0.0007100672810338438, 0.0007468156982213259, 0.000783564115408808, 0.0008203125325962901, 0.0008570609497837722, 0.0008938093669712543, 0.0009305578423663974, 0.0009673062013462186, 0.0010040546767413616, 0.0010408030357211828, 0.0010775515111163259, 0.0011142999865114689, 0.00115104834549129, 0.0011877968208864331, 0.0012245451798662543, 0.0012612936552613974, 0.0012980420142412186, 0.0013347904896363616, 0.0013715389650315046, 0.0014082874404266477, 0.0014450357994064689, 0.001481784274801612, 0.001518532633781433, 0.0015552811091765761, 0.0015920294681563973, 0.0016287779435515404, 0.0016655263025313616]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 10.0, 9.0, 5.0, 3.0, 4.0, 9.0, 11.0, 14.0, 20.0, 15.0, 12.0, 18.0, 21.0, 23.0, 23.0, 32.0, 26.0, 36.0, 28.0, 29.0, 35.0, 27.0, 37.0, 35.0, 47.0, 36.0, 35.0, 30.0, 25.0, 30.0, 31.0, 34.0, 32.0, 29.0, 19.0, 29.0, 17.0, 18.0, 16.0, 12.0, 15.0, 5.0, 10.0, 7.0, 9.0, 5.0, 9.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0], "bins": [-0.0002532005310058594, -0.0002459865063428879, -0.00023877248167991638, -0.00023155845701694489, -0.0002243444323539734, -0.0002171304076910019, -0.0002099163830280304, -0.0002027023583650589, -0.0001954883337020874, -0.0001882743090391159, -0.0001810602843761444, -0.0001738462597131729, -0.00016663223505020142, -0.00015941821038722992, -0.00015220418572425842, -0.00014499016106128693, -0.00013777613639831543, -0.00013056211173534393, -0.00012334808707237244, -0.00011613406240940094, -0.00010892003774642944, -0.00010170601308345795, -9.449198842048645e-05, -8.727796375751495e-05, -8.006393909454346e-05, -7.284991443157196e-05, -6.563588976860046e-05, -5.842186510562897e-05, -5.120784044265747e-05, -4.3993815779685974e-05, -3.677979111671448e-05, -2.956576645374298e-05, -2.2351741790771484e-05, -1.5137717127799988e-05, -7.923692464828491e-06, -7.096678018569946e-07, 6.504356861114502e-06, 1.3718381524085999e-05, 2.0932406187057495e-05, 2.8146430850028992e-05, 3.536045551300049e-05, 4.2574480175971985e-05, 4.978850483894348e-05, 5.700252950191498e-05, 6.421655416488647e-05, 7.143057882785797e-05, 7.864460349082947e-05, 8.585862815380096e-05, 9.307265281677246e-05, 0.00010028667747974396, 0.00010750070214271545, 0.00011471472680568695, 0.00012192875146865845, 0.00012914277613162994, 0.00013635680079460144, 0.00014357082545757294, 0.00015078485012054443, 0.00015799887478351593, 0.00016521289944648743, 0.00017242692410945892, 0.00017964094877243042, 0.00018685497343540192, 0.0001940689980983734, 0.0002012830227613449, 0.0002084970474243164]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 6.0, 22.0, 22.0, 25.0, 17.0, 35.0, 36.0, 30.0, 36.0, 37.0, 50.0, 34.0, 48.0, 44.0, 42.0, 46.0, 53.0, 45.0, 36.0, 40.0, 32.0, 29.0, 23.0, 31.0, 29.0, 17.0, 14.0, 13.0, 20.0, 7.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.55078125, -6.3590087890625, -6.167236328125, -5.9754638671875, -5.78369140625, -5.5919189453125, -5.400146484375, -5.2083740234375, -5.0166015625, -4.8248291015625, -4.633056640625, -4.4412841796875, -4.24951171875, -4.0577392578125, -3.865966796875, -3.6741943359375, -3.482421875, -3.2906494140625, -3.098876953125, -2.9071044921875, -2.71533203125, -2.5235595703125, -2.331787109375, -2.1400146484375, -1.9482421875, -1.7564697265625, -1.564697265625, -1.3729248046875, -1.18115234375, -0.9893798828125, -0.797607421875, -0.6058349609375, -0.4140625, -0.2222900390625, -0.030517578125, 0.1612548828125, 0.35302734375, 0.5447998046875, 0.736572265625, 0.9283447265625, 1.1201171875, 1.3118896484375, 1.503662109375, 1.6954345703125, 1.88720703125, 2.0789794921875, 2.270751953125, 2.4625244140625, 2.654296875, 2.8460693359375, 3.037841796875, 3.2296142578125, 3.42138671875, 3.6131591796875, 3.804931640625, 3.9967041015625, 4.1884765625, 4.3802490234375, 4.572021484375, 4.7637939453125, 4.95556640625, 5.1473388671875, 5.339111328125, 5.5308837890625, 5.72265625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 11.0, 15.0, 22.0, 28.0, 33.0, 63.0, 88.0, 132.0, 234.0, 400.0, 616.0, 1197.0, 2148.0, 4364.0, 9285.0, 23070.0, 69216.0, 271163.0, 470391.0, 130645.0, 38222.0, 14247.0, 6268.0, 2936.0, 1565.0, 838.0, 503.0, 314.0, 170.0, 112.0, 76.0, 57.0, 41.0, 17.0, 15.0, 14.0, 5.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.2734375, -5.11944580078125, -4.9654541015625, -4.81146240234375, -4.657470703125, -4.50347900390625, -4.3494873046875, -4.19549560546875, -4.04150390625, -3.88751220703125, -3.7335205078125, -3.57952880859375, -3.425537109375, -3.27154541015625, -3.1175537109375, -2.96356201171875, -2.8095703125, -2.65557861328125, -2.5015869140625, -2.34759521484375, -2.193603515625, -2.03961181640625, -1.8856201171875, -1.73162841796875, -1.57763671875, -1.42364501953125, -1.2696533203125, -1.11566162109375, -0.961669921875, -0.80767822265625, -0.6536865234375, -0.49969482421875, -0.345703125, -0.19171142578125, -0.0377197265625, 0.11627197265625, 0.270263671875, 0.42425537109375, 0.5782470703125, 0.73223876953125, 0.88623046875, 1.04022216796875, 1.1942138671875, 1.34820556640625, 1.502197265625, 1.65618896484375, 1.8101806640625, 1.96417236328125, 2.1181640625, 2.27215576171875, 2.4261474609375, 2.58013916015625, 2.734130859375, 2.88812255859375, 3.0421142578125, 3.19610595703125, 3.35009765625, 3.50408935546875, 3.6580810546875, 3.81207275390625, 3.966064453125, 4.12005615234375, 4.2740478515625, 4.42803955078125, 4.58203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 8.0, 5.0, 9.0, 14.0, 6.0, 19.0, 15.0, 31.0, 21.0, 26.0, 24.0, 27.0, 40.0, 43.0, 43.0, 39.0, 62.0, 112.0, 444.0, 1519.0, 111.0, 60.0, 44.0, 34.0, 31.0, 43.0, 38.0, 27.0, 21.0, 22.0, 23.0, 12.0, 10.0, 15.0, 12.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.796875, -22.146484375, -21.49609375, -20.845703125, -20.1953125, -19.544921875, -18.89453125, -18.244140625, -17.59375, -16.943359375, -16.29296875, -15.642578125, -14.9921875, -14.341796875, -13.69140625, -13.041015625, -12.390625, -11.740234375, -11.08984375, -10.439453125, -9.7890625, -9.138671875, -8.48828125, -7.837890625, -7.1875, -6.537109375, -5.88671875, -5.236328125, -4.5859375, -3.935546875, -3.28515625, -2.634765625, -1.984375, -1.333984375, -0.68359375, -0.033203125, 0.6171875, 1.267578125, 1.91796875, 2.568359375, 3.21875, 3.869140625, 4.51953125, 5.169921875, 5.8203125, 6.470703125, 7.12109375, 7.771484375, 8.421875, 9.072265625, 9.72265625, 10.373046875, 11.0234375, 11.673828125, 12.32421875, 12.974609375, 13.625, 14.275390625, 14.92578125, 15.576171875, 16.2265625, 16.876953125, 17.52734375, 18.177734375, 18.828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 4.0, 5.0, 9.0, 9.0, 12.0, 16.0, 16.0, 18.0, 24.0, 34.0, 33.0, 45.0, 69.0, 120.0, 116.0, 187.0, 300.0, 520.0, 2440.0, 644345.0, 2492429.0, 3273.0, 572.0, 321.0, 207.0, 132.0, 96.0, 70.0, 66.0, 46.0, 31.0, 38.0, 16.0, 22.0, 10.0, 14.0, 8.0, 11.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-38.65625, -37.32568359375, -35.9951171875, -34.66455078125, -33.333984375, -32.00341796875, -30.6728515625, -29.34228515625, -28.01171875, -26.68115234375, -25.3505859375, -24.02001953125, -22.689453125, -21.35888671875, -20.0283203125, -18.69775390625, -17.3671875, -16.03662109375, -14.7060546875, -13.37548828125, -12.044921875, -10.71435546875, -9.3837890625, -8.05322265625, -6.72265625, -5.39208984375, -4.0615234375, -2.73095703125, -1.400390625, -0.06982421875, 1.2607421875, 2.59130859375, 3.921875, 5.25244140625, 6.5830078125, 7.91357421875, 9.244140625, 10.57470703125, 11.9052734375, 13.23583984375, 14.56640625, 15.89697265625, 17.2275390625, 18.55810546875, 19.888671875, 21.21923828125, 22.5498046875, 23.88037109375, 25.2109375, 26.54150390625, 27.8720703125, 29.20263671875, 30.533203125, 31.86376953125, 33.1943359375, 34.52490234375, 35.85546875, 37.18603515625, 38.5166015625, 39.84716796875, 41.177734375, 42.50830078125, 43.8388671875, 45.16943359375, 46.5]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 41.0, 225.0, 452.0, 246.0, 35.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.57462310791016, -66.5911865234375, -64.60775756835938, -62.62432098388672, -60.64088439941406, -58.657447814941406, -56.674015045166016, -54.690582275390625, -52.70714569091797, -50.72370910644531, -48.74027633666992, -46.75684356689453, -44.773406982421875, -42.78997039794922, -40.80653762817383, -38.82310485839844, -36.83966827392578, -34.856231689453125, -32.872798919677734, -30.88936424255371, -28.905929565429688, -26.922494888305664, -24.93906021118164, -22.955625534057617, -20.972190856933594, -18.98875617980957, -17.005321502685547, -15.021886825561523, -13.0384521484375, -11.055017471313477, -9.071582794189453, -7.08814811706543, -5.104709625244141, -3.121274948120117, -1.1378402709960938, 0.8455944061279297, 2.829029083251953, 4.812463760375977, 6.7958984375, 8.779333114624023, 10.762767791748047, 12.74620246887207, 14.729637145996094, 16.713071823120117, 18.69650650024414, 20.679941177368164, 22.663375854492188, 24.64681053161621, 26.630245208740234, 28.613679885864258, 30.59711456298828, 32.58055114746094, 34.56398391723633, 36.54741668701172, 38.530853271484375, 40.51428985595703, 42.49772262573242, 44.48115539550781, 46.46459197998047, 48.448028564453125, 50.431461334228516, 52.414894104003906, 54.39833068847656, 56.38176727294922, 58.36520004272461]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 8.0, 8.0, 9.0, 13.0, 22.0, 17.0, 17.0, 18.0, 18.0, 26.0, 30.0, 33.0, 31.0, 40.0, 52.0, 54.0, 37.0, 51.0, 51.0, 66.0, 52.0, 39.0, 33.0, 34.0, 36.0, 26.0, 29.0, 28.0, 19.0, 14.0, 21.0, 6.0, 8.0, 15.0, 9.0, 5.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.504302978515625, -58.72920227050781, -56.954105377197266, -55.17900466918945, -53.403907775878906, -51.628807067871094, -49.85370635986328, -48.078609466552734, -46.30350875854492, -44.52840805053711, -42.75331115722656, -40.97821044921875, -39.2031135559082, -37.42801284790039, -35.652915954589844, -33.87781524658203, -32.10271453857422, -30.32761573791504, -28.55251693725586, -26.777416229248047, -25.002317428588867, -23.227218627929688, -21.452119827270508, -19.677021026611328, -17.90192413330078, -16.1268253326416, -14.351725578308105, -12.576626777648926, -10.80152702331543, -9.02642822265625, -7.25132942199707, -5.476229667663574, -3.701129913330078, -1.9260307550430298, -0.15093159675598145, 1.6241674423217773, 3.3992667198181152, 5.174365997314453, 6.949464797973633, 8.724564552307129, 10.499663352966309, 12.274762153625488, 14.049861907958984, 15.824960708618164, 17.600059509277344, 19.375160217285156, 21.150257110595703, 22.925357818603516, 24.700456619262695, 26.475555419921875, 28.250654220581055, 30.025753021240234, 31.800853729248047, 33.575950622558594, 35.351051330566406, 37.12615203857422, 38.901248931884766, 40.67634963989258, 42.451446533203125, 44.22654724121094, 46.001644134521484, 47.7767448425293, 49.551841735839844, 51.326942443847656, 53.10204315185547]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 10.0, 13.0, 9.0, 21.0, 19.0, 27.0, 19.0, 29.0, 30.0, 35.0, 39.0, 35.0, 27.0, 51.0, 52.0, 36.0, 43.0, 42.0, 41.0, 49.0, 57.0, 31.0, 24.0, 38.0, 28.0, 23.0, 26.0, 20.0, 22.0, 20.0, 19.0, 9.0, 9.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.6640625, -6.47216796875, -6.2802734375, -6.08837890625, -5.896484375, -5.70458984375, -5.5126953125, -5.32080078125, -5.12890625, -4.93701171875, -4.7451171875, -4.55322265625, -4.361328125, -4.16943359375, -3.9775390625, -3.78564453125, -3.59375, -3.40185546875, -3.2099609375, -3.01806640625, -2.826171875, -2.63427734375, -2.4423828125, -2.25048828125, -2.05859375, -1.86669921875, -1.6748046875, -1.48291015625, -1.291015625, -1.09912109375, -0.9072265625, -0.71533203125, -0.5234375, -0.33154296875, -0.1396484375, 0.05224609375, 0.244140625, 0.43603515625, 0.6279296875, 0.81982421875, 1.01171875, 1.20361328125, 1.3955078125, 1.58740234375, 1.779296875, 1.97119140625, 2.1630859375, 2.35498046875, 2.546875, 2.73876953125, 2.9306640625, 3.12255859375, 3.314453125, 3.50634765625, 3.6982421875, 3.89013671875, 4.08203125, 4.27392578125, 4.4658203125, 4.65771484375, 4.849609375, 5.04150390625, 5.2333984375, 5.42529296875, 5.6171875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 6.0, 9.0, 10.0, 12.0, 14.0, 19.0, 26.0, 27.0, 31.0, 30.0, 45.0, 62.0, 60.0, 120.0, 232.0, 862.0, 17477.0, 3487930.0, 682171.0, 4040.0, 480.0, 166.0, 98.0, 62.0, 52.0, 42.0, 41.0, 27.0, 21.0, 15.0, 18.0, 16.0, 12.0, 13.0, 8.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.8125, -37.697265625, -36.58203125, -35.466796875, -34.3515625, -33.236328125, -32.12109375, -31.005859375, -29.890625, -28.775390625, -27.66015625, -26.544921875, -25.4296875, -24.314453125, -23.19921875, -22.083984375, -20.96875, -19.853515625, -18.73828125, -17.623046875, -16.5078125, -15.392578125, -14.27734375, -13.162109375, -12.046875, -10.931640625, -9.81640625, -8.701171875, -7.5859375, -6.470703125, -5.35546875, -4.240234375, -3.125, -2.009765625, -0.89453125, 0.220703125, 1.3359375, 2.451171875, 3.56640625, 4.681640625, 5.796875, 6.912109375, 8.02734375, 9.142578125, 10.2578125, 11.373046875, 12.48828125, 13.603515625, 14.71875, 15.833984375, 16.94921875, 18.064453125, 19.1796875, 20.294921875, 21.41015625, 22.525390625, 23.640625, 24.755859375, 25.87109375, 26.986328125, 28.1015625, 29.216796875, 30.33203125, 31.447265625, 32.5625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 9.0, 17.0, 17.0, 23.0, 24.0, 35.0, 42.0, 47.0, 73.0, 84.0, 125.0, 175.0, 214.0, 287.0, 310.0, 342.0, 392.0, 405.0, 321.0, 255.0, 201.0, 137.0, 103.0, 83.0, 70.0, 52.0, 48.0, 42.0, 39.0, 20.0, 21.0, 13.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-11.6640625, -11.3040771484375, -10.944091796875, -10.5841064453125, -10.22412109375, -9.8641357421875, -9.504150390625, -9.1441650390625, -8.7841796875, -8.4241943359375, -8.064208984375, -7.7042236328125, -7.34423828125, -6.9842529296875, -6.624267578125, -6.2642822265625, -5.904296875, -5.5443115234375, -5.184326171875, -4.8243408203125, -4.46435546875, -4.1043701171875, -3.744384765625, -3.3843994140625, -3.0244140625, -2.6644287109375, -2.304443359375, -1.9444580078125, -1.58447265625, -1.2244873046875, -0.864501953125, -0.5045166015625, -0.14453125, 0.2154541015625, 0.575439453125, 0.9354248046875, 1.29541015625, 1.6553955078125, 2.015380859375, 2.3753662109375, 2.7353515625, 3.0953369140625, 3.455322265625, 3.8153076171875, 4.17529296875, 4.5352783203125, 4.895263671875, 5.2552490234375, 5.615234375, 5.9752197265625, 6.335205078125, 6.6951904296875, 7.05517578125, 7.4151611328125, 7.775146484375, 8.1351318359375, 8.4951171875, 8.8551025390625, 9.215087890625, 9.5750732421875, 9.93505859375, 10.2950439453125, 10.655029296875, 11.0150146484375, 11.375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 4.0, 1.0, 13.0, 7.0, 10.0, 11.0, 16.0, 30.0, 32.0, 30.0, 54.0, 48.0, 75.0, 80.0, 103.0, 146.0, 173.0, 267.0, 399.0, 869.0, 6599.0, 2688803.0, 1489234.0, 5082.0, 800.0, 418.0, 249.0, 165.0, 117.0, 103.0, 76.0, 70.0, 36.0, 40.0, 27.0, 27.0, 12.0, 18.0, 11.0, 12.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.625, -41.876953125, -40.12890625, -38.380859375, -36.6328125, -34.884765625, -33.13671875, -31.388671875, -29.640625, -27.892578125, -26.14453125, -24.396484375, -22.6484375, -20.900390625, -19.15234375, -17.404296875, -15.65625, -13.908203125, -12.16015625, -10.412109375, -8.6640625, -6.916015625, -5.16796875, -3.419921875, -1.671875, 0.076171875, 1.82421875, 3.572265625, 5.3203125, 7.068359375, 8.81640625, 10.564453125, 12.3125, 14.060546875, 15.80859375, 17.556640625, 19.3046875, 21.052734375, 22.80078125, 24.548828125, 26.296875, 28.044921875, 29.79296875, 31.541015625, 33.2890625, 35.037109375, 36.78515625, 38.533203125, 40.28125, 42.029296875, 43.77734375, 45.525390625, 47.2734375, 49.021484375, 50.76953125, 52.517578125, 54.265625, 56.013671875, 57.76171875, 59.509765625, 61.2578125, 63.005859375, 64.75390625, 66.501953125, 68.25]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 14.0, 41.0, 103.0, 176.0, 238.0, 231.0, 116.0, 63.0, 16.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.58984375, -22.22252082824707, -18.85519790649414, -15.487876892089844, -12.120553970336914, -8.753231048583984, -5.3859100341796875, -2.018587112426758, 1.3487358093261719, 4.716058254241943, 8.083380699157715, 11.450702667236328, 14.818025588989258, 18.185348510742188, 21.552669525146484, 24.919992446899414, 28.287315368652344, 31.654638290405273, 35.0219612121582, 38.3892822265625, 41.75660705566406, 45.12392807006836, 48.491249084472656, 51.85857391357422, 55.225894927978516, 58.59321594238281, 61.960540771484375, 65.32786560058594, 68.69518280029297, 72.06250762939453, 75.42982482910156, 78.79714965820312, 82.16447448730469, 85.53179931640625, 88.89911651611328, 92.26644134521484, 95.6337661743164, 99.00108337402344, 102.368408203125, 105.73573303222656, 109.10305786132812, 112.47038269042969, 115.83769989013672, 119.20502471923828, 122.57234954833984, 125.93966674804688, 129.30699157714844, 132.67431640625, 136.0416259765625, 139.40895080566406, 142.77627563476562, 146.14358520507812, 149.5109100341797, 152.87823486328125, 156.2455596923828, 159.61288452148438, 162.98020935058594, 166.3475341796875, 169.71485900878906, 173.08218383789062, 176.44949340820312, 179.8168182373047, 183.18414306640625, 186.5514678955078, 189.91879272460938]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 7.0, 10.0, 12.0, 12.0, 3.0, 17.0, 16.0, 15.0, 19.0, 19.0, 23.0, 22.0, 21.0, 26.0, 41.0, 34.0, 41.0, 36.0, 44.0, 38.0, 44.0, 38.0, 47.0, 43.0, 31.0, 41.0, 31.0, 30.0, 23.0, 22.0, 27.0, 20.0, 30.0, 16.0, 12.0, 8.0, 19.0, 9.0, 10.0, 12.0, 5.0, 2.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.049949645996094, -34.77021789550781, -33.49048614501953, -32.21075439453125, -30.93102264404297, -29.651290893554688, -28.371559143066406, -27.091827392578125, -25.812095642089844, -24.532363891601562, -23.25263214111328, -21.972900390625, -20.69316864013672, -19.413436889648438, -18.133705139160156, -16.853973388671875, -15.574239730834961, -14.29450798034668, -13.014776229858398, -11.735044479370117, -10.455312728881836, -9.175580978393555, -7.895848274230957, -6.616116523742676, -5.3363847732543945, -4.056653022766113, -2.776921033859253, -1.4971890449523926, -0.21745729446411133, 1.06227445602417, 2.3420066833496094, 3.6217384338378906, 4.901470184326172, 6.181201934814453, 7.460933685302734, 8.740665435791016, 10.020397186279297, 11.300128936767578, 12.579861640930176, 13.859593391418457, 15.139325141906738, 16.419057846069336, 17.698789596557617, 18.9785213470459, 20.25825309753418, 21.53798484802246, 22.817716598510742, 24.097448348999023, 25.377180099487305, 26.656911849975586, 27.936643600463867, 29.21637535095215, 30.49610710144043, 31.77583885192871, 33.055572509765625, 34.335304260253906, 35.61503601074219, 36.89476776123047, 38.17449951171875, 39.45423126220703, 40.73396301269531, 42.013694763183594, 43.293426513671875, 44.573158264160156, 45.85289001464844]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 13.0, 7.0, 8.0, 15.0, 13.0, 16.0, 21.0, 17.0, 25.0, 30.0, 33.0, 33.0, 36.0, 30.0, 46.0, 31.0, 35.0, 41.0, 26.0, 48.0, 40.0, 39.0, 44.0, 41.0, 27.0, 39.0, 26.0, 28.0, 29.0, 28.0, 16.0, 20.0, 20.0, 15.0, 12.0, 7.0, 14.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.1514892578125, -5.970947265625, -5.7904052734375, -5.60986328125, -5.4293212890625, -5.248779296875, -5.0682373046875, -4.8876953125, -4.7071533203125, -4.526611328125, -4.3460693359375, -4.16552734375, -3.9849853515625, -3.804443359375, -3.6239013671875, -3.443359375, -3.2628173828125, -3.082275390625, -2.9017333984375, -2.72119140625, -2.5406494140625, -2.360107421875, -2.1795654296875, -1.9990234375, -1.8184814453125, -1.637939453125, -1.4573974609375, -1.27685546875, -1.0963134765625, -0.915771484375, -0.7352294921875, -0.5546875, -0.3741455078125, -0.193603515625, -0.0130615234375, 0.16748046875, 0.3480224609375, 0.528564453125, 0.7091064453125, 0.8896484375, 1.0701904296875, 1.250732421875, 1.4312744140625, 1.61181640625, 1.7923583984375, 1.972900390625, 2.1534423828125, 2.333984375, 2.5145263671875, 2.695068359375, 2.8756103515625, 3.05615234375, 3.2366943359375, 3.417236328125, 3.5977783203125, 3.7783203125, 3.9588623046875, 4.139404296875, 4.3199462890625, 4.50048828125, 4.6810302734375, 4.861572265625, 5.0421142578125, 5.22265625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 9.0, 18.0, 26.0, 41.0, 45.0, 75.0, 118.0, 158.0, 195.0, 315.0, 476.0, 664.0, 916.0, 1365.0, 1929.0, 2785.0, 4232.0, 6430.0, 9579.0, 14449.0, 22414.0, 35127.0, 55854.0, 89463.0, 146149.0, 227960.0, 159915.0, 97740.0, 60889.0, 37760.0, 24092.0, 15798.0, 10257.0, 6864.0, 4595.0, 3073.0, 2098.0, 1467.0, 964.0, 667.0, 513.0, 286.0, 243.0, 147.0, 123.0, 82.0, 60.0, 32.0, 37.0, 16.0, 11.0, 11.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.84423828125, -0.8175125122070312, -0.7907867431640625, -0.7640609741210938, -0.737335205078125, -0.7106094360351562, -0.6838836669921875, -0.6571578979492188, -0.63043212890625, -0.6037063598632812, -0.5769805908203125, -0.5502548217773438, -0.523529052734375, -0.49680328369140625, -0.4700775146484375, -0.44335174560546875, -0.4166259765625, -0.38990020751953125, -0.3631744384765625, -0.33644866943359375, -0.309722900390625, -0.28299713134765625, -0.2562713623046875, -0.22954559326171875, -0.20281982421875, -0.17609405517578125, -0.1493682861328125, -0.12264251708984375, -0.095916748046875, -0.06919097900390625, -0.0424652099609375, -0.01573944091796875, 0.010986328125, 0.03771209716796875, 0.0644378662109375, 0.09116363525390625, 0.117889404296875, 0.14461517333984375, 0.1713409423828125, 0.19806671142578125, 0.22479248046875, 0.25151824951171875, 0.2782440185546875, 0.30496978759765625, 0.331695556640625, 0.35842132568359375, 0.3851470947265625, 0.41187286376953125, 0.4385986328125, 0.46532440185546875, 0.4920501708984375, 0.5187759399414062, 0.545501708984375, 0.5722274780273438, 0.5989532470703125, 0.6256790161132812, 0.65240478515625, 0.6791305541992188, 0.7058563232421875, 0.7325820922851562, 0.759307861328125, 0.7860336303710938, 0.8127593994140625, 0.8394851684570312, 0.8662109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 3.0, 6.0, 7.0, 16.0, 18.0, 21.0, 23.0, 31.0, 22.0, 32.0, 48.0, 38.0, 39.0, 31.0, 36.0, 45.0, 44.0, 1077.0, 41.0, 45.0, 48.0, 39.0, 29.0, 41.0, 22.0, 29.0, 27.0, 24.0, 22.0, 21.0, 16.0, 15.0, 11.0, 7.0, 8.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.390625, -4.267822265625, -4.14501953125, -4.022216796875, -3.8994140625, -3.776611328125, -3.65380859375, -3.531005859375, -3.408203125, -3.285400390625, -3.16259765625, -3.039794921875, -2.9169921875, -2.794189453125, -2.67138671875, -2.548583984375, -2.42578125, -2.302978515625, -2.18017578125, -2.057373046875, -1.9345703125, -1.811767578125, -1.68896484375, -1.566162109375, -1.443359375, -1.320556640625, -1.19775390625, -1.074951171875, -0.9521484375, -0.829345703125, -0.70654296875, -0.583740234375, -0.4609375, -0.338134765625, -0.21533203125, -0.092529296875, 0.0302734375, 0.153076171875, 0.27587890625, 0.398681640625, 0.521484375, 0.644287109375, 0.76708984375, 0.889892578125, 1.0126953125, 1.135498046875, 1.25830078125, 1.381103515625, 1.50390625, 1.626708984375, 1.74951171875, 1.872314453125, 1.9951171875, 2.117919921875, 2.24072265625, 2.363525390625, 2.486328125, 2.609130859375, 2.73193359375, 2.854736328125, 2.9775390625, 3.100341796875, 3.22314453125, 3.345947265625, 3.46875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 9.0, 9.0, 15.0, 23.0, 33.0, 67.0, 95.0, 124.0, 186.0, 286.0, 452.0, 626.0, 967.0, 1513.0, 2239.0, 3438.0, 5013.0, 7713.0, 12092.0, 18818.0, 30214.0, 49345.0, 83538.0, 149650.0, 1311109.0, 174373.0, 96039.0, 55742.0, 33704.0, 21266.0, 13136.0, 8562.0, 5725.0, 3724.0, 2449.0, 1653.0, 1100.0, 722.0, 446.0, 298.0, 213.0, 134.0, 88.0, 69.0, 33.0, 26.0, 17.0, 13.0, 9.0, 6.0, 2.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.833984375, -0.8067474365234375, -0.779510498046875, -0.7522735595703125, -0.72503662109375, -0.6977996826171875, -0.670562744140625, -0.6433258056640625, -0.6160888671875, -0.5888519287109375, -0.561614990234375, -0.5343780517578125, -0.50714111328125, -0.4799041748046875, -0.452667236328125, -0.4254302978515625, -0.398193359375, -0.3709564208984375, -0.343719482421875, -0.3164825439453125, -0.28924560546875, -0.2620086669921875, -0.234771728515625, -0.2075347900390625, -0.1802978515625, -0.1530609130859375, -0.125823974609375, -0.0985870361328125, -0.07135009765625, -0.0441131591796875, -0.016876220703125, 0.0103607177734375, 0.03759765625, 0.0648345947265625, 0.092071533203125, 0.1193084716796875, 0.14654541015625, 0.1737823486328125, 0.201019287109375, 0.2282562255859375, 0.2554931640625, 0.2827301025390625, 0.309967041015625, 0.3372039794921875, 0.36444091796875, 0.3916778564453125, 0.418914794921875, 0.4461517333984375, 0.473388671875, 0.5006256103515625, 0.527862548828125, 0.5550994873046875, 0.58233642578125, 0.6095733642578125, 0.636810302734375, 0.6640472412109375, 0.6912841796875, 0.7185211181640625, 0.745758056640625, 0.7729949951171875, 0.80023193359375, 0.8274688720703125, 0.854705810546875, 0.8819427490234375, 0.9091796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 6.0, 6.0, 9.0, 14.0, 8.0, 13.0, 11.0, 17.0, 22.0, 26.0, 44.0, 39.0, 45.0, 45.0, 57.0, 69.0, 71.0, 54.0, 71.0, 57.0, 49.0, 45.0, 40.0, 30.0, 23.0, 26.0, 15.0, 15.0, 11.0, 9.0, 15.0, 6.0, 5.0, 5.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005655288696289062, -0.0005484223365783691, -0.000531315803527832, -0.0005142092704772949, -0.0004971027374267578, -0.0004799962043762207, -0.0004628896713256836, -0.0004457831382751465, -0.0004286766052246094, -0.00041157007217407227, -0.00039446353912353516, -0.00037735700607299805, -0.00036025047302246094, -0.00034314393997192383, -0.0003260374069213867, -0.0003089308738708496, -0.0002918243408203125, -0.0002747178077697754, -0.0002576112747192383, -0.00024050474166870117, -0.00022339820861816406, -0.00020629167556762695, -0.00018918514251708984, -0.00017207860946655273, -0.00015497207641601562, -0.00013786554336547852, -0.0001207590103149414, -0.0001036524772644043, -8.654594421386719e-05, -6.943941116333008e-05, -5.233287811279297e-05, -3.522634506225586e-05, -1.811981201171875e-05, -1.0132789611816406e-06, 1.609325408935547e-05, 3.319978713989258e-05, 5.030632019042969e-05, 6.74128532409668e-05, 8.45193862915039e-05, 0.00010162591934204102, 0.00011873245239257812, 0.00013583898544311523, 0.00015294551849365234, 0.00017005205154418945, 0.00018715858459472656, 0.00020426511764526367, 0.00022137165069580078, 0.0002384781837463379, 0.000255584716796875, 0.0002726912498474121, 0.0002897977828979492, 0.00030690431594848633, 0.00032401084899902344, 0.00034111738204956055, 0.00035822391510009766, 0.00037533044815063477, 0.0003924369812011719, 0.000409543514251709, 0.0004266500473022461, 0.0004437565803527832, 0.0004608631134033203, 0.0004779696464538574, 0.0004950761795043945, 0.0005121827125549316, 0.0005292892456054688]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 12.0, 12.0, 25.0, 20.0, 28.0, 53.0, 77.0, 126.0, 210.0, 491.0, 1654.0, 1016260.0, 27997.0, 780.0, 296.0, 164.0, 102.0, 80.0, 41.0, 38.0, 12.0, 14.0, 15.0, 9.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157012939453125, -0.015190839767456055, -0.01468038558959961, -0.014169931411743164, -0.013659477233886719, -0.013149023056030273, -0.012638568878173828, -0.012128114700317383, -0.011617660522460938, -0.011107206344604492, -0.010596752166748047, -0.010086297988891602, -0.009575843811035156, -0.009065389633178711, -0.008554935455322266, -0.00804448127746582, -0.007534027099609375, -0.00702357292175293, -0.006513118743896484, -0.006002664566040039, -0.005492210388183594, -0.0049817562103271484, -0.004471302032470703, -0.003960847854614258, -0.0034503936767578125, -0.002939939498901367, -0.002429485321044922, -0.0019190311431884766, -0.0014085769653320312, -0.0008981227874755859, -0.0003876686096191406, 0.0001227855682373047, 0.00063323974609375, 0.0011436939239501953, 0.0016541481018066406, 0.002164602279663086, 0.0026750564575195312, 0.0031855106353759766, 0.003695964813232422, 0.004206418991088867, 0.0047168731689453125, 0.005227327346801758, 0.005737781524658203, 0.0062482357025146484, 0.006758689880371094, 0.007269144058227539, 0.007779598236083984, 0.00829005241394043, 0.008800506591796875, 0.00931096076965332, 0.009821414947509766, 0.010331869125366211, 0.010842323303222656, 0.011352777481079102, 0.011863231658935547, 0.012373685836791992, 0.012884140014648438, 0.013394594192504883, 0.013905048370361328, 0.014415502548217773, 0.014925956726074219, 0.015436410903930664, 0.01594686508178711, 0.016457319259643555, 0.0169677734375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 105.0, 682.0, 215.0, 9.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009810629999265075, -0.00091396807692945, -0.0008468731539323926, -0.0007797781727276742, -0.0007126832497306168, -0.0006455883267335594, -0.000578493345528841, -0.0005113984225317836, -0.00044430349953472614, -0.0003772085765376687, -0.0003101136244367808, -0.00024301868688780814, -0.00017592374933883548, -0.00010882882634177804, -4.1733874240890145e-05, 2.536107785999775e-05, 9.245600085705519e-05, 0.00015955093840602785, 0.00022664587595500052, 0.0002937408280558884, 0.00036083575105294585, 0.0004279306740500033, 0.0004950256552547216, 0.0005621205782517791, 0.0006292155012488365, 0.000696310424245894, 0.0007634053472429514, 0.0008305003284476697, 0.0008975952514447272, 0.0009646901744417846, 0.001031785155646503, 0.0010988800786435604, 0.0011659751180559397, 0.0012330700410529971, 0.0013001649640500546, 0.001367259887047112, 0.0014343548100441694, 0.0015014498494565487, 0.0015685447724536061, 0.0016356396954506636, 0.001702734618447721, 0.0017698295414447784, 0.0018369244644418359, 0.0019040193874388933, 0.0019711144268512726, 0.002038209233433008, 0.0021053042728453875, 0.0021723993122577667, 0.0022394941188395023, 0.0023065891582518816, 0.002373683964833617, 0.0024407790042459965, 0.002507873810827732, 0.0025749688502401114, 0.002642063656821847, 0.0027091586962342262, 0.002776253502815962, 0.002843348542228341, 0.0029104433488100767, 0.002977538388222456, 0.0030446331948041916, 0.003111728234216571, 0.0031788230407983065, 0.0032459180802106857, 0.003313013119623065]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 3.0, 1.0, 6.0, 11.0, 3.0, 5.0, 8.0, 10.0, 15.0, 5.0, 12.0, 29.0, 13.0, 25.0, 31.0, 33.0, 37.0, 43.0, 40.0, 34.0, 38.0, 32.0, 36.0, 36.0, 37.0, 33.0, 30.0, 32.0, 47.0, 33.0, 35.0, 28.0, 24.0, 23.0, 35.0, 16.0, 17.0, 11.0, 13.0, 12.0, 14.0, 9.0, 11.0, 11.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0002714991569519043, -0.0002638213336467743, -0.0002561435103416443, -0.0002484656870365143, -0.00024078786373138428, -0.00023311004042625427, -0.00022543221712112427, -0.00021775439381599426, -0.00021007657051086426, -0.00020239874720573425, -0.00019472092390060425, -0.00018704310059547424, -0.00017936527729034424, -0.00017168745398521423, -0.00016400963068008423, -0.00015633180737495422, -0.00014865398406982422, -0.00014097616076469421, -0.0001332983374595642, -0.0001256205141544342, -0.0001179426908493042, -0.0001102648675441742, -0.00010258704423904419, -9.490922093391418e-05, -8.723139762878418e-05, -7.955357432365417e-05, -7.187575101852417e-05, -6.419792771339417e-05, -5.652010440826416e-05, -4.8842281103134155e-05, -4.116445779800415e-05, -3.3486634492874146e-05, -2.580881118774414e-05, -1.8130987882614136e-05, -1.0453164577484131e-05, -2.775341272354126e-06, 4.902482032775879e-06, 1.2580305337905884e-05, 2.025812864303589e-05, 2.7935951948165894e-05, 3.56137752532959e-05, 4.32915985584259e-05, 5.096942186355591e-05, 5.864724516868591e-05, 6.632506847381592e-05, 7.400289177894592e-05, 8.168071508407593e-05, 8.935853838920593e-05, 9.703636169433594e-05, 0.00010471418499946594, 0.00011239200830459595, 0.00012006983160972595, 0.00012774765491485596, 0.00013542547821998596, 0.00014310330152511597, 0.00015078112483024597, 0.00015845894813537598, 0.00016613677144050598, 0.00017381459474563599, 0.000181492418050766, 0.000189170241355896, 0.000196848064661026, 0.000204525887966156, 0.000212203711271286, 0.00021988153457641602]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 13.0, 7.0, 8.0, 15.0, 13.0, 16.0, 21.0, 17.0, 25.0, 30.0, 33.0, 33.0, 36.0, 30.0, 46.0, 31.0, 35.0, 41.0, 26.0, 48.0, 40.0, 39.0, 44.0, 41.0, 27.0, 39.0, 26.0, 28.0, 29.0, 28.0, 16.0, 21.0, 19.0, 15.0, 12.0, 7.0, 14.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.1514892578125, -5.970947265625, -5.7904052734375, -5.60986328125, -5.4293212890625, -5.248779296875, -5.0682373046875, -4.8876953125, -4.7071533203125, -4.526611328125, -4.3460693359375, -4.16552734375, -3.9849853515625, -3.804443359375, -3.6239013671875, -3.443359375, -3.2628173828125, -3.082275390625, -2.9017333984375, -2.72119140625, -2.5406494140625, -2.360107421875, -2.1795654296875, -1.9990234375, -1.8184814453125, -1.637939453125, -1.4573974609375, -1.27685546875, -1.0963134765625, -0.915771484375, -0.7352294921875, -0.5546875, -0.3741455078125, -0.193603515625, -0.0130615234375, 0.16748046875, 0.3480224609375, 0.528564453125, 0.7091064453125, 0.8896484375, 1.0701904296875, 1.250732421875, 1.4312744140625, 1.61181640625, 1.7923583984375, 1.972900390625, 2.1534423828125, 2.333984375, 2.5145263671875, 2.695068359375, 2.8756103515625, 3.05615234375, 3.2366943359375, 3.417236328125, 3.5977783203125, 3.7783203125, 3.9588623046875, 4.139404296875, 4.3199462890625, 4.50048828125, 4.6810302734375, 4.861572265625, 5.0421142578125, 5.22265625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 9.0, 10.0, 11.0, 13.0, 25.0, 39.0, 49.0, 80.0, 113.0, 144.0, 227.0, 372.0, 593.0, 969.0, 1526.0, 2629.0, 4192.0, 7286.0, 12230.0, 22611.0, 43806.0, 92643.0, 232976.0, 354338.0, 139737.0, 61580.0, 30810.0, 16265.0, 9209.0, 5593.0, 3174.0, 1956.0, 1249.0, 747.0, 447.0, 283.0, 203.0, 128.0, 85.0, 61.0, 47.0, 30.0, 18.0, 14.0, 11.0, 7.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.00390625, -2.907745361328125, -2.81158447265625, -2.715423583984375, -2.6192626953125, -2.523101806640625, -2.42694091796875, -2.330780029296875, -2.234619140625, -2.138458251953125, -2.04229736328125, -1.946136474609375, -1.8499755859375, -1.753814697265625, -1.65765380859375, -1.561492919921875, -1.46533203125, -1.369171142578125, -1.27301025390625, -1.176849365234375, -1.0806884765625, -0.984527587890625, -0.88836669921875, -0.792205810546875, -0.696044921875, -0.599884033203125, -0.50372314453125, -0.407562255859375, -0.3114013671875, -0.215240478515625, -0.11907958984375, -0.022918701171875, 0.0732421875, 0.169403076171875, 0.26556396484375, 0.361724853515625, 0.4578857421875, 0.554046630859375, 0.65020751953125, 0.746368408203125, 0.842529296875, 0.938690185546875, 1.03485107421875, 1.131011962890625, 1.2271728515625, 1.323333740234375, 1.41949462890625, 1.515655517578125, 1.61181640625, 1.707977294921875, 1.80413818359375, 1.900299072265625, 1.9964599609375, 2.092620849609375, 2.18878173828125, 2.284942626953125, 2.381103515625, 2.477264404296875, 2.57342529296875, 2.669586181640625, 2.7657470703125, 2.861907958984375, 2.95806884765625, 3.054229736328125, 3.150390625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 4.0, 6.0, 7.0, 4.0, 7.0, 16.0, 12.0, 18.0, 23.0, 17.0, 27.0, 31.0, 33.0, 47.0, 52.0, 57.0, 102.0, 1565.0, 449.0, 105.0, 56.0, 53.0, 58.0, 47.0, 40.0, 31.0, 25.0, 32.0, 21.0, 22.0, 20.0, 10.0, 13.0, 6.0, 6.0, 4.0, 8.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.781982421875, -19.04833984375, -18.314697265625, -17.5810546875, -16.847412109375, -16.11376953125, -15.380126953125, -14.646484375, -13.912841796875, -13.17919921875, -12.445556640625, -11.7119140625, -10.978271484375, -10.24462890625, -9.510986328125, -8.77734375, -8.043701171875, -7.31005859375, -6.576416015625, -5.8427734375, -5.109130859375, -4.37548828125, -3.641845703125, -2.908203125, -2.174560546875, -1.44091796875, -0.707275390625, 0.0263671875, 0.760009765625, 1.49365234375, 2.227294921875, 2.9609375, 3.694580078125, 4.42822265625, 5.161865234375, 5.8955078125, 6.629150390625, 7.36279296875, 8.096435546875, 8.830078125, 9.563720703125, 10.29736328125, 11.031005859375, 11.7646484375, 12.498291015625, 13.23193359375, 13.965576171875, 14.69921875, 15.432861328125, 16.16650390625, 16.900146484375, 17.6337890625, 18.367431640625, 19.10107421875, 19.834716796875, 20.568359375, 21.302001953125, 22.03564453125, 22.769287109375, 23.5029296875, 24.236572265625, 24.97021484375, 25.703857421875, 26.4375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 12.0, 15.0, 11.0, 19.0, 26.0, 35.0, 39.0, 49.0, 55.0, 82.0, 125.0, 170.0, 249.0, 349.0, 744.0, 7047.0, 3009985.0, 123302.0, 1951.0, 480.0, 280.0, 172.0, 123.0, 82.0, 69.0, 51.0, 29.0, 29.0, 19.0, 11.0, 11.0, 10.0, 11.0, 13.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.6875, -44.2939453125, -42.900390625, -41.5068359375, -40.11328125, -38.7197265625, -37.326171875, -35.9326171875, -34.5390625, -33.1455078125, -31.751953125, -30.3583984375, -28.96484375, -27.5712890625, -26.177734375, -24.7841796875, -23.390625, -21.9970703125, -20.603515625, -19.2099609375, -17.81640625, -16.4228515625, -15.029296875, -13.6357421875, -12.2421875, -10.8486328125, -9.455078125, -8.0615234375, -6.66796875, -5.2744140625, -3.880859375, -2.4873046875, -1.09375, 0.2998046875, 1.693359375, 3.0869140625, 4.48046875, 5.8740234375, 7.267578125, 8.6611328125, 10.0546875, 11.4482421875, 12.841796875, 14.2353515625, 15.62890625, 17.0224609375, 18.416015625, 19.8095703125, 21.203125, 22.5966796875, 23.990234375, 25.3837890625, 26.77734375, 28.1708984375, 29.564453125, 30.9580078125, 32.3515625, 33.7451171875, 35.138671875, 36.5322265625, 37.92578125, 39.3193359375, 40.712890625, 42.1064453125, 43.5]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 51.0, 151.0, 372.0, 297.0, 112.0, 20.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.156606674194336, -27.310348510742188, -25.464088439941406, -23.617830276489258, -21.77157211303711, -19.925312042236328, -18.07905387878418, -16.23279571533203, -14.386536598205566, -12.540277481079102, -10.694019317626953, -8.847760200500488, -7.001501560211182, -5.155242919921875, -3.30898380279541, -1.4627256393432617, 0.3835334777832031, 2.2297921180725098, 4.076050758361816, 5.922309875488281, 7.768568515777588, 9.614827156066895, 11.46108627319336, 13.307344436645508, 15.153603553771973, 16.999862670898438, 18.846120834350586, 20.692378997802734, 22.538639068603516, 24.384897232055664, 26.231155395507812, 28.077415466308594, 29.92367172241211, 31.769929885864258, 33.616188049316406, 35.46244812011719, 37.30870819091797, 39.154964447021484, 41.001224517822266, 42.84748077392578, 44.69374084472656, 46.540000915527344, 48.38625717163086, 50.23251724243164, 52.07877731323242, 53.92503356933594, 55.77129364013672, 57.6175537109375, 59.46381378173828, 61.31007385253906, 63.15633010864258, 65.00259399414062, 66.84884643554688, 68.69510650634766, 70.54136657714844, 72.38762664794922, 74.23387908935547, 76.08013916015625, 77.92639923095703, 79.77265930175781, 81.61891174316406, 83.46517181396484, 85.31143188476562, 87.1576919555664, 89.00395202636719]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 10.0, 7.0, 6.0, 18.0, 17.0, 24.0, 14.0, 11.0, 27.0, 26.0, 30.0, 45.0, 29.0, 34.0, 32.0, 29.0, 43.0, 45.0, 59.0, 33.0, 33.0, 38.0, 38.0, 35.0, 46.0, 25.0, 30.0, 24.0, 33.0, 22.0, 21.0, 19.0, 19.0, 8.0, 16.0, 11.0, 7.0, 5.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.529762268066406, -49.7943115234375, -48.058860778808594, -46.32341384887695, -44.58796310424805, -42.85251235961914, -41.117061614990234, -39.381614685058594, -37.64616394042969, -35.91071319580078, -34.175262451171875, -32.439815521240234, -30.704364776611328, -28.968914031982422, -27.233463287353516, -25.498014450073242, -23.762563705444336, -22.02711296081543, -20.291664123535156, -18.55621337890625, -16.820764541625977, -15.08531379699707, -13.34986400604248, -11.61441421508789, -9.8789644241333, -8.143514633178711, -6.408064842224121, -4.672614574432373, -2.937164783477783, -1.2017145156860352, 0.5337352752685547, 2.2691850662231445, 4.004634857177734, 5.740084648132324, 7.475534439086914, 9.21098518371582, 10.946434020996094, 12.681884765625, 14.41733455657959, 16.15278434753418, 17.888233184814453, 19.62368392944336, 21.359132766723633, 23.09458351135254, 24.830032348632812, 26.56548309326172, 28.300933837890625, 30.0363826751709, 31.771833419799805, 33.50728225708008, 35.242733001708984, 36.97818374633789, 38.7136344909668, 40.44908142089844, 42.184532165527344, 43.91998291015625, 45.655433654785156, 47.39088439941406, 49.12633514404297, 50.86178207397461, 52.597232818603516, 54.33268356323242, 56.06813430786133, 57.80358123779297, 59.539031982421875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 10.0, 9.0, 8.0, 16.0, 11.0, 12.0, 16.0, 24.0, 28.0, 32.0, 30.0, 32.0, 41.0, 30.0, 42.0, 39.0, 37.0, 41.0, 40.0, 39.0, 40.0, 42.0, 52.0, 33.0, 29.0, 31.0, 34.0, 31.0, 24.0, 21.0, 18.0, 20.0, 19.0, 11.0, 16.0, 10.0, 7.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.75, -6.55615234375, -6.3623046875, -6.16845703125, -5.974609375, -5.78076171875, -5.5869140625, -5.39306640625, -5.19921875, -5.00537109375, -4.8115234375, -4.61767578125, -4.423828125, -4.22998046875, -4.0361328125, -3.84228515625, -3.6484375, -3.45458984375, -3.2607421875, -3.06689453125, -2.873046875, -2.67919921875, -2.4853515625, -2.29150390625, -2.09765625, -1.90380859375, -1.7099609375, -1.51611328125, -1.322265625, -1.12841796875, -0.9345703125, -0.74072265625, -0.546875, -0.35302734375, -0.1591796875, 0.03466796875, 0.228515625, 0.42236328125, 0.6162109375, 0.81005859375, 1.00390625, 1.19775390625, 1.3916015625, 1.58544921875, 1.779296875, 1.97314453125, 2.1669921875, 2.36083984375, 2.5546875, 2.74853515625, 2.9423828125, 3.13623046875, 3.330078125, 3.52392578125, 3.7177734375, 3.91162109375, 4.10546875, 4.29931640625, 4.4931640625, 4.68701171875, 4.880859375, 5.07470703125, 5.2685546875, 5.46240234375, 5.65625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 9.0, 10.0, 22.0, 26.0, 30.0, 39.0, 51.0, 59.0, 116.0, 149.0, 206.0, 373.0, 578.0, 1210.0, 2707.0, 7473.0, 29676.0, 183918.0, 1015312.0, 1962888.0, 820835.0, 133066.0, 24050.0, 6327.0, 2372.0, 1112.0, 588.0, 338.0, 217.0, 171.0, 82.0, 63.0, 46.0, 48.0, 22.0, 14.0, 19.0, 13.0, 14.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.28125, -8.9949951171875, -8.708740234375, -8.4224853515625, -8.13623046875, -7.8499755859375, -7.563720703125, -7.2774658203125, -6.9912109375, -6.7049560546875, -6.418701171875, -6.1324462890625, -5.84619140625, -5.5599365234375, -5.273681640625, -4.9874267578125, -4.701171875, -4.4149169921875, -4.128662109375, -3.8424072265625, -3.55615234375, -3.2698974609375, -2.983642578125, -2.6973876953125, -2.4111328125, -2.1248779296875, -1.838623046875, -1.5523681640625, -1.26611328125, -0.9798583984375, -0.693603515625, -0.4073486328125, -0.12109375, 0.1651611328125, 0.451416015625, 0.7376708984375, 1.02392578125, 1.3101806640625, 1.596435546875, 1.8826904296875, 2.1689453125, 2.4552001953125, 2.741455078125, 3.0277099609375, 3.31396484375, 3.6002197265625, 3.886474609375, 4.1727294921875, 4.458984375, 4.7452392578125, 5.031494140625, 5.3177490234375, 5.60400390625, 5.8902587890625, 6.176513671875, 6.4627685546875, 6.7490234375, 7.0352783203125, 7.321533203125, 7.6077880859375, 7.89404296875, 8.1802978515625, 8.466552734375, 8.7528076171875, 9.0390625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 8.0, 11.0, 16.0, 30.0, 37.0, 56.0, 68.0, 86.0, 119.0, 134.0, 209.0, 332.0, 396.0, 535.0, 506.0, 374.0, 281.0, 245.0, 178.0, 116.0, 95.0, 66.0, 46.0, 35.0, 26.0, 19.0, 17.0, 11.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.3631591796875, -11.906005859375, -11.4488525390625, -10.99169921875, -10.5345458984375, -10.077392578125, -9.6202392578125, -9.1630859375, -8.7059326171875, -8.248779296875, -7.7916259765625, -7.33447265625, -6.8773193359375, -6.420166015625, -5.9630126953125, -5.505859375, -5.0487060546875, -4.591552734375, -4.1343994140625, -3.67724609375, -3.2200927734375, -2.762939453125, -2.3057861328125, -1.8486328125, -1.3914794921875, -0.934326171875, -0.4771728515625, -0.02001953125, 0.4371337890625, 0.894287109375, 1.3514404296875, 1.80859375, 2.2657470703125, 2.722900390625, 3.1800537109375, 3.63720703125, 4.0943603515625, 4.551513671875, 5.0086669921875, 5.4658203125, 5.9229736328125, 6.380126953125, 6.8372802734375, 7.29443359375, 7.7515869140625, 8.208740234375, 8.6658935546875, 9.123046875, 9.5802001953125, 10.037353515625, 10.4945068359375, 10.95166015625, 11.4088134765625, 11.865966796875, 12.3231201171875, 12.7802734375, 13.2374267578125, 13.694580078125, 14.1517333984375, 14.60888671875, 15.0660400390625, 15.523193359375, 15.9803466796875, 16.4375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 9.0, 12.0, 18.0, 24.0, 25.0, 36.0, 37.0, 54.0, 87.0, 115.0, 167.0, 267.0, 429.0, 1373.0, 137776.0, 4044247.0, 7766.0, 740.0, 361.0, 201.0, 138.0, 110.0, 63.0, 53.0, 38.0, 33.0, 20.0, 16.0, 17.0, 8.0, 9.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15625, -59.95849609375, -57.7607421875, -55.56298828125, -53.365234375, -51.16748046875, -48.9697265625, -46.77197265625, -44.57421875, -42.37646484375, -40.1787109375, -37.98095703125, -35.783203125, -33.58544921875, -31.3876953125, -29.18994140625, -26.9921875, -24.79443359375, -22.5966796875, -20.39892578125, -18.201171875, -16.00341796875, -13.8056640625, -11.60791015625, -9.41015625, -7.21240234375, -5.0146484375, -2.81689453125, -0.619140625, 1.57861328125, 3.7763671875, 5.97412109375, 8.171875, 10.36962890625, 12.5673828125, 14.76513671875, 16.962890625, 19.16064453125, 21.3583984375, 23.55615234375, 25.75390625, 27.95166015625, 30.1494140625, 32.34716796875, 34.544921875, 36.74267578125, 38.9404296875, 41.13818359375, 43.3359375, 45.53369140625, 47.7314453125, 49.92919921875, 52.126953125, 54.32470703125, 56.5224609375, 58.72021484375, 60.91796875, 63.11572265625, 65.3134765625, 67.51123046875, 69.708984375, 71.90673828125, 74.1044921875, 76.30224609375, 78.5]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 16.0, 194.0, 529.0, 245.0, 28.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.300514221191406, -44.32118225097656, -36.34185028076172, -28.362516403198242, -20.3831844329834, -12.403850555419922, -4.424518585205078, 3.5548133850097656, 11.53414535522461, 19.513477325439453, 27.492809295654297, 35.472145080566406, 43.45147705078125, 51.430809020996094, 59.41014099121094, 67.38947296142578, 75.36880493164062, 83.34813690185547, 91.32746887207031, 99.30680084228516, 107.2861328125, 115.26547241210938, 123.24479675292969, 131.22413635253906, 139.20346069335938, 147.18280029296875, 155.16212463378906, 163.14146423339844, 171.12078857421875, 179.10012817382812, 187.07945251464844, 195.0587921142578, 203.0381317138672, 211.01747131347656, 218.99679565429688, 226.97613525390625, 234.95545959472656, 242.93479919433594, 250.91412353515625, 258.8934631347656, 266.872802734375, 274.8521423339844, 282.83148193359375, 290.810791015625, 298.7901306152344, 306.76947021484375, 314.7488098144531, 322.7281188964844, 330.70745849609375, 338.6867980957031, 346.6661376953125, 354.64544677734375, 362.6247863769531, 370.6041259765625, 378.5834655761719, 386.5627746582031, 394.5421142578125, 402.5214538574219, 410.50079345703125, 418.4801025390625, 426.4594421386719, 434.43878173828125, 442.4181213378906, 450.3974304199219, 458.37677001953125]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 7.0, 10.0, 13.0, 12.0, 14.0, 25.0, 22.0, 22.0, 31.0, 27.0, 27.0, 37.0, 38.0, 30.0, 41.0, 38.0, 34.0, 43.0, 45.0, 53.0, 42.0, 17.0, 42.0, 41.0, 26.0, 25.0, 33.0, 29.0, 27.0, 26.0, 26.0, 14.0, 13.0, 9.0, 13.0, 8.0, 3.0, 8.0, 8.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.74163055419922, -44.348087310791016, -42.95454788208008, -41.561004638671875, -40.16746520996094, -38.773921966552734, -37.38037872314453, -35.986839294433594, -34.59329605102539, -33.19975280761719, -31.80621337890625, -30.412670135498047, -29.019128799438477, -27.625587463378906, -26.232046127319336, -24.838504791259766, -23.444963455200195, -22.051422119140625, -20.657880783081055, -19.264339447021484, -17.87079620361328, -16.47725486755371, -15.08371353149414, -13.690171241760254, -12.296629905700684, -10.903088569641113, -9.509546279907227, -8.116004943847656, -6.722463130950928, -5.328921318054199, -3.935379981994629, -2.541837692260742, -1.1482963562011719, 0.2452453374862671, 1.638787031173706, 3.0323286056518555, 4.425870418548584, 5.8194122314453125, 7.212953567504883, 8.60649585723877, 10.00003719329834, 11.39357852935791, 12.787120819091797, 14.180662155151367, 15.574203491210938, 16.96774673461914, 18.361286163330078, 19.75482940673828, 21.14837074279785, 22.541912078857422, 23.935453414916992, 25.328994750976562, 26.722537994384766, 28.116079330444336, 29.509620666503906, 30.90316390991211, 32.29670333862305, 33.69024658203125, 35.08378601074219, 36.47732925415039, 37.87086868286133, 39.26441192626953, 40.65795135498047, 42.05149459838867, 43.445037841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 2.0, 6.0, 6.0, 14.0, 16.0, 9.0, 17.0, 15.0, 25.0, 37.0, 25.0, 25.0, 28.0, 36.0, 42.0, 49.0, 43.0, 47.0, 37.0, 51.0, 44.0, 43.0, 40.0, 37.0, 43.0, 33.0, 40.0, 24.0, 35.0, 26.0, 26.0, 17.0, 12.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.90234375, -6.6944580078125, -6.486572265625, -6.2786865234375, -6.07080078125, -5.8629150390625, -5.655029296875, -5.4471435546875, -5.2392578125, -5.0313720703125, -4.823486328125, -4.6156005859375, -4.40771484375, -4.1998291015625, -3.991943359375, -3.7840576171875, -3.576171875, -3.3682861328125, -3.160400390625, -2.9525146484375, -2.74462890625, -2.5367431640625, -2.328857421875, -2.1209716796875, -1.9130859375, -1.7052001953125, -1.497314453125, -1.2894287109375, -1.08154296875, -0.8736572265625, -0.665771484375, -0.4578857421875, -0.25, -0.0421142578125, 0.165771484375, 0.3736572265625, 0.58154296875, 0.7894287109375, 0.997314453125, 1.2052001953125, 1.4130859375, 1.6209716796875, 1.828857421875, 2.0367431640625, 2.24462890625, 2.4525146484375, 2.660400390625, 2.8682861328125, 3.076171875, 3.2840576171875, 3.491943359375, 3.6998291015625, 3.90771484375, 4.1156005859375, 4.323486328125, 4.5313720703125, 4.7392578125, 4.9471435546875, 5.155029296875, 5.3629150390625, 5.57080078125, 5.7786865234375, 5.986572265625, 6.1944580078125, 6.40234375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 15.0, 20.0, 24.0, 39.0, 61.0, 93.0, 133.0, 236.0, 333.0, 534.0, 864.0, 1294.0, 2130.0, 3409.0, 5581.0, 8892.0, 14662.0, 24440.0, 42134.0, 74351.0, 136709.0, 251402.0, 214002.0, 113439.0, 63492.0, 35997.0, 21129.0, 12519.0, 7876.0, 4749.0, 2916.0, 1851.0, 1167.0, 714.0, 469.0, 287.0, 229.0, 126.0, 77.0, 46.0, 42.0, 22.0, 15.0, 8.0, 7.0, 8.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9233932495117188, -0.8902435302734375, -0.8570938110351562, -0.823944091796875, -0.7907943725585938, -0.7576446533203125, -0.7244949340820312, -0.69134521484375, -0.6581954956054688, -0.6250457763671875, -0.5918960571289062, -0.558746337890625, -0.5255966186523438, -0.4924468994140625, -0.45929718017578125, -0.4261474609375, -0.39299774169921875, -0.3598480224609375, -0.32669830322265625, -0.293548583984375, -0.26039886474609375, -0.2272491455078125, -0.19409942626953125, -0.16094970703125, -0.12779998779296875, -0.0946502685546875, -0.06150054931640625, -0.028350830078125, 0.00479888916015625, 0.0379486083984375, 0.07109832763671875, 0.104248046875, 0.13739776611328125, 0.1705474853515625, 0.20369720458984375, 0.236846923828125, 0.26999664306640625, 0.3031463623046875, 0.33629608154296875, 0.36944580078125, 0.40259552001953125, 0.4357452392578125, 0.46889495849609375, 0.502044677734375, 0.5351943969726562, 0.5683441162109375, 0.6014938354492188, 0.6346435546875, 0.6677932739257812, 0.7009429931640625, 0.7340927124023438, 0.767242431640625, 0.8003921508789062, 0.8335418701171875, 0.8666915893554688, 0.89984130859375, 0.9329910278320312, 0.9661407470703125, 0.9992904663085938, 1.032440185546875, 1.0655899047851562, 1.0987396240234375, 1.1318893432617188, 1.1650390625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 4.0, 10.0, 8.0, 11.0, 10.0, 13.0, 26.0, 27.0, 13.0, 27.0, 35.0, 29.0, 29.0, 42.0, 35.0, 40.0, 33.0, 51.0, 48.0, 1065.0, 41.0, 41.0, 32.0, 41.0, 42.0, 31.0, 28.0, 36.0, 26.0, 16.0, 26.0, 19.0, 8.0, 14.0, 14.0, 6.0, 3.0, 9.0, 5.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.443359375, -3.325775146484375, -3.20819091796875, -3.090606689453125, -2.9730224609375, -2.855438232421875, -2.73785400390625, -2.620269775390625, -2.502685546875, -2.385101318359375, -2.26751708984375, -2.149932861328125, -2.0323486328125, -1.914764404296875, -1.79718017578125, -1.679595947265625, -1.56201171875, -1.444427490234375, -1.32684326171875, -1.209259033203125, -1.0916748046875, -0.974090576171875, -0.85650634765625, -0.738922119140625, -0.621337890625, -0.503753662109375, -0.38616943359375, -0.268585205078125, -0.1510009765625, -0.033416748046875, 0.08416748046875, 0.201751708984375, 0.3193359375, 0.436920166015625, 0.55450439453125, 0.672088623046875, 0.7896728515625, 0.907257080078125, 1.02484130859375, 1.142425537109375, 1.260009765625, 1.377593994140625, 1.49517822265625, 1.612762451171875, 1.7303466796875, 1.847930908203125, 1.96551513671875, 2.083099365234375, 2.20068359375, 2.318267822265625, 2.43585205078125, 2.553436279296875, 2.6710205078125, 2.788604736328125, 2.90618896484375, 3.023773193359375, 3.141357421875, 3.258941650390625, 3.37652587890625, 3.494110107421875, 3.6116943359375, 3.729278564453125, 3.84686279296875, 3.964447021484375, 4.08203125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 16.0, 11.0, 23.0, 45.0, 53.0, 97.0, 118.0, 214.0, 267.0, 421.0, 574.0, 856.0, 1314.0, 2002.0, 3115.0, 4649.0, 7316.0, 11763.0, 18493.0, 30250.0, 50059.0, 85780.0, 159367.0, 1323726.0, 170074.0, 89833.0, 52398.0, 31235.0, 19162.0, 11937.0, 7608.0, 4863.0, 3198.0, 2044.0, 1376.0, 983.0, 604.0, 392.0, 267.0, 199.0, 131.0, 100.0, 59.0, 45.0, 31.0, 27.0, 12.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.95556640625, -0.9270782470703125, -0.898590087890625, -0.8701019287109375, -0.84161376953125, -0.8131256103515625, -0.784637451171875, -0.7561492919921875, -0.7276611328125, -0.6991729736328125, -0.670684814453125, -0.6421966552734375, -0.61370849609375, -0.5852203369140625, -0.556732177734375, -0.5282440185546875, -0.499755859375, -0.4712677001953125, -0.442779541015625, -0.4142913818359375, -0.38580322265625, -0.3573150634765625, -0.328826904296875, -0.3003387451171875, -0.2718505859375, -0.2433624267578125, -0.214874267578125, -0.1863861083984375, -0.15789794921875, -0.1294097900390625, -0.100921630859375, -0.0724334716796875, -0.0439453125, -0.0154571533203125, 0.013031005859375, 0.0415191650390625, 0.07000732421875, 0.0984954833984375, 0.126983642578125, 0.1554718017578125, 0.1839599609375, 0.2124481201171875, 0.240936279296875, 0.2694244384765625, 0.29791259765625, 0.3264007568359375, 0.354888916015625, 0.3833770751953125, 0.411865234375, 0.4403533935546875, 0.468841552734375, 0.4973297119140625, 0.52581787109375, 0.5543060302734375, 0.582794189453125, 0.6112823486328125, 0.6397705078125, 0.6682586669921875, 0.696746826171875, 0.7252349853515625, 0.75372314453125, 0.7822113037109375, 0.810699462890625, 0.8391876220703125, 0.86767578125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 11.0, 11.0, 11.0, 22.0, 20.0, 26.0, 32.0, 36.0, 53.0, 71.0, 82.0, 69.0, 82.0, 78.0, 58.0, 76.0, 40.0, 41.0, 34.0, 33.0, 19.0, 21.0, 11.0, 10.0, 7.0, 11.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000858306884765625, -0.0008352473378181458, -0.0008121877908706665, -0.0007891282439231873, -0.000766068696975708, -0.0007430091500282288, -0.0007199496030807495, -0.0006968900561332703, -0.000673830509185791, -0.0006507709622383118, -0.0006277114152908325, -0.0006046518683433533, -0.000581592321395874, -0.0005585327744483948, -0.0005354732275009155, -0.0005124136805534363, -0.000489354133605957, -0.0004662945866584778, -0.00044323503971099854, -0.0004201754927635193, -0.00039711594581604004, -0.0003740563988685608, -0.00035099685192108154, -0.0003279373049736023, -0.00030487775802612305, -0.0002818182110786438, -0.00025875866413116455, -0.0002356991171836853, -0.00021263957023620605, -0.0001895800232887268, -0.00016652047634124756, -0.0001434609293937683, -0.00012040138244628906, -9.734183549880981e-05, -7.428228855133057e-05, -5.122274160385132e-05, -2.816319465637207e-05, -5.103647708892822e-06, 1.7955899238586426e-05, 4.1015446186065674e-05, 6.407499313354492e-05, 8.713454008102417e-05, 0.00011019408702850342, 0.00013325363397598267, 0.00015631318092346191, 0.00017937272787094116, 0.0002024322748184204, 0.00022549182176589966, 0.0002485513687133789, 0.00027161091566085815, 0.0002946704626083374, 0.00031773000955581665, 0.0003407895565032959, 0.00036384910345077515, 0.0003869086503982544, 0.00040996819734573364, 0.0004330277442932129, 0.00045608729124069214, 0.0004791468381881714, 0.0005022063851356506, 0.0005252659320831299, 0.0005483254790306091, 0.0005713850259780884, 0.0005944445729255676, 0.0006175041198730469]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 9.0, 4.0, 8.0, 4.0, 13.0, 15.0, 25.0, 28.0, 29.0, 45.0, 49.0, 98.0, 126.0, 229.0, 505.0, 2101.0, 1024475.0, 19171.0, 811.0, 314.0, 152.0, 94.0, 61.0, 45.0, 35.0, 24.0, 23.0, 17.0, 12.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01293182373046875, -0.01240837574005127, -0.011884927749633789, -0.011361479759216309, -0.010838031768798828, -0.010314583778381348, -0.009791135787963867, -0.009267687797546387, -0.008744239807128906, -0.008220791816711426, -0.007697343826293945, -0.007173895835876465, -0.006650447845458984, -0.006126999855041504, -0.0056035518646240234, -0.005080103874206543, -0.0045566558837890625, -0.004033207893371582, -0.0035097599029541016, -0.002986311912536621, -0.0024628639221191406, -0.0019394159317016602, -0.0014159679412841797, -0.0008925199508666992, -0.00036907196044921875, 0.00015437602996826172, 0.0006778240203857422, 0.0012012720108032227, 0.0017247200012207031, 0.0022481679916381836, 0.002771615982055664, 0.0032950639724731445, 0.003818511962890625, 0.0043419599533081055, 0.004865407943725586, 0.005388855934143066, 0.005912303924560547, 0.006435751914978027, 0.006959199905395508, 0.007482647895812988, 0.008006095886230469, 0.00852954387664795, 0.00905299186706543, 0.00957643985748291, 0.01009988784790039, 0.010623335838317871, 0.011146783828735352, 0.011670231819152832, 0.012193679809570312, 0.012717127799987793, 0.013240575790405273, 0.013764023780822754, 0.014287471771240234, 0.014810919761657715, 0.015334367752075195, 0.015857815742492676, 0.016381263732910156, 0.016904711723327637, 0.017428159713745117, 0.017951607704162598, 0.018475055694580078, 0.01899850368499756, 0.01952195167541504, 0.02004539966583252, 0.02056884765625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 206.0, 599.0, 181.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001273144967854023, -0.001213787472806871, -0.001154429977759719, -0.0010950724827125669, -0.0010357149876654148, -0.0009763575508259237, -0.0009170001139864326, -0.0008576426189392805, -0.0007982851238921285, -0.0007389276288449764, -0.0006795701337978244, -0.0006202126969583333, -0.0005608552019111812, -0.0005014977068640292, -0.0004421402409207076, -0.000382782774977386, -0.00032342527993023396, -0.0002640677848830819, -0.00020471031893976033, -0.0001453528384445235, -8.59953579492867e-05, -2.6637862902134657e-05, 3.271960304118693e-05, 9.207706898450851e-05, 0.00015143456403166056, 0.00021079204452689737, 0.0002701495250221342, 0.00032950699096545577, 0.0003888644860126078, 0.00044822198105975986, 0.000507579417899251, 0.000566936912946403, 0.0006262944079935551, 0.0006856519030407071, 0.0007450093980878592, 0.0008043668349273503, 0.0008637243299745023, 0.0009230818250216544, 0.0009824392618611455, 0.0010417967569082975, 0.0011011542519554496, 0.0011605117470026016, 0.0012198692420497537, 0.0012792267370969057, 0.001338584115728736, 0.0013979417271912098, 0.00145729910582304, 0.001516656600870192, 0.001576014095917344, 0.0016353715909644961, 0.0016947290860116482, 0.0017540865810588002, 0.0018134440761059523, 0.0018728014547377825, 0.0019321589497849345, 0.0019915164448320866, 0.0020508738234639168, 0.002110231202095747, 0.002169588813558221, 0.002228946192190051, 0.002288303803652525, 0.002347661182284355, 0.002407018793746829, 0.0024663761723786592, 0.002525733783841133]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 7.0, 8.0, 15.0, 13.0, 17.0, 12.0, 21.0, 20.0, 25.0, 31.0, 38.0, 41.0, 35.0, 35.0, 50.0, 38.0, 58.0, 40.0, 45.0, 39.0, 47.0, 53.0, 39.0, 48.0, 41.0, 23.0, 25.0, 28.0, 23.0, 22.0, 11.0, 13.0, 7.0, 9.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00037992000579833984, -0.0003685504198074341, -0.0003571808338165283, -0.00034581124782562256, -0.0003344416618347168, -0.00032307207584381104, -0.0003117024898529053, -0.0003003329038619995, -0.00028896331787109375, -0.000277593731880188, -0.0002662241458892822, -0.00025485455989837646, -0.0002434849739074707, -0.00023211538791656494, -0.00022074580192565918, -0.00020937621593475342, -0.00019800662994384766, -0.0001866370439529419, -0.00017526745796203613, -0.00016389787197113037, -0.0001525282859802246, -0.00014115869998931885, -0.00012978911399841309, -0.00011841952800750732, -0.00010704994201660156, -9.56803560256958e-05, -8.431077003479004e-05, -7.294118404388428e-05, -6.157159805297852e-05, -5.0202012062072754e-05, -3.883242607116699e-05, -2.746284008026123e-05, -1.609325408935547e-05, -4.723668098449707e-06, 6.645917892456055e-06, 1.8015503883361816e-05, 2.9385089874267578e-05, 4.075467586517334e-05, 5.21242618560791e-05, 6.349384784698486e-05, 7.486343383789062e-05, 8.623301982879639e-05, 9.760260581970215e-05, 0.00010897219181060791, 0.00012034177780151367, 0.00013171136379241943, 0.0001430809497833252, 0.00015445053577423096, 0.00016582012176513672, 0.00017718970775604248, 0.00018855929374694824, 0.000199928879737854, 0.00021129846572875977, 0.00022266805171966553, 0.0002340376377105713, 0.00024540722370147705, 0.0002567768096923828, 0.0002681463956832886, 0.00027951598167419434, 0.0002908855676651001, 0.00030225515365600586, 0.0003136247396469116, 0.0003249943256378174, 0.00033636391162872314, 0.0003477334976196289]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 2.0, 6.0, 6.0, 14.0, 16.0, 9.0, 17.0, 15.0, 25.0, 37.0, 25.0, 25.0, 28.0, 36.0, 42.0, 49.0, 43.0, 47.0, 37.0, 51.0, 44.0, 43.0, 40.0, 38.0, 42.0, 33.0, 40.0, 24.0, 35.0, 26.0, 26.0, 17.0, 12.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.90234375, -6.6944580078125, -6.486572265625, -6.2786865234375, -6.07080078125, -5.8629150390625, -5.655029296875, -5.4471435546875, -5.2392578125, -5.0313720703125, -4.823486328125, -4.6156005859375, -4.40771484375, -4.1998291015625, -3.991943359375, -3.7840576171875, -3.576171875, -3.3682861328125, -3.160400390625, -2.9525146484375, -2.74462890625, -2.5367431640625, -2.328857421875, -2.1209716796875, -1.9130859375, -1.7052001953125, -1.497314453125, -1.2894287109375, -1.08154296875, -0.8736572265625, -0.665771484375, -0.4578857421875, -0.25, -0.0421142578125, 0.165771484375, 0.3736572265625, 0.58154296875, 0.7894287109375, 0.997314453125, 1.2052001953125, 1.4130859375, 1.6209716796875, 1.828857421875, 2.0367431640625, 2.24462890625, 2.4525146484375, 2.660400390625, 2.8682861328125, 3.076171875, 3.2840576171875, 3.491943359375, 3.6998291015625, 3.90771484375, 4.1156005859375, 4.323486328125, 4.5313720703125, 4.7392578125, 4.9471435546875, 5.155029296875, 5.3629150390625, 5.57080078125, 5.7786865234375, 5.986572265625, 6.1944580078125, 6.40234375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 19.0, 18.0, 14.0, 22.0, 35.0, 65.0, 92.0, 106.0, 161.0, 232.0, 362.0, 594.0, 1046.0, 1934.0, 3851.0, 8274.0, 17506.0, 37971.0, 84670.0, 199725.0, 366990.0, 180739.0, 77462.0, 35009.0, 16119.0, 7426.0, 3543.0, 1886.0, 954.0, 566.0, 384.0, 244.0, 149.0, 115.0, 74.0, 61.0, 33.0, 30.0, 13.0, 13.0, 12.0, 12.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.75177001953125, -3.6285400390625, -3.50531005859375, -3.382080078125, -3.25885009765625, -3.1356201171875, -3.01239013671875, -2.88916015625, -2.76593017578125, -2.6427001953125, -2.51947021484375, -2.396240234375, -2.27301025390625, -2.1497802734375, -2.02655029296875, -1.9033203125, -1.78009033203125, -1.6568603515625, -1.53363037109375, -1.410400390625, -1.28717041015625, -1.1639404296875, -1.04071044921875, -0.91748046875, -0.79425048828125, -0.6710205078125, -0.54779052734375, -0.424560546875, -0.30133056640625, -0.1781005859375, -0.05487060546875, 0.068359375, 0.19158935546875, 0.3148193359375, 0.43804931640625, 0.561279296875, 0.68450927734375, 0.8077392578125, 0.93096923828125, 1.05419921875, 1.17742919921875, 1.3006591796875, 1.42388916015625, 1.547119140625, 1.67034912109375, 1.7935791015625, 1.91680908203125, 2.0400390625, 2.16326904296875, 2.2864990234375, 2.40972900390625, 2.532958984375, 2.65618896484375, 2.7794189453125, 2.90264892578125, 3.02587890625, 3.14910888671875, 3.2723388671875, 3.39556884765625, 3.518798828125, 3.64202880859375, 3.7652587890625, 3.88848876953125, 4.01171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 4.0, 3.0, 1.0, 4.0, 9.0, 10.0, 11.0, 11.0, 16.0, 24.0, 33.0, 31.0, 39.0, 25.0, 44.0, 53.0, 53.0, 61.0, 111.0, 1536.0, 454.0, 121.0, 58.0, 41.0, 48.0, 37.0, 32.0, 31.0, 30.0, 28.0, 17.0, 13.0, 12.0, 9.0, 10.0, 6.0, 8.0, 9.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-28.84375, -28.063720703125, -27.28369140625, -26.503662109375, -25.7236328125, -24.943603515625, -24.16357421875, -23.383544921875, -22.603515625, -21.823486328125, -21.04345703125, -20.263427734375, -19.4833984375, -18.703369140625, -17.92333984375, -17.143310546875, -16.36328125, -15.583251953125, -14.80322265625, -14.023193359375, -13.2431640625, -12.463134765625, -11.68310546875, -10.903076171875, -10.123046875, -9.343017578125, -8.56298828125, -7.782958984375, -7.0029296875, -6.222900390625, -5.44287109375, -4.662841796875, -3.8828125, -3.102783203125, -2.32275390625, -1.542724609375, -0.7626953125, 0.017333984375, 0.79736328125, 1.577392578125, 2.357421875, 3.137451171875, 3.91748046875, 4.697509765625, 5.4775390625, 6.257568359375, 7.03759765625, 7.817626953125, 8.59765625, 9.377685546875, 10.15771484375, 10.937744140625, 11.7177734375, 12.497802734375, 13.27783203125, 14.057861328125, 14.837890625, 15.617919921875, 16.39794921875, 17.177978515625, 17.9580078125, 18.738037109375, 19.51806640625, 20.298095703125, 21.078125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 8.0, 12.0, 10.0, 10.0, 20.0, 21.0, 22.0, 30.0, 48.0, 75.0, 94.0, 125.0, 164.0, 281.0, 456.0, 1595.0, 78745.0, 3056121.0, 5950.0, 705.0, 344.0, 238.0, 174.0, 105.0, 70.0, 72.0, 44.0, 39.0, 33.0, 15.0, 19.0, 12.0, 12.0, 9.0, 4.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.25, -46.4794921875, -44.708984375, -42.9384765625, -41.16796875, -39.3974609375, -37.626953125, -35.8564453125, -34.0859375, -32.3154296875, -30.544921875, -28.7744140625, -27.00390625, -25.2333984375, -23.462890625, -21.6923828125, -19.921875, -18.1513671875, -16.380859375, -14.6103515625, -12.83984375, -11.0693359375, -9.298828125, -7.5283203125, -5.7578125, -3.9873046875, -2.216796875, -0.4462890625, 1.32421875, 3.0947265625, 4.865234375, 6.6357421875, 8.40625, 10.1767578125, 11.947265625, 13.7177734375, 15.48828125, 17.2587890625, 19.029296875, 20.7998046875, 22.5703125, 24.3408203125, 26.111328125, 27.8818359375, 29.65234375, 31.4228515625, 33.193359375, 34.9638671875, 36.734375, 38.5048828125, 40.275390625, 42.0458984375, 43.81640625, 45.5869140625, 47.357421875, 49.1279296875, 50.8984375, 52.6689453125, 54.439453125, 56.2099609375, 57.98046875, 59.7509765625, 61.521484375, 63.2919921875, 65.0625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 34.0, 95.0, 232.0, 364.0, 198.0, 65.0, 14.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.634822845458984, -10.941692352294922, -9.248560905456543, -7.555429935455322, -5.862298965454102, -4.169168472290039, -2.47603702545166, -0.7829055786132812, 0.9102249145507812, 2.603355884552002, 4.296486854553223, 5.989617824554443, 7.682748794555664, 9.375879287719727, 11.069010734558105, 12.762142181396484, 14.455272674560547, 16.14840316772461, 17.841533660888672, 19.534666061401367, 21.22779655456543, 22.920927047729492, 24.614059448242188, 26.30718994140625, 28.000320434570312, 29.693450927734375, 31.386581420898438, 33.0797119140625, 34.77284240722656, 36.465972900390625, 38.15910720825195, 39.852237701416016, 41.54536437988281, 43.238494873046875, 44.93162536621094, 46.624755859375, 48.31788635253906, 50.011016845703125, 51.70415115356445, 53.397281646728516, 55.09041213989258, 56.78354263305664, 58.4766731262207, 60.169803619384766, 61.862937927246094, 63.556068420410156, 65.24919891357422, 66.94232940673828, 68.63545989990234, 70.3285903930664, 72.02172088623047, 73.71485137939453, 75.4079818725586, 77.10111236572266, 78.79424285888672, 80.48738098144531, 82.18051147460938, 83.87364196777344, 85.5667724609375, 87.25990295410156, 88.95303344726562, 90.64616394042969, 92.33929443359375, 94.03242492675781, 95.72555541992188]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 2.0, 6.0, 6.0, 11.0, 9.0, 9.0, 20.0, 21.0, 22.0, 29.0, 25.0, 31.0, 32.0, 47.0, 34.0, 43.0, 48.0, 46.0, 40.0, 49.0, 49.0, 62.0, 26.0, 48.0, 49.0, 37.0, 37.0, 37.0, 25.0, 20.0, 20.0, 21.0, 15.0, 7.0, 5.0, 4.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.82101058959961, -55.9080924987793, -53.995174407958984, -52.08225631713867, -50.169334411621094, -48.25641632080078, -46.34349822998047, -44.430580139160156, -42.517662048339844, -40.60474395751953, -38.69182586669922, -36.778907775878906, -34.865989685058594, -32.95307159423828, -31.040149688720703, -29.12723159790039, -27.214313507080078, -25.301395416259766, -23.388477325439453, -21.475557327270508, -19.562639236450195, -17.649721145629883, -15.736802101135254, -13.823883056640625, -11.910964965820312, -9.998046875, -8.085127830505371, -6.1722092628479, -4.25929069519043, -2.346372604370117, -0.4334535598754883, 1.4794654846191406, 3.3923873901367188, 5.3053059577941895, 7.21822452545166, 9.131143569946289, 11.044061660766602, 12.956979751586914, 14.869898796081543, 16.782817840576172, 18.695735931396484, 20.608654022216797, 22.52157211303711, 24.434492111206055, 26.347410202026367, 28.26032829284668, 30.173248291015625, 32.08616638183594, 33.99908447265625, 35.91200256347656, 37.824920654296875, 39.73783874511719, 41.6507568359375, 43.56367492675781, 45.47659683227539, 47.3895149230957, 49.302433013916016, 51.21535110473633, 53.12826919555664, 55.04118728637695, 56.95410919189453, 58.867027282714844, 60.779945373535156, 62.69286346435547, 64.60578155517578]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 4.0, 8.0, 16.0, 14.0, 11.0, 17.0, 25.0, 19.0, 23.0, 20.0, 41.0, 31.0, 37.0, 40.0, 36.0, 47.0, 54.0, 44.0, 46.0, 55.0, 38.0, 27.0, 40.0, 46.0, 38.0, 27.0, 38.0, 28.0, 23.0, 25.0, 26.0, 11.0, 10.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.97265625, -6.75579833984375, -6.5389404296875, -6.32208251953125, -6.105224609375, -5.88836669921875, -5.6715087890625, -5.45465087890625, -5.23779296875, -5.02093505859375, -4.8040771484375, -4.58721923828125, -4.370361328125, -4.15350341796875, -3.9366455078125, -3.71978759765625, -3.5029296875, -3.28607177734375, -3.0692138671875, -2.85235595703125, -2.635498046875, -2.41864013671875, -2.2017822265625, -1.98492431640625, -1.76806640625, -1.55120849609375, -1.3343505859375, -1.11749267578125, -0.900634765625, -0.68377685546875, -0.4669189453125, -0.25006103515625, -0.033203125, 0.18365478515625, 0.4005126953125, 0.61737060546875, 0.834228515625, 1.05108642578125, 1.2679443359375, 1.48480224609375, 1.70166015625, 1.91851806640625, 2.1353759765625, 2.35223388671875, 2.569091796875, 2.78594970703125, 3.0028076171875, 3.21966552734375, 3.4365234375, 3.65338134765625, 3.8702392578125, 4.08709716796875, 4.303955078125, 4.52081298828125, 4.7376708984375, 4.95452880859375, 5.17138671875, 5.38824462890625, 5.6051025390625, 5.82196044921875, 6.038818359375, 6.25567626953125, 6.4725341796875, 6.68939208984375, 6.90625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 6.0, 7.0, 14.0, 19.0, 16.0, 17.0, 24.0, 28.0, 33.0, 28.0, 43.0, 47.0, 86.0, 295.0, 1455.0, 31883.0, 2953219.0, 1195165.0, 10505.0, 816.0, 193.0, 77.0, 45.0, 48.0, 33.0, 33.0, 30.0, 24.0, 17.0, 22.0, 13.0, 5.0, 10.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.53125, -25.642578125, -24.75390625, -23.865234375, -22.9765625, -22.087890625, -21.19921875, -20.310546875, -19.421875, -18.533203125, -17.64453125, -16.755859375, -15.8671875, -14.978515625, -14.08984375, -13.201171875, -12.3125, -11.423828125, -10.53515625, -9.646484375, -8.7578125, -7.869140625, -6.98046875, -6.091796875, -5.203125, -4.314453125, -3.42578125, -2.537109375, -1.6484375, -0.759765625, 0.12890625, 1.017578125, 1.90625, 2.794921875, 3.68359375, 4.572265625, 5.4609375, 6.349609375, 7.23828125, 8.126953125, 9.015625, 9.904296875, 10.79296875, 11.681640625, 12.5703125, 13.458984375, 14.34765625, 15.236328125, 16.125, 17.013671875, 17.90234375, 18.791015625, 19.6796875, 20.568359375, 21.45703125, 22.345703125, 23.234375, 24.123046875, 25.01171875, 25.900390625, 26.7890625, 27.677734375, 28.56640625, 29.455078125, 30.34375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 9.0, 6.0, 12.0, 18.0, 16.0, 29.0, 19.0, 54.0, 64.0, 83.0, 97.0, 160.0, 167.0, 239.0, 297.0, 397.0, 482.0, 432.0, 350.0, 286.0, 206.0, 173.0, 118.0, 82.0, 87.0, 40.0, 41.0, 33.0, 21.0, 16.0, 13.0, 6.0, 12.0, 7.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1484375, -12.7479248046875, -12.347412109375, -11.9468994140625, -11.54638671875, -11.1458740234375, -10.745361328125, -10.3448486328125, -9.9443359375, -9.5438232421875, -9.143310546875, -8.7427978515625, -8.34228515625, -7.9417724609375, -7.541259765625, -7.1407470703125, -6.740234375, -6.3397216796875, -5.939208984375, -5.5386962890625, -5.13818359375, -4.7376708984375, -4.337158203125, -3.9366455078125, -3.5361328125, -3.1356201171875, -2.735107421875, -2.3345947265625, -1.93408203125, -1.5335693359375, -1.133056640625, -0.7325439453125, -0.33203125, 0.0684814453125, 0.468994140625, 0.8695068359375, 1.27001953125, 1.6705322265625, 2.071044921875, 2.4715576171875, 2.8720703125, 3.2725830078125, 3.673095703125, 4.0736083984375, 4.47412109375, 4.8746337890625, 5.275146484375, 5.6756591796875, 6.076171875, 6.4766845703125, 6.877197265625, 7.2777099609375, 7.67822265625, 8.0787353515625, 8.479248046875, 8.8797607421875, 9.2802734375, 9.6807861328125, 10.081298828125, 10.4818115234375, 10.88232421875, 11.2828369140625, 11.683349609375, 12.0838623046875, 12.484375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 16.0, 17.0, 14.0, 26.0, 18.0, 26.0, 41.0, 49.0, 74.0, 84.0, 138.0, 173.0, 288.0, 554.0, 2531.0, 1972171.0, 2213831.0, 2561.0, 603.0, 310.0, 208.0, 136.0, 90.0, 79.0, 48.0, 26.0, 34.0, 25.0, 24.0, 9.0, 10.0, 9.0, 11.0, 14.0, 3.0, 4.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.375, -63.2666015625, -61.158203125, -59.0498046875, -56.94140625, -54.8330078125, -52.724609375, -50.6162109375, -48.5078125, -46.3994140625, -44.291015625, -42.1826171875, -40.07421875, -37.9658203125, -35.857421875, -33.7490234375, -31.640625, -29.5322265625, -27.423828125, -25.3154296875, -23.20703125, -21.0986328125, -18.990234375, -16.8818359375, -14.7734375, -12.6650390625, -10.556640625, -8.4482421875, -6.33984375, -4.2314453125, -2.123046875, -0.0146484375, 2.09375, 4.2021484375, 6.310546875, 8.4189453125, 10.52734375, 12.6357421875, 14.744140625, 16.8525390625, 18.9609375, 21.0693359375, 23.177734375, 25.2861328125, 27.39453125, 29.5029296875, 31.611328125, 33.7197265625, 35.828125, 37.9365234375, 40.044921875, 42.1533203125, 44.26171875, 46.3701171875, 48.478515625, 50.5869140625, 52.6953125, 54.8037109375, 56.912109375, 59.0205078125, 61.12890625, 63.2373046875, 65.345703125, 67.4541015625, 69.5625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [4.0, 5.0, 100.0, 481.0, 361.0, 65.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.876556396484375, -22.218677520751953, -14.560799598693848, -6.902921676635742, 0.7549571990966797, 8.412834167480469, 16.07071304321289, 23.728591918945312, 31.386470794677734, 39.044349670410156, 46.70222854614258, 54.360107421875, 62.017982482910156, 69.67585754394531, 77.333740234375, 84.99162292480469, 92.64949798583984, 100.307373046875, 107.96525573730469, 115.62313079833984, 123.28101348876953, 130.9388885498047, 138.59677124023438, 146.254638671875, 153.9125213623047, 161.57040405273438, 169.228271484375, 176.8861541748047, 184.54403686523438, 192.201904296875, 199.8597869873047, 207.51766967773438, 215.17555236816406, 222.83343505859375, 230.49130249023438, 238.14918518066406, 245.80706787109375, 253.46493530273438, 261.1228332519531, 268.78070068359375, 276.4385681152344, 284.096435546875, 291.75433349609375, 299.4122009277344, 307.070068359375, 314.72796630859375, 322.3858337402344, 330.043701171875, 337.70159912109375, 345.3594665527344, 353.0173645019531, 360.67523193359375, 368.3330993652344, 375.9909973144531, 383.64886474609375, 391.3067626953125, 398.9646301269531, 406.62249755859375, 414.2803955078125, 421.9382629394531, 429.59613037109375, 437.2540283203125, 444.9118957519531, 452.56976318359375, 460.2276611328125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 7.0, 4.0, 8.0, 4.0, 13.0, 12.0, 22.0, 20.0, 16.0, 17.0, 26.0, 27.0, 19.0, 26.0, 20.0, 30.0, 44.0, 53.0, 39.0, 31.0, 43.0, 41.0, 43.0, 40.0, 40.0, 34.0, 29.0, 43.0, 31.0, 17.0, 25.0, 20.0, 28.0, 15.0, 18.0, 16.0, 17.0, 15.0, 8.0, 13.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0], "bins": [-43.180816650390625, -41.95011520385742, -40.71941375732422, -39.488712310791016, -38.25801086425781, -37.02730941772461, -35.796607971191406, -34.56590270996094, -33.335205078125, -32.1045036315918, -30.873802185058594, -29.64310073852539, -28.412399291992188, -27.181697845458984, -25.95099449157715, -24.720293045043945, -23.48958969116211, -22.258888244628906, -21.028186798095703, -19.7974853515625, -18.566783905029297, -17.336082458496094, -16.105379104614258, -14.874677658081055, -13.643976211547852, -12.413274765014648, -11.182573318481445, -9.951870918273926, -8.721169471740723, -7.4904680252075195, -6.259766101837158, -5.029064178466797, -3.798358917236328, -2.567657232284546, -1.3369555473327637, -0.10625386238098145, 1.1244478225708008, 2.355149269104004, 3.5858511924743652, 4.816553115844727, 6.04725456237793, 7.277956008911133, 8.508657455444336, 9.739359855651855, 10.970061302185059, 12.200762748718262, 13.431465148925781, 14.662166595458984, 15.892868041992188, 17.12356948852539, 18.354270935058594, 19.584972381591797, 20.815673828125, 22.046375274658203, 23.27707862854004, 24.507780075073242, 25.738481521606445, 26.96918296813965, 28.19988441467285, 29.430585861206055, 30.66128921508789, 31.891990661621094, 33.1226921081543, 34.3533935546875, 35.5840950012207]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 16.0, 14.0, 23.0, 18.0, 30.0, 24.0, 28.0, 35.0, 36.0, 33.0, 42.0, 46.0, 50.0, 44.0, 41.0, 45.0, 50.0, 38.0, 34.0, 41.0, 40.0, 37.0, 37.0, 31.0, 27.0, 26.0, 18.0, 13.0, 11.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.40625, -7.18658447265625, -6.9669189453125, -6.74725341796875, -6.527587890625, -6.30792236328125, -6.0882568359375, -5.86859130859375, -5.64892578125, -5.42926025390625, -5.2095947265625, -4.98992919921875, -4.770263671875, -4.55059814453125, -4.3309326171875, -4.11126708984375, -3.8916015625, -3.67193603515625, -3.4522705078125, -3.23260498046875, -3.012939453125, -2.79327392578125, -2.5736083984375, -2.35394287109375, -2.13427734375, -1.91461181640625, -1.6949462890625, -1.47528076171875, -1.255615234375, -1.03594970703125, -0.8162841796875, -0.59661865234375, -0.376953125, -0.15728759765625, 0.0623779296875, 0.28204345703125, 0.501708984375, 0.72137451171875, 0.9410400390625, 1.16070556640625, 1.38037109375, 1.60003662109375, 1.8197021484375, 2.03936767578125, 2.259033203125, 2.47869873046875, 2.6983642578125, 2.91802978515625, 3.1376953125, 3.35736083984375, 3.5770263671875, 3.79669189453125, 4.016357421875, 4.23602294921875, 4.4556884765625, 4.67535400390625, 4.89501953125, 5.11468505859375, 5.3343505859375, 5.55401611328125, 5.773681640625, 5.99334716796875, 6.2130126953125, 6.43267822265625, 6.65234375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 28.0, 30.0, 42.0, 59.0, 96.0, 119.0, 208.0, 312.0, 477.0, 735.0, 1123.0, 1750.0, 2727.0, 4466.0, 6779.0, 10907.0, 17343.0, 27910.0, 45204.0, 75650.0, 128731.0, 226243.0, 203187.0, 116444.0, 67905.0, 41163.0, 25756.0, 15902.0, 9932.0, 6246.0, 3893.0, 2545.0, 1611.0, 1035.0, 672.0, 477.0, 247.0, 191.0, 131.0, 80.0, 63.0, 38.0, 25.0, 14.0, 14.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.0224609375, -0.9913864135742188, -0.9603118896484375, -0.9292373657226562, -0.898162841796875, -0.8670883178710938, -0.8360137939453125, -0.8049392700195312, -0.77386474609375, -0.7427902221679688, -0.7117156982421875, -0.6806411743164062, -0.649566650390625, -0.6184921264648438, -0.5874176025390625, -0.5563430786132812, -0.5252685546875, -0.49419403076171875, -0.4631195068359375, -0.43204498291015625, -0.400970458984375, -0.36989593505859375, -0.3388214111328125, -0.30774688720703125, -0.27667236328125, -0.24559783935546875, -0.2145233154296875, -0.18344879150390625, -0.152374267578125, -0.12129974365234375, -0.0902252197265625, -0.05915069580078125, -0.028076171875, 0.00299835205078125, 0.0340728759765625, 0.06514739990234375, 0.096221923828125, 0.12729644775390625, 0.1583709716796875, 0.18944549560546875, 0.22052001953125, 0.25159454345703125, 0.2826690673828125, 0.31374359130859375, 0.344818115234375, 0.37589263916015625, 0.4069671630859375, 0.43804168701171875, 0.4691162109375, 0.5001907348632812, 0.5312652587890625, 0.5623397827148438, 0.593414306640625, 0.6244888305664062, 0.6555633544921875, 0.6866378784179688, 0.71771240234375, 0.7487869262695312, 0.7798614501953125, 0.8109359741210938, 0.842010498046875, 0.8730850219726562, 0.9041595458984375, 0.9352340698242188, 0.96630859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 8.0, 8.0, 10.0, 15.0, 10.0, 9.0, 22.0, 22.0, 31.0, 21.0, 35.0, 31.0, 28.0, 36.0, 25.0, 40.0, 44.0, 36.0, 21.0, 1074.0, 39.0, 47.0, 40.0, 45.0, 31.0, 31.0, 26.0, 33.0, 25.0, 22.0, 27.0, 15.0, 19.0, 13.0, 20.0, 10.0, 10.0, 6.0, 6.0, 1.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.23046875, -4.110504150390625, -3.99053955078125, -3.870574951171875, -3.7506103515625, -3.630645751953125, -3.51068115234375, -3.390716552734375, -3.270751953125, -3.150787353515625, -3.03082275390625, -2.910858154296875, -2.7908935546875, -2.670928955078125, -2.55096435546875, -2.430999755859375, -2.31103515625, -2.191070556640625, -2.07110595703125, -1.951141357421875, -1.8311767578125, -1.711212158203125, -1.59124755859375, -1.471282958984375, -1.351318359375, -1.231353759765625, -1.11138916015625, -0.991424560546875, -0.8714599609375, -0.751495361328125, -0.63153076171875, -0.511566162109375, -0.3916015625, -0.271636962890625, -0.15167236328125, -0.031707763671875, 0.0882568359375, 0.208221435546875, 0.32818603515625, 0.448150634765625, 0.568115234375, 0.688079833984375, 0.80804443359375, 0.928009033203125, 1.0479736328125, 1.167938232421875, 1.28790283203125, 1.407867431640625, 1.52783203125, 1.647796630859375, 1.76776123046875, 1.887725830078125, 2.0076904296875, 2.127655029296875, 2.24761962890625, 2.367584228515625, 2.487548828125, 2.607513427734375, 2.72747802734375, 2.847442626953125, 2.9674072265625, 3.087371826171875, 3.20733642578125, 3.327301025390625, 3.447265625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 7.0, 1.0, 12.0, 9.0, 16.0, 36.0, 42.0, 60.0, 100.0, 137.0, 226.0, 321.0, 480.0, 745.0, 1147.0, 1760.0, 2647.0, 4067.0, 6166.0, 9447.0, 14891.0, 23799.0, 38560.0, 63901.0, 110809.0, 207837.0, 1290866.0, 128780.0, 73040.0, 43675.0, 26538.0, 16804.0, 10623.0, 6832.0, 4327.0, 2890.0, 1933.0, 1219.0, 840.0, 520.0, 336.0, 214.0, 177.0, 104.0, 82.0, 37.0, 36.0, 16.0, 11.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89013671875, -0.8605880737304688, -0.8310394287109375, -0.8014907836914062, -0.771942138671875, -0.7423934936523438, -0.7128448486328125, -0.6832962036132812, -0.65374755859375, -0.6241989135742188, -0.5946502685546875, -0.5651016235351562, -0.535552978515625, -0.5060043334960938, -0.4764556884765625, -0.44690704345703125, -0.4173583984375, -0.38780975341796875, -0.3582611083984375, -0.32871246337890625, -0.299163818359375, -0.26961517333984375, -0.2400665283203125, -0.21051788330078125, -0.18096923828125, -0.15142059326171875, -0.1218719482421875, -0.09232330322265625, -0.062774658203125, -0.03322601318359375, -0.0036773681640625, 0.02587127685546875, 0.055419921875, 0.08496856689453125, 0.1145172119140625, 0.14406585693359375, 0.173614501953125, 0.20316314697265625, 0.2327117919921875, 0.26226043701171875, 0.29180908203125, 0.32135772705078125, 0.3509063720703125, 0.38045501708984375, 0.410003662109375, 0.43955230712890625, 0.4691009521484375, 0.49864959716796875, 0.5281982421875, 0.5577468872070312, 0.5872955322265625, 0.6168441772460938, 0.646392822265625, 0.6759414672851562, 0.7054901123046875, 0.7350387573242188, 0.76458740234375, 0.7941360473632812, 0.8236846923828125, 0.8532333374023438, 0.882781982421875, 0.9123306274414062, 0.9418792724609375, 0.9714279174804688, 1.0009765625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 8.0, 6.0, 14.0, 11.0, 16.0, 14.0, 23.0, 21.0, 31.0, 40.0, 57.0, 56.0, 68.0, 59.0, 74.0, 92.0, 77.0, 61.0, 63.0, 37.0, 29.0, 28.0, 25.0, 17.0, 14.0, 5.0, 10.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008139610290527344, -0.0007902905344963074, -0.0007666200399398804, -0.0007429495453834534, -0.0007192790508270264, -0.0006956085562705994, -0.0006719380617141724, -0.0006482675671577454, -0.0006245970726013184, -0.0006009265780448914, -0.0005772560834884644, -0.0005535855889320374, -0.0005299150943756104, -0.0005062445998191833, -0.00048257410526275635, -0.00045890361070632935, -0.00043523311614990234, -0.00041156262159347534, -0.00038789212703704834, -0.00036422163248062134, -0.00034055113792419434, -0.00031688064336776733, -0.00029321014881134033, -0.00026953965425491333, -0.00024586915969848633, -0.00022219866514205933, -0.00019852817058563232, -0.00017485767602920532, -0.00015118718147277832, -0.00012751668691635132, -0.00010384619235992432, -8.017569780349731e-05, -5.650520324707031e-05, -3.283470869064331e-05, -9.164214134216309e-06, 1.4506280422210693e-05, 3.8176774978637695e-05, 6.18472695350647e-05, 8.55177640914917e-05, 0.0001091882586479187, 0.0001328587532043457, 0.0001565292477607727, 0.0001801997423171997, 0.0002038702368736267, 0.0002275407314300537, 0.0002512112259864807, 0.0002748817205429077, 0.0002985522150993347, 0.0003222227096557617, 0.0003458932042121887, 0.0003695636987686157, 0.0003932341933250427, 0.0004169046878814697, 0.00044057518243789673, 0.00046424567699432373, 0.00048791617155075073, 0.0005115866661071777, 0.0005352571606636047, 0.0005589276552200317, 0.0005825981497764587, 0.0006062686443328857, 0.0006299391388893127, 0.0006536096334457397, 0.0006772801280021667, 0.0007009506225585938]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 11.0, 15.0, 18.0, 20.0, 40.0, 41.0, 80.0, 133.0, 251.0, 602.0, 3234.0, 1037664.0, 5091.0, 679.0, 228.0, 115.0, 77.0, 60.0, 36.0, 31.0, 16.0, 15.0, 6.0, 15.0, 9.0, 16.0, 5.0, 7.0, 3.0, 5.0, 2.0, 0.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.017578125, -0.01702094078063965, -0.016463756561279297, -0.015906572341918945, -0.015349388122558594, -0.014792203903198242, -0.01423501968383789, -0.013677835464477539, -0.013120651245117188, -0.012563467025756836, -0.012006282806396484, -0.011449098587036133, -0.010891914367675781, -0.01033473014831543, -0.009777545928955078, -0.009220361709594727, -0.008663177490234375, -0.008105993270874023, -0.007548809051513672, -0.00699162483215332, -0.006434440612792969, -0.005877256393432617, -0.005320072174072266, -0.004762887954711914, -0.0042057037353515625, -0.003648519515991211, -0.0030913352966308594, -0.002534151077270508, -0.0019769668579101562, -0.0014197826385498047, -0.0008625984191894531, -0.00030541419982910156, 0.00025177001953125, 0.0008089542388916016, 0.0013661384582519531, 0.0019233226776123047, 0.0024805068969726562, 0.003037691116333008, 0.0035948753356933594, 0.004152059555053711, 0.0047092437744140625, 0.005266427993774414, 0.005823612213134766, 0.006380796432495117, 0.006937980651855469, 0.00749516487121582, 0.008052349090576172, 0.008609533309936523, 0.009166717529296875, 0.009723901748657227, 0.010281085968017578, 0.01083827018737793, 0.011395454406738281, 0.011952638626098633, 0.012509822845458984, 0.013067007064819336, 0.013624191284179688, 0.014181375503540039, 0.01473855972290039, 0.015295743942260742, 0.015852928161621094, 0.016410112380981445, 0.016967296600341797, 0.01752448081970215, 0.0180816650390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 231.0, 734.0, 47.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005053344066254795, -0.0004097155178897083, -0.0003140966291539371, -0.00021847771131433547, -0.00012285882257856429, -2.7239933842793107e-05, 6.837898399680853e-05, 0.0001639978727325797, 0.0002596167614683509, 0.00035523565020412207, 0.00045085453893989325, 0.0005464734276756644, 0.0006420923164114356, 0.0007377112051472068, 0.0008333301520906389, 0.0009289490408264101, 0.0010245679877698421, 0.0011201868765056133, 0.0012158057652413845, 0.0013114246539771557, 0.0014070435427129269, 0.001502662431448698, 0.0015982813201844692, 0.0016939002089202404, 0.0017895190976560116, 0.0018851379863917828, 0.001980756875127554, 0.002076375763863325, 0.0021719946525990963, 0.0022676135413348675, 0.0023632324300706387, 0.00245885131880641, 0.0025544704403728247, 0.002650089329108596, 0.002745708217844367, 0.002841327106580138, 0.0029369459953159094, 0.0030325648840516806, 0.0031281837727874517, 0.003223802661523223, 0.003319421550258994, 0.0034150404389947653, 0.0035106593277305365, 0.0036062782164663076, 0.003701897105202079, 0.00379751599393785, 0.003893134882673621, 0.003988754004240036, 0.004084372892975807, 0.004179991781711578, 0.0042756106704473495, 0.004371229559183121, 0.004466848447918892, 0.004562467336654663, 0.004658086225390434, 0.0047537051141262054, 0.004849324002861977, 0.004944942891597748, 0.005040561780333519, 0.00513618066906929, 0.005231799557805061, 0.0053274184465408325, 0.005423037335276604, 0.005518656224012375, 0.005614275112748146]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 1.0, 2.0, 9.0, 8.0, 8.0, 9.0, 9.0, 16.0, 12.0, 22.0, 19.0, 25.0, 31.0, 39.0, 35.0, 35.0, 32.0, 24.0, 34.0, 40.0, 33.0, 36.0, 54.0, 54.0, 41.0, 32.0, 35.0, 39.0, 27.0, 21.0, 23.0, 22.0, 17.0, 28.0, 17.0, 12.0, 17.0, 13.0, 8.0, 9.0, 11.0, 5.0, 9.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00034803152084350586, -0.00033771153539419174, -0.0003273915499448776, -0.0003170715644955635, -0.0003067515790462494, -0.00029643159359693527, -0.00028611160814762115, -0.00027579162269830704, -0.0002654716372489929, -0.0002551516517996788, -0.0002448316663503647, -0.00023451168090105057, -0.00022419169545173645, -0.00021387171000242233, -0.00020355172455310822, -0.0001932317391037941, -0.00018291175365447998, -0.00017259176820516586, -0.00016227178275585175, -0.00015195179730653763, -0.0001416318118572235, -0.0001313118264079094, -0.00012099184095859528, -0.00011067185550928116, -0.00010035187005996704, -9.003188461065292e-05, -7.97118991613388e-05, -6.939191371202469e-05, -5.907192826271057e-05, -4.8751942813396454e-05, -3.8431957364082336e-05, -2.811197191476822e-05, -1.77919864654541e-05, -7.472001016139984e-06, 2.8479844331741333e-06, 1.316796988248825e-05, 2.3487955331802368e-05, 3.3807940781116486e-05, 4.41279262304306e-05, 5.444791167974472e-05, 6.476789712905884e-05, 7.508788257837296e-05, 8.540786802768707e-05, 9.572785347700119e-05, 0.00010604783892631531, 0.00011636782437562943, 0.00012668780982494354, 0.00013700779527425766, 0.00014732778072357178, 0.0001576477661728859, 0.0001679677516222, 0.00017828773707151413, 0.00018860772252082825, 0.00019892770797014236, 0.00020924769341945648, 0.0002195676788687706, 0.00022988766431808472, 0.00024020764976739883, 0.00025052763521671295, 0.00026084762066602707, 0.0002711676061153412, 0.0002814875915646553, 0.0002918075770139694, 0.00030212756246328354, 0.00031244754791259766]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 16.0, 14.0, 23.0, 18.0, 30.0, 24.0, 28.0, 35.0, 36.0, 33.0, 42.0, 46.0, 50.0, 44.0, 41.0, 45.0, 50.0, 38.0, 34.0, 41.0, 40.0, 37.0, 37.0, 31.0, 27.0, 26.0, 18.0, 13.0, 11.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.40625, -7.18658447265625, -6.9669189453125, -6.74725341796875, -6.527587890625, -6.30792236328125, -6.0882568359375, -5.86859130859375, -5.64892578125, -5.42926025390625, -5.2095947265625, -4.98992919921875, -4.770263671875, -4.55059814453125, -4.3309326171875, -4.11126708984375, -3.8916015625, -3.67193603515625, -3.4522705078125, -3.23260498046875, -3.012939453125, -2.79327392578125, -2.5736083984375, -2.35394287109375, -2.13427734375, -1.91461181640625, -1.6949462890625, -1.47528076171875, -1.255615234375, -1.03594970703125, -0.8162841796875, -0.59661865234375, -0.376953125, -0.15728759765625, 0.0623779296875, 0.28204345703125, 0.501708984375, 0.72137451171875, 0.9410400390625, 1.16070556640625, 1.38037109375, 1.60003662109375, 1.8197021484375, 2.03936767578125, 2.259033203125, 2.47869873046875, 2.6983642578125, 2.91802978515625, 3.1376953125, 3.35736083984375, 3.5770263671875, 3.79669189453125, 4.016357421875, 4.23602294921875, 4.4556884765625, 4.67535400390625, 4.89501953125, 5.11468505859375, 5.3343505859375, 5.55401611328125, 5.773681640625, 5.99334716796875, 6.2130126953125, 6.43267822265625, 6.65234375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 6.0, 10.0, 13.0, 15.0, 35.0, 28.0, 52.0, 47.0, 86.0, 107.0, 177.0, 235.0, 363.0, 543.0, 940.0, 1699.0, 3707.0, 9049.0, 23893.0, 69892.0, 207955.0, 466905.0, 170120.0, 57509.0, 20433.0, 7543.0, 3199.0, 1536.0, 851.0, 491.0, 314.0, 241.0, 165.0, 103.0, 68.0, 61.0, 51.0, 32.0, 21.0, 16.0, 4.0, 8.0, 9.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.453125, -5.2899169921875, -5.126708984375, -4.9635009765625, -4.80029296875, -4.6370849609375, -4.473876953125, -4.3106689453125, -4.1474609375, -3.9842529296875, -3.821044921875, -3.6578369140625, -3.49462890625, -3.3314208984375, -3.168212890625, -3.0050048828125, -2.841796875, -2.6785888671875, -2.515380859375, -2.3521728515625, -2.18896484375, -2.0257568359375, -1.862548828125, -1.6993408203125, -1.5361328125, -1.3729248046875, -1.209716796875, -1.0465087890625, -0.88330078125, -0.7200927734375, -0.556884765625, -0.3936767578125, -0.23046875, -0.0672607421875, 0.095947265625, 0.2591552734375, 0.42236328125, 0.5855712890625, 0.748779296875, 0.9119873046875, 1.0751953125, 1.2384033203125, 1.401611328125, 1.5648193359375, 1.72802734375, 1.8912353515625, 2.054443359375, 2.2176513671875, 2.380859375, 2.5440673828125, 2.707275390625, 2.8704833984375, 3.03369140625, 3.1968994140625, 3.360107421875, 3.5233154296875, 3.6865234375, 3.8497314453125, 4.012939453125, 4.1761474609375, 4.33935546875, 4.5025634765625, 4.665771484375, 4.8289794921875, 4.9921875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 1.0, 4.0, 4.0, 8.0, 7.0, 6.0, 8.0, 15.0, 13.0, 14.0, 13.0, 18.0, 28.0, 20.0, 26.0, 26.0, 37.0, 36.0, 38.0, 57.0, 80.0, 74.0, 317.0, 1597.0, 125.0, 70.0, 57.0, 59.0, 37.0, 45.0, 37.0, 28.0, 25.0, 23.0, 16.0, 20.0, 10.0, 8.0, 11.0, 11.0, 3.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.46875, -23.792236328125, -23.11572265625, -22.439208984375, -21.7626953125, -21.086181640625, -20.40966796875, -19.733154296875, -19.056640625, -18.380126953125, -17.70361328125, -17.027099609375, -16.3505859375, -15.674072265625, -14.99755859375, -14.321044921875, -13.64453125, -12.968017578125, -12.29150390625, -11.614990234375, -10.9384765625, -10.261962890625, -9.58544921875, -8.908935546875, -8.232421875, -7.555908203125, -6.87939453125, -6.202880859375, -5.5263671875, -4.849853515625, -4.17333984375, -3.496826171875, -2.8203125, -2.143798828125, -1.46728515625, -0.790771484375, -0.1142578125, 0.562255859375, 1.23876953125, 1.915283203125, 2.591796875, 3.268310546875, 3.94482421875, 4.621337890625, 5.2978515625, 5.974365234375, 6.65087890625, 7.327392578125, 8.00390625, 8.680419921875, 9.35693359375, 10.033447265625, 10.7099609375, 11.386474609375, 12.06298828125, 12.739501953125, 13.416015625, 14.092529296875, 14.76904296875, 15.445556640625, 16.1220703125, 16.798583984375, 17.47509765625, 18.151611328125, 18.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 20.0, 16.0, 19.0, 45.0, 53.0, 67.0, 105.0, 163.0, 217.0, 342.0, 694.0, 6205.0, 3121553.0, 14089.0, 876.0, 359.0, 227.0, 161.0, 124.0, 94.0, 54.0, 53.0, 30.0, 30.0, 26.0, 20.0, 14.0, 11.0, 4.0, 7.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-73.8125, -71.79443359375, -69.7763671875, -67.75830078125, -65.740234375, -63.72216796875, -61.7041015625, -59.68603515625, -57.66796875, -55.64990234375, -53.6318359375, -51.61376953125, -49.595703125, -47.57763671875, -45.5595703125, -43.54150390625, -41.5234375, -39.50537109375, -37.4873046875, -35.46923828125, -33.451171875, -31.43310546875, -29.4150390625, -27.39697265625, -25.37890625, -23.36083984375, -21.3427734375, -19.32470703125, -17.306640625, -15.28857421875, -13.2705078125, -11.25244140625, -9.234375, -7.21630859375, -5.1982421875, -3.18017578125, -1.162109375, 0.85595703125, 2.8740234375, 4.89208984375, 6.91015625, 8.92822265625, 10.9462890625, 12.96435546875, 14.982421875, 17.00048828125, 19.0185546875, 21.03662109375, 23.0546875, 25.07275390625, 27.0908203125, 29.10888671875, 31.126953125, 33.14501953125, 35.1630859375, 37.18115234375, 39.19921875, 41.21728515625, 43.2353515625, 45.25341796875, 47.271484375, 49.28955078125, 51.3076171875, 53.32568359375, 55.34375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 24.0, 117.0, 426.0, 339.0, 96.0, 8.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.97565841674805, -46.39053726196289, -43.805416107177734, -41.22029113769531, -38.635169982910156, -36.050048828125, -33.464927673339844, -30.879804611206055, -28.2946834564209, -25.709562301635742, -23.124439239501953, -20.539318084716797, -17.95419692993164, -15.369073867797852, -12.783952713012695, -10.198829650878906, -7.61370849609375, -5.028586387634277, -2.443464756011963, 0.14165687561035156, 2.726778984069824, 5.311901092529297, 7.897022247314453, 10.482145309448242, 13.067266464233398, 15.652388572692871, 18.237510681152344, 20.8226318359375, 23.407752990722656, 25.992876052856445, 28.5779972076416, 31.16312026977539, 33.74823760986328, 36.33335876464844, 38.918479919433594, 41.50360107421875, 44.08872604370117, 46.67384719848633, 49.258968353271484, 51.844093322753906, 54.42921447753906, 57.01433563232422, 59.599456787109375, 62.18457794189453, 64.76969909667969, 67.35482788085938, 69.93994140625, 72.52507019042969, 75.11018371582031, 77.69530487060547, 80.28042602539062, 82.86554718017578, 85.45066833496094, 88.03579711914062, 90.62091064453125, 93.20603942871094, 95.7911605834961, 98.37628173828125, 100.9614028930664, 103.54652404785156, 106.13164520263672, 108.71676635742188, 111.30189514160156, 113.88701629638672, 116.47213745117188]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 8.0, 8.0, 3.0, 7.0, 10.0, 13.0, 17.0, 15.0, 26.0, 20.0, 29.0, 21.0, 32.0, 36.0, 39.0, 39.0, 35.0, 35.0, 42.0, 41.0, 40.0, 28.0, 44.0, 52.0, 46.0, 26.0, 40.0, 27.0, 32.0, 22.0, 27.0, 24.0, 19.0, 12.0, 12.0, 16.0, 7.0, 9.0, 1.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-63.36546325683594, -61.41703414916992, -59.46860885620117, -57.520179748535156, -55.571754455566406, -53.62332534790039, -51.674896240234375, -49.726470947265625, -47.77804183959961, -45.829612731933594, -43.881187438964844, -41.93275833129883, -39.98432922363281, -38.03590393066406, -36.08747482299805, -34.13904571533203, -32.19062042236328, -30.2421932220459, -28.293766021728516, -26.3453369140625, -24.396909713745117, -22.448482513427734, -20.50005340576172, -18.551626205444336, -16.603199005126953, -14.65477180480957, -12.706343650817871, -10.757915496826172, -8.809488296508789, -6.861061096191406, -4.912632942199707, -2.964204788208008, -1.015777587890625, 0.932650089263916, 2.881077766418457, 4.829505443572998, 6.777933120727539, 8.726360321044922, 10.674788475036621, 12.62321662902832, 14.571643829345703, 16.520071029663086, 18.46849822998047, 20.416927337646484, 22.365354537963867, 24.31378173828125, 26.262210845947266, 28.21063804626465, 30.15906524658203, 32.10749435424805, 34.0559196472168, 36.00434875488281, 37.95277404785156, 39.90120315551758, 41.849632263183594, 43.798057556152344, 45.74648666381836, 47.694915771484375, 49.643341064453125, 51.59177017211914, 53.540199279785156, 55.488624572753906, 57.43705368041992, 59.38548278808594, 61.33390808105469]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 17.0, 19.0, 21.0, 22.0, 16.0, 28.0, 20.0, 44.0, 30.0, 30.0, 41.0, 47.0, 48.0, 44.0, 50.0, 41.0, 34.0, 34.0, 38.0, 37.0, 37.0, 40.0, 41.0, 32.0, 28.0, 21.0, 20.0, 18.0, 20.0, 14.0, 9.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.2109375, -6.98712158203125, -6.7633056640625, -6.53948974609375, -6.315673828125, -6.09185791015625, -5.8680419921875, -5.64422607421875, -5.42041015625, -5.19659423828125, -4.9727783203125, -4.74896240234375, -4.525146484375, -4.30133056640625, -4.0775146484375, -3.85369873046875, -3.6298828125, -3.40606689453125, -3.1822509765625, -2.95843505859375, -2.734619140625, -2.51080322265625, -2.2869873046875, -2.06317138671875, -1.83935546875, -1.61553955078125, -1.3917236328125, -1.16790771484375, -0.944091796875, -0.72027587890625, -0.4964599609375, -0.27264404296875, -0.048828125, 0.17498779296875, 0.3988037109375, 0.62261962890625, 0.846435546875, 1.07025146484375, 1.2940673828125, 1.51788330078125, 1.74169921875, 1.96551513671875, 2.1893310546875, 2.41314697265625, 2.636962890625, 2.86077880859375, 3.0845947265625, 3.30841064453125, 3.5322265625, 3.75604248046875, 3.9798583984375, 4.20367431640625, 4.427490234375, 4.65130615234375, 4.8751220703125, 5.09893798828125, 5.32275390625, 5.54656982421875, 5.7703857421875, 5.99420166015625, 6.218017578125, 6.44183349609375, 6.6656494140625, 6.88946533203125, 7.11328125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 12.0, 16.0, 11.0, 10.0, 17.0, 18.0, 24.0, 28.0, 23.0, 31.0, 40.0, 41.0, 72.0, 169.0, 553.0, 2700.0, 61131.0, 3086468.0, 1028382.0, 12504.0, 1251.0, 338.0, 106.0, 62.0, 41.0, 33.0, 35.0, 30.0, 12.0, 21.0, 23.0, 19.0, 11.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.171875, -24.3544921875, -23.537109375, -22.7197265625, -21.90234375, -21.0849609375, -20.267578125, -19.4501953125, -18.6328125, -17.8154296875, -16.998046875, -16.1806640625, -15.36328125, -14.5458984375, -13.728515625, -12.9111328125, -12.09375, -11.2763671875, -10.458984375, -9.6416015625, -8.82421875, -8.0068359375, -7.189453125, -6.3720703125, -5.5546875, -4.7373046875, -3.919921875, -3.1025390625, -2.28515625, -1.4677734375, -0.650390625, 0.1669921875, 0.984375, 1.8017578125, 2.619140625, 3.4365234375, 4.25390625, 5.0712890625, 5.888671875, 6.7060546875, 7.5234375, 8.3408203125, 9.158203125, 9.9755859375, 10.79296875, 11.6103515625, 12.427734375, 13.2451171875, 14.0625, 14.8798828125, 15.697265625, 16.5146484375, 17.33203125, 18.1494140625, 18.966796875, 19.7841796875, 20.6015625, 21.4189453125, 22.236328125, 23.0537109375, 23.87109375, 24.6884765625, 25.505859375, 26.3232421875, 27.140625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 7.0, 15.0, 19.0, 17.0, 32.0, 46.0, 43.0, 91.0, 103.0, 129.0, 168.0, 230.0, 320.0, 378.0, 442.0, 487.0, 385.0, 304.0, 218.0, 162.0, 123.0, 78.0, 64.0, 45.0, 46.0, 28.0, 20.0, 14.0, 10.0, 10.0, 5.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.071533203125, -10.65869140625, -10.245849609375, -9.8330078125, -9.420166015625, -9.00732421875, -8.594482421875, -8.181640625, -7.768798828125, -7.35595703125, -6.943115234375, -6.5302734375, -6.117431640625, -5.70458984375, -5.291748046875, -4.87890625, -4.466064453125, -4.05322265625, -3.640380859375, -3.2275390625, -2.814697265625, -2.40185546875, -1.989013671875, -1.576171875, -1.163330078125, -0.75048828125, -0.337646484375, 0.0751953125, 0.488037109375, 0.90087890625, 1.313720703125, 1.7265625, 2.139404296875, 2.55224609375, 2.965087890625, 3.3779296875, 3.790771484375, 4.20361328125, 4.616455078125, 5.029296875, 5.442138671875, 5.85498046875, 6.267822265625, 6.6806640625, 7.093505859375, 7.50634765625, 7.919189453125, 8.33203125, 8.744873046875, 9.15771484375, 9.570556640625, 9.9833984375, 10.396240234375, 10.80908203125, 11.221923828125, 11.634765625, 12.047607421875, 12.46044921875, 12.873291015625, 13.2861328125, 13.698974609375, 14.11181640625, 14.524658203125, 14.9375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 16.0, 18.0, 24.0, 23.0, 42.0, 51.0, 64.0, 82.0, 97.0, 139.0, 191.0, 237.0, 403.0, 732.0, 6149.0, 4022252.0, 160889.0, 1190.0, 476.0, 314.0, 206.0, 154.0, 121.0, 90.0, 73.0, 48.0, 38.0, 31.0, 29.0, 17.0, 13.0, 13.0, 14.0, 4.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.59375, -60.48876953125, -58.3837890625, -56.27880859375, -54.173828125, -52.06884765625, -49.9638671875, -47.85888671875, -45.75390625, -43.64892578125, -41.5439453125, -39.43896484375, -37.333984375, -35.22900390625, -33.1240234375, -31.01904296875, -28.9140625, -26.80908203125, -24.7041015625, -22.59912109375, -20.494140625, -18.38916015625, -16.2841796875, -14.17919921875, -12.07421875, -9.96923828125, -7.8642578125, -5.75927734375, -3.654296875, -1.54931640625, 0.5556640625, 2.66064453125, 4.765625, 6.87060546875, 8.9755859375, 11.08056640625, 13.185546875, 15.29052734375, 17.3955078125, 19.50048828125, 21.60546875, 23.71044921875, 25.8154296875, 27.92041015625, 30.025390625, 32.13037109375, 34.2353515625, 36.34033203125, 38.4453125, 40.55029296875, 42.6552734375, 44.76025390625, 46.865234375, 48.97021484375, 51.0751953125, 53.18017578125, 55.28515625, 57.39013671875, 59.4951171875, 61.60009765625, 63.705078125, 65.81005859375, 67.9150390625, 70.02001953125, 72.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 26.0, 204.0, 473.0, 267.0, 38.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.7817611694336, -80.40135955810547, -74.02095794677734, -67.64056396484375, -61.26015853881836, -54.879756927490234, -48.499359130859375, -42.11895751953125, -35.738555908203125, -29.358154296875, -22.977754592895508, -16.597354888916016, -10.21695327758789, -3.8365516662597656, 2.5438461303710938, 8.924247741699219, 15.304649353027344, 21.68505096435547, 28.06545066833496, 34.44585037231445, 40.82625198364258, 47.2066535949707, 53.58705139160156, 59.96745300292969, 66.34785461425781, 72.72825622558594, 79.10865783691406, 85.48905944824219, 91.86946105957031, 98.24986267089844, 104.63025665283203, 111.01065826416016, 117.39105224609375, 123.77145385742188, 130.15185546875, 136.53225708007812, 142.91265869140625, 149.29306030273438, 155.6734619140625, 162.05386352539062, 168.43426513671875, 174.81466674804688, 181.195068359375, 187.57546997070312, 193.95587158203125, 200.33627319335938, 206.7166748046875, 213.09707641601562, 219.4774627685547, 225.8578643798828, 232.23826599121094, 238.61866760253906, 244.9990692138672, 251.3794708251953, 257.7598571777344, 264.1402587890625, 270.5206604003906, 276.90106201171875, 283.2814636230469, 289.661865234375, 296.0422668457031, 302.42266845703125, 308.8030700683594, 315.1834716796875, 321.5638732910156]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 6.0, 12.0, 13.0, 17.0, 20.0, 17.0, 13.0, 29.0, 24.0, 23.0, 29.0, 35.0, 33.0, 29.0, 40.0, 39.0, 39.0, 28.0, 40.0, 41.0, 37.0, 32.0, 46.0, 41.0, 30.0, 32.0, 27.0, 30.0, 12.0, 36.0, 25.0, 22.0, 16.0, 5.0, 12.0, 11.0, 6.0, 7.0, 8.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.13287353515625, -38.885887145996094, -37.6389045715332, -36.39191818237305, -35.144935607910156, -33.89794921875, -32.650962829589844, -31.40397834777832, -30.156993865966797, -28.910009384155273, -27.66302490234375, -26.416038513183594, -25.16905403137207, -23.922069549560547, -22.67508316040039, -21.428098678588867, -20.181114196777344, -18.93412971496582, -17.687145233154297, -16.44015884399414, -15.193174362182617, -13.946189880371094, -12.699204444885254, -11.452219009399414, -10.20523452758789, -8.958250045776367, -7.711264610290527, -6.464279651641846, -5.217294692993164, -3.9703097343444824, -2.723324775695801, -1.476339340209961, -0.2293548583984375, 1.0176301002502441, 2.264615058898926, 3.5116000175476074, 4.758584976196289, 6.005569934844971, 7.252554893493652, 8.499540328979492, 9.746524810791016, 10.993509292602539, 12.240494728088379, 13.487480163574219, 14.734464645385742, 15.981449127197266, 17.228435516357422, 18.475419998168945, 19.72240447998047, 20.969388961791992, 22.216373443603516, 23.463359832763672, 24.710344314575195, 25.95732879638672, 27.204315185546875, 28.4512996673584, 29.698284149169922, 30.945268630981445, 32.19225311279297, 33.439239501953125, 34.68622589111328, 35.93320846557617, 37.18019485473633, 38.42717742919922, 39.674163818359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 4.0, 11.0, 15.0, 13.0, 24.0, 21.0, 32.0, 19.0, 33.0, 26.0, 44.0, 29.0, 41.0, 48.0, 41.0, 41.0, 32.0, 43.0, 43.0, 39.0, 36.0, 33.0, 42.0, 30.0, 30.0, 47.0, 33.0, 25.0, 13.0, 15.0, 14.0, 13.0, 12.0, 7.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.6307373046875, -6.417724609375, -6.2047119140625, -5.99169921875, -5.7786865234375, -5.565673828125, -5.3526611328125, -5.1396484375, -4.9266357421875, -4.713623046875, -4.5006103515625, -4.28759765625, -4.0745849609375, -3.861572265625, -3.6485595703125, -3.435546875, -3.2225341796875, -3.009521484375, -2.7965087890625, -2.58349609375, -2.3704833984375, -2.157470703125, -1.9444580078125, -1.7314453125, -1.5184326171875, -1.305419921875, -1.0924072265625, -0.87939453125, -0.6663818359375, -0.453369140625, -0.2403564453125, -0.02734375, 0.1856689453125, 0.398681640625, 0.6116943359375, 0.82470703125, 1.0377197265625, 1.250732421875, 1.4637451171875, 1.6767578125, 1.8897705078125, 2.102783203125, 2.3157958984375, 2.52880859375, 2.7418212890625, 2.954833984375, 3.1678466796875, 3.380859375, 3.5938720703125, 3.806884765625, 4.0198974609375, 4.23291015625, 4.4459228515625, 4.658935546875, 4.8719482421875, 5.0849609375, 5.2979736328125, 5.510986328125, 5.7239990234375, 5.93701171875, 6.1500244140625, 6.363037109375, 6.5760498046875, 6.7890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 15.0, 11.0, 26.0, 34.0, 45.0, 93.0, 132.0, 163.0, 278.0, 359.0, 503.0, 746.0, 1191.0, 1588.0, 2343.0, 3371.0, 5073.0, 7756.0, 11658.0, 17886.0, 27850.0, 43930.0, 69396.0, 114518.0, 196334.0, 210764.0, 124608.0, 74774.0, 46853.0, 29598.0, 19131.0, 12575.0, 8177.0, 5334.0, 3716.0, 2416.0, 1658.0, 1124.0, 725.0, 549.0, 382.0, 265.0, 198.0, 132.0, 89.0, 63.0, 43.0, 32.0, 16.0, 6.0, 8.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.95849609375, -0.9286117553710938, -0.8987274169921875, -0.8688430786132812, -0.838958740234375, -0.8090744018554688, -0.7791900634765625, -0.7493057250976562, -0.71942138671875, -0.6895370483398438, -0.6596527099609375, -0.6297683715820312, -0.599884033203125, -0.5699996948242188, -0.5401153564453125, -0.5102310180664062, -0.4803466796875, -0.45046234130859375, -0.4205780029296875, -0.39069366455078125, -0.360809326171875, -0.33092498779296875, -0.3010406494140625, -0.27115631103515625, -0.24127197265625, -0.21138763427734375, -0.1815032958984375, -0.15161895751953125, -0.121734619140625, -0.09185028076171875, -0.0619659423828125, -0.03208160400390625, -0.002197265625, 0.02768707275390625, 0.0575714111328125, 0.08745574951171875, 0.117340087890625, 0.14722442626953125, 0.1771087646484375, 0.20699310302734375, 0.23687744140625, 0.26676177978515625, 0.2966461181640625, 0.32653045654296875, 0.356414794921875, 0.38629913330078125, 0.4161834716796875, 0.44606781005859375, 0.4759521484375, 0.5058364868164062, 0.5357208251953125, 0.5656051635742188, 0.595489501953125, 0.6253738403320312, 0.6552581787109375, 0.6851425170898438, 0.71502685546875, 0.7449111938476562, 0.7747955322265625, 0.8046798706054688, 0.834564208984375, 0.8644485473632812, 0.8943328857421875, 0.9242172241210938, 0.9541015625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 11.0, 7.0, 11.0, 12.0, 12.0, 17.0, 20.0, 18.0, 23.0, 32.0, 35.0, 36.0, 36.0, 33.0, 41.0, 35.0, 61.0, 35.0, 1077.0, 41.0, 42.0, 47.0, 40.0, 27.0, 50.0, 26.0, 26.0, 25.0, 25.0, 19.0, 17.0, 11.0, 14.0, 8.0, 13.0, 6.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.41015625, -4.27276611328125, -4.1353759765625, -3.99798583984375, -3.860595703125, -3.72320556640625, -3.5858154296875, -3.44842529296875, -3.31103515625, -3.17364501953125, -3.0362548828125, -2.89886474609375, -2.761474609375, -2.62408447265625, -2.4866943359375, -2.34930419921875, -2.2119140625, -2.07452392578125, -1.9371337890625, -1.79974365234375, -1.662353515625, -1.52496337890625, -1.3875732421875, -1.25018310546875, -1.11279296875, -0.97540283203125, -0.8380126953125, -0.70062255859375, -0.563232421875, -0.42584228515625, -0.2884521484375, -0.15106201171875, -0.013671875, 0.12371826171875, 0.2611083984375, 0.39849853515625, 0.535888671875, 0.67327880859375, 0.8106689453125, 0.94805908203125, 1.08544921875, 1.22283935546875, 1.3602294921875, 1.49761962890625, 1.635009765625, 1.77239990234375, 1.9097900390625, 2.04718017578125, 2.1845703125, 2.32196044921875, 2.4593505859375, 2.59674072265625, 2.734130859375, 2.87152099609375, 3.0089111328125, 3.14630126953125, 3.28369140625, 3.42108154296875, 3.5584716796875, 3.69586181640625, 3.833251953125, 3.97064208984375, 4.1080322265625, 4.24542236328125, 4.3828125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 15.0, 20.0, 26.0, 47.0, 78.0, 120.0, 142.0, 252.0, 351.0, 507.0, 855.0, 1294.0, 2107.0, 3119.0, 4958.0, 7604.0, 12587.0, 20164.0, 34104.0, 58667.0, 107009.0, 209666.0, 1317679.0, 135846.0, 73397.0, 41919.0, 24468.0, 14898.0, 9211.0, 5696.0, 3616.0, 2314.0, 1574.0, 1021.0, 612.0, 396.0, 254.0, 174.0, 135.0, 68.0, 52.0, 44.0, 19.0, 19.0, 8.0, 8.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.016143798828125, -0.98248291015625, -0.948822021484375, -0.9151611328125, -0.881500244140625, -0.84783935546875, -0.814178466796875, -0.780517578125, -0.746856689453125, -0.71319580078125, -0.679534912109375, -0.6458740234375, -0.612213134765625, -0.57855224609375, -0.544891357421875, -0.51123046875, -0.477569580078125, -0.44390869140625, -0.410247802734375, -0.3765869140625, -0.342926025390625, -0.30926513671875, -0.275604248046875, -0.241943359375, -0.208282470703125, -0.17462158203125, -0.140960693359375, -0.1072998046875, -0.073638916015625, -0.03997802734375, -0.006317138671875, 0.02734375, 0.061004638671875, 0.09466552734375, 0.128326416015625, 0.1619873046875, 0.195648193359375, 0.22930908203125, 0.262969970703125, 0.296630859375, 0.330291748046875, 0.36395263671875, 0.397613525390625, 0.4312744140625, 0.464935302734375, 0.49859619140625, 0.532257080078125, 0.56591796875, 0.599578857421875, 0.63323974609375, 0.666900634765625, 0.7005615234375, 0.734222412109375, 0.76788330078125, 0.801544189453125, 0.835205078125, 0.868865966796875, 0.90252685546875, 0.936187744140625, 0.9698486328125, 1.003509521484375, 1.03717041015625, 1.070831298828125, 1.1044921875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 5.0, 15.0, 11.0, 16.0, 17.0, 21.0, 27.0, 26.0, 41.0, 32.0, 34.0, 49.0, 90.0, 70.0, 77.0, 54.0, 67.0, 55.0, 51.0, 49.0, 27.0, 25.0, 21.0, 16.0, 12.0, 10.0, 14.0, 6.0, 12.0, 7.0, 6.0, 3.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006728172302246094, -0.0006508305668830872, -0.0006288439035415649, -0.0006068572402000427, -0.0005848705768585205, -0.0005628839135169983, -0.0005408972501754761, -0.0005189105868339539, -0.0004969239234924316, -0.0004749372601509094, -0.0004529505968093872, -0.000430963933467865, -0.0004089772701263428, -0.00038699060678482056, -0.00036500394344329834, -0.0003430172801017761, -0.0003210306167602539, -0.0002990439534187317, -0.00027705729007720947, -0.00025507062673568726, -0.00023308396339416504, -0.00021109730005264282, -0.0001891106367111206, -0.0001671239733695984, -0.00014513731002807617, -0.00012315064668655396, -0.00010116398334503174, -7.917732000350952e-05, -5.7190656661987305e-05, -3.520399332046509e-05, -1.3217329978942871e-05, 8.769333362579346e-06, 3.075599670410156e-05, 5.274266004562378e-05, 7.4729323387146e-05, 9.671598672866821e-05, 0.00011870265007019043, 0.00014068931341171265, 0.00016267597675323486, 0.00018466264009475708, 0.0002066493034362793, 0.00022863596677780151, 0.00025062263011932373, 0.00027260929346084595, 0.00029459595680236816, 0.0003165826201438904, 0.0003385692834854126, 0.0003605559468269348, 0.00038254261016845703, 0.00040452927350997925, 0.00042651593685150146, 0.0004485026001930237, 0.0004704892635345459, 0.0004924759268760681, 0.0005144625902175903, 0.0005364492535591125, 0.0005584359169006348, 0.000580422580242157, 0.0006024092435836792, 0.0006243959069252014, 0.0006463825702667236, 0.0006683692336082458, 0.0006903558969497681, 0.0007123425602912903, 0.0007343292236328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 1.0, 8.0, 7.0, 6.0, 9.0, 10.0, 15.0, 10.0, 23.0, 28.0, 31.0, 40.0, 60.0, 89.0, 120.0, 252.0, 799.0, 9936.0, 1033213.0, 2591.0, 610.0, 230.0, 106.0, 80.0, 64.0, 34.0, 26.0, 38.0, 15.0, 22.0, 12.0, 15.0, 13.0, 7.0, 10.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016326904296875, -0.015822649002075195, -0.01531839370727539, -0.014814138412475586, -0.014309883117675781, -0.013805627822875977, -0.013301372528076172, -0.012797117233276367, -0.012292861938476562, -0.011788606643676758, -0.011284351348876953, -0.010780096054077148, -0.010275840759277344, -0.009771585464477539, -0.009267330169677734, -0.00876307487487793, -0.008258819580078125, -0.00775456428527832, -0.007250308990478516, -0.006746053695678711, -0.006241798400878906, -0.0057375431060791016, -0.005233287811279297, -0.004729032516479492, -0.0042247772216796875, -0.003720521926879883, -0.003216266632080078, -0.0027120113372802734, -0.0022077560424804688, -0.001703500747680664, -0.0011992454528808594, -0.0006949901580810547, -0.00019073486328125, 0.0003135204315185547, 0.0008177757263183594, 0.001322031021118164, 0.0018262863159179688, 0.0023305416107177734, 0.002834796905517578, 0.003339052200317383, 0.0038433074951171875, 0.004347562789916992, 0.004851818084716797, 0.0053560733795166016, 0.005860328674316406, 0.006364583969116211, 0.006868839263916016, 0.00737309455871582, 0.007877349853515625, 0.00838160514831543, 0.008885860443115234, 0.009390115737915039, 0.009894371032714844, 0.010398626327514648, 0.010902881622314453, 0.011407136917114258, 0.011911392211914062, 0.012415647506713867, 0.012919902801513672, 0.013424158096313477, 0.013928413391113281, 0.014432668685913086, 0.01493692398071289, 0.015441179275512695, 0.0159454345703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 14.0, 81.0, 199.0, 341.0, 241.0, 99.0, 26.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013728872872889042, -0.0013427898520603776, -0.001312692416831851, -0.0012825950980186462, -0.0012524976627901196, -0.001222400227561593, -0.0011923027923330665, -0.0011622053571045399, -0.0011321079218760133, -0.0011020104866474867, -0.00107191305141896, -0.0010418156161904335, -0.0010117182973772287, -0.0009816208621487021, -0.0009515234269201756, -0.000921425991691649, -0.0008913286728784442, -0.0008612312376499176, -0.0008311338606290519, -0.0008010364254005253, -0.0007709389901719987, -0.0007408416131511331, -0.0007107441779226065, -0.0006806467426940799, -0.0006505493074655533, -0.0006204518722370267, -0.000590354495216161, -0.0005602570599876344, -0.0005301596247591078, -0.0005000622477382421, -0.00046996481250971556, -0.0004398674063850194, -0.0004097700002603233, -0.00037967259413562715, -0.00034957515890710056, -0.0003194777527824044, -0.0002893803466577083, -0.00025928294053301215, -0.00022918550530448556, -0.00019908809917978942, -0.00016899067850317806, -0.0001388932578265667, -0.00010879585170187056, -7.86984310252592e-05, -4.860101762460545e-05, -1.8503604223951697e-05, 1.1593816452659667e-05, 4.16912225773558e-05, 7.178864325396717e-05, 0.00010188605665462092, 0.00013198347005527467, 0.00016208089073188603, 0.00019217829685658216, 0.00022227571753319353, 0.0002523731382098049, 0.00028247054433450103, 0.0003125679795630276, 0.00034266538568772376, 0.00037276282091625035, 0.0004028602270409465, 0.0004329576331656426, 0.00046305503929033875, 0.0004931524745188653, 0.000523249851539731, 0.0005533472867682576]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 6.0, 4.0, 5.0, 2.0, 3.0, 9.0, 13.0, 11.0, 11.0, 15.0, 18.0, 25.0, 26.0, 18.0, 30.0, 25.0, 26.0, 29.0, 37.0, 27.0, 44.0, 38.0, 41.0, 56.0, 40.0, 39.0, 32.0, 37.0, 25.0, 26.0, 16.0, 19.0, 34.0, 21.0, 28.0, 25.0, 21.0, 15.0, 15.0, 17.0, 11.0, 6.0, 17.0, 6.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003209710121154785, -0.0003109695389866829, -0.00030096806585788727, -0.00029096659272909164, -0.000280965119600296, -0.0002709636464715004, -0.0002609621733427048, -0.00025096070021390915, -0.00024095922708511353, -0.0002309577539563179, -0.00022095628082752228, -0.00021095480769872665, -0.00020095333456993103, -0.0001909518614411354, -0.00018095038831233978, -0.00017094891518354416, -0.00016094744205474854, -0.0001509459689259529, -0.0001409444957971573, -0.00013094302266836166, -0.00012094154953956604, -0.00011094007641077042, -0.00010093860328197479, -9.093713015317917e-05, -8.093565702438354e-05, -7.093418389558792e-05, -6.09327107667923e-05, -5.0931237637996674e-05, -4.092976450920105e-05, -3.0928291380405426e-05, -2.0926818251609802e-05, -1.0925345122814178e-05, -9.238719940185547e-07, 9.077601134777069e-06, 1.9079074263572693e-05, 2.9080547392368317e-05, 3.908202052116394e-05, 4.9083493649959564e-05, 5.908496677875519e-05, 6.908643990755081e-05, 7.908791303634644e-05, 8.908938616514206e-05, 9.909085929393768e-05, 0.00010909233242273331, 0.00011909380555152893, 0.00012909527868032455, 0.00013909675180912018, 0.0001490982249379158, 0.00015909969806671143, 0.00016910117119550705, 0.00017910264432430267, 0.0001891041174530983, 0.00019910559058189392, 0.00020910706371068954, 0.00021910853683948517, 0.0002291100099682808, 0.00023911148309707642, 0.00024911295622587204, 0.00025911442935466766, 0.0002691159024834633, 0.0002791173756122589, 0.00028911884874105453, 0.00029912032186985016, 0.0003091217949986458, 0.0003191232681274414]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 4.0, 11.0, 15.0, 13.0, 24.0, 22.0, 31.0, 19.0, 33.0, 26.0, 44.0, 29.0, 41.0, 48.0, 41.0, 41.0, 32.0, 43.0, 43.0, 39.0, 36.0, 33.0, 42.0, 30.0, 30.0, 47.0, 33.0, 25.0, 13.0, 15.0, 14.0, 13.0, 12.0, 7.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.6307373046875, -6.417724609375, -6.2047119140625, -5.99169921875, -5.7786865234375, -5.565673828125, -5.3526611328125, -5.1396484375, -4.9266357421875, -4.713623046875, -4.5006103515625, -4.28759765625, -4.0745849609375, -3.861572265625, -3.6485595703125, -3.435546875, -3.2225341796875, -3.009521484375, -2.7965087890625, -2.58349609375, -2.3704833984375, -2.157470703125, -1.9444580078125, -1.7314453125, -1.5184326171875, -1.305419921875, -1.0924072265625, -0.87939453125, -0.6663818359375, -0.453369140625, -0.2403564453125, -0.02734375, 0.1856689453125, 0.398681640625, 0.6116943359375, 0.82470703125, 1.0377197265625, 1.250732421875, 1.4637451171875, 1.6767578125, 1.8897705078125, 2.102783203125, 2.3157958984375, 2.52880859375, 2.7418212890625, 2.954833984375, 3.1678466796875, 3.380859375, 3.5938720703125, 3.806884765625, 4.0198974609375, 4.23291015625, 4.4459228515625, 4.658935546875, 4.8719482421875, 5.0849609375, 5.2979736328125, 5.510986328125, 5.7239990234375, 5.93701171875, 6.1500244140625, 6.363037109375, 6.5760498046875, 6.7890625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 14.0, 17.0, 32.0, 49.0, 73.0, 91.0, 131.0, 138.0, 227.0, 404.0, 658.0, 1118.0, 1902.0, 3429.0, 6830.0, 14724.0, 35121.0, 93736.0, 283319.0, 387929.0, 132503.0, 47770.0, 19549.0, 8787.0, 4395.0, 2235.0, 1255.0, 709.0, 444.0, 306.0, 195.0, 116.0, 101.0, 70.0, 40.0, 31.0, 25.0, 20.0, 18.0, 10.0, 3.0, 4.0, 5.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.12109375, -4.97119140625, -4.8212890625, -4.67138671875, -4.521484375, -4.37158203125, -4.2216796875, -4.07177734375, -3.921875, -3.77197265625, -3.6220703125, -3.47216796875, -3.322265625, -3.17236328125, -3.0224609375, -2.87255859375, -2.72265625, -2.57275390625, -2.4228515625, -2.27294921875, -2.123046875, -1.97314453125, -1.8232421875, -1.67333984375, -1.5234375, -1.37353515625, -1.2236328125, -1.07373046875, -0.923828125, -0.77392578125, -0.6240234375, -0.47412109375, -0.32421875, -0.17431640625, -0.0244140625, 0.12548828125, 0.275390625, 0.42529296875, 0.5751953125, 0.72509765625, 0.875, 1.02490234375, 1.1748046875, 1.32470703125, 1.474609375, 1.62451171875, 1.7744140625, 1.92431640625, 2.07421875, 2.22412109375, 2.3740234375, 2.52392578125, 2.673828125, 2.82373046875, 2.9736328125, 3.12353515625, 3.2734375, 3.42333984375, 3.5732421875, 3.72314453125, 3.873046875, 4.02294921875, 4.1728515625, 4.32275390625, 4.47265625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 4.0, 8.0, 14.0, 12.0, 10.0, 16.0, 18.0, 29.0, 21.0, 23.0, 23.0, 47.0, 35.0, 51.0, 45.0, 56.0, 93.0, 316.0, 1582.0, 123.0, 94.0, 57.0, 47.0, 38.0, 39.0, 33.0, 34.0, 32.0, 23.0, 15.0, 27.0, 10.0, 14.0, 8.0, 7.0, 7.0, 9.0, 6.0, 1.0, 1.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.484375, -21.80712890625, -21.1298828125, -20.45263671875, -19.775390625, -19.09814453125, -18.4208984375, -17.74365234375, -17.06640625, -16.38916015625, -15.7119140625, -15.03466796875, -14.357421875, -13.68017578125, -13.0029296875, -12.32568359375, -11.6484375, -10.97119140625, -10.2939453125, -9.61669921875, -8.939453125, -8.26220703125, -7.5849609375, -6.90771484375, -6.23046875, -5.55322265625, -4.8759765625, -4.19873046875, -3.521484375, -2.84423828125, -2.1669921875, -1.48974609375, -0.8125, -0.13525390625, 0.5419921875, 1.21923828125, 1.896484375, 2.57373046875, 3.2509765625, 3.92822265625, 4.60546875, 5.28271484375, 5.9599609375, 6.63720703125, 7.314453125, 7.99169921875, 8.6689453125, 9.34619140625, 10.0234375, 10.70068359375, 11.3779296875, 12.05517578125, 12.732421875, 13.40966796875, 14.0869140625, 14.76416015625, 15.44140625, 16.11865234375, 16.7958984375, 17.47314453125, 18.150390625, 18.82763671875, 19.5048828125, 20.18212890625, 20.859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 12.0, 13.0, 32.0, 54.0, 95.0, 182.0, 273.0, 495.0, 1754.0, 3133674.0, 7738.0, 613.0, 311.0, 187.0, 109.0, 59.0, 36.0, 21.0, 20.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.875, -137.41015625, -133.9453125, -130.48046875, -127.015625, -123.55078125, -120.0859375, -116.62109375, -113.15625, -109.69140625, -106.2265625, -102.76171875, -99.296875, -95.83203125, -92.3671875, -88.90234375, -85.4375, -81.97265625, -78.5078125, -75.04296875, -71.578125, -68.11328125, -64.6484375, -61.18359375, -57.71875, -54.25390625, -50.7890625, -47.32421875, -43.859375, -40.39453125, -36.9296875, -33.46484375, -30.0, -26.53515625, -23.0703125, -19.60546875, -16.140625, -12.67578125, -9.2109375, -5.74609375, -2.28125, 1.18359375, 4.6484375, 8.11328125, 11.578125, 15.04296875, 18.5078125, 21.97265625, 25.4375, 28.90234375, 32.3671875, 35.83203125, 39.296875, 42.76171875, 46.2265625, 49.69140625, 53.15625, 56.62109375, 60.0859375, 63.55078125, 67.015625, 70.48046875, 73.9453125, 77.41015625, 80.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [4.0, 937.0, 80.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.38177490234375, -7.355345726013184, 2.671083450317383, 12.697513580322266, 22.723941802978516, 32.750370025634766, 42.77680206298828, 52.80323028564453, 62.82965850830078, 72.85608673095703, 82.88251495361328, 92.90895080566406, 102.93537902832031, 112.96180725097656, 122.98823547363281, 133.01466369628906, 143.0410919189453, 153.06752014160156, 163.0939483642578, 173.12037658691406, 183.1468048095703, 193.17323303222656, 203.19967651367188, 213.22610473632812, 223.25253295898438, 233.27896118164062, 243.30538940429688, 253.33181762695312, 263.3582458496094, 273.3846740722656, 283.4111022949219, 293.4375305175781, 303.4639587402344, 313.4903869628906, 323.5168151855469, 333.5432434082031, 343.5696716308594, 353.5960998535156, 363.6225280761719, 373.6489562988281, 383.6753845214844, 393.7018127441406, 403.7282409667969, 413.7546691894531, 423.7810974121094, 433.8075256347656, 443.8339538574219, 453.8603820800781, 463.8868408203125, 473.91326904296875, 483.939697265625, 493.96612548828125, 503.9925537109375, 514.0189819335938, 524.04541015625, 534.0718383789062, 544.0982666015625, 554.1246948242188, 564.151123046875, 574.1775512695312, 584.2039794921875, 594.2304077148438, 604.2568359375, 614.2832641601562, 624.3096923828125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 10.0, 10.0, 8.0, 10.0, 14.0, 14.0, 14.0, 18.0, 20.0, 35.0, 25.0, 26.0, 30.0, 32.0, 29.0, 32.0, 45.0, 48.0, 43.0, 51.0, 43.0, 37.0, 45.0, 37.0, 35.0, 33.0, 32.0, 28.0, 31.0, 22.0, 23.0, 24.0, 12.0, 17.0, 10.0, 15.0, 14.0, 10.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.804561614990234, -57.924407958984375, -56.044254302978516, -54.164100646972656, -52.2839469909668, -50.40379333496094, -48.523643493652344, -46.64348602294922, -44.763336181640625, -42.883182525634766, -41.003028869628906, -39.12287521362305, -37.24272155761719, -35.36256790161133, -33.48241424560547, -31.602262496948242, -29.72210693359375, -27.84195327758789, -25.96179962158203, -24.081645965576172, -22.201492309570312, -20.321338653564453, -18.441186904907227, -16.561033248901367, -14.680879592895508, -12.800725936889648, -10.920572280883789, -9.040419578552246, -7.160265922546387, -5.280112266540527, -3.3999595642089844, -1.519805908203125, 0.3603477478027344, 2.2405011653900146, 4.120654582977295, 6.000807762145996, 7.8809614181518555, 9.761115074157715, 11.641267776489258, 13.521421432495117, 15.401575088500977, 17.281728744506836, 19.161882400512695, 21.042034149169922, 22.92218780517578, 24.80234146118164, 26.6824951171875, 28.56264877319336, 30.44280242919922, 32.32295608520508, 34.20310974121094, 36.0832633972168, 37.963417053222656, 39.843570709228516, 41.723724365234375, 43.60387420654297, 45.484031677246094, 47.36418533325195, 49.24433898925781, 51.12449264526367, 53.00464630126953, 54.88479995727539, 56.76495361328125, 58.645103454589844, 60.5252571105957]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 11.0, 6.0, 8.0, 16.0, 16.0, 17.0, 14.0, 21.0, 28.0, 30.0, 37.0, 42.0, 31.0, 43.0, 44.0, 41.0, 47.0, 42.0, 43.0, 37.0, 44.0, 33.0, 32.0, 33.0, 35.0, 33.0, 44.0, 36.0, 31.0, 16.0, 15.0, 8.0, 6.0, 16.0, 12.0, 6.0, 9.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12109375, -6.8931884765625, -6.665283203125, -6.4373779296875, -6.20947265625, -5.9815673828125, -5.753662109375, -5.5257568359375, -5.2978515625, -5.0699462890625, -4.842041015625, -4.6141357421875, -4.38623046875, -4.1583251953125, -3.930419921875, -3.7025146484375, -3.474609375, -3.2467041015625, -3.018798828125, -2.7908935546875, -2.56298828125, -2.3350830078125, -2.107177734375, -1.8792724609375, -1.6513671875, -1.4234619140625, -1.195556640625, -0.9676513671875, -0.73974609375, -0.5118408203125, -0.283935546875, -0.0560302734375, 0.171875, 0.3997802734375, 0.627685546875, 0.8555908203125, 1.08349609375, 1.3114013671875, 1.539306640625, 1.7672119140625, 1.9951171875, 2.2230224609375, 2.450927734375, 2.6788330078125, 2.90673828125, 3.1346435546875, 3.362548828125, 3.5904541015625, 3.818359375, 4.0462646484375, 4.274169921875, 4.5020751953125, 4.72998046875, 4.9578857421875, 5.185791015625, 5.4136962890625, 5.6416015625, 5.8695068359375, 6.097412109375, 6.3253173828125, 6.55322265625, 6.7811279296875, 7.009033203125, 7.2369384765625, 7.46484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 7.0, 5.0, 6.0, 9.0, 13.0, 12.0, 12.0, 10.0, 19.0, 27.0, 21.0, 31.0, 43.0, 49.0, 87.0, 116.0, 279.0, 796.0, 3136.0, 34569.0, 1201812.0, 2781809.0, 161368.0, 7689.0, 1352.0, 414.0, 176.0, 102.0, 76.0, 48.0, 33.0, 29.0, 24.0, 24.0, 18.0, 13.0, 9.0, 10.0, 6.0, 9.0, 6.0, 3.0, 7.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.540283203125, -16.93994140625, -16.339599609375, -15.7392578125, -15.138916015625, -14.53857421875, -13.938232421875, -13.337890625, -12.737548828125, -12.13720703125, -11.536865234375, -10.9365234375, -10.336181640625, -9.73583984375, -9.135498046875, -8.53515625, -7.934814453125, -7.33447265625, -6.734130859375, -6.1337890625, -5.533447265625, -4.93310546875, -4.332763671875, -3.732421875, -3.132080078125, -2.53173828125, -1.931396484375, -1.3310546875, -0.730712890625, -0.13037109375, 0.469970703125, 1.0703125, 1.670654296875, 2.27099609375, 2.871337890625, 3.4716796875, 4.072021484375, 4.67236328125, 5.272705078125, 5.873046875, 6.473388671875, 7.07373046875, 7.674072265625, 8.2744140625, 8.874755859375, 9.47509765625, 10.075439453125, 10.67578125, 11.276123046875, 11.87646484375, 12.476806640625, 13.0771484375, 13.677490234375, 14.27783203125, 14.878173828125, 15.478515625, 16.078857421875, 16.67919921875, 17.279541015625, 17.8798828125, 18.480224609375, 19.08056640625, 19.680908203125, 20.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 13.0, 6.0, 3.0, 9.0, 17.0, 12.0, 28.0, 24.0, 33.0, 39.0, 34.0, 63.0, 73.0, 90.0, 108.0, 140.0, 184.0, 232.0, 269.0, 372.0, 364.0, 344.0, 286.0, 280.0, 238.0, 165.0, 125.0, 112.0, 90.0, 63.0, 65.0, 41.0, 32.0, 29.0, 22.0, 14.0, 14.0, 5.0, 9.0, 6.0, 6.0, 7.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5743408203125, -8.265869140625, -7.9573974609375, -7.64892578125, -7.3404541015625, -7.031982421875, -6.7235107421875, -6.4150390625, -6.1065673828125, -5.798095703125, -5.4896240234375, -5.18115234375, -4.8726806640625, -4.564208984375, -4.2557373046875, -3.947265625, -3.6387939453125, -3.330322265625, -3.0218505859375, -2.71337890625, -2.4049072265625, -2.096435546875, -1.7879638671875, -1.4794921875, -1.1710205078125, -0.862548828125, -0.5540771484375, -0.24560546875, 0.0628662109375, 0.371337890625, 0.6798095703125, 0.98828125, 1.2967529296875, 1.605224609375, 1.9136962890625, 2.22216796875, 2.5306396484375, 2.839111328125, 3.1475830078125, 3.4560546875, 3.7645263671875, 4.072998046875, 4.3814697265625, 4.68994140625, 4.9984130859375, 5.306884765625, 5.6153564453125, 5.923828125, 6.2322998046875, 6.540771484375, 6.8492431640625, 7.15771484375, 7.4661865234375, 7.774658203125, 8.0831298828125, 8.3916015625, 8.7000732421875, 9.008544921875, 9.3170166015625, 9.62548828125, 9.9339599609375, 10.242431640625, 10.5509033203125, 10.859375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 20.0, 25.0, 28.0, 38.0, 38.0, 78.0, 108.0, 117.0, 160.0, 195.0, 344.0, 641.0, 3144.0, 4060837.0, 126119.0, 894.0, 441.0, 254.0, 188.0, 148.0, 114.0, 73.0, 58.0, 46.0, 40.0, 29.0, 19.0, 20.0, 10.0, 7.0, 3.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.625, -81.21875, -78.8125, -76.40625, -74.0, -71.59375, -69.1875, -66.78125, -64.375, -61.96875, -59.5625, -57.15625, -54.75, -52.34375, -49.9375, -47.53125, -45.125, -42.71875, -40.3125, -37.90625, -35.5, -33.09375, -30.6875, -28.28125, -25.875, -23.46875, -21.0625, -18.65625, -16.25, -13.84375, -11.4375, -9.03125, -6.625, -4.21875, -1.8125, 0.59375, 3.0, 5.40625, 7.8125, 10.21875, 12.625, 15.03125, 17.4375, 19.84375, 22.25, 24.65625, 27.0625, 29.46875, 31.875, 34.28125, 36.6875, 39.09375, 41.5, 43.90625, 46.3125, 48.71875, 51.125, 53.53125, 55.9375, 58.34375, 60.75, 63.15625, 65.5625, 67.96875, 70.375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 13.0, 17.0, 31.0, 31.0, 47.0, 59.0, 90.0, 85.0, 104.0, 91.0, 87.0, 76.0, 78.0, 66.0, 36.0, 31.0, 21.0, 10.0, 12.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.27195739746094, -32.10111999511719, -30.930282592773438, -29.759445190429688, -28.588607788085938, -27.417770385742188, -26.24693489074707, -25.07609748840332, -23.90526008605957, -22.73442268371582, -21.56358528137207, -20.39274787902832, -19.221912384033203, -18.051074981689453, -16.880237579345703, -15.709400177001953, -14.538562774658203, -13.367725372314453, -12.196887969970703, -11.02605152130127, -9.85521411895752, -8.68437671661377, -7.513539791107178, -6.342702865600586, -5.171865463256836, -4.001028060913086, -2.830191135406494, -1.6593539714813232, -0.48851680755615234, 0.6823205947875977, 1.8531575202941895, 3.0239944458007812, 4.194828033447266, 5.365665435791016, 6.536502361297607, 7.707339286804199, 8.87817668914795, 10.0490140914917, 11.219850540161133, 12.390687942504883, 13.561525344848633, 14.732362747192383, 15.903200149536133, 17.074037551879883, 18.244873046875, 19.41571044921875, 20.5865478515625, 21.75738525390625, 22.92822265625, 24.09906005859375, 25.2698974609375, 26.44073486328125, 27.611572265625, 28.78240966796875, 29.953245162963867, 31.124082565307617, 32.294921875, 33.46575927734375, 34.6365966796875, 35.80743408203125, 36.978271484375, 38.14910888671875, 39.3199462890625, 40.49078369140625, 41.661617279052734]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 10.0, 5.0, 9.0, 6.0, 11.0, 14.0, 12.0, 17.0, 17.0, 27.0, 25.0, 15.0, 29.0, 28.0, 38.0, 33.0, 31.0, 37.0, 49.0, 36.0, 33.0, 39.0, 47.0, 36.0, 47.0, 37.0, 29.0, 35.0, 24.0, 32.0, 28.0, 28.0, 25.0, 21.0, 11.0, 14.0, 16.0, 14.0, 7.0, 5.0, 5.0, 5.0, 6.0, 7.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.13691711425781, -37.85509490966797, -36.57327651977539, -35.29145431518555, -34.0096321105957, -32.72780990600586, -31.44599151611328, -30.164169311523438, -28.882347106933594, -27.600526809692383, -26.31870460510254, -25.036884307861328, -23.755062103271484, -22.473241806030273, -21.191421508789062, -19.90959930419922, -18.627779006958008, -17.345958709716797, -16.064136505126953, -14.782316207885742, -13.500494003295898, -12.218673706054688, -10.93685245513916, -9.655031204223633, -8.373209953308105, -7.091388702392578, -5.809567451477051, -4.527746677398682, -3.2459254264831543, -1.964104175567627, -0.6822834014892578, 0.5995378494262695, 1.8813591003417969, 3.163180351257324, 4.445001602172852, 5.726822376251221, 7.008643627166748, 8.290464401245117, 9.572285652160645, 10.854106903076172, 12.1359281539917, 13.417749404907227, 14.699570655822754, 15.981391906738281, 17.263212203979492, 18.545034408569336, 19.826854705810547, 21.10867691040039, 22.3904972076416, 23.672317504882812, 24.954139709472656, 26.235960006713867, 27.51778221130371, 28.799602508544922, 30.081424713134766, 31.363245010375977, 32.64506530761719, 33.92688751220703, 35.20870590209961, 36.49052810668945, 37.7723503112793, 39.05417251586914, 40.33599090576172, 41.61781311035156, 42.899635314941406]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 0.0, 8.0, 10.0, 7.0, 6.0, 10.0, 9.0, 14.0, 25.0, 29.0, 21.0, 39.0, 35.0, 29.0, 33.0, 45.0, 53.0, 45.0, 39.0, 46.0, 47.0, 32.0, 43.0, 38.0, 36.0, 36.0, 48.0, 27.0, 38.0, 21.0, 27.0, 13.0, 20.0, 15.0, 16.0, 8.0, 13.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9609375, -6.73858642578125, -6.5162353515625, -6.29388427734375, -6.071533203125, -5.84918212890625, -5.6268310546875, -5.40447998046875, -5.18212890625, -4.95977783203125, -4.7374267578125, -4.51507568359375, -4.292724609375, -4.07037353515625, -3.8480224609375, -3.62567138671875, -3.4033203125, -3.18096923828125, -2.9586181640625, -2.73626708984375, -2.513916015625, -2.29156494140625, -2.0692138671875, -1.84686279296875, -1.62451171875, -1.40216064453125, -1.1798095703125, -0.95745849609375, -0.735107421875, -0.51275634765625, -0.2904052734375, -0.06805419921875, 0.154296875, 0.37664794921875, 0.5989990234375, 0.82135009765625, 1.043701171875, 1.26605224609375, 1.4884033203125, 1.71075439453125, 1.93310546875, 2.15545654296875, 2.3778076171875, 2.60015869140625, 2.822509765625, 3.04486083984375, 3.2672119140625, 3.48956298828125, 3.7119140625, 3.93426513671875, 4.1566162109375, 4.37896728515625, 4.601318359375, 4.82366943359375, 5.0460205078125, 5.26837158203125, 5.49072265625, 5.71307373046875, 5.9354248046875, 6.15777587890625, 6.380126953125, 6.60247802734375, 6.8248291015625, 7.04718017578125, 7.26953125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 12.0, 10.0, 22.0, 42.0, 36.0, 74.0, 109.0, 172.0, 292.0, 463.0, 720.0, 1156.0, 1990.0, 3265.0, 5284.0, 8844.0, 15321.0, 26684.0, 47120.0, 85639.0, 162992.0, 283631.0, 185092.0, 95783.0, 52748.0, 29515.0, 16812.0, 9780.0, 5862.0, 3493.0, 2084.0, 1284.0, 825.0, 482.0, 336.0, 188.0, 129.0, 91.0, 56.0, 37.0, 25.0, 15.0, 12.0, 18.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3193359375, -1.280059814453125, -1.24078369140625, -1.201507568359375, -1.1622314453125, -1.122955322265625, -1.08367919921875, -1.044403076171875, -1.005126953125, -0.965850830078125, -0.92657470703125, -0.887298583984375, -0.8480224609375, -0.808746337890625, -0.76947021484375, -0.730194091796875, -0.69091796875, -0.651641845703125, -0.61236572265625, -0.573089599609375, -0.5338134765625, -0.494537353515625, -0.45526123046875, -0.415985107421875, -0.376708984375, -0.337432861328125, -0.29815673828125, -0.258880615234375, -0.2196044921875, -0.180328369140625, -0.14105224609375, -0.101776123046875, -0.0625, -0.023223876953125, 0.01605224609375, 0.055328369140625, 0.0946044921875, 0.133880615234375, 0.17315673828125, 0.212432861328125, 0.251708984375, 0.290985107421875, 0.33026123046875, 0.369537353515625, 0.4088134765625, 0.448089599609375, 0.48736572265625, 0.526641845703125, 0.56591796875, 0.605194091796875, 0.64447021484375, 0.683746337890625, 0.7230224609375, 0.762298583984375, 0.80157470703125, 0.840850830078125, 0.880126953125, 0.919403076171875, 0.95867919921875, 0.997955322265625, 1.0372314453125, 1.076507568359375, 1.11578369140625, 1.155059814453125, 1.1943359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 5.0, 7.0, 12.0, 7.0, 14.0, 13.0, 14.0, 20.0, 19.0, 24.0, 24.0, 29.0, 30.0, 31.0, 28.0, 36.0, 29.0, 25.0, 50.0, 33.0, 1061.0, 56.0, 51.0, 39.0, 41.0, 42.0, 29.0, 27.0, 37.0, 17.0, 24.0, 19.0, 21.0, 19.0, 9.0, 18.0, 16.0, 9.0, 7.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.67169189453125, -3.5465087890625, -3.42132568359375, -3.296142578125, -3.17095947265625, -3.0457763671875, -2.92059326171875, -2.79541015625, -2.67022705078125, -2.5450439453125, -2.41986083984375, -2.294677734375, -2.16949462890625, -2.0443115234375, -1.91912841796875, -1.7939453125, -1.66876220703125, -1.5435791015625, -1.41839599609375, -1.293212890625, -1.16802978515625, -1.0428466796875, -0.91766357421875, -0.79248046875, -0.66729736328125, -0.5421142578125, -0.41693115234375, -0.291748046875, -0.16656494140625, -0.0413818359375, 0.08380126953125, 0.208984375, 0.33416748046875, 0.4593505859375, 0.58453369140625, 0.709716796875, 0.83489990234375, 0.9600830078125, 1.08526611328125, 1.21044921875, 1.33563232421875, 1.4608154296875, 1.58599853515625, 1.711181640625, 1.83636474609375, 1.9615478515625, 2.08673095703125, 2.2119140625, 2.33709716796875, 2.4622802734375, 2.58746337890625, 2.712646484375, 2.83782958984375, 2.9630126953125, 3.08819580078125, 3.21337890625, 3.33856201171875, 3.4637451171875, 3.58892822265625, 3.714111328125, 3.83929443359375, 3.9644775390625, 4.08966064453125, 4.21484375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 12.0, 4.0, 9.0, 21.0, 28.0, 38.0, 56.0, 98.0, 139.0, 210.0, 315.0, 411.0, 636.0, 858.0, 1263.0, 1948.0, 2850.0, 4228.0, 6351.0, 9725.0, 14716.0, 22595.0, 35422.0, 57620.0, 95504.0, 173869.0, 1296970.0, 146503.0, 83497.0, 50449.0, 31439.0, 19929.0, 13267.0, 8578.0, 5797.0, 3756.0, 2492.0, 1715.0, 1206.0, 847.0, 562.0, 373.0, 262.0, 172.0, 136.0, 79.0, 65.0, 37.0, 20.0, 23.0, 18.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.9287109375, -0.9000167846679688, -0.8713226318359375, -0.8426284790039062, -0.813934326171875, -0.7852401733398438, -0.7565460205078125, -0.7278518676757812, -0.69915771484375, -0.6704635620117188, -0.6417694091796875, -0.6130752563476562, -0.584381103515625, -0.5556869506835938, -0.5269927978515625, -0.49829864501953125, -0.4696044921875, -0.44091033935546875, -0.4122161865234375, -0.38352203369140625, -0.354827880859375, -0.32613372802734375, -0.2974395751953125, -0.26874542236328125, -0.24005126953125, -0.21135711669921875, -0.1826629638671875, -0.15396881103515625, -0.125274658203125, -0.09658050537109375, -0.0678863525390625, -0.03919219970703125, -0.010498046875, 0.01819610595703125, 0.0468902587890625, 0.07558441162109375, 0.104278564453125, 0.13297271728515625, 0.1616668701171875, 0.19036102294921875, 0.21905517578125, 0.24774932861328125, 0.2764434814453125, 0.30513763427734375, 0.333831787109375, 0.36252593994140625, 0.3912200927734375, 0.41991424560546875, 0.4486083984375, 0.47730255126953125, 0.5059967041015625, 0.5346908569335938, 0.563385009765625, 0.5920791625976562, 0.6207733154296875, 0.6494674682617188, 0.67816162109375, 0.7068557739257812, 0.7355499267578125, 0.7642440795898438, 0.792938232421875, 0.8216323852539062, 0.8503265380859375, 0.8790206909179688, 0.90771484375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 12.0, 15.0, 20.0, 16.0, 31.0, 41.0, 39.0, 56.0, 67.0, 77.0, 75.0, 78.0, 77.0, 61.0, 56.0, 44.0, 44.0, 25.0, 30.0, 20.0, 19.0, 16.0, 6.0, 10.0, 10.0, 9.0, 6.0, 1.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0007271766662597656, -0.0007058605551719666, -0.0006845444440841675, -0.0006632283329963684, -0.0006419122219085693, -0.0006205961108207703, -0.0005992799997329712, -0.0005779638886451721, -0.000556647777557373, -0.000535331666469574, -0.0005140155553817749, -0.0004926994442939758, -0.00047138333320617676, -0.0004500672221183777, -0.0004287511110305786, -0.00040743499994277954, -0.00038611888885498047, -0.0003648027777671814, -0.0003434866666793823, -0.00032217055559158325, -0.0003008544445037842, -0.0002795383334159851, -0.00025822222232818604, -0.00023690611124038696, -0.0002155900001525879, -0.00019427388906478882, -0.00017295777797698975, -0.00015164166688919067, -0.0001303255558013916, -0.00010900944471359253, -8.769333362579346e-05, -6.637722253799438e-05, -4.506111145019531e-05, -2.374500036239624e-05, -2.428889274597168e-06, 1.8887221813201904e-05, 4.0203332901000977e-05, 6.151944398880005e-05, 8.283555507659912e-05, 0.0001041516661643982, 0.00012546777725219727, 0.00014678388833999634, 0.0001680999994277954, 0.00018941611051559448, 0.00021073222160339355, 0.00023204833269119263, 0.0002533644437789917, 0.00027468055486679077, 0.00029599666595458984, 0.0003173127770423889, 0.000338628888130188, 0.00035994499921798706, 0.00038126111030578613, 0.0004025772213935852, 0.0004238933324813843, 0.00044520944356918335, 0.0004665255546569824, 0.0004878416657447815, 0.0005091577768325806, 0.0005304738879203796, 0.0005517899990081787, 0.0005731061100959778, 0.0005944222211837769, 0.0006157383322715759, 0.000637054443359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 12.0, 11.0, 12.0, 17.0, 19.0, 21.0, 26.0, 35.0, 57.0, 64.0, 91.0, 162.0, 267.0, 784.0, 27787.0, 1016309.0, 1830.0, 431.0, 205.0, 120.0, 83.0, 46.0, 33.0, 32.0, 17.0, 16.0, 8.0, 14.0, 11.0, 4.0, 2.0, 2.0, 3.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01488494873046875, -0.014392971992492676, -0.013900995254516602, -0.013409018516540527, -0.012917041778564453, -0.012425065040588379, -0.011933088302612305, -0.01144111156463623, -0.010949134826660156, -0.010457158088684082, -0.009965181350708008, -0.009473204612731934, -0.00898122787475586, -0.008489251136779785, -0.007997274398803711, -0.007505297660827637, -0.0070133209228515625, -0.006521344184875488, -0.006029367446899414, -0.00553739070892334, -0.005045413970947266, -0.004553437232971191, -0.004061460494995117, -0.003569483757019043, -0.0030775070190429688, -0.0025855302810668945, -0.0020935535430908203, -0.001601576805114746, -0.0011096000671386719, -0.0006176233291625977, -0.00012564659118652344, 0.0003663301467895508, 0.000858306884765625, 0.0013502836227416992, 0.0018422603607177734, 0.0023342370986938477, 0.002826213836669922, 0.003318190574645996, 0.0038101673126220703, 0.0043021440505981445, 0.004794120788574219, 0.005286097526550293, 0.005778074264526367, 0.006270051002502441, 0.006762027740478516, 0.00725400447845459, 0.007745981216430664, 0.008237957954406738, 0.008729934692382812, 0.009221911430358887, 0.009713888168334961, 0.010205864906311035, 0.01069784164428711, 0.011189818382263184, 0.011681795120239258, 0.012173771858215332, 0.012665748596191406, 0.01315772533416748, 0.013649702072143555, 0.014141678810119629, 0.014633655548095703, 0.015125632286071777, 0.015617609024047852, 0.016109585762023926, 0.0166015625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 20.0, 33.0, 74.0, 99.0, 139.0, 186.0, 153.0, 128.0, 75.0, 46.0, 18.0, 17.0, 8.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003211433067917824, -0.00030575686832889915, -0.00029037045896984637, -0.00027498402050696313, -0.00025959761114791036, -0.0002442111726850271, -0.00022882474877405912, -0.0002134383248630911, -0.0001980519009521231, -0.0001826654770411551, -0.0001672790531301871, -0.0001518926292192191, -0.00013650619075633585, -0.00012111977412132546, -0.00010573334293439984, -9.034691902343184e-05, -7.496049511246383e-05, -5.9574071201495826e-05, -4.4187643652549013e-05, -2.88012161036022e-05, -1.3414792192634195e-05, 1.9716317183338106e-06, 1.735806290525943e-05, 3.2744486816227436e-05, 4.813091072719544e-05, 6.351733463816345e-05, 7.890375854913145e-05, 9.429018973605707e-05, 0.00010967661364702508, 0.00012506303028203547, 0.0001404494687449187, 0.0001558358926558867, 0.00017122231656685472, 0.00018660874047782272, 0.00020199516438879073, 0.00021738160285167396, 0.00023276801221072674, 0.00024815445067360997, 0.0002635408891364932, 0.000278927298495546, 0.00029431370785459876, 0.000309700146317482, 0.00032508655567653477, 0.000340472994139418, 0.0003558594034984708, 0.000371245841961354, 0.00038663228042423725, 0.00040201868978329003, 0.00041740512824617326, 0.0004327915667090565, 0.0004481779760681093, 0.0004635644145309925, 0.0004789508238900453, 0.0004943372332490981, 0.0005097236717119813, 0.0005251101101748645, 0.0005404965486377478, 0.000555882987100631, 0.0005712694255635142, 0.0005866558058187366, 0.0006020422442816198, 0.000617428682744503, 0.0006328151212073863, 0.0006482015596702695, 0.0006635879399254918]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 9.0, 14.0, 7.0, 10.0, 14.0, 15.0, 15.0, 20.0, 26.0, 27.0, 27.0, 24.0, 35.0, 24.0, 27.0, 28.0, 38.0, 30.0, 33.0, 32.0, 36.0, 33.0, 44.0, 48.0, 29.0, 41.0, 21.0, 29.0, 24.0, 22.0, 34.0, 22.0, 14.0, 22.0, 14.0, 21.0, 17.0, 19.0, 11.0, 7.0, 3.0, 3.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00028628110885620117, -0.0002773944288492203, -0.0002685077488422394, -0.0002596210688352585, -0.0002507343888282776, -0.0002418477088212967, -0.0002329610288143158, -0.0002240743488073349, -0.000215187668800354, -0.0002063009887933731, -0.0001974143087863922, -0.00018852762877941132, -0.00017964094877243042, -0.00017075426876544952, -0.00016186758875846863, -0.00015298090875148773, -0.00014409422874450684, -0.00013520754873752594, -0.00012632086873054504, -0.00011743418872356415, -0.00010854750871658325, -9.966082870960236e-05, -9.077414870262146e-05, -8.188746869564056e-05, -7.300078868865967e-05, -6.411410868167877e-05, -5.5227428674697876e-05, -4.634074866771698e-05, -3.7454068660736084e-05, -2.8567388653755188e-05, -1.9680708646774292e-05, -1.0794028639793396e-05, -1.9073486328125e-06, 6.979331374168396e-06, 1.5866011381149292e-05, 2.4752691388130188e-05, 3.3639371395111084e-05, 4.252605140209198e-05, 5.1412731409072876e-05, 6.029941141605377e-05, 6.918609142303467e-05, 7.807277143001556e-05, 8.695945143699646e-05, 9.584613144397736e-05, 0.00010473281145095825, 0.00011361949145793915, 0.00012250617146492004, 0.00013139285147190094, 0.00014027953147888184, 0.00014916621148586273, 0.00015805289149284363, 0.00016693957149982452, 0.00017582625150680542, 0.00018471293151378632, 0.0001935996115207672, 0.0002024862915277481, 0.000211372971534729, 0.0002202596515417099, 0.0002291463315486908, 0.0002380330115556717, 0.0002469196915626526, 0.0002558063715696335, 0.0002646930515766144, 0.0002735797315835953, 0.00028246641159057617]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 8.0, 10.0, 7.0, 6.0, 10.0, 9.0, 14.0, 25.0, 29.0, 21.0, 39.0, 35.0, 29.0, 33.0, 45.0, 53.0, 45.0, 39.0, 46.0, 47.0, 32.0, 43.0, 38.0, 36.0, 36.0, 48.0, 27.0, 38.0, 21.0, 27.0, 13.0, 20.0, 15.0, 16.0, 8.0, 13.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9609375, -6.73858642578125, -6.5162353515625, -6.29388427734375, -6.071533203125, -5.84918212890625, -5.6268310546875, -5.40447998046875, -5.18212890625, -4.95977783203125, -4.7374267578125, -4.51507568359375, -4.292724609375, -4.07037353515625, -3.8480224609375, -3.62567138671875, -3.4033203125, -3.18096923828125, -2.9586181640625, -2.73626708984375, -2.513916015625, -2.29156494140625, -2.0692138671875, -1.84686279296875, -1.62451171875, -1.40216064453125, -1.1798095703125, -0.95745849609375, -0.735107421875, -0.51275634765625, -0.2904052734375, -0.06805419921875, 0.154296875, 0.37664794921875, 0.5989990234375, 0.82135009765625, 1.043701171875, 1.26605224609375, 1.4884033203125, 1.71075439453125, 1.93310546875, 2.15545654296875, 2.3778076171875, 2.60015869140625, 2.822509765625, 3.04486083984375, 3.2672119140625, 3.48956298828125, 3.7119140625, 3.93426513671875, 4.1566162109375, 4.37896728515625, 4.601318359375, 4.82366943359375, 5.0460205078125, 5.26837158203125, 5.49072265625, 5.71307373046875, 5.9354248046875, 6.15777587890625, 6.380126953125, 6.60247802734375, 6.8248291015625, 7.04718017578125, 7.26953125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 0.0, 8.0, 10.0, 8.0, 10.0, 19.0, 27.0, 27.0, 50.0, 60.0, 81.0, 143.0, 238.0, 332.0, 682.0, 1499.0, 4242.0, 13220.0, 51743.0, 250789.0, 555620.0, 127779.0, 28861.0, 7977.0, 2707.0, 1118.0, 529.0, 266.0, 162.0, 94.0, 68.0, 44.0, 38.0, 21.0, 23.0, 13.0, 19.0, 6.0, 13.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.5380859375, -6.322265625, -6.1064453125, -5.890625, -5.6748046875, -5.458984375, -5.2431640625, -5.02734375, -4.8115234375, -4.595703125, -4.3798828125, -4.1640625, -3.9482421875, -3.732421875, -3.5166015625, -3.30078125, -3.0849609375, -2.869140625, -2.6533203125, -2.4375, -2.2216796875, -2.005859375, -1.7900390625, -1.57421875, -1.3583984375, -1.142578125, -0.9267578125, -0.7109375, -0.4951171875, -0.279296875, -0.0634765625, 0.15234375, 0.3681640625, 0.583984375, 0.7998046875, 1.015625, 1.2314453125, 1.447265625, 1.6630859375, 1.87890625, 2.0947265625, 2.310546875, 2.5263671875, 2.7421875, 2.9580078125, 3.173828125, 3.3896484375, 3.60546875, 3.8212890625, 4.037109375, 4.2529296875, 4.46875, 4.6845703125, 4.900390625, 5.1162109375, 5.33203125, 5.5478515625, 5.763671875, 5.9794921875, 6.1953125, 6.4111328125, 6.626953125, 6.8427734375, 7.05859375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 11.0, 10.0, 16.0, 21.0, 19.0, 28.0, 40.0, 40.0, 31.0, 37.0, 27.0, 45.0, 59.0, 110.0, 371.0, 1586.0, 111.0, 51.0, 42.0, 46.0, 32.0, 34.0, 39.0, 23.0, 29.0, 23.0, 15.0, 19.0, 21.0, 18.0, 9.0, 7.0, 11.0, 8.0, 5.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.5, -19.819580078125, -19.13916015625, -18.458740234375, -17.7783203125, -17.097900390625, -16.41748046875, -15.737060546875, -15.056640625, -14.376220703125, -13.69580078125, -13.015380859375, -12.3349609375, -11.654541015625, -10.97412109375, -10.293701171875, -9.61328125, -8.932861328125, -8.25244140625, -7.572021484375, -6.8916015625, -6.211181640625, -5.53076171875, -4.850341796875, -4.169921875, -3.489501953125, -2.80908203125, -2.128662109375, -1.4482421875, -0.767822265625, -0.08740234375, 0.593017578125, 1.2734375, 1.953857421875, 2.63427734375, 3.314697265625, 3.9951171875, 4.675537109375, 5.35595703125, 6.036376953125, 6.716796875, 7.397216796875, 8.07763671875, 8.758056640625, 9.4384765625, 10.118896484375, 10.79931640625, 11.479736328125, 12.16015625, 12.840576171875, 13.52099609375, 14.201416015625, 14.8818359375, 15.562255859375, 16.24267578125, 16.923095703125, 17.603515625, 18.283935546875, 18.96435546875, 19.644775390625, 20.3251953125, 21.005615234375, 21.68603515625, 22.366455078125, 23.046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 9.0, 13.0, 19.0, 28.0, 49.0, 58.0, 87.0, 133.0, 260.0, 422.0, 1275.0, 94034.0, 3046052.0, 2007.0, 512.0, 263.0, 179.0, 97.0, 63.0, 43.0, 28.0, 18.0, 11.0, 12.0, 6.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.3125, -76.5888671875, -73.865234375, -71.1416015625, -68.41796875, -65.6943359375, -62.970703125, -60.2470703125, -57.5234375, -54.7998046875, -52.076171875, -49.3525390625, -46.62890625, -43.9052734375, -41.181640625, -38.4580078125, -35.734375, -33.0107421875, -30.287109375, -27.5634765625, -24.83984375, -22.1162109375, -19.392578125, -16.6689453125, -13.9453125, -11.2216796875, -8.498046875, -5.7744140625, -3.05078125, -0.3271484375, 2.396484375, 5.1201171875, 7.84375, 10.5673828125, 13.291015625, 16.0146484375, 18.73828125, 21.4619140625, 24.185546875, 26.9091796875, 29.6328125, 32.3564453125, 35.080078125, 37.8037109375, 40.52734375, 43.2509765625, 45.974609375, 48.6982421875, 51.421875, 54.1455078125, 56.869140625, 59.5927734375, 62.31640625, 65.0400390625, 67.763671875, 70.4873046875, 73.2109375, 75.9345703125, 78.658203125, 81.3818359375, 84.10546875, 86.8291015625, 89.552734375, 92.2763671875, 95.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1010.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.07209396362305, -45.55060958862305, -33.02912139892578, -20.50763702392578, -7.986152648925781, 4.535331726074219, 17.056819915771484, 29.578304290771484, 42.099788665771484, 54.621273040771484, 67.14276123046875, 79.66424560546875, 92.18572998046875, 104.70721435546875, 117.22869873046875, 129.75018310546875, 142.27166748046875, 154.79315185546875, 167.31463623046875, 179.83612060546875, 192.35760498046875, 204.87908935546875, 217.40057373046875, 229.92205810546875, 242.4435577392578, 254.9650421142578, 267.4865417480469, 280.0080261230469, 292.5295104980469, 305.0509948730469, 317.5724792480469, 330.0939636230469, 342.6154479980469, 355.1369323730469, 367.6584167480469, 380.1799011230469, 392.7013854980469, 405.2228698730469, 417.7443542480469, 430.2658386230469, 442.7873229980469, 455.3088073730469, 467.8302917480469, 480.3517761230469, 492.8732604980469, 505.3947448730469, 517.916259765625, 530.437744140625, 542.959228515625, 555.480712890625, 568.002197265625, 580.523681640625, 593.045166015625, 605.566650390625, 618.088134765625, 630.609619140625, 643.131103515625, 655.652587890625, 668.174072265625, 680.695556640625, 693.217041015625, 705.738525390625, 718.260009765625, 730.781494140625, 743.302978515625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 9.0, 12.0, 17.0, 18.0, 15.0, 26.0, 23.0, 24.0, 33.0, 31.0, 25.0, 34.0, 40.0, 37.0, 30.0, 39.0, 39.0, 40.0, 43.0, 41.0, 44.0, 33.0, 29.0, 50.0, 34.0, 21.0, 23.0, 26.0, 22.0, 19.0, 19.0, 14.0, 8.0, 9.0, 17.0, 4.0, 3.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-65.43413543701172, -63.51478576660156, -61.59543991088867, -59.676090240478516, -57.756744384765625, -55.83739471435547, -53.91804504394531, -51.99869918823242, -50.07935333251953, -48.160003662109375, -46.240657806396484, -44.32130813598633, -42.40196228027344, -40.48261260986328, -38.563262939453125, -36.643917083740234, -34.72456741333008, -32.80521774291992, -30.88587188720703, -28.966522216796875, -27.047176361083984, -25.127826690673828, -23.208478927612305, -21.28913116455078, -19.369783401489258, -17.450435638427734, -15.531087875366211, -13.611739158630371, -11.692391395568848, -9.773043632507324, -7.853694915771484, -5.934347152709961, -4.0149993896484375, -2.095651388168335, -0.17630338668823242, 1.7430448532104492, 3.6623926162719727, 5.581740379333496, 7.501089096069336, 9.42043685913086, 11.339784622192383, 13.259132385253906, 15.17848014831543, 17.097827911376953, 19.01717758178711, 20.9365234375, 22.855873107910156, 24.77522087097168, 26.694568634033203, 28.613916397094727, 30.53326416015625, 32.452613830566406, 34.3719596862793, 36.29130935668945, 38.210655212402344, 40.1300048828125, 42.049354553222656, 43.96870422363281, 45.8880500793457, 47.80739974975586, 49.72674560546875, 51.646095275878906, 53.56544494628906, 55.48479080200195, 57.404136657714844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 9.0, 4.0, 7.0, 8.0, 16.0, 18.0, 21.0, 28.0, 30.0, 21.0, 45.0, 34.0, 39.0, 50.0, 42.0, 46.0, 54.0, 44.0, 42.0, 40.0, 39.0, 35.0, 37.0, 34.0, 37.0, 38.0, 35.0, 18.0, 20.0, 15.0, 19.0, 13.0, 15.0, 15.0, 7.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.72265625, -6.48919677734375, -6.2557373046875, -6.02227783203125, -5.788818359375, -5.55535888671875, -5.3218994140625, -5.08843994140625, -4.85498046875, -4.62152099609375, -4.3880615234375, -4.15460205078125, -3.921142578125, -3.68768310546875, -3.4542236328125, -3.22076416015625, -2.9873046875, -2.75384521484375, -2.5203857421875, -2.28692626953125, -2.053466796875, -1.82000732421875, -1.5865478515625, -1.35308837890625, -1.11962890625, -0.88616943359375, -0.6527099609375, -0.41925048828125, -0.185791015625, 0.04766845703125, 0.2811279296875, 0.51458740234375, 0.748046875, 0.98150634765625, 1.2149658203125, 1.44842529296875, 1.681884765625, 1.91534423828125, 2.1488037109375, 2.38226318359375, 2.61572265625, 2.84918212890625, 3.0826416015625, 3.31610107421875, 3.549560546875, 3.78302001953125, 4.0164794921875, 4.24993896484375, 4.4833984375, 4.71685791015625, 4.9503173828125, 5.18377685546875, 5.417236328125, 5.65069580078125, 5.8841552734375, 6.11761474609375, 6.35107421875, 6.58453369140625, 6.8179931640625, 7.05145263671875, 7.284912109375, 7.51837158203125, 7.7518310546875, 7.98529052734375, 8.21875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 0.0, 13.0, 10.0, 19.0, 18.0, 21.0, 32.0, 34.0, 37.0, 48.0, 60.0, 70.0, 136.0, 140.0, 246.0, 425.0, 1276.0, 6121.0, 110931.0, 2250592.0, 1753481.0, 63394.0, 4861.0, 1052.0, 391.0, 226.0, 151.0, 92.0, 72.0, 51.0, 46.0, 40.0, 40.0, 34.0, 34.0, 14.0, 12.0, 14.0, 10.0, 11.0, 6.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.1875, -15.60791015625, -15.0283203125, -14.44873046875, -13.869140625, -13.28955078125, -12.7099609375, -12.13037109375, -11.55078125, -10.97119140625, -10.3916015625, -9.81201171875, -9.232421875, -8.65283203125, -8.0732421875, -7.49365234375, -6.9140625, -6.33447265625, -5.7548828125, -5.17529296875, -4.595703125, -4.01611328125, -3.4365234375, -2.85693359375, -2.27734375, -1.69775390625, -1.1181640625, -0.53857421875, 0.041015625, 0.62060546875, 1.2001953125, 1.77978515625, 2.359375, 2.93896484375, 3.5185546875, 4.09814453125, 4.677734375, 5.25732421875, 5.8369140625, 6.41650390625, 6.99609375, 7.57568359375, 8.1552734375, 8.73486328125, 9.314453125, 9.89404296875, 10.4736328125, 11.05322265625, 11.6328125, 12.21240234375, 12.7919921875, 13.37158203125, 13.951171875, 14.53076171875, 15.1103515625, 15.68994140625, 16.26953125, 16.84912109375, 17.4287109375, 18.00830078125, 18.587890625, 19.16748046875, 19.7470703125, 20.32666015625, 20.90625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 13.0, 16.0, 14.0, 8.0, 21.0, 27.0, 38.0, 52.0, 69.0, 75.0, 97.0, 145.0, 192.0, 259.0, 335.0, 417.0, 428.0, 431.0, 343.0, 241.0, 219.0, 129.0, 110.0, 93.0, 79.0, 56.0, 37.0, 18.0, 24.0, 18.0, 16.0, 9.0, 8.0, 8.0, 6.0, 4.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.087158203125, -9.72119140625, -9.355224609375, -8.9892578125, -8.623291015625, -8.25732421875, -7.891357421875, -7.525390625, -7.159423828125, -6.79345703125, -6.427490234375, -6.0615234375, -5.695556640625, -5.32958984375, -4.963623046875, -4.59765625, -4.231689453125, -3.86572265625, -3.499755859375, -3.1337890625, -2.767822265625, -2.40185546875, -2.035888671875, -1.669921875, -1.303955078125, -0.93798828125, -0.572021484375, -0.2060546875, 0.159912109375, 0.52587890625, 0.891845703125, 1.2578125, 1.623779296875, 1.98974609375, 2.355712890625, 2.7216796875, 3.087646484375, 3.45361328125, 3.819580078125, 4.185546875, 4.551513671875, 4.91748046875, 5.283447265625, 5.6494140625, 6.015380859375, 6.38134765625, 6.747314453125, 7.11328125, 7.479248046875, 7.84521484375, 8.211181640625, 8.5771484375, 8.943115234375, 9.30908203125, 9.675048828125, 10.041015625, 10.406982421875, 10.77294921875, 11.138916015625, 11.5048828125, 11.870849609375, 12.23681640625, 12.602783203125, 12.96875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 7.0, 7.0, 10.0, 7.0, 13.0, 19.0, 14.0, 23.0, 26.0, 42.0, 50.0, 61.0, 97.0, 89.0, 121.0, 154.0, 177.0, 235.0, 367.0, 582.0, 3389.0, 3810469.0, 375065.0, 1336.0, 536.0, 336.0, 219.0, 165.0, 134.0, 104.0, 72.0, 78.0, 59.0, 45.0, 39.0, 36.0, 26.0, 18.0, 23.0, 10.0, 7.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.875, -61.8037109375, -59.732421875, -57.6611328125, -55.58984375, -53.5185546875, -51.447265625, -49.3759765625, -47.3046875, -45.2333984375, -43.162109375, -41.0908203125, -39.01953125, -36.9482421875, -34.876953125, -32.8056640625, -30.734375, -28.6630859375, -26.591796875, -24.5205078125, -22.44921875, -20.3779296875, -18.306640625, -16.2353515625, -14.1640625, -12.0927734375, -10.021484375, -7.9501953125, -5.87890625, -3.8076171875, -1.736328125, 0.3349609375, 2.40625, 4.4775390625, 6.548828125, 8.6201171875, 10.69140625, 12.7626953125, 14.833984375, 16.9052734375, 18.9765625, 21.0478515625, 23.119140625, 25.1904296875, 27.26171875, 29.3330078125, 31.404296875, 33.4755859375, 35.546875, 37.6181640625, 39.689453125, 41.7607421875, 43.83203125, 45.9033203125, 47.974609375, 50.0458984375, 52.1171875, 54.1884765625, 56.259765625, 58.3310546875, 60.40234375, 62.4736328125, 64.544921875, 66.6162109375, 68.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 62.0, 550.0, 379.0, 22.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.54374694824219, -113.67644500732422, -104.80913543701172, -95.94183349609375, -87.07452392578125, -78.20722198486328, -69.33992004394531, -60.47261428833008, -51.605308532714844, -42.73800277709961, -33.870697021484375, -25.003395080566406, -16.136089324951172, -7.2687835693359375, 1.5985183715820312, 10.465824127197266, 19.3331298828125, 28.200435638427734, 37.06774139404297, 45.93504333496094, 54.80234909057617, 63.669654846191406, 72.53695678710938, 81.40426635742188, 90.27156829833984, 99.13887023925781, 108.00617980957031, 116.87348175048828, 125.74078369140625, 134.60809326171875, 143.47540283203125, 152.3426971435547, 161.21002197265625, 170.07733154296875, 178.9446258544922, 187.8119354248047, 196.6792449951172, 205.54653930664062, 214.41384887695312, 223.28115844726562, 232.14846801757812, 241.01577758789062, 249.88307189941406, 258.7503662109375, 267.61767578125, 276.4849853515625, 285.352294921875, 294.2196044921875, 303.0869140625, 311.9542236328125, 320.821533203125, 329.6888427734375, 338.5561218261719, 347.4234313964844, 356.2907409667969, 365.1580505371094, 374.02532958984375, 382.89263916015625, 391.75994873046875, 400.62725830078125, 409.4945373535156, 418.3618469238281, 427.2291564941406, 436.0964660644531, 444.9637756347656]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 9.0, 16.0, 11.0, 16.0, 12.0, 26.0, 21.0, 32.0, 39.0, 35.0, 36.0, 45.0, 32.0, 38.0, 40.0, 38.0, 58.0, 48.0, 56.0, 44.0, 38.0, 29.0, 35.0, 32.0, 33.0, 31.0, 17.0, 29.0, 20.0, 10.0, 9.0, 9.0, 10.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.27734375, -44.82401657104492, -43.370689392089844, -41.917362213134766, -40.46403503417969, -39.010711669921875, -37.5573844909668, -36.10405731201172, -34.65073013305664, -33.19740295410156, -31.744075775146484, -30.29075050354004, -28.83742332458496, -27.384096145629883, -25.930770874023438, -24.47744369506836, -23.02411651611328, -21.570789337158203, -20.117462158203125, -18.66413688659668, -17.2108097076416, -15.757482528686523, -14.304156303405762, -12.850830078125, -11.397502899169922, -9.944175720214844, -8.490849494934082, -7.037522792816162, -5.584196090698242, -4.130869388580322, -2.6775426864624023, -1.2242164611816406, 0.2291107177734375, 1.6824374198913574, 3.1357641220092773, 4.589090824127197, 6.042417526245117, 7.495744228363037, 8.949070930480957, 10.402397155761719, 11.855724334716797, 13.309051513671875, 14.762377738952637, 16.2157039642334, 17.669031143188477, 19.122358322143555, 20.57568359375, 22.029010772705078, 23.482337951660156, 24.935665130615234, 26.388992309570312, 27.842317581176758, 29.295644760131836, 30.748971939086914, 32.20229721069336, 33.65562438964844, 35.108951568603516, 36.562278747558594, 38.01560592651367, 39.46893310546875, 40.92225646972656, 42.37558364868164, 43.82891082763672, 45.2822380065918, 46.735565185546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 8.0, 16.0, 11.0, 17.0, 25.0, 28.0, 32.0, 40.0, 22.0, 34.0, 34.0, 40.0, 36.0, 49.0, 30.0, 51.0, 47.0, 48.0, 42.0, 43.0, 34.0, 33.0, 34.0, 36.0, 28.0, 23.0, 23.0, 27.0, 18.0, 17.0, 9.0, 16.0, 15.0, 8.0, 7.0, 2.0, 5.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.2955322265625, -6.075439453125, -5.8553466796875, -5.63525390625, -5.4151611328125, -5.195068359375, -4.9749755859375, -4.7548828125, -4.5347900390625, -4.314697265625, -4.0946044921875, -3.87451171875, -3.6544189453125, -3.434326171875, -3.2142333984375, -2.994140625, -2.7740478515625, -2.553955078125, -2.3338623046875, -2.11376953125, -1.8936767578125, -1.673583984375, -1.4534912109375, -1.2333984375, -1.0133056640625, -0.793212890625, -0.5731201171875, -0.35302734375, -0.1329345703125, 0.087158203125, 0.3072509765625, 0.52734375, 0.7474365234375, 0.967529296875, 1.1876220703125, 1.40771484375, 1.6278076171875, 1.847900390625, 2.0679931640625, 2.2880859375, 2.5081787109375, 2.728271484375, 2.9483642578125, 3.16845703125, 3.3885498046875, 3.608642578125, 3.8287353515625, 4.048828125, 4.2689208984375, 4.489013671875, 4.7091064453125, 4.92919921875, 5.1492919921875, 5.369384765625, 5.5894775390625, 5.8095703125, 6.0296630859375, 6.249755859375, 6.4698486328125, 6.68994140625, 6.9100341796875, 7.130126953125, 7.3502197265625, 7.5703125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 24.0, 30.0, 33.0, 76.0, 90.0, 157.0, 233.0, 338.0, 539.0, 821.0, 1303.0, 2094.0, 3360.0, 5206.0, 8046.0, 13163.0, 20698.0, 34112.0, 57358.0, 101977.0, 196468.0, 267024.0, 141850.0, 77084.0, 44286.0, 26736.0, 16659.0, 10733.0, 6523.0, 4103.0, 2656.0, 1748.0, 1058.0, 701.0, 490.0, 277.0, 179.0, 117.0, 55.0, 48.0, 37.0, 16.0, 15.0, 12.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.17578125, -1.1414642333984375, -1.107147216796875, -1.0728302001953125, -1.03851318359375, -1.0041961669921875, -0.969879150390625, -0.9355621337890625, -0.9012451171875, -0.8669281005859375, -0.832611083984375, -0.7982940673828125, -0.76397705078125, -0.7296600341796875, -0.695343017578125, -0.6610260009765625, -0.626708984375, -0.5923919677734375, -0.558074951171875, -0.5237579345703125, -0.48944091796875, -0.4551239013671875, -0.420806884765625, -0.3864898681640625, -0.3521728515625, -0.3178558349609375, -0.283538818359375, -0.2492218017578125, -0.21490478515625, -0.1805877685546875, -0.146270751953125, -0.1119537353515625, -0.07763671875, -0.0433197021484375, -0.009002685546875, 0.0253143310546875, 0.05963134765625, 0.0939483642578125, 0.128265380859375, 0.1625823974609375, 0.1968994140625, 0.2312164306640625, 0.265533447265625, 0.2998504638671875, 0.33416748046875, 0.3684844970703125, 0.402801513671875, 0.4371185302734375, 0.471435546875, 0.5057525634765625, 0.540069580078125, 0.5743865966796875, 0.60870361328125, 0.6430206298828125, 0.677337646484375, 0.7116546630859375, 0.7459716796875, 0.7802886962890625, 0.814605712890625, 0.8489227294921875, 0.88323974609375, 0.9175567626953125, 0.951873779296875, 0.9861907958984375, 1.0205078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 3.0, 7.0, 13.0, 13.0, 9.0, 12.0, 21.0, 12.0, 23.0, 16.0, 24.0, 32.0, 18.0, 32.0, 38.0, 44.0, 35.0, 38.0, 37.0, 37.0, 1048.0, 30.0, 51.0, 29.0, 48.0, 43.0, 29.0, 34.0, 30.0, 28.0, 24.0, 22.0, 17.0, 10.0, 20.0, 13.0, 16.0, 12.0, 6.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.68359375, -3.56640625, -3.44921875, -3.33203125, -3.21484375, -3.09765625, -2.98046875, -2.86328125, -2.74609375, -2.62890625, -2.51171875, -2.39453125, -2.27734375, -2.16015625, -2.04296875, -1.92578125, -1.80859375, -1.69140625, -1.57421875, -1.45703125, -1.33984375, -1.22265625, -1.10546875, -0.98828125, -0.87109375, -0.75390625, -0.63671875, -0.51953125, -0.40234375, -0.28515625, -0.16796875, -0.05078125, 0.06640625, 0.18359375, 0.30078125, 0.41796875, 0.53515625, 0.65234375, 0.76953125, 0.88671875, 1.00390625, 1.12109375, 1.23828125, 1.35546875, 1.47265625, 1.58984375, 1.70703125, 1.82421875, 1.94140625, 2.05859375, 2.17578125, 2.29296875, 2.41015625, 2.52734375, 2.64453125, 2.76171875, 2.87890625, 2.99609375, 3.11328125, 3.23046875, 3.34765625, 3.46484375, 3.58203125, 3.69921875, 3.81640625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 13.0, 16.0, 21.0, 23.0, 47.0, 70.0, 105.0, 142.0, 218.0, 322.0, 465.0, 670.0, 951.0, 1319.0, 1787.0, 2746.0, 4008.0, 5913.0, 8744.0, 13147.0, 20511.0, 32149.0, 51895.0, 85973.0, 148626.0, 1289126.0, 169847.0, 96840.0, 58146.0, 36081.0, 22562.0, 14548.0, 9400.0, 6615.0, 4325.0, 2935.0, 2102.0, 1411.0, 1005.0, 724.0, 489.0, 356.0, 246.0, 151.0, 116.0, 70.0, 48.0, 40.0, 29.0, 15.0, 8.0, 7.0, 7.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.90478515625, -0.877044677734375, -0.84930419921875, -0.821563720703125, -0.7938232421875, -0.766082763671875, -0.73834228515625, -0.710601806640625, -0.682861328125, -0.655120849609375, -0.62738037109375, -0.599639892578125, -0.5718994140625, -0.544158935546875, -0.51641845703125, -0.488677978515625, -0.4609375, -0.433197021484375, -0.40545654296875, -0.377716064453125, -0.3499755859375, -0.322235107421875, -0.29449462890625, -0.266754150390625, -0.239013671875, -0.211273193359375, -0.18353271484375, -0.155792236328125, -0.1280517578125, -0.100311279296875, -0.07257080078125, -0.044830322265625, -0.01708984375, 0.010650634765625, 0.03839111328125, 0.066131591796875, 0.0938720703125, 0.121612548828125, 0.14935302734375, 0.177093505859375, 0.204833984375, 0.232574462890625, 0.26031494140625, 0.288055419921875, 0.3157958984375, 0.343536376953125, 0.37127685546875, 0.399017333984375, 0.4267578125, 0.454498291015625, 0.48223876953125, 0.509979248046875, 0.5377197265625, 0.565460205078125, 0.59320068359375, 0.620941162109375, 0.648681640625, 0.676422119140625, 0.70416259765625, 0.731903076171875, 0.7596435546875, 0.787384033203125, 0.81512451171875, 0.842864990234375, 0.87060546875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 13.0, 19.0, 27.0, 38.0, 45.0, 72.0, 76.0, 104.0, 124.0, 101.0, 91.0, 77.0, 49.0, 42.0, 30.0, 16.0, 26.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009589195251464844, -0.0009312108159065247, -0.0009035021066665649, -0.0008757933974266052, -0.0008480846881866455, -0.0008203759789466858, -0.0007926672697067261, -0.0007649585604667664, -0.0007372498512268066, -0.0007095411419868469, -0.0006818324327468872, -0.0006541237235069275, -0.0006264150142669678, -0.0005987063050270081, -0.0005709975957870483, -0.0005432888865470886, -0.0005155801773071289, -0.0004878714680671692, -0.00046016275882720947, -0.00043245404958724976, -0.00040474534034729004, -0.0003770366311073303, -0.0003493279218673706, -0.0003216192126274109, -0.00029391050338745117, -0.00026620179414749146, -0.00023849308490753174, -0.00021078437566757202, -0.0001830756664276123, -0.0001553669571876526, -0.00012765824794769287, -9.994953870773315e-05, -7.224082946777344e-05, -4.453212022781372e-05, -1.6823410987854004e-05, 1.0885298252105713e-05, 3.859400749206543e-05, 6.630271673202515e-05, 9.401142597198486e-05, 0.00012172013521194458, 0.0001494288444519043, 0.00017713755369186401, 0.00020484626293182373, 0.00023255497217178345, 0.00026026368141174316, 0.0002879723906517029, 0.0003156810998916626, 0.0003433898091316223, 0.00037109851837158203, 0.00039880722761154175, 0.00042651593685150146, 0.0004542246460914612, 0.0004819333553314209, 0.0005096420645713806, 0.0005373507738113403, 0.0005650594830513, 0.0005927681922912598, 0.0006204769015312195, 0.0006481856107711792, 0.0006758943200111389, 0.0007036030292510986, 0.0007313117384910583, 0.0007590204477310181, 0.0007867291569709778, 0.0008144378662109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 10.0, 7.0, 15.0, 14.0, 18.0, 38.0, 54.0, 85.0, 136.0, 224.0, 812.0, 788461.0, 257434.0, 661.0, 223.0, 120.0, 64.0, 52.0, 29.0, 26.0, 21.0, 12.0, 8.0, 5.0, 9.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019439697265625, -0.018790721893310547, -0.018141746520996094, -0.01749277114868164, -0.016843795776367188, -0.016194820404052734, -0.015545845031738281, -0.014896869659423828, -0.014247894287109375, -0.013598918914794922, -0.012949943542480469, -0.012300968170166016, -0.011651992797851562, -0.01100301742553711, -0.010354042053222656, -0.009705066680908203, -0.00905609130859375, -0.008407115936279297, -0.007758140563964844, -0.007109165191650391, -0.0064601898193359375, -0.005811214447021484, -0.005162239074707031, -0.004513263702392578, -0.003864288330078125, -0.003215312957763672, -0.0025663375854492188, -0.0019173622131347656, -0.0012683868408203125, -0.0006194114685058594, 2.956390380859375e-05, 0.0006785392761230469, 0.0013275146484375, 0.001976490020751953, 0.0026254653930664062, 0.0032744407653808594, 0.0039234161376953125, 0.004572391510009766, 0.005221366882324219, 0.005870342254638672, 0.006519317626953125, 0.007168292999267578, 0.007817268371582031, 0.008466243743896484, 0.009115219116210938, 0.00976419448852539, 0.010413169860839844, 0.011062145233154297, 0.01171112060546875, 0.012360095977783203, 0.013009071350097656, 0.01365804672241211, 0.014307022094726562, 0.014955997467041016, 0.015604972839355469, 0.016253948211669922, 0.016902923583984375, 0.017551898956298828, 0.01820087432861328, 0.018849849700927734, 0.019498825073242188, 0.02014780044555664, 0.020796775817871094, 0.021445751190185547, 0.0220947265625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 295.0, 711.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005777199403382838, -0.00046610942808911204, -0.0003544989158399403, -0.00024288837448693812, -0.00013127786223776639, -1.9667320884764194e-05, 9.194319136440754e-05, 0.00020355370361357927, 0.000315164215862751, 0.00042677472811192274, 0.0005383852403610945, 0.0006499957526102662, 0.0007616062648594379, 0.0008732168353162706, 0.0009848272893577814, 0.001096437918022275, 0.0012080483138561249, 0.0013196588261052966, 0.0014312693383544683, 0.00154287985060364, 0.0016544903628528118, 0.0017661009915173054, 0.0018777113873511553, 0.001989322016015649, 0.0021009324118494987, 0.0022125430405139923, 0.002324153436347842, 0.0024357640650123358, 0.0025473744608461857, 0.0026589850895106792, 0.002770595485344529, 0.0028822061140090227, 0.0029938167426735163, 0.00310542737133801, 0.0032170377671718597, 0.0033286483958363533, 0.003440258791670203, 0.0035518694203346968, 0.0036634798161685467, 0.0037750904448330402, 0.00388670084066689, 0.00399831123650074, 0.004109921865165234, 0.004221532493829727, 0.004333143122494221, 0.004444753285497427, 0.0045563639141619205, 0.004667974542826414, 0.004779585171490908, 0.004891195800155401, 0.005002806428819895, 0.005114416591823101, 0.005226027220487595, 0.005337637849152088, 0.005449248477816582, 0.005560858640819788, 0.0056724692694842815, 0.005784079898148775, 0.005895690526813269, 0.006007300689816475, 0.0061189113184809685, 0.006230521947145462, 0.006342132575809956, 0.006453742738813162, 0.006565353367477655]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 11.0, 10.0, 11.0, 16.0, 19.0, 19.0, 20.0, 10.0, 25.0, 28.0, 27.0, 35.0, 32.0, 33.0, 24.0, 34.0, 53.0, 38.0, 40.0, 42.0, 43.0, 37.0, 47.0, 35.0, 34.0, 33.0, 30.0, 28.0, 24.0, 18.0, 20.0, 15.0, 14.0, 11.0, 15.0, 10.0, 17.0, 6.0, 6.0, 3.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026416778564453125, -0.0002552289515733719, -0.0002462901175022125, -0.00023735128343105316, -0.0002284124493598938, -0.00021947361528873444, -0.00021053478121757507, -0.0002015959471464157, -0.00019265711307525635, -0.00018371827900409698, -0.00017477944493293762, -0.00016584061086177826, -0.0001569017767906189, -0.00014796294271945953, -0.00013902410864830017, -0.0001300852745771408, -0.00012114644050598145, -0.00011220760643482208, -0.00010326877236366272, -9.432993829250336e-05, -8.5391104221344e-05, -7.645227015018463e-05, -6.751343607902527e-05, -5.8574602007865906e-05, -4.963576793670654e-05, -4.069693386554718e-05, -3.175809979438782e-05, -2.2819265723228455e-05, -1.3880431652069092e-05, -4.941597580909729e-06, 3.997236490249634e-06, 1.2936070561408997e-05, 2.187490463256836e-05, 3.081373870372772e-05, 3.9752572774887085e-05, 4.869140684604645e-05, 5.763024091720581e-05, 6.656907498836517e-05, 7.550790905952454e-05, 8.44467431306839e-05, 9.338557720184326e-05, 0.00010232441127300262, 0.00011126324534416199, 0.00012020207941532135, 0.0001291409134864807, 0.00013807974755764008, 0.00014701858162879944, 0.0001559574156999588, 0.00016489624977111816, 0.00017383508384227753, 0.0001827739179134369, 0.00019171275198459625, 0.00020065158605575562, 0.00020959042012691498, 0.00021852925419807434, 0.0002274680882692337, 0.00023640692234039307, 0.00024534575641155243, 0.0002542845904827118, 0.00026322342455387115, 0.0002721622586250305, 0.0002811010926961899, 0.00029003992676734924, 0.0002989787608385086, 0.00030791759490966797]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 8.0, 16.0, 11.0, 17.0, 25.0, 28.0, 32.0, 40.0, 22.0, 34.0, 34.0, 40.0, 36.0, 49.0, 30.0, 51.0, 47.0, 48.0, 42.0, 43.0, 34.0, 33.0, 34.0, 36.0, 28.0, 23.0, 23.0, 27.0, 18.0, 17.0, 9.0, 16.0, 15.0, 8.0, 7.0, 2.0, 5.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.2955322265625, -6.075439453125, -5.8553466796875, -5.63525390625, -5.4151611328125, -5.195068359375, -4.9749755859375, -4.7548828125, -4.5347900390625, -4.314697265625, -4.0946044921875, -3.87451171875, -3.6544189453125, -3.434326171875, -3.2142333984375, -2.994140625, -2.7740478515625, -2.553955078125, -2.3338623046875, -2.11376953125, -1.8936767578125, -1.673583984375, -1.4534912109375, -1.2333984375, -1.0133056640625, -0.793212890625, -0.5731201171875, -0.35302734375, -0.1329345703125, 0.087158203125, 0.3072509765625, 0.52734375, 0.7474365234375, 0.967529296875, 1.1876220703125, 1.40771484375, 1.6278076171875, 1.847900390625, 2.0679931640625, 2.2880859375, 2.5081787109375, 2.728271484375, 2.9483642578125, 3.16845703125, 3.3885498046875, 3.608642578125, 3.8287353515625, 4.048828125, 4.2689208984375, 4.489013671875, 4.7091064453125, 4.92919921875, 5.1492919921875, 5.369384765625, 5.5894775390625, 5.8095703125, 6.0296630859375, 6.249755859375, 6.4698486328125, 6.68994140625, 6.9100341796875, 7.130126953125, 7.3502197265625, 7.5703125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 10.0, 6.0, 14.0, 11.0, 14.0, 26.0, 36.0, 44.0, 69.0, 138.0, 243.0, 410.0, 855.0, 1628.0, 3221.0, 6738.0, 14392.0, 32769.0, 82577.0, 225869.0, 405137.0, 165105.0, 61806.0, 25324.0, 11166.0, 5352.0, 2615.0, 1345.0, 681.0, 389.0, 210.0, 118.0, 57.0, 52.0, 32.0, 12.0, 18.0, 14.0, 9.0, 11.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.955078125, -3.8203125, -3.685546875, -3.55078125, -3.416015625, -3.28125, -3.146484375, -3.01171875, -2.876953125, -2.7421875, -2.607421875, -2.47265625, -2.337890625, -2.203125, -2.068359375, -1.93359375, -1.798828125, -1.6640625, -1.529296875, -1.39453125, -1.259765625, -1.125, -0.990234375, -0.85546875, -0.720703125, -0.5859375, -0.451171875, -0.31640625, -0.181640625, -0.046875, 0.087890625, 0.22265625, 0.357421875, 0.4921875, 0.626953125, 0.76171875, 0.896484375, 1.03125, 1.166015625, 1.30078125, 1.435546875, 1.5703125, 1.705078125, 1.83984375, 1.974609375, 2.109375, 2.244140625, 2.37890625, 2.513671875, 2.6484375, 2.783203125, 2.91796875, 3.052734375, 3.1875, 3.322265625, 3.45703125, 3.591796875, 3.7265625, 3.861328125, 3.99609375, 4.130859375, 4.265625, 4.400390625, 4.53515625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 7.0, 8.0, 7.0, 11.0, 10.0, 13.0, 21.0, 15.0, 17.0, 25.0, 31.0, 31.0, 42.0, 39.0, 50.0, 54.0, 87.0, 179.0, 1693.0, 186.0, 85.0, 58.0, 41.0, 38.0, 33.0, 33.0, 33.0, 29.0, 31.0, 20.0, 25.0, 10.0, 19.0, 10.0, 6.0, 4.0, 8.0, 8.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-21.3125, -20.634765625, -19.95703125, -19.279296875, -18.6015625, -17.923828125, -17.24609375, -16.568359375, -15.890625, -15.212890625, -14.53515625, -13.857421875, -13.1796875, -12.501953125, -11.82421875, -11.146484375, -10.46875, -9.791015625, -9.11328125, -8.435546875, -7.7578125, -7.080078125, -6.40234375, -5.724609375, -5.046875, -4.369140625, -3.69140625, -3.013671875, -2.3359375, -1.658203125, -0.98046875, -0.302734375, 0.375, 1.052734375, 1.73046875, 2.408203125, 3.0859375, 3.763671875, 4.44140625, 5.119140625, 5.796875, 6.474609375, 7.15234375, 7.830078125, 8.5078125, 9.185546875, 9.86328125, 10.541015625, 11.21875, 11.896484375, 12.57421875, 13.251953125, 13.9296875, 14.607421875, 15.28515625, 15.962890625, 16.640625, 17.318359375, 17.99609375, 18.673828125, 19.3515625, 20.029296875, 20.70703125, 21.384765625, 22.0625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 10.0, 12.0, 9.0, 9.0, 24.0, 21.0, 24.0, 32.0, 49.0, 61.0, 71.0, 105.0, 110.0, 139.0, 205.0, 332.0, 601.0, 2288.0, 419133.0, 2717268.0, 3339.0, 652.0, 296.0, 221.0, 148.0, 135.0, 73.0, 70.0, 54.0, 39.0, 40.0, 25.0, 19.0, 13.0, 11.0, 10.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-53.53125, -51.9130859375, -50.294921875, -48.6767578125, -47.05859375, -45.4404296875, -43.822265625, -42.2041015625, -40.5859375, -38.9677734375, -37.349609375, -35.7314453125, -34.11328125, -32.4951171875, -30.876953125, -29.2587890625, -27.640625, -26.0224609375, -24.404296875, -22.7861328125, -21.16796875, -19.5498046875, -17.931640625, -16.3134765625, -14.6953125, -13.0771484375, -11.458984375, -9.8408203125, -8.22265625, -6.6044921875, -4.986328125, -3.3681640625, -1.75, -0.1318359375, 1.486328125, 3.1044921875, 4.72265625, 6.3408203125, 7.958984375, 9.5771484375, 11.1953125, 12.8134765625, 14.431640625, 16.0498046875, 17.66796875, 19.2861328125, 20.904296875, 22.5224609375, 24.140625, 25.7587890625, 27.376953125, 28.9951171875, 30.61328125, 32.2314453125, 33.849609375, 35.4677734375, 37.0859375, 38.7041015625, 40.322265625, 41.9404296875, 43.55859375, 45.1767578125, 46.794921875, 48.4130859375, 50.03125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 9.0, 220.0, 652.0, 125.0, 12.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.327392578125, -16.333105087280273, -13.338817596435547, -10.34453010559082, -7.350242614746094, -4.355955123901367, -1.3616676330566406, 1.632619857788086, 4.6269073486328125, 7.621194839477539, 10.615482330322266, 13.609769821166992, 16.60405731201172, 19.598344802856445, 22.592632293701172, 25.5869197845459, 28.581207275390625, 31.57549476623535, 34.56978225708008, 37.56407165527344, 40.55835723876953, 43.552642822265625, 46.546932220458984, 49.541221618652344, 52.53550720214844, 55.52979278564453, 58.52408218383789, 61.51837158203125, 64.51265716552734, 67.50694274902344, 70.50123596191406, 73.49552154541016, 76.48980712890625, 79.48409271240234, 82.47837829589844, 85.47267150878906, 88.46695709228516, 91.46124267578125, 94.45553588867188, 97.44982147216797, 100.44410705566406, 103.43839263916016, 106.43267822265625, 109.42697143554688, 112.42125701904297, 115.41554260253906, 118.40983581542969, 121.40412139892578, 124.39840698242188, 127.39269256591797, 130.38697814941406, 133.3812713623047, 136.37554931640625, 139.36984252929688, 142.3641357421875, 145.35841369628906, 148.3527069091797, 151.3470001220703, 154.34127807617188, 157.3355712890625, 160.32986450195312, 163.3241424560547, 166.3184356689453, 169.31271362304688, 172.3070068359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 7.0, 7.0, 6.0, 11.0, 13.0, 20.0, 21.0, 11.0, 22.0, 29.0, 26.0, 27.0, 27.0, 28.0, 30.0, 37.0, 42.0, 38.0, 40.0, 37.0, 46.0, 48.0, 32.0, 46.0, 27.0, 39.0, 29.0, 28.0, 19.0, 28.0, 32.0, 18.0, 23.0, 20.0, 18.0, 14.0, 11.0, 9.0, 5.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.3079833984375, -46.60369110107422, -44.89939880371094, -43.195106506347656, -41.490814208984375, -39.786521911621094, -38.08222961425781, -36.37793731689453, -34.67364501953125, -32.96935272216797, -31.265060424804688, -29.560768127441406, -27.856475830078125, -26.152183532714844, -24.44788932800293, -22.74359703063965, -21.039302825927734, -19.335010528564453, -17.630718231201172, -15.926424980163574, -14.222132682800293, -12.517840385437012, -10.813547134399414, -9.109254837036133, -7.404962539672852, -5.70067024230957, -3.996377468109131, -2.2920846939086914, -0.5877923965454102, 1.116499900817871, 2.8207931518554688, 4.52508544921875, 6.229377746582031, 7.9336700439453125, 9.637962341308594, 11.342255592346191, 13.046547889709473, 14.750840187072754, 16.45513343811035, 18.159425735473633, 19.863718032836914, 21.568010330200195, 23.272302627563477, 24.97659683227539, 26.680889129638672, 28.385181427001953, 30.089473724365234, 31.793766021728516, 33.4980583190918, 35.20235061645508, 36.90664291381836, 38.61093521118164, 40.31522750854492, 42.0195198059082, 43.72381591796875, 45.42810821533203, 47.13240051269531, 48.836692810058594, 50.540985107421875, 52.245277404785156, 53.94956970214844, 55.65386199951172, 57.358154296875, 59.06244659423828, 60.76673889160156]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 3.0, 8.0, 11.0, 11.0, 14.0, 18.0, 16.0, 27.0, 34.0, 32.0, 33.0, 21.0, 48.0, 36.0, 47.0, 38.0, 41.0, 45.0, 42.0, 33.0, 51.0, 41.0, 35.0, 39.0, 42.0, 36.0, 26.0, 23.0, 18.0, 24.0, 15.0, 19.0, 16.0, 16.0, 8.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.2794189453125, -6.051025390625, -5.8226318359375, -5.59423828125, -5.3658447265625, -5.137451171875, -4.9090576171875, -4.6806640625, -4.4522705078125, -4.223876953125, -3.9954833984375, -3.76708984375, -3.5386962890625, -3.310302734375, -3.0819091796875, -2.853515625, -2.6251220703125, -2.396728515625, -2.1683349609375, -1.93994140625, -1.7115478515625, -1.483154296875, -1.2547607421875, -1.0263671875, -0.7979736328125, -0.569580078125, -0.3411865234375, -0.11279296875, 0.1156005859375, 0.343994140625, 0.5723876953125, 0.80078125, 1.0291748046875, 1.257568359375, 1.4859619140625, 1.71435546875, 1.9427490234375, 2.171142578125, 2.3995361328125, 2.6279296875, 2.8563232421875, 3.084716796875, 3.3131103515625, 3.54150390625, 3.7698974609375, 3.998291015625, 4.2266845703125, 4.455078125, 4.6834716796875, 4.911865234375, 5.1402587890625, 5.36865234375, 5.5970458984375, 5.825439453125, 6.0538330078125, 6.2822265625, 6.5106201171875, 6.739013671875, 6.9674072265625, 7.19580078125, 7.4241943359375, 7.652587890625, 7.8809814453125, 8.109375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 4.0, 13.0, 6.0, 13.0, 10.0, 22.0, 24.0, 33.0, 17.0, 48.0, 42.0, 66.0, 110.0, 220.0, 603.0, 2116.0, 20680.0, 1442369.0, 2674540.0, 48384.0, 3341.0, 813.0, 309.0, 159.0, 80.0, 39.0, 40.0, 33.0, 18.0, 17.0, 19.0, 17.0, 18.0, 11.0, 10.0, 10.0, 6.0, 1.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.63671875, -20.8671875, -20.09765625, -19.328125, -18.55859375, -17.7890625, -17.01953125, -16.25, -15.48046875, -14.7109375, -13.94140625, -13.171875, -12.40234375, -11.6328125, -10.86328125, -10.09375, -9.32421875, -8.5546875, -7.78515625, -7.015625, -6.24609375, -5.4765625, -4.70703125, -3.9375, -3.16796875, -2.3984375, -1.62890625, -0.859375, -0.08984375, 0.6796875, 1.44921875, 2.21875, 2.98828125, 3.7578125, 4.52734375, 5.296875, 6.06640625, 6.8359375, 7.60546875, 8.375, 9.14453125, 9.9140625, 10.68359375, 11.453125, 12.22265625, 12.9921875, 13.76171875, 14.53125, 15.30078125, 16.0703125, 16.83984375, 17.609375, 18.37890625, 19.1484375, 19.91796875, 20.6875, 21.45703125, 22.2265625, 22.99609375, 23.765625, 24.53515625, 25.3046875, 26.07421875, 26.84375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 14.0, 12.0, 13.0, 14.0, 36.0, 42.0, 46.0, 81.0, 99.0, 139.0, 214.0, 319.0, 456.0, 557.0, 570.0, 392.0, 316.0, 222.0, 149.0, 108.0, 85.0, 58.0, 37.0, 29.0, 25.0, 10.0, 11.0, 6.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.828125, -17.3585205078125, -16.888916015625, -16.4193115234375, -15.94970703125, -15.4801025390625, -15.010498046875, -14.5408935546875, -14.0712890625, -13.6016845703125, -13.132080078125, -12.6624755859375, -12.19287109375, -11.7232666015625, -11.253662109375, -10.7840576171875, -10.314453125, -9.8448486328125, -9.375244140625, -8.9056396484375, -8.43603515625, -7.9664306640625, -7.496826171875, -7.0272216796875, -6.5576171875, -6.0880126953125, -5.618408203125, -5.1488037109375, -4.67919921875, -4.2095947265625, -3.739990234375, -3.2703857421875, -2.80078125, -2.3311767578125, -1.861572265625, -1.3919677734375, -0.92236328125, -0.4527587890625, 0.016845703125, 0.4864501953125, 0.9560546875, 1.4256591796875, 1.895263671875, 2.3648681640625, 2.83447265625, 3.3040771484375, 3.773681640625, 4.2432861328125, 4.712890625, 5.1824951171875, 5.652099609375, 6.1217041015625, 6.59130859375, 7.0609130859375, 7.530517578125, 8.0001220703125, 8.4697265625, 8.9393310546875, 9.408935546875, 9.8785400390625, 10.34814453125, 10.8177490234375, 11.287353515625, 11.7569580078125, 12.2265625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 19.0, 22.0, 36.0, 44.0, 67.0, 86.0, 124.0, 165.0, 232.0, 322.0, 523.0, 1701.0, 4063190.0, 125500.0, 856.0, 397.0, 269.0, 176.0, 137.0, 104.0, 80.0, 67.0, 49.0, 29.0, 29.0, 20.0, 9.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.875, -107.8623046875, -104.849609375, -101.8369140625, -98.82421875, -95.8115234375, -92.798828125, -89.7861328125, -86.7734375, -83.7607421875, -80.748046875, -77.7353515625, -74.72265625, -71.7099609375, -68.697265625, -65.6845703125, -62.671875, -59.6591796875, -56.646484375, -53.6337890625, -50.62109375, -47.6083984375, -44.595703125, -41.5830078125, -38.5703125, -35.5576171875, -32.544921875, -29.5322265625, -26.51953125, -23.5068359375, -20.494140625, -17.4814453125, -14.46875, -11.4560546875, -8.443359375, -5.4306640625, -2.41796875, 0.5947265625, 3.607421875, 6.6201171875, 9.6328125, 12.6455078125, 15.658203125, 18.6708984375, 21.68359375, 24.6962890625, 27.708984375, 30.7216796875, 33.734375, 36.7470703125, 39.759765625, 42.7724609375, 45.78515625, 48.7978515625, 51.810546875, 54.8232421875, 57.8359375, 60.8486328125, 63.861328125, 66.8740234375, 69.88671875, 72.8994140625, 75.912109375, 78.9248046875, 81.9375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 164.0, 574.0, 249.0, 22.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.2158508300781, -278.1891784667969, -271.1625061035156, -264.1358337402344, -257.1091613769531, -250.0824737548828, -243.05580139160156, -236.0291290283203, -229.00245666503906, -221.9757843017578, -214.94911193847656, -207.92242431640625, -200.895751953125, -193.86907958984375, -186.8424072265625, -179.81573486328125, -172.7890625, -165.76239013671875, -158.7357177734375, -151.70904541015625, -144.68235778808594, -137.6556854248047, -130.62901306152344, -123.60234069824219, -116.57565307617188, -109.54898071289062, -102.52230072021484, -95.4956283569336, -88.46895599365234, -81.44227600097656, -74.41560363769531, -67.38893127441406, -60.36225891113281, -53.3355827331543, -46.30891036987305, -39.28223419189453, -32.25556182861328, -25.228885650634766, -18.20220947265625, -11.175537109375, -4.148860931396484, 2.8778138160705566, 9.904488563537598, 16.931163787841797, 23.95783805847168, 30.984512329101562, 38.01118850708008, 45.03786087036133, 52.064537048339844, 59.09121322631836, 66.11788940429688, 73.14456176757812, 80.17123413085938, 87.19790649414062, 94.2245864868164, 101.25125885009766, 108.27793884277344, 115.30461120605469, 122.33129119873047, 129.35797119140625, 136.3846435546875, 143.41131591796875, 150.43798828125, 157.46466064453125, 164.4913330078125]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 7.0, 15.0, 10.0, 15.0, 15.0, 11.0, 24.0, 17.0, 27.0, 32.0, 25.0, 21.0, 43.0, 36.0, 26.0, 37.0, 33.0, 35.0, 36.0, 48.0, 38.0, 36.0, 54.0, 47.0, 40.0, 30.0, 28.0, 28.0, 23.0, 21.0, 25.0, 17.0, 8.0, 16.0, 15.0, 14.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.587913513183594, -39.29560470581055, -38.003292083740234, -36.71098327636719, -35.41867446899414, -34.12636184692383, -32.83405303955078, -31.5417423248291, -30.249431610107422, -28.957120895385742, -27.664812088012695, -26.372501373291016, -25.080190658569336, -23.787879943847656, -22.49557113647461, -21.20326042175293, -19.910951614379883, -18.618640899658203, -17.326332092285156, -16.034021377563477, -14.741710662841797, -13.449400901794434, -12.15709114074707, -10.86478042602539, -9.572470664978027, -8.280160903930664, -6.987850189208984, -5.695540428161621, -4.4032301902771, -3.110919952392578, -1.8186101913452148, -0.5262994766235352, 0.7660102844238281, 2.0583205223083496, 3.350630521774292, 4.642940521240234, 5.935250759124756, 7.227560997009277, 8.51987075805664, 9.81218147277832, 11.104491233825684, 12.396800994873047, 13.689111709594727, 14.98142147064209, 16.273731231689453, 17.566041946411133, 18.858352661132812, 20.15066146850586, 21.44297218322754, 22.73528289794922, 24.027591705322266, 25.319902420043945, 26.612213134765625, 27.904521942138672, 29.19683265686035, 30.48914337158203, 31.781452178955078, 33.073760986328125, 34.36607360839844, 35.658382415771484, 36.95069122314453, 38.243003845214844, 39.53531265258789, 40.82762145996094, 42.11993408203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 8.0, 15.0, 13.0, 12.0, 15.0, 11.0, 23.0, 28.0, 33.0, 32.0, 31.0, 39.0, 42.0, 30.0, 48.0, 35.0, 37.0, 36.0, 35.0, 42.0, 56.0, 41.0, 35.0, 26.0, 24.0, 21.0, 32.0, 26.0, 27.0, 20.0, 29.0, 11.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 7.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.473876953125, -6.26416015625, -6.054443359375, -5.8447265625, -5.635009765625, -5.42529296875, -5.215576171875, -5.005859375, -4.796142578125, -4.58642578125, -4.376708984375, -4.1669921875, -3.957275390625, -3.74755859375, -3.537841796875, -3.328125, -3.118408203125, -2.90869140625, -2.698974609375, -2.4892578125, -2.279541015625, -2.06982421875, -1.860107421875, -1.650390625, -1.440673828125, -1.23095703125, -1.021240234375, -0.8115234375, -0.601806640625, -0.39208984375, -0.182373046875, 0.02734375, 0.237060546875, 0.44677734375, 0.656494140625, 0.8662109375, 1.075927734375, 1.28564453125, 1.495361328125, 1.705078125, 1.914794921875, 2.12451171875, 2.334228515625, 2.5439453125, 2.753662109375, 2.96337890625, 3.173095703125, 3.3828125, 3.592529296875, 3.80224609375, 4.011962890625, 4.2216796875, 4.431396484375, 4.64111328125, 4.850830078125, 5.060546875, 5.270263671875, 5.47998046875, 5.689697265625, 5.8994140625, 6.109130859375, 6.31884765625, 6.528564453125, 6.73828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 5.0, 11.0, 14.0, 15.0, 37.0, 42.0, 55.0, 103.0, 116.0, 186.0, 268.0, 370.0, 499.0, 701.0, 995.0, 1431.0, 2021.0, 2871.0, 4241.0, 6083.0, 8718.0, 12652.0, 18859.0, 29384.0, 45377.0, 72180.0, 115096.0, 191436.0, 198293.0, 121336.0, 75060.0, 47404.0, 29989.0, 20092.0, 13219.0, 8885.0, 6005.0, 4349.0, 2995.0, 2126.0, 1541.0, 1089.0, 713.0, 547.0, 353.0, 240.0, 177.0, 107.0, 79.0, 59.0, 49.0, 24.0, 18.0, 16.0, 17.0, 5.0, 8.0, 3.0, 2.0, 2.0], "bins": [-0.89111328125, -0.8633041381835938, -0.8354949951171875, -0.8076858520507812, -0.779876708984375, -0.7520675659179688, -0.7242584228515625, -0.6964492797851562, -0.66864013671875, -0.6408309936523438, -0.6130218505859375, -0.5852127075195312, -0.557403564453125, -0.5295944213867188, -0.5017852783203125, -0.47397613525390625, -0.4461669921875, -0.41835784912109375, -0.3905487060546875, -0.36273956298828125, -0.334930419921875, -0.30712127685546875, -0.2793121337890625, -0.25150299072265625, -0.22369384765625, -0.19588470458984375, -0.1680755615234375, -0.14026641845703125, -0.112457275390625, -0.08464813232421875, -0.0568389892578125, -0.02902984619140625, -0.001220703125, 0.02658843994140625, 0.0543975830078125, 0.08220672607421875, 0.110015869140625, 0.13782501220703125, 0.1656341552734375, 0.19344329833984375, 0.22125244140625, 0.24906158447265625, 0.2768707275390625, 0.30467987060546875, 0.332489013671875, 0.36029815673828125, 0.3881072998046875, 0.41591644287109375, 0.4437255859375, 0.47153472900390625, 0.4993438720703125, 0.5271530151367188, 0.554962158203125, 0.5827713012695312, 0.6105804443359375, 0.6383895874023438, 0.66619873046875, 0.6940078735351562, 0.7218170166015625, 0.7496261596679688, 0.777435302734375, 0.8052444458007812, 0.8330535888671875, 0.8608627319335938, 0.888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 9.0, 4.0, 7.0, 4.0, 4.0, 8.0, 10.0, 9.0, 10.0, 19.0, 19.0, 20.0, 13.0, 28.0, 20.0, 23.0, 20.0, 24.0, 21.0, 26.0, 28.0, 28.0, 32.0, 38.0, 27.0, 1052.0, 27.0, 29.0, 38.0, 36.0, 22.0, 31.0, 41.0, 32.0, 23.0, 28.0, 26.0, 23.0, 25.0, 18.0, 28.0, 21.0, 6.0, 18.0, 11.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.123046875, -3.01348876953125, -2.9039306640625, -2.79437255859375, -2.684814453125, -2.57525634765625, -2.4656982421875, -2.35614013671875, -2.24658203125, -2.13702392578125, -2.0274658203125, -1.91790771484375, -1.808349609375, -1.69879150390625, -1.5892333984375, -1.47967529296875, -1.3701171875, -1.26055908203125, -1.1510009765625, -1.04144287109375, -0.931884765625, -0.82232666015625, -0.7127685546875, -0.60321044921875, -0.49365234375, -0.38409423828125, -0.2745361328125, -0.16497802734375, -0.055419921875, 0.05413818359375, 0.1636962890625, 0.27325439453125, 0.3828125, 0.49237060546875, 0.6019287109375, 0.71148681640625, 0.821044921875, 0.93060302734375, 1.0401611328125, 1.14971923828125, 1.25927734375, 1.36883544921875, 1.4783935546875, 1.58795166015625, 1.697509765625, 1.80706787109375, 1.9166259765625, 2.02618408203125, 2.1357421875, 2.24530029296875, 2.3548583984375, 2.46441650390625, 2.573974609375, 2.68353271484375, 2.7930908203125, 2.90264892578125, 3.01220703125, 3.12176513671875, 3.2313232421875, 3.34088134765625, 3.450439453125, 3.55999755859375, 3.6695556640625, 3.77911376953125, 3.888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 7.0, 15.0, 13.0, 23.0, 33.0, 43.0, 76.0, 86.0, 165.0, 213.0, 314.0, 485.0, 682.0, 918.0, 1274.0, 1900.0, 2636.0, 3690.0, 5464.0, 7725.0, 11066.0, 15582.0, 23066.0, 34593.0, 51036.0, 79182.0, 126756.0, 1258390.0, 169149.0, 100755.0, 65098.0, 42784.0, 28927.0, 19746.0, 13450.0, 9479.0, 6679.0, 4618.0, 3335.0, 2235.0, 1643.0, 1184.0, 770.0, 597.0, 385.0, 272.0, 197.0, 134.0, 91.0, 55.0, 38.0, 37.0, 23.0, 6.0, 10.0, 4.0, 2.0, 2.0], "bins": [-0.8681640625, -0.8424606323242188, -0.8167572021484375, -0.7910537719726562, -0.765350341796875, -0.7396469116210938, -0.7139434814453125, -0.6882400512695312, -0.66253662109375, -0.6368331909179688, -0.6111297607421875, -0.5854263305664062, -0.559722900390625, -0.5340194702148438, -0.5083160400390625, -0.48261260986328125, -0.4569091796875, -0.43120574951171875, -0.4055023193359375, -0.37979888916015625, -0.354095458984375, -0.32839202880859375, -0.3026885986328125, -0.27698516845703125, -0.25128173828125, -0.22557830810546875, -0.1998748779296875, -0.17417144775390625, -0.148468017578125, -0.12276458740234375, -0.0970611572265625, -0.07135772705078125, -0.045654296875, -0.01995086669921875, 0.0057525634765625, 0.03145599365234375, 0.057159423828125, 0.08286285400390625, 0.1085662841796875, 0.13426971435546875, 0.15997314453125, 0.18567657470703125, 0.2113800048828125, 0.23708343505859375, 0.262786865234375, 0.28849029541015625, 0.3141937255859375, 0.33989715576171875, 0.3656005859375, 0.39130401611328125, 0.4170074462890625, 0.44271087646484375, 0.468414306640625, 0.49411773681640625, 0.5198211669921875, 0.5455245971679688, 0.57122802734375, 0.5969314575195312, 0.6226348876953125, 0.6483383178710938, 0.674041748046875, 0.6997451782226562, 0.7254486083984375, 0.7511520385742188, 0.77685546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 6.0, 10.0, 14.0, 19.0, 24.0, 26.0, 20.0, 37.0, 38.0, 26.0, 45.0, 64.0, 52.0, 74.0, 63.0, 65.0, 58.0, 54.0, 50.0, 39.0, 30.0, 33.0, 24.0, 28.0, 25.0, 8.0, 16.0, 5.0, 8.0, 7.0, 9.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0006403923034667969, -0.0006232447922229767, -0.0006060972809791565, -0.0005889497697353363, -0.0005718022584915161, -0.0005546547472476959, -0.0005375072360038757, -0.0005203597247600555, -0.0005032122135162354, -0.00048606470227241516, -0.00046891719102859497, -0.0004517696797847748, -0.0004346221685409546, -0.0004174746572971344, -0.0004003271460533142, -0.000383179634809494, -0.00036603212356567383, -0.00034888461232185364, -0.00033173710107803345, -0.00031458958983421326, -0.00029744207859039307, -0.0002802945673465729, -0.0002631470561027527, -0.0002459995448589325, -0.0002288520336151123, -0.00021170452237129211, -0.00019455701112747192, -0.00017740949988365173, -0.00016026198863983154, -0.00014311447739601135, -0.00012596696615219116, -0.00010881945490837097, -9.167194366455078e-05, -7.452443242073059e-05, -5.73769211769104e-05, -4.022940993309021e-05, -2.308189868927002e-05, -5.934387445449829e-06, 1.1213123798370361e-05, 2.8360635042190552e-05, 4.550814628601074e-05, 6.265565752983093e-05, 7.980316877365112e-05, 9.695068001747131e-05, 0.0001140981912612915, 0.0001312457025051117, 0.00014839321374893188, 0.00016554072499275208, 0.00018268823623657227, 0.00019983574748039246, 0.00021698325872421265, 0.00023413076996803284, 0.00025127828121185303, 0.0002684257924556732, 0.0002855733036994934, 0.0003027208149433136, 0.0003198683261871338, 0.000337015837430954, 0.00035416334867477417, 0.00037131085991859436, 0.00038845837116241455, 0.00040560588240623474, 0.00042275339365005493, 0.0004399009048938751, 0.0004570484161376953]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 11.0, 3.0, 7.0, 11.0, 16.0, 17.0, 24.0, 22.0, 35.0, 26.0, 43.0, 44.0, 63.0, 92.0, 149.0, 243.0, 594.0, 4455.0, 1032496.0, 8656.0, 703.0, 259.0, 140.0, 94.0, 75.0, 51.0, 47.0, 31.0, 28.0, 23.0, 23.0, 14.0, 8.0, 15.0, 8.0, 4.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0107574462890625, -0.010380744934082031, -0.010004043579101562, -0.009627342224121094, -0.009250640869140625, -0.008873939514160156, -0.008497238159179688, -0.008120536804199219, -0.00774383544921875, -0.007367134094238281, -0.0069904327392578125, -0.006613731384277344, -0.006237030029296875, -0.005860328674316406, -0.0054836273193359375, -0.005106925964355469, -0.004730224609375, -0.004353523254394531, -0.0039768218994140625, -0.0036001205444335938, -0.003223419189453125, -0.0028467178344726562, -0.0024700164794921875, -0.0020933151245117188, -0.00171661376953125, -0.0013399124145507812, -0.0009632110595703125, -0.0005865097045898438, -0.000209808349609375, 0.00016689300537109375, 0.0005435943603515625, 0.0009202957153320312, 0.0012969970703125, 0.0016736984252929688, 0.0020503997802734375, 0.0024271011352539062, 0.002803802490234375, 0.0031805038452148438, 0.0035572052001953125, 0.003933906555175781, 0.00431060791015625, 0.004687309265136719, 0.0050640106201171875, 0.005440711975097656, 0.005817413330078125, 0.006194114685058594, 0.0065708160400390625, 0.006947517395019531, 0.00732421875, 0.007700920104980469, 0.008077621459960938, 0.008454322814941406, 0.008831024169921875, 0.009207725524902344, 0.009584426879882812, 0.009961128234863281, 0.01033782958984375, 0.010714530944824219, 0.011091232299804688, 0.011467933654785156, 0.011844635009765625, 0.012221336364746094, 0.012598037719726562, 0.012974739074707031, 0.0133514404296875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 37.0, 287.0, 506.0, 162.0, 16.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0024123857729136944, -0.0023662885650992393, -0.0023201913572847843, -0.0022740941494703293, -0.0022279969416558743, -0.0021818997338414192, -0.002135802526026964, -0.002089705318212509, -0.002043608110398054, -0.001997510902583599, -0.001951413694769144, -0.001905316486954689, -0.001859219279140234, -0.001813122071325779, -0.001767024863511324, -0.001720927655696869, -0.0016748305642977357, -0.0016287333564832807, -0.0015826361486688256, -0.0015365389408543706, -0.0014904417330399156, -0.0014443445252254605, -0.0013982474338263273, -0.0013521502260118723, -0.0013060530181974173, -0.0012599558103829622, -0.0012138586025685072, -0.0011677613947540522, -0.0011216641869395971, -0.001075566979125142, -0.001029469771310687, -0.000983372563496232, -0.0009372754138894379, -0.0008911782060749829, -0.0008450809982605278, -0.0007989838486537337, -0.0007528866408392787, -0.0007067894330248237, -0.0006606922252103686, -0.0006145950173959136, -0.0005684978095814586, -0.0005224006017670035, -0.0004763033939525485, -0.00043020621524192393, -0.0003841090074274689, -0.00033801179961301386, -0.0002919146209023893, -0.00024581741308793426, -0.00019972020527347922, -0.0001536229974590242, -0.00010752580419648439, -6.142861093394458e-05, -1.533140311948955e-05, 3.076580469496548e-05, 7.686298340559006e-05, 0.0001229601912200451, 0.00016905739903450012, 0.00021515460684895515, 0.0002612518146634102, 0.00030734899337403476, 0.0003534462011884898, 0.0003995434090029448, 0.0004456405877135694, 0.0004917377955280244, 0.0005378350033424795]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 5.0, 11.0, 8.0, 13.0, 12.0, 18.0, 17.0, 15.0, 20.0, 27.0, 23.0, 29.0, 30.0, 25.0, 36.0, 36.0, 36.0, 33.0, 58.0, 35.0, 36.0, 43.0, 44.0, 33.0, 42.0, 45.0, 27.0, 28.0, 20.0, 30.0, 20.0, 19.0, 14.0, 17.0, 15.0, 10.0, 11.0, 13.0, 6.0, 10.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00025594234466552734, -0.0002481583505868912, -0.000240374356508255, -0.00023259036242961884, -0.00022480636835098267, -0.0002170223742723465, -0.00020923838019371033, -0.00020145438611507416, -0.000193670392036438, -0.00018588639795780182, -0.00017810240387916565, -0.00017031840980052948, -0.0001625344157218933, -0.00015475042164325714, -0.00014696642756462097, -0.0001391824334859848, -0.00013139843940734863, -0.00012361444532871246, -0.0001158304512500763, -0.00010804645717144012, -0.00010026246309280396, -9.247846901416779e-05, -8.469447493553162e-05, -7.691048085689545e-05, -6.912648677825928e-05, -6.134249269962311e-05, -5.355849862098694e-05, -4.577450454235077e-05, -3.79905104637146e-05, -3.020651638507843e-05, -2.242252230644226e-05, -1.4638528227806091e-05, -6.854534149169922e-06, 9.294599294662476e-07, 8.713454008102417e-06, 1.6497448086738586e-05, 2.4281442165374756e-05, 3.2065436244010925e-05, 3.9849430322647095e-05, 4.7633424401283264e-05, 5.5417418479919434e-05, 6.32014125585556e-05, 7.098540663719177e-05, 7.876940071582794e-05, 8.655339479446411e-05, 9.433738887310028e-05, 0.00010212138295173645, 0.00010990537703037262, 0.00011768937110900879, 0.00012547336518764496, 0.00013325735926628113, 0.0001410413533449173, 0.00014882534742355347, 0.00015660934150218964, 0.0001643933355808258, 0.00017217732965946198, 0.00017996132373809814, 0.00018774531781673431, 0.00019552931189537048, 0.00020331330597400665, 0.00021109730005264282, 0.000218881294131279, 0.00022666528820991516, 0.00023444928228855133, 0.0002422332763671875]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 8.0, 15.0, 13.0, 12.0, 15.0, 11.0, 23.0, 28.0, 33.0, 32.0, 31.0, 39.0, 42.0, 30.0, 48.0, 35.0, 37.0, 36.0, 35.0, 42.0, 56.0, 41.0, 35.0, 26.0, 24.0, 21.0, 32.0, 26.0, 27.0, 20.0, 29.0, 11.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 7.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.473876953125, -6.26416015625, -6.054443359375, -5.8447265625, -5.635009765625, -5.42529296875, -5.215576171875, -5.005859375, -4.796142578125, -4.58642578125, -4.376708984375, -4.1669921875, -3.957275390625, -3.74755859375, -3.537841796875, -3.328125, -3.118408203125, -2.90869140625, -2.698974609375, -2.4892578125, -2.279541015625, -2.06982421875, -1.860107421875, -1.650390625, -1.440673828125, -1.23095703125, -1.021240234375, -0.8115234375, -0.601806640625, -0.39208984375, -0.182373046875, 0.02734375, 0.237060546875, 0.44677734375, 0.656494140625, 0.8662109375, 1.075927734375, 1.28564453125, 1.495361328125, 1.705078125, 1.914794921875, 2.12451171875, 2.334228515625, 2.5439453125, 2.753662109375, 2.96337890625, 3.173095703125, 3.3828125, 3.592529296875, 3.80224609375, 4.011962890625, 4.2216796875, 4.431396484375, 4.64111328125, 4.850830078125, 5.060546875, 5.270263671875, 5.47998046875, 5.689697265625, 5.8994140625, 6.109130859375, 6.31884765625, 6.528564453125, 6.73828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 7.0, 10.0, 18.0, 14.0, 28.0, 41.0, 50.0, 64.0, 87.0, 103.0, 133.0, 176.0, 316.0, 546.0, 1190.0, 2891.0, 8457.0, 27007.0, 87651.0, 316758.0, 432949.0, 116460.0, 35437.0, 11276.0, 3724.0, 1384.0, 636.0, 300.0, 221.0, 142.0, 120.0, 82.0, 59.0, 51.0, 29.0, 38.0, 27.0, 12.0, 7.0, 9.0, 5.0, 10.0, 6.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.9609375, -6.74420166015625, -6.5274658203125, -6.31072998046875, -6.093994140625, -5.87725830078125, -5.6605224609375, -5.44378662109375, -5.22705078125, -5.01031494140625, -4.7935791015625, -4.57684326171875, -4.360107421875, -4.14337158203125, -3.9266357421875, -3.70989990234375, -3.4931640625, -3.27642822265625, -3.0596923828125, -2.84295654296875, -2.626220703125, -2.40948486328125, -2.1927490234375, -1.97601318359375, -1.75927734375, -1.54254150390625, -1.3258056640625, -1.10906982421875, -0.892333984375, -0.67559814453125, -0.4588623046875, -0.24212646484375, -0.025390625, 0.19134521484375, 0.4080810546875, 0.62481689453125, 0.841552734375, 1.05828857421875, 1.2750244140625, 1.49176025390625, 1.70849609375, 1.92523193359375, 2.1419677734375, 2.35870361328125, 2.575439453125, 2.79217529296875, 3.0089111328125, 3.22564697265625, 3.4423828125, 3.65911865234375, 3.8758544921875, 4.09259033203125, 4.309326171875, 4.52606201171875, 4.7427978515625, 4.95953369140625, 5.17626953125, 5.39300537109375, 5.6097412109375, 5.82647705078125, 6.043212890625, 6.25994873046875, 6.4766845703125, 6.69342041015625, 6.91015625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 7.0, 9.0, 11.0, 17.0, 23.0, 26.0, 30.0, 30.0, 31.0, 46.0, 45.0, 32.0, 50.0, 74.0, 119.0, 1814.0, 237.0, 68.0, 49.0, 49.0, 43.0, 36.0, 35.0, 24.0, 26.0, 30.0, 21.0, 15.0, 22.0, 14.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.25, -28.43115234375, -27.6123046875, -26.79345703125, -25.974609375, -25.15576171875, -24.3369140625, -23.51806640625, -22.69921875, -21.88037109375, -21.0615234375, -20.24267578125, -19.423828125, -18.60498046875, -17.7861328125, -16.96728515625, -16.1484375, -15.32958984375, -14.5107421875, -13.69189453125, -12.873046875, -12.05419921875, -11.2353515625, -10.41650390625, -9.59765625, -8.77880859375, -7.9599609375, -7.14111328125, -6.322265625, -5.50341796875, -4.6845703125, -3.86572265625, -3.046875, -2.22802734375, -1.4091796875, -0.59033203125, 0.228515625, 1.04736328125, 1.8662109375, 2.68505859375, 3.50390625, 4.32275390625, 5.1416015625, 5.96044921875, 6.779296875, 7.59814453125, 8.4169921875, 9.23583984375, 10.0546875, 10.87353515625, 11.6923828125, 12.51123046875, 13.330078125, 14.14892578125, 14.9677734375, 15.78662109375, 16.60546875, 17.42431640625, 18.2431640625, 19.06201171875, 19.880859375, 20.69970703125, 21.5185546875, 22.33740234375, 23.15625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 10.0, 6.0, 8.0, 20.0, 23.0, 62.0, 61.0, 81.0, 121.0, 179.0, 297.0, 606.0, 3398.0, 3129633.0, 9421.0, 817.0, 349.0, 201.0, 119.0, 98.0, 61.0, 44.0, 29.0, 23.0, 13.0, 10.0, 8.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.75, -68.2763671875, -65.802734375, -63.3291015625, -60.85546875, -58.3818359375, -55.908203125, -53.4345703125, -50.9609375, -48.4873046875, -46.013671875, -43.5400390625, -41.06640625, -38.5927734375, -36.119140625, -33.6455078125, -31.171875, -28.6982421875, -26.224609375, -23.7509765625, -21.27734375, -18.8037109375, -16.330078125, -13.8564453125, -11.3828125, -8.9091796875, -6.435546875, -3.9619140625, -1.48828125, 0.9853515625, 3.458984375, 5.9326171875, 8.40625, 10.8798828125, 13.353515625, 15.8271484375, 18.30078125, 20.7744140625, 23.248046875, 25.7216796875, 28.1953125, 30.6689453125, 33.142578125, 35.6162109375, 38.08984375, 40.5634765625, 43.037109375, 45.5107421875, 47.984375, 50.4580078125, 52.931640625, 55.4052734375, 57.87890625, 60.3525390625, 62.826171875, 65.2998046875, 67.7734375, 70.2470703125, 72.720703125, 75.1943359375, 77.66796875, 80.1416015625, 82.615234375, 85.0888671875, 87.5625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 41.0, 667.0, 294.0, 11.0, 1.0, 0.0, 1.0], "bins": [-240.0944366455078, -236.007080078125, -231.91973876953125, -227.83238220214844, -223.74502563476562, -219.65768432617188, -215.57032775878906, -211.48297119140625, -207.3956298828125, -203.3082733154297, -199.22093200683594, -195.13357543945312, -191.0462188720703, -186.9588623046875, -182.87152099609375, -178.78416442871094, -174.69680786132812, -170.6094512939453, -166.52210998535156, -162.43475341796875, -158.34739685058594, -154.26004028320312, -150.17269897460938, -146.08534240722656, -141.99798583984375, -137.91062927246094, -133.8232879638672, -129.73593139648438, -125.64857482910156, -121.56122589111328, -117.473876953125, -113.38652038574219, -109.29917907714844, -105.21183013916016, -101.12447357177734, -97.03712463378906, -92.94976806640625, -88.86241912841797, -84.77507019042969, -80.68771362304688, -76.6003646850586, -72.51301574707031, -68.4256591796875, -64.33831024169922, -60.25095748901367, -56.163604736328125, -52.076255798339844, -47.9889030456543, -43.90155029296875, -39.8141975402832, -35.726844787597656, -31.639495849609375, -27.552143096923828, -23.46479034423828, -19.377439498901367, -15.290088653564453, -11.202737808227539, -7.115386009216309, -3.028034210205078, 1.0593175888061523, 5.146669387817383, 9.23402214050293, 13.321372985839844, 17.408723831176758, 21.496076583862305]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 6.0, 9.0, 11.0, 15.0, 12.0, 6.0, 23.0, 20.0, 26.0, 25.0, 21.0, 24.0, 41.0, 27.0, 35.0, 36.0, 46.0, 38.0, 40.0, 50.0, 42.0, 41.0, 41.0, 38.0, 37.0, 34.0, 27.0, 39.0, 17.0, 23.0, 23.0, 23.0, 15.0, 9.0, 13.0, 13.0, 11.0, 5.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-59.17918395996094, -57.40391540527344, -55.62864685058594, -53.8533821105957, -52.0781135559082, -50.3028450012207, -48.52758026123047, -46.75231170654297, -44.97704315185547, -43.20177459716797, -41.42650604248047, -39.651241302490234, -37.875972747802734, -36.100704193115234, -34.325439453125, -32.5501708984375, -30.77490234375, -28.9996337890625, -27.224367141723633, -25.449100494384766, -23.673831939697266, -21.898563385009766, -20.1232967376709, -18.34803009033203, -16.57276153564453, -14.797493934631348, -13.022226333618164, -11.24695873260498, -9.471691131591797, -7.696423530578613, -5.92115592956543, -4.145888328552246, -2.370624542236328, -0.5953569412231445, 1.179910659790039, 2.9551782608032227, 4.730445861816406, 6.50571346282959, 8.280981063842773, 10.056248664855957, 11.83151626586914, 13.606783866882324, 15.382051467895508, 17.157318115234375, 18.932586669921875, 20.707855224609375, 22.483121871948242, 24.25838851928711, 26.03365707397461, 27.80892562866211, 29.584192276000977, 31.359458923339844, 33.134727478027344, 34.909996032714844, 36.685264587402344, 38.46052932739258, 40.23579788208008, 42.01106643676758, 43.78633117675781, 45.56159973144531, 47.33686828613281, 49.11213684082031, 50.88740539550781, 52.66267013549805, 54.43793869018555]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 7.0, 8.0, 9.0, 12.0, 17.0, 19.0, 14.0, 12.0, 26.0, 28.0, 33.0, 37.0, 39.0, 27.0, 39.0, 39.0, 33.0, 39.0, 30.0, 34.0, 43.0, 36.0, 45.0, 37.0, 42.0, 26.0, 21.0, 29.0, 28.0, 21.0, 25.0, 20.0, 21.0, 17.0, 16.0, 12.0, 6.0, 10.0, 7.0, 4.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.7109375, -6.50421142578125, -6.2974853515625, -6.09075927734375, -5.884033203125, -5.67730712890625, -5.4705810546875, -5.26385498046875, -5.05712890625, -4.85040283203125, -4.6436767578125, -4.43695068359375, -4.230224609375, -4.02349853515625, -3.8167724609375, -3.61004638671875, -3.4033203125, -3.19659423828125, -2.9898681640625, -2.78314208984375, -2.576416015625, -2.36968994140625, -2.1629638671875, -1.95623779296875, -1.74951171875, -1.54278564453125, -1.3360595703125, -1.12933349609375, -0.922607421875, -0.71588134765625, -0.5091552734375, -0.30242919921875, -0.095703125, 0.11102294921875, 0.3177490234375, 0.52447509765625, 0.731201171875, 0.93792724609375, 1.1446533203125, 1.35137939453125, 1.55810546875, 1.76483154296875, 1.9715576171875, 2.17828369140625, 2.385009765625, 2.59173583984375, 2.7984619140625, 3.00518798828125, 3.2119140625, 3.41864013671875, 3.6253662109375, 3.83209228515625, 4.038818359375, 4.24554443359375, 4.4522705078125, 4.65899658203125, 4.86572265625, 5.07244873046875, 5.2791748046875, 5.48590087890625, 5.692626953125, 5.89935302734375, 6.1060791015625, 6.31280517578125, 6.51953125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 6.0, 5.0, 9.0, 6.0, 9.0, 18.0, 12.0, 19.0, 19.0, 31.0, 48.0, 60.0, 75.0, 91.0, 156.0, 202.0, 415.0, 1106.0, 6842.0, 290235.0, 3570370.0, 314713.0, 7392.0, 1223.0, 417.0, 229.0, 126.0, 97.0, 71.0, 63.0, 42.0, 48.0, 23.0, 20.0, 16.0, 8.0, 13.0, 8.0, 7.0, 8.0, 6.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.015625, -24.290771484375, -23.56591796875, -22.841064453125, -22.1162109375, -21.391357421875, -20.66650390625, -19.941650390625, -19.216796875, -18.491943359375, -17.76708984375, -17.042236328125, -16.3173828125, -15.592529296875, -14.86767578125, -14.142822265625, -13.41796875, -12.693115234375, -11.96826171875, -11.243408203125, -10.5185546875, -9.793701171875, -9.06884765625, -8.343994140625, -7.619140625, -6.894287109375, -6.16943359375, -5.444580078125, -4.7197265625, -3.994873046875, -3.27001953125, -2.545166015625, -1.8203125, -1.095458984375, -0.37060546875, 0.354248046875, 1.0791015625, 1.803955078125, 2.52880859375, 3.253662109375, 3.978515625, 4.703369140625, 5.42822265625, 6.153076171875, 6.8779296875, 7.602783203125, 8.32763671875, 9.052490234375, 9.77734375, 10.502197265625, 11.22705078125, 11.951904296875, 12.6767578125, 13.401611328125, 14.12646484375, 14.851318359375, 15.576171875, 16.301025390625, 17.02587890625, 17.750732421875, 18.4755859375, 19.200439453125, 19.92529296875, 20.650146484375, 21.375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 18.0, 26.0, 38.0, 51.0, 75.0, 77.0, 101.0, 156.0, 230.0, 349.0, 528.0, 580.0, 580.0, 411.0, 252.0, 180.0, 127.0, 86.0, 49.0, 51.0, 30.0, 16.0, 9.0, 13.0, 9.0, 0.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7109375, -14.244873046875, -13.77880859375, -13.312744140625, -12.8466796875, -12.380615234375, -11.91455078125, -11.448486328125, -10.982421875, -10.516357421875, -10.05029296875, -9.584228515625, -9.1181640625, -8.652099609375, -8.18603515625, -7.719970703125, -7.25390625, -6.787841796875, -6.32177734375, -5.855712890625, -5.3896484375, -4.923583984375, -4.45751953125, -3.991455078125, -3.525390625, -3.059326171875, -2.59326171875, -2.127197265625, -1.6611328125, -1.195068359375, -0.72900390625, -0.262939453125, 0.203125, 0.669189453125, 1.13525390625, 1.601318359375, 2.0673828125, 2.533447265625, 2.99951171875, 3.465576171875, 3.931640625, 4.397705078125, 4.86376953125, 5.329833984375, 5.7958984375, 6.261962890625, 6.72802734375, 7.194091796875, 7.66015625, 8.126220703125, 8.59228515625, 9.058349609375, 9.5244140625, 9.990478515625, 10.45654296875, 10.922607421875, 11.388671875, 11.854736328125, 12.32080078125, 12.786865234375, 13.2529296875, 13.718994140625, 14.18505859375, 14.651123046875, 15.1171875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 13.0, 12.0, 16.0, 30.0, 32.0, 53.0, 49.0, 103.0, 104.0, 124.0, 182.0, 255.0, 347.0, 610.0, 3026.0, 4030765.0, 155985.0, 974.0, 373.0, 279.0, 213.0, 135.0, 113.0, 98.0, 85.0, 64.0, 54.0, 50.0, 29.0, 38.0, 14.0, 12.0, 11.0, 13.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.4375, -75.8896484375, -73.341796875, -70.7939453125, -68.24609375, -65.6982421875, -63.150390625, -60.6025390625, -58.0546875, -55.5068359375, -52.958984375, -50.4111328125, -47.86328125, -45.3154296875, -42.767578125, -40.2197265625, -37.671875, -35.1240234375, -32.576171875, -30.0283203125, -27.48046875, -24.9326171875, -22.384765625, -19.8369140625, -17.2890625, -14.7412109375, -12.193359375, -9.6455078125, -7.09765625, -4.5498046875, -2.001953125, 0.5458984375, 3.09375, 5.6416015625, 8.189453125, 10.7373046875, 13.28515625, 15.8330078125, 18.380859375, 20.9287109375, 23.4765625, 26.0244140625, 28.572265625, 31.1201171875, 33.66796875, 36.2158203125, 38.763671875, 41.3115234375, 43.859375, 46.4072265625, 48.955078125, 51.5029296875, 54.05078125, 56.5986328125, 59.146484375, 61.6943359375, 64.2421875, 66.7900390625, 69.337890625, 71.8857421875, 74.43359375, 76.9814453125, 79.529296875, 82.0771484375, 84.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 43.0, 274.0, 447.0, 204.0, 34.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.85195922851562, -217.94973754882812, -213.04751586914062, -208.14529418945312, -203.24307250976562, -198.3408660888672, -193.4386444091797, -188.5364227294922, -183.6342010498047, -178.7319793701172, -173.8297576904297, -168.9275360107422, -164.02532958984375, -159.12310791015625, -154.22088623046875, -149.31866455078125, -144.41644287109375, -139.51422119140625, -134.61199951171875, -129.70977783203125, -124.80756378173828, -119.90534210205078, -115.00312805175781, -110.10090637207031, -105.19868469238281, -100.29646301269531, -95.39424133300781, -90.49202728271484, -85.58980560302734, -80.68758392333984, -75.78536987304688, -70.88314819335938, -65.9809341430664, -61.078712463378906, -56.17649459838867, -51.27427673339844, -46.37205505371094, -41.46983337402344, -36.5676155090332, -31.66539764404297, -26.76317596435547, -21.8609561920166, -16.958736419677734, -12.056516647338867, -7.154296875, -2.252077102661133, 2.6501426696777344, 7.552360534667969, 12.454582214355469, 17.356801986694336, 22.259021759033203, 27.16124153137207, 32.06346130371094, 36.96568298339844, 41.86790084838867, 46.770118713378906, 51.672340393066406, 56.574562072753906, 61.47677993774414, 66.37899780273438, 71.28121948242188, 76.18344116210938, 81.08566284179688, 85.98787689208984, 90.89009857177734]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 7.0, 10.0, 10.0, 20.0, 13.0, 22.0, 10.0, 40.0, 25.0, 38.0, 32.0, 29.0, 40.0, 36.0, 40.0, 42.0, 34.0, 38.0, 32.0, 37.0, 44.0, 33.0, 39.0, 34.0, 30.0, 25.0, 37.0, 20.0, 16.0, 21.0, 16.0, 21.0, 13.0, 10.0, 8.0, 13.0, 5.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-39.63624572753906, -38.40560531616211, -37.17496871948242, -35.94432830810547, -34.71369171142578, -33.48305130004883, -32.252410888671875, -31.021772384643555, -29.791133880615234, -28.560495376586914, -27.329856872558594, -26.09921646118164, -24.86857795715332, -23.637939453125, -22.407299041748047, -21.176660537719727, -19.946022033691406, -18.715383529663086, -17.484745025634766, -16.254104614257812, -15.023466110229492, -13.792827606201172, -12.562188148498535, -11.331548690795898, -10.100910186767578, -8.870271682739258, -7.639632225036621, -6.408993244171143, -5.178354263305664, -3.9477152824401855, -2.717076301574707, -1.4864368438720703, -0.2557945251464844, 0.9748444557189941, 2.2054834365844727, 3.436122417449951, 4.66676139831543, 5.897400379180908, 7.128039360046387, 8.358678817749023, 9.589317321777344, 10.819955825805664, 12.0505952835083, 13.281234741210938, 14.511873245239258, 15.742511749267578, 16.97315216064453, 18.20379066467285, 19.434429168701172, 20.665067672729492, 21.895706176757812, 23.126346588134766, 24.356985092163086, 25.587623596191406, 26.81826400756836, 28.04890251159668, 29.279541015625, 30.51017951965332, 31.74081802368164, 32.971458435058594, 34.20209503173828, 35.432735443115234, 36.66337585449219, 37.894012451171875, 39.12465286254883]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 11.0, 12.0, 15.0, 18.0, 12.0, 23.0, 28.0, 19.0, 28.0, 27.0, 36.0, 35.0, 44.0, 33.0, 47.0, 46.0, 50.0, 33.0, 39.0, 39.0, 37.0, 33.0, 28.0, 36.0, 39.0, 26.0, 26.0, 26.0, 23.0, 24.0, 14.0, 19.0, 10.0, 10.0, 15.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3212890625, -6.099609375, -5.8779296875, -5.65625, -5.4345703125, -5.212890625, -4.9912109375, -4.76953125, -4.5478515625, -4.326171875, -4.1044921875, -3.8828125, -3.6611328125, -3.439453125, -3.2177734375, -2.99609375, -2.7744140625, -2.552734375, -2.3310546875, -2.109375, -1.8876953125, -1.666015625, -1.4443359375, -1.22265625, -1.0009765625, -0.779296875, -0.5576171875, -0.3359375, -0.1142578125, 0.107421875, 0.3291015625, 0.55078125, 0.7724609375, 0.994140625, 1.2158203125, 1.4375, 1.6591796875, 1.880859375, 2.1025390625, 2.32421875, 2.5458984375, 2.767578125, 2.9892578125, 3.2109375, 3.4326171875, 3.654296875, 3.8759765625, 4.09765625, 4.3193359375, 4.541015625, 4.7626953125, 4.984375, 5.2060546875, 5.427734375, 5.6494140625, 5.87109375, 6.0927734375, 6.314453125, 6.5361328125, 6.7578125, 6.9794921875, 7.201171875, 7.4228515625, 7.64453125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 5.0, 12.0, 10.0, 17.0, 27.0, 42.0, 56.0, 73.0, 99.0, 175.0, 248.0, 360.0, 491.0, 790.0, 1167.0, 1654.0, 2565.0, 3856.0, 5926.0, 9279.0, 14653.0, 23762.0, 38019.0, 63856.0, 108400.0, 192852.0, 236447.0, 137716.0, 79264.0, 47644.0, 28962.0, 17869.0, 11261.0, 7100.0, 4692.0, 3045.0, 1999.0, 1291.0, 941.0, 569.0, 443.0, 284.0, 200.0, 140.0, 95.0, 60.0, 40.0, 24.0, 29.0, 25.0, 8.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0], "bins": [-1.150390625, -1.115753173828125, -1.08111572265625, -1.046478271484375, -1.0118408203125, -0.977203369140625, -0.94256591796875, -0.907928466796875, -0.873291015625, -0.838653564453125, -0.80401611328125, -0.769378662109375, -0.7347412109375, -0.700103759765625, -0.66546630859375, -0.630828857421875, -0.59619140625, -0.561553955078125, -0.52691650390625, -0.492279052734375, -0.4576416015625, -0.423004150390625, -0.38836669921875, -0.353729248046875, -0.319091796875, -0.284454345703125, -0.24981689453125, -0.215179443359375, -0.1805419921875, -0.145904541015625, -0.11126708984375, -0.076629638671875, -0.0419921875, -0.007354736328125, 0.02728271484375, 0.061920166015625, 0.0965576171875, 0.131195068359375, 0.16583251953125, 0.200469970703125, 0.235107421875, 0.269744873046875, 0.30438232421875, 0.339019775390625, 0.3736572265625, 0.408294677734375, 0.44293212890625, 0.477569580078125, 0.51220703125, 0.546844482421875, 0.58148193359375, 0.616119384765625, 0.6507568359375, 0.685394287109375, 0.72003173828125, 0.754669189453125, 0.789306640625, 0.823944091796875, 0.85858154296875, 0.893218994140625, 0.9278564453125, 0.962493896484375, 0.99713134765625, 1.031768798828125, 1.06640625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 12.0, 14.0, 22.0, 13.0, 16.0, 19.0, 20.0, 27.0, 30.0, 33.0, 38.0, 45.0, 42.0, 50.0, 35.0, 69.0, 1063.0, 56.0, 36.0, 39.0, 41.0, 43.0, 32.0, 44.0, 27.0, 25.0, 17.0, 23.0, 15.0, 23.0, 16.0, 4.0, 7.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9921875, -4.83648681640625, -4.6807861328125, -4.52508544921875, -4.369384765625, -4.21368408203125, -4.0579833984375, -3.90228271484375, -3.74658203125, -3.59088134765625, -3.4351806640625, -3.27947998046875, -3.123779296875, -2.96807861328125, -2.8123779296875, -2.65667724609375, -2.5009765625, -2.34527587890625, -2.1895751953125, -2.03387451171875, -1.878173828125, -1.72247314453125, -1.5667724609375, -1.41107177734375, -1.25537109375, -1.09967041015625, -0.9439697265625, -0.78826904296875, -0.632568359375, -0.47686767578125, -0.3211669921875, -0.16546630859375, -0.009765625, 0.14593505859375, 0.3016357421875, 0.45733642578125, 0.613037109375, 0.76873779296875, 0.9244384765625, 1.08013916015625, 1.23583984375, 1.39154052734375, 1.5472412109375, 1.70294189453125, 1.858642578125, 2.01434326171875, 2.1700439453125, 2.32574462890625, 2.4814453125, 2.63714599609375, 2.7928466796875, 2.94854736328125, 3.104248046875, 3.25994873046875, 3.4156494140625, 3.57135009765625, 3.72705078125, 3.88275146484375, 4.0384521484375, 4.19415283203125, 4.349853515625, 4.50555419921875, 4.6612548828125, 4.81695556640625, 4.97265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 17.0, 25.0, 25.0, 43.0, 72.0, 84.0, 167.0, 222.0, 351.0, 571.0, 829.0, 1403.0, 2175.0, 3327.0, 5270.0, 8255.0, 13209.0, 22526.0, 38718.0, 68479.0, 123478.0, 1290857.0, 235396.0, 119917.0, 66549.0, 37954.0, 21848.0, 12909.0, 8115.0, 5102.0, 3317.0, 2125.0, 1331.0, 902.0, 520.0, 351.0, 223.0, 155.0, 102.0, 64.0, 45.0, 37.0, 17.0, 18.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0279998779296875, -0.992523193359375, -0.9570465087890625, -0.92156982421875, -0.8860931396484375, -0.850616455078125, -0.8151397705078125, -0.7796630859375, -0.7441864013671875, -0.708709716796875, -0.6732330322265625, -0.63775634765625, -0.6022796630859375, -0.566802978515625, -0.5313262939453125, -0.495849609375, -0.4603729248046875, -0.424896240234375, -0.3894195556640625, -0.35394287109375, -0.3184661865234375, -0.282989501953125, -0.2475128173828125, -0.2120361328125, -0.1765594482421875, -0.141082763671875, -0.1056060791015625, -0.07012939453125, -0.0346527099609375, 0.000823974609375, 0.0363006591796875, 0.07177734375, 0.1072540283203125, 0.142730712890625, 0.1782073974609375, 0.21368408203125, 0.2491607666015625, 0.284637451171875, 0.3201141357421875, 0.3555908203125, 0.3910675048828125, 0.426544189453125, 0.4620208740234375, 0.49749755859375, 0.5329742431640625, 0.568450927734375, 0.6039276123046875, 0.639404296875, 0.6748809814453125, 0.710357666015625, 0.7458343505859375, 0.78131103515625, 0.8167877197265625, 0.852264404296875, 0.8877410888671875, 0.9232177734375, 0.9586944580078125, 0.994171142578125, 1.0296478271484375, 1.06512451171875, 1.1006011962890625, 1.136077880859375, 1.1715545654296875, 1.20703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 0.0, 5.0, 4.0, 5.0, 4.0, 10.0, 10.0, 10.0, 18.0, 11.0, 16.0, 25.0, 19.0, 33.0, 36.0, 29.0, 42.0, 49.0, 58.0, 60.0, 49.0, 56.0, 44.0, 46.0, 51.0, 48.0, 45.0, 34.0, 33.0, 23.0, 17.0, 22.0, 16.0, 17.0, 9.0, 13.0, 5.0, 8.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00040340423583984375, -0.00038740038871765137, -0.000371396541595459, -0.0003553926944732666, -0.0003393888473510742, -0.00032338500022888184, -0.00030738115310668945, -0.00029137730598449707, -0.0002753734588623047, -0.0002593696117401123, -0.00024336576461791992, -0.00022736191749572754, -0.00021135807037353516, -0.00019535422325134277, -0.0001793503761291504, -0.000163346529006958, -0.00014734268188476562, -0.00013133883476257324, -0.00011533498764038086, -9.933114051818848e-05, -8.33272933959961e-05, -6.732344627380371e-05, -5.131959915161133e-05, -3.5315752029418945e-05, -1.9311904907226562e-05, -3.3080577850341797e-06, 1.2695789337158203e-05, 2.8699636459350586e-05, 4.470348358154297e-05, 6.070733070373535e-05, 7.671117782592773e-05, 9.271502494812012e-05, 0.0001087188720703125, 0.00012472271919250488, 0.00014072656631469727, 0.00015673041343688965, 0.00017273426055908203, 0.00018873810768127441, 0.0002047419548034668, 0.00022074580192565918, 0.00023674964904785156, 0.00025275349617004395, 0.00026875734329223633, 0.0002847611904144287, 0.0003007650375366211, 0.0003167688846588135, 0.00033277273178100586, 0.00034877657890319824, 0.0003647804260253906, 0.000380784273147583, 0.0003967881202697754, 0.0004127919673919678, 0.00042879581451416016, 0.00044479966163635254, 0.0004608035087585449, 0.0004768073558807373, 0.0004928112030029297, 0.0005088150501251221, 0.0005248188972473145, 0.0005408227443695068, 0.0005568265914916992, 0.0005728304386138916, 0.000588834285736084, 0.0006048381328582764, 0.0006208419799804688]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 7.0, 6.0, 5.0, 19.0, 14.0, 13.0, 27.0, 34.0, 46.0, 56.0, 76.0, 98.0, 146.0, 270.0, 736.0, 43407.0, 1001008.0, 1531.0, 414.0, 197.0, 108.0, 81.0, 59.0, 42.0, 39.0, 29.0, 21.0, 16.0, 11.0, 11.0, 9.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0182037353515625, -0.017739534378051758, -0.017275333404541016, -0.016811132431030273, -0.01634693145751953, -0.01588273048400879, -0.015418529510498047, -0.014954328536987305, -0.014490127563476562, -0.01402592658996582, -0.013561725616455078, -0.013097524642944336, -0.012633323669433594, -0.012169122695922852, -0.01170492172241211, -0.011240720748901367, -0.010776519775390625, -0.010312318801879883, -0.00984811782836914, -0.009383916854858398, -0.008919715881347656, -0.008455514907836914, -0.007991313934326172, -0.00752711296081543, -0.0070629119873046875, -0.006598711013793945, -0.006134510040283203, -0.005670309066772461, -0.005206108093261719, -0.0047419071197509766, -0.004277706146240234, -0.003813505172729492, -0.00334930419921875, -0.002885103225708008, -0.0024209022521972656, -0.0019567012786865234, -0.0014925003051757812, -0.001028299331665039, -0.0005640983581542969, -9.989738464355469e-05, 0.0003643035888671875, 0.0008285045623779297, 0.0012927055358886719, 0.001756906509399414, 0.0022211074829101562, 0.0026853084564208984, 0.0031495094299316406, 0.003613710403442383, 0.004077911376953125, 0.004542112350463867, 0.005006313323974609, 0.0054705142974853516, 0.005934715270996094, 0.006398916244506836, 0.006863117218017578, 0.00732731819152832, 0.0077915191650390625, 0.008255720138549805, 0.008719921112060547, 0.009184122085571289, 0.009648323059082031, 0.010112524032592773, 0.010576725006103516, 0.011040925979614258, 0.011505126953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 16.0, 26.0, 74.0, 132.0, 192.0, 230.0, 164.0, 102.0, 44.0, 17.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005026980652473867, -0.00048484522267244756, -0.0004669924092013389, -0.00044913956662639976, -0.0004312867531552911, -0.00041343391058035195, -0.0003955810680054128, -0.00037772825453430414, -0.00035987544106319547, -0.00034202259848825634, -0.00032416978501714766, -0.00030631694244220853, -0.00028846412897109985, -0.0002706112863961607, -0.0002527584438212216, -0.00023490563035011292, -0.00021705278777517378, -0.00019919995975214988, -0.00018134713172912598, -0.00016349428915418684, -0.00014564147568307817, -0.00012778863310813904, -0.00010993580508511513, -9.208297706209123e-05, -7.423014903906733e-05, -5.6377321016043425e-05, -3.8524489355040714e-05, -2.0671657694038004e-05, -2.8188296710141003e-06, 1.5033998352009803e-05, 3.288683365099132e-05, 5.0739661674015224e-05, 6.859248969703913e-05, 8.644531772006303e-05, 0.00010429814574308693, 0.00012215098831802607, 0.00014000380178913474, 0.00015785664436407387, 0.00017570947238709778, 0.00019356230041012168, 0.00021141512843314558, 0.00022926795645616949, 0.0002471207990311086, 0.0002649736125022173, 0.0002828264550771564, 0.0003006792685482651, 0.00031853211112320423, 0.0003363849245943129, 0.00035423776716925204, 0.00037209060974419117, 0.00038994342321529984, 0.000407796265790239, 0.00042564907926134765, 0.0004435019218362868, 0.00046135473530739546, 0.0004792075778823346, 0.0004970604204572737, 0.0005149132339283824, 0.000532766105607152, 0.0005506189190782607, 0.0005684717325493693, 0.000586324546020478, 0.0006041774176992476, 0.0006220302311703563, 0.000639883044641465]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 12.0, 14.0, 14.0, 26.0, 16.0, 20.0, 32.0, 31.0, 42.0, 23.0, 28.0, 38.0, 41.0, 34.0, 43.0, 50.0, 49.0, 42.0, 35.0, 42.0, 34.0, 31.0, 43.0, 35.0, 27.0, 32.0, 29.0, 21.0, 21.0, 16.0, 14.0, 17.0, 8.0, 8.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00031960010528564453, -0.00031033530831336975, -0.00030107051134109497, -0.0002918057143688202, -0.0002825409173965454, -0.00027327612042427063, -0.00026401132345199585, -0.00025474652647972107, -0.0002454817295074463, -0.0002362169325351715, -0.00022695213556289673, -0.00021768733859062195, -0.00020842254161834717, -0.0001991577446460724, -0.0001898929476737976, -0.00018062815070152283, -0.00017136335372924805, -0.00016209855675697327, -0.00015283375978469849, -0.0001435689628124237, -0.00013430416584014893, -0.00012503936886787415, -0.00011577457189559937, -0.00010650977492332458, -9.72449779510498e-05, -8.798018097877502e-05, -7.871538400650024e-05, -6.945058703422546e-05, -6.0185790061950684e-05, -5.09209930896759e-05, -4.165619611740112e-05, -3.239139914512634e-05, -2.3126602172851562e-05, -1.3861805200576782e-05, -4.597008228302002e-06, 4.667788743972778e-06, 1.3932585716247559e-05, 2.319738268852234e-05, 3.246217966079712e-05, 4.17269766330719e-05, 5.099177360534668e-05, 6.025657057762146e-05, 6.952136754989624e-05, 7.878616452217102e-05, 8.80509614944458e-05, 9.731575846672058e-05, 0.00010658055543899536, 0.00011584535241127014, 0.00012511014938354492, 0.0001343749463558197, 0.00014363974332809448, 0.00015290454030036926, 0.00016216933727264404, 0.00017143413424491882, 0.0001806989312171936, 0.00018996372818946838, 0.00019922852516174316, 0.00020849332213401794, 0.00021775811910629272, 0.0002270229160785675, 0.00023628771305084229, 0.00024555251002311707, 0.00025481730699539185, 0.0002640821039676666, 0.0002733469009399414]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 11.0, 12.0, 15.0, 18.0, 12.0, 23.0, 28.0, 19.0, 28.0, 27.0, 36.0, 35.0, 44.0, 33.0, 47.0, 46.0, 50.0, 33.0, 39.0, 39.0, 37.0, 33.0, 28.0, 36.0, 39.0, 26.0, 26.0, 26.0, 23.0, 24.0, 14.0, 19.0, 10.0, 10.0, 15.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3212890625, -6.099609375, -5.8779296875, -5.65625, -5.4345703125, -5.212890625, -4.9912109375, -4.76953125, -4.5478515625, -4.326171875, -4.1044921875, -3.8828125, -3.6611328125, -3.439453125, -3.2177734375, -2.99609375, -2.7744140625, -2.552734375, -2.3310546875, -2.109375, -1.8876953125, -1.666015625, -1.4443359375, -1.22265625, -1.0009765625, -0.779296875, -0.5576171875, -0.3359375, -0.1142578125, 0.107421875, 0.3291015625, 0.55078125, 0.7724609375, 0.994140625, 1.2158203125, 1.4375, 1.6591796875, 1.880859375, 2.1025390625, 2.32421875, 2.5458984375, 2.767578125, 2.9892578125, 3.2109375, 3.4326171875, 3.654296875, 3.8759765625, 4.09765625, 4.3193359375, 4.541015625, 4.7626953125, 4.984375, 5.2060546875, 5.427734375, 5.6494140625, 5.87109375, 6.0927734375, 6.314453125, 6.5361328125, 6.7578125, 6.9794921875, 7.201171875, 7.4228515625, 7.64453125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 9.0, 6.0, 17.0, 23.0, 21.0, 28.0, 28.0, 50.0, 62.0, 84.0, 101.0, 170.0, 216.0, 370.0, 573.0, 1073.0, 3416.0, 25175.0, 364112.0, 609130.0, 36368.0, 4442.0, 1187.0, 633.0, 373.0, 257.0, 155.0, 107.0, 88.0, 64.0, 58.0, 31.0, 22.0, 28.0, 10.0, 19.0, 16.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.1070556640625, -11.690673828125, -11.2742919921875, -10.85791015625, -10.4415283203125, -10.025146484375, -9.6087646484375, -9.1923828125, -8.7760009765625, -8.359619140625, -7.9432373046875, -7.52685546875, -7.1104736328125, -6.694091796875, -6.2777099609375, -5.861328125, -5.4449462890625, -5.028564453125, -4.6121826171875, -4.19580078125, -3.7794189453125, -3.363037109375, -2.9466552734375, -2.5302734375, -2.1138916015625, -1.697509765625, -1.2811279296875, -0.86474609375, -0.4483642578125, -0.031982421875, 0.3843994140625, 0.80078125, 1.2171630859375, 1.633544921875, 2.0499267578125, 2.46630859375, 2.8826904296875, 3.299072265625, 3.7154541015625, 4.1318359375, 4.5482177734375, 4.964599609375, 5.3809814453125, 5.79736328125, 6.2137451171875, 6.630126953125, 7.0465087890625, 7.462890625, 7.8792724609375, 8.295654296875, 8.7120361328125, 9.12841796875, 9.5447998046875, 9.961181640625, 10.3775634765625, 10.7939453125, 11.2103271484375, 11.626708984375, 12.0430908203125, 12.45947265625, 12.8758544921875, 13.292236328125, 13.7086181640625, 14.125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 7.0, 3.0, 10.0, 7.0, 8.0, 9.0, 18.0, 15.0, 10.0, 21.0, 34.0, 23.0, 24.0, 38.0, 41.0, 49.0, 37.0, 58.0, 70.0, 175.0, 1748.0, 157.0, 60.0, 42.0, 49.0, 35.0, 41.0, 43.0, 24.0, 16.0, 29.0, 30.0, 22.0, 13.0, 13.0, 9.0, 10.0, 11.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-22.28125, -21.615234375, -20.94921875, -20.283203125, -19.6171875, -18.951171875, -18.28515625, -17.619140625, -16.953125, -16.287109375, -15.62109375, -14.955078125, -14.2890625, -13.623046875, -12.95703125, -12.291015625, -11.625, -10.958984375, -10.29296875, -9.626953125, -8.9609375, -8.294921875, -7.62890625, -6.962890625, -6.296875, -5.630859375, -4.96484375, -4.298828125, -3.6328125, -2.966796875, -2.30078125, -1.634765625, -0.96875, -0.302734375, 0.36328125, 1.029296875, 1.6953125, 2.361328125, 3.02734375, 3.693359375, 4.359375, 5.025390625, 5.69140625, 6.357421875, 7.0234375, 7.689453125, 8.35546875, 9.021484375, 9.6875, 10.353515625, 11.01953125, 11.685546875, 12.3515625, 13.017578125, 13.68359375, 14.349609375, 15.015625, 15.681640625, 16.34765625, 17.013671875, 17.6796875, 18.345703125, 19.01171875, 19.677734375, 20.34375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 1.0, 3.0, 4.0, 8.0, 5.0, 9.0, 14.0, 14.0, 12.0, 11.0, 17.0, 29.0, 40.0, 26.0, 37.0, 41.0, 71.0, 79.0, 120.0, 186.0, 359.0, 863.0, 14169.0, 3122304.0, 5640.0, 678.0, 293.0, 171.0, 121.0, 74.0, 62.0, 47.0, 31.0, 35.0, 21.0, 19.0, 13.0, 16.0, 11.0, 10.0, 11.0, 8.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-61.375, -59.3564453125, -57.337890625, -55.3193359375, -53.30078125, -51.2822265625, -49.263671875, -47.2451171875, -45.2265625, -43.2080078125, -41.189453125, -39.1708984375, -37.15234375, -35.1337890625, -33.115234375, -31.0966796875, -29.078125, -27.0595703125, -25.041015625, -23.0224609375, -21.00390625, -18.9853515625, -16.966796875, -14.9482421875, -12.9296875, -10.9111328125, -8.892578125, -6.8740234375, -4.85546875, -2.8369140625, -0.818359375, 1.2001953125, 3.21875, 5.2373046875, 7.255859375, 9.2744140625, 11.29296875, 13.3115234375, 15.330078125, 17.3486328125, 19.3671875, 21.3857421875, 23.404296875, 25.4228515625, 27.44140625, 29.4599609375, 31.478515625, 33.4970703125, 35.515625, 37.5341796875, 39.552734375, 41.5712890625, 43.58984375, 45.6083984375, 47.626953125, 49.6455078125, 51.6640625, 53.6826171875, 55.701171875, 57.7197265625, 59.73828125, 61.7568359375, 63.775390625, 65.7939453125, 67.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 18.0, 22.0, 37.0, 63.0, 90.0, 118.0, 123.0, 129.0, 132.0, 99.0, 76.0, 49.0, 27.0, 14.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-26.973709106445312, -26.45728874206543, -25.940868377685547, -25.424448013305664, -24.90802764892578, -24.391605377197266, -23.875186920166016, -23.3587646484375, -22.842344284057617, -22.325923919677734, -21.80950355529785, -21.29308319091797, -20.776662826538086, -20.260242462158203, -19.743820190429688, -19.227399826049805, -18.710979461669922, -18.19455909729004, -17.678138732910156, -17.161718368530273, -16.64529800415039, -16.128875732421875, -15.612456321716309, -15.096035957336426, -14.57961654663086, -14.063196182250977, -13.546775817871094, -13.030355453491211, -12.513934135437012, -11.997513771057129, -11.481093406677246, -10.964673042297363, -10.448253631591797, -9.931833267211914, -9.415412902832031, -8.898992538452148, -8.38257122039795, -7.866150856018066, -7.349730491638184, -6.833310127258301, -6.316888809204102, -5.800468444824219, -5.284047603607178, -4.767627239227295, -4.251206398010254, -3.734786033630371, -3.2183656692504883, -2.7019450664520264, -2.1855244636535645, -1.6691038608551025, -1.1526833772659302, -0.6362628936767578, -0.1198422908782959, 0.396578311920166, 0.9129986763000488, 1.4294192790985107, 1.9458398818969727, 2.4622604846954346, 2.9786810874938965, 3.4951014518737793, 4.01152229309082, 4.527942657470703, 5.044363021850586, 5.560783386230469, 6.07720422744751]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 9.0, 7.0, 9.0, 8.0, 9.0, 10.0, 21.0, 11.0, 19.0, 19.0, 25.0, 22.0, 36.0, 31.0, 27.0, 31.0, 31.0, 32.0, 33.0, 40.0, 31.0, 39.0, 38.0, 38.0, 38.0, 36.0, 28.0, 32.0, 29.0, 27.0, 27.0, 27.0, 20.0, 22.0, 18.0, 23.0, 20.0, 13.0, 10.0, 7.0, 6.0, 7.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-58.09512710571289, -56.42301559448242, -54.75090789794922, -53.07879638671875, -51.40668487548828, -49.73457717895508, -48.06246566772461, -46.390357971191406, -44.71824645996094, -43.04613494873047, -41.374027252197266, -39.7019157409668, -38.029808044433594, -36.357696533203125, -34.685585021972656, -33.01347351074219, -31.341365814208984, -29.66925621032715, -27.997146606445312, -26.325035095214844, -24.652925491333008, -22.980815887451172, -21.308704376220703, -19.636594772338867, -17.96448516845703, -16.292375564575195, -14.620265007019043, -12.94815444946289, -11.276044845581055, -9.603935241699219, -7.931824684143066, -6.259714126586914, -4.587608337402344, -2.9154982566833496, -1.2433881759643555, 0.42872190475463867, 2.100831985473633, 3.7729415893554688, 5.445052146911621, 7.117162704467773, 8.78927230834961, 10.461381912231445, 12.133492469787598, 13.80560302734375, 15.477712631225586, 17.149822235107422, 18.82193374633789, 20.494043350219727, 22.166152954101562, 23.8382625579834, 25.510372161865234, 27.182483673095703, 28.85459327697754, 30.526702880859375, 32.198814392089844, 33.87092590332031, 35.543033599853516, 37.215145111083984, 38.88725280761719, 40.559364318847656, 42.231475830078125, 43.90358352661133, 45.5756950378418, 47.247802734375, 48.91991424560547]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 7.0, 8.0, 15.0, 12.0, 11.0, 26.0, 25.0, 29.0, 19.0, 28.0, 33.0, 29.0, 41.0, 37.0, 47.0, 43.0, 43.0, 53.0, 49.0, 33.0, 37.0, 38.0, 42.0, 29.0, 37.0, 26.0, 27.0, 27.0, 35.0, 20.0, 12.0, 19.0, 16.0, 11.0, 8.0, 8.0, 4.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5859375, -7.341552734375, -7.09716796875, -6.852783203125, -6.6083984375, -6.364013671875, -6.11962890625, -5.875244140625, -5.630859375, -5.386474609375, -5.14208984375, -4.897705078125, -4.6533203125, -4.408935546875, -4.16455078125, -3.920166015625, -3.67578125, -3.431396484375, -3.18701171875, -2.942626953125, -2.6982421875, -2.453857421875, -2.20947265625, -1.965087890625, -1.720703125, -1.476318359375, -1.23193359375, -0.987548828125, -0.7431640625, -0.498779296875, -0.25439453125, -0.010009765625, 0.234375, 0.478759765625, 0.72314453125, 0.967529296875, 1.2119140625, 1.456298828125, 1.70068359375, 1.945068359375, 2.189453125, 2.433837890625, 2.67822265625, 2.922607421875, 3.1669921875, 3.411376953125, 3.65576171875, 3.900146484375, 4.14453125, 4.388916015625, 4.63330078125, 4.877685546875, 5.1220703125, 5.366455078125, 5.61083984375, 5.855224609375, 6.099609375, 6.343994140625, 6.58837890625, 6.832763671875, 7.0771484375, 7.321533203125, 7.56591796875, 7.810302734375, 8.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 17.0, 15.0, 22.0, 24.0, 32.0, 57.0, 68.0, 103.0, 139.0, 246.0, 441.0, 781.0, 1879.0, 5200.0, 18019.0, 81141.0, 416757.0, 1360626.0, 1578434.0, 578609.0, 115101.0, 24645.0, 7009.0, 2524.0, 1030.0, 500.0, 256.0, 159.0, 132.0, 72.0, 61.0, 38.0, 46.0, 21.0, 19.0, 11.0, 8.0, 14.0, 2.0, 5.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.53125, -10.2396240234375, -9.947998046875, -9.6563720703125, -9.36474609375, -9.0731201171875, -8.781494140625, -8.4898681640625, -8.1982421875, -7.9066162109375, -7.614990234375, -7.3233642578125, -7.03173828125, -6.7401123046875, -6.448486328125, -6.1568603515625, -5.865234375, -5.5736083984375, -5.281982421875, -4.9903564453125, -4.69873046875, -4.4071044921875, -4.115478515625, -3.8238525390625, -3.5322265625, -3.2406005859375, -2.948974609375, -2.6573486328125, -2.36572265625, -2.0740966796875, -1.782470703125, -1.4908447265625, -1.19921875, -0.9075927734375, -0.615966796875, -0.3243408203125, -0.03271484375, 0.2589111328125, 0.550537109375, 0.8421630859375, 1.1337890625, 1.4254150390625, 1.717041015625, 2.0086669921875, 2.30029296875, 2.5919189453125, 2.883544921875, 3.1751708984375, 3.466796875, 3.7584228515625, 4.050048828125, 4.3416748046875, 4.63330078125, 4.9249267578125, 5.216552734375, 5.5081787109375, 5.7998046875, 6.0914306640625, 6.383056640625, 6.6746826171875, 6.96630859375, 7.2579345703125, 7.549560546875, 7.8411865234375, 8.1328125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 5.0, 5.0, 5.0, 12.0, 5.0, 4.0, 18.0, 27.0, 29.0, 39.0, 42.0, 45.0, 62.0, 78.0, 93.0, 133.0, 140.0, 206.0, 234.0, 297.0, 304.0, 372.0, 352.0, 298.0, 254.0, 188.0, 175.0, 124.0, 106.0, 84.0, 74.0, 61.0, 41.0, 38.0, 32.0, 24.0, 15.0, 15.0, 10.0, 9.0, 10.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.390625, -12.0433349609375, -11.696044921875, -11.3487548828125, -11.00146484375, -10.6541748046875, -10.306884765625, -9.9595947265625, -9.6123046875, -9.2650146484375, -8.917724609375, -8.5704345703125, -8.22314453125, -7.8758544921875, -7.528564453125, -7.1812744140625, -6.833984375, -6.4866943359375, -6.139404296875, -5.7921142578125, -5.44482421875, -5.0975341796875, -4.750244140625, -4.4029541015625, -4.0556640625, -3.7083740234375, -3.361083984375, -3.0137939453125, -2.66650390625, -2.3192138671875, -1.971923828125, -1.6246337890625, -1.27734375, -0.9300537109375, -0.582763671875, -0.2354736328125, 0.11181640625, 0.4591064453125, 0.806396484375, 1.1536865234375, 1.5009765625, 1.8482666015625, 2.195556640625, 2.5428466796875, 2.89013671875, 3.2374267578125, 3.584716796875, 3.9320068359375, 4.279296875, 4.6265869140625, 4.973876953125, 5.3211669921875, 5.66845703125, 6.0157470703125, 6.363037109375, 6.7103271484375, 7.0576171875, 7.4049072265625, 7.752197265625, 8.0994873046875, 8.44677734375, 8.7940673828125, 9.141357421875, 9.4886474609375, 9.8359375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 7.0, 7.0, 13.0, 14.0, 22.0, 29.0, 26.0, 46.0, 60.0, 86.0, 87.0, 108.0, 138.0, 188.0, 218.0, 280.0, 404.0, 700.0, 2289.0, 155133.0, 4018232.0, 12902.0, 1253.0, 500.0, 344.0, 228.0, 181.0, 154.0, 135.0, 100.0, 87.0, 63.0, 54.0, 45.0, 35.0, 33.0, 15.0, 15.0, 21.0, 9.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.5625, -62.68017578125, -60.7978515625, -58.91552734375, -57.033203125, -55.15087890625, -53.2685546875, -51.38623046875, -49.50390625, -47.62158203125, -45.7392578125, -43.85693359375, -41.974609375, -40.09228515625, -38.2099609375, -36.32763671875, -34.4453125, -32.56298828125, -30.6806640625, -28.79833984375, -26.916015625, -25.03369140625, -23.1513671875, -21.26904296875, -19.38671875, -17.50439453125, -15.6220703125, -13.73974609375, -11.857421875, -9.97509765625, -8.0927734375, -6.21044921875, -4.328125, -2.44580078125, -0.5634765625, 1.31884765625, 3.201171875, 5.08349609375, 6.9658203125, 8.84814453125, 10.73046875, 12.61279296875, 14.4951171875, 16.37744140625, 18.259765625, 20.14208984375, 22.0244140625, 23.90673828125, 25.7890625, 27.67138671875, 29.5537109375, 31.43603515625, 33.318359375, 35.20068359375, 37.0830078125, 38.96533203125, 40.84765625, 42.72998046875, 44.6123046875, 46.49462890625, 48.376953125, 50.25927734375, 52.1416015625, 54.02392578125, 55.90625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 55.0, 113.0, 245.0, 274.0, 191.0, 87.0, 30.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.8114242553711, -97.7901382446289, -94.76885986328125, -91.74757385253906, -88.72628784179688, -85.70500183105469, -82.68372344970703, -79.66243743896484, -76.64115142822266, -73.61986541748047, -70.59858703613281, -67.57730102539062, -64.55601501464844, -61.534732818603516, -58.513450622558594, -55.492164611816406, -52.470882415771484, -49.44960021972656, -46.428314208984375, -43.40703201293945, -40.385746002197266, -37.364463806152344, -34.343177795410156, -31.321895599365234, -28.30061149597168, -25.279327392578125, -22.25804328918457, -19.236759185791016, -16.215476989746094, -13.194191932678223, -10.172908782958984, -7.15162467956543, -4.130340576171875, -1.1090567111968994, 1.9122271537780762, 4.933510780334473, 7.954794883728027, 10.976078987121582, 13.99736213684082, 17.018646240234375, 20.03993034362793, 23.061214447021484, 26.08249855041504, 29.103782653808594, 32.125064849853516, 35.1463508605957, 38.167633056640625, 41.18891906738281, 44.210201263427734, 47.231483459472656, 50.252769470214844, 53.274051666259766, 56.29533767700195, 59.316619873046875, 62.33790588378906, 65.35919189453125, 68.3804702758789, 71.4017562866211, 74.42303466796875, 77.44432067871094, 80.46560668945312, 83.48689270019531, 86.50817108154297, 89.52945709228516, 92.55074310302734]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 9.0, 9.0, 19.0, 10.0, 23.0, 13.0, 19.0, 21.0, 23.0, 27.0, 30.0, 30.0, 35.0, 31.0, 36.0, 36.0, 42.0, 41.0, 40.0, 42.0, 40.0, 35.0, 34.0, 36.0, 30.0, 23.0, 21.0, 34.0, 14.0, 24.0, 27.0, 19.0, 16.0, 17.0, 9.0, 6.0, 15.0, 10.0, 6.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-42.974578857421875, -41.634178161621094, -40.29378128051758, -38.95338439941406, -37.61298370361328, -36.2725830078125, -34.932186126708984, -33.59178924560547, -32.25138854980469, -30.91098976135254, -29.57059097290039, -28.230192184448242, -26.889793395996094, -25.549394607543945, -24.208995819091797, -22.86859703063965, -21.5281982421875, -20.18779945373535, -18.847400665283203, -17.507001876831055, -16.166603088378906, -14.826204299926758, -13.48580551147461, -12.145406723022461, -10.805007934570312, -9.464609146118164, -8.124210357666016, -6.783811569213867, -5.443412780761719, -4.10301399230957, -2.762615203857422, -1.4222164154052734, -0.081817626953125, 1.2585811614990234, 2.598979949951172, 3.9393787384033203, 5.279777526855469, 6.620176315307617, 7.960575103759766, 9.300973892211914, 10.641372680664062, 11.981771469116211, 13.32217025756836, 14.662569046020508, 16.002967834472656, 17.343366622924805, 18.683765411376953, 20.0241641998291, 21.36456298828125, 22.7049617767334, 24.045360565185547, 25.385759353637695, 26.726158142089844, 28.066556930541992, 29.40695571899414, 30.74735450744629, 32.08775329589844, 33.42815399169922, 34.768550872802734, 36.10894775390625, 37.44934844970703, 38.78974914550781, 40.13014602661133, 41.470542907714844, 42.810943603515625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 10.0, 11.0, 17.0, 13.0, 16.0, 15.0, 18.0, 19.0, 29.0, 26.0, 38.0, 29.0, 24.0, 37.0, 31.0, 28.0, 41.0, 38.0, 47.0, 35.0, 46.0, 33.0, 35.0, 27.0, 29.0, 26.0, 28.0, 21.0, 34.0, 18.0, 30.0, 12.0, 25.0, 13.0, 10.0, 11.0, 11.0, 14.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.50262451171875, -5.3021240234375, -5.10162353515625, -4.901123046875, -4.70062255859375, -4.5001220703125, -4.29962158203125, -4.09912109375, -3.89862060546875, -3.6981201171875, -3.49761962890625, -3.297119140625, -3.09661865234375, -2.8961181640625, -2.69561767578125, -2.4951171875, -2.29461669921875, -2.0941162109375, -1.89361572265625, -1.693115234375, -1.49261474609375, -1.2921142578125, -1.09161376953125, -0.89111328125, -0.69061279296875, -0.4901123046875, -0.28961181640625, -0.089111328125, 0.11138916015625, 0.3118896484375, 0.51239013671875, 0.712890625, 0.91339111328125, 1.1138916015625, 1.31439208984375, 1.514892578125, 1.71539306640625, 1.9158935546875, 2.11639404296875, 2.31689453125, 2.51739501953125, 2.7178955078125, 2.91839599609375, 3.118896484375, 3.31939697265625, 3.5198974609375, 3.72039794921875, 3.9208984375, 4.12139892578125, 4.3218994140625, 4.52239990234375, 4.722900390625, 4.92340087890625, 5.1239013671875, 5.32440185546875, 5.52490234375, 5.72540283203125, 5.9259033203125, 6.12640380859375, 6.326904296875, 6.52740478515625, 6.7279052734375, 6.92840576171875, 7.12890625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 14.0, 11.0, 19.0, 21.0, 38.0, 50.0, 91.0, 96.0, 179.0, 260.0, 397.0, 595.0, 921.0, 1399.0, 2105.0, 3267.0, 5011.0, 7685.0, 11946.0, 18854.0, 30442.0, 49725.0, 83379.0, 140386.0, 236192.0, 181602.0, 106525.0, 63446.0, 38736.0, 23339.0, 14738.0, 9397.0, 5954.0, 4087.0, 2549.0, 1739.0, 1120.0, 776.0, 476.0, 316.0, 214.0, 155.0, 105.0, 61.0, 55.0, 25.0, 25.0, 15.0, 11.0, 6.0, 6.0, 1.0, 2.0, 3.0], "bins": [-1.177734375, -1.143829345703125, -1.10992431640625, -1.076019287109375, -1.0421142578125, -1.008209228515625, -0.97430419921875, -0.940399169921875, -0.906494140625, -0.872589111328125, -0.83868408203125, -0.804779052734375, -0.7708740234375, -0.736968994140625, -0.70306396484375, -0.669158935546875, -0.63525390625, -0.601348876953125, -0.56744384765625, -0.533538818359375, -0.4996337890625, -0.465728759765625, -0.43182373046875, -0.397918701171875, -0.364013671875, -0.330108642578125, -0.29620361328125, -0.262298583984375, -0.2283935546875, -0.194488525390625, -0.16058349609375, -0.126678466796875, -0.0927734375, -0.058868408203125, -0.02496337890625, 0.008941650390625, 0.0428466796875, 0.076751708984375, 0.11065673828125, 0.144561767578125, 0.178466796875, 0.212371826171875, 0.24627685546875, 0.280181884765625, 0.3140869140625, 0.347991943359375, 0.38189697265625, 0.415802001953125, 0.44970703125, 0.483612060546875, 0.51751708984375, 0.551422119140625, 0.5853271484375, 0.619232177734375, 0.65313720703125, 0.687042236328125, 0.720947265625, 0.754852294921875, 0.78875732421875, 0.822662353515625, 0.8565673828125, 0.890472412109375, 0.92437744140625, 0.958282470703125, 0.9921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 4.0, 10.0, 12.0, 14.0, 10.0, 12.0, 17.0, 20.0, 22.0, 17.0, 33.0, 26.0, 28.0, 28.0, 20.0, 34.0, 27.0, 31.0, 35.0, 32.0, 1058.0, 34.0, 43.0, 34.0, 47.0, 37.0, 39.0, 26.0, 26.0, 23.0, 29.0, 27.0, 25.0, 20.0, 20.0, 15.0, 18.0, 13.0, 10.0, 8.0, 3.0, 7.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.2265625, -4.101776123046875, -3.97698974609375, -3.852203369140625, -3.7274169921875, -3.602630615234375, -3.47784423828125, -3.353057861328125, -3.228271484375, -3.103485107421875, -2.97869873046875, -2.853912353515625, -2.7291259765625, -2.604339599609375, -2.47955322265625, -2.354766845703125, -2.22998046875, -2.105194091796875, -1.98040771484375, -1.855621337890625, -1.7308349609375, -1.606048583984375, -1.48126220703125, -1.356475830078125, -1.231689453125, -1.106903076171875, -0.98211669921875, -0.857330322265625, -0.7325439453125, -0.607757568359375, -0.48297119140625, -0.358184814453125, -0.2333984375, -0.108612060546875, 0.01617431640625, 0.140960693359375, 0.2657470703125, 0.390533447265625, 0.51531982421875, 0.640106201171875, 0.764892578125, 0.889678955078125, 1.01446533203125, 1.139251708984375, 1.2640380859375, 1.388824462890625, 1.51361083984375, 1.638397216796875, 1.76318359375, 1.887969970703125, 2.01275634765625, 2.137542724609375, 2.2623291015625, 2.387115478515625, 2.51190185546875, 2.636688232421875, 2.761474609375, 2.886260986328125, 3.01104736328125, 3.135833740234375, 3.2606201171875, 3.385406494140625, 3.51019287109375, 3.634979248046875, 3.759765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 8.0, 22.0, 37.0, 48.0, 64.0, 110.0, 152.0, 225.0, 346.0, 506.0, 697.0, 1035.0, 1610.0, 2275.0, 3166.0, 4654.0, 6856.0, 10163.0, 14832.0, 21779.0, 33249.0, 50151.0, 77952.0, 127717.0, 1267885.0, 176097.0, 102730.0, 64591.0, 42067.0, 27772.0, 18826.0, 12480.0, 8484.0, 5906.0, 3951.0, 2748.0, 1874.0, 1280.0, 904.0, 621.0, 390.0, 320.0, 178.0, 117.0, 80.0, 59.0, 39.0, 23.0, 15.0, 14.0, 9.0, 8.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.923828125, -0.8956527709960938, -0.8674774169921875, -0.8393020629882812, -0.811126708984375, -0.7829513549804688, -0.7547760009765625, -0.7266006469726562, -0.69842529296875, -0.6702499389648438, -0.6420745849609375, -0.6138992309570312, -0.585723876953125, -0.5575485229492188, -0.5293731689453125, -0.5011978149414062, -0.4730224609375, -0.44484710693359375, -0.4166717529296875, -0.38849639892578125, -0.360321044921875, -0.33214569091796875, -0.3039703369140625, -0.27579498291015625, -0.24761962890625, -0.21944427490234375, -0.1912689208984375, -0.16309356689453125, -0.134918212890625, -0.10674285888671875, -0.0785675048828125, -0.05039215087890625, -0.022216796875, 0.00595855712890625, 0.0341339111328125, 0.06230926513671875, 0.090484619140625, 0.11865997314453125, 0.1468353271484375, 0.17501068115234375, 0.20318603515625, 0.23136138916015625, 0.2595367431640625, 0.28771209716796875, 0.315887451171875, 0.34406280517578125, 0.3722381591796875, 0.40041351318359375, 0.4285888671875, 0.45676422119140625, 0.4849395751953125, 0.5131149291992188, 0.541290283203125, 0.5694656372070312, 0.5976409912109375, 0.6258163452148438, 0.65399169921875, 0.6821670532226562, 0.7103424072265625, 0.7385177612304688, 0.766693115234375, 0.7948684692382812, 0.8230438232421875, 0.8512191772460938, 0.87939453125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 10.0, 11.0, 19.0, 21.0, 28.0, 26.0, 30.0, 24.0, 45.0, 53.0, 52.0, 44.0, 64.0, 51.0, 53.0, 39.0, 55.0, 48.0, 44.0, 28.0, 27.0, 28.0, 36.0, 24.0, 23.0, 14.0, 13.0, 13.0, 9.0, 9.0, 5.0, 8.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004916191101074219, -0.00047466158866882324, -0.0004577040672302246, -0.000440746545791626, -0.00042378902435302734, -0.0004068315029144287, -0.0003898739814758301, -0.00037291646003723145, -0.0003559589385986328, -0.0003390014171600342, -0.00032204389572143555, -0.0003050863742828369, -0.0002881288528442383, -0.00027117133140563965, -0.000254213809967041, -0.00023725628852844238, -0.00022029876708984375, -0.00020334124565124512, -0.00018638372421264648, -0.00016942620277404785, -0.00015246868133544922, -0.00013551115989685059, -0.00011855363845825195, -0.00010159611701965332, -8.463859558105469e-05, -6.768107414245605e-05, -5.072355270385742e-05, -3.376603126525879e-05, -1.6808509826660156e-05, 1.4901161193847656e-07, 1.710653305053711e-05, 3.406405448913574e-05, 5.1021575927734375e-05, 6.797909736633301e-05, 8.493661880493164e-05, 0.00010189414024353027, 0.0001188516616821289, 0.00013580918312072754, 0.00015276670455932617, 0.0001697242259979248, 0.00018668174743652344, 0.00020363926887512207, 0.0002205967903137207, 0.00023755431175231934, 0.00025451183319091797, 0.0002714693546295166, 0.00028842687606811523, 0.00030538439750671387, 0.0003223419189453125, 0.00033929944038391113, 0.00035625696182250977, 0.0003732144832611084, 0.00039017200469970703, 0.00040712952613830566, 0.0004240870475769043, 0.00044104456901550293, 0.00045800209045410156, 0.0004749596118927002, 0.0004919171333312988, 0.0005088746547698975, 0.0005258321762084961, 0.0005427896976470947, 0.0005597472190856934, 0.000576704740524292, 0.0005936622619628906]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 9.0, 8.0, 7.0, 16.0, 8.0, 23.0, 14.0, 25.0, 27.0, 38.0, 40.0, 57.0, 68.0, 95.0, 142.0, 245.0, 496.0, 1596.0, 903343.0, 140159.0, 1022.0, 412.0, 167.0, 125.0, 84.0, 59.0, 45.0, 41.0, 35.0, 27.0, 22.0, 17.0, 13.0, 15.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01318359375, -0.012794256210327148, -0.012404918670654297, -0.012015581130981445, -0.011626243591308594, -0.011236906051635742, -0.01084756851196289, -0.010458230972290039, -0.010068893432617188, -0.009679555892944336, -0.009290218353271484, -0.008900880813598633, -0.008511543273925781, -0.00812220573425293, -0.007732868194580078, -0.0073435306549072266, -0.006954193115234375, -0.0065648555755615234, -0.006175518035888672, -0.00578618049621582, -0.005396842956542969, -0.005007505416870117, -0.004618167877197266, -0.004228830337524414, -0.0038394927978515625, -0.003450155258178711, -0.0030608177185058594, -0.002671480178833008, -0.0022821426391601562, -0.0018928050994873047, -0.0015034675598144531, -0.0011141300201416016, -0.00072479248046875, -0.00033545494079589844, 5.3882598876953125e-05, 0.0004432201385498047, 0.0008325576782226562, 0.0012218952178955078, 0.0016112327575683594, 0.002000570297241211, 0.0023899078369140625, 0.002779245376586914, 0.0031685829162597656, 0.003557920455932617, 0.003947257995605469, 0.00433659553527832, 0.004725933074951172, 0.0051152706146240234, 0.005504608154296875, 0.0058939456939697266, 0.006283283233642578, 0.00667262077331543, 0.007061958312988281, 0.007451295852661133, 0.007840633392333984, 0.008229970932006836, 0.008619308471679688, 0.009008646011352539, 0.00939798355102539, 0.009787321090698242, 0.010176658630371094, 0.010565996170043945, 0.010955333709716797, 0.011344671249389648, 0.0117340087890625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 75.0, 728.0, 208.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004281291738152504, -0.004202988464385271, -0.004124685190618038, -0.004046381916850805, -0.003968078643083572, -0.003889775602146983, -0.003811472561210394, -0.003733169287443161, -0.003654866013675928, -0.0035765627399086952, -0.0034982594661414623, -0.003419956425204873, -0.00334165315143764, -0.0032633498776704073, -0.003185046836733818, -0.003106743562966585, -0.0030284402891993523, -0.0029501370154321194, -0.0028718337416648865, -0.0027935307007282972, -0.0027152274269610643, -0.0026369241531938314, -0.002558621112257242, -0.0024803178384900093, -0.0024020145647227764, -0.0023237112909555435, -0.0022454080171883106, -0.0021671049762517214, -0.0020888017024844885, -0.0020104984287172556, -0.0019321952713653445, -0.0018538921140134335, -0.0017755888402462006, -0.0016972855664789677, -0.0016189824091270566, -0.0015406792517751455, -0.0014623759780079126, -0.0013840727042406797, -0.0013057695468887687, -0.0012274663895368576, -0.0011491631157696247, -0.0010708598420023918, -0.0009925566846504807, -0.0009142534690909088, -0.0008359502535313368, -0.0007576470379717648, -0.0006793438224121928, -0.0006010406068526208, -0.0005227374495007098, -0.0004444342339411378, -0.0003661310183815658, -0.00028782780282199383, -0.00020952458726242185, -0.00013122137170284986, -5.2918156143277884e-05, 2.5385059416294098e-05, 0.00010368827497586608, 0.00018199149053543806, 0.00026029470609501004, 0.000338597921654582, 0.000416901137214154, 0.000495204352773726, 0.000573507568333298, 0.00065181078389287, 0.0007301139994524419]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 4.0, 4.0, 9.0, 13.0, 19.0, 14.0, 16.0, 20.0, 20.0, 27.0, 32.0, 32.0, 33.0, 39.0, 28.0, 34.0, 38.0, 38.0, 50.0, 27.0, 42.0, 41.0, 24.0, 33.0, 45.0, 41.0, 32.0, 36.0, 36.0, 28.0, 16.0, 16.0, 15.0, 15.0, 13.0, 6.0, 14.0, 16.0, 12.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026291608810424805, -0.000253492034971714, -0.00024406798183918, -0.00023464392870664597, -0.00022521987557411194, -0.0002157958224415779, -0.00020637176930904388, -0.00019694771617650986, -0.00018752366304397583, -0.0001780996099114418, -0.00016867555677890778, -0.00015925150364637375, -0.00014982745051383972, -0.0001404033973813057, -0.00013097934424877167, -0.00012155529111623764, -0.00011213123798370361, -0.00010270718485116959, -9.328313171863556e-05, -8.385907858610153e-05, -7.44350254535675e-05, -6.501097232103348e-05, -5.558691918849945e-05, -4.6162866055965424e-05, -3.6738812923431396e-05, -2.731475979089737e-05, -1.7890706658363342e-05, -8.466653525829315e-06, 9.57399606704712e-07, 1.0381452739238739e-05, 1.9805505871772766e-05, 2.9229559004306793e-05, 3.865361213684082e-05, 4.807766526937485e-05, 5.7501718401908875e-05, 6.69257715344429e-05, 7.634982466697693e-05, 8.577387779951096e-05, 9.519793093204498e-05, 0.00010462198406457901, 0.00011404603719711304, 0.00012347009032964706, 0.0001328941434621811, 0.00014231819659471512, 0.00015174224972724915, 0.00016116630285978317, 0.0001705903559923172, 0.00018001440912485123, 0.00018943846225738525, 0.00019886251538991928, 0.0002082865685224533, 0.00021771062165498734, 0.00022713467478752136, 0.0002365587279200554, 0.0002459827810525894, 0.00025540683418512344, 0.00026483088731765747, 0.0002742549404501915, 0.0002836789935827255, 0.00029310304671525955, 0.0003025270998477936, 0.0003119511529803276, 0.00032137520611286163, 0.00033079925924539566, 0.0003402233123779297]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 10.0, 11.0, 17.0, 13.0, 16.0, 15.0, 18.0, 19.0, 29.0, 26.0, 39.0, 28.0, 24.0, 37.0, 31.0, 28.0, 41.0, 38.0, 47.0, 35.0, 46.0, 33.0, 35.0, 27.0, 29.0, 26.0, 28.0, 21.0, 34.0, 18.0, 30.0, 12.0, 25.0, 13.0, 10.0, 11.0, 11.0, 14.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.50262451171875, -5.3021240234375, -5.10162353515625, -4.901123046875, -4.70062255859375, -4.5001220703125, -4.29962158203125, -4.09912109375, -3.89862060546875, -3.6981201171875, -3.49761962890625, -3.297119140625, -3.09661865234375, -2.8961181640625, -2.69561767578125, -2.4951171875, -2.29461669921875, -2.0941162109375, -1.89361572265625, -1.693115234375, -1.49261474609375, -1.2921142578125, -1.09161376953125, -0.89111328125, -0.69061279296875, -0.4901123046875, -0.28961181640625, -0.089111328125, 0.11138916015625, 0.3118896484375, 0.51239013671875, 0.712890625, 0.91339111328125, 1.1138916015625, 1.31439208984375, 1.514892578125, 1.71539306640625, 1.9158935546875, 2.11639404296875, 2.31689453125, 2.51739501953125, 2.7178955078125, 2.91839599609375, 3.118896484375, 3.31939697265625, 3.5198974609375, 3.72039794921875, 3.9208984375, 4.12139892578125, 4.3218994140625, 4.52239990234375, 4.722900390625, 4.92340087890625, 5.1239013671875, 5.32440185546875, 5.52490234375, 5.72540283203125, 5.9259033203125, 6.12640380859375, 6.326904296875, 6.52740478515625, 6.7279052734375, 6.92840576171875, 7.12890625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 9.0, 14.0, 6.0, 12.0, 10.0, 20.0, 24.0, 26.0, 32.0, 27.0, 39.0, 72.0, 110.0, 150.0, 310.0, 567.0, 1153.0, 2482.0, 5271.0, 11522.0, 25285.0, 56511.0, 135683.0, 335220.0, 280620.0, 108054.0, 46079.0, 21153.0, 9485.0, 4291.0, 2007.0, 1025.0, 472.0, 252.0, 167.0, 95.0, 68.0, 39.0, 37.0, 28.0, 30.0, 15.0, 19.0, 16.0, 13.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.10546875, -4.94012451171875, -4.7747802734375, -4.60943603515625, -4.444091796875, -4.27874755859375, -4.1134033203125, -3.94805908203125, -3.78271484375, -3.61737060546875, -3.4520263671875, -3.28668212890625, -3.121337890625, -2.95599365234375, -2.7906494140625, -2.62530517578125, -2.4599609375, -2.29461669921875, -2.1292724609375, -1.96392822265625, -1.798583984375, -1.63323974609375, -1.4678955078125, -1.30255126953125, -1.13720703125, -0.97186279296875, -0.8065185546875, -0.64117431640625, -0.475830078125, -0.31048583984375, -0.1451416015625, 0.02020263671875, 0.185546875, 0.35089111328125, 0.5162353515625, 0.68157958984375, 0.846923828125, 1.01226806640625, 1.1776123046875, 1.34295654296875, 1.50830078125, 1.67364501953125, 1.8389892578125, 2.00433349609375, 2.169677734375, 2.33502197265625, 2.5003662109375, 2.66571044921875, 2.8310546875, 2.99639892578125, 3.1617431640625, 3.32708740234375, 3.492431640625, 3.65777587890625, 3.8231201171875, 3.98846435546875, 4.15380859375, 4.31915283203125, 4.4844970703125, 4.64984130859375, 4.815185546875, 4.98052978515625, 5.1458740234375, 5.31121826171875, 5.4765625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 6.0, 4.0, 14.0, 14.0, 10.0, 16.0, 25.0, 22.0, 18.0, 28.0, 33.0, 38.0, 35.0, 29.0, 50.0, 50.0, 72.0, 176.0, 1561.0, 287.0, 87.0, 51.0, 53.0, 44.0, 41.0, 36.0, 21.0, 24.0, 31.0, 16.0, 29.0, 21.0, 15.0, 14.0, 13.0, 14.0, 15.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.328125, -19.666015625, -19.00390625, -18.341796875, -17.6796875, -17.017578125, -16.35546875, -15.693359375, -15.03125, -14.369140625, -13.70703125, -13.044921875, -12.3828125, -11.720703125, -11.05859375, -10.396484375, -9.734375, -9.072265625, -8.41015625, -7.748046875, -7.0859375, -6.423828125, -5.76171875, -5.099609375, -4.4375, -3.775390625, -3.11328125, -2.451171875, -1.7890625, -1.126953125, -0.46484375, 0.197265625, 0.859375, 1.521484375, 2.18359375, 2.845703125, 3.5078125, 4.169921875, 4.83203125, 5.494140625, 6.15625, 6.818359375, 7.48046875, 8.142578125, 8.8046875, 9.466796875, 10.12890625, 10.791015625, 11.453125, 12.115234375, 12.77734375, 13.439453125, 14.1015625, 14.763671875, 15.42578125, 16.087890625, 16.75, 17.412109375, 18.07421875, 18.736328125, 19.3984375, 20.060546875, 20.72265625, 21.384765625, 22.046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 8.0, 8.0, 12.0, 14.0, 18.0, 29.0, 24.0, 33.0, 29.0, 55.0, 62.0, 74.0, 97.0, 121.0, 151.0, 227.0, 371.0, 610.0, 1595.0, 44790.0, 3042972.0, 50818.0, 1687.0, 632.0, 341.0, 228.0, 180.0, 120.0, 86.0, 54.0, 48.0, 51.0, 29.0, 29.0, 18.0, 10.0, 12.0, 12.0, 9.0, 7.0, 5.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.16015625, -34.0078125, -32.85546875, -31.703125, -30.55078125, -29.3984375, -28.24609375, -27.09375, -25.94140625, -24.7890625, -23.63671875, -22.484375, -21.33203125, -20.1796875, -19.02734375, -17.875, -16.72265625, -15.5703125, -14.41796875, -13.265625, -12.11328125, -10.9609375, -9.80859375, -8.65625, -7.50390625, -6.3515625, -5.19921875, -4.046875, -2.89453125, -1.7421875, -0.58984375, 0.5625, 1.71484375, 2.8671875, 4.01953125, 5.171875, 6.32421875, 7.4765625, 8.62890625, 9.78125, 10.93359375, 12.0859375, 13.23828125, 14.390625, 15.54296875, 16.6953125, 17.84765625, 19.0, 20.15234375, 21.3046875, 22.45703125, 23.609375, 24.76171875, 25.9140625, 27.06640625, 28.21875, 29.37109375, 30.5234375, 31.67578125, 32.828125, 33.98046875, 35.1328125, 36.28515625, 37.4375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 29.0, 123.0, 348.0, 343.0, 125.0, 28.0, 13.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.078289031982422, -22.232301712036133, -20.386314392089844, -18.540327072143555, -16.694339752197266, -14.848352432250977, -13.002365112304688, -11.156377792358398, -9.31039047241211, -7.46440315246582, -5.618415832519531, -3.772428512573242, -1.9264411926269531, -0.08045387268066406, 1.765533447265625, 3.611520767211914, 5.457508087158203, 7.303495407104492, 9.149482727050781, 10.99547004699707, 12.84145736694336, 14.687444686889648, 16.533432006835938, 18.379419326782227, 20.225406646728516, 22.071393966674805, 23.917381286621094, 25.763368606567383, 27.609355926513672, 29.45534324645996, 31.30133056640625, 33.147315979003906, 34.99330139160156, 36.83928680419922, 38.68527603149414, 40.53126525878906, 42.37725067138672, 44.223236083984375, 46.0692253112793, 47.91521453857422, 49.761199951171875, 51.60718536376953, 53.45317459106445, 55.299163818359375, 57.14514923095703, 58.99113464355469, 60.83712387084961, 62.68311309814453, 64.52909851074219, 66.37508392333984, 68.2210693359375, 70.06706237792969, 71.91304779052734, 73.759033203125, 75.60502624511719, 77.45101165771484, 79.2969970703125, 81.14298248291016, 82.98896789550781, 84.8349609375, 86.68094635009766, 88.52693176269531, 90.3729248046875, 92.21891021728516, 94.06489562988281]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 1.0, 5.0, 4.0, 8.0, 10.0, 10.0, 9.0, 11.0, 10.0, 12.0, 26.0, 15.0, 18.0, 25.0, 22.0, 26.0, 42.0, 27.0, 41.0, 42.0, 40.0, 35.0, 44.0, 37.0, 53.0, 35.0, 40.0, 34.0, 37.0, 26.0, 34.0, 31.0, 23.0, 24.0, 16.0, 19.0, 21.0, 16.0, 13.0, 12.0, 11.0, 8.0, 9.0, 3.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-51.13607406616211, -49.5098762512207, -47.8836784362793, -46.25748062133789, -44.631282806396484, -43.00508499145508, -41.37888717651367, -39.752689361572266, -38.12649154663086, -36.50029373168945, -34.87409591674805, -33.24789810180664, -31.621700286865234, -29.995502471923828, -28.369304656982422, -26.743106842041016, -25.11690902709961, -23.490711212158203, -21.864513397216797, -20.23831558227539, -18.612117767333984, -16.985919952392578, -15.359722137451172, -13.733524322509766, -12.10732650756836, -10.481128692626953, -8.854930877685547, -7.228733062744141, -5.602535247802734, -3.976337432861328, -2.350139617919922, -0.7239418029785156, 0.9022598266601562, 2.5284576416015625, 4.154655456542969, 5.780853271484375, 7.407051086425781, 9.033248901367188, 10.659446716308594, 12.28564453125, 13.911842346191406, 15.538040161132812, 17.16423797607422, 18.790435791015625, 20.41663360595703, 22.042831420898438, 23.669029235839844, 25.29522705078125, 26.921424865722656, 28.547622680664062, 30.17382049560547, 31.800018310546875, 33.42621612548828, 35.05241394042969, 36.678611755371094, 38.3048095703125, 39.931007385253906, 41.55720520019531, 43.18340301513672, 44.809600830078125, 46.43579864501953, 48.06199645996094, 49.688194274902344, 51.31439208984375, 52.940589904785156]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 1.0, 13.0, 8.0, 10.0, 13.0, 15.0, 17.0, 19.0, 14.0, 25.0, 25.0, 30.0, 26.0, 26.0, 38.0, 35.0, 43.0, 32.0, 42.0, 45.0, 41.0, 33.0, 36.0, 46.0, 33.0, 36.0, 37.0, 29.0, 32.0, 26.0, 19.0, 19.0, 27.0, 15.0, 18.0, 11.0, 12.0, 11.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.0191650390625, -5.800048828125, -5.5809326171875, -5.36181640625, -5.1427001953125, -4.923583984375, -4.7044677734375, -4.4853515625, -4.2662353515625, -4.047119140625, -3.8280029296875, -3.60888671875, -3.3897705078125, -3.170654296875, -2.9515380859375, -2.732421875, -2.5133056640625, -2.294189453125, -2.0750732421875, -1.85595703125, -1.6368408203125, -1.417724609375, -1.1986083984375, -0.9794921875, -0.7603759765625, -0.541259765625, -0.3221435546875, -0.10302734375, 0.1160888671875, 0.335205078125, 0.5543212890625, 0.7734375, 0.9925537109375, 1.211669921875, 1.4307861328125, 1.64990234375, 1.8690185546875, 2.088134765625, 2.3072509765625, 2.5263671875, 2.7454833984375, 2.964599609375, 3.1837158203125, 3.40283203125, 3.6219482421875, 3.841064453125, 4.0601806640625, 4.279296875, 4.4984130859375, 4.717529296875, 4.9366455078125, 5.15576171875, 5.3748779296875, 5.593994140625, 5.8131103515625, 6.0322265625, 6.2513427734375, 6.470458984375, 6.6895751953125, 6.90869140625, 7.1278076171875, 7.346923828125, 7.5660400390625, 7.78515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 13.0, 6.0, 17.0, 16.0, 13.0, 21.0, 16.0, 30.0, 24.0, 45.0, 47.0, 51.0, 79.0, 112.0, 178.0, 382.0, 1490.0, 15290.0, 571202.0, 3377851.0, 217059.0, 8317.0, 1083.0, 292.0, 180.0, 96.0, 56.0, 63.0, 31.0, 33.0, 37.0, 22.0, 24.0, 18.0, 13.0, 9.0, 14.0, 11.0, 8.0, 5.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.203125, -21.49560546875, -20.7880859375, -20.08056640625, -19.373046875, -18.66552734375, -17.9580078125, -17.25048828125, -16.54296875, -15.83544921875, -15.1279296875, -14.42041015625, -13.712890625, -13.00537109375, -12.2978515625, -11.59033203125, -10.8828125, -10.17529296875, -9.4677734375, -8.76025390625, -8.052734375, -7.34521484375, -6.6376953125, -5.93017578125, -5.22265625, -4.51513671875, -3.8076171875, -3.10009765625, -2.392578125, -1.68505859375, -0.9775390625, -0.27001953125, 0.4375, 1.14501953125, 1.8525390625, 2.56005859375, 3.267578125, 3.97509765625, 4.6826171875, 5.39013671875, 6.09765625, 6.80517578125, 7.5126953125, 8.22021484375, 8.927734375, 9.63525390625, 10.3427734375, 11.05029296875, 11.7578125, 12.46533203125, 13.1728515625, 13.88037109375, 14.587890625, 15.29541015625, 16.0029296875, 16.71044921875, 17.41796875, 18.12548828125, 18.8330078125, 19.54052734375, 20.248046875, 20.95556640625, 21.6630859375, 22.37060546875, 23.078125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 5.0, 6.0, 4.0, 8.0, 6.0, 17.0, 19.0, 24.0, 25.0, 41.0, 58.0, 60.0, 92.0, 95.0, 135.0, 146.0, 236.0, 310.0, 363.0, 416.0, 431.0, 330.0, 289.0, 198.0, 146.0, 140.0, 96.0, 82.0, 72.0, 54.0, 39.0, 29.0, 26.0, 19.0, 13.0, 9.0, 8.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.3587646484375, -9.022216796875, -8.6856689453125, -8.34912109375, -8.0125732421875, -7.676025390625, -7.3394775390625, -7.0029296875, -6.6663818359375, -6.329833984375, -5.9932861328125, -5.65673828125, -5.3201904296875, -4.983642578125, -4.6470947265625, -4.310546875, -3.9739990234375, -3.637451171875, -3.3009033203125, -2.96435546875, -2.6278076171875, -2.291259765625, -1.9547119140625, -1.6181640625, -1.2816162109375, -0.945068359375, -0.6085205078125, -0.27197265625, 0.0645751953125, 0.401123046875, 0.7376708984375, 1.07421875, 1.4107666015625, 1.747314453125, 2.0838623046875, 2.42041015625, 2.7569580078125, 3.093505859375, 3.4300537109375, 3.7666015625, 4.1031494140625, 4.439697265625, 4.7762451171875, 5.11279296875, 5.4493408203125, 5.785888671875, 6.1224365234375, 6.458984375, 6.7955322265625, 7.132080078125, 7.4686279296875, 7.80517578125, 8.1417236328125, 8.478271484375, 8.8148193359375, 9.1513671875, 9.4879150390625, 9.824462890625, 10.1610107421875, 10.49755859375, 10.8341064453125, 11.170654296875, 11.5072021484375, 11.84375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 9.0, 9.0, 17.0, 12.0, 29.0, 32.0, 58.0, 50.0, 71.0, 80.0, 107.0, 135.0, 230.0, 273.0, 366.0, 867.0, 11938.0, 4132243.0, 45128.0, 1049.0, 440.0, 280.0, 172.0, 136.0, 118.0, 85.0, 71.0, 56.0, 50.0, 34.0, 26.0, 30.0, 16.0, 15.0, 13.0, 11.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.625, -76.3525390625, -74.080078125, -71.8076171875, -69.53515625, -67.2626953125, -64.990234375, -62.7177734375, -60.4453125, -58.1728515625, -55.900390625, -53.6279296875, -51.35546875, -49.0830078125, -46.810546875, -44.5380859375, -42.265625, -39.9931640625, -37.720703125, -35.4482421875, -33.17578125, -30.9033203125, -28.630859375, -26.3583984375, -24.0859375, -21.8134765625, -19.541015625, -17.2685546875, -14.99609375, -12.7236328125, -10.451171875, -8.1787109375, -5.90625, -3.6337890625, -1.361328125, 0.9111328125, 3.18359375, 5.4560546875, 7.728515625, 10.0009765625, 12.2734375, 14.5458984375, 16.818359375, 19.0908203125, 21.36328125, 23.6357421875, 25.908203125, 28.1806640625, 30.453125, 32.7255859375, 34.998046875, 37.2705078125, 39.54296875, 41.8154296875, 44.087890625, 46.3603515625, 48.6328125, 50.9052734375, 53.177734375, 55.4501953125, 57.72265625, 59.9951171875, 62.267578125, 64.5400390625, 66.8125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 47.0, 296.0, 471.0, 181.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-288.2147216796875, -282.9056701660156, -277.5966491699219, -272.28759765625, -266.9785461425781, -261.66949462890625, -256.3604736328125, -251.05142211914062, -245.74237060546875, -240.43333435058594, -235.12428283691406, -229.81524658203125, -224.50619506835938, -219.19715881347656, -213.8881072998047, -208.57907104492188, -203.27001953125, -197.9609832763672, -192.6519317626953, -187.3428955078125, -182.03384399414062, -176.7248077392578, -171.41575622558594, -166.10671997070312, -160.7976837158203, -155.4886474609375, -150.17959594726562, -144.8705596923828, -139.56150817871094, -134.25247192382812, -128.94342041015625, -123.63438415527344, -118.3253173828125, -113.01627349853516, -107.70722961425781, -102.39818572998047, -97.08914184570312, -91.78009796142578, -86.47105407714844, -81.16201782226562, -75.85297393798828, -70.54393005371094, -65.2348861694336, -59.92584228515625, -54.616798400878906, -49.30775451660156, -43.998714447021484, -38.68967056274414, -33.3806266784668, -28.071582794189453, -22.76253890991211, -17.4534969329834, -12.144453048706055, -6.835409164428711, -1.5263671875, 3.7826766967773438, 9.091720581054688, 14.400764465332031, 19.709808349609375, 25.018850326538086, 30.32789421081543, 35.636940002441406, 40.945980072021484, 46.25502395629883, 51.56406784057617]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 2.0, 8.0, 16.0, 9.0, 14.0, 15.0, 22.0, 20.0, 13.0, 24.0, 18.0, 22.0, 33.0, 34.0, 32.0, 30.0, 28.0, 53.0, 42.0, 29.0, 35.0, 42.0, 37.0, 26.0, 40.0, 30.0, 27.0, 35.0, 32.0, 27.0, 27.0, 29.0, 24.0, 20.0, 21.0, 8.0, 13.0, 14.0, 6.0, 8.0, 3.0, 11.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.510982513427734, -35.232784271240234, -33.95458984375, -32.6763916015625, -31.398197174072266, -30.119998931884766, -28.8418025970459, -27.56360626220703, -26.285409927368164, -25.007213592529297, -23.72901725769043, -22.450820922851562, -21.172622680664062, -19.894428253173828, -18.616230010986328, -17.33803367614746, -16.059837341308594, -14.781641006469727, -13.50344467163086, -12.225247383117676, -10.947051048278809, -9.668854713439941, -8.390657424926758, -7.112461090087891, -5.834264755249023, -4.556068420410156, -3.277871608734131, -1.9996750354766846, -0.7214784622192383, 0.5567178726196289, 1.8349146842956543, 3.1131114959716797, 4.391304016113281, 5.669500350952148, 6.947697162628174, 8.2258939743042, 9.504090309143066, 10.782286643981934, 12.060483932495117, 13.338680267333984, 14.616876602172852, 15.895072937011719, 17.173269271850586, 18.451465606689453, 19.729663848876953, 21.007858276367188, 22.286056518554688, 23.564252853393555, 24.842449188232422, 26.12064552307129, 27.398841857910156, 28.677038192749023, 29.95523452758789, 31.23343276977539, 32.511627197265625, 33.789825439453125, 35.068023681640625, 36.346221923828125, 37.62441635131836, 38.90261459350586, 40.180809020996094, 41.459007263183594, 42.73720169067383, 44.01539993286133, 45.29359436035156]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 7.0, 18.0, 4.0, 21.0, 18.0, 23.0, 18.0, 23.0, 31.0, 32.0, 39.0, 33.0, 44.0, 29.0, 30.0, 36.0, 41.0, 58.0, 33.0, 43.0, 39.0, 35.0, 39.0, 38.0, 37.0, 28.0, 25.0, 24.0, 20.0, 17.0, 16.0, 17.0, 10.0, 14.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.22265625, -6.9989013671875, -6.775146484375, -6.5513916015625, -6.32763671875, -6.1038818359375, -5.880126953125, -5.6563720703125, -5.4326171875, -5.2088623046875, -4.985107421875, -4.7613525390625, -4.53759765625, -4.3138427734375, -4.090087890625, -3.8663330078125, -3.642578125, -3.4188232421875, -3.195068359375, -2.9713134765625, -2.74755859375, -2.5238037109375, -2.300048828125, -2.0762939453125, -1.8525390625, -1.6287841796875, -1.405029296875, -1.1812744140625, -0.95751953125, -0.7337646484375, -0.510009765625, -0.2862548828125, -0.0625, 0.1612548828125, 0.385009765625, 0.6087646484375, 0.83251953125, 1.0562744140625, 1.280029296875, 1.5037841796875, 1.7275390625, 1.9512939453125, 2.175048828125, 2.3988037109375, 2.62255859375, 2.8463134765625, 3.070068359375, 3.2938232421875, 3.517578125, 3.7413330078125, 3.965087890625, 4.1888427734375, 4.41259765625, 4.6363525390625, 4.860107421875, 5.0838623046875, 5.3076171875, 5.5313720703125, 5.755126953125, 5.9788818359375, 6.20263671875, 6.4263916015625, 6.650146484375, 6.8739013671875, 7.09765625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 18.0, 9.0, 21.0, 37.0, 56.0, 89.0, 137.0, 197.0, 273.0, 389.0, 508.0, 835.0, 1161.0, 1809.0, 2614.0, 3555.0, 5347.0, 7661.0, 11707.0, 17198.0, 26013.0, 40268.0, 62867.0, 101520.0, 166013.0, 219074.0, 138209.0, 84316.0, 53444.0, 34393.0, 22360.0, 14777.0, 10096.0, 6778.0, 4682.0, 3170.0, 2118.0, 1504.0, 1055.0, 713.0, 512.0, 333.0, 224.0, 178.0, 106.0, 71.0, 43.0, 30.0, 26.0, 19.0, 6.0, 11.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0478515625, -1.0154266357421875, -0.983001708984375, -0.9505767822265625, -0.91815185546875, -0.8857269287109375, -0.853302001953125, -0.8208770751953125, -0.7884521484375, -0.7560272216796875, -0.723602294921875, -0.6911773681640625, -0.65875244140625, -0.6263275146484375, -0.593902587890625, -0.5614776611328125, -0.529052734375, -0.4966278076171875, -0.464202880859375, -0.4317779541015625, -0.39935302734375, -0.3669281005859375, -0.334503173828125, -0.3020782470703125, -0.2696533203125, -0.2372283935546875, -0.204803466796875, -0.1723785400390625, -0.13995361328125, -0.1075286865234375, -0.075103759765625, -0.0426788330078125, -0.01025390625, 0.0221710205078125, 0.054595947265625, 0.0870208740234375, 0.11944580078125, 0.1518707275390625, 0.184295654296875, 0.2167205810546875, 0.2491455078125, 0.2815704345703125, 0.313995361328125, 0.3464202880859375, 0.37884521484375, 0.4112701416015625, 0.443695068359375, 0.4761199951171875, 0.508544921875, 0.5409698486328125, 0.573394775390625, 0.6058197021484375, 0.63824462890625, 0.6706695556640625, 0.703094482421875, 0.7355194091796875, 0.7679443359375, 0.8003692626953125, 0.832794189453125, 0.8652191162109375, 0.89764404296875, 0.9300689697265625, 0.962493896484375, 0.9949188232421875, 1.02734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 10.0, 14.0, 15.0, 12.0, 25.0, 19.0, 33.0, 17.0, 31.0, 36.0, 29.0, 40.0, 38.0, 37.0, 36.0, 44.0, 1061.0, 44.0, 40.0, 51.0, 44.0, 43.0, 33.0, 29.0, 31.0, 29.0, 28.0, 27.0, 18.0, 26.0, 17.0, 9.0, 14.0, 10.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.5655517578125, -4.416259765625, -4.2669677734375, -4.11767578125, -3.9683837890625, -3.819091796875, -3.6697998046875, -3.5205078125, -3.3712158203125, -3.221923828125, -3.0726318359375, -2.92333984375, -2.7740478515625, -2.624755859375, -2.4754638671875, -2.326171875, -2.1768798828125, -2.027587890625, -1.8782958984375, -1.72900390625, -1.5797119140625, -1.430419921875, -1.2811279296875, -1.1318359375, -0.9825439453125, -0.833251953125, -0.6839599609375, -0.53466796875, -0.3853759765625, -0.236083984375, -0.0867919921875, 0.0625, 0.2117919921875, 0.361083984375, 0.5103759765625, 0.65966796875, 0.8089599609375, 0.958251953125, 1.1075439453125, 1.2568359375, 1.4061279296875, 1.555419921875, 1.7047119140625, 1.85400390625, 2.0032958984375, 2.152587890625, 2.3018798828125, 2.451171875, 2.6004638671875, 2.749755859375, 2.8990478515625, 3.04833984375, 3.1976318359375, 3.346923828125, 3.4962158203125, 3.6455078125, 3.7947998046875, 3.944091796875, 4.0933837890625, 4.24267578125, 4.3919677734375, 4.541259765625, 4.6905517578125, 4.83984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 11.0, 18.0, 29.0, 45.0, 64.0, 91.0, 156.0, 195.0, 304.0, 455.0, 685.0, 1131.0, 1801.0, 2766.0, 4228.0, 6660.0, 10720.0, 16682.0, 27192.0, 44273.0, 74358.0, 129473.0, 1284186.0, 205998.0, 113577.0, 66363.0, 39350.0, 24453.0, 15231.0, 9548.0, 6178.0, 3904.0, 2426.0, 1568.0, 1044.0, 685.0, 423.0, 292.0, 167.0, 142.0, 88.0, 52.0, 38.0, 28.0, 12.0, 14.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.063232421875, -1.02880859375, -0.994384765625, -0.9599609375, -0.925537109375, -0.89111328125, -0.856689453125, -0.822265625, -0.787841796875, -0.75341796875, -0.718994140625, -0.6845703125, -0.650146484375, -0.61572265625, -0.581298828125, -0.546875, -0.512451171875, -0.47802734375, -0.443603515625, -0.4091796875, -0.374755859375, -0.34033203125, -0.305908203125, -0.271484375, -0.237060546875, -0.20263671875, -0.168212890625, -0.1337890625, -0.099365234375, -0.06494140625, -0.030517578125, 0.00390625, 0.038330078125, 0.07275390625, 0.107177734375, 0.1416015625, 0.176025390625, 0.21044921875, 0.244873046875, 0.279296875, 0.313720703125, 0.34814453125, 0.382568359375, 0.4169921875, 0.451416015625, 0.48583984375, 0.520263671875, 0.5546875, 0.589111328125, 0.62353515625, 0.657958984375, 0.6923828125, 0.726806640625, 0.76123046875, 0.795654296875, 0.830078125, 0.864501953125, 0.89892578125, 0.933349609375, 0.9677734375, 1.002197265625, 1.03662109375, 1.071044921875, 1.10546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 6.0, 8.0, 5.0, 8.0, 16.0, 13.0, 16.0, 35.0, 40.0, 40.0, 56.0, 62.0, 69.0, 97.0, 102.0, 69.0, 75.0, 63.0, 50.0, 42.0, 25.0, 20.0, 16.0, 9.0, 17.0, 5.0, 6.0, 7.0, 8.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009007453918457031, -0.0008743852376937866, -0.0008480250835418701, -0.0008216649293899536, -0.0007953047752380371, -0.0007689446210861206, -0.0007425844669342041, -0.0007162243127822876, -0.0006898641586303711, -0.0006635040044784546, -0.0006371438503265381, -0.0006107836961746216, -0.0005844235420227051, -0.0005580633878707886, -0.0005317032337188721, -0.0005053430795669556, -0.00047898292541503906, -0.00045262277126312256, -0.00042626261711120605, -0.00039990246295928955, -0.00037354230880737305, -0.00034718215465545654, -0.00032082200050354004, -0.00029446184635162354, -0.00026810169219970703, -0.00024174153804779053, -0.00021538138389587402, -0.00018902122974395752, -0.00016266107559204102, -0.0001363009214401245, -0.00010994076728820801, -8.35806131362915e-05, -5.7220458984375e-05, -3.0860304832458496e-05, -4.500150680541992e-06, 2.1860003471374512e-05, 4.8220157623291016e-05, 7.458031177520752e-05, 0.00010094046592712402, 0.00012730062007904053, 0.00015366077423095703, 0.00018002092838287354, 0.00020638108253479004, 0.00023274123668670654, 0.00025910139083862305, 0.00028546154499053955, 0.00031182169914245605, 0.00033818185329437256, 0.00036454200744628906, 0.00039090216159820557, 0.00041726231575012207, 0.0004436224699020386, 0.0004699826240539551, 0.0004963427782058716, 0.0005227029323577881, 0.0005490630865097046, 0.0005754232406616211, 0.0006017833948135376, 0.0006281435489654541, 0.0006545037031173706, 0.0006808638572692871, 0.0007072240114212036, 0.0007335841655731201, 0.0007599443197250366, 0.0007863044738769531]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 9.0, 13.0, 9.0, 15.0, 23.0, 27.0, 36.0, 55.0, 76.0, 153.0, 243.0, 423.0, 1709.0, 1037379.0, 6986.0, 645.0, 266.0, 151.0, 98.0, 57.0, 39.0, 40.0, 20.0, 15.0, 13.0, 8.0, 7.0, 4.0, 7.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.017974853515625, -0.017368793487548828, -0.016762733459472656, -0.016156673431396484, -0.015550613403320312, -0.01494455337524414, -0.014338493347167969, -0.013732433319091797, -0.013126373291015625, -0.012520313262939453, -0.011914253234863281, -0.01130819320678711, -0.010702133178710938, -0.010096073150634766, -0.009490013122558594, -0.008883953094482422, -0.00827789306640625, -0.007671833038330078, -0.007065773010253906, -0.006459712982177734, -0.0058536529541015625, -0.005247592926025391, -0.004641532897949219, -0.004035472869873047, -0.003429412841796875, -0.002823352813720703, -0.0022172927856445312, -0.0016112327575683594, -0.0010051727294921875, -0.0003991127014160156, 0.00020694732666015625, 0.0008130073547363281, 0.0014190673828125, 0.002025127410888672, 0.0026311874389648438, 0.0032372474670410156, 0.0038433074951171875, 0.004449367523193359, 0.005055427551269531, 0.005661487579345703, 0.006267547607421875, 0.006873607635498047, 0.007479667663574219, 0.00808572769165039, 0.008691787719726562, 0.009297847747802734, 0.009903907775878906, 0.010509967803955078, 0.01111602783203125, 0.011722087860107422, 0.012328147888183594, 0.012934207916259766, 0.013540267944335938, 0.01414632797241211, 0.014752388000488281, 0.015358448028564453, 0.015964508056640625, 0.016570568084716797, 0.01717662811279297, 0.01778268814086914, 0.018388748168945312, 0.018994808197021484, 0.019600868225097656, 0.020206928253173828, 0.02081298828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 13.0, 31.0, 175.0, 306.0, 311.0, 135.0, 35.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016441349871456623, -0.0016124630346894264, -0.0015807910822331905, -0.0015491191297769547, -0.0015174472937360406, -0.0014857753412798047, -0.0014541033888235688, -0.001422431436367333, -0.001390759483911097, -0.0013590875314548612, -0.0013274155789986253, -0.0012957437429577112, -0.0012640717905014753, -0.0012323998380452394, -0.0012007278855890036, -0.0011690559331327677, -0.0011373839806765318, -0.001105712028220296, -0.00107404007576406, -0.0010423681233078241, -0.00101069628726691, -0.0009790243348106742, -0.0009473523823544383, -0.0009156804298982024, -0.0008840085938572884, -0.0008523366414010525, -0.0008206647471524775, -0.0007889927946962416, -0.0007573208422400057, -0.0007256489479914308, -0.0006939769955351949, -0.000662305043078959, -0.000630633148830384, -0.0005989611963741481, -0.0005672893021255732, -0.0005356173496693373, -0.0005039453972131014, -0.00047227347386069596, -0.00044060155050829053, -0.00040892959805205464, -0.0003772576746996492, -0.0003455857513472438, -0.0003139137988910079, -0.00028224187553860247, -0.00025056995218619704, -0.00021889799972996116, -0.00018722607637755573, -0.00015555413847323507, -0.0001238822005689144, -9.221026266459376e-05, -6.053833203623071e-05, -2.886640140786767e-05, 2.805536496452987e-06, 3.4477474400773644e-05, 6.614939775317907e-05, 9.782133565749973e-05, 0.0001294932735618204, 0.00016116521146614105, 0.0001928371493704617, 0.00022450907272286713, 0.00025618099607527256, 0.00028785294853150845, 0.0003195248718839139, 0.0003511967952363193, 0.0003828687476925552]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 9.0, 10.0, 16.0, 8.0, 15.0, 15.0, 26.0, 21.0, 19.0, 28.0, 36.0, 28.0, 33.0, 26.0, 30.0, 38.0, 34.0, 31.0, 51.0, 38.0, 43.0, 37.0, 42.0, 30.0, 38.0, 42.0, 37.0, 31.0, 22.0, 23.0, 20.0, 13.0, 11.0, 21.0, 14.0, 10.0, 8.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003153681755065918, -0.00030407775193452835, -0.0002927873283624649, -0.00028149690479040146, -0.000270206481218338, -0.00025891605764627457, -0.0002476256340742111, -0.00023633521050214767, -0.00022504478693008423, -0.00021375436335802078, -0.00020246393978595734, -0.0001911735162138939, -0.00017988309264183044, -0.000168592669069767, -0.00015730224549770355, -0.0001460118219256401, -0.00013472139835357666, -0.00012343097478151321, -0.00011214055120944977, -0.00010085012763738632, -8.955970406532288e-05, -7.826928049325943e-05, -6.697885692119598e-05, -5.568843334913254e-05, -4.439800977706909e-05, -3.3107586205005646e-05, -2.18171626329422e-05, -1.0526739060878754e-05, 7.636845111846924e-07, 1.2054108083248138e-05, 2.3344531655311584e-05, 3.463495522737503e-05, 4.5925378799438477e-05, 5.721580237150192e-05, 6.850622594356537e-05, 7.979664951562881e-05, 9.108707308769226e-05, 0.00010237749665975571, 0.00011366792023181915, 0.0001249583438038826, 0.00013624876737594604, 0.0001475391909480095, 0.00015882961452007294, 0.00017012003809213638, 0.00018141046166419983, 0.00019270088523626328, 0.00020399130880832672, 0.00021528173238039017, 0.0002265721559524536, 0.00023786257952451706, 0.0002491530030965805, 0.00026044342666864395, 0.0002717338502407074, 0.00028302427381277084, 0.0002943146973848343, 0.00030560512095689774, 0.0003168955445289612, 0.00032818596810102463, 0.0003394763916730881, 0.0003507668152451515, 0.00036205723881721497, 0.0003733476623892784, 0.00038463808596134186, 0.0003959285095334053, 0.00040721893310546875]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 7.0, 18.0, 4.0, 21.0, 18.0, 23.0, 18.0, 23.0, 31.0, 32.0, 39.0, 33.0, 44.0, 29.0, 30.0, 36.0, 41.0, 58.0, 33.0, 43.0, 39.0, 35.0, 39.0, 38.0, 37.0, 28.0, 25.0, 24.0, 20.0, 17.0, 16.0, 17.0, 10.0, 14.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.22265625, -6.9989013671875, -6.775146484375, -6.5513916015625, -6.32763671875, -6.1038818359375, -5.880126953125, -5.6563720703125, -5.4326171875, -5.2088623046875, -4.985107421875, -4.7613525390625, -4.53759765625, -4.3138427734375, -4.090087890625, -3.8663330078125, -3.642578125, -3.4188232421875, -3.195068359375, -2.9713134765625, -2.74755859375, -2.5238037109375, -2.300048828125, -2.0762939453125, -1.8525390625, -1.6287841796875, -1.405029296875, -1.1812744140625, -0.95751953125, -0.7337646484375, -0.510009765625, -0.2862548828125, -0.0625, 0.1612548828125, 0.385009765625, 0.6087646484375, 0.83251953125, 1.0562744140625, 1.280029296875, 1.5037841796875, 1.7275390625, 1.9512939453125, 2.175048828125, 2.3988037109375, 2.62255859375, 2.8463134765625, 3.070068359375, 3.2938232421875, 3.517578125, 3.7413330078125, 3.965087890625, 4.1888427734375, 4.41259765625, 4.6363525390625, 4.860107421875, 5.0838623046875, 5.3076171875, 5.5313720703125, 5.755126953125, 5.9788818359375, 6.20263671875, 6.4263916015625, 6.650146484375, 6.8739013671875, 7.09765625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 5.0, 11.0, 10.0, 12.0, 13.0, 20.0, 33.0, 39.0, 43.0, 56.0, 72.0, 105.0, 171.0, 221.0, 362.0, 633.0, 1956.0, 11205.0, 94921.0, 766244.0, 151262.0, 16517.0, 2624.0, 753.0, 382.0, 242.0, 183.0, 115.0, 72.0, 63.0, 41.0, 31.0, 30.0, 28.0, 13.0, 17.0, 11.0, 8.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.34375, -13.9036865234375, -13.463623046875, -13.0235595703125, -12.58349609375, -12.1434326171875, -11.703369140625, -11.2633056640625, -10.8232421875, -10.3831787109375, -9.943115234375, -9.5030517578125, -9.06298828125, -8.6229248046875, -8.182861328125, -7.7427978515625, -7.302734375, -6.8626708984375, -6.422607421875, -5.9825439453125, -5.54248046875, -5.1024169921875, -4.662353515625, -4.2222900390625, -3.7822265625, -3.3421630859375, -2.902099609375, -2.4620361328125, -2.02197265625, -1.5819091796875, -1.141845703125, -0.7017822265625, -0.26171875, 0.1783447265625, 0.618408203125, 1.0584716796875, 1.49853515625, 1.9385986328125, 2.378662109375, 2.8187255859375, 3.2587890625, 3.6988525390625, 4.138916015625, 4.5789794921875, 5.01904296875, 5.4591064453125, 5.899169921875, 6.3392333984375, 6.779296875, 7.2193603515625, 7.659423828125, 8.0994873046875, 8.53955078125, 8.9796142578125, 9.419677734375, 9.8597412109375, 10.2998046875, 10.7398681640625, 11.179931640625, 11.6199951171875, 12.06005859375, 12.5001220703125, 12.940185546875, 13.3802490234375, 13.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 7.0, 12.0, 6.0, 10.0, 12.0, 10.0, 23.0, 21.0, 25.0, 22.0, 34.0, 32.0, 41.0, 36.0, 48.0, 56.0, 74.0, 247.0, 1677.0, 178.0, 57.0, 51.0, 43.0, 36.0, 42.0, 24.0, 35.0, 33.0, 18.0, 14.0, 17.0, 22.0, 16.0, 11.0, 5.0, 14.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.484375, -22.781005859375, -22.07763671875, -21.374267578125, -20.6708984375, -19.967529296875, -19.26416015625, -18.560791015625, -17.857421875, -17.154052734375, -16.45068359375, -15.747314453125, -15.0439453125, -14.340576171875, -13.63720703125, -12.933837890625, -12.23046875, -11.527099609375, -10.82373046875, -10.120361328125, -9.4169921875, -8.713623046875, -8.01025390625, -7.306884765625, -6.603515625, -5.900146484375, -5.19677734375, -4.493408203125, -3.7900390625, -3.086669921875, -2.38330078125, -1.679931640625, -0.9765625, -0.273193359375, 0.43017578125, 1.133544921875, 1.8369140625, 2.540283203125, 3.24365234375, 3.947021484375, 4.650390625, 5.353759765625, 6.05712890625, 6.760498046875, 7.4638671875, 8.167236328125, 8.87060546875, 9.573974609375, 10.27734375, 10.980712890625, 11.68408203125, 12.387451171875, 13.0908203125, 13.794189453125, 14.49755859375, 15.200927734375, 15.904296875, 16.607666015625, 17.31103515625, 18.014404296875, 18.7177734375, 19.421142578125, 20.12451171875, 20.827880859375, 21.53125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 8.0, 3.0, 11.0, 12.0, 12.0, 16.0, 23.0, 18.0, 17.0, 23.0, 42.0, 40.0, 53.0, 86.0, 88.0, 168.0, 288.0, 557.0, 2357.0, 801157.0, 2336245.0, 2886.0, 636.0, 321.0, 173.0, 103.0, 72.0, 62.0, 42.0, 29.0, 30.0, 29.0, 17.0, 13.0, 15.0, 9.0, 8.0, 11.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-49.9375, -48.32861328125, -46.7197265625, -45.11083984375, -43.501953125, -41.89306640625, -40.2841796875, -38.67529296875, -37.06640625, -35.45751953125, -33.8486328125, -32.23974609375, -30.630859375, -29.02197265625, -27.4130859375, -25.80419921875, -24.1953125, -22.58642578125, -20.9775390625, -19.36865234375, -17.759765625, -16.15087890625, -14.5419921875, -12.93310546875, -11.32421875, -9.71533203125, -8.1064453125, -6.49755859375, -4.888671875, -3.27978515625, -1.6708984375, -0.06201171875, 1.546875, 3.15576171875, 4.7646484375, 6.37353515625, 7.982421875, 9.59130859375, 11.2001953125, 12.80908203125, 14.41796875, 16.02685546875, 17.6357421875, 19.24462890625, 20.853515625, 22.46240234375, 24.0712890625, 25.68017578125, 27.2890625, 28.89794921875, 30.5068359375, 32.11572265625, 33.724609375, 35.33349609375, 36.9423828125, 38.55126953125, 40.16015625, 41.76904296875, 43.3779296875, 44.98681640625, 46.595703125, 48.20458984375, 49.8134765625, 51.42236328125, 53.03125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 13.0, 792.0, 206.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.23040008544922, -15.555150985717773, -9.879901885986328, -4.204652786254883, 1.4705963134765625, 7.145845413208008, 12.821094512939453, 18.49634552001953, 24.171592712402344, 29.84684181213379, 35.522090911865234, 41.19734191894531, 46.872589111328125, 52.54783630371094, 58.223087310791016, 63.898338317871094, 69.5735855102539, 75.24883270263672, 80.92408752441406, 86.59933471679688, 92.27458190917969, 97.9498291015625, 103.62507629394531, 109.30033111572266, 114.97557830810547, 120.65082550048828, 126.32608032226562, 132.00132751464844, 137.67657470703125, 143.35182189941406, 149.02706909179688, 154.70233154296875, 160.3775634765625, 166.0528106689453, 171.72805786132812, 177.40330505371094, 183.07855224609375, 188.75381469726562, 194.42906188964844, 200.10430908203125, 205.77955627441406, 211.45480346679688, 217.1300506591797, 222.8052978515625, 228.48056030273438, 234.1558074951172, 239.8310546875, 245.5063018798828, 251.18154907226562, 256.8568115234375, 262.53204345703125, 268.2073059082031, 273.8825378417969, 279.55780029296875, 285.2330322265625, 290.9082946777344, 296.58355712890625, 302.2588195800781, 307.9340515136719, 313.60931396484375, 319.2845458984375, 324.9598083496094, 330.6350402832031, 336.310302734375, 341.98553466796875]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 8.0, 4.0, 5.0, 11.0, 11.0, 13.0, 13.0, 13.0, 21.0, 26.0, 21.0, 28.0, 30.0, 32.0, 34.0, 51.0, 40.0, 36.0, 38.0, 49.0, 37.0, 44.0, 41.0, 34.0, 38.0, 41.0, 33.0, 30.0, 27.0, 22.0, 22.0, 31.0, 14.0, 12.0, 15.0, 16.0, 8.0, 9.0, 8.0, 12.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0], "bins": [-56.44456481933594, -54.778480529785156, -53.11240005493164, -51.446319580078125, -49.780235290527344, -48.11415100097656, -46.44807052612305, -44.78199005126953, -43.11590576171875, -41.44982147216797, -39.78374099731445, -38.11766052246094, -36.451576232910156, -34.785491943359375, -33.11941146850586, -31.45332908630371, -29.787246704101562, -28.121164321899414, -26.455081939697266, -24.788999557495117, -23.12291717529297, -21.45683479309082, -19.790752410888672, -18.124670028686523, -16.458587646484375, -14.792505264282227, -13.126422882080078, -11.46034049987793, -9.794258117675781, -8.128175735473633, -6.462093353271484, -4.796010971069336, -3.129932403564453, -1.4638500213623047, 0.20223236083984375, 1.8683147430419922, 3.5343971252441406, 5.200479507446289, 6.8665618896484375, 8.532644271850586, 10.198726654052734, 11.864809036254883, 13.530891418457031, 15.19697380065918, 16.863056182861328, 18.529138565063477, 20.195220947265625, 21.861303329467773, 23.527385711669922, 25.19346809387207, 26.85955047607422, 28.525632858276367, 30.191715240478516, 31.857797622680664, 33.52388000488281, 35.189964294433594, 36.85604476928711, 38.522125244140625, 40.188209533691406, 41.85429382324219, 43.5203742980957, 45.18645477294922, 46.8525390625, 48.51862335205078, 50.1847038269043]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 3.0, 5.0, 10.0, 14.0, 5.0, 17.0, 11.0, 26.0, 19.0, 30.0, 23.0, 37.0, 38.0, 36.0, 26.0, 33.0, 40.0, 41.0, 39.0, 44.0, 46.0, 35.0, 33.0, 38.0, 39.0, 44.0, 37.0, 31.0, 20.0, 25.0, 33.0, 21.0, 17.0, 14.0, 12.0, 9.0, 10.0, 9.0, 5.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.2734375, -7.04437255859375, -6.8153076171875, -6.58624267578125, -6.357177734375, -6.12811279296875, -5.8990478515625, -5.66998291015625, -5.44091796875, -5.21185302734375, -4.9827880859375, -4.75372314453125, -4.524658203125, -4.29559326171875, -4.0665283203125, -3.83746337890625, -3.6083984375, -3.37933349609375, -3.1502685546875, -2.92120361328125, -2.692138671875, -2.46307373046875, -2.2340087890625, -2.00494384765625, -1.77587890625, -1.54681396484375, -1.3177490234375, -1.08868408203125, -0.859619140625, -0.63055419921875, -0.4014892578125, -0.17242431640625, 0.056640625, 0.28570556640625, 0.5147705078125, 0.74383544921875, 0.972900390625, 1.20196533203125, 1.4310302734375, 1.66009521484375, 1.88916015625, 2.11822509765625, 2.3472900390625, 2.57635498046875, 2.805419921875, 3.03448486328125, 3.2635498046875, 3.49261474609375, 3.7216796875, 3.95074462890625, 4.1798095703125, 4.40887451171875, 4.637939453125, 4.86700439453125, 5.0960693359375, 5.32513427734375, 5.55419921875, 5.78326416015625, 6.0123291015625, 6.24139404296875, 6.470458984375, 6.69952392578125, 6.9285888671875, 7.15765380859375, 7.38671875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 8.0, 2.0, 8.0, 3.0, 14.0, 14.0, 25.0, 13.0, 24.0, 37.0, 45.0, 51.0, 79.0, 115.0, 257.0, 493.0, 1388.0, 7257.0, 99731.0, 2508775.0, 1521832.0, 47588.0, 4475.0, 1061.0, 371.0, 189.0, 98.0, 79.0, 65.0, 37.0, 31.0, 23.0, 25.0, 16.0, 13.0, 11.0, 5.0, 5.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.03125, -22.3515625, -21.671875, -20.9921875, -20.3125, -19.6328125, -18.953125, -18.2734375, -17.59375, -16.9140625, -16.234375, -15.5546875, -14.875, -14.1953125, -13.515625, -12.8359375, -12.15625, -11.4765625, -10.796875, -10.1171875, -9.4375, -8.7578125, -8.078125, -7.3984375, -6.71875, -6.0390625, -5.359375, -4.6796875, -4.0, -3.3203125, -2.640625, -1.9609375, -1.28125, -0.6015625, 0.078125, 0.7578125, 1.4375, 2.1171875, 2.796875, 3.4765625, 4.15625, 4.8359375, 5.515625, 6.1953125, 6.875, 7.5546875, 8.234375, 8.9140625, 9.59375, 10.2734375, 10.953125, 11.6328125, 12.3125, 12.9921875, 13.671875, 14.3515625, 15.03125, 15.7109375, 16.390625, 17.0703125, 17.75, 18.4296875, 19.109375, 19.7890625, 20.46875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 12.0, 11.0, 14.0, 17.0, 16.0, 23.0, 39.0, 47.0, 53.0, 86.0, 76.0, 114.0, 146.0, 188.0, 252.0, 330.0, 402.0, 374.0, 345.0, 338.0, 262.0, 192.0, 151.0, 127.0, 110.0, 69.0, 59.0, 41.0, 37.0, 24.0, 21.0, 21.0, 12.0, 16.0, 5.0, 4.0, 8.0, 7.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6171875, -9.292724609375, -8.96826171875, -8.643798828125, -8.3193359375, -7.994873046875, -7.67041015625, -7.345947265625, -7.021484375, -6.697021484375, -6.37255859375, -6.048095703125, -5.7236328125, -5.399169921875, -5.07470703125, -4.750244140625, -4.42578125, -4.101318359375, -3.77685546875, -3.452392578125, -3.1279296875, -2.803466796875, -2.47900390625, -2.154541015625, -1.830078125, -1.505615234375, -1.18115234375, -0.856689453125, -0.5322265625, -0.207763671875, 0.11669921875, 0.441162109375, 0.765625, 1.090087890625, 1.41455078125, 1.739013671875, 2.0634765625, 2.387939453125, 2.71240234375, 3.036865234375, 3.361328125, 3.685791015625, 4.01025390625, 4.334716796875, 4.6591796875, 4.983642578125, 5.30810546875, 5.632568359375, 5.95703125, 6.281494140625, 6.60595703125, 6.930419921875, 7.2548828125, 7.579345703125, 7.90380859375, 8.228271484375, 8.552734375, 8.877197265625, 9.20166015625, 9.526123046875, 9.8505859375, 10.175048828125, 10.49951171875, 10.823974609375, 11.1484375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 5.0, 9.0, 16.0, 21.0, 22.0, 38.0, 46.0, 52.0, 72.0, 92.0, 120.0, 161.0, 297.0, 517.0, 1835.0, 298296.0, 3885713.0, 5136.0, 680.0, 360.0, 218.0, 154.0, 93.0, 81.0, 50.0, 43.0, 31.0, 38.0, 20.0, 14.0, 10.0, 10.0, 6.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.625, -66.3505859375, -64.076171875, -61.8017578125, -59.52734375, -57.2529296875, -54.978515625, -52.7041015625, -50.4296875, -48.1552734375, -45.880859375, -43.6064453125, -41.33203125, -39.0576171875, -36.783203125, -34.5087890625, -32.234375, -29.9599609375, -27.685546875, -25.4111328125, -23.13671875, -20.8623046875, -18.587890625, -16.3134765625, -14.0390625, -11.7646484375, -9.490234375, -7.2158203125, -4.94140625, -2.6669921875, -0.392578125, 1.8818359375, 4.15625, 6.4306640625, 8.705078125, 10.9794921875, 13.25390625, 15.5283203125, 17.802734375, 20.0771484375, 22.3515625, 24.6259765625, 26.900390625, 29.1748046875, 31.44921875, 33.7236328125, 35.998046875, 38.2724609375, 40.546875, 42.8212890625, 45.095703125, 47.3701171875, 49.64453125, 51.9189453125, 54.193359375, 56.4677734375, 58.7421875, 61.0166015625, 63.291015625, 65.5654296875, 67.83984375, 70.1142578125, 72.388671875, 74.6630859375, 76.9375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 19.0, 49.0, 118.0, 135.0, 177.0, 173.0, 136.0, 86.0, 58.0, 29.0, 20.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.96239471435547, -64.2294692993164, -62.49654006958008, -60.763614654541016, -59.03068542480469, -57.297760009765625, -55.56483459472656, -53.831905364990234, -52.098976135253906, -50.366050720214844, -48.633121490478516, -46.90019607543945, -45.167266845703125, -43.43434143066406, -41.701416015625, -39.96848678588867, -38.23556137084961, -36.50263595581055, -34.76970672607422, -33.036781311035156, -31.303852081298828, -29.570926666259766, -27.83799934387207, -26.105072021484375, -24.37214469909668, -22.639217376708984, -20.90629005432129, -19.173362731933594, -17.44043731689453, -15.70750904083252, -13.97458267211914, -12.241655349731445, -10.508731842041016, -8.77580451965332, -7.042877674102783, -5.309950828552246, -3.577023506164551, -1.8440961837768555, -0.11116981506347656, 1.6217575073242188, 3.354684829711914, 5.087612152099609, 6.8205389976501465, 8.553465843200684, 10.286393165588379, 12.019320487976074, 13.752246856689453, 15.485174179077148, 17.218101501464844, 18.95102882385254, 20.683956146240234, 22.416881561279297, 24.149810791015625, 25.882736206054688, 27.615663528442383, 29.348590850830078, 31.081518173217773, 32.81444549560547, 34.54737091064453, 36.28030014038086, 38.01322555541992, 39.74615478515625, 41.47908020019531, 43.212005615234375, 44.9449348449707]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 4.0, 4.0, 11.0, 5.0, 9.0, 10.0, 22.0, 21.0, 26.0, 32.0, 31.0, 31.0, 33.0, 37.0, 36.0, 41.0, 42.0, 45.0, 44.0, 40.0, 45.0, 42.0, 48.0, 51.0, 27.0, 41.0, 32.0, 29.0, 24.0, 23.0, 25.0, 17.0, 18.0, 11.0, 9.0, 9.0, 9.0, 6.0, 8.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.00720977783203, -34.65553665161133, -33.30386734008789, -31.952194213867188, -30.600522994995117, -29.248851776123047, -27.897178649902344, -26.545507431030273, -25.193836212158203, -23.842164993286133, -22.490493774414062, -21.13882064819336, -19.78714942932129, -18.43547821044922, -17.083805084228516, -15.732133865356445, -14.380462646484375, -13.028791427612305, -11.677119255065918, -10.325447082519531, -8.973775863647461, -7.622104167938232, -6.270432472229004, -4.918760299682617, -3.567089080810547, -2.2154173851013184, -0.8637456893920898, 0.48792600631713867, 1.8395977020263672, 3.1912693977355957, 4.542941093444824, 5.894613265991211, 7.246284484863281, 8.597955703735352, 9.949627876281738, 11.301300048828125, 12.652971267700195, 14.004642486572266, 15.356314659118652, 16.70798683166504, 18.05965805053711, 19.41132926940918, 20.76300048828125, 22.114673614501953, 23.466344833374023, 24.818016052246094, 26.169689178466797, 27.521360397338867, 28.873031616210938, 30.224702835083008, 31.576374053955078, 32.92804718017578, 34.27971649169922, 35.63138961791992, 36.983062744140625, 38.33473205566406, 39.686405181884766, 41.03807830810547, 42.389747619628906, 43.74142074584961, 45.09309387207031, 46.44476318359375, 47.79643630981445, 49.148109436035156, 50.499778747558594]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 11.0, 16.0, 19.0, 18.0, 27.0, 18.0, 32.0, 17.0, 30.0, 40.0, 38.0, 27.0, 46.0, 40.0, 35.0, 44.0, 44.0, 41.0, 38.0, 34.0, 30.0, 49.0, 38.0, 34.0, 29.0, 30.0, 30.0, 21.0, 19.0, 11.0, 9.0, 14.0, 7.0, 7.0, 7.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.4053955078125, -7.166259765625, -6.9271240234375, -6.68798828125, -6.4488525390625, -6.209716796875, -5.9705810546875, -5.7314453125, -5.4923095703125, -5.253173828125, -5.0140380859375, -4.77490234375, -4.5357666015625, -4.296630859375, -4.0574951171875, -3.818359375, -3.5792236328125, -3.340087890625, -3.1009521484375, -2.86181640625, -2.6226806640625, -2.383544921875, -2.1444091796875, -1.9052734375, -1.6661376953125, -1.427001953125, -1.1878662109375, -0.94873046875, -0.7095947265625, -0.470458984375, -0.2313232421875, 0.0078125, 0.2469482421875, 0.486083984375, 0.7252197265625, 0.96435546875, 1.2034912109375, 1.442626953125, 1.6817626953125, 1.9208984375, 2.1600341796875, 2.399169921875, 2.6383056640625, 2.87744140625, 3.1165771484375, 3.355712890625, 3.5948486328125, 3.833984375, 4.0731201171875, 4.312255859375, 4.5513916015625, 4.79052734375, 5.0296630859375, 5.268798828125, 5.5079345703125, 5.7470703125, 5.9862060546875, 6.225341796875, 6.4644775390625, 6.70361328125, 6.9427490234375, 7.181884765625, 7.4210205078125, 7.66015625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 10.0, 11.0, 24.0, 32.0, 50.0, 72.0, 115.0, 204.0, 267.0, 425.0, 693.0, 1047.0, 1715.0, 2774.0, 4702.0, 7510.0, 12860.0, 22268.0, 39603.0, 71632.0, 134059.0, 263851.0, 223538.0, 115850.0, 62138.0, 34519.0, 19674.0, 11494.0, 6704.0, 4149.0, 2420.0, 1510.0, 966.0, 608.0, 369.0, 248.0, 121.0, 110.0, 57.0, 43.0, 33.0, 22.0, 18.0, 8.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.3505859375, -1.306854248046875, -1.26312255859375, -1.219390869140625, -1.1756591796875, -1.131927490234375, -1.08819580078125, -1.044464111328125, -1.000732421875, -0.957000732421875, -0.91326904296875, -0.869537353515625, -0.8258056640625, -0.782073974609375, -0.73834228515625, -0.694610595703125, -0.65087890625, -0.607147216796875, -0.56341552734375, -0.519683837890625, -0.4759521484375, -0.432220458984375, -0.38848876953125, -0.344757080078125, -0.301025390625, -0.257293701171875, -0.21356201171875, -0.169830322265625, -0.1260986328125, -0.082366943359375, -0.03863525390625, 0.005096435546875, 0.048828125, 0.092559814453125, 0.13629150390625, 0.180023193359375, 0.2237548828125, 0.267486572265625, 0.31121826171875, 0.354949951171875, 0.398681640625, 0.442413330078125, 0.48614501953125, 0.529876708984375, 0.5736083984375, 0.617340087890625, 0.66107177734375, 0.704803466796875, 0.74853515625, 0.792266845703125, 0.83599853515625, 0.879730224609375, 0.9234619140625, 0.967193603515625, 1.01092529296875, 1.054656982421875, 1.098388671875, 1.142120361328125, 1.18585205078125, 1.229583740234375, 1.2733154296875, 1.317047119140625, 1.36077880859375, 1.404510498046875, 1.4482421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 10.0, 7.0, 12.0, 9.0, 13.0, 6.0, 20.0, 20.0, 16.0, 18.0, 22.0, 33.0, 24.0, 29.0, 35.0, 31.0, 32.0, 38.0, 42.0, 43.0, 1064.0, 30.0, 29.0, 37.0, 37.0, 37.0, 32.0, 33.0, 24.0, 36.0, 26.0, 29.0, 17.0, 13.0, 15.0, 20.0, 17.0, 14.0, 18.0, 9.0, 5.0, 4.0, 1.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.07470703125, -3.9384765625, -3.80224609375, -3.666015625, -3.52978515625, -3.3935546875, -3.25732421875, -3.12109375, -2.98486328125, -2.8486328125, -2.71240234375, -2.576171875, -2.43994140625, -2.3037109375, -2.16748046875, -2.03125, -1.89501953125, -1.7587890625, -1.62255859375, -1.486328125, -1.35009765625, -1.2138671875, -1.07763671875, -0.94140625, -0.80517578125, -0.6689453125, -0.53271484375, -0.396484375, -0.26025390625, -0.1240234375, 0.01220703125, 0.1484375, 0.28466796875, 0.4208984375, 0.55712890625, 0.693359375, 0.82958984375, 0.9658203125, 1.10205078125, 1.23828125, 1.37451171875, 1.5107421875, 1.64697265625, 1.783203125, 1.91943359375, 2.0556640625, 2.19189453125, 2.328125, 2.46435546875, 2.6005859375, 2.73681640625, 2.873046875, 3.00927734375, 3.1455078125, 3.28173828125, 3.41796875, 3.55419921875, 3.6904296875, 3.82666015625, 3.962890625, 4.09912109375, 4.2353515625, 4.37158203125, 4.5078125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 10.0, 12.0, 18.0, 30.0, 47.0, 78.0, 88.0, 154.0, 234.0, 327.0, 463.0, 670.0, 995.0, 1450.0, 2050.0, 3068.0, 4617.0, 6708.0, 9916.0, 14897.0, 22525.0, 35266.0, 55791.0, 89944.0, 152458.0, 1286924.0, 155574.0, 91525.0, 56529.0, 35573.0, 22872.0, 15071.0, 10132.0, 6850.0, 4493.0, 3126.0, 2108.0, 1423.0, 975.0, 672.0, 475.0, 329.0, 220.0, 144.0, 103.0, 65.0, 43.0, 31.0, 23.0, 9.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.048828125, -1.016571044921875, -0.98431396484375, -0.952056884765625, -0.9197998046875, -0.887542724609375, -0.85528564453125, -0.823028564453125, -0.790771484375, -0.758514404296875, -0.72625732421875, -0.694000244140625, -0.6617431640625, -0.629486083984375, -0.59722900390625, -0.564971923828125, -0.53271484375, -0.500457763671875, -0.46820068359375, -0.435943603515625, -0.4036865234375, -0.371429443359375, -0.33917236328125, -0.306915283203125, -0.274658203125, -0.242401123046875, -0.21014404296875, -0.177886962890625, -0.1456298828125, -0.113372802734375, -0.08111572265625, -0.048858642578125, -0.0166015625, 0.015655517578125, 0.04791259765625, 0.080169677734375, 0.1124267578125, 0.144683837890625, 0.17694091796875, 0.209197998046875, 0.241455078125, 0.273712158203125, 0.30596923828125, 0.338226318359375, 0.3704833984375, 0.402740478515625, 0.43499755859375, 0.467254638671875, 0.49951171875, 0.531768798828125, 0.56402587890625, 0.596282958984375, 0.6285400390625, 0.660797119140625, 0.69305419921875, 0.725311279296875, 0.757568359375, 0.789825439453125, 0.82208251953125, 0.854339599609375, 0.8865966796875, 0.918853759765625, 0.95111083984375, 0.983367919921875, 1.015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 8.0, 9.0, 15.0, 15.0, 23.0, 21.0, 26.0, 37.0, 39.0, 57.0, 57.0, 53.0, 63.0, 40.0, 71.0, 40.0, 60.0, 39.0, 40.0, 40.0, 35.0, 23.0, 28.0, 23.0, 9.0, 15.0, 13.0, 12.0, 9.0, 15.0, 9.0, 4.0, 2.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006341934204101562, -0.0006148815155029297, -0.0005955696105957031, -0.0005762577056884766, -0.00055694580078125, -0.0005376338958740234, -0.0005183219909667969, -0.0004990100860595703, -0.00047969818115234375, -0.0004603862762451172, -0.0004410743713378906, -0.00042176246643066406, -0.0004024505615234375, -0.00038313865661621094, -0.0003638267517089844, -0.0003445148468017578, -0.00032520294189453125, -0.0003058910369873047, -0.0002865791320800781, -0.00026726722717285156, -0.000247955322265625, -0.00022864341735839844, -0.00020933151245117188, -0.0001900196075439453, -0.00017070770263671875, -0.0001513957977294922, -0.00013208389282226562, -0.00011277198791503906, -9.34600830078125e-05, -7.414817810058594e-05, -5.4836273193359375e-05, -3.552436828613281e-05, -1.621246337890625e-05, 3.0994415283203125e-06, 2.2411346435546875e-05, 4.172325134277344e-05, 6.103515625e-05, 8.034706115722656e-05, 9.965896606445312e-05, 0.00011897087097167969, 0.00013828277587890625, 0.0001575946807861328, 0.00017690658569335938, 0.00019621849060058594, 0.0002155303955078125, 0.00023484230041503906, 0.0002541542053222656, 0.0002734661102294922, 0.00029277801513671875, 0.0003120899200439453, 0.0003314018249511719, 0.00035071372985839844, 0.000370025634765625, 0.00038933753967285156, 0.0004086494445800781, 0.0004279613494873047, 0.00044727325439453125, 0.0004665851593017578, 0.0004858970642089844, 0.0005052089691162109, 0.0005245208740234375, 0.0005438327789306641, 0.0005631446838378906, 0.0005824565887451172, 0.0006017684936523438]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 9.0, 14.0, 13.0, 12.0, 26.0, 24.0, 26.0, 25.0, 52.0, 48.0, 76.0, 95.0, 127.0, 230.0, 482.0, 1099.0, 318087.0, 725454.0, 1328.0, 478.0, 243.0, 138.0, 121.0, 78.0, 49.0, 32.0, 35.0, 32.0, 22.0, 15.0, 18.0, 10.0, 9.0, 8.0, 7.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01404571533203125, -0.013607501983642578, -0.013169288635253906, -0.012731075286865234, -0.012292861938476562, -0.01185464859008789, -0.011416435241699219, -0.010978221893310547, -0.010540008544921875, -0.010101795196533203, -0.009663581848144531, -0.00922536849975586, -0.008787155151367188, -0.008348941802978516, -0.007910728454589844, -0.007472515106201172, -0.0070343017578125, -0.006596088409423828, -0.006157875061035156, -0.005719661712646484, -0.0052814483642578125, -0.004843235015869141, -0.004405021667480469, -0.003966808319091797, -0.003528594970703125, -0.003090381622314453, -0.0026521682739257812, -0.0022139549255371094, -0.0017757415771484375, -0.0013375282287597656, -0.0008993148803710938, -0.0004611015319824219, -2.288818359375e-05, 0.0004153251647949219, 0.0008535385131835938, 0.0012917518615722656, 0.0017299652099609375, 0.0021681785583496094, 0.0026063919067382812, 0.003044605255126953, 0.003482818603515625, 0.003921031951904297, 0.004359245300292969, 0.004797458648681641, 0.0052356719970703125, 0.005673885345458984, 0.006112098693847656, 0.006550312042236328, 0.006988525390625, 0.007426738739013672, 0.007864952087402344, 0.008303165435791016, 0.008741378784179688, 0.00917959213256836, 0.009617805480957031, 0.010056018829345703, 0.010494232177734375, 0.010932445526123047, 0.011370658874511719, 0.01180887222290039, 0.012247085571289062, 0.012685298919677734, 0.013123512268066406, 0.013561725616455078, 0.01399993896484375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 12.0, 76.0, 304.0, 397.0, 183.0, 33.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001418866217136383, -0.001380834262818098, -0.001342802424915135, -0.00130477047059685, -0.001266738516278565, -0.0012287066783756018, -0.0011906747240573168, -0.0011526427697390318, -0.0011146108154207468, -0.0010765788611024618, -0.0010385470231994987, -0.0010005150688812137, -0.0009624831145629287, -0.0009244512184523046, -0.0008864193223416805, -0.0008483873680233955, -0.0008103555301204324, -0.0007723236340098083, -0.0007342916796915233, -0.0006962597835808992, -0.0006582278292626143, -0.0006201959331519902, -0.0005821640370413661, -0.0005441320827230811, -0.000506100186612457, -0.0004680682613980025, -0.000430036336183548, -0.0003920044400729239, -0.00035397251485846937, -0.00031594058964401484, -0.00027790869353339076, -0.00023987676831893623, -0.00020184495951980352, -0.000163813034305349, -0.0001257811236428097, -8.774920570431277e-05, -4.9717287765815854e-05, -1.1685362551361322e-05, 2.634654811117798e-05, 6.437845877371728e-05, 0.00010241038398817182, 0.00014044230920262635, 0.00017847421986516565, 0.00021650613052770495, 0.0002545380557421595, 0.000292569980956614, 0.0003306018770672381, 0.0003686338022816926, 0.00040666572749614716, 0.0004446976527106017, 0.0004827295779250562, 0.0005207614740356803, 0.0005587934283539653, 0.0005968253244645894, 0.0006348572205752134, 0.0006728891748934984, 0.0007109210710041225, 0.0007489529671147466, 0.0007869849214330316, 0.0008250168175436556, 0.0008630487136542797, 0.0009010806679725647, 0.0009391125640831888, 0.0009771444601938128, 0.0010151764145120978]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 6.0, 4.0, 10.0, 7.0, 8.0, 9.0, 7.0, 20.0, 20.0, 19.0, 26.0, 24.0, 30.0, 31.0, 44.0, 33.0, 34.0, 23.0, 38.0, 38.0, 46.0, 30.0, 40.0, 56.0, 32.0, 41.0, 44.0, 36.0, 26.0, 31.0, 16.0, 30.0, 28.0, 18.0, 20.0, 14.0, 13.0, 9.0, 11.0, 13.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003337860107421875, -0.00032325461506843567, -0.00031272321939468384, -0.000302191823720932, -0.0002916604280471802, -0.00028112903237342834, -0.0002705976366996765, -0.0002600662410259247, -0.00024953484535217285, -0.00023900344967842102, -0.0002284720540046692, -0.00021794065833091736, -0.00020740926265716553, -0.0001968778669834137, -0.00018634647130966187, -0.00017581507563591003, -0.0001652836799621582, -0.00015475228428840637, -0.00014422088861465454, -0.0001336894929409027, -0.00012315809726715088, -0.00011262670159339905, -0.00010209530591964722, -9.156391024589539e-05, -8.103251457214355e-05, -7.050111889839172e-05, -5.996972322463989e-05, -4.943832755088806e-05, -3.890693187713623e-05, -2.83755362033844e-05, -1.784414052963257e-05, -7.312744855880737e-06, 3.2186508178710938e-06, 1.3750046491622925e-05, 2.4281442165374756e-05, 3.481283783912659e-05, 4.534423351287842e-05, 5.587562918663025e-05, 6.640702486038208e-05, 7.693842053413391e-05, 8.746981620788574e-05, 9.800121188163757e-05, 0.0001085326075553894, 0.00011906400322914124, 0.00012959539890289307, 0.0001401267945766449, 0.00015065819025039673, 0.00016118958592414856, 0.0001717209815979004, 0.00018225237727165222, 0.00019278377294540405, 0.00020331516861915588, 0.00021384656429290771, 0.00022437795996665955, 0.00023490935564041138, 0.0002454407513141632, 0.00025597214698791504, 0.00026650354266166687, 0.0002770349383354187, 0.00028756633400917053, 0.00029809772968292236, 0.0003086291253566742, 0.000319160521030426, 0.00032969191670417786, 0.0003402233123779297]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 11.0, 16.0, 19.0, 18.0, 27.0, 18.0, 32.0, 17.0, 30.0, 40.0, 38.0, 27.0, 46.0, 40.0, 35.0, 44.0, 44.0, 41.0, 38.0, 34.0, 30.0, 49.0, 38.0, 34.0, 29.0, 30.0, 30.0, 21.0, 19.0, 11.0, 9.0, 14.0, 7.0, 7.0, 7.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.4053955078125, -7.166259765625, -6.9271240234375, -6.68798828125, -6.4488525390625, -6.209716796875, -5.9705810546875, -5.7314453125, -5.4923095703125, -5.253173828125, -5.0140380859375, -4.77490234375, -4.5357666015625, -4.296630859375, -4.0574951171875, -3.818359375, -3.5792236328125, -3.340087890625, -3.1009521484375, -2.86181640625, -2.6226806640625, -2.383544921875, -2.1444091796875, -1.9052734375, -1.6661376953125, -1.427001953125, -1.1878662109375, -0.94873046875, -0.7095947265625, -0.470458984375, -0.2313232421875, 0.0078125, 0.2469482421875, 0.486083984375, 0.7252197265625, 0.96435546875, 1.2034912109375, 1.442626953125, 1.6817626953125, 1.9208984375, 2.1600341796875, 2.399169921875, 2.6383056640625, 2.87744140625, 3.1165771484375, 3.355712890625, 3.5948486328125, 3.833984375, 4.0731201171875, 4.312255859375, 4.5513916015625, 4.79052734375, 5.0296630859375, 5.268798828125, 5.5079345703125, 5.7470703125, 5.9862060546875, 6.225341796875, 6.4644775390625, 6.70361328125, 6.9427490234375, 7.181884765625, 7.4210205078125, 7.66015625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 6.0, 11.0, 15.0, 17.0, 24.0, 28.0, 50.0, 61.0, 88.0, 108.0, 138.0, 180.0, 244.0, 342.0, 497.0, 706.0, 1279.0, 4113.0, 26305.0, 595492.0, 390516.0, 21036.0, 3641.0, 1120.0, 651.0, 488.0, 358.0, 284.0, 192.0, 137.0, 102.0, 77.0, 55.0, 36.0, 22.0, 34.0, 22.0, 16.0, 12.0, 10.0, 7.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.34375, -18.73828125, -18.1328125, -17.52734375, -16.921875, -16.31640625, -15.7109375, -15.10546875, -14.5, -13.89453125, -13.2890625, -12.68359375, -12.078125, -11.47265625, -10.8671875, -10.26171875, -9.65625, -9.05078125, -8.4453125, -7.83984375, -7.234375, -6.62890625, -6.0234375, -5.41796875, -4.8125, -4.20703125, -3.6015625, -2.99609375, -2.390625, -1.78515625, -1.1796875, -0.57421875, 0.03125, 0.63671875, 1.2421875, 1.84765625, 2.453125, 3.05859375, 3.6640625, 4.26953125, 4.875, 5.48046875, 6.0859375, 6.69140625, 7.296875, 7.90234375, 8.5078125, 9.11328125, 9.71875, 10.32421875, 10.9296875, 11.53515625, 12.140625, 12.74609375, 13.3515625, 13.95703125, 14.5625, 15.16796875, 15.7734375, 16.37890625, 16.984375, 17.58984375, 18.1953125, 18.80078125, 19.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 4.0, 7.0, 18.0, 15.0, 16.0, 13.0, 25.0, 29.0, 26.0, 23.0, 39.0, 39.0, 41.0, 56.0, 52.0, 105.0, 1564.0, 428.0, 90.0, 54.0, 45.0, 49.0, 40.0, 38.0, 36.0, 32.0, 18.0, 25.0, 19.0, 16.0, 14.0, 16.0, 13.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.09375, -23.3623046875, -22.630859375, -21.8994140625, -21.16796875, -20.4365234375, -19.705078125, -18.9736328125, -18.2421875, -17.5107421875, -16.779296875, -16.0478515625, -15.31640625, -14.5849609375, -13.853515625, -13.1220703125, -12.390625, -11.6591796875, -10.927734375, -10.1962890625, -9.46484375, -8.7333984375, -8.001953125, -7.2705078125, -6.5390625, -5.8076171875, -5.076171875, -4.3447265625, -3.61328125, -2.8818359375, -2.150390625, -1.4189453125, -0.6875, 0.0439453125, 0.775390625, 1.5068359375, 2.23828125, 2.9697265625, 3.701171875, 4.4326171875, 5.1640625, 5.8955078125, 6.626953125, 7.3583984375, 8.08984375, 8.8212890625, 9.552734375, 10.2841796875, 11.015625, 11.7470703125, 12.478515625, 13.2099609375, 13.94140625, 14.6728515625, 15.404296875, 16.1357421875, 16.8671875, 17.5986328125, 18.330078125, 19.0615234375, 19.79296875, 20.5244140625, 21.255859375, 21.9873046875, 22.71875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 1.0, 3.0, 5.0, 3.0, 13.0, 10.0, 19.0, 14.0, 19.0, 20.0, 27.0, 30.0, 28.0, 37.0, 60.0, 70.0, 103.0, 197.0, 326.0, 959.0, 19838.0, 3113929.0, 8364.0, 758.0, 304.0, 164.0, 99.0, 50.0, 43.0, 31.0, 32.0, 33.0, 26.0, 16.0, 21.0, 16.0, 10.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.625, -62.5673828125, -60.509765625, -58.4521484375, -56.39453125, -54.3369140625, -52.279296875, -50.2216796875, -48.1640625, -46.1064453125, -44.048828125, -41.9912109375, -39.93359375, -37.8759765625, -35.818359375, -33.7607421875, -31.703125, -29.6455078125, -27.587890625, -25.5302734375, -23.47265625, -21.4150390625, -19.357421875, -17.2998046875, -15.2421875, -13.1845703125, -11.126953125, -9.0693359375, -7.01171875, -4.9541015625, -2.896484375, -0.8388671875, 1.21875, 3.2763671875, 5.333984375, 7.3916015625, 9.44921875, 11.5068359375, 13.564453125, 15.6220703125, 17.6796875, 19.7373046875, 21.794921875, 23.8525390625, 25.91015625, 27.9677734375, 30.025390625, 32.0830078125, 34.140625, 36.1982421875, 38.255859375, 40.3134765625, 42.37109375, 44.4287109375, 46.486328125, 48.5439453125, 50.6015625, 52.6591796875, 54.716796875, 56.7744140625, 58.83203125, 60.8896484375, 62.947265625, 65.0048828125, 67.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 226.0, 643.0, 131.0, 8.0, 0.0, 0.0, 1.0], "bins": [-178.9009552001953, -175.83958435058594, -172.7781982421875, -169.71682739257812, -166.6554412841797, -163.5940704345703, -160.53268432617188, -157.4713134765625, -154.40992736816406, -151.3485565185547, -148.28717041015625, -145.22579956054688, -142.16441345214844, -139.10304260253906, -136.04165649414062, -132.98028564453125, -129.91891479492188, -126.85753631591797, -123.79615783691406, -120.73477935791016, -117.67340087890625, -114.61203002929688, -111.55064392089844, -108.48927307128906, -105.42788696289062, -102.36650848388672, -99.30513000488281, -96.2437515258789, -93.182373046875, -90.12100219726562, -87.05961608886719, -83.99824523925781, -80.93685913085938, -77.87548065185547, -74.81410217285156, -71.75272369384766, -68.69134521484375, -65.62997436523438, -62.5685920715332, -59.50721740722656, -56.445838928222656, -53.38446044921875, -50.323081970214844, -47.26170349121094, -44.2003288269043, -41.13895034790039, -38.077571868896484, -35.016197204589844, -31.954818725585938, -28.89344024658203, -25.832063674926758, -22.77068519592285, -19.709308624267578, -16.647930145263672, -13.586551666259766, -10.525175094604492, -7.463796615600586, -4.402419090270996, -1.341041088104248, 1.7203369140625, 4.78171443939209, 7.84309196472168, 10.904470443725586, 13.96584701538086, 17.027225494384766]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 6.0, 4.0, 5.0, 15.0, 9.0, 9.0, 10.0, 23.0, 15.0, 17.0, 23.0, 29.0, 18.0, 38.0, 42.0, 28.0, 35.0, 43.0, 46.0, 39.0, 51.0, 38.0, 51.0, 35.0, 39.0, 38.0, 24.0, 38.0, 29.0, 39.0, 24.0, 21.0, 11.0, 20.0, 19.0, 10.0, 17.0, 10.0, 7.0, 6.0, 5.0, 10.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-55.071990966796875, -53.43459701538086, -51.797203063964844, -50.15980529785156, -48.52241134643555, -46.88501739501953, -45.247623443603516, -43.6102294921875, -41.972835540771484, -40.33544158935547, -38.69804763793945, -37.06065368652344, -35.423255920410156, -33.78586196899414, -32.148468017578125, -30.51107406616211, -28.87367820739746, -27.236284255981445, -25.598888397216797, -23.96149444580078, -22.324100494384766, -20.68670654296875, -19.0493106842041, -17.411916732788086, -15.774521827697754, -14.137126922607422, -12.499732971191406, -10.862338066101074, -9.224943161010742, -7.587549209594727, -5.9501543045043945, -4.312760353088379, -2.675365447998047, -1.0379709005355835, 0.5994236469268799, 2.236818313598633, 3.8742127418518066, 5.5116071701049805, 7.1490020751953125, 8.786396026611328, 10.42379093170166, 12.061185836791992, 13.698579788208008, 15.33597469329834, 16.973369598388672, 18.610763549804688, 20.248157501220703, 21.88555145263672, 23.522947311401367, 25.160341262817383, 26.79773712158203, 28.435131072998047, 30.072525024414062, 31.709918975830078, 33.347312927246094, 34.984710693359375, 36.62210464477539, 38.259498596191406, 39.89689254760742, 41.53428649902344, 43.17168426513672, 44.809078216552734, 46.44647216796875, 48.083866119384766, 49.72126007080078]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 12.0, 8.0, 13.0, 14.0, 12.0, 21.0, 16.0, 18.0, 26.0, 31.0, 26.0, 22.0, 27.0, 30.0, 39.0, 41.0, 39.0, 31.0, 36.0, 40.0, 38.0, 38.0, 30.0, 42.0, 38.0, 35.0, 44.0, 28.0, 23.0, 22.0, 24.0, 21.0, 18.0, 9.0, 13.0, 10.0, 13.0, 11.0, 11.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.07391357421875, -6.8470458984375, -6.62017822265625, -6.393310546875, -6.16644287109375, -5.9395751953125, -5.71270751953125, -5.48583984375, -5.25897216796875, -5.0321044921875, -4.80523681640625, -4.578369140625, -4.35150146484375, -4.1246337890625, -3.89776611328125, -3.6708984375, -3.44403076171875, -3.2171630859375, -2.99029541015625, -2.763427734375, -2.53656005859375, -2.3096923828125, -2.08282470703125, -1.85595703125, -1.62908935546875, -1.4022216796875, -1.17535400390625, -0.948486328125, -0.72161865234375, -0.4947509765625, -0.26788330078125, -0.041015625, 0.18585205078125, 0.4127197265625, 0.63958740234375, 0.866455078125, 1.09332275390625, 1.3201904296875, 1.54705810546875, 1.77392578125, 2.00079345703125, 2.2276611328125, 2.45452880859375, 2.681396484375, 2.90826416015625, 3.1351318359375, 3.36199951171875, 3.5888671875, 3.81573486328125, 4.0426025390625, 4.26947021484375, 4.496337890625, 4.72320556640625, 4.9500732421875, 5.17694091796875, 5.40380859375, 5.63067626953125, 5.8575439453125, 6.08441162109375, 6.311279296875, 6.53814697265625, 6.7650146484375, 6.99188232421875, 7.21875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 7.0, 2.0, 5.0, 6.0, 1.0, 10.0, 11.0, 3.0, 24.0, 28.0, 23.0, 46.0, 58.0, 62.0, 65.0, 95.0, 116.0, 183.0, 250.0, 377.0, 656.0, 1349.0, 3568.0, 13821.0, 129338.0, 1938843.0, 1947696.0, 136701.0, 14029.0, 3599.0, 1385.0, 604.0, 371.0, 217.0, 180.0, 127.0, 88.0, 74.0, 65.0, 30.0, 34.0, 30.0, 21.0, 19.0, 21.0, 11.0, 13.0, 10.0, 4.0, 5.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.1162109375, -15.560546875, -15.0048828125, -14.44921875, -13.8935546875, -13.337890625, -12.7822265625, -12.2265625, -11.6708984375, -11.115234375, -10.5595703125, -10.00390625, -9.4482421875, -8.892578125, -8.3369140625, -7.78125, -7.2255859375, -6.669921875, -6.1142578125, -5.55859375, -5.0029296875, -4.447265625, -3.8916015625, -3.3359375, -2.7802734375, -2.224609375, -1.6689453125, -1.11328125, -0.5576171875, -0.001953125, 0.5537109375, 1.109375, 1.6650390625, 2.220703125, 2.7763671875, 3.33203125, 3.8876953125, 4.443359375, 4.9990234375, 5.5546875, 6.1103515625, 6.666015625, 7.2216796875, 7.77734375, 8.3330078125, 8.888671875, 9.4443359375, 10.0, 10.5556640625, 11.111328125, 11.6669921875, 12.22265625, 12.7783203125, 13.333984375, 13.8896484375, 14.4453125, 15.0009765625, 15.556640625, 16.1123046875, 16.66796875, 17.2236328125, 17.779296875, 18.3349609375, 18.890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 10.0, 17.0, 19.0, 20.0, 44.0, 62.0, 84.0, 117.0, 148.0, 249.0, 399.0, 563.0, 616.0, 575.0, 392.0, 250.0, 165.0, 92.0, 81.0, 59.0, 32.0, 25.0, 15.0, 13.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.31005859375, -13.8076171875, -13.30517578125, -12.802734375, -12.30029296875, -11.7978515625, -11.29541015625, -10.79296875, -10.29052734375, -9.7880859375, -9.28564453125, -8.783203125, -8.28076171875, -7.7783203125, -7.27587890625, -6.7734375, -6.27099609375, -5.7685546875, -5.26611328125, -4.763671875, -4.26123046875, -3.7587890625, -3.25634765625, -2.75390625, -2.25146484375, -1.7490234375, -1.24658203125, -0.744140625, -0.24169921875, 0.2607421875, 0.76318359375, 1.265625, 1.76806640625, 2.2705078125, 2.77294921875, 3.275390625, 3.77783203125, 4.2802734375, 4.78271484375, 5.28515625, 5.78759765625, 6.2900390625, 6.79248046875, 7.294921875, 7.79736328125, 8.2998046875, 8.80224609375, 9.3046875, 9.80712890625, 10.3095703125, 10.81201171875, 11.314453125, 11.81689453125, 12.3193359375, 12.82177734375, 13.32421875, 13.82666015625, 14.3291015625, 14.83154296875, 15.333984375, 15.83642578125, 16.3388671875, 16.84130859375, 17.34375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 9.0, 15.0, 20.0, 23.0, 34.0, 43.0, 54.0, 78.0, 114.0, 125.0, 184.0, 313.0, 668.0, 2208.0, 45152.0, 4049742.0, 90533.0, 3013.0, 780.0, 324.0, 217.0, 131.0, 110.0, 104.0, 73.0, 41.0, 36.0, 25.0, 15.0, 24.0, 10.0, 19.0, 5.0, 5.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.9375, -49.21484375, -47.4921875, -45.76953125, -44.046875, -42.32421875, -40.6015625, -38.87890625, -37.15625, -35.43359375, -33.7109375, -31.98828125, -30.265625, -28.54296875, -26.8203125, -25.09765625, -23.375, -21.65234375, -19.9296875, -18.20703125, -16.484375, -14.76171875, -13.0390625, -11.31640625, -9.59375, -7.87109375, -6.1484375, -4.42578125, -2.703125, -0.98046875, 0.7421875, 2.46484375, 4.1875, 5.91015625, 7.6328125, 9.35546875, 11.078125, 12.80078125, 14.5234375, 16.24609375, 17.96875, 19.69140625, 21.4140625, 23.13671875, 24.859375, 26.58203125, 28.3046875, 30.02734375, 31.75, 33.47265625, 35.1953125, 36.91796875, 38.640625, 40.36328125, 42.0859375, 43.80859375, 45.53125, 47.25390625, 48.9765625, 50.69921875, 52.421875, 54.14453125, 55.8671875, 57.58984375, 59.3125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 37.0, 138.0, 304.0, 348.0, 131.0, 36.0, 8.0, 2.0, 4.0], "bins": [-213.93435668945312, -210.24412536621094, -206.55389404296875, -202.86366271972656, -199.17343139648438, -195.48321533203125, -191.79298400878906, -188.10275268554688, -184.4125213623047, -180.7222900390625, -177.0320587158203, -173.34182739257812, -169.65159606933594, -165.96136474609375, -162.27114868164062, -158.58091735839844, -154.89068603515625, -151.20045471191406, -147.51022338867188, -143.8199920654297, -140.1297607421875, -136.43954467773438, -132.7493133544922, -129.05908203125, -125.36884307861328, -121.6786117553711, -117.9883804321289, -114.29815673828125, -110.60792541503906, -106.91769409179688, -103.22746276855469, -99.5372314453125, -95.84700012207031, -92.15676879882812, -88.46653747558594, -84.77631378173828, -81.0860824584961, -77.3958511352539, -73.70561981201172, -70.01539611816406, -66.32516479492188, -62.63493347167969, -58.944705963134766, -55.25447463989258, -51.564247131347656, -47.87401580810547, -44.18378448486328, -40.49355697631836, -36.80332946777344, -33.11309814453125, -29.422870635986328, -25.73263931274414, -22.04241180419922, -18.35218048095703, -14.661951065063477, -10.971721649169922, -7.281492233276367, -3.5912625789642334, 0.09896707534790039, 3.7891969680786133, 7.479426383972168, 11.169656753540039, 14.859886169433594, 18.55011558532715, 22.240345001220703]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 5.0, 6.0, 3.0, 4.0, 10.0, 11.0, 10.0, 14.0, 15.0, 17.0, 19.0, 26.0, 27.0, 25.0, 19.0, 24.0, 29.0, 37.0, 38.0, 39.0, 40.0, 31.0, 32.0, 34.0, 46.0, 31.0, 47.0, 33.0, 26.0, 32.0, 47.0, 23.0, 23.0, 13.0, 18.0, 14.0, 25.0, 16.0, 16.0, 9.0, 15.0, 12.0, 10.0, 3.0, 11.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-35.75941467285156, -34.63930130004883, -33.51919174194336, -32.399078369140625, -31.27896499633789, -30.15885353088379, -29.038742065429688, -27.918628692626953, -26.79851722717285, -25.67840576171875, -24.558292388916016, -23.438180923461914, -22.318069458007812, -21.197956085205078, -20.077844619750977, -18.957733154296875, -17.83761978149414, -16.71750831604004, -15.597394943237305, -14.477283477783203, -13.357171058654785, -12.237058639526367, -11.116947174072266, -9.996834754943848, -8.87672233581543, -7.756609916687012, -6.636497974395752, -5.516386032104492, -4.396273612976074, -3.2761611938476562, -2.1560492515563965, -1.0359373092651367, 0.08417510986328125, 1.2042872905731201, 2.324399471282959, 3.444511651992798, 4.564623832702637, 5.684736251831055, 6.8048481941223145, 7.924960136413574, 9.045072555541992, 10.16518497467041, 11.285297393798828, 12.40540885925293, 13.525521278381348, 14.645633697509766, 15.765745162963867, 16.88585662841797, 18.005970001220703, 19.126081466674805, 20.24619483947754, 21.36630630493164, 22.486419677734375, 23.606531143188477, 24.726642608642578, 25.846755981445312, 26.966867446899414, 28.086978912353516, 29.20709228515625, 30.32720375061035, 31.447315216064453, 32.56742858886719, 33.68754196166992, 34.80765151977539, 35.927764892578125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 6.0, 6.0, 12.0, 13.0, 6.0, 22.0, 17.0, 19.0, 23.0, 34.0, 22.0, 27.0, 28.0, 37.0, 42.0, 34.0, 31.0, 43.0, 35.0, 40.0, 43.0, 46.0, 38.0, 31.0, 33.0, 30.0, 33.0, 30.0, 28.0, 22.0, 27.0, 14.0, 18.0, 19.0, 16.0, 13.0, 9.0, 9.0, 10.0, 4.0, 8.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51953125, -7.28167724609375, -7.0438232421875, -6.80596923828125, -6.568115234375, -6.33026123046875, -6.0924072265625, -5.85455322265625, -5.61669921875, -5.37884521484375, -5.1409912109375, -4.90313720703125, -4.665283203125, -4.42742919921875, -4.1895751953125, -3.95172119140625, -3.7138671875, -3.47601318359375, -3.2381591796875, -3.00030517578125, -2.762451171875, -2.52459716796875, -2.2867431640625, -2.04888916015625, -1.81103515625, -1.57318115234375, -1.3353271484375, -1.09747314453125, -0.859619140625, -0.62176513671875, -0.3839111328125, -0.14605712890625, 0.091796875, 0.32965087890625, 0.5675048828125, 0.80535888671875, 1.043212890625, 1.28106689453125, 1.5189208984375, 1.75677490234375, 1.99462890625, 2.23248291015625, 2.4703369140625, 2.70819091796875, 2.946044921875, 3.18389892578125, 3.4217529296875, 3.65960693359375, 3.8974609375, 4.13531494140625, 4.3731689453125, 4.61102294921875, 4.848876953125, 5.08673095703125, 5.3245849609375, 5.56243896484375, 5.80029296875, 6.03814697265625, 6.2760009765625, 6.51385498046875, 6.751708984375, 6.98956298828125, 7.2274169921875, 7.46527099609375, 7.703125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 4.0, 9.0, 7.0, 20.0, 22.0, 37.0, 43.0, 85.0, 105.0, 166.0, 227.0, 354.0, 438.0, 709.0, 1024.0, 1466.0, 2186.0, 3143.0, 4669.0, 6694.0, 10090.0, 15057.0, 22638.0, 34451.0, 53758.0, 85829.0, 141256.0, 224005.0, 163757.0, 98493.0, 61074.0, 39031.0, 25544.0, 16981.0, 11381.0, 7714.0, 5004.0, 3476.0, 2380.0, 1603.0, 1092.0, 778.0, 511.0, 378.0, 290.0, 189.0, 141.0, 77.0, 46.0, 44.0, 38.0, 16.0, 13.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0791015625, -1.0449981689453125, -1.010894775390625, -0.9767913818359375, -0.94268798828125, -0.9085845947265625, -0.874481201171875, -0.8403778076171875, -0.8062744140625, -0.7721710205078125, -0.738067626953125, -0.7039642333984375, -0.66986083984375, -0.6357574462890625, -0.601654052734375, -0.5675506591796875, -0.533447265625, -0.4993438720703125, -0.465240478515625, -0.4311370849609375, -0.39703369140625, -0.3629302978515625, -0.328826904296875, -0.2947235107421875, -0.2606201171875, -0.2265167236328125, -0.192413330078125, -0.1583099365234375, -0.12420654296875, -0.0901031494140625, -0.055999755859375, -0.0218963623046875, 0.01220703125, 0.0463104248046875, 0.080413818359375, 0.1145172119140625, 0.14862060546875, 0.1827239990234375, 0.216827392578125, 0.2509307861328125, 0.2850341796875, 0.3191375732421875, 0.353240966796875, 0.3873443603515625, 0.42144775390625, 0.4555511474609375, 0.489654541015625, 0.5237579345703125, 0.557861328125, 0.5919647216796875, 0.626068115234375, 0.6601715087890625, 0.69427490234375, 0.7283782958984375, 0.762481689453125, 0.7965850830078125, 0.8306884765625, 0.8647918701171875, 0.898895263671875, 0.9329986572265625, 0.96710205078125, 1.0012054443359375, 1.035308837890625, 1.0694122314453125, 1.103515625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 8.0, 10.0, 10.0, 8.0, 18.0, 13.0, 27.0, 23.0, 28.0, 29.0, 25.0, 25.0, 23.0, 34.0, 41.0, 45.0, 34.0, 37.0, 1069.0, 38.0, 34.0, 30.0, 50.0, 37.0, 35.0, 40.0, 40.0, 23.0, 24.0, 29.0, 19.0, 19.0, 11.0, 13.0, 12.0, 5.0, 9.0, 6.0, 12.0, 1.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2972412109375, -5.141357421875, -4.9854736328125, -4.82958984375, -4.6737060546875, -4.517822265625, -4.3619384765625, -4.2060546875, -4.0501708984375, -3.894287109375, -3.7384033203125, -3.58251953125, -3.4266357421875, -3.270751953125, -3.1148681640625, -2.958984375, -2.8031005859375, -2.647216796875, -2.4913330078125, -2.33544921875, -2.1795654296875, -2.023681640625, -1.8677978515625, -1.7119140625, -1.5560302734375, -1.400146484375, -1.2442626953125, -1.08837890625, -0.9324951171875, -0.776611328125, -0.6207275390625, -0.46484375, -0.3089599609375, -0.153076171875, 0.0028076171875, 0.15869140625, 0.3145751953125, 0.470458984375, 0.6263427734375, 0.7822265625, 0.9381103515625, 1.093994140625, 1.2498779296875, 1.40576171875, 1.5616455078125, 1.717529296875, 1.8734130859375, 2.029296875, 2.1851806640625, 2.341064453125, 2.4969482421875, 2.65283203125, 2.8087158203125, 2.964599609375, 3.1204833984375, 3.2763671875, 3.4322509765625, 3.588134765625, 3.7440185546875, 3.89990234375, 4.0557861328125, 4.211669921875, 4.3675537109375, 4.5234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 9.0, 12.0, 25.0, 41.0, 46.0, 91.0, 138.0, 172.0, 277.0, 379.0, 615.0, 920.0, 1456.0, 2094.0, 3098.0, 4694.0, 7172.0, 10883.0, 17039.0, 26863.0, 44315.0, 74643.0, 131300.0, 1289586.0, 201971.0, 110593.0, 63961.0, 38149.0, 23508.0, 14746.0, 9713.0, 6277.0, 4163.0, 2711.0, 1828.0, 1251.0, 801.0, 558.0, 353.0, 229.0, 158.0, 102.0, 63.0, 48.0, 28.0, 17.0, 13.0, 8.0, 4.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.169921875, -1.1320037841796875, -1.094085693359375, -1.0561676025390625, -1.01824951171875, -0.9803314208984375, -0.942413330078125, -0.9044952392578125, -0.8665771484375, -0.8286590576171875, -0.790740966796875, -0.7528228759765625, -0.71490478515625, -0.6769866943359375, -0.639068603515625, -0.6011505126953125, -0.563232421875, -0.5253143310546875, -0.487396240234375, -0.4494781494140625, -0.41156005859375, -0.3736419677734375, -0.335723876953125, -0.2978057861328125, -0.2598876953125, -0.2219696044921875, -0.184051513671875, -0.1461334228515625, -0.10821533203125, -0.0702972412109375, -0.032379150390625, 0.0055389404296875, 0.04345703125, 0.0813751220703125, 0.119293212890625, 0.1572113037109375, 0.19512939453125, 0.2330474853515625, 0.270965576171875, 0.3088836669921875, 0.3468017578125, 0.3847198486328125, 0.422637939453125, 0.4605560302734375, 0.49847412109375, 0.5363922119140625, 0.574310302734375, 0.6122283935546875, 0.650146484375, 0.6880645751953125, 0.725982666015625, 0.7639007568359375, 0.80181884765625, 0.8397369384765625, 0.877655029296875, 0.9155731201171875, 0.9534912109375, 0.9914093017578125, 1.029327392578125, 1.0672454833984375, 1.10516357421875, 1.1430816650390625, 1.180999755859375, 1.2189178466796875, 1.2568359375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 4.0, 3.0, 7.0, 16.0, 12.0, 17.0, 17.0, 18.0, 29.0, 37.0, 53.0, 68.0, 71.0, 91.0, 84.0, 84.0, 79.0, 69.0, 42.0, 47.0, 33.0, 27.0, 19.0, 21.0, 14.0, 12.0, 6.0, 10.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010671615600585938, -0.0010363012552261353, -0.0010054409503936768, -0.0009745806455612183, -0.0009437203407287598, -0.0009128600358963013, -0.0008819997310638428, -0.0008511394262313843, -0.0008202791213989258, -0.0007894188165664673, -0.0007585585117340088, -0.0007276982069015503, -0.0006968379020690918, -0.0006659775972366333, -0.0006351172924041748, -0.0006042569875717163, -0.0005733966827392578, -0.0005425363779067993, -0.0005116760730743408, -0.0004808157682418823, -0.00044995546340942383, -0.00041909515857696533, -0.00038823485374450684, -0.00035737454891204834, -0.00032651424407958984, -0.00029565393924713135, -0.00026479363441467285, -0.00023393332958221436, -0.00020307302474975586, -0.00017221271991729736, -0.00014135241508483887, -0.00011049211025238037, -7.963180541992188e-05, -4.877150058746338e-05, -1.7911195755004883e-05, 1.2949109077453613e-05, 4.380941390991211e-05, 7.46697187423706e-05, 0.0001055300235748291, 0.0001363903284072876, 0.0001672506332397461, 0.0001981109380722046, 0.00022897124290466309, 0.0002598315477371216, 0.0002906918525695801, 0.0003215521574020386, 0.00035241246223449707, 0.00038327276706695557, 0.00041413307189941406, 0.00044499337673187256, 0.00047585368156433105, 0.0005067139863967896, 0.000537574291229248, 0.0005684345960617065, 0.000599294900894165, 0.0006301552057266235, 0.000661015510559082, 0.0006918758153915405, 0.000722736120223999, 0.0007535964250564575, 0.000784456729888916, 0.0008153170347213745, 0.000846177339553833, 0.0008770376443862915, 0.00090789794921875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 15.0, 11.0, 15.0, 24.0, 36.0, 38.0, 47.0, 70.0, 98.0, 157.0, 308.0, 575.0, 3473.0, 1038840.0, 3403.0, 605.0, 287.0, 164.0, 91.0, 68.0, 59.0, 42.0, 26.0, 26.0, 11.0, 20.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.018646240234375, -0.018014192581176758, -0.017382144927978516, -0.016750097274780273, -0.01611804962158203, -0.015486001968383789, -0.014853954315185547, -0.014221906661987305, -0.013589859008789062, -0.01295781135559082, -0.012325763702392578, -0.011693716049194336, -0.011061668395996094, -0.010429620742797852, -0.00979757308959961, -0.009165525436401367, -0.008533477783203125, -0.007901430130004883, -0.007269382476806641, -0.0066373348236083984, -0.006005287170410156, -0.005373239517211914, -0.004741191864013672, -0.00410914421081543, -0.0034770965576171875, -0.0028450489044189453, -0.002213001251220703, -0.001580953598022461, -0.0009489059448242188, -0.00031685829162597656, 0.0003151893615722656, 0.0009472370147705078, 0.00157928466796875, 0.002211332321166992, 0.0028433799743652344, 0.0034754276275634766, 0.004107475280761719, 0.004739522933959961, 0.005371570587158203, 0.006003618240356445, 0.0066356658935546875, 0.00726771354675293, 0.007899761199951172, 0.008531808853149414, 0.009163856506347656, 0.009795904159545898, 0.01042795181274414, 0.011059999465942383, 0.011692047119140625, 0.012324094772338867, 0.01295614242553711, 0.013588190078735352, 0.014220237731933594, 0.014852285385131836, 0.015484333038330078, 0.01611638069152832, 0.016748428344726562, 0.017380475997924805, 0.018012523651123047, 0.01864457130432129, 0.01927661895751953, 0.019908666610717773, 0.020540714263916016, 0.021172761917114258, 0.0218048095703125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 12.0, 14.0, 38.0, 64.0, 118.0, 160.0, 200.0, 158.0, 100.0, 68.0, 39.0, 18.0, 17.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004894381272606552, -0.0004709027416538447, -0.00045236735604703426, -0.0004338319704402238, -0.00041529658483341336, -0.00039676117012277246, -0.000378225784515962, -0.00035969039890915155, -0.0003411550133023411, -0.00032261962769553065, -0.0003040842420887202, -0.00028554885648190975, -0.00026701344177126884, -0.00024847808526828885, -0.00022994267055764794, -0.0002114072849508375, -0.00019287189934402704, -0.0001743365137372166, -0.00015580112813040614, -0.00013726572797168046, -0.00011873034236487001, -0.00010019495675805956, -8.16595638752915e-05, -6.312417099252343e-05, -4.458878538571298e-05, -2.6053396140923724e-05, -7.518006896134466e-06, 1.1017382348654792e-05, 2.955277159344405e-05, 4.80881572002545e-05, 6.662355008302256e-05, 8.515894296579063e-05, 0.00010369427036494017, 0.00012222965597175062, 0.00014076504157856107, 0.00015930044173728675, 0.0001778358273440972, 0.00019637121295090765, 0.00021490661310963333, 0.00023344199871644378, 0.00025197738432325423, 0.0002705127699300647, 0.00028904815553687513, 0.0003075835411436856, 0.0003261189558543265, 0.0003446543123573065, 0.0003631897270679474, 0.00038172511267475784, 0.0004002604982815683, 0.00041879588388837874, 0.0004373312694951892, 0.00045586665510199964, 0.0004744020407088101, 0.000492937455419451, 0.000511472811922431, 0.0005300082266330719, 0.0005485436413437128, 0.0005670790560543537, 0.0005856144125573337, 0.0006041498272679746, 0.0006226851837709546, 0.0006412205984815955, 0.0006597559549845755, 0.0006782913696952164, 0.0006968267261981964]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 4.0, 5.0, 8.0, 13.0, 11.0, 14.0, 18.0, 17.0, 19.0, 26.0, 20.0, 27.0, 29.0, 30.0, 48.0, 32.0, 23.0, 40.0, 41.0, 27.0, 33.0, 47.0, 40.0, 41.0, 27.0, 39.0, 38.0, 25.0, 26.0, 32.0, 23.0, 15.0, 21.0, 21.0, 18.0, 10.0, 13.0, 11.0, 8.0, 17.0, 5.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003337264060974121, -0.0003224192187190056, -0.00031111203134059906, -0.00029980484396219254, -0.000288497656583786, -0.0002771904692053795, -0.00026588328182697296, -0.00025457609444856644, -0.0002432689070701599, -0.0002319617196917534, -0.00022065453231334686, -0.00020934734493494034, -0.0001980401575565338, -0.0001867329701781273, -0.00017542578279972076, -0.00016411859542131424, -0.00015281140804290771, -0.0001415042206645012, -0.00013019703328609467, -0.00011888984590768814, -0.00010758265852928162, -9.627547115087509e-05, -8.496828377246857e-05, -7.366109639406204e-05, -6.235390901565552e-05, -5.104672163724899e-05, -3.973953425884247e-05, -2.8432346880435944e-05, -1.712515950202942e-05, -5.817972123622894e-06, 5.48921525478363e-06, 1.6796402633190155e-05, 2.810359001159668e-05, 3.9410777390003204e-05, 5.071796476840973e-05, 6.202515214681625e-05, 7.333233952522278e-05, 8.46395269036293e-05, 9.594671428203583e-05, 0.00010725390166044235, 0.00011856108903884888, 0.0001298682764172554, 0.00014117546379566193, 0.00015248265117406845, 0.00016378983855247498, 0.0001750970259308815, 0.00018640421330928802, 0.00019771140068769455, 0.00020901858806610107, 0.0002203257754445076, 0.00023163296282291412, 0.00024294015020132065, 0.00025424733757972717, 0.0002655545249581337, 0.0002768617123365402, 0.00028816889971494675, 0.00029947608709335327, 0.0003107832744717598, 0.0003220904618501663, 0.00033339764922857285, 0.00034470483660697937, 0.0003560120239853859, 0.0003673192113637924, 0.00037862639874219894, 0.00038993358612060547]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 6.0, 6.0, 12.0, 13.0, 6.0, 22.0, 17.0, 19.0, 23.0, 34.0, 22.0, 27.0, 28.0, 37.0, 42.0, 34.0, 31.0, 43.0, 35.0, 40.0, 43.0, 46.0, 38.0, 31.0, 34.0, 29.0, 33.0, 30.0, 28.0, 22.0, 27.0, 14.0, 18.0, 19.0, 16.0, 13.0, 9.0, 9.0, 10.0, 4.0, 8.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51953125, -7.28167724609375, -7.0438232421875, -6.80596923828125, -6.568115234375, -6.33026123046875, -6.0924072265625, -5.85455322265625, -5.61669921875, -5.37884521484375, -5.1409912109375, -4.90313720703125, -4.665283203125, -4.42742919921875, -4.1895751953125, -3.95172119140625, -3.7138671875, -3.47601318359375, -3.2381591796875, -3.00030517578125, -2.762451171875, -2.52459716796875, -2.2867431640625, -2.04888916015625, -1.81103515625, -1.57318115234375, -1.3353271484375, -1.09747314453125, -0.859619140625, -0.62176513671875, -0.3839111328125, -0.14605712890625, 0.091796875, 0.32965087890625, 0.5675048828125, 0.80535888671875, 1.043212890625, 1.28106689453125, 1.5189208984375, 1.75677490234375, 1.99462890625, 2.23248291015625, 2.4703369140625, 2.70819091796875, 2.946044921875, 3.18389892578125, 3.4217529296875, 3.65960693359375, 3.8974609375, 4.13531494140625, 4.3731689453125, 4.61102294921875, 4.848876953125, 5.08673095703125, 5.3245849609375, 5.56243896484375, 5.80029296875, 6.03814697265625, 6.2760009765625, 6.51385498046875, 6.751708984375, 6.98956298828125, 7.2274169921875, 7.46527099609375, 7.703125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 8.0, 7.0, 11.0, 17.0, 24.0, 29.0, 24.0, 53.0, 54.0, 61.0, 105.0, 132.0, 182.0, 279.0, 497.0, 923.0, 1895.0, 4584.0, 11531.0, 34365.0, 116285.0, 450872.0, 308114.0, 78761.0, 24335.0, 8412.0, 3412.0, 1494.0, 728.0, 436.0, 240.0, 167.0, 128.0, 87.0, 55.0, 45.0, 56.0, 29.0, 25.0, 19.0, 16.0, 12.0, 10.0, 9.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6875, -9.38330078125, -9.0791015625, -8.77490234375, -8.470703125, -8.16650390625, -7.8623046875, -7.55810546875, -7.25390625, -6.94970703125, -6.6455078125, -6.34130859375, -6.037109375, -5.73291015625, -5.4287109375, -5.12451171875, -4.8203125, -4.51611328125, -4.2119140625, -3.90771484375, -3.603515625, -3.29931640625, -2.9951171875, -2.69091796875, -2.38671875, -2.08251953125, -1.7783203125, -1.47412109375, -1.169921875, -0.86572265625, -0.5615234375, -0.25732421875, 0.046875, 0.35107421875, 0.6552734375, 0.95947265625, 1.263671875, 1.56787109375, 1.8720703125, 2.17626953125, 2.48046875, 2.78466796875, 3.0888671875, 3.39306640625, 3.697265625, 4.00146484375, 4.3056640625, 4.60986328125, 4.9140625, 5.21826171875, 5.5224609375, 5.82666015625, 6.130859375, 6.43505859375, 6.7392578125, 7.04345703125, 7.34765625, 7.65185546875, 7.9560546875, 8.26025390625, 8.564453125, 8.86865234375, 9.1728515625, 9.47705078125, 9.78125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 5.0, 10.0, 14.0, 10.0, 10.0, 12.0, 19.0, 17.0, 25.0, 24.0, 26.0, 26.0, 23.0, 34.0, 48.0, 40.0, 51.0, 64.0, 108.0, 221.0, 1490.0, 209.0, 95.0, 64.0, 46.0, 50.0, 29.0, 43.0, 37.0, 22.0, 27.0, 19.0, 21.0, 17.0, 16.0, 16.0, 16.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.859375, -20.217041015625, -19.57470703125, -18.932373046875, -18.2900390625, -17.647705078125, -17.00537109375, -16.363037109375, -15.720703125, -15.078369140625, -14.43603515625, -13.793701171875, -13.1513671875, -12.509033203125, -11.86669921875, -11.224365234375, -10.58203125, -9.939697265625, -9.29736328125, -8.655029296875, -8.0126953125, -7.370361328125, -6.72802734375, -6.085693359375, -5.443359375, -4.801025390625, -4.15869140625, -3.516357421875, -2.8740234375, -2.231689453125, -1.58935546875, -0.947021484375, -0.3046875, 0.337646484375, 0.97998046875, 1.622314453125, 2.2646484375, 2.906982421875, 3.54931640625, 4.191650390625, 4.833984375, 5.476318359375, 6.11865234375, 6.760986328125, 7.4033203125, 8.045654296875, 8.68798828125, 9.330322265625, 9.97265625, 10.614990234375, 11.25732421875, 11.899658203125, 12.5419921875, 13.184326171875, 13.82666015625, 14.468994140625, 15.111328125, 15.753662109375, 16.39599609375, 17.038330078125, 17.6806640625, 18.322998046875, 18.96533203125, 19.607666015625, 20.25]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 10.0, 6.0, 12.0, 19.0, 25.0, 30.0, 43.0, 57.0, 91.0, 144.0, 197.0, 331.0, 657.0, 2585.0, 91752.0, 3014966.0, 31735.0, 1522.0, 559.0, 336.0, 182.0, 133.0, 90.0, 61.0, 35.0, 32.0, 28.0, 21.0, 12.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.09423828125, -32.7509765625, -31.40771484375, -30.064453125, -28.72119140625, -27.3779296875, -26.03466796875, -24.69140625, -23.34814453125, -22.0048828125, -20.66162109375, -19.318359375, -17.97509765625, -16.6318359375, -15.28857421875, -13.9453125, -12.60205078125, -11.2587890625, -9.91552734375, -8.572265625, -7.22900390625, -5.8857421875, -4.54248046875, -3.19921875, -1.85595703125, -0.5126953125, 0.83056640625, 2.173828125, 3.51708984375, 4.8603515625, 6.20361328125, 7.546875, 8.89013671875, 10.2333984375, 11.57666015625, 12.919921875, 14.26318359375, 15.6064453125, 16.94970703125, 18.29296875, 19.63623046875, 20.9794921875, 22.32275390625, 23.666015625, 25.00927734375, 26.3525390625, 27.69580078125, 29.0390625, 30.38232421875, 31.7255859375, 33.06884765625, 34.412109375, 35.75537109375, 37.0986328125, 38.44189453125, 39.78515625, 41.12841796875, 42.4716796875, 43.81494140625, 45.158203125, 46.50146484375, 47.8447265625, 49.18798828125, 50.53125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 52.0, 878.0, 85.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.468585968017578, -9.919108390808105, -3.369630813598633, 3.1798477172851562, 9.729324340820312, 16.27880096435547, 22.82828140258789, 29.377758026123047, 35.9272346496582, 42.47671127319336, 49.02619171142578, 55.57566833496094, 62.125144958496094, 68.67462158203125, 75.22410583496094, 81.77357482910156, 88.32305908203125, 94.8725357055664, 101.42201232910156, 107.97149658203125, 114.52096557617188, 121.07044982910156, 127.61992645263672, 134.16940307617188, 140.7188720703125, 147.2683563232422, 153.8178253173828, 160.3673095703125, 166.91677856445312, 173.4662628173828, 180.0157470703125, 186.56521606445312, 193.11468505859375, 199.66416931152344, 206.21363830566406, 212.76312255859375, 219.31259155273438, 225.86207580566406, 232.41156005859375, 238.96102905273438, 245.510498046875, 252.0599822998047, 258.6094665527344, 265.158935546875, 271.7084045410156, 278.25787353515625, 284.807373046875, 291.3568420410156, 297.90631103515625, 304.4557800292969, 311.0052795410156, 317.55474853515625, 324.1042175292969, 330.6536865234375, 337.20318603515625, 343.7526550292969, 350.3021545410156, 356.85162353515625, 363.401123046875, 369.9505920410156, 376.50006103515625, 383.0495300292969, 389.5990295410156, 396.14849853515625, 402.6979675292969]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 6.0, 3.0, 12.0, 9.0, 12.0, 16.0, 19.0, 24.0, 24.0, 21.0, 24.0, 23.0, 26.0, 24.0, 33.0, 24.0, 38.0, 27.0, 35.0, 40.0, 44.0, 47.0, 41.0, 41.0, 37.0, 33.0, 37.0, 26.0, 38.0, 29.0, 15.0, 24.0, 25.0, 14.0, 14.0, 24.0, 6.0, 13.0, 7.0, 7.0, 8.0, 2.0, 8.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.56782913208008, -43.14304733276367, -41.71826934814453, -40.293487548828125, -38.86870574951172, -37.44392395019531, -36.019142150878906, -34.594364166259766, -33.16958236694336, -31.744800567626953, -30.32002067565918, -28.895240783691406, -27.470458984375, -26.045677185058594, -24.62089729309082, -23.196117401123047, -21.77133560180664, -20.346553802490234, -18.92177391052246, -17.496994018554688, -16.07221221923828, -14.647431373596191, -13.222650527954102, -11.797869682312012, -10.373088836669922, -8.948307991027832, -7.523527145385742, -6.098746299743652, -4.6739654541015625, -3.2491846084594727, -1.8244037628173828, -0.39962291717529297, 1.0251579284667969, 2.4499387741088867, 3.8747196197509766, 5.299500465393066, 6.724281311035156, 8.149062156677246, 9.573843002319336, 10.998623847961426, 12.423404693603516, 13.848185539245605, 15.272966384887695, 16.69774627685547, 18.122528076171875, 19.54730987548828, 20.972089767456055, 22.396869659423828, 23.821651458740234, 25.24643325805664, 26.671213150024414, 28.095993041992188, 29.520774841308594, 30.945556640625, 32.370338439941406, 33.79511642456055, 35.21989822387695, 36.64468002319336, 38.0694580078125, 39.494239807128906, 40.91902160644531, 42.34380340576172, 43.768585205078125, 45.193363189697266, 46.61814498901367]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 3.0, 9.0, 9.0, 9.0, 12.0, 18.0, 18.0, 19.0, 14.0, 16.0, 33.0, 31.0, 24.0, 29.0, 34.0, 44.0, 38.0, 34.0, 37.0, 31.0, 29.0, 51.0, 34.0, 37.0, 43.0, 26.0, 37.0, 26.0, 23.0, 28.0, 27.0, 24.0, 24.0, 18.0, 18.0, 12.0, 15.0, 9.0, 8.0, 6.0, 8.0, 3.0, 9.0, 1.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.921875, -7.6856689453125, -7.449462890625, -7.2132568359375, -6.97705078125, -6.7408447265625, -6.504638671875, -6.2684326171875, -6.0322265625, -5.7960205078125, -5.559814453125, -5.3236083984375, -5.08740234375, -4.8511962890625, -4.614990234375, -4.3787841796875, -4.142578125, -3.9063720703125, -3.670166015625, -3.4339599609375, -3.19775390625, -2.9615478515625, -2.725341796875, -2.4891357421875, -2.2529296875, -2.0167236328125, -1.780517578125, -1.5443115234375, -1.30810546875, -1.0718994140625, -0.835693359375, -0.5994873046875, -0.36328125, -0.1270751953125, 0.109130859375, 0.3453369140625, 0.58154296875, 0.8177490234375, 1.053955078125, 1.2901611328125, 1.5263671875, 1.7625732421875, 1.998779296875, 2.2349853515625, 2.47119140625, 2.7073974609375, 2.943603515625, 3.1798095703125, 3.416015625, 3.6522216796875, 3.888427734375, 4.1246337890625, 4.36083984375, 4.5970458984375, 4.833251953125, 5.0694580078125, 5.3056640625, 5.5418701171875, 5.778076171875, 6.0142822265625, 6.25048828125, 6.4866943359375, 6.722900390625, 6.9591064453125, 7.1953125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 14.0, 5.0, 13.0, 19.0, 23.0, 13.0, 24.0, 35.0, 32.0, 41.0, 49.0, 89.0, 161.0, 349.0, 1218.0, 5671.0, 73331.0, 3047073.0, 1041844.0, 19964.0, 2909.0, 718.0, 245.0, 110.0, 53.0, 47.0, 30.0, 28.0, 28.0, 17.0, 21.0, 16.0, 14.0, 8.0, 15.0, 7.0, 9.0, 3.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.46875, -26.546875, -25.625, -24.703125, -23.78125, -22.859375, -21.9375, -21.015625, -20.09375, -19.171875, -18.25, -17.328125, -16.40625, -15.484375, -14.5625, -13.640625, -12.71875, -11.796875, -10.875, -9.953125, -9.03125, -8.109375, -7.1875, -6.265625, -5.34375, -4.421875, -3.5, -2.578125, -1.65625, -0.734375, 0.1875, 1.109375, 2.03125, 2.953125, 3.875, 4.796875, 5.71875, 6.640625, 7.5625, 8.484375, 9.40625, 10.328125, 11.25, 12.171875, 13.09375, 14.015625, 14.9375, 15.859375, 16.78125, 17.703125, 18.625, 19.546875, 20.46875, 21.390625, 22.3125, 23.234375, 24.15625, 25.078125, 26.0, 26.921875, 27.84375, 28.765625, 29.6875, 30.609375, 31.53125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 8.0, 7.0, 7.0, 10.0, 8.0, 20.0, 27.0, 21.0, 34.0, 50.0, 59.0, 75.0, 110.0, 171.0, 254.0, 352.0, 430.0, 539.0, 494.0, 427.0, 281.0, 188.0, 157.0, 81.0, 66.0, 52.0, 38.0, 25.0, 25.0, 12.0, 13.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.7119140625, -11.353515625, -10.9951171875, -10.63671875, -10.2783203125, -9.919921875, -9.5615234375, -9.203125, -8.8447265625, -8.486328125, -8.1279296875, -7.76953125, -7.4111328125, -7.052734375, -6.6943359375, -6.3359375, -5.9775390625, -5.619140625, -5.2607421875, -4.90234375, -4.5439453125, -4.185546875, -3.8271484375, -3.46875, -3.1103515625, -2.751953125, -2.3935546875, -2.03515625, -1.6767578125, -1.318359375, -0.9599609375, -0.6015625, -0.2431640625, 0.115234375, 0.4736328125, 0.83203125, 1.1904296875, 1.548828125, 1.9072265625, 2.265625, 2.6240234375, 2.982421875, 3.3408203125, 3.69921875, 4.0576171875, 4.416015625, 4.7744140625, 5.1328125, 5.4912109375, 5.849609375, 6.2080078125, 6.56640625, 6.9248046875, 7.283203125, 7.6416015625, 8.0, 8.3583984375, 8.716796875, 9.0751953125, 9.43359375, 9.7919921875, 10.150390625, 10.5087890625, 10.8671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 12.0, 12.0, 21.0, 26.0, 28.0, 68.0, 77.0, 174.0, 325.0, 914.0, 4254.0, 53604.0, 3535002.0, 581137.0, 15267.0, 2089.0, 602.0, 246.0, 131.0, 89.0, 60.0, 44.0, 22.0, 20.0, 8.0, 9.0, 6.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-42.0625, -40.919189453125, -39.77587890625, -38.632568359375, -37.4892578125, -36.345947265625, -35.20263671875, -34.059326171875, -32.916015625, -31.772705078125, -30.62939453125, -29.486083984375, -28.3427734375, -27.199462890625, -26.05615234375, -24.912841796875, -23.76953125, -22.626220703125, -21.48291015625, -20.339599609375, -19.1962890625, -18.052978515625, -16.90966796875, -15.766357421875, -14.623046875, -13.479736328125, -12.33642578125, -11.193115234375, -10.0498046875, -8.906494140625, -7.76318359375, -6.619873046875, -5.4765625, -4.333251953125, -3.18994140625, -2.046630859375, -0.9033203125, 0.239990234375, 1.38330078125, 2.526611328125, 3.669921875, 4.813232421875, 5.95654296875, 7.099853515625, 8.2431640625, 9.386474609375, 10.52978515625, 11.673095703125, 12.81640625, 13.959716796875, 15.10302734375, 16.246337890625, 17.3896484375, 18.532958984375, 19.67626953125, 20.819580078125, 21.962890625, 23.106201171875, 24.24951171875, 25.392822265625, 26.5361328125, 27.679443359375, 28.82275390625, 29.966064453125, 31.109375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 46.0, 296.0, 457.0, 190.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.51425170898438, -162.16485595703125, -156.81544494628906, -151.46604919433594, -146.11663818359375, -140.76724243164062, -135.4178466796875, -130.0684356689453, -124.71903991699219, -119.36963653564453, -114.02023315429688, -108.67083740234375, -103.3214340209961, -97.97203063964844, -92.62262725830078, -87.27322387695312, -81.92382049560547, -76.57441711425781, -71.22501373291016, -65.8756103515625, -60.526214599609375, -55.17681121826172, -49.82740783691406, -44.47800827026367, -39.128604888916016, -33.77920150756836, -28.42980194091797, -23.080398559570312, -17.73099708557129, -12.381595611572266, -7.032192230224609, -1.6827926635742188, 3.6666107177734375, 9.016012191772461, 14.3654146194458, 19.71481704711914, 25.064218521118164, 30.413619995117188, 35.763023376464844, 41.112422943115234, 46.46182632446289, 51.81122970581055, 57.16062927246094, 62.510032653808594, 67.85943603515625, 73.20883178710938, 78.55824279785156, 83.90763854980469, 89.25704193115234, 94.6064453125, 99.95584869384766, 105.30525207519531, 110.65464782714844, 116.0040512084961, 121.35345458984375, 126.70285034179688, 132.05226135253906, 137.4016571044922, 142.75106811523438, 148.1004638671875, 153.4498748779297, 158.7992706298828, 164.148681640625, 169.49807739257812, 174.84747314453125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 11.0, 13.0, 18.0, 18.0, 23.0, 34.0, 27.0, 36.0, 23.0, 23.0, 31.0, 28.0, 36.0, 40.0, 21.0, 36.0, 38.0, 41.0, 53.0, 24.0, 41.0, 49.0, 31.0, 25.0, 22.0, 31.0, 33.0, 25.0, 14.0, 23.0, 15.0, 15.0, 9.0, 15.0, 7.0, 10.0, 8.0, 6.0, 3.0, 6.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.921142578125, -30.824615478515625, -29.72808837890625, -28.631561279296875, -27.5350341796875, -26.438507080078125, -25.34197998046875, -24.245452880859375, -23.14892578125, -22.052398681640625, -20.95587158203125, -19.859344482421875, -18.7628173828125, -17.666290283203125, -16.56976318359375, -15.473236083984375, -14.376708984375, -13.280181884765625, -12.18365478515625, -11.087127685546875, -9.9906005859375, -8.894073486328125, -7.79754638671875, -6.701019287109375, -5.6044921875, -4.507965087890625, -3.41143798828125, -2.314910888671875, -1.2183837890625, -0.121856689453125, 0.97467041015625, 2.071197509765625, 3.167724609375, 4.264251708984375, 5.36077880859375, 6.457305908203125, 7.5538330078125, 8.650360107421875, 9.74688720703125, 10.843414306640625, 11.93994140625, 13.036468505859375, 14.13299560546875, 15.229522705078125, 16.3260498046875, 17.422576904296875, 18.51910400390625, 19.615631103515625, 20.712158203125, 21.808685302734375, 22.90521240234375, 24.001739501953125, 25.0982666015625, 26.194793701171875, 27.29132080078125, 28.387847900390625, 29.484375, 30.580902099609375, 31.67742919921875, 32.773956298828125, 33.8704833984375, 34.967010498046875, 36.06353759765625, 37.160064697265625, 38.256591796875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 5.0, 14.0, 17.0, 16.0, 16.0, 20.0, 21.0, 17.0, 25.0, 35.0, 35.0, 39.0, 38.0, 30.0, 32.0, 32.0, 34.0, 31.0, 35.0, 53.0, 42.0, 29.0, 36.0, 34.0, 27.0, 29.0, 27.0, 35.0, 30.0, 23.0, 17.0, 21.0, 18.0, 12.0, 18.0, 3.0, 15.0, 3.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.453125, -8.20648193359375, -7.9598388671875, -7.71319580078125, -7.466552734375, -7.21990966796875, -6.9732666015625, -6.72662353515625, -6.47998046875, -6.23333740234375, -5.9866943359375, -5.74005126953125, -5.493408203125, -5.24676513671875, -5.0001220703125, -4.75347900390625, -4.5068359375, -4.26019287109375, -4.0135498046875, -3.76690673828125, -3.520263671875, -3.27362060546875, -3.0269775390625, -2.78033447265625, -2.53369140625, -2.28704833984375, -2.0404052734375, -1.79376220703125, -1.547119140625, -1.30047607421875, -1.0538330078125, -0.80718994140625, -0.560546875, -0.31390380859375, -0.0672607421875, 0.17938232421875, 0.426025390625, 0.67266845703125, 0.9193115234375, 1.16595458984375, 1.41259765625, 1.65924072265625, 1.9058837890625, 2.15252685546875, 2.399169921875, 2.64581298828125, 2.8924560546875, 3.13909912109375, 3.3857421875, 3.63238525390625, 3.8790283203125, 4.12567138671875, 4.372314453125, 4.61895751953125, 4.8656005859375, 5.11224365234375, 5.35888671875, 5.60552978515625, 5.8521728515625, 6.09881591796875, 6.345458984375, 6.59210205078125, 6.8387451171875, 7.08538818359375, 7.33203125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 28.0, 29.0, 61.0, 77.0, 125.0, 173.0, 275.0, 450.0, 704.0, 1105.0, 1686.0, 2702.0, 4171.0, 6606.0, 10400.0, 16147.0, 25838.0, 41588.0, 67314.0, 111828.0, 202906.0, 230200.0, 125667.0, 74728.0, 46022.0, 28516.0, 17783.0, 11332.0, 7248.0, 4648.0, 2935.0, 1870.0, 1196.0, 793.0, 490.0, 322.0, 208.0, 130.0, 88.0, 59.0, 26.0, 21.0, 14.0, 9.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3192596435546875, -1.278167724609375, -1.2370758056640625, -1.19598388671875, -1.1548919677734375, -1.113800048828125, -1.0727081298828125, -1.0316162109375, -0.9905242919921875, -0.949432373046875, -0.9083404541015625, -0.86724853515625, -0.8261566162109375, -0.785064697265625, -0.7439727783203125, -0.702880859375, -0.6617889404296875, -0.620697021484375, -0.5796051025390625, -0.53851318359375, -0.4974212646484375, -0.456329345703125, -0.4152374267578125, -0.3741455078125, -0.3330535888671875, -0.291961669921875, -0.2508697509765625, -0.20977783203125, -0.1686859130859375, -0.127593994140625, -0.0865020751953125, -0.04541015625, -0.0043182373046875, 0.036773681640625, 0.0778656005859375, 0.11895751953125, 0.1600494384765625, 0.201141357421875, 0.2422332763671875, 0.2833251953125, 0.3244171142578125, 0.365509033203125, 0.4066009521484375, 0.44769287109375, 0.4887847900390625, 0.529876708984375, 0.5709686279296875, 0.612060546875, 0.6531524658203125, 0.694244384765625, 0.7353363037109375, 0.77642822265625, 0.8175201416015625, 0.858612060546875, 0.8997039794921875, 0.9407958984375, 0.9818878173828125, 1.022979736328125, 1.0640716552734375, 1.10516357421875, 1.1462554931640625, 1.187347412109375, 1.2284393310546875, 1.26953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 6.0, 8.0, 10.0, 14.0, 12.0, 16.0, 25.0, 18.0, 25.0, 32.0, 30.0, 33.0, 26.0, 36.0, 36.0, 49.0, 35.0, 42.0, 45.0, 1061.0, 37.0, 48.0, 53.0, 25.0, 40.0, 30.0, 27.0, 42.0, 27.0, 20.0, 16.0, 22.0, 12.0, 7.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.65625, -5.4903564453125, -5.324462890625, -5.1585693359375, -4.99267578125, -4.8267822265625, -4.660888671875, -4.4949951171875, -4.3291015625, -4.1632080078125, -3.997314453125, -3.8314208984375, -3.66552734375, -3.4996337890625, -3.333740234375, -3.1678466796875, -3.001953125, -2.8360595703125, -2.670166015625, -2.5042724609375, -2.33837890625, -2.1724853515625, -2.006591796875, -1.8406982421875, -1.6748046875, -1.5089111328125, -1.343017578125, -1.1771240234375, -1.01123046875, -0.8453369140625, -0.679443359375, -0.5135498046875, -0.34765625, -0.1817626953125, -0.015869140625, 0.1500244140625, 0.31591796875, 0.4818115234375, 0.647705078125, 0.8135986328125, 0.9794921875, 1.1453857421875, 1.311279296875, 1.4771728515625, 1.64306640625, 1.8089599609375, 1.974853515625, 2.1407470703125, 2.306640625, 2.4725341796875, 2.638427734375, 2.8043212890625, 2.97021484375, 3.1361083984375, 3.302001953125, 3.4678955078125, 3.6337890625, 3.7996826171875, 3.965576171875, 4.1314697265625, 4.29736328125, 4.4632568359375, 4.629150390625, 4.7950439453125, 4.9609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 4.0, 13.0, 24.0, 24.0, 32.0, 50.0, 93.0, 131.0, 181.0, 271.0, 444.0, 640.0, 908.0, 1373.0, 1979.0, 2951.0, 4389.0, 6773.0, 10523.0, 16655.0, 26665.0, 43635.0, 74338.0, 130586.0, 1299009.0, 204016.0, 108605.0, 61908.0, 37097.0, 22763.0, 14380.0, 8926.0, 5919.0, 3800.0, 2586.0, 1772.0, 1199.0, 795.0, 552.0, 359.0, 253.0, 169.0, 104.0, 81.0, 54.0, 37.0, 25.0, 12.0, 11.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2509765625, -1.2116851806640625, -1.172393798828125, -1.1331024169921875, -1.09381103515625, -1.0545196533203125, -1.015228271484375, -0.9759368896484375, -0.9366455078125, -0.8973541259765625, -0.858062744140625, -0.8187713623046875, -0.77947998046875, -0.7401885986328125, -0.700897216796875, -0.6616058349609375, -0.622314453125, -0.5830230712890625, -0.543731689453125, -0.5044403076171875, -0.46514892578125, -0.4258575439453125, -0.386566162109375, -0.3472747802734375, -0.3079833984375, -0.2686920166015625, -0.229400634765625, -0.1901092529296875, -0.15081787109375, -0.1115264892578125, -0.072235107421875, -0.0329437255859375, 0.00634765625, 0.0456390380859375, 0.084930419921875, 0.1242218017578125, 0.16351318359375, 0.2028045654296875, 0.242095947265625, 0.2813873291015625, 0.3206787109375, 0.3599700927734375, 0.399261474609375, 0.4385528564453125, 0.47784423828125, 0.5171356201171875, 0.556427001953125, 0.5957183837890625, 0.635009765625, 0.6743011474609375, 0.713592529296875, 0.7528839111328125, 0.79217529296875, 0.8314666748046875, 0.870758056640625, 0.9100494384765625, 0.9493408203125, 0.9886322021484375, 1.027923583984375, 1.0672149658203125, 1.10650634765625, 1.1457977294921875, 1.185089111328125, 1.2243804931640625, 1.263671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 2.0, 6.0, 7.0, 6.0, 6.0, 9.0, 12.0, 19.0, 25.0, 17.0, 22.0, 31.0, 41.0, 37.0, 58.0, 54.0, 58.0, 73.0, 57.0, 55.0, 71.0, 61.0, 46.0, 40.0, 35.0, 22.0, 27.0, 22.0, 20.0, 13.0, 13.0, 6.0, 2.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0009264945983886719, -0.000896550714969635, -0.0008666068315505981, -0.0008366629481315613, -0.0008067190647125244, -0.0007767751812934875, -0.0007468312978744507, -0.0007168874144554138, -0.000686943531036377, -0.0006569996476173401, -0.0006270557641983032, -0.0005971118807792664, -0.0005671679973602295, -0.0005372241139411926, -0.0005072802305221558, -0.0004773363471031189, -0.00044739246368408203, -0.00041744858026504517, -0.0003875046968460083, -0.00035756081342697144, -0.00032761693000793457, -0.0002976730465888977, -0.00026772916316986084, -0.00023778527975082397, -0.0002078413963317871, -0.00017789751291275024, -0.00014795362949371338, -0.00011800974607467651, -8.806586265563965e-05, -5.812197923660278e-05, -2.8178095817565918e-05, 1.7657876014709473e-06, 3.170967102050781e-05, 6.165355443954468e-05, 9.159743785858154e-05, 0.00012154132127761841, 0.00015148520469665527, 0.00018142908811569214, 0.000211372971534729, 0.00024131685495376587, 0.00027126073837280273, 0.0003012046217918396, 0.00033114850521087646, 0.00036109238862991333, 0.0003910362720489502, 0.00042098015546798706, 0.0004509240388870239, 0.0004808679223060608, 0.0005108118057250977, 0.0005407556891441345, 0.0005706995725631714, 0.0006006434559822083, 0.0006305873394012451, 0.000660531222820282, 0.0006904751062393188, 0.0007204189896583557, 0.0007503628730773926, 0.0007803067564964294, 0.0008102506399154663, 0.0008401945233345032, 0.00087013840675354, 0.0009000822901725769, 0.0009300261735916138, 0.0009599700570106506, 0.0009899139404296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 7.0, 6.0, 11.0, 13.0, 8.0, 10.0, 22.0, 25.0, 27.0, 38.0, 48.0, 62.0, 92.0, 110.0, 186.0, 338.0, 703.0, 12171.0, 1030639.0, 2360.0, 592.0, 292.0, 207.0, 139.0, 98.0, 82.0, 47.0, 42.0, 28.0, 36.0, 27.0, 15.0, 12.0, 19.0, 10.0, 9.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019622802734375, -0.019016265869140625, -0.01840972900390625, -0.017803192138671875, -0.0171966552734375, -0.016590118408203125, -0.01598358154296875, -0.015377044677734375, -0.0147705078125, -0.014163970947265625, -0.01355743408203125, -0.012950897216796875, -0.0123443603515625, -0.011737823486328125, -0.01113128662109375, -0.010524749755859375, -0.009918212890625, -0.009311676025390625, -0.00870513916015625, -0.008098602294921875, -0.0074920654296875, -0.006885528564453125, -0.00627899169921875, -0.005672454833984375, -0.00506591796875, -0.004459381103515625, -0.00385284423828125, -0.003246307373046875, -0.0026397705078125, -0.002033233642578125, -0.00142669677734375, -0.000820159912109375, -0.000213623046875, 0.000392913818359375, 0.00099945068359375, 0.001605987548828125, 0.0022125244140625, 0.002819061279296875, 0.00342559814453125, 0.004032135009765625, 0.004638671875, 0.005245208740234375, 0.00585174560546875, 0.006458282470703125, 0.0070648193359375, 0.007671356201171875, 0.00827789306640625, 0.008884429931640625, 0.009490966796875, 0.010097503662109375, 0.01070404052734375, 0.011310577392578125, 0.0119171142578125, 0.012523651123046875, 0.01313018798828125, 0.013736724853515625, 0.01434326171875, 0.014949798583984375, 0.01555633544921875, 0.016162872314453125, 0.0167694091796875, 0.017375946044921875, 0.01798248291015625, 0.018589019775390625, 0.019195556640625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 20.0, 209.0, 563.0, 200.0, 18.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015271920710802078, -0.0014648339711129665, -0.0014024758711457253, -0.0013401176547631621, -0.0012777595547959208, -0.0012154014548286796, -0.0011530432384461164, -0.0010906851384788752, -0.0010283270385116339, -0.0009659689385443926, -0.0009036107803694904, -0.0008412526221945882, -0.0007788945222273469, -0.0007165364222601056, -0.0006541782640852034, -0.0005918201059103012, -0.0005294620059430599, -0.0004671038768719882, -0.00040474574780091643, -0.0003423876187298447, -0.00028002948965877295, -0.0002176713605877012, -0.00015531323151662946, -9.295510244555771e-05, -3.059697337448597e-05, 3.1761155696585774e-05, 9.411928476765752e-05, 0.00015647741383872926, 0.000218835542909801, 0.00028119367198087275, 0.0003435518010519445, 0.00040590993012301624, 0.000468268059194088, 0.0005306261591613293, 0.0005929843173362315, 0.0006553424755111337, 0.000717700575478375, 0.0007800586754456162, 0.0008424168336205184, 0.0009047749917954206, 0.0009671330917626619, 0.0010294911917299032, 0.0010918492916971445, 0.0011542075080797076, 0.001216565608046949, 0.0012789237080141902, 0.0013412819243967533, 0.0014036400243639946, 0.0014659981243312359, 0.0015283562242984772, 0.0015907143242657185, 0.0016530725406482816, 0.0017154306406155229, 0.0017777887405827641, 0.0018401469569653273, 0.0019025050569325686, 0.00196486315689981, 0.002027221256867051, 0.0020895793568342924, 0.0021519374568015337, 0.0022142957895994186, 0.00227665388956666, 0.002339011989533901, 0.0024013700895011425, 0.002463728189468384]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 5.0, 10.0, 12.0, 13.0, 7.0, 21.0, 10.0, 19.0, 26.0, 20.0, 34.0, 34.0, 39.0, 38.0, 34.0, 32.0, 37.0, 38.0, 36.0, 40.0, 49.0, 43.0, 43.0, 36.0, 39.0, 35.0, 35.0, 24.0, 28.0, 25.0, 15.0, 19.0, 21.0, 17.0, 5.0, 12.0, 11.0, 8.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004550814628601074, -0.00044012628495693207, -0.0004251711070537567, -0.00041021592915058136, -0.000395260751247406, -0.00038030557334423065, -0.0003653503954410553, -0.00035039521753787994, -0.0003354400396347046, -0.00032048486173152924, -0.0003055296838283539, -0.00029057450592517853, -0.0002756193280220032, -0.0002606641501188278, -0.00024570897221565247, -0.0002307537943124771, -0.00021579861640930176, -0.0002008434385061264, -0.00018588826060295105, -0.0001709330826997757, -0.00015597790479660034, -0.000141022726893425, -0.00012606754899024963, -0.00011111237108707428, -9.615719318389893e-05, -8.120201528072357e-05, -6.624683737754822e-05, -5.1291659474372864e-05, -3.633648157119751e-05, -2.1381303668022156e-05, -6.426125764846802e-06, 8.529052138328552e-06, 2.3484230041503906e-05, 3.843940794467926e-05, 5.3394585847854614e-05, 6.834976375102997e-05, 8.330494165420532e-05, 9.826011955738068e-05, 0.00011321529746055603, 0.00012817047536373138, 0.00014312565326690674, 0.0001580808311700821, 0.00017303600907325745, 0.0001879911869764328, 0.00020294636487960815, 0.0002179015427827835, 0.00023285672068595886, 0.0002478118985891342, 0.00026276707649230957, 0.0002777222543954849, 0.0002926774322986603, 0.00030763261020183563, 0.000322587788105011, 0.00033754296600818634, 0.0003524981439113617, 0.00036745332181453705, 0.0003824084997177124, 0.00039736367762088776, 0.0004123188555240631, 0.00042727403342723846, 0.0004422292113304138, 0.00045718438923358917, 0.0004721395671367645, 0.0004870947450399399, 0.0005020499229431152]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 5.0, 14.0, 17.0, 16.0, 16.0, 20.0, 21.0, 17.0, 25.0, 35.0, 35.0, 39.0, 38.0, 30.0, 32.0, 32.0, 34.0, 31.0, 35.0, 53.0, 42.0, 29.0, 36.0, 34.0, 27.0, 29.0, 27.0, 35.0, 30.0, 23.0, 16.0, 22.0, 18.0, 12.0, 18.0, 3.0, 15.0, 3.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.453125, -8.20648193359375, -7.9598388671875, -7.71319580078125, -7.466552734375, -7.21990966796875, -6.9732666015625, -6.72662353515625, -6.47998046875, -6.23333740234375, -5.9866943359375, -5.74005126953125, -5.493408203125, -5.24676513671875, -5.0001220703125, -4.75347900390625, -4.5068359375, -4.26019287109375, -4.0135498046875, -3.76690673828125, -3.520263671875, -3.27362060546875, -3.0269775390625, -2.78033447265625, -2.53369140625, -2.28704833984375, -2.0404052734375, -1.79376220703125, -1.547119140625, -1.30047607421875, -1.0538330078125, -0.80718994140625, -0.560546875, -0.31390380859375, -0.0672607421875, 0.17938232421875, 0.426025390625, 0.67266845703125, 0.9193115234375, 1.16595458984375, 1.41259765625, 1.65924072265625, 1.9058837890625, 2.15252685546875, 2.399169921875, 2.64581298828125, 2.8924560546875, 3.13909912109375, 3.3857421875, 3.63238525390625, 3.8790283203125, 4.12567138671875, 4.372314453125, 4.61895751953125, 4.8656005859375, 5.11224365234375, 5.35888671875, 5.60552978515625, 5.8521728515625, 6.09881591796875, 6.345458984375, 6.59210205078125, 6.8387451171875, 7.08538818359375, 7.33203125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 13.0, 16.0, 10.0, 22.0, 31.0, 40.0, 69.0, 85.0, 102.0, 142.0, 199.0, 298.0, 407.0, 583.0, 793.0, 1384.0, 2260.0, 4482.0, 10544.0, 28521.0, 91423.0, 299861.0, 402354.0, 135432.0, 41900.0, 14100.0, 5792.0, 2872.0, 1573.0, 997.0, 627.0, 429.0, 310.0, 238.0, 195.0, 122.0, 79.0, 79.0, 45.0, 34.0, 30.0, 18.0, 10.0, 12.0, 6.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4765625, -8.195556640625, -7.91455078125, -7.633544921875, -7.3525390625, -7.071533203125, -6.79052734375, -6.509521484375, -6.228515625, -5.947509765625, -5.66650390625, -5.385498046875, -5.1044921875, -4.823486328125, -4.54248046875, -4.261474609375, -3.98046875, -3.699462890625, -3.41845703125, -3.137451171875, -2.8564453125, -2.575439453125, -2.29443359375, -2.013427734375, -1.732421875, -1.451416015625, -1.17041015625, -0.889404296875, -0.6083984375, -0.327392578125, -0.04638671875, 0.234619140625, 0.515625, 0.796630859375, 1.07763671875, 1.358642578125, 1.6396484375, 1.920654296875, 2.20166015625, 2.482666015625, 2.763671875, 3.044677734375, 3.32568359375, 3.606689453125, 3.8876953125, 4.168701171875, 4.44970703125, 4.730712890625, 5.01171875, 5.292724609375, 5.57373046875, 5.854736328125, 6.1357421875, 6.416748046875, 6.69775390625, 6.978759765625, 7.259765625, 7.540771484375, 7.82177734375, 8.102783203125, 8.3837890625, 8.664794921875, 8.94580078125, 9.226806640625, 9.5078125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 3.0, 5.0, 8.0, 14.0, 16.0, 8.0, 25.0, 11.0, 23.0, 27.0, 35.0, 35.0, 38.0, 36.0, 57.0, 74.0, 109.0, 253.0, 1538.0, 185.0, 102.0, 65.0, 46.0, 42.0, 41.0, 35.0, 34.0, 31.0, 19.0, 25.0, 21.0, 12.0, 11.0, 8.0, 8.0, 11.0, 5.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0], "bins": [-22.484375, -21.8486328125, -21.212890625, -20.5771484375, -19.94140625, -19.3056640625, -18.669921875, -18.0341796875, -17.3984375, -16.7626953125, -16.126953125, -15.4912109375, -14.85546875, -14.2197265625, -13.583984375, -12.9482421875, -12.3125, -11.6767578125, -11.041015625, -10.4052734375, -9.76953125, -9.1337890625, -8.498046875, -7.8623046875, -7.2265625, -6.5908203125, -5.955078125, -5.3193359375, -4.68359375, -4.0478515625, -3.412109375, -2.7763671875, -2.140625, -1.5048828125, -0.869140625, -0.2333984375, 0.40234375, 1.0380859375, 1.673828125, 2.3095703125, 2.9453125, 3.5810546875, 4.216796875, 4.8525390625, 5.48828125, 6.1240234375, 6.759765625, 7.3955078125, 8.03125, 8.6669921875, 9.302734375, 9.9384765625, 10.57421875, 11.2099609375, 11.845703125, 12.4814453125, 13.1171875, 13.7529296875, 14.388671875, 15.0244140625, 15.66015625, 16.2958984375, 16.931640625, 17.5673828125, 18.203125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 7.0, 9.0, 9.0, 11.0, 9.0, 28.0, 35.0, 37.0, 54.0, 62.0, 97.0, 141.0, 179.0, 319.0, 454.0, 1237.0, 12762.0, 2677807.0, 444495.0, 5881.0, 829.0, 402.0, 247.0, 172.0, 105.0, 81.0, 55.0, 46.0, 34.0, 30.0, 22.0, 11.0, 10.0, 10.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-37.71875, -36.4970703125, -35.275390625, -34.0537109375, -32.83203125, -31.6103515625, -30.388671875, -29.1669921875, -27.9453125, -26.7236328125, -25.501953125, -24.2802734375, -23.05859375, -21.8369140625, -20.615234375, -19.3935546875, -18.171875, -16.9501953125, -15.728515625, -14.5068359375, -13.28515625, -12.0634765625, -10.841796875, -9.6201171875, -8.3984375, -7.1767578125, -5.955078125, -4.7333984375, -3.51171875, -2.2900390625, -1.068359375, 0.1533203125, 1.375, 2.5966796875, 3.818359375, 5.0400390625, 6.26171875, 7.4833984375, 8.705078125, 9.9267578125, 11.1484375, 12.3701171875, 13.591796875, 14.8134765625, 16.03515625, 17.2568359375, 18.478515625, 19.7001953125, 20.921875, 22.1435546875, 23.365234375, 24.5869140625, 25.80859375, 27.0302734375, 28.251953125, 29.4736328125, 30.6953125, 31.9169921875, 33.138671875, 34.3603515625, 35.58203125, 36.8037109375, 38.025390625, 39.2470703125, 40.46875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 244.0, 766.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.1175079345703, -183.98941040039062, -173.86129760742188, -163.7332000732422, -153.60508728027344, -143.47698974609375, -133.348876953125, -123.22077941894531, -113.0926742553711, -102.96456909179688, -92.83646392822266, -82.70835876464844, -72.58026123046875, -62.452152252197266, -52.32405090332031, -42.195945739746094, -32.067840576171875, -21.939735412597656, -11.81163215637207, -1.6835289001464844, 8.444576263427734, 18.572681427001953, 28.700782775878906, 38.828887939453125, 48.956993103027344, 59.08509826660156, 69.21320343017578, 79.34130859375, 89.46940612792969, 99.59751892089844, 109.72561645507812, 119.85372161865234, 129.9818115234375, 140.1099090576172, 150.23802185058594, 160.36611938476562, 170.49423217773438, 180.62232971191406, 190.75042724609375, 200.8785400390625, 211.00665283203125, 221.13475036621094, 231.2628631591797, 241.39096069335938, 251.51907348632812, 261.6471862792969, 271.7752685546875, 281.90338134765625, 292.031494140625, 302.15960693359375, 312.2876892089844, 322.4158020019531, 332.5439147949219, 342.6720275878906, 352.80010986328125, 362.92822265625, 373.0563049316406, 383.1844177246094, 393.3125, 403.44061279296875, 413.5687255859375, 423.69683837890625, 433.8249206542969, 443.9530334472656, 454.0811462402344]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 11.0, 7.0, 8.0, 11.0, 5.0, 4.0, 21.0, 17.0, 12.0, 22.0, 20.0, 20.0, 27.0, 29.0, 25.0, 31.0, 29.0, 41.0, 30.0, 36.0, 42.0, 42.0, 39.0, 41.0, 29.0, 39.0, 27.0, 33.0, 40.0, 26.0, 18.0, 23.0, 32.0, 18.0, 27.0, 12.0, 12.0, 17.0, 19.0, 9.0, 8.0, 13.0, 11.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.38108825683594, -36.10797119140625, -34.83485794067383, -33.561744689941406, -32.28862762451172, -31.015512466430664, -29.74239730834961, -28.469282150268555, -27.1961669921875, -25.923051834106445, -24.64993667602539, -23.376821517944336, -22.10370635986328, -20.830591201782227, -19.557476043701172, -18.284360885620117, -17.011245727539062, -15.738130569458008, -14.465015411376953, -13.191900253295898, -11.918785095214844, -10.645669937133789, -9.372554779052734, -8.09943962097168, -6.826324462890625, -5.55320930480957, -4.280094146728516, -3.006978988647461, -1.7338638305664062, -0.46074867248535156, 0.8123664855957031, 2.085481643676758, 3.3585968017578125, 4.631711959838867, 5.904827117919922, 7.177942276000977, 8.451057434082031, 9.724172592163086, 10.99728775024414, 12.270402908325195, 13.54351806640625, 14.816633224487305, 16.08974838256836, 17.362863540649414, 18.63597869873047, 19.909093856811523, 21.182209014892578, 22.455324172973633, 23.728439331054688, 25.001554489135742, 26.274669647216797, 27.54778480529785, 28.820899963378906, 30.09401512145996, 31.367130279541016, 32.64024353027344, 33.913360595703125, 35.18647766113281, 36.459590911865234, 37.732704162597656, 39.005821228027344, 40.27893829345703, 41.55205154418945, 42.825164794921875, 44.09828186035156]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 12.0, 12.0, 6.0, 12.0, 20.0, 21.0, 31.0, 27.0, 26.0, 37.0, 21.0, 28.0, 41.0, 47.0, 29.0, 40.0, 54.0, 49.0, 38.0, 46.0, 26.0, 43.0, 36.0, 35.0, 35.0, 34.0, 28.0, 33.0, 18.0, 28.0, 15.0, 14.0, 18.0, 9.0, 7.0, 3.0, 10.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-9.765625, -9.49163818359375, -9.2176513671875, -8.94366455078125, -8.669677734375, -8.39569091796875, -8.1217041015625, -7.84771728515625, -7.57373046875, -7.29974365234375, -7.0257568359375, -6.75177001953125, -6.477783203125, -6.20379638671875, -5.9298095703125, -5.65582275390625, -5.3818359375, -5.10784912109375, -4.8338623046875, -4.55987548828125, -4.285888671875, -4.01190185546875, -3.7379150390625, -3.46392822265625, -3.18994140625, -2.91595458984375, -2.6419677734375, -2.36798095703125, -2.093994140625, -1.82000732421875, -1.5460205078125, -1.27203369140625, -0.998046875, -0.72406005859375, -0.4500732421875, -0.17608642578125, 0.097900390625, 0.37188720703125, 0.6458740234375, 0.91986083984375, 1.19384765625, 1.46783447265625, 1.7418212890625, 2.01580810546875, 2.289794921875, 2.56378173828125, 2.8377685546875, 3.11175537109375, 3.3857421875, 3.65972900390625, 3.9337158203125, 4.20770263671875, 4.481689453125, 4.75567626953125, 5.0296630859375, 5.30364990234375, 5.57763671875, 5.85162353515625, 6.1256103515625, 6.39959716796875, 6.673583984375, 6.94757080078125, 7.2215576171875, 7.49554443359375, 7.76953125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 16.0, 11.0, 18.0, 20.0, 27.0, 27.0, 52.0, 50.0, 77.0, 86.0, 122.0, 176.0, 254.0, 289.0, 404.0, 490.0, 21437.0, 4168190.0, 784.0, 401.0, 304.0, 261.0, 190.0, 120.0, 109.0, 68.0, 58.0, 44.0, 39.0, 25.0, 25.0, 23.0, 10.0, 15.0, 8.0, 6.0, 7.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-237.625, -229.744140625, -221.86328125, -213.982421875, -206.1015625, -198.220703125, -190.33984375, -182.458984375, -174.578125, -166.697265625, -158.81640625, -150.935546875, -143.0546875, -135.173828125, -127.29296875, -119.412109375, -111.53125, -103.650390625, -95.76953125, -87.888671875, -80.0078125, -72.126953125, -64.24609375, -56.365234375, -48.484375, -40.603515625, -32.72265625, -24.841796875, -16.9609375, -9.080078125, -1.19921875, 6.681640625, 14.5625, 22.443359375, 30.32421875, 38.205078125, 46.0859375, 53.966796875, 61.84765625, 69.728515625, 77.609375, 85.490234375, 93.37109375, 101.251953125, 109.1328125, 117.013671875, 124.89453125, 132.775390625, 140.65625, 148.537109375, 156.41796875, 164.298828125, 172.1796875, 180.060546875, 187.94140625, 195.822265625, 203.703125, 211.583984375, 219.46484375, 227.345703125, 235.2265625, 243.107421875, 250.98828125, 258.869140625, 266.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 9.0, 6.0, 3.0, 9.0, 17.0, 16.0, 37.0, 62.0, 99.0, 153.0, 281.0, 555.0, 938.0, 894.0, 449.0, 223.0, 111.0, 67.0, 62.0, 26.0, 19.0, 15.0, 13.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.546875, -23.8623046875, -23.177734375, -22.4931640625, -21.80859375, -21.1240234375, -20.439453125, -19.7548828125, -19.0703125, -18.3857421875, -17.701171875, -17.0166015625, -16.33203125, -15.6474609375, -14.962890625, -14.2783203125, -13.59375, -12.9091796875, -12.224609375, -11.5400390625, -10.85546875, -10.1708984375, -9.486328125, -8.8017578125, -8.1171875, -7.4326171875, -6.748046875, -6.0634765625, -5.37890625, -4.6943359375, -4.009765625, -3.3251953125, -2.640625, -1.9560546875, -1.271484375, -0.5869140625, 0.09765625, 0.7822265625, 1.466796875, 2.1513671875, 2.8359375, 3.5205078125, 4.205078125, 4.8896484375, 5.57421875, 6.2587890625, 6.943359375, 7.6279296875, 8.3125, 8.9970703125, 9.681640625, 10.3662109375, 11.05078125, 11.7353515625, 12.419921875, 13.1044921875, 13.7890625, 14.4736328125, 15.158203125, 15.8427734375, 16.52734375, 17.2119140625, 17.896484375, 18.5810546875, 19.265625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 15.0, 13.0, 18.0, 31.0, 46.0, 60.0, 85.0, 105.0, 335.0, 3426790.0, 766139.0, 271.0, 108.0, 77.0, 48.0, 42.0, 35.0, 19.0, 16.0, 12.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-309.25, -301.8828125, -294.515625, -287.1484375, -279.78125, -272.4140625, -265.046875, -257.6796875, -250.3125, -242.9453125, -235.578125, -228.2109375, -220.84375, -213.4765625, -206.109375, -198.7421875, -191.375, -184.0078125, -176.640625, -169.2734375, -161.90625, -154.5390625, -147.171875, -139.8046875, -132.4375, -125.0703125, -117.703125, -110.3359375, -102.96875, -95.6015625, -88.234375, -80.8671875, -73.5, -66.1328125, -58.765625, -51.3984375, -44.03125, -36.6640625, -29.296875, -21.9296875, -14.5625, -7.1953125, 0.171875, 7.5390625, 14.90625, 22.2734375, 29.640625, 37.0078125, 44.375, 51.7421875, 59.109375, 66.4765625, 73.84375, 81.2109375, 88.578125, 95.9453125, 103.3125, 110.6796875, 118.046875, 125.4140625, 132.78125, 140.1484375, 147.515625, 154.8828125, 162.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 166.0, 590.0, 233.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.12466430664062, -245.7600555419922, -239.39544677734375, -233.03085327148438, -226.66624450683594, -220.3016357421875, -213.93702697753906, -207.57241821289062, -201.2078094482422, -194.84320068359375, -188.4785919189453, -182.11398315429688, -175.7493896484375, -169.38478088378906, -163.02017211914062, -156.6555633544922, -150.29095458984375, -143.9263458251953, -137.56173706054688, -131.1971435546875, -124.83252716064453, -118.46792602539062, -112.10331726074219, -105.73870849609375, -99.37411499023438, -93.00950622558594, -86.64490509033203, -80.2802963256836, -73.91568756103516, -67.55108642578125, -61.18647766113281, -54.821868896484375, -48.45726013183594, -42.092655181884766, -35.72804641723633, -29.363441467285156, -22.99883460998535, -16.634227752685547, -10.269622802734375, -3.9050140380859375, 2.4595909118652344, 8.824197769165039, 15.188803672790527, 21.553409576416016, 27.91801643371582, 34.282623291015625, 40.6472282409668, 47.011837005615234, 53.376441955566406, 59.74104690551758, 66.10565185546875, 72.47026062011719, 78.83486938476562, 85.19947814941406, 91.56407928466797, 97.9286880493164, 104.29328918457031, 110.65789794921875, 117.02249908447266, 123.3871078491211, 129.751708984375, 136.11631774902344, 142.48092651367188, 148.8455352783203, 155.21014404296875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 1.0, 1.0, 5.0, 7.0, 8.0, 6.0, 9.0, 13.0, 15.0, 17.0, 25.0, 17.0, 27.0, 25.0, 28.0, 30.0, 40.0, 30.0, 30.0, 33.0, 40.0, 41.0, 42.0, 47.0, 46.0, 31.0, 33.0, 38.0, 34.0, 38.0, 28.0, 35.0, 21.0, 23.0, 18.0, 23.0, 23.0, 15.0, 9.0, 14.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-45.00749206542969, -43.69382858276367, -42.38016891479492, -41.066505432128906, -39.752845764160156, -38.43918228149414, -37.12552261352539, -35.811859130859375, -34.498199462890625, -33.18453598022461, -31.87087631225586, -30.557214736938477, -29.243553161621094, -27.929889678955078, -26.616228103637695, -25.302566528320312, -23.988903045654297, -22.675241470336914, -21.36157989501953, -20.04791831970215, -18.734256744384766, -17.42059326171875, -16.106931686401367, -14.793270111083984, -13.479608535766602, -12.165946960449219, -10.852285385131836, -9.538622856140137, -8.224961280822754, -6.911299705505371, -5.59763765335083, -4.283975601196289, -2.9703140258789062, -1.6566522121429443, -0.3429903984069824, 0.9706714153289795, 2.2843332290649414, 3.597994804382324, 4.911656856536865, 6.225318908691406, 7.538980484008789, 8.852642059326172, 10.166303634643555, 11.479966163635254, 12.793627738952637, 14.10728931427002, 15.420951843261719, 16.7346134185791, 18.048274993896484, 19.361936569213867, 20.67559814453125, 21.989259719848633, 23.302921295166016, 24.61658477783203, 25.930246353149414, 27.243907928466797, 28.55756950378418, 29.871231079101562, 31.184892654418945, 32.49855422973633, 33.812217712402344, 35.125877380371094, 36.43954086303711, 37.753204345703125, 39.066864013671875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 10.0, 6.0, 11.0, 13.0, 12.0, 23.0, 23.0, 17.0, 25.0, 23.0, 28.0, 23.0, 28.0, 27.0, 44.0, 32.0, 31.0, 41.0, 34.0, 29.0, 44.0, 39.0, 36.0, 42.0, 39.0, 37.0, 29.0, 25.0, 19.0, 28.0, 22.0, 25.0, 17.0, 28.0, 23.0, 14.0, 11.0, 8.0, 6.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.87506103515625, -6.6368408203125, -6.39862060546875, -6.160400390625, -5.92218017578125, -5.6839599609375, -5.44573974609375, -5.20751953125, -4.96929931640625, -4.7310791015625, -4.49285888671875, -4.254638671875, -4.01641845703125, -3.7781982421875, -3.53997802734375, -3.3017578125, -3.06353759765625, -2.8253173828125, -2.58709716796875, -2.348876953125, -2.11065673828125, -1.8724365234375, -1.63421630859375, -1.39599609375, -1.15777587890625, -0.9195556640625, -0.68133544921875, -0.443115234375, -0.20489501953125, 0.0333251953125, 0.27154541015625, 0.509765625, 0.74798583984375, 0.9862060546875, 1.22442626953125, 1.462646484375, 1.70086669921875, 1.9390869140625, 2.17730712890625, 2.41552734375, 2.65374755859375, 2.8919677734375, 3.13018798828125, 3.368408203125, 3.60662841796875, 3.8448486328125, 4.08306884765625, 4.3212890625, 4.55950927734375, 4.7977294921875, 5.03594970703125, 5.274169921875, 5.51239013671875, 5.7506103515625, 5.98883056640625, 6.22705078125, 6.46527099609375, 6.7034912109375, 6.94171142578125, 7.179931640625, 7.41815185546875, 7.6563720703125, 7.89459228515625, 8.1328125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 9.0, 7.0, 19.0, 19.0, 34.0, 58.0, 79.0, 129.0, 174.0, 277.0, 451.0, 679.0, 1055.0, 1628.0, 2514.0, 3986.0, 6182.0, 9278.0, 14787.0, 22706.0, 34954.0, 54965.0, 88466.0, 152187.0, 251405.0, 155173.0, 91144.0, 55507.0, 35591.0, 23072.0, 14925.0, 9502.0, 6199.0, 4038.0, 2567.0, 1703.0, 1090.0, 696.0, 440.0, 304.0, 206.0, 127.0, 78.0, 49.0, 33.0, 23.0, 17.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.245635986328125, -1.20611572265625, -1.166595458984375, -1.1270751953125, -1.087554931640625, -1.04803466796875, -1.008514404296875, -0.968994140625, -0.929473876953125, -0.88995361328125, -0.850433349609375, -0.8109130859375, -0.771392822265625, -0.73187255859375, -0.692352294921875, -0.65283203125, -0.613311767578125, -0.57379150390625, -0.534271240234375, -0.4947509765625, -0.455230712890625, -0.41571044921875, -0.376190185546875, -0.336669921875, -0.297149658203125, -0.25762939453125, -0.218109130859375, -0.1785888671875, -0.139068603515625, -0.09954833984375, -0.060028076171875, -0.0205078125, 0.019012451171875, 0.05853271484375, 0.098052978515625, 0.1375732421875, 0.177093505859375, 0.21661376953125, 0.256134033203125, 0.295654296875, 0.335174560546875, 0.37469482421875, 0.414215087890625, 0.4537353515625, 0.493255615234375, 0.53277587890625, 0.572296142578125, 0.61181640625, 0.651336669921875, 0.69085693359375, 0.730377197265625, 0.7698974609375, 0.809417724609375, 0.84893798828125, 0.888458251953125, 0.927978515625, 0.967498779296875, 1.00701904296875, 1.046539306640625, 1.0860595703125, 1.125579833984375, 1.16510009765625, 1.204620361328125, 1.244140625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 13.0, 14.0, 11.0, 12.0, 24.0, 17.0, 25.0, 20.0, 25.0, 35.0, 26.0, 33.0, 28.0, 27.0, 33.0, 40.0, 46.0, 39.0, 1061.0, 32.0, 27.0, 37.0, 23.0, 27.0, 38.0, 30.0, 29.0, 28.0, 19.0, 20.0, 19.0, 24.0, 16.0, 19.0, 16.0, 12.0, 8.0, 8.0, 5.0, 9.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.0703125, -3.932373046875, -3.79443359375, -3.656494140625, -3.5185546875, -3.380615234375, -3.24267578125, -3.104736328125, -2.966796875, -2.828857421875, -2.69091796875, -2.552978515625, -2.4150390625, -2.277099609375, -2.13916015625, -2.001220703125, -1.86328125, -1.725341796875, -1.58740234375, -1.449462890625, -1.3115234375, -1.173583984375, -1.03564453125, -0.897705078125, -0.759765625, -0.621826171875, -0.48388671875, -0.345947265625, -0.2080078125, -0.070068359375, 0.06787109375, 0.205810546875, 0.34375, 0.481689453125, 0.61962890625, 0.757568359375, 0.8955078125, 1.033447265625, 1.17138671875, 1.309326171875, 1.447265625, 1.585205078125, 1.72314453125, 1.861083984375, 1.9990234375, 2.136962890625, 2.27490234375, 2.412841796875, 2.55078125, 2.688720703125, 2.82666015625, 2.964599609375, 3.1025390625, 3.240478515625, 3.37841796875, 3.516357421875, 3.654296875, 3.792236328125, 3.93017578125, 4.068115234375, 4.2060546875, 4.343994140625, 4.48193359375, 4.619873046875, 4.7578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 6.0, 17.0, 19.0, 19.0, 37.0, 64.0, 86.0, 116.0, 192.0, 264.0, 407.0, 564.0, 813.0, 1254.0, 1804.0, 2646.0, 3938.0, 5717.0, 8449.0, 12644.0, 18760.0, 28894.0, 43980.0, 69117.0, 113843.0, 199641.0, 1257802.0, 118639.0, 72086.0, 45711.0, 29391.0, 19482.0, 13224.0, 8718.0, 5975.0, 4068.0, 2788.0, 1890.0, 1306.0, 836.0, 635.0, 439.0, 273.0, 207.0, 127.0, 85.0, 55.0, 41.0, 27.0, 18.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0], "bins": [-1.1396484375, -1.106170654296875, -1.07269287109375, -1.039215087890625, -1.0057373046875, -0.972259521484375, -0.93878173828125, -0.905303955078125, -0.871826171875, -0.838348388671875, -0.80487060546875, -0.771392822265625, -0.7379150390625, -0.704437255859375, -0.67095947265625, -0.637481689453125, -0.60400390625, -0.570526123046875, -0.53704833984375, -0.503570556640625, -0.4700927734375, -0.436614990234375, -0.40313720703125, -0.369659423828125, -0.336181640625, -0.302703857421875, -0.26922607421875, -0.235748291015625, -0.2022705078125, -0.168792724609375, -0.13531494140625, -0.101837158203125, -0.068359375, -0.034881591796875, -0.00140380859375, 0.032073974609375, 0.0655517578125, 0.099029541015625, 0.13250732421875, 0.165985107421875, 0.199462890625, 0.232940673828125, 0.26641845703125, 0.299896240234375, 0.3333740234375, 0.366851806640625, 0.40032958984375, 0.433807373046875, 0.46728515625, 0.500762939453125, 0.53424072265625, 0.567718505859375, 0.6011962890625, 0.634674072265625, 0.66815185546875, 0.701629638671875, 0.735107421875, 0.768585205078125, 0.80206298828125, 0.835540771484375, 0.8690185546875, 0.902496337890625, 0.93597412109375, 0.969451904296875, 1.0029296875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 3.0, 5.0, 9.0, 6.0, 18.0, 21.0, 18.0, 28.0, 51.0, 71.0, 94.0, 104.0, 134.0, 121.0, 89.0, 66.0, 38.0, 17.0, 25.0, 15.0, 13.0, 13.0, 5.0, 5.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014142990112304688, -0.0013765990734100342, -0.0013388991355895996, -0.001301199197769165, -0.0012634992599487305, -0.001225799322128296, -0.0011880993843078613, -0.0011503994464874268, -0.0011126995086669922, -0.0010749995708465576, -0.001037299633026123, -0.0009995996952056885, -0.0009618997573852539, -0.0009241998195648193, -0.0008864998817443848, -0.0008487999439239502, -0.0008111000061035156, -0.0007734000682830811, -0.0007357001304626465, -0.0006980001926422119, -0.0006603002548217773, -0.0006226003170013428, -0.0005849003791809082, -0.0005472004413604736, -0.0005095005035400391, -0.0004718005657196045, -0.0004341006278991699, -0.00039640069007873535, -0.0003587007522583008, -0.0003210008144378662, -0.00028330087661743164, -0.00024560093879699707, -0.0002079010009765625, -0.00017020106315612793, -0.00013250112533569336, -9.480118751525879e-05, -5.710124969482422e-05, -1.940131187438965e-05, 1.8298625946044922e-05, 5.599856376647949e-05, 9.369850158691406e-05, 0.00013139843940734863, 0.0001690983772277832, 0.00020679831504821777, 0.00024449825286865234, 0.0002821981906890869, 0.0003198981285095215, 0.00035759806632995605, 0.0003952980041503906, 0.0004329979419708252, 0.00047069787979125977, 0.0005083978176116943, 0.0005460977554321289, 0.0005837976932525635, 0.000621497631072998, 0.0006591975688934326, 0.0006968975067138672, 0.0007345974445343018, 0.0007722973823547363, 0.0008099973201751709, 0.0008476972579956055, 0.00088539719581604, 0.0009230971336364746, 0.0009607970714569092, 0.0009984970092773438]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 8.0, 11.0, 16.0, 14.0, 13.0, 23.0, 42.0, 39.0, 67.0, 95.0, 167.0, 267.0, 409.0, 1045.0, 559244.0, 484729.0, 1044.0, 469.0, 273.0, 175.0, 97.0, 76.0, 58.0, 42.0, 31.0, 14.0, 19.0, 18.0, 7.0, 14.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01666259765625, -0.016045331954956055, -0.01542806625366211, -0.014810800552368164, -0.014193534851074219, -0.013576269149780273, -0.012959003448486328, -0.012341737747192383, -0.011724472045898438, -0.011107206344604492, -0.010489940643310547, -0.009872674942016602, -0.009255409240722656, -0.008638143539428711, -0.008020877838134766, -0.00740361213684082, -0.006786346435546875, -0.00616908073425293, -0.005551815032958984, -0.004934549331665039, -0.004317283630371094, -0.0037000179290771484, -0.003082752227783203, -0.002465486526489258, -0.0018482208251953125, -0.0012309551239013672, -0.0006136894226074219, 3.5762786865234375e-06, 0.0006208419799804688, 0.001238107681274414, 0.0018553733825683594, 0.0024726390838623047, 0.00308990478515625, 0.0037071704864501953, 0.004324436187744141, 0.004941701889038086, 0.005558967590332031, 0.0061762332916259766, 0.006793498992919922, 0.007410764694213867, 0.008028030395507812, 0.008645296096801758, 0.009262561798095703, 0.009879827499389648, 0.010497093200683594, 0.011114358901977539, 0.011731624603271484, 0.01234889030456543, 0.012966156005859375, 0.01358342170715332, 0.014200687408447266, 0.014817953109741211, 0.015435218811035156, 0.0160524845123291, 0.016669750213623047, 0.017287015914916992, 0.017904281616210938, 0.018521547317504883, 0.019138813018798828, 0.019756078720092773, 0.02037334442138672, 0.020990610122680664, 0.02160787582397461, 0.022225141525268555, 0.0228424072265625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 686.0, 309.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00072041607927531, -0.0006152072455734015, -0.0005099984118714929, -0.0004047896363772452, -0.0002995808026753366, -0.000194371968973428, -8.916319347918034e-05, 1.6045640222728252e-05, 0.00012125447392463684, 0.0002264632930746302, 0.00033167211222462356, 0.0004368809168227017, 0.0005420897505246103, 0.0006472985842265189, 0.0007525073597207665, 0.0008577161934226751, 0.0009629250271245837, 0.0010681338608264923, 0.001173342694528401, 0.0012785515282303095, 0.0013837602455168962, 0.0014889691956341267, 0.0015941779129207134, 0.001699386746622622, 0.0018045955803245306, 0.0019098044140264392, 0.0020150132477283478, 0.0021202219650149345, 0.002225430915132165, 0.0023306396324187517, 0.002435848582535982, 0.002541057299822569, 0.0026462660171091557, 0.0027514747343957424, 0.002856683684512973, 0.0029618924017995596, 0.00306710135191679, 0.0031723100692033768, 0.0032775187864899635, 0.003382727736607194, 0.0034879366867244244, 0.003593145404011011, 0.0036983543541282415, 0.0038035630714148283, 0.003908772021532059, 0.0040139807388186455, 0.004119189456105232, 0.004224398173391819, 0.004329606890678406, 0.0044348156079649925, 0.004540024325251579, 0.004645233508199453, 0.00475044222548604, 0.004855650942772627, 0.004960859660059214, 0.005066068843007088, 0.0051712775602936745, 0.005276486277580261, 0.005381694994866848, 0.005486904177814722, 0.005592112895101309, 0.005697321612387896, 0.005802530329674482, 0.005907739512622356, 0.006012948229908943]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 2.0, 8.0, 17.0, 6.0, 10.0, 6.0, 15.0, 12.0, 21.0, 23.0, 27.0, 16.0, 23.0, 30.0, 34.0, 28.0, 34.0, 35.0, 42.0, 48.0, 50.0, 30.0, 33.0, 38.0, 28.0, 38.0, 31.0, 28.0, 36.0, 21.0, 33.0, 27.0, 25.0, 20.0, 17.0, 13.0, 21.0, 17.0, 13.0, 2.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003616213798522949, -0.00034914351999759674, -0.00033666566014289856, -0.0003241878002882004, -0.0003117099404335022, -0.000299232080578804, -0.00028675422072410583, -0.00027427636086940765, -0.00026179850101470947, -0.0002493206411600113, -0.0002368427813053131, -0.00022436492145061493, -0.00021188706159591675, -0.00019940920174121857, -0.00018693134188652039, -0.0001744534820318222, -0.00016197562217712402, -0.00014949776232242584, -0.00013701990246772766, -0.00012454204261302948, -0.0001120641827583313, -9.958632290363312e-05, -8.710846304893494e-05, -7.463060319423676e-05, -6.215274333953857e-05, -4.967488348484039e-05, -3.719702363014221e-05, -2.471916377544403e-05, -1.224130392074585e-05, 2.3655593395233154e-07, 1.2714415788650513e-05, 2.5192275643348694e-05, 3.7670135498046875e-05, 5.0147995352745056e-05, 6.262585520744324e-05, 7.510371506214142e-05, 8.75815749168396e-05, 0.00010005943477153778, 0.00011253729462623596, 0.00012501515448093414, 0.00013749301433563232, 0.0001499708741903305, 0.0001624487340450287, 0.00017492659389972687, 0.00018740445375442505, 0.00019988231360912323, 0.0002123601734638214, 0.0002248380333185196, 0.00023731589317321777, 0.00024979375302791595, 0.00026227161288261414, 0.0002747494727373123, 0.0002872273325920105, 0.0002997051924467087, 0.00031218305230140686, 0.00032466091215610504, 0.0003371387720108032, 0.0003496166318655014, 0.0003620944917201996, 0.00037457235157489777, 0.00038705021142959595, 0.00039952807128429413, 0.0004120059311389923, 0.0004244837909936905, 0.00043696165084838867]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 10.0, 6.0, 11.0, 13.0, 12.0, 23.0, 23.0, 17.0, 25.0, 23.0, 28.0, 23.0, 28.0, 27.0, 44.0, 32.0, 31.0, 41.0, 33.0, 30.0, 44.0, 39.0, 36.0, 42.0, 39.0, 37.0, 29.0, 25.0, 19.0, 28.0, 22.0, 25.0, 17.0, 28.0, 23.0, 14.0, 11.0, 8.0, 6.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.87506103515625, -6.6368408203125, -6.39862060546875, -6.160400390625, -5.92218017578125, -5.6839599609375, -5.44573974609375, -5.20751953125, -4.96929931640625, -4.7310791015625, -4.49285888671875, -4.254638671875, -4.01641845703125, -3.7781982421875, -3.53997802734375, -3.3017578125, -3.06353759765625, -2.8253173828125, -2.58709716796875, -2.348876953125, -2.11065673828125, -1.8724365234375, -1.63421630859375, -1.39599609375, -1.15777587890625, -0.9195556640625, -0.68133544921875, -0.443115234375, -0.20489501953125, 0.0333251953125, 0.27154541015625, 0.509765625, 0.74798583984375, 0.9862060546875, 1.22442626953125, 1.462646484375, 1.70086669921875, 1.9390869140625, 2.17730712890625, 2.41552734375, 2.65374755859375, 2.8919677734375, 3.13018798828125, 3.368408203125, 3.60662841796875, 3.8448486328125, 4.08306884765625, 4.3212890625, 4.55950927734375, 4.7977294921875, 5.03594970703125, 5.274169921875, 5.51239013671875, 5.7506103515625, 5.98883056640625, 6.22705078125, 6.46527099609375, 6.7034912109375, 6.94171142578125, 7.179931640625, 7.41815185546875, 7.6563720703125, 7.89459228515625, 8.1328125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 2.0, 5.0, 23.0, 13.0, 22.0, 33.0, 40.0, 56.0, 92.0, 108.0, 135.0, 200.0, 206.0, 299.0, 373.0, 450.0, 564.0, 714.0, 857.0, 1165.0, 1975.0, 4425.0, 13642.0, 57837.0, 256005.0, 505602.0, 150958.0, 34322.0, 8929.0, 3009.0, 1559.0, 1010.0, 786.0, 662.0, 571.0, 426.0, 356.0, 267.0, 220.0, 151.0, 123.0, 99.0, 66.0, 46.0, 39.0, 24.0, 25.0, 20.0, 6.0, 10.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0], "bins": [-11.3984375, -11.0457763671875, -10.693115234375, -10.3404541015625, -9.98779296875, -9.6351318359375, -9.282470703125, -8.9298095703125, -8.5771484375, -8.2244873046875, -7.871826171875, -7.5191650390625, -7.16650390625, -6.8138427734375, -6.461181640625, -6.1085205078125, -5.755859375, -5.4031982421875, -5.050537109375, -4.6978759765625, -4.34521484375, -3.9925537109375, -3.639892578125, -3.2872314453125, -2.9345703125, -2.5819091796875, -2.229248046875, -1.8765869140625, -1.52392578125, -1.1712646484375, -0.818603515625, -0.4659423828125, -0.11328125, 0.2393798828125, 0.592041015625, 0.9447021484375, 1.29736328125, 1.6500244140625, 2.002685546875, 2.3553466796875, 2.7080078125, 3.0606689453125, 3.413330078125, 3.7659912109375, 4.11865234375, 4.4713134765625, 4.823974609375, 5.1766357421875, 5.529296875, 5.8819580078125, 6.234619140625, 6.5872802734375, 6.93994140625, 7.2926025390625, 7.645263671875, 7.9979248046875, 8.3505859375, 8.7032470703125, 9.055908203125, 9.4085693359375, 9.76123046875, 10.1138916015625, 10.466552734375, 10.8192138671875, 11.171875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 8.0, 6.0, 6.0, 11.0, 18.0, 12.0, 23.0, 12.0, 18.0, 29.0, 38.0, 40.0, 55.0, 49.0, 60.0, 106.0, 280.0, 1605.0, 151.0, 67.0, 64.0, 49.0, 51.0, 41.0, 42.0, 37.0, 31.0, 26.0, 16.0, 17.0, 15.0, 11.0, 8.0, 8.0, 4.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.640625, -15.982177734375, -15.32373046875, -14.665283203125, -14.0068359375, -13.348388671875, -12.68994140625, -12.031494140625, -11.373046875, -10.714599609375, -10.05615234375, -9.397705078125, -8.7392578125, -8.080810546875, -7.42236328125, -6.763916015625, -6.10546875, -5.447021484375, -4.78857421875, -4.130126953125, -3.4716796875, -2.813232421875, -2.15478515625, -1.496337890625, -0.837890625, -0.179443359375, 0.47900390625, 1.137451171875, 1.7958984375, 2.454345703125, 3.11279296875, 3.771240234375, 4.4296875, 5.088134765625, 5.74658203125, 6.405029296875, 7.0634765625, 7.721923828125, 8.38037109375, 9.038818359375, 9.697265625, 10.355712890625, 11.01416015625, 11.672607421875, 12.3310546875, 12.989501953125, 13.64794921875, 14.306396484375, 14.96484375, 15.623291015625, 16.28173828125, 16.940185546875, 17.5986328125, 18.257080078125, 18.91552734375, 19.573974609375, 20.232421875, 20.890869140625, 21.54931640625, 22.207763671875, 22.8662109375, 23.524658203125, 24.18310546875, 24.841552734375, 25.5]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 8.0, 5.0, 7.0, 9.0, 10.0, 15.0, 22.0, 30.0, 26.0, 41.0, 38.0, 65.0, 100.0, 147.0, 240.0, 346.0, 680.0, 2053.0, 2903397.0, 235483.0, 1523.0, 564.0, 312.0, 163.0, 114.0, 81.0, 55.0, 48.0, 25.0, 18.0, 15.0, 17.0, 14.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.0625, -66.8974609375, -64.732421875, -62.5673828125, -60.40234375, -58.2373046875, -56.072265625, -53.9072265625, -51.7421875, -49.5771484375, -47.412109375, -45.2470703125, -43.08203125, -40.9169921875, -38.751953125, -36.5869140625, -34.421875, -32.2568359375, -30.091796875, -27.9267578125, -25.76171875, -23.5966796875, -21.431640625, -19.2666015625, -17.1015625, -14.9365234375, -12.771484375, -10.6064453125, -8.44140625, -6.2763671875, -4.111328125, -1.9462890625, 0.21875, 2.3837890625, 4.548828125, 6.7138671875, 8.87890625, 11.0439453125, 13.208984375, 15.3740234375, 17.5390625, 19.7041015625, 21.869140625, 24.0341796875, 26.19921875, 28.3642578125, 30.529296875, 32.6943359375, 34.859375, 37.0244140625, 39.189453125, 41.3544921875, 43.51953125, 45.6845703125, 47.849609375, 50.0146484375, 52.1796875, 54.3447265625, 56.509765625, 58.6748046875, 60.83984375, 63.0048828125, 65.169921875, 67.3349609375, 69.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 848.0, 155.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.08770751953125, -261.9179992675781, -251.74827575683594, -241.57855224609375, -231.40884399414062, -221.2391357421875, -211.0694122314453, -200.89968872070312, -190.72998046875, -180.56027221679688, -170.3905487060547, -160.2208251953125, -150.05111694335938, -139.88140869140625, -129.71168518066406, -119.5419692993164, -109.37225341796875, -99.2025375366211, -89.03282165527344, -78.86310577392578, -68.69338989257812, -58.52367401123047, -48.35395812988281, -38.184242248535156, -28.0145263671875, -17.844810485839844, -7.6750946044921875, 2.4946212768554688, 12.664337158203125, 22.83405303955078, 33.00376892089844, 43.173484802246094, 53.343170166015625, 63.51288604736328, 73.68260192871094, 83.8523178100586, 94.02203369140625, 104.1917495727539, 114.36146545410156, 124.53118133544922, 134.70089721679688, 144.87060546875, 155.0403289794922, 165.21005249023438, 175.3797607421875, 185.54946899414062, 195.7191925048828, 205.888916015625, 216.05862426757812, 226.22833251953125, 236.39805603027344, 246.56777954101562, 256.73748779296875, 266.9071960449219, 277.076904296875, 287.24664306640625, 297.4163513183594, 307.5860595703125, 317.75579833984375, 327.9255065917969, 338.09521484375, 348.2649230957031, 358.43463134765625, 368.6043701171875, 378.7740783691406]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 6.0, 9.0, 12.0, 21.0, 17.0, 16.0, 24.0, 22.0, 36.0, 28.0, 26.0, 34.0, 23.0, 40.0, 26.0, 41.0, 55.0, 51.0, 47.0, 51.0, 34.0, 34.0, 24.0, 39.0, 38.0, 37.0, 29.0, 31.0, 19.0, 19.0, 18.0, 21.0, 7.0, 17.0, 9.0, 10.0, 7.0, 4.0, 5.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.91034698486328, -50.182552337646484, -48.45476150512695, -46.726966857910156, -44.999176025390625, -43.27138137817383, -41.54358673095703, -39.8157958984375, -38.0880012512207, -36.360206604003906, -34.632415771484375, -32.90462112426758, -31.176828384399414, -29.44903564453125, -27.721240997314453, -25.99344825744629, -24.265655517578125, -22.53786277770996, -20.810070037841797, -19.082275390625, -17.354482650756836, -15.626689910888672, -13.898896217346191, -12.171102523803711, -10.443309783935547, -8.715517044067383, -6.987723350524902, -5.25993013381958, -3.532136917114258, -1.8043441772460938, -0.07655048370361328, 1.6512432098388672, 3.3790359497070312, 5.1068291664123535, 6.834622383117676, 8.562416076660156, 10.29020881652832, 12.018001556396484, 13.745795249938965, 15.473588943481445, 17.20138168334961, 18.929174423217773, 20.656967163085938, 22.384761810302734, 24.1125545501709, 25.840347290039062, 27.56814193725586, 29.295934677124023, 31.023727416992188, 32.751522064208984, 34.479312896728516, 36.20710754394531, 37.934898376464844, 39.66269302368164, 41.39048767089844, 43.11827850341797, 44.846073150634766, 46.57386779785156, 48.301658630371094, 50.02945327758789, 51.75724792480469, 53.48503875732422, 55.212833404541016, 56.94062805175781, 58.668418884277344]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 8.0, 12.0, 7.0, 24.0, 10.0, 13.0, 21.0, 23.0, 34.0, 25.0, 43.0, 39.0, 40.0, 39.0, 48.0, 51.0, 43.0, 56.0, 42.0, 46.0, 42.0, 40.0, 42.0, 34.0, 26.0, 28.0, 27.0, 24.0, 25.0, 14.0, 22.0, 16.0, 12.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.1971435546875, -7.917724609375, -7.6383056640625, -7.35888671875, -7.0794677734375, -6.800048828125, -6.5206298828125, -6.2412109375, -5.9617919921875, -5.682373046875, -5.4029541015625, -5.12353515625, -4.8441162109375, -4.564697265625, -4.2852783203125, -4.005859375, -3.7264404296875, -3.447021484375, -3.1676025390625, -2.88818359375, -2.6087646484375, -2.329345703125, -2.0499267578125, -1.7705078125, -1.4910888671875, -1.211669921875, -0.9322509765625, -0.65283203125, -0.3734130859375, -0.093994140625, 0.1854248046875, 0.46484375, 0.7442626953125, 1.023681640625, 1.3031005859375, 1.58251953125, 1.8619384765625, 2.141357421875, 2.4207763671875, 2.7001953125, 2.9796142578125, 3.259033203125, 3.5384521484375, 3.81787109375, 4.0972900390625, 4.376708984375, 4.6561279296875, 4.935546875, 5.2149658203125, 5.494384765625, 5.7738037109375, 6.05322265625, 6.3326416015625, 6.612060546875, 6.8914794921875, 7.1708984375, 7.4503173828125, 7.729736328125, 8.0091552734375, 8.28857421875, 8.5679931640625, 8.847412109375, 9.1268310546875, 9.40625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 8.0, 10.0, 11.0, 15.0, 24.0, 30.0, 41.0, 58.0, 63.0, 83.0, 99.0, 120.0, 159.0, 245.0, 417.0, 984.0, 4015.0, 42689.0, 2030262.0, 2065570.0, 42800.0, 4167.0, 1052.0, 378.0, 224.0, 152.0, 135.0, 95.0, 72.0, 54.0, 52.0, 40.0, 37.0, 26.0, 20.0, 20.0, 11.0, 11.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.421875, -26.537353515625, -25.65283203125, -24.768310546875, -23.8837890625, -22.999267578125, -22.11474609375, -21.230224609375, -20.345703125, -19.461181640625, -18.57666015625, -17.692138671875, -16.8076171875, -15.923095703125, -15.03857421875, -14.154052734375, -13.26953125, -12.385009765625, -11.50048828125, -10.615966796875, -9.7314453125, -8.846923828125, -7.96240234375, -7.077880859375, -6.193359375, -5.308837890625, -4.42431640625, -3.539794921875, -2.6552734375, -1.770751953125, -0.88623046875, -0.001708984375, 0.8828125, 1.767333984375, 2.65185546875, 3.536376953125, 4.4208984375, 5.305419921875, 6.18994140625, 7.074462890625, 7.958984375, 8.843505859375, 9.72802734375, 10.612548828125, 11.4970703125, 12.381591796875, 13.26611328125, 14.150634765625, 15.03515625, 15.919677734375, 16.80419921875, 17.688720703125, 18.5732421875, 19.457763671875, 20.34228515625, 21.226806640625, 22.111328125, 22.995849609375, 23.88037109375, 24.764892578125, 25.6494140625, 26.533935546875, 27.41845703125, 28.302978515625, 29.1875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 13.0, 11.0, 17.0, 31.0, 39.0, 49.0, 71.0, 107.0, 110.0, 149.0, 222.0, 300.0, 425.0, 591.0, 516.0, 425.0, 237.0, 173.0, 150.0, 99.0, 86.0, 66.0, 42.0, 38.0, 25.0, 12.0, 19.0, 11.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.309814453125, -12.86181640625, -12.413818359375, -11.9658203125, -11.517822265625, -11.06982421875, -10.621826171875, -10.173828125, -9.725830078125, -9.27783203125, -8.829833984375, -8.3818359375, -7.933837890625, -7.48583984375, -7.037841796875, -6.58984375, -6.141845703125, -5.69384765625, -5.245849609375, -4.7978515625, -4.349853515625, -3.90185546875, -3.453857421875, -3.005859375, -2.557861328125, -2.10986328125, -1.661865234375, -1.2138671875, -0.765869140625, -0.31787109375, 0.130126953125, 0.578125, 1.026123046875, 1.47412109375, 1.922119140625, 2.3701171875, 2.818115234375, 3.26611328125, 3.714111328125, 4.162109375, 4.610107421875, 5.05810546875, 5.506103515625, 5.9541015625, 6.402099609375, 6.85009765625, 7.298095703125, 7.74609375, 8.194091796875, 8.64208984375, 9.090087890625, 9.5380859375, 9.986083984375, 10.43408203125, 10.882080078125, 11.330078125, 11.778076171875, 12.22607421875, 12.674072265625, 13.1220703125, 13.570068359375, 14.01806640625, 14.466064453125, 14.9140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 8.0, 15.0, 15.0, 44.0, 60.0, 134.0, 257.0, 813.0, 5636.0, 4060491.0, 124258.0, 1738.0, 426.0, 168.0, 104.0, 45.0, 28.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.9375, -79.435546875, -76.93359375, -74.431640625, -71.9296875, -69.427734375, -66.92578125, -64.423828125, -61.921875, -59.419921875, -56.91796875, -54.416015625, -51.9140625, -49.412109375, -46.91015625, -44.408203125, -41.90625, -39.404296875, -36.90234375, -34.400390625, -31.8984375, -29.396484375, -26.89453125, -24.392578125, -21.890625, -19.388671875, -16.88671875, -14.384765625, -11.8828125, -9.380859375, -6.87890625, -4.376953125, -1.875, 0.626953125, 3.12890625, 5.630859375, 8.1328125, 10.634765625, 13.13671875, 15.638671875, 18.140625, 20.642578125, 23.14453125, 25.646484375, 28.1484375, 30.650390625, 33.15234375, 35.654296875, 38.15625, 40.658203125, 43.16015625, 45.662109375, 48.1640625, 50.666015625, 53.16796875, 55.669921875, 58.171875, 60.673828125, 63.17578125, 65.677734375, 68.1796875, 70.681640625, 73.18359375, 75.685546875, 78.1875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 18.0, 410.0, 567.0, 18.0, 3.0, 2.0, 0.0, 1.0], "bins": [-562.8705444335938, -553.1758422851562, -543.4810791015625, -533.786376953125, -524.0916748046875, -514.3969116210938, -504.70220947265625, -495.00750732421875, -485.3127746582031, -475.6180419921875, -465.92333984375, -456.2286071777344, -446.53387451171875, -436.83917236328125, -427.1444396972656, -417.44970703125, -407.7550048828125, -398.0602722167969, -388.3655700683594, -378.67083740234375, -368.9761047363281, -359.2814025878906, -349.586669921875, -339.8919677734375, -330.19720458984375, -320.5024719238281, -310.8077697753906, -301.113037109375, -291.4183044433594, -281.7236022949219, -272.02886962890625, -262.33416748046875, -252.63941955566406, -242.9447021484375, -233.24996948242188, -223.5552520751953, -213.86053466796875, -204.16580200195312, -194.47108459472656, -184.7763671875, -175.08163452148438, -165.3869171142578, -155.6921844482422, -145.99746704101562, -136.30274963378906, -126.60802459716797, -116.91329956054688, -107.21858215332031, -97.52386474609375, -87.82913970947266, -78.1344223022461, -68.439697265625, -58.74497604370117, -49.050254821777344, -39.35552978515625, -29.660812377929688, -19.966087341308594, -10.27136516571045, -0.5766429901123047, 9.118080139160156, 18.812801361083984, 28.507522583007812, 38.202247619628906, 47.89696502685547, 57.59169006347656]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 5.0, 12.0, 18.0, 16.0, 14.0, 20.0, 30.0, 27.0, 18.0, 27.0, 35.0, 46.0, 53.0, 45.0, 52.0, 46.0, 41.0, 41.0, 41.0, 49.0, 34.0, 49.0, 39.0, 36.0, 27.0, 20.0, 21.0, 17.0, 16.0, 19.0, 9.0, 12.0, 10.0, 8.0, 6.0, 9.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.919647216796875, -47.3433723449707, -45.76709747314453, -44.19082260131836, -42.61454772949219, -41.03827667236328, -39.46200180053711, -37.88572692871094, -36.309452056884766, -34.733177185058594, -33.15690231323242, -31.580629348754883, -30.00435447692871, -28.42807960510254, -26.851806640625, -25.275531768798828, -23.699256896972656, -22.122982025146484, -20.546707153320312, -18.970434188842773, -17.3941593170166, -15.81788444519043, -14.241610527038574, -12.665336608886719, -11.089061737060547, -9.512786865234375, -7.9365129470825195, -6.360238552093506, -4.783964157104492, -3.2076897621154785, -1.6314153671264648, -0.055141448974609375, 1.5211334228515625, 3.097407817840576, 4.67368221282959, 6.2499566078186035, 7.826231002807617, 9.402505874633789, 10.978779792785645, 12.5550537109375, 14.131328582763672, 15.707603454589844, 17.283878326416016, 18.860151290893555, 20.436426162719727, 22.0127010345459, 23.588973999023438, 25.16524887084961, 26.74152374267578, 28.317798614501953, 29.894073486328125, 31.470346450805664, 33.04662322998047, 34.622894287109375, 36.19916915893555, 37.77544403076172, 39.35171890258789, 40.92799377441406, 42.504268646240234, 44.080543518066406, 45.65681457519531, 47.233089447021484, 48.809364318847656, 50.38563919067383, 51.9619140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 14.0, 21.0, 21.0, 14.0, 25.0, 24.0, 42.0, 38.0, 30.0, 36.0, 48.0, 34.0, 33.0, 44.0, 52.0, 59.0, 50.0, 44.0, 39.0, 45.0, 46.0, 38.0, 30.0, 22.0, 27.0, 22.0, 20.0, 18.0, 12.0, 12.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.48248291015625, -7.2540283203125, -7.02557373046875, -6.797119140625, -6.56866455078125, -6.3402099609375, -6.11175537109375, -5.88330078125, -5.65484619140625, -5.4263916015625, -5.19793701171875, -4.969482421875, -4.74102783203125, -4.5125732421875, -4.28411865234375, -4.0556640625, -3.82720947265625, -3.5987548828125, -3.37030029296875, -3.141845703125, -2.91339111328125, -2.6849365234375, -2.45648193359375, -2.22802734375, -1.99957275390625, -1.7711181640625, -1.54266357421875, -1.314208984375, -1.08575439453125, -0.8572998046875, -0.62884521484375, -0.400390625, -0.17193603515625, 0.0565185546875, 0.28497314453125, 0.513427734375, 0.74188232421875, 0.9703369140625, 1.19879150390625, 1.42724609375, 1.65570068359375, 1.8841552734375, 2.11260986328125, 2.341064453125, 2.56951904296875, 2.7979736328125, 3.02642822265625, 3.2548828125, 3.48333740234375, 3.7117919921875, 3.94024658203125, 4.168701171875, 4.39715576171875, 4.6256103515625, 4.85406494140625, 5.08251953125, 5.31097412109375, 5.5394287109375, 5.76788330078125, 5.996337890625, 6.22479248046875, 6.4532470703125, 6.68170166015625, 6.91015625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 11.0, 8.0, 21.0, 35.0, 48.0, 70.0, 103.0, 135.0, 239.0, 402.0, 581.0, 851.0, 1368.0, 2148.0, 3559.0, 5660.0, 9228.0, 14969.0, 24545.0, 40881.0, 68386.0, 121283.0, 235941.0, 230607.0, 118275.0, 66884.0, 39696.0, 24247.0, 14510.0, 8974.0, 5524.0, 3426.0, 2076.0, 1449.0, 837.0, 530.0, 361.0, 256.0, 139.0, 90.0, 71.0, 51.0, 25.0, 19.0, 13.0, 8.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.021392822265625, -0.98614501953125, -0.950897216796875, -0.9156494140625, -0.880401611328125, -0.84515380859375, -0.809906005859375, -0.774658203125, -0.739410400390625, -0.70416259765625, -0.668914794921875, -0.6336669921875, -0.598419189453125, -0.56317138671875, -0.527923583984375, -0.49267578125, -0.457427978515625, -0.42218017578125, -0.386932373046875, -0.3516845703125, -0.316436767578125, -0.28118896484375, -0.245941162109375, -0.210693359375, -0.175445556640625, -0.14019775390625, -0.104949951171875, -0.0697021484375, -0.034454345703125, 0.00079345703125, 0.036041259765625, 0.0712890625, 0.106536865234375, 0.14178466796875, 0.177032470703125, 0.2122802734375, 0.247528076171875, 0.28277587890625, 0.318023681640625, 0.353271484375, 0.388519287109375, 0.42376708984375, 0.459014892578125, 0.4942626953125, 0.529510498046875, 0.56475830078125, 0.600006103515625, 0.63525390625, 0.670501708984375, 0.70574951171875, 0.740997314453125, 0.7762451171875, 0.811492919921875, 0.84674072265625, 0.881988525390625, 0.917236328125, 0.952484130859375, 0.98773193359375, 1.022979736328125, 1.0582275390625, 1.093475341796875, 1.12872314453125, 1.163970947265625, 1.19921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 11.0, 11.0, 18.0, 19.0, 16.0, 15.0, 26.0, 26.0, 27.0, 32.0, 28.0, 24.0, 34.0, 37.0, 32.0, 38.0, 39.0, 1081.0, 33.0, 30.0, 38.0, 42.0, 46.0, 32.0, 47.0, 23.0, 30.0, 33.0, 27.0, 17.0, 20.0, 12.0, 12.0, 8.0, 12.0, 5.0, 3.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.3671875, -4.237152099609375, -4.10711669921875, -3.977081298828125, -3.8470458984375, -3.717010498046875, -3.58697509765625, -3.456939697265625, -3.326904296875, -3.196868896484375, -3.06683349609375, -2.936798095703125, -2.8067626953125, -2.676727294921875, -2.54669189453125, -2.416656494140625, -2.28662109375, -2.156585693359375, -2.02655029296875, -1.896514892578125, -1.7664794921875, -1.636444091796875, -1.50640869140625, -1.376373291015625, -1.246337890625, -1.116302490234375, -0.98626708984375, -0.856231689453125, -0.7261962890625, -0.596160888671875, -0.46612548828125, -0.336090087890625, -0.2060546875, -0.076019287109375, 0.05401611328125, 0.184051513671875, 0.3140869140625, 0.444122314453125, 0.57415771484375, 0.704193115234375, 0.834228515625, 0.964263916015625, 1.09429931640625, 1.224334716796875, 1.3543701171875, 1.484405517578125, 1.61444091796875, 1.744476318359375, 1.87451171875, 2.004547119140625, 2.13458251953125, 2.264617919921875, 2.3946533203125, 2.524688720703125, 2.65472412109375, 2.784759521484375, 2.914794921875, 3.044830322265625, 3.17486572265625, 3.304901123046875, 3.4349365234375, 3.564971923828125, 3.69500732421875, 3.825042724609375, 3.955078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 8.0, 10.0, 10.0, 9.0, 32.0, 35.0, 45.0, 79.0, 118.0, 205.0, 281.0, 445.0, 633.0, 944.0, 1404.0, 2033.0, 3222.0, 4869.0, 7306.0, 11425.0, 17637.0, 27430.0, 43137.0, 69060.0, 113360.0, 204137.0, 1266911.0, 121157.0, 73469.0, 45648.0, 28908.0, 18343.0, 11704.0, 7883.0, 5112.0, 3407.0, 2282.0, 1526.0, 937.0, 610.0, 439.0, 305.0, 218.0, 140.0, 84.0, 71.0, 51.0, 22.0, 15.0, 14.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89501953125, -0.8652420043945312, -0.8354644775390625, -0.8056869506835938, -0.775909423828125, -0.7461318969726562, -0.7163543701171875, -0.6865768432617188, -0.65679931640625, -0.6270217895507812, -0.5972442626953125, -0.5674667358398438, -0.537689208984375, -0.5079116821289062, -0.4781341552734375, -0.44835662841796875, -0.4185791015625, -0.38880157470703125, -0.3590240478515625, -0.32924652099609375, -0.299468994140625, -0.26969146728515625, -0.2399139404296875, -0.21013641357421875, -0.18035888671875, -0.15058135986328125, -0.1208038330078125, -0.09102630615234375, -0.061248779296875, -0.03147125244140625, -0.0016937255859375, 0.02808380126953125, 0.057861328125, 0.08763885498046875, 0.1174163818359375, 0.14719390869140625, 0.176971435546875, 0.20674896240234375, 0.2365264892578125, 0.26630401611328125, 0.29608154296875, 0.32585906982421875, 0.3556365966796875, 0.38541412353515625, 0.415191650390625, 0.44496917724609375, 0.4747467041015625, 0.5045242309570312, 0.5343017578125, 0.5640792846679688, 0.5938568115234375, 0.6236343383789062, 0.653411865234375, 0.6831893920898438, 0.7129669189453125, 0.7427444458007812, 0.77252197265625, 0.8022994995117188, 0.8320770263671875, 0.8618545532226562, 0.891632080078125, 0.9214096069335938, 0.9511871337890625, 0.9809646606445312, 1.0107421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 10.0, 7.0, 14.0, 22.0, 26.0, 26.0, 33.0, 34.0, 53.0, 64.0, 72.0, 82.0, 89.0, 82.0, 74.0, 57.0, 45.0, 44.0, 23.0, 35.0, 13.0, 14.0, 12.0, 13.0, 15.0, 6.0, 6.0, 10.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005064010620117188, -0.00048795342445373535, -0.00046950578689575195, -0.00045105814933776855, -0.00043261051177978516, -0.00041416287422180176, -0.00039571523666381836, -0.00037726759910583496, -0.00035881996154785156, -0.00034037232398986816, -0.00032192468643188477, -0.00030347704887390137, -0.00028502941131591797, -0.00026658177375793457, -0.00024813413619995117, -0.00022968649864196777, -0.00021123886108398438, -0.00019279122352600098, -0.00017434358596801758, -0.00015589594841003418, -0.00013744831085205078, -0.00011900067329406738, -0.00010055303573608398, -8.210539817810059e-05, -6.365776062011719e-05, -4.521012306213379e-05, -2.676248550415039e-05, -8.314847946166992e-06, 1.0132789611816406e-05, 2.8580427169799805e-05, 4.70280647277832e-05, 6.54757022857666e-05, 8.392333984375e-05, 0.0001023709774017334, 0.0001208186149597168, 0.0001392662525177002, 0.0001577138900756836, 0.000176161527633667, 0.0001946091651916504, 0.0002130568027496338, 0.0002315044403076172, 0.0002499520778656006, 0.000268399715423584, 0.0002868473529815674, 0.0003052949905395508, 0.0003237426280975342, 0.0003421902656555176, 0.000360637903213501, 0.0003790855407714844, 0.0003975331783294678, 0.00041598081588745117, 0.00043442845344543457, 0.00045287609100341797, 0.00047132372856140137, 0.0004897713661193848, 0.0005082190036773682, 0.0005266666412353516, 0.000545114278793335, 0.0005635619163513184, 0.0005820095539093018, 0.0006004571914672852, 0.0006189048290252686, 0.000637352466583252, 0.0006558001041412354, 0.0006742477416992188]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 8.0, 13.0, 21.0, 12.0, 29.0, 21.0, 44.0, 49.0, 49.0, 73.0, 115.0, 175.0, 266.0, 391.0, 777.0, 3341.0, 1028392.0, 12477.0, 869.0, 504.0, 287.0, 153.0, 137.0, 85.0, 59.0, 48.0, 45.0, 22.0, 21.0, 19.0, 10.0, 4.0, 10.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0120086669921875, -0.011640310287475586, -0.011271953582763672, -0.010903596878051758, -0.010535240173339844, -0.01016688346862793, -0.009798526763916016, -0.009430170059204102, -0.009061813354492188, -0.008693456649780273, -0.00832509994506836, -0.007956743240356445, -0.007588386535644531, -0.007220029830932617, -0.006851673126220703, -0.006483316421508789, -0.006114959716796875, -0.005746603012084961, -0.005378246307373047, -0.005009889602661133, -0.004641532897949219, -0.004273176193237305, -0.0039048194885253906, -0.0035364627838134766, -0.0031681060791015625, -0.0027997493743896484, -0.0024313926696777344, -0.0020630359649658203, -0.0016946792602539062, -0.0013263225555419922, -0.0009579658508300781, -0.0005896091461181641, -0.00022125244140625, 0.00014710426330566406, 0.0005154609680175781, 0.0008838176727294922, 0.0012521743774414062, 0.0016205310821533203, 0.0019888877868652344, 0.0023572444915771484, 0.0027256011962890625, 0.0030939579010009766, 0.0034623146057128906, 0.0038306713104248047, 0.004199028015136719, 0.004567384719848633, 0.004935741424560547, 0.005304098129272461, 0.005672454833984375, 0.006040811538696289, 0.006409168243408203, 0.006777524948120117, 0.007145881652832031, 0.007514238357543945, 0.00788259506225586, 0.008250951766967773, 0.008619308471679688, 0.008987665176391602, 0.009356021881103516, 0.00972437858581543, 0.010092735290527344, 0.010461091995239258, 0.010829448699951172, 0.011197805404663086, 0.011566162109375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 42.0, 417.0, 478.0, 71.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007842280901968479, -0.0007322087767533958, -0.0006801894633099437, -0.0006281701498664916, -0.0005761508364230394, -0.0005241315229795873, -0.0004721122095361352, -0.0004200928960926831, -0.00036807358264923096, -0.00031605426920577884, -0.0002640349557623267, -0.0002120156423188746, -0.00015999632887542248, -0.00010797701543197036, -5.595770198851824e-05, -3.938388545066118e-06, 4.8080924898386e-05, 0.00010010023834183812, 0.00015211955178529024, 0.00020413886522874236, 0.0002561581786721945, 0.0003081774921156466, 0.0003601968055590987, 0.00041221611900255084, 0.00046423543244600296, 0.0005162547458894551, 0.0005682740593329072, 0.0006202933727763593, 0.0006723126862198114, 0.0007243319996632636, 0.0007763513131067157, 0.0008283706265501678, 0.0008803899399936199, 0.000932409253437072, 0.0009844285668805242, 0.0010364479385316372, 0.0010884671937674284, 0.0011404864490032196, 0.0011925058206543326, 0.0012445251923054457, 0.0012965444475412369, 0.001348563702777028, 0.0014005830744281411, 0.0014526024460792542, 0.0015046217013150454, 0.0015566409565508366, 0.0016086603282019496, 0.0016606796998530626, 0.0017126989550888538, 0.001764718210324645, 0.001816737581975758, 0.0018687569536268711, 0.0019207762088626623, 0.0019727954640984535, 0.0020248149521648884, 0.0020768342074006796, 0.002128853462636471, 0.002180872717872262, 0.002232891973108053, 0.002284911461174488, 0.0023369307164102793, 0.0023889499716460705, 0.0024409694597125053, 0.0024929887149482965, 0.0025450079701840878]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 5.0, 9.0, 6.0, 8.0, 13.0, 20.0, 14.0, 15.0, 26.0, 25.0, 25.0, 21.0, 29.0, 37.0, 44.0, 43.0, 40.0, 35.0, 43.0, 45.0, 40.0, 52.0, 47.0, 37.0, 41.0, 41.0, 36.0, 38.0, 27.0, 19.0, 27.0, 24.0, 16.0, 11.0, 8.0, 8.0, 8.0, 2.0, 4.0, 2.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002828240394592285, -0.0002743285149335861, -0.0002658329904079437, -0.00025733746588230133, -0.00024884194135665894, -0.00024034641683101654, -0.00023185089230537415, -0.00022335536777973175, -0.00021485984325408936, -0.00020636431872844696, -0.00019786879420280457, -0.00018937326967716217, -0.00018087774515151978, -0.00017238222062587738, -0.00016388669610023499, -0.0001553911715745926, -0.0001468956470489502, -0.0001384001225233078, -0.0001299045979976654, -0.00012140907347202301, -0.00011291354894638062, -0.00010441802442073822, -9.592249989509583e-05, -8.742697536945343e-05, -7.893145084381104e-05, -7.043592631816864e-05, -6.194040179252625e-05, -5.344487726688385e-05, -4.4949352741241455e-05, -3.645382821559906e-05, -2.7958303689956665e-05, -1.946277916431427e-05, -1.0967254638671875e-05, -2.47173011302948e-06, 6.023794412612915e-06, 1.451931893825531e-05, 2.3014843463897705e-05, 3.15103679895401e-05, 4.0005892515182495e-05, 4.850141704082489e-05, 5.6996941566467285e-05, 6.549246609210968e-05, 7.398799061775208e-05, 8.248351514339447e-05, 9.097903966903687e-05, 9.947456419467926e-05, 0.00010797008872032166, 0.00011646561324596405, 0.00012496113777160645, 0.00013345666229724884, 0.00014195218682289124, 0.00015044771134853363, 0.00015894323587417603, 0.00016743876039981842, 0.00017593428492546082, 0.0001844298094511032, 0.0001929253339767456, 0.000201420858502388, 0.0002099163830280304, 0.0002184119075536728, 0.00022690743207931519, 0.00023540295660495758, 0.00024389848113059998, 0.00025239400565624237, 0.00026088953018188477]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 14.0, 21.0, 21.0, 14.0, 25.0, 24.0, 42.0, 38.0, 30.0, 36.0, 48.0, 34.0, 33.0, 44.0, 52.0, 59.0, 50.0, 44.0, 39.0, 45.0, 46.0, 38.0, 30.0, 22.0, 27.0, 22.0, 20.0, 18.0, 12.0, 12.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.48248291015625, -7.2540283203125, -7.02557373046875, -6.797119140625, -6.56866455078125, -6.3402099609375, -6.11175537109375, -5.88330078125, -5.65484619140625, -5.4263916015625, -5.19793701171875, -4.969482421875, -4.74102783203125, -4.5125732421875, -4.28411865234375, -4.0556640625, -3.82720947265625, -3.5987548828125, -3.37030029296875, -3.141845703125, -2.91339111328125, -2.6849365234375, -2.45648193359375, -2.22802734375, -1.99957275390625, -1.7711181640625, -1.54266357421875, -1.314208984375, -1.08575439453125, -0.8572998046875, -0.62884521484375, -0.400390625, -0.17193603515625, 0.0565185546875, 0.28497314453125, 0.513427734375, 0.74188232421875, 0.9703369140625, 1.19879150390625, 1.42724609375, 1.65570068359375, 1.8841552734375, 2.11260986328125, 2.341064453125, 2.56951904296875, 2.7979736328125, 3.02642822265625, 3.2548828125, 3.48333740234375, 3.7117919921875, 3.94024658203125, 4.168701171875, 4.39715576171875, 4.6256103515625, 4.85406494140625, 5.08251953125, 5.31097412109375, 5.5394287109375, 5.76788330078125, 5.996337890625, 6.22479248046875, 6.4532470703125, 6.68170166015625, 6.91015625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 12.0, 15.0, 11.0, 20.0, 39.0, 60.0, 79.0, 136.0, 201.0, 292.0, 424.0, 677.0, 1091.0, 1732.0, 3107.0, 6679.0, 27989.0, 373184.0, 574544.0, 41568.0, 8039.0, 3390.0, 1919.0, 1171.0, 769.0, 489.0, 319.0, 184.0, 112.0, 90.0, 73.0, 49.0, 25.0, 14.0, 24.0, 3.0, 4.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.55712890625, -16.9736328125, -16.39013671875, -15.806640625, -15.22314453125, -14.6396484375, -14.05615234375, -13.47265625, -12.88916015625, -12.3056640625, -11.72216796875, -11.138671875, -10.55517578125, -9.9716796875, -9.38818359375, -8.8046875, -8.22119140625, -7.6376953125, -7.05419921875, -6.470703125, -5.88720703125, -5.3037109375, -4.72021484375, -4.13671875, -3.55322265625, -2.9697265625, -2.38623046875, -1.802734375, -1.21923828125, -0.6357421875, -0.05224609375, 0.53125, 1.11474609375, 1.6982421875, 2.28173828125, 2.865234375, 3.44873046875, 4.0322265625, 4.61572265625, 5.19921875, 5.78271484375, 6.3662109375, 6.94970703125, 7.533203125, 8.11669921875, 8.7001953125, 9.28369140625, 9.8671875, 10.45068359375, 11.0341796875, 11.61767578125, 12.201171875, 12.78466796875, 13.3681640625, 13.95166015625, 14.53515625, 15.11865234375, 15.7021484375, 16.28564453125, 16.869140625, 17.45263671875, 18.0361328125, 18.61962890625, 19.203125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 3.0, 7.0, 9.0, 14.0, 17.0, 18.0, 29.0, 33.0, 27.0, 41.0, 46.0, 48.0, 43.0, 79.0, 204.0, 1624.0, 279.0, 97.0, 63.0, 47.0, 57.0, 46.0, 28.0, 43.0, 26.0, 21.0, 12.0, 12.0, 13.0, 9.0, 7.0, 3.0, 6.0, 5.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.875, -18.2978515625, -17.720703125, -17.1435546875, -16.56640625, -15.9892578125, -15.412109375, -14.8349609375, -14.2578125, -13.6806640625, -13.103515625, -12.5263671875, -11.94921875, -11.3720703125, -10.794921875, -10.2177734375, -9.640625, -9.0634765625, -8.486328125, -7.9091796875, -7.33203125, -6.7548828125, -6.177734375, -5.6005859375, -5.0234375, -4.4462890625, -3.869140625, -3.2919921875, -2.71484375, -2.1376953125, -1.560546875, -0.9833984375, -0.40625, 0.1708984375, 0.748046875, 1.3251953125, 1.90234375, 2.4794921875, 3.056640625, 3.6337890625, 4.2109375, 4.7880859375, 5.365234375, 5.9423828125, 6.51953125, 7.0966796875, 7.673828125, 8.2509765625, 8.828125, 9.4052734375, 9.982421875, 10.5595703125, 11.13671875, 11.7138671875, 12.291015625, 12.8681640625, 13.4453125, 14.0224609375, 14.599609375, 15.1767578125, 15.75390625, 16.3310546875, 16.908203125, 17.4853515625, 18.0625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 8.0, 7.0, 4.0, 9.0, 14.0, 29.0, 20.0, 27.0, 40.0, 43.0, 60.0, 57.0, 102.0, 124.0, 168.0, 267.0, 477.0, 1117.0, 7103.0, 3107598.0, 25295.0, 1459.0, 586.0, 305.0, 181.0, 134.0, 107.0, 83.0, 48.0, 57.0, 42.0, 26.0, 19.0, 18.0, 20.0, 9.0, 5.0, 12.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -45.9677734375, -44.466796875, -42.9658203125, -41.46484375, -39.9638671875, -38.462890625, -36.9619140625, -35.4609375, -33.9599609375, -32.458984375, -30.9580078125, -29.45703125, -27.9560546875, -26.455078125, -24.9541015625, -23.453125, -21.9521484375, -20.451171875, -18.9501953125, -17.44921875, -15.9482421875, -14.447265625, -12.9462890625, -11.4453125, -9.9443359375, -8.443359375, -6.9423828125, -5.44140625, -3.9404296875, -2.439453125, -0.9384765625, 0.5625, 2.0634765625, 3.564453125, 5.0654296875, 6.56640625, 8.0673828125, 9.568359375, 11.0693359375, 12.5703125, 14.0712890625, 15.572265625, 17.0732421875, 18.57421875, 20.0751953125, 21.576171875, 23.0771484375, 24.578125, 26.0791015625, 27.580078125, 29.0810546875, 30.58203125, 32.0830078125, 33.583984375, 35.0849609375, 36.5859375, 38.0869140625, 39.587890625, 41.0888671875, 42.58984375, 44.0908203125, 45.591796875, 47.0927734375, 48.59375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 17.0, 40.0, 70.0, 114.0, 164.0, 167.0, 180.0, 107.0, 72.0, 28.0, 20.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.86111831665039, -41.53313446044922, -40.20515060424805, -38.87716293334961, -37.54917907714844, -36.221195220947266, -34.893211364746094, -33.56522750854492, -32.23724365234375, -30.909259796142578, -29.581274032592773, -28.2532901763916, -26.925304412841797, -25.597320556640625, -24.269336700439453, -22.94135284423828, -21.613365173339844, -20.285381317138672, -18.957395553588867, -17.629411697387695, -16.30142593383789, -14.973442077636719, -13.645458221435547, -12.317473411560059, -10.98948860168457, -9.661503791809082, -8.333518981933594, -7.005535125732422, -5.677550315856934, -4.349565505981445, -3.0215811729431152, -1.6935968399047852, -0.36560821533203125, 0.9623763561248779, 2.290360927581787, 3.6183454990386963, 4.9463300704956055, 6.274314880371094, 7.602299213409424, 8.930283546447754, 10.258268356323242, 11.58625316619873, 12.914237976074219, 14.24222183227539, 15.570206642150879, 16.898191452026367, 18.22617530822754, 19.554161071777344, 20.882144927978516, 22.210128784179688, 23.538114547729492, 24.866098403930664, 26.19408416748047, 27.52206802368164, 28.850051879882812, 30.178035736083984, 31.50602149963379, 32.834007263183594, 34.161991119384766, 35.48997497558594, 36.81795883178711, 38.14594268798828, 39.47393035888672, 40.80191421508789, 42.12989807128906]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 9.0, 12.0, 7.0, 14.0, 14.0, 19.0, 18.0, 33.0, 39.0, 26.0, 21.0, 40.0, 41.0, 48.0, 37.0, 39.0, 55.0, 49.0, 47.0, 30.0, 48.0, 31.0, 19.0, 33.0, 36.0, 24.0, 22.0, 34.0, 19.0, 25.0, 16.0, 16.0, 9.0, 14.0, 9.0, 11.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-54.39656066894531, -52.722900390625, -51.04924392700195, -49.37558364868164, -47.701927185058594, -46.02826690673828, -44.354610443115234, -42.68095016479492, -41.007293701171875, -39.33363342285156, -37.659976959228516, -35.9863166809082, -34.312660217285156, -32.638999938964844, -30.965343475341797, -29.291683197021484, -27.618024826049805, -25.944366455078125, -24.270708084106445, -22.597049713134766, -20.923391342163086, -19.249732971191406, -17.576072692871094, -15.90241527557373, -14.22875690460205, -12.555098533630371, -10.881440162658691, -9.207780838012695, -7.534122943878174, -5.860464096069336, -4.186805725097656, -2.5131473541259766, -0.8394889831542969, 0.8341695070266724, 2.5078279972076416, 4.1814866065979, 5.85514497756958, 7.528803825378418, 9.202462196350098, 10.876120567321777, 12.549778938293457, 14.223437309265137, 15.897095680236816, 17.570755004882812, 19.244413375854492, 20.918071746826172, 22.59173011779785, 24.26538848876953, 25.93904685974121, 27.61270523071289, 29.28636360168457, 30.96002197265625, 32.63368225097656, 34.30733871459961, 35.98099899291992, 37.65465545654297, 39.32831573486328, 41.001976013183594, 42.67563247680664, 44.34929275512695, 46.02294921875, 47.69660949707031, 49.37026596069336, 51.04392623901367, 52.71758270263672]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 9.0, 9.0, 4.0, 15.0, 15.0, 16.0, 23.0, 22.0, 20.0, 34.0, 51.0, 33.0, 35.0, 52.0, 58.0, 52.0, 54.0, 41.0, 54.0, 34.0, 46.0, 41.0, 39.0, 37.0, 29.0, 29.0, 26.0, 20.0, 17.0, 34.0, 17.0, 12.0, 5.0, 8.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.140625, -8.8951416015625, -8.649658203125, -8.4041748046875, -8.15869140625, -7.9132080078125, -7.667724609375, -7.4222412109375, -7.1767578125, -6.9312744140625, -6.685791015625, -6.4403076171875, -6.19482421875, -5.9493408203125, -5.703857421875, -5.4583740234375, -5.212890625, -4.9674072265625, -4.721923828125, -4.4764404296875, -4.23095703125, -3.9854736328125, -3.739990234375, -3.4945068359375, -3.2490234375, -3.0035400390625, -2.758056640625, -2.5125732421875, -2.26708984375, -2.0216064453125, -1.776123046875, -1.5306396484375, -1.28515625, -1.0396728515625, -0.794189453125, -0.5487060546875, -0.30322265625, -0.0577392578125, 0.187744140625, 0.4332275390625, 0.6787109375, 0.9241943359375, 1.169677734375, 1.4151611328125, 1.66064453125, 1.9061279296875, 2.151611328125, 2.3970947265625, 2.642578125, 2.8880615234375, 3.133544921875, 3.3790283203125, 3.62451171875, 3.8699951171875, 4.115478515625, 4.3609619140625, 4.6064453125, 4.8519287109375, 5.097412109375, 5.3428955078125, 5.58837890625, 5.8338623046875, 6.079345703125, 6.3248291015625, 6.5703125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 14.0, 24.0, 26.0, 21.0, 43.0, 36.0, 76.0, 95.0, 145.0, 183.0, 325.0, 469.0, 785.0, 1252.0, 2412.0, 5423.0, 15014.0, 66552.0, 489791.0, 2062971.0, 1298972.0, 198383.0, 33438.0, 9602.0, 3630.0, 1808.0, 1013.0, 566.0, 371.0, 266.0, 157.0, 113.0, 81.0, 69.0, 41.0, 28.0, 24.0, 12.0, 15.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0], "bins": [-12.5234375, -12.1734619140625, -11.823486328125, -11.4735107421875, -11.12353515625, -10.7735595703125, -10.423583984375, -10.0736083984375, -9.7236328125, -9.3736572265625, -9.023681640625, -8.6737060546875, -8.32373046875, -7.9737548828125, -7.623779296875, -7.2738037109375, -6.923828125, -6.5738525390625, -6.223876953125, -5.8739013671875, -5.52392578125, -5.1739501953125, -4.823974609375, -4.4739990234375, -4.1240234375, -3.7740478515625, -3.424072265625, -3.0740966796875, -2.72412109375, -2.3741455078125, -2.024169921875, -1.6741943359375, -1.32421875, -0.9742431640625, -0.624267578125, -0.2742919921875, 0.07568359375, 0.4256591796875, 0.775634765625, 1.1256103515625, 1.4755859375, 1.8255615234375, 2.175537109375, 2.5255126953125, 2.87548828125, 3.2254638671875, 3.575439453125, 3.9254150390625, 4.275390625, 4.6253662109375, 4.975341796875, 5.3253173828125, 5.67529296875, 6.0252685546875, 6.375244140625, 6.7252197265625, 7.0751953125, 7.4251708984375, 7.775146484375, 8.1251220703125, 8.47509765625, 8.8250732421875, 9.175048828125, 9.5250244140625, 9.875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 13.0, 15.0, 41.0, 108.0, 393.0, 1098.0, 1620.0, 561.0, 167.0, 50.0, 10.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.03125, -41.650390625, -40.26953125, -38.888671875, -37.5078125, -36.126953125, -34.74609375, -33.365234375, -31.984375, -30.603515625, -29.22265625, -27.841796875, -26.4609375, -25.080078125, -23.69921875, -22.318359375, -20.9375, -19.556640625, -18.17578125, -16.794921875, -15.4140625, -14.033203125, -12.65234375, -11.271484375, -9.890625, -8.509765625, -7.12890625, -5.748046875, -4.3671875, -2.986328125, -1.60546875, -0.224609375, 1.15625, 2.537109375, 3.91796875, 5.298828125, 6.6796875, 8.060546875, 9.44140625, 10.822265625, 12.203125, 13.583984375, 14.96484375, 16.345703125, 17.7265625, 19.107421875, 20.48828125, 21.869140625, 23.25, 24.630859375, 26.01171875, 27.392578125, 28.7734375, 30.154296875, 31.53515625, 32.916015625, 34.296875, 35.677734375, 37.05859375, 38.439453125, 39.8203125, 41.201171875, 42.58203125, 43.962890625, 45.34375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 4.0, 19.0, 42.0, 75.0, 205.0, 756.0, 4187.0, 4170022.0, 17055.0, 1309.0, 360.0, 130.0, 48.0, 21.0, 12.0, 8.0, 8.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.3125, -87.548828125, -84.78515625, -82.021484375, -79.2578125, -76.494140625, -73.73046875, -70.966796875, -68.203125, -65.439453125, -62.67578125, -59.912109375, -57.1484375, -54.384765625, -51.62109375, -48.857421875, -46.09375, -43.330078125, -40.56640625, -37.802734375, -35.0390625, -32.275390625, -29.51171875, -26.748046875, -23.984375, -21.220703125, -18.45703125, -15.693359375, -12.9296875, -10.166015625, -7.40234375, -4.638671875, -1.875, 0.888671875, 3.65234375, 6.416015625, 9.1796875, 11.943359375, 14.70703125, 17.470703125, 20.234375, 22.998046875, 25.76171875, 28.525390625, 31.2890625, 34.052734375, 36.81640625, 39.580078125, 42.34375, 45.107421875, 47.87109375, 50.634765625, 53.3984375, 56.162109375, 58.92578125, 61.689453125, 64.453125, 67.216796875, 69.98046875, 72.744140625, 75.5078125, 78.271484375, 81.03515625, 83.798828125, 86.5625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 85.0, 592.0, 319.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.76255798339844, -240.84356689453125, -233.92457580566406, -227.00558471679688, -220.08657836914062, -213.16758728027344, -206.24859619140625, -199.32960510253906, -192.41061401367188, -185.4916229248047, -178.5726318359375, -171.65362548828125, -164.73463439941406, -157.81564331054688, -150.8966522216797, -143.9776611328125, -137.05865478515625, -130.13966369628906, -123.22066497802734, -116.30167388916016, -109.38267517089844, -102.46368408203125, -95.54469299316406, -88.62570190429688, -81.70670318603516, -74.78771209716797, -67.86871337890625, -60.94972229003906, -54.03072738647461, -47.111732482910156, -40.19274139404297, -33.273746490478516, -26.354736328125, -19.435741424560547, -12.516748428344727, -5.597755432128906, 1.3212394714355469, 8.240234375, 15.159225463867188, 22.07822036743164, 28.997215270996094, 35.91621017456055, 42.835205078125, 49.75419616699219, 56.67319107055664, 63.592185974121094, 70.51117706298828, 77.43017578125, 84.34916687011719, 91.26815795898438, 98.1871566772461, 105.10614776611328, 112.025146484375, 118.94413757324219, 125.86312866210938, 132.78211975097656, 139.70111083984375, 146.62010192871094, 153.53909301757812, 160.45809936523438, 167.37709045410156, 174.29608154296875, 181.21507263183594, 188.13406372070312, 195.05307006835938]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 7.0, 13.0, 12.0, 14.0, 14.0, 18.0, 18.0, 31.0, 30.0, 29.0, 29.0, 26.0, 55.0, 52.0, 41.0, 48.0, 42.0, 34.0, 46.0, 29.0, 48.0, 38.0, 38.0, 32.0, 28.0, 36.0, 23.0, 23.0, 26.0, 17.0, 19.0, 26.0, 9.0, 9.0, 6.0, 6.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.628509521484375, -38.98917770385742, -37.3498420715332, -35.71051025390625, -34.0711784362793, -32.431846618652344, -30.792510986328125, -29.153179168701172, -27.513845443725586, -25.87451171875, -24.235179901123047, -22.59584617614746, -20.956512451171875, -19.317180633544922, -17.677846908569336, -16.03851318359375, -14.399181365966797, -12.759848594665527, -11.120515823364258, -9.481182098388672, -7.841849327087402, -6.202516555786133, -4.563182830810547, -2.9238500595092773, -1.2845172882080078, 0.3548157215118408, 1.9941487312316895, 3.633481979370117, 5.272814750671387, 6.912147521972656, 8.551481246948242, 10.190814018249512, 11.830146789550781, 13.46947956085205, 15.10881233215332, 16.748146057128906, 18.38747787475586, 20.026811599731445, 21.66614532470703, 23.305477142333984, 24.94481086730957, 26.584144592285156, 28.22347640991211, 29.862810134887695, 31.50214385986328, 33.141475677490234, 34.78080749511719, 36.420143127441406, 38.05947494506836, 39.69880676269531, 41.33814239501953, 42.977474212646484, 44.61680603027344, 46.256141662597656, 47.89547348022461, 49.53480529785156, 51.17414093017578, 52.813472747802734, 54.45280838012695, 56.092140197753906, 57.73147201538086, 59.37080383300781, 61.01013946533203, 62.649471282958984, 64.28880310058594]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 12.0, 7.0, 13.0, 12.0, 12.0, 13.0, 15.0, 18.0, 25.0, 25.0, 28.0, 23.0, 26.0, 41.0, 38.0, 35.0, 37.0, 42.0, 43.0, 51.0, 38.0, 36.0, 30.0, 38.0, 44.0, 27.0, 29.0, 32.0, 31.0, 25.0, 18.0, 21.0, 14.0, 14.0, 11.0, 6.0, 9.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.62109375, -4.46685791015625, -4.3126220703125, -4.15838623046875, -4.004150390625, -3.84991455078125, -3.6956787109375, -3.54144287109375, -3.38720703125, -3.23297119140625, -3.0787353515625, -2.92449951171875, -2.770263671875, -2.61602783203125, -2.4617919921875, -2.30755615234375, -2.1533203125, -1.99908447265625, -1.8448486328125, -1.69061279296875, -1.536376953125, -1.38214111328125, -1.2279052734375, -1.07366943359375, -0.91943359375, -0.76519775390625, -0.6109619140625, -0.45672607421875, -0.302490234375, -0.14825439453125, 0.0059814453125, 0.16021728515625, 0.314453125, 0.46868896484375, 0.6229248046875, 0.77716064453125, 0.931396484375, 1.08563232421875, 1.2398681640625, 1.39410400390625, 1.54833984375, 1.70257568359375, 1.8568115234375, 2.01104736328125, 2.165283203125, 2.31951904296875, 2.4737548828125, 2.62799072265625, 2.7822265625, 2.93646240234375, 3.0906982421875, 3.24493408203125, 3.399169921875, 3.55340576171875, 3.7076416015625, 3.86187744140625, 4.01611328125, 4.17034912109375, 4.3245849609375, 4.47882080078125, 4.633056640625, 4.78729248046875, 4.9415283203125, 5.09576416015625, 5.25]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 17.0, 10.0, 29.0, 60.0, 76.0, 120.0, 199.0, 333.0, 531.0, 823.0, 1387.0, 2300.0, 3780.0, 6559.0, 11006.0, 18940.0, 32984.0, 59873.0, 112297.0, 224341.0, 271457.0, 136546.0, 71385.0, 39389.0, 22318.0, 12918.0, 7511.0, 4451.0, 2707.0, 1603.0, 946.0, 589.0, 384.0, 262.0, 150.0, 92.0, 51.0, 44.0, 22.0, 14.0, 14.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.962890625, -0.9298553466796875, -0.896820068359375, -0.8637847900390625, -0.83074951171875, -0.7977142333984375, -0.764678955078125, -0.7316436767578125, -0.6986083984375, -0.6655731201171875, -0.632537841796875, -0.5995025634765625, -0.56646728515625, -0.5334320068359375, -0.500396728515625, -0.4673614501953125, -0.434326171875, -0.4012908935546875, -0.368255615234375, -0.3352203369140625, -0.30218505859375, -0.2691497802734375, -0.236114501953125, -0.2030792236328125, -0.1700439453125, -0.1370086669921875, -0.103973388671875, -0.0709381103515625, -0.03790283203125, -0.0048675537109375, 0.028167724609375, 0.0612030029296875, 0.09423828125, 0.1272735595703125, 0.160308837890625, 0.1933441162109375, 0.22637939453125, 0.2594146728515625, 0.292449951171875, 0.3254852294921875, 0.3585205078125, 0.3915557861328125, 0.424591064453125, 0.4576263427734375, 0.49066162109375, 0.5236968994140625, 0.556732177734375, 0.5897674560546875, 0.622802734375, 0.6558380126953125, 0.688873291015625, 0.7219085693359375, 0.75494384765625, 0.7879791259765625, 0.821014404296875, 0.8540496826171875, 0.8870849609375, 0.9201202392578125, 0.953155517578125, 0.9861907958984375, 1.01922607421875, 1.0522613525390625, 1.085296630859375, 1.1183319091796875, 1.1513671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 14.0, 11.0, 18.0, 13.0, 12.0, 29.0, 26.0, 21.0, 25.0, 27.0, 34.0, 33.0, 37.0, 59.0, 44.0, 30.0, 1086.0, 34.0, 45.0, 45.0, 43.0, 39.0, 39.0, 32.0, 31.0, 25.0, 25.0, 26.0, 14.0, 18.0, 21.0, 10.0, 5.0, 9.0, 9.0, 7.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.10302734375, -2.9912109375, -2.87939453125, -2.767578125, -2.65576171875, -2.5439453125, -2.43212890625, -2.3203125, -2.20849609375, -2.0966796875, -1.98486328125, -1.873046875, -1.76123046875, -1.6494140625, -1.53759765625, -1.42578125, -1.31396484375, -1.2021484375, -1.09033203125, -0.978515625, -0.86669921875, -0.7548828125, -0.64306640625, -0.53125, -0.41943359375, -0.3076171875, -0.19580078125, -0.083984375, 0.02783203125, 0.1396484375, 0.25146484375, 0.36328125, 0.47509765625, 0.5869140625, 0.69873046875, 0.810546875, 0.92236328125, 1.0341796875, 1.14599609375, 1.2578125, 1.36962890625, 1.4814453125, 1.59326171875, 1.705078125, 1.81689453125, 1.9287109375, 2.04052734375, 2.15234375, 2.26416015625, 2.3759765625, 2.48779296875, 2.599609375, 2.71142578125, 2.8232421875, 2.93505859375, 3.046875, 3.15869140625, 3.2705078125, 3.38232421875, 3.494140625, 3.60595703125, 3.7177734375, 3.82958984375, 3.94140625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 11.0, 24.0, 20.0, 53.0, 73.0, 115.0, 152.0, 261.0, 377.0, 560.0, 819.0, 1430.0, 2106.0, 3165.0, 4943.0, 7481.0, 11731.0, 18655.0, 29653.0, 48221.0, 80743.0, 144426.0, 1299193.0, 184080.0, 101107.0, 59432.0, 36068.0, 22623.0, 14003.0, 9042.0, 5726.0, 3860.0, 2417.0, 1577.0, 1022.0, 708.0, 445.0, 272.0, 191.0, 113.0, 88.0, 49.0, 35.0, 18.0, 16.0, 7.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.86572265625, -0.8400344848632812, -0.8143463134765625, -0.7886581420898438, -0.762969970703125, -0.7372817993164062, -0.7115936279296875, -0.6859054565429688, -0.66021728515625, -0.6345291137695312, -0.6088409423828125, -0.5831527709960938, -0.557464599609375, -0.5317764282226562, -0.5060882568359375, -0.48040008544921875, -0.4547119140625, -0.42902374267578125, -0.4033355712890625, -0.37764739990234375, -0.351959228515625, -0.32627105712890625, -0.3005828857421875, -0.27489471435546875, -0.24920654296875, -0.22351837158203125, -0.1978302001953125, -0.17214202880859375, -0.146453857421875, -0.12076568603515625, -0.0950775146484375, -0.06938934326171875, -0.043701171875, -0.01801300048828125, 0.0076751708984375, 0.03336334228515625, 0.059051513671875, 0.08473968505859375, 0.1104278564453125, 0.13611602783203125, 0.16180419921875, 0.18749237060546875, 0.2131805419921875, 0.23886871337890625, 0.264556884765625, 0.29024505615234375, 0.3159332275390625, 0.34162139892578125, 0.3673095703125, 0.39299774169921875, 0.4186859130859375, 0.44437408447265625, 0.470062255859375, 0.49575042724609375, 0.5214385986328125, 0.5471267700195312, 0.57281494140625, 0.5985031127929688, 0.6241912841796875, 0.6498794555664062, 0.675567626953125, 0.7012557983398438, 0.7269439697265625, 0.7526321411132812, 0.7783203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 11.0, 13.0, 19.0, 31.0, 29.0, 38.0, 52.0, 54.0, 73.0, 66.0, 76.0, 68.0, 74.0, 71.0, 61.0, 51.0, 35.0, 31.0, 17.0, 16.0, 19.0, 17.0, 7.0, 8.0, 7.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007786750793457031, -0.0007538646459579468, -0.0007290542125701904, -0.0007042437791824341, -0.0006794333457946777, -0.0006546229124069214, -0.000629812479019165, -0.0006050020456314087, -0.0005801916122436523, -0.000555381178855896, -0.0005305707454681396, -0.0005057603120803833, -0.00048094987869262695, -0.0004561394453048706, -0.00043132901191711426, -0.0004065185785293579, -0.00038170814514160156, -0.0003568977117538452, -0.00033208727836608887, -0.0003072768449783325, -0.00028246641159057617, -0.0002576559782028198, -0.00023284554481506348, -0.00020803511142730713, -0.00018322467803955078, -0.00015841424465179443, -0.00013360381126403809, -0.00010879337787628174, -8.398294448852539e-05, -5.917251110076904e-05, -3.4362077713012695e-05, -9.551644325256348e-06, 1.52587890625e-05, 4.006922245025635e-05, 6.48796558380127e-05, 8.969008922576904e-05, 0.00011450052261352539, 0.00013931095600128174, 0.00016412138938903809, 0.00018893182277679443, 0.00021374225616455078, 0.00023855268955230713, 0.0002633631229400635, 0.0002881735563278198, 0.00031298398971557617, 0.0003377944231033325, 0.00036260485649108887, 0.0003874152898788452, 0.00041222572326660156, 0.0004370361566543579, 0.00046184659004211426, 0.0004866570234298706, 0.000511467456817627, 0.0005362778902053833, 0.0005610883235931396, 0.000585898756980896, 0.0006107091903686523, 0.0006355196237564087, 0.000660330057144165, 0.0006851404905319214, 0.0007099509239196777, 0.0007347613573074341, 0.0007595717906951904, 0.0007843822240829468, 0.0008091926574707031]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 11.0, 12.0, 13.0, 18.0, 15.0, 33.0, 31.0, 34.0, 53.0, 72.0, 92.0, 144.0, 218.0, 280.0, 497.0, 1020.0, 23066.0, 1019262.0, 1576.0, 707.0, 397.0, 254.0, 175.0, 146.0, 96.0, 69.0, 55.0, 46.0, 35.0, 28.0, 18.0, 21.0, 12.0, 12.0, 4.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01226806640625, -0.011887550354003906, -0.011507034301757812, -0.011126518249511719, -0.010746002197265625, -0.010365486145019531, -0.009984970092773438, -0.009604454040527344, -0.00922393798828125, -0.008843421936035156, -0.008462905883789062, -0.008082389831542969, -0.007701873779296875, -0.007321357727050781, -0.0069408416748046875, -0.006560325622558594, -0.0061798095703125, -0.005799293518066406, -0.0054187774658203125, -0.005038261413574219, -0.004657745361328125, -0.004277229309082031, -0.0038967132568359375, -0.0035161972045898438, -0.00313568115234375, -0.0027551651000976562, -0.0023746490478515625, -0.0019941329956054688, -0.001613616943359375, -0.0012331008911132812, -0.0008525848388671875, -0.00047206878662109375, -9.1552734375e-05, 0.00028896331787109375, 0.0006694793701171875, 0.0010499954223632812, 0.001430511474609375, 0.0018110275268554688, 0.0021915435791015625, 0.0025720596313476562, 0.00295257568359375, 0.0033330917358398438, 0.0037136077880859375, 0.004094123840332031, 0.004474639892578125, 0.004855155944824219, 0.0052356719970703125, 0.005616188049316406, 0.0059967041015625, 0.006377220153808594, 0.0067577362060546875, 0.007138252258300781, 0.007518768310546875, 0.007899284362792969, 0.008279800415039062, 0.008660316467285156, 0.00904083251953125, 0.009421348571777344, 0.009801864624023438, 0.010182380676269531, 0.010562896728515625, 0.010943412780761719, 0.011323928833007812, 0.011704444885253906, 0.0120849609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 815.0, 192.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019121458753943443, -0.0018243335653096437, -0.0017365212552249432, -0.0016487089451402426, -0.0015608965186402202, -0.0014730842085555196, -0.001385271898470819, -0.0012974594719707966, -0.001209647161886096, -0.0011218348518013954, -0.0010340225417166948, -0.0009462101734243333, -0.0008583978051319718, -0.0007705854950472713, -0.0006827731849625707, -0.0005949608166702092, -0.0005071485647931695, -0.00041933622560463846, -0.0003315238864161074, -0.00024371157633140683, -0.0001558992371428758, -6.808689795434475e-05, 1.9725412130355835e-05, 0.00010753778042271733, 0.00019535009050741792, 0.00028316242969594896, 0.00037097476888448, 0.0004587870789691806, 0.0005465993890538812, 0.0006344117573462427, 0.0007222240674309433, 0.0008100364357233047, 0.0008978487458080053, 0.000985661055892706, 0.0010734733659774065, 0.001161285676062107, 0.0012490981025621295, 0.00133691041264683, 0.0014247227227315307, 0.001512535149231553, 0.0016003474593162537, 0.0016881597694009542, 0.0017759720794856548, 0.0018637843895703554, 0.0019515968160703778, 0.0020394092425704002, 0.002127221319824457, 0.0022150338627398014, 0.0023028459399938583, 0.002390658250078559, 0.0024784705601632595, 0.00256628287024796, 0.0026540951803326607, 0.002741907723248005, 0.002829719800502062, 0.002917532343417406, 0.0030053446535021067, 0.0030931569635868073, 0.003180969273671508, 0.0032687815837562084, 0.003356593893840909, 0.0034444062039256096, 0.003532218746840954, 0.0036200310569256544, 0.003707843367010355]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 6.0, 4.0, 10.0, 10.0, 10.0, 9.0, 11.0, 13.0, 17.0, 17.0, 23.0, 33.0, 28.0, 30.0, 43.0, 33.0, 40.0, 34.0, 42.0, 47.0, 35.0, 40.0, 40.0, 33.0, 41.0, 37.0, 39.0, 33.0, 28.0, 34.0, 25.0, 28.0, 22.0, 11.0, 21.0, 14.0, 8.0, 13.0, 13.0, 6.0, 4.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000335693359375, -0.0003247419372200966, -0.0003137905150651932, -0.00030283909291028976, -0.00029188767075538635, -0.00028093624860048294, -0.00026998482644557953, -0.0002590334042906761, -0.0002480819821357727, -0.0002371305599808693, -0.00022617913782596588, -0.00021522771567106247, -0.00020427629351615906, -0.00019332487136125565, -0.00018237344920635223, -0.00017142202705144882, -0.0001604706048965454, -0.000149519182741642, -0.00013856776058673859, -0.00012761633843183517, -0.00011666491627693176, -0.00010571349412202835, -9.476207196712494e-05, -8.381064981222153e-05, -7.285922765731812e-05, -6.19078055024147e-05, -5.095638334751129e-05, -4.000496119260788e-05, -2.9053539037704468e-05, -1.8102116882801056e-05, -7.150694727897644e-06, 3.800727427005768e-06, 1.475214958190918e-05, 2.570357173681259e-05, 3.6654993891716003e-05, 4.7606416046619415e-05, 5.855783820152283e-05, 6.950926035642624e-05, 8.046068251132965e-05, 9.141210466623306e-05, 0.00010236352682113647, 0.00011331494897603989, 0.0001242663711309433, 0.0001352177932858467, 0.00014616921544075012, 0.00015712063759565353, 0.00016807205975055695, 0.00017902348190546036, 0.00018997490406036377, 0.00020092632621526718, 0.0002118777483701706, 0.000222829170525074, 0.00023378059267997742, 0.00024473201483488083, 0.00025568343698978424, 0.00026663485914468765, 0.00027758628129959106, 0.0002885377034544945, 0.0002994891256093979, 0.0003104405477643013, 0.0003213919699192047, 0.0003323433920741081, 0.00034329481422901154, 0.00035424623638391495, 0.00036519765853881836]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 12.0, 7.0, 13.0, 12.0, 12.0, 13.0, 15.0, 18.0, 25.0, 25.0, 28.0, 23.0, 26.0, 41.0, 38.0, 35.0, 37.0, 42.0, 43.0, 51.0, 38.0, 36.0, 30.0, 38.0, 44.0, 27.0, 29.0, 32.0, 30.0, 26.0, 18.0, 21.0, 14.0, 14.0, 11.0, 6.0, 9.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.62109375, -4.46685791015625, -4.3126220703125, -4.15838623046875, -4.004150390625, -3.84991455078125, -3.6956787109375, -3.54144287109375, -3.38720703125, -3.23297119140625, -3.0787353515625, -2.92449951171875, -2.770263671875, -2.61602783203125, -2.4617919921875, -2.30755615234375, -2.1533203125, -1.99908447265625, -1.8448486328125, -1.69061279296875, -1.536376953125, -1.38214111328125, -1.2279052734375, -1.07366943359375, -0.91943359375, -0.76519775390625, -0.6109619140625, -0.45672607421875, -0.302490234375, -0.14825439453125, 0.0059814453125, 0.16021728515625, 0.314453125, 0.46868896484375, 0.6229248046875, 0.77716064453125, 0.931396484375, 1.08563232421875, 1.2398681640625, 1.39410400390625, 1.54833984375, 1.70257568359375, 1.8568115234375, 2.01104736328125, 2.165283203125, 2.31951904296875, 2.4737548828125, 2.62799072265625, 2.7822265625, 2.93646240234375, 3.0906982421875, 3.24493408203125, 3.399169921875, 3.55340576171875, 3.7076416015625, 3.86187744140625, 4.01611328125, 4.17034912109375, 4.3245849609375, 4.47882080078125, 4.633056640625, 4.78729248046875, 4.9415283203125, 5.09576416015625, 5.25]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 11.0, 13.0, 18.0, 21.0, 29.0, 29.0, 47.0, 40.0, 80.0, 88.0, 134.0, 177.0, 254.0, 378.0, 604.0, 1000.0, 1737.0, 3690.0, 8814.0, 25052.0, 98952.0, 542341.0, 282807.0, 54008.0, 15715.0, 5930.0, 2650.0, 1400.0, 817.0, 529.0, 326.0, 224.0, 173.0, 112.0, 76.0, 59.0, 52.0, 36.0, 28.0, 22.0, 16.0, 12.0, 5.0, 9.0, 4.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-8.890625, -8.6019287109375, -8.313232421875, -8.0245361328125, -7.73583984375, -7.4471435546875, -7.158447265625, -6.8697509765625, -6.5810546875, -6.2923583984375, -6.003662109375, -5.7149658203125, -5.42626953125, -5.1375732421875, -4.848876953125, -4.5601806640625, -4.271484375, -3.9827880859375, -3.694091796875, -3.4053955078125, -3.11669921875, -2.8280029296875, -2.539306640625, -2.2506103515625, -1.9619140625, -1.6732177734375, -1.384521484375, -1.0958251953125, -0.80712890625, -0.5184326171875, -0.229736328125, 0.0589599609375, 0.34765625, 0.6363525390625, 0.925048828125, 1.2137451171875, 1.50244140625, 1.7911376953125, 2.079833984375, 2.3685302734375, 2.6572265625, 2.9459228515625, 3.234619140625, 3.5233154296875, 3.81201171875, 4.1007080078125, 4.389404296875, 4.6781005859375, 4.966796875, 5.2554931640625, 5.544189453125, 5.8328857421875, 6.12158203125, 6.4102783203125, 6.698974609375, 6.9876708984375, 7.2763671875, 7.5650634765625, 7.853759765625, 8.1424560546875, 8.43115234375, 8.7198486328125, 9.008544921875, 9.2972412109375, 9.5859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 12.0, 9.0, 18.0, 14.0, 17.0, 22.0, 39.0, 41.0, 48.0, 61.0, 64.0, 86.0, 264.0, 1801.0, 151.0, 76.0, 52.0, 46.0, 39.0, 43.0, 29.0, 29.0, 16.0, 16.0, 15.0, 7.0, 11.0, 4.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.939208984375, -16.36279296875, -15.786376953125, -15.2099609375, -14.633544921875, -14.05712890625, -13.480712890625, -12.904296875, -12.327880859375, -11.75146484375, -11.175048828125, -10.5986328125, -10.022216796875, -9.44580078125, -8.869384765625, -8.29296875, -7.716552734375, -7.14013671875, -6.563720703125, -5.9873046875, -5.410888671875, -4.83447265625, -4.258056640625, -3.681640625, -3.105224609375, -2.52880859375, -1.952392578125, -1.3759765625, -0.799560546875, -0.22314453125, 0.353271484375, 0.9296875, 1.506103515625, 2.08251953125, 2.658935546875, 3.2353515625, 3.811767578125, 4.38818359375, 4.964599609375, 5.541015625, 6.117431640625, 6.69384765625, 7.270263671875, 7.8466796875, 8.423095703125, 8.99951171875, 9.575927734375, 10.15234375, 10.728759765625, 11.30517578125, 11.881591796875, 12.4580078125, 13.034423828125, 13.61083984375, 14.187255859375, 14.763671875, 15.340087890625, 15.91650390625, 16.492919921875, 17.0693359375, 17.645751953125, 18.22216796875, 18.798583984375, 19.375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 8.0, 9.0, 13.0, 16.0, 23.0, 24.0, 41.0, 48.0, 62.0, 113.0, 241.0, 540.0, 1557.0, 3074440.0, 66520.0, 1073.0, 440.0, 195.0, 96.0, 80.0, 38.0, 29.0, 25.0, 19.0, 12.0, 10.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.15625, -53.4775390625, -51.798828125, -50.1201171875, -48.44140625, -46.7626953125, -45.083984375, -43.4052734375, -41.7265625, -40.0478515625, -38.369140625, -36.6904296875, -35.01171875, -33.3330078125, -31.654296875, -29.9755859375, -28.296875, -26.6181640625, -24.939453125, -23.2607421875, -21.58203125, -19.9033203125, -18.224609375, -16.5458984375, -14.8671875, -13.1884765625, -11.509765625, -9.8310546875, -8.15234375, -6.4736328125, -4.794921875, -3.1162109375, -1.4375, 0.2412109375, 1.919921875, 3.5986328125, 5.27734375, 6.9560546875, 8.634765625, 10.3134765625, 11.9921875, 13.6708984375, 15.349609375, 17.0283203125, 18.70703125, 20.3857421875, 22.064453125, 23.7431640625, 25.421875, 27.1005859375, 28.779296875, 30.4580078125, 32.13671875, 33.8154296875, 35.494140625, 37.1728515625, 38.8515625, 40.5302734375, 42.208984375, 43.8876953125, 45.56640625, 47.2451171875, 48.923828125, 50.6025390625, 52.28125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 84.0, 550.0, 348.0, 28.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-89.81062316894531, -87.4964828491211, -85.18234252929688, -82.86819458007812, -80.5540542602539, -78.23991394042969, -75.92576599121094, -73.61162567138672, -71.2974853515625, -68.98334503173828, -66.66920471191406, -64.35505676269531, -62.040916442871094, -59.726776123046875, -57.41263198852539, -55.098487854003906, -52.78434753417969, -50.47020721435547, -48.156063079833984, -45.8419189453125, -43.52777862548828, -41.21363830566406, -38.89949417114258, -36.585350036621094, -34.271209716796875, -31.957067489624023, -29.642925262451172, -27.32878303527832, -25.01464080810547, -22.700498580932617, -20.386356353759766, -18.072214126586914, -15.758068084716797, -13.443925857543945, -11.129783630371094, -8.815641403198242, -6.501499176025391, -4.187356948852539, -1.8732147216796875, 0.44092750549316406, 2.7550697326660156, 5.069211959838867, 7.383354187011719, 9.69749641418457, 12.011638641357422, 14.325780868530273, 16.639923095703125, 18.954065322875977, 21.268207550048828, 23.58234977722168, 25.89649200439453, 28.210634231567383, 30.524776458740234, 32.83892059326172, 35.15306091308594, 37.467201232910156, 39.78134536743164, 42.095489501953125, 44.409629821777344, 46.72377014160156, 49.03791427612305, 51.35205841064453, 53.66619873046875, 55.98033905029297, 58.29448318481445]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 8.0, 10.0, 6.0, 9.0, 26.0, 16.0, 17.0, 18.0, 24.0, 29.0, 34.0, 27.0, 23.0, 36.0, 35.0, 39.0, 34.0, 52.0, 53.0, 36.0, 51.0, 50.0, 43.0, 36.0, 29.0, 37.0, 26.0, 33.0, 25.0, 19.0, 22.0, 11.0, 13.0, 4.0, 17.0, 7.0, 4.0, 11.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-33.075252532958984, -32.07883834838867, -31.08242416381836, -30.086009979248047, -29.089595794677734, -28.093181610107422, -27.096765518188477, -26.100351333618164, -25.10393714904785, -24.10752296447754, -23.111108779907227, -22.114694595336914, -21.11827850341797, -20.121864318847656, -19.125450134277344, -18.12903594970703, -17.13262176513672, -16.136207580566406, -15.139793395996094, -14.143378257751465, -13.146964073181152, -12.15054988861084, -11.154134750366211, -10.157720565795898, -9.161306381225586, -8.164892196655273, -7.168477535247803, -6.172062873840332, -5.1756486892700195, -4.179234504699707, -3.1828198432922363, -2.1864051818847656, -1.1899909973144531, -0.19357657432556152, 0.8028378486633301, 1.7992522716522217, 2.7956666946411133, 3.792080879211426, 4.7884955406188965, 5.784910202026367, 6.78132438659668, 7.777738571166992, 8.774152755737305, 9.770567893981934, 10.766982078552246, 11.763396263122559, 12.759811401367188, 13.7562255859375, 14.752639770507812, 15.749053955078125, 16.745468139648438, 17.74188232421875, 18.738296508789062, 19.734710693359375, 20.73112678527832, 21.727540969848633, 22.723955154418945, 23.720369338989258, 24.71678352355957, 25.713197708129883, 26.709613800048828, 27.70602798461914, 28.702442169189453, 29.698856353759766, 30.695270538330078]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 3.0, 13.0, 7.0, 7.0, 14.0, 10.0, 9.0, 17.0, 19.0, 19.0, 26.0, 21.0, 22.0, 34.0, 38.0, 49.0, 42.0, 51.0, 37.0, 40.0, 56.0, 48.0, 39.0, 33.0, 37.0, 47.0, 32.0, 29.0, 29.0, 32.0, 22.0, 18.0, 19.0, 18.0, 8.0, 9.0, 11.0, 13.0, 2.0, 4.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.880859375, -5.6796875, -5.478515625, -5.27734375, -5.076171875, -4.875, -4.673828125, -4.47265625, -4.271484375, -4.0703125, -3.869140625, -3.66796875, -3.466796875, -3.265625, -3.064453125, -2.86328125, -2.662109375, -2.4609375, -2.259765625, -2.05859375, -1.857421875, -1.65625, -1.455078125, -1.25390625, -1.052734375, -0.8515625, -0.650390625, -0.44921875, -0.248046875, -0.046875, 0.154296875, 0.35546875, 0.556640625, 0.7578125, 0.958984375, 1.16015625, 1.361328125, 1.5625, 1.763671875, 1.96484375, 2.166015625, 2.3671875, 2.568359375, 2.76953125, 2.970703125, 3.171875, 3.373046875, 3.57421875, 3.775390625, 3.9765625, 4.177734375, 4.37890625, 4.580078125, 4.78125, 4.982421875, 5.18359375, 5.384765625, 5.5859375, 5.787109375, 5.98828125, 6.189453125, 6.390625, 6.591796875, 6.79296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 12.0, 16.0, 21.0, 27.0, 34.0, 35.0, 44.0, 66.0, 54.0, 94.0, 74.0, 122.0, 175.0, 216.0, 319.0, 489.0, 900.0, 2054.0, 14125.0, 2930471.0, 1233033.0, 7681.0, 1772.0, 719.0, 436.0, 288.0, 241.0, 166.0, 119.0, 82.0, 59.0, 57.0, 46.0, 44.0, 36.0, 31.0, 19.0, 20.0, 14.0, 17.0, 12.0, 8.0, 10.0, 7.0, 0.0, 1.0, 4.0, 2.0], "bins": [-44.8125, -43.56396484375, -42.3154296875, -41.06689453125, -39.818359375, -38.56982421875, -37.3212890625, -36.07275390625, -34.82421875, -33.57568359375, -32.3271484375, -31.07861328125, -29.830078125, -28.58154296875, -27.3330078125, -26.08447265625, -24.8359375, -23.58740234375, -22.3388671875, -21.09033203125, -19.841796875, -18.59326171875, -17.3447265625, -16.09619140625, -14.84765625, -13.59912109375, -12.3505859375, -11.10205078125, -9.853515625, -8.60498046875, -7.3564453125, -6.10791015625, -4.859375, -3.61083984375, -2.3623046875, -1.11376953125, 0.134765625, 1.38330078125, 2.6318359375, 3.88037109375, 5.12890625, 6.37744140625, 7.6259765625, 8.87451171875, 10.123046875, 11.37158203125, 12.6201171875, 13.86865234375, 15.1171875, 16.36572265625, 17.6142578125, 18.86279296875, 20.111328125, 21.35986328125, 22.6083984375, 23.85693359375, 25.10546875, 26.35400390625, 27.6025390625, 28.85107421875, 30.099609375, 31.34814453125, 32.5966796875, 33.84521484375, 35.09375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 12.0, 21.0, 23.0, 56.0, 82.0, 186.0, 375.0, 685.0, 951.0, 729.0, 428.0, 237.0, 114.0, 58.0, 45.0, 18.0, 10.0, 8.0, 7.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3515625, -12.8302001953125, -12.308837890625, -11.7874755859375, -11.26611328125, -10.7447509765625, -10.223388671875, -9.7020263671875, -9.1806640625, -8.6593017578125, -8.137939453125, -7.6165771484375, -7.09521484375, -6.5738525390625, -6.052490234375, -5.5311279296875, -5.009765625, -4.4884033203125, -3.967041015625, -3.4456787109375, -2.92431640625, -2.4029541015625, -1.881591796875, -1.3602294921875, -0.8388671875, -0.3175048828125, 0.203857421875, 0.7252197265625, 1.24658203125, 1.7679443359375, 2.289306640625, 2.8106689453125, 3.33203125, 3.8533935546875, 4.374755859375, 4.8961181640625, 5.41748046875, 5.9388427734375, 6.460205078125, 6.9815673828125, 7.5029296875, 8.0242919921875, 8.545654296875, 9.0670166015625, 9.58837890625, 10.1097412109375, 10.631103515625, 11.1524658203125, 11.673828125, 12.1951904296875, 12.716552734375, 13.2379150390625, 13.75927734375, 14.2806396484375, 14.802001953125, 15.3233642578125, 15.8447265625, 16.3660888671875, 16.887451171875, 17.4088134765625, 17.93017578125, 18.4515380859375, 18.972900390625, 19.4942626953125, 20.015625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 17.0, 24.0, 50.0, 120.0, 186.0, 492.0, 1762.0, 10817.0, 349651.0, 3759685.0, 64873.0, 4799.0, 1037.0, 373.0, 138.0, 93.0, 63.0, 25.0, 12.0, 4.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.5625, -20.80078125, -20.0390625, -19.27734375, -18.515625, -17.75390625, -16.9921875, -16.23046875, -15.46875, -14.70703125, -13.9453125, -13.18359375, -12.421875, -11.66015625, -10.8984375, -10.13671875, -9.375, -8.61328125, -7.8515625, -7.08984375, -6.328125, -5.56640625, -4.8046875, -4.04296875, -3.28125, -2.51953125, -1.7578125, -0.99609375, -0.234375, 0.52734375, 1.2890625, 2.05078125, 2.8125, 3.57421875, 4.3359375, 5.09765625, 5.859375, 6.62109375, 7.3828125, 8.14453125, 8.90625, 9.66796875, 10.4296875, 11.19140625, 11.953125, 12.71484375, 13.4765625, 14.23828125, 15.0, 15.76171875, 16.5234375, 17.28515625, 18.046875, 18.80859375, 19.5703125, 20.33203125, 21.09375, 21.85546875, 22.6171875, 23.37890625, 24.140625, 24.90234375, 25.6640625, 26.42578125, 27.1875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 2.0, 9.0, 13.0, 23.0, 32.0, 52.0, 106.0, 143.0, 145.0, 113.0, 135.0, 86.0, 52.0, 34.0, 26.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.99544525146484, -69.30860900878906, -66.62176513671875, -63.93492889404297, -61.24809265136719, -58.561256408691406, -55.87441635131836, -53.18757629394531, -50.50074005126953, -47.81390380859375, -45.1270637512207, -42.440223693847656, -39.753387451171875, -37.066551208496094, -34.37971115112305, -31.692873001098633, -29.00603485107422, -26.319196701049805, -23.63235855102539, -20.945520401000977, -18.258682250976562, -15.571844100952148, -12.885005950927734, -10.19816780090332, -7.511329650878906, -4.824491500854492, -2.137653350830078, 0.5491847991943359, 3.23602294921875, 5.922861099243164, 8.609699249267578, 11.296537399291992, 13.983367919921875, 16.67020606994629, 19.357044219970703, 22.043882369995117, 24.73072052001953, 27.417558670043945, 30.10439682006836, 32.791236877441406, 35.47807312011719, 38.16490936279297, 40.851749420166016, 43.53858947753906, 46.225425720214844, 48.912261962890625, 51.59910202026367, 54.28594207763672, 56.9727783203125, 59.65961456298828, 62.34645462036133, 65.03329467773438, 67.72013092041016, 70.40696716308594, 73.09381103515625, 75.78064727783203, 78.46748352050781, 81.1543197631836, 83.84115600585938, 86.52799987792969, 89.21483612060547, 91.90167236328125, 94.58851623535156, 97.27535247802734, 99.96218872070312]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 8.0, 9.0, 11.0, 16.0, 17.0, 20.0, 16.0, 21.0, 25.0, 32.0, 27.0, 41.0, 31.0, 44.0, 39.0, 40.0, 38.0, 39.0, 48.0, 41.0, 36.0, 34.0, 40.0, 33.0, 34.0, 35.0, 25.0, 28.0, 24.0, 30.0, 14.0, 17.0, 20.0, 10.0, 6.0, 6.0, 10.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.24128723144531, -31.13075065612793, -30.020212173461914, -28.90967559814453, -27.799137115478516, -26.688600540161133, -25.57806396484375, -24.467525482177734, -23.35698890686035, -22.24645233154297, -21.135913848876953, -20.02537727355957, -18.914840698242188, -17.804302215576172, -16.69376564025879, -15.58322811126709, -14.47269058227539, -13.362153053283691, -12.251615524291992, -11.14107894897461, -10.03054141998291, -8.920003890991211, -7.80946683883667, -6.698929786682129, -5.58839225769043, -4.4778547286987305, -3.3673176765441895, -2.2567803859710693, -1.1462430953979492, -0.03570556640625, 1.074831485748291, 2.185368537902832, 3.2959060668945312, 4.4064435958862305, 5.5169806480407715, 6.6275177001953125, 7.738055229187012, 8.848592758178711, 9.959129333496094, 11.069666862487793, 12.180204391479492, 13.290741920471191, 14.40127944946289, 15.511816024780273, 16.622352600097656, 17.732891082763672, 18.843427658081055, 19.953964233398438, 21.064502716064453, 22.175039291381836, 23.28557777404785, 24.396114349365234, 25.50665283203125, 26.617189407348633, 27.727725982666016, 28.83826446533203, 29.948801040649414, 31.059337615966797, 32.16987609863281, 33.28041458129883, 34.39094924926758, 35.501487731933594, 36.61202621459961, 37.72256088256836, 38.833099365234375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 11.0, 22.0, 16.0, 23.0, 30.0, 23.0, 24.0, 39.0, 35.0, 38.0, 36.0, 53.0, 39.0, 50.0, 39.0, 41.0, 44.0, 40.0, 40.0, 28.0, 43.0, 30.0, 34.0, 29.0, 23.0, 16.0, 28.0, 12.0, 15.0, 11.0, 8.0, 10.0, 10.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.60986328125, -45.8759765625, -44.14208984375, -42.408203125, -40.67431640625, -38.9404296875, -37.20654296875, -35.47265625, -33.73876953125, -32.0048828125, -30.27099609375, -28.537109375, -26.80322265625, -25.0693359375, -23.33544921875, -21.6015625, -19.86767578125, -18.1337890625, -16.39990234375, -14.666015625, -12.93212890625, -11.1982421875, -9.46435546875, -7.73046875, -5.99658203125, -4.2626953125, -2.52880859375, -0.794921875, 0.93896484375, 2.6728515625, 4.40673828125, 6.140625, 7.87451171875, 9.6083984375, 11.34228515625, 13.076171875, 14.81005859375, 16.5439453125, 18.27783203125, 20.01171875, 21.74560546875, 23.4794921875, 25.21337890625, 26.947265625, 28.68115234375, 30.4150390625, 32.14892578125, 33.8828125, 35.61669921875, 37.3505859375, 39.08447265625, 40.818359375, 42.55224609375, 44.2861328125, 46.02001953125, 47.75390625, 49.48779296875, 51.2216796875, 52.95556640625, 54.689453125, 56.42333984375, 58.1572265625, 59.89111328125, 61.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 11.0, 16.0, 21.0, 21.0, 24.0, 46.0, 80.0, 86.0, 150.0, 246.0, 498.0, 788.0, 1433.0, 2427.0, 4171.0, 7434.0, 13343.0, 25150.0, 48245.0, 95708.0, 194768.0, 303926.0, 172069.0, 84490.0, 42984.0, 22600.0, 12007.0, 6716.0, 3771.0, 2179.0, 1328.0, 691.0, 438.0, 260.0, 142.0, 96.0, 75.0, 38.0, 27.0, 11.0, 13.0, 9.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -10.120361328125, -9.76416015625, -9.407958984375, -9.0517578125, -8.695556640625, -8.33935546875, -7.983154296875, -7.626953125, -7.270751953125, -6.91455078125, -6.558349609375, -6.2021484375, -5.845947265625, -5.48974609375, -5.133544921875, -4.77734375, -4.421142578125, -4.06494140625, -3.708740234375, -3.3525390625, -2.996337890625, -2.64013671875, -2.283935546875, -1.927734375, -1.571533203125, -1.21533203125, -0.859130859375, -0.5029296875, -0.146728515625, 0.20947265625, 0.565673828125, 0.921875, 1.278076171875, 1.63427734375, 1.990478515625, 2.3466796875, 2.702880859375, 3.05908203125, 3.415283203125, 3.771484375, 4.127685546875, 4.48388671875, 4.840087890625, 5.1962890625, 5.552490234375, 5.90869140625, 6.264892578125, 6.62109375, 6.977294921875, 7.33349609375, 7.689697265625, 8.0458984375, 8.402099609375, 8.75830078125, 9.114501953125, 9.470703125, 9.826904296875, 10.18310546875, 10.539306640625, 10.8955078125, 11.251708984375, 11.60791015625, 11.964111328125, 12.3203125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 14.0, 16.0, 18.0, 12.0, 21.0, 26.0, 20.0, 31.0, 24.0, 27.0, 37.0, 40.0, 31.0, 34.0, 41.0, 39.0, 1070.0, 31.0, 46.0, 42.0, 40.0, 32.0, 32.0, 33.0, 28.0, 31.0, 21.0, 31.0, 20.0, 15.0, 17.0, 11.0, 10.0, 12.0, 7.0, 11.0, 7.0, 6.0, 7.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.59375, -33.569580078125, -32.54541015625, -31.521240234375, -30.4970703125, -29.472900390625, -28.44873046875, -27.424560546875, -26.400390625, -25.376220703125, -24.35205078125, -23.327880859375, -22.3037109375, -21.279541015625, -20.25537109375, -19.231201171875, -18.20703125, -17.182861328125, -16.15869140625, -15.134521484375, -14.1103515625, -13.086181640625, -12.06201171875, -11.037841796875, -10.013671875, -8.989501953125, -7.96533203125, -6.941162109375, -5.9169921875, -4.892822265625, -3.86865234375, -2.844482421875, -1.8203125, -0.796142578125, 0.22802734375, 1.252197265625, 2.2763671875, 3.300537109375, 4.32470703125, 5.348876953125, 6.373046875, 7.397216796875, 8.42138671875, 9.445556640625, 10.4697265625, 11.493896484375, 12.51806640625, 13.542236328125, 14.56640625, 15.590576171875, 16.61474609375, 17.638916015625, 18.6630859375, 19.687255859375, 20.71142578125, 21.735595703125, 22.759765625, 23.783935546875, 24.80810546875, 25.832275390625, 26.8564453125, 27.880615234375, 28.90478515625, 29.928955078125, 30.953125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 6.0, 13.0, 19.0, 28.0, 50.0, 69.0, 116.0, 148.0, 224.0, 368.0, 489.0, 856.0, 1244.0, 1912.0, 2789.0, 4096.0, 6190.0, 9393.0, 14672.0, 22080.0, 33854.0, 52633.0, 82189.0, 134749.0, 1268514.0, 171920.0, 103131.0, 64621.0, 41634.0, 26906.0, 17779.0, 11482.0, 7640.0, 5130.0, 3435.0, 2298.0, 1526.0, 1003.0, 657.0, 422.0, 300.0, 201.0, 112.0, 66.0, 69.0, 35.0, 20.0, 18.0, 8.0, 7.0, 7.0, 4.0, 0.0, 2.0, 1.0], "bins": [-7.8984375, -7.664306640625, -7.43017578125, -7.196044921875, -6.9619140625, -6.727783203125, -6.49365234375, -6.259521484375, -6.025390625, -5.791259765625, -5.55712890625, -5.322998046875, -5.0888671875, -4.854736328125, -4.62060546875, -4.386474609375, -4.15234375, -3.918212890625, -3.68408203125, -3.449951171875, -3.2158203125, -2.981689453125, -2.74755859375, -2.513427734375, -2.279296875, -2.045166015625, -1.81103515625, -1.576904296875, -1.3427734375, -1.108642578125, -0.87451171875, -0.640380859375, -0.40625, -0.172119140625, 0.06201171875, 0.296142578125, 0.5302734375, 0.764404296875, 0.99853515625, 1.232666015625, 1.466796875, 1.700927734375, 1.93505859375, 2.169189453125, 2.4033203125, 2.637451171875, 2.87158203125, 3.105712890625, 3.33984375, 3.573974609375, 3.80810546875, 4.042236328125, 4.2763671875, 4.510498046875, 4.74462890625, 4.978759765625, 5.212890625, 5.447021484375, 5.68115234375, 5.915283203125, 6.1494140625, 6.383544921875, 6.61767578125, 6.851806640625, 7.0859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 7.0, 9.0, 18.0, 15.0, 12.0, 19.0, 26.0, 31.0, 29.0, 38.0, 36.0, 36.0, 44.0, 56.0, 55.0, 72.0, 69.0, 56.0, 49.0, 38.0, 51.0, 34.0, 31.0, 30.0, 23.0, 18.0, 19.0, 22.0, 9.0, 10.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007305145263671875, -0.007081449031829834, -0.006857752799987793, -0.006634056568145752, -0.006410360336303711, -0.00618666410446167, -0.005962967872619629, -0.005739271640777588, -0.005515575408935547, -0.005291879177093506, -0.005068182945251465, -0.004844486713409424, -0.004620790481567383, -0.004397094249725342, -0.004173398017883301, -0.00394970178604126, -0.0037260055541992188, -0.0035023093223571777, -0.0032786130905151367, -0.0030549168586730957, -0.0028312206268310547, -0.0026075243949890137, -0.0023838281631469727, -0.0021601319313049316, -0.0019364356994628906, -0.0017127394676208496, -0.0014890432357788086, -0.0012653470039367676, -0.0010416507720947266, -0.0008179545402526855, -0.0005942583084106445, -0.0003705620765686035, -0.0001468658447265625, 7.683038711547852e-05, 0.00030052661895751953, 0.0005242228507995605, 0.0007479190826416016, 0.0009716153144836426, 0.0011953115463256836, 0.0014190077781677246, 0.0016427040100097656, 0.0018664002418518066, 0.0020900964736938477, 0.0023137927055358887, 0.0025374889373779297, 0.0027611851692199707, 0.0029848814010620117, 0.0032085776329040527, 0.0034322738647460938, 0.0036559700965881348, 0.0038796663284301758, 0.004103362560272217, 0.004327058792114258, 0.004550755023956299, 0.00477445125579834, 0.004998147487640381, 0.005221843719482422, 0.005445539951324463, 0.005669236183166504, 0.005892932415008545, 0.006116628646850586, 0.006340324878692627, 0.006564021110534668, 0.006787717342376709, 0.00701141357421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 16.0, 15.0, 13.0, 24.0, 26.0, 40.0, 66.0, 77.0, 108.0, 175.0, 252.0, 385.0, 634.0, 1109.0, 2881.0, 10136.0, 50185.0, 340683.0, 533954.0, 85041.0, 15307.0, 3879.0, 1479.0, 696.0, 402.0, 262.0, 203.0, 141.0, 100.0, 71.0, 55.0, 29.0, 23.0, 19.0, 20.0, 8.0, 6.0, 8.0, 7.0, 0.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.056182861328125, -0.05448770523071289, -0.05279254913330078, -0.05109739303588867, -0.04940223693847656, -0.04770708084106445, -0.046011924743652344, -0.044316768646240234, -0.042621612548828125, -0.040926456451416016, -0.039231300354003906, -0.0375361442565918, -0.03584098815917969, -0.03414583206176758, -0.03245067596435547, -0.03075551986694336, -0.02906036376953125, -0.02736520767211914, -0.02567005157470703, -0.023974895477294922, -0.022279739379882812, -0.020584583282470703, -0.018889427185058594, -0.017194271087646484, -0.015499114990234375, -0.013803958892822266, -0.012108802795410156, -0.010413646697998047, -0.008718490600585938, -0.007023334503173828, -0.005328178405761719, -0.0036330223083496094, -0.0019378662109375, -0.00024271011352539062, 0.0014524459838867188, 0.003147602081298828, 0.0048427581787109375, 0.006537914276123047, 0.008233070373535156, 0.009928226470947266, 0.011623382568359375, 0.013318538665771484, 0.015013694763183594, 0.016708850860595703, 0.018404006958007812, 0.020099163055419922, 0.02179431915283203, 0.02348947525024414, 0.02518463134765625, 0.02687978744506836, 0.02857494354248047, 0.030270099639892578, 0.03196525573730469, 0.0336604118347168, 0.035355567932128906, 0.037050724029541016, 0.038745880126953125, 0.040441036224365234, 0.042136192321777344, 0.04383134841918945, 0.04552650451660156, 0.04722166061401367, 0.04891681671142578, 0.05061197280883789, 0.05230712890625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 14.0, 16.0, 25.0, 51.0, 95.0, 139.0, 170.0, 173.0, 139.0, 74.0, 56.0, 28.0, 13.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.014539824798703194, -0.014208639971911907, -0.013877456076443195, -0.013546271249651909, -0.013215087354183197, -0.01288390252739191, -0.012552717700600624, -0.012221533805131912, -0.0118903499096632, -0.011559165082871914, -0.011227981187403202, -0.010896796360611916, -0.010565612465143204, -0.010234427638351917, -0.00990324281156063, -0.009572058916091919, -0.009240874089300632, -0.008909689262509346, -0.008578505367040634, -0.008247320540249348, -0.007916136644780636, -0.007584951817989349, -0.00725376745685935, -0.006922583095729351, -0.006591398734599352, -0.006260214373469353, -0.0059290300123393536, -0.005597845651209354, -0.005266660824418068, -0.004935476928949356, -0.00460429210215807, -0.0042731077410280704, -0.003941923845559359, -0.0036107394844293594, -0.0032795551232993603, -0.0029483705293387175, -0.0026171861682087183, -0.002286001807078719, -0.0019548172131180763, -0.0016236328519880772, -0.001292448490858078, -0.0009612640715204179, -0.0006300796521827579, -0.00029889517463743687, 3.2289186492562294e-05, 0.00036347354762256145, 0.0006946581415832043, 0.0010258425027132034, 0.0013570268638432026, 0.0016882112249732018, 0.002019395586103201, 0.0023505801800638437, 0.002681764541193843, 0.003012948902323842, 0.003344133496284485, 0.003675317857414484, 0.004006502218544483, 0.004337686579674482, 0.0046688709408044815, 0.005000055767595768, 0.00533123966306448, 0.005662424489855766, 0.0059936088509857655, 0.006324793212115765, 0.006655977573245764]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 4.0, 5.0, 10.0, 9.0, 13.0, 11.0, 20.0, 20.0, 22.0, 26.0, 29.0, 19.0, 30.0, 25.0, 40.0, 23.0, 33.0, 31.0, 40.0, 53.0, 41.0, 40.0, 46.0, 28.0, 37.0, 28.0, 31.0, 32.0, 31.0, 29.0, 20.0, 28.0, 19.0, 20.0, 14.0, 17.0, 10.0, 17.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.003273904323577881, -0.003166566602885723, -0.0030592288821935654, -0.0029518911615014076, -0.00284455344080925, -0.002737215720117092, -0.0026298779994249344, -0.0025225402787327766, -0.002415202558040619, -0.002307864837348461, -0.0022005271166563034, -0.0020931893959641457, -0.001985851675271988, -0.0018785139545798302, -0.0017711762338876724, -0.0016638385131955147, -0.001556500792503357, -0.0014491630718111992, -0.0013418253511190414, -0.0012344876304268837, -0.001127149909734726, -0.0010198121890425682, -0.0009124744683504105, -0.0008051367476582527, -0.000697799026966095, -0.0005904613062739372, -0.0004831235855817795, -0.00037578586488962173, -0.000268448144197464, -0.00016111042350530624, -5.37727028131485e-05, 5.356501787900925e-05, 0.000160902738571167, 0.00026824045926332474, 0.0003755781799554825, 0.00048291590064764023, 0.000590253621339798, 0.0006975913420319557, 0.0008049290627241135, 0.0009122667834162712, 0.001019604504108429, 0.0011269422248005867, 0.0012342799454927444, 0.0013416176661849022, 0.00144895538687706, 0.0015562931075692177, 0.0016636308282613754, 0.0017709685489535332, 0.001878306269645691, 0.0019856439903378487, 0.0020929817110300064, 0.002200319431722164, 0.002307657152414322, 0.0024149948731064796, 0.0025223325937986374, 0.002629670314490795, 0.002737008035182953, 0.0028443457558751106, 0.0029516834765672684, 0.003059021197259426, 0.003166358917951584, 0.0032736966386437416, 0.0033810343593358994, 0.003488372080028057, 0.003595709800720215]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 11.0, 22.0, 16.0, 23.0, 30.0, 24.0, 23.0, 39.0, 34.0, 39.0, 36.0, 53.0, 40.0, 49.0, 39.0, 44.0, 41.0, 40.0, 40.0, 28.0, 43.0, 30.0, 34.0, 29.0, 23.0, 18.0, 26.0, 12.0, 15.0, 11.0, 8.0, 10.0, 10.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.609375, -45.875, -44.140625, -42.40625, -40.671875, -38.9375, -37.203125, -35.46875, -33.734375, -32.0, -30.265625, -28.53125, -26.796875, -25.0625, -23.328125, -21.59375, -19.859375, -18.125, -16.390625, -14.65625, -12.921875, -11.1875, -9.453125, -7.71875, -5.984375, -4.25, -2.515625, -0.78125, 0.953125, 2.6875, 4.421875, 6.15625, 7.890625, 9.625, 11.359375, 13.09375, 14.828125, 16.5625, 18.296875, 20.03125, 21.765625, 23.5, 25.234375, 26.96875, 28.703125, 30.4375, 32.171875, 33.90625, 35.640625, 37.375, 39.109375, 40.84375, 42.578125, 44.3125, 46.046875, 47.78125, 49.515625, 51.25, 52.984375, 54.71875, 56.453125, 58.1875, 59.921875, 61.65625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 11.0, 21.0, 22.0, 18.0, 33.0, 48.0, 76.0, 107.0, 167.0, 266.0, 498.0, 890.0, 1829.0, 3895.0, 9665.0, 35704.0, 241512.0, 621348.0, 100866.0, 19355.0, 6368.0, 2755.0, 1337.0, 704.0, 411.0, 196.0, 132.0, 88.0, 52.0, 45.0, 34.0, 22.0, 22.0, 18.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8828125, -13.3338623046875, -12.784912109375, -12.2359619140625, -11.68701171875, -11.1380615234375, -10.589111328125, -10.0401611328125, -9.4912109375, -8.9422607421875, -8.393310546875, -7.8443603515625, -7.29541015625, -6.7464599609375, -6.197509765625, -5.6485595703125, -5.099609375, -4.5506591796875, -4.001708984375, -3.4527587890625, -2.90380859375, -2.3548583984375, -1.805908203125, -1.2569580078125, -0.7080078125, -0.1590576171875, 0.389892578125, 0.9388427734375, 1.48779296875, 2.0367431640625, 2.585693359375, 3.1346435546875, 3.68359375, 4.2325439453125, 4.781494140625, 5.3304443359375, 5.87939453125, 6.4283447265625, 6.977294921875, 7.5262451171875, 8.0751953125, 8.6241455078125, 9.173095703125, 9.7220458984375, 10.27099609375, 10.8199462890625, 11.368896484375, 11.9178466796875, 12.466796875, 13.0157470703125, 13.564697265625, 14.1136474609375, 14.66259765625, 15.2115478515625, 15.760498046875, 16.3094482421875, 16.8583984375, 17.4073486328125, 17.956298828125, 18.5052490234375, 19.05419921875, 19.6031494140625, 20.152099609375, 20.7010498046875, 21.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 11.0, 14.0, 28.0, 28.0, 36.0, 48.0, 70.0, 103.0, 101.0, 2147.0, 107.0, 80.0, 84.0, 54.0, 41.0, 32.0, 24.0, 11.0, 11.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-162.5, -157.533203125, -152.56640625, -147.599609375, -142.6328125, -137.666015625, -132.69921875, -127.732421875, -122.765625, -117.798828125, -112.83203125, -107.865234375, -102.8984375, -97.931640625, -92.96484375, -87.998046875, -83.03125, -78.064453125, -73.09765625, -68.130859375, -63.1640625, -58.197265625, -53.23046875, -48.263671875, -43.296875, -38.330078125, -33.36328125, -28.396484375, -23.4296875, -18.462890625, -13.49609375, -8.529296875, -3.5625, 1.404296875, 6.37109375, 11.337890625, 16.3046875, 21.271484375, 26.23828125, 31.205078125, 36.171875, 41.138671875, 46.10546875, 51.072265625, 56.0390625, 61.005859375, 65.97265625, 70.939453125, 75.90625, 80.873046875, 85.83984375, 90.806640625, 95.7734375, 100.740234375, 105.70703125, 110.673828125, 115.640625, 120.607421875, 125.57421875, 130.541015625, 135.5078125, 140.474609375, 145.44140625, 150.408203125, 155.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 7.0, 12.0, 23.0, 33.0, 53.0, 72.0, 104.0, 248.0, 590.0, 1407.0, 5013.0, 162847.0, 2955788.0, 15637.0, 2225.0, 850.0, 357.0, 156.0, 91.0, 60.0, 37.0, 32.0, 18.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.84375, -39.6142578125, -38.384765625, -37.1552734375, -35.92578125, -34.6962890625, -33.466796875, -32.2373046875, -31.0078125, -29.7783203125, -28.548828125, -27.3193359375, -26.08984375, -24.8603515625, -23.630859375, -22.4013671875, -21.171875, -19.9423828125, -18.712890625, -17.4833984375, -16.25390625, -15.0244140625, -13.794921875, -12.5654296875, -11.3359375, -10.1064453125, -8.876953125, -7.6474609375, -6.41796875, -5.1884765625, -3.958984375, -2.7294921875, -1.5, -0.2705078125, 0.958984375, 2.1884765625, 3.41796875, 4.6474609375, 5.876953125, 7.1064453125, 8.3359375, 9.5654296875, 10.794921875, 12.0244140625, 13.25390625, 14.4833984375, 15.712890625, 16.9423828125, 18.171875, 19.4013671875, 20.630859375, 21.8603515625, 23.08984375, 24.3193359375, 25.548828125, 26.7783203125, 28.0078125, 29.2373046875, 30.466796875, 31.6962890625, 32.92578125, 34.1552734375, 35.384765625, 36.6142578125, 37.84375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 16.0, 37.0, 70.0, 194.0, 354.0, 196.0, 67.0, 32.0, 10.0, 12.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.33833312988281, -79.69783020019531, -72.05732727050781, -64.41683197021484, -56.776329040527344, -49.135826110839844, -41.49532699584961, -33.854827880859375, -26.214324951171875, -18.573823928833008, -10.93332290649414, -3.2928218841552734, 4.347679138183594, 11.988182067871094, 19.628681182861328, 27.269180297851562, 34.90968322753906, 42.55018615722656, 50.1906852722168, 57.83118438720703, 65.47168731689453, 73.11219024658203, 80.752685546875, 88.3931884765625, 96.03369140625, 103.6741943359375, 111.314697265625, 118.95519256591797, 126.59569549560547, 134.2362060546875, 141.87669372558594, 149.51719665527344, 157.15768432617188, 164.79818725585938, 172.43869018554688, 180.07919311523438, 187.71969604492188, 195.36019897460938, 203.0006866455078, 210.6411895751953, 218.2816925048828, 225.9221954345703, 233.5626983642578, 241.2032012939453, 248.84368896484375, 256.48419189453125, 264.12469482421875, 271.76519775390625, 279.40570068359375, 287.04620361328125, 294.68670654296875, 302.32720947265625, 309.96771240234375, 317.60821533203125, 325.24871826171875, 332.88922119140625, 340.52972412109375, 348.17022705078125, 355.81072998046875, 363.45123291015625, 371.09173583984375, 378.73223876953125, 386.37274169921875, 394.01324462890625, 401.6537170410156]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 11.0, 8.0, 5.0, 7.0, 14.0, 16.0, 17.0, 17.0, 18.0, 22.0, 17.0, 37.0, 40.0, 39.0, 52.0, 50.0, 40.0, 52.0, 54.0, 49.0, 33.0, 37.0, 47.0, 52.0, 34.0, 28.0, 32.0, 27.0, 20.0, 20.0, 17.0, 14.0, 10.0, 7.0, 9.0, 11.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-96.98023986816406, -93.855224609375, -90.73020935058594, -87.60519409179688, -84.48017120361328, -81.35515594482422, -78.23014068603516, -75.1051254272461, -71.98011016845703, -68.85509490966797, -65.7300796508789, -62.60506057739258, -59.480045318603516, -56.35502624511719, -53.230010986328125, -50.10499572753906, -46.979976654052734, -43.85496139526367, -40.729942321777344, -37.60492706298828, -34.47991180419922, -31.354894638061523, -28.229877471923828, -25.104862213134766, -21.97984504699707, -18.854827880859375, -15.729812622070312, -12.604795455932617, -9.479779243469238, -6.354763031005859, -3.229745864868164, -0.10473060607910156, 3.0202865600585938, 6.145302772521973, 9.270318984985352, 12.395336151123047, 15.520352363586426, 18.645368576049805, 21.7703857421875, 24.895401000976562, 28.020418167114258, 31.145435333251953, 34.270450592041016, 37.395469665527344, 40.520484924316406, 43.64550018310547, 46.77051544189453, 49.895530700683594, 53.02054977416992, 56.145565032958984, 59.27058410644531, 62.395599365234375, 65.52061462402344, 68.6456298828125, 71.77064514160156, 74.89566040039062, 78.02068328857422, 81.14569854736328, 84.27071380615234, 87.39573669433594, 90.520751953125, 93.64576721191406, 96.77078247070312, 99.89579772949219, 103.02081298828125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 8.0, 9.0, 18.0, 30.0, 50.0, 57.0, 97.0, 160.0, 231.0, 346.0, 496.0, 721.0, 1221.0, 1041009.0, 1458.0, 876.0, 593.0, 392.0, 259.0, 180.0, 136.0, 76.0, 48.0, 33.0, 16.0, 14.0, 9.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.42410659790039, -38.71892547607422, -37.01374816894531, -35.30856704711914, -33.603389739990234, -31.898208618164062, -30.193029403686523, -28.487850189208984, -26.782670974731445, -25.077491760253906, -23.372312545776367, -21.667133331298828, -19.961952209472656, -18.25677490234375, -16.551593780517578, -14.846414566040039, -13.1412353515625, -11.436056137084961, -9.730876922607422, -8.025696754455566, -6.320517539978027, -4.615338325500488, -2.910158157348633, -1.2049789428710938, 0.5002002716064453, 2.2053797245025635, 3.9105591773986816, 5.615738868713379, 7.320918083190918, 9.026097297668457, 10.731277465820312, 12.436456680297852, 14.141632080078125, 15.846811294555664, 17.551990509033203, 19.257171630859375, 20.96234893798828, 22.667530059814453, 24.372709274291992, 26.07788848876953, 27.78306770324707, 29.48824691772461, 31.19342613220215, 32.89860534667969, 34.60378646850586, 36.308963775634766, 38.01414489746094, 39.719322204589844, 41.424503326416016, 43.12968444824219, 44.834861755371094, 46.540042877197266, 48.24522018432617, 49.950401306152344, 51.65557861328125, 53.36075973510742, 55.065940856933594, 56.771121978759766, 58.47629928588867, 60.181480407714844, 61.88665771484375, 63.59183883666992, 65.2970199584961, 67.002197265625, 68.7073745727539]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 13.0, 9.0, 12.0, 7.0, 9.0, 13.0, 29.0, 54.0, 425.0, 51462200.0, 191.0, 64.0, 27.0, 19.0, 7.0, 4.0, 4.0, 3.0, 4.0, 6.0, 11.0, 3.0, 3.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4720.0, -4518.69091796875, -4317.3818359375, -4116.07275390625, -3914.763671875, -3713.45458984375, -3512.1455078125, -3310.83642578125, -3109.52734375, -2908.21826171875, -2706.9091796875, -2505.60009765625, -2304.291015625, -2102.98193359375, -1901.6729736328125, -1700.3638916015625, -1499.054931640625, -1297.745849609375, -1096.436767578125, -895.1277465820312, -693.8186645507812, -492.50958251953125, -291.2005615234375, -89.8914794921875, 111.4176025390625, 312.7266845703125, 514.0357666015625, 715.3447875976562, 916.6538696289062, 1117.962890625, 1319.27197265625, 1520.5810546875, 1721.89013671875, 1923.19921875, 2124.50830078125, 2325.8173828125, 2527.12646484375, 2728.435546875, 2929.74462890625, 3131.0537109375, 3332.36279296875, 3533.671875, 3734.98095703125, 3936.2900390625, 4137.59912109375, 4338.908203125, 4540.21728515625, 4741.5263671875, 4942.8349609375, 5144.14404296875, 5345.453125, 5546.76220703125, 5748.0712890625, 5949.38037109375, 6150.689453125, 6351.99853515625, 6553.3076171875, 6754.61669921875, 6955.92578125, 7157.23486328125, 7358.5439453125, 7559.85302734375, 7761.162109375, 7962.47119140625, 8163.7802734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 9.0, 12.0, 6.0, 13.0, 20.0, 21.0, 34.0, 51.0, 94.0, 121.0, 172.0, 271.0, 365.0, 599.0, 845.0, 1368.0, 2096.0, 3248.0, 5217.0, 8273.0, 13101.0, 21116.0, 34397.0, 57158.0, 98917.0, 175744.0, 340485.0, 1365169.0, 3323656.0, 378720.0, 193464.0, 106601.0, 62497.0, 37086.0, 22284.0, 13949.0, 8834.0, 5599.0, 3397.0, 2212.0, 1386.0, 915.0, 616.0, 424.0, 281.0, 202.0, 121.0, 72.0, 74.0, 55.0, 27.0, 14.0, 14.0, 12.0, 7.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.06640625, -4.9132080078125, -4.760009765625, -4.6068115234375, -4.45361328125, -4.3004150390625, -4.147216796875, -3.9940185546875, -3.8408203125, -3.6876220703125, -3.534423828125, -3.3812255859375, -3.22802734375, -3.0748291015625, -2.921630859375, -2.7684326171875, -2.615234375, -2.4620361328125, -2.308837890625, -2.1556396484375, -2.00244140625, -1.8492431640625, -1.696044921875, -1.5428466796875, -1.3896484375, -1.2364501953125, -1.083251953125, -0.9300537109375, -0.77685546875, -0.6236572265625, -0.470458984375, -0.3172607421875, -0.1640625, -0.0108642578125, 0.142333984375, 0.2955322265625, 0.44873046875, 0.6019287109375, 0.755126953125, 0.9083251953125, 1.0615234375, 1.2147216796875, 1.367919921875, 1.5211181640625, 1.67431640625, 1.8275146484375, 1.980712890625, 2.1339111328125, 2.287109375, 2.4403076171875, 2.593505859375, 2.7467041015625, 2.89990234375, 3.0531005859375, 3.206298828125, 3.3594970703125, 3.5126953125, 3.6658935546875, 3.819091796875, 3.9722900390625, 4.12548828125, 4.2786865234375, 4.431884765625, 4.5850830078125, 4.73828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 2.0, 4.0, 10.0, 9.0, 11.0, 12.0, 16.0, 9.0, 20.0, 17.0, 27.0, 23.0, 29.0, 28.0, 31.0, 44.0, 34.0, 39.0, 50.0, 117.0, 355.0, 600.0, 101.0, 55.0, 40.0, 30.0, 34.0, 29.0, 37.0, 27.0, 27.0, 22.0, 18.0, 20.0, 17.0, 9.0, 12.0, 11.0, 8.0, 10.0, 6.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.5703125, -11.1998291015625, -10.829345703125, -10.4588623046875, -10.08837890625, -9.7178955078125, -9.347412109375, -8.9769287109375, -8.6064453125, -8.2359619140625, -7.865478515625, -7.4949951171875, -7.12451171875, -6.7540283203125, -6.383544921875, -6.0130615234375, -5.642578125, -5.2720947265625, -4.901611328125, -4.5311279296875, -4.16064453125, -3.7901611328125, -3.419677734375, -3.0491943359375, -2.6787109375, -2.3082275390625, -1.937744140625, -1.5672607421875, -1.19677734375, -0.8262939453125, -0.455810546875, -0.0853271484375, 0.28515625, 0.6556396484375, 1.026123046875, 1.3966064453125, 1.76708984375, 2.1375732421875, 2.508056640625, 2.8785400390625, 3.2490234375, 3.6195068359375, 3.989990234375, 4.3604736328125, 4.73095703125, 5.1014404296875, 5.471923828125, 5.8424072265625, 6.212890625, 6.5833740234375, 6.953857421875, 7.3243408203125, 7.69482421875, 8.0653076171875, 8.435791015625, 8.8062744140625, 9.1767578125, 9.5472412109375, 9.917724609375, 10.2882080078125, 10.65869140625, 11.0291748046875, 11.399658203125, 11.7701416015625, 12.140625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 7.0, 6.0, 11.0, 13.0, 22.0, 21.0, 55.0, 53.0, 120.0, 159.0, 326.0, 477.0, 773.0, 1331.0, 2328.0, 4158.0, 7435.0, 13803.0, 25708.0, 48981.0, 97003.0, 197367.0, 487541.0, 4177988.0, 730017.0, 250647.0, 118100.0, 58908.0, 30915.0, 16659.0, 8923.0, 4864.0, 2681.0, 1609.0, 913.0, 600.0, 342.0, 227.0, 132.0, 82.0, 40.0, 18.0, 19.0, 25.0, 16.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0], "bins": [-7.53515625, -7.31121826171875, -7.0872802734375, -6.86334228515625, -6.639404296875, -6.41546630859375, -6.1915283203125, -5.96759033203125, -5.74365234375, -5.51971435546875, -5.2957763671875, -5.07183837890625, -4.847900390625, -4.62396240234375, -4.4000244140625, -4.17608642578125, -3.9521484375, -3.72821044921875, -3.5042724609375, -3.28033447265625, -3.056396484375, -2.83245849609375, -2.6085205078125, -2.38458251953125, -2.16064453125, -1.93670654296875, -1.7127685546875, -1.48883056640625, -1.264892578125, -1.04095458984375, -0.8170166015625, -0.59307861328125, -0.369140625, -0.14520263671875, 0.0787353515625, 0.30267333984375, 0.526611328125, 0.75054931640625, 0.9744873046875, 1.19842529296875, 1.42236328125, 1.64630126953125, 1.8702392578125, 2.09417724609375, 2.318115234375, 2.54205322265625, 2.7659912109375, 2.98992919921875, 3.2138671875, 3.43780517578125, 3.6617431640625, 3.88568115234375, 4.109619140625, 4.33355712890625, 4.5574951171875, 4.78143310546875, 5.00537109375, 5.22930908203125, 5.4532470703125, 5.67718505859375, 5.901123046875, 6.12506103515625, 6.3489990234375, 6.57293701171875, 6.796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 12.0, 10.0, 12.0, 10.0, 19.0, 21.0, 24.0, 26.0, 26.0, 29.0, 44.0, 36.0, 42.0, 62.0, 67.0, 215.0, 624.0, 220.0, 81.0, 65.0, 46.0, 43.0, 28.0, 36.0, 32.0, 27.0, 29.0, 24.0, 19.0, 20.0, 14.0, 17.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.5546875, -9.2708740234375, -8.987060546875, -8.7032470703125, -8.41943359375, -8.1356201171875, -7.851806640625, -7.5679931640625, -7.2841796875, -7.0003662109375, -6.716552734375, -6.4327392578125, -6.14892578125, -5.8651123046875, -5.581298828125, -5.2974853515625, -5.013671875, -4.7298583984375, -4.446044921875, -4.1622314453125, -3.87841796875, -3.5946044921875, -3.310791015625, -3.0269775390625, -2.7431640625, -2.4593505859375, -2.175537109375, -1.8917236328125, -1.60791015625, -1.3240966796875, -1.040283203125, -0.7564697265625, -0.47265625, -0.1888427734375, 0.094970703125, 0.3787841796875, 0.66259765625, 0.9464111328125, 1.230224609375, 1.5140380859375, 1.7978515625, 2.0816650390625, 2.365478515625, 2.6492919921875, 2.93310546875, 3.2169189453125, 3.500732421875, 3.7845458984375, 4.068359375, 4.3521728515625, 4.635986328125, 4.9197998046875, 5.20361328125, 5.4874267578125, 5.771240234375, 6.0550537109375, 6.3388671875, 6.6226806640625, 6.906494140625, 7.1903076171875, 7.47412109375, 7.7579345703125, 8.041748046875, 8.3255615234375, 8.609375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 7.0, 5.0, 7.0, 18.0, 1.0, 5.0, 34.0, 33.0, 31.0, 30.0, 64.0, 66.0, 89.0, 118.0, 146.0, 196.0, 250.0, 299.0, 443.0, 562.0, 860.0, 1045.0, 1550.0, 2413.0, 3574.0, 6380.0, 12575.0, 28197.0, 86109.0, 5842378.0, 215349.0, 46719.0, 18404.0, 8920.0, 4907.0, 2859.0, 1835.0, 1389.0, 847.0, 685.0, 450.0, 382.0, 247.0, 220.0, 165.0, 129.0, 104.0, 89.0, 49.0, 48.0, 46.0, 13.0, 14.0, 26.0, 21.0, 23.0, 14.0, 1.0, 3.0, 9.0], "bins": [-16.90625, -16.4053955078125, -15.904541015625, -15.4036865234375, -14.90283203125, -14.4019775390625, -13.901123046875, -13.4002685546875, -12.8994140625, -12.3985595703125, -11.897705078125, -11.3968505859375, -10.89599609375, -10.3951416015625, -9.894287109375, -9.3934326171875, -8.892578125, -8.3917236328125, -7.890869140625, -7.3900146484375, -6.88916015625, -6.3883056640625, -5.887451171875, -5.3865966796875, -4.8857421875, -4.3848876953125, -3.884033203125, -3.3831787109375, -2.88232421875, -2.3814697265625, -1.880615234375, -1.3797607421875, -0.87890625, -0.3780517578125, 0.122802734375, 0.6236572265625, 1.12451171875, 1.6253662109375, 2.126220703125, 2.6270751953125, 3.1279296875, 3.6287841796875, 4.129638671875, 4.6304931640625, 5.13134765625, 5.6322021484375, 6.133056640625, 6.6339111328125, 7.134765625, 7.6356201171875, 8.136474609375, 8.6373291015625, 9.13818359375, 9.6390380859375, 10.139892578125, 10.6407470703125, 11.1416015625, 11.6424560546875, 12.143310546875, 12.6441650390625, 13.14501953125, 13.6458740234375, 14.146728515625, 14.6475830078125, 15.1484375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 6.0, 9.0, 7.0, 7.0, 17.0, 7.0, 12.0, 15.0, 18.0, 18.0, 19.0, 27.0, 36.0, 31.0, 36.0, 52.0, 53.0, 70.0, 114.0, 212.0, 443.0, 236.0, 107.0, 72.0, 54.0, 42.0, 30.0, 34.0, 39.0, 25.0, 25.0, 24.0, 14.0, 21.0, 10.0, 13.0, 16.0, 9.0, 7.0, 4.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.94140625, -5.76544189453125, -5.5894775390625, -5.41351318359375, -5.237548828125, -5.06158447265625, -4.8856201171875, -4.70965576171875, -4.53369140625, -4.35772705078125, -4.1817626953125, -4.00579833984375, -3.829833984375, -3.65386962890625, -3.4779052734375, -3.30194091796875, -3.1259765625, -2.95001220703125, -2.7740478515625, -2.59808349609375, -2.422119140625, -2.24615478515625, -2.0701904296875, -1.89422607421875, -1.71826171875, -1.54229736328125, -1.3663330078125, -1.19036865234375, -1.014404296875, -0.83843994140625, -0.6624755859375, -0.48651123046875, -0.310546875, -0.13458251953125, 0.0413818359375, 0.21734619140625, 0.393310546875, 0.56927490234375, 0.7452392578125, 0.92120361328125, 1.09716796875, 1.27313232421875, 1.4490966796875, 1.62506103515625, 1.801025390625, 1.97698974609375, 2.1529541015625, 2.32891845703125, 2.5048828125, 2.68084716796875, 2.8568115234375, 3.03277587890625, 3.208740234375, 3.38470458984375, 3.5606689453125, 3.73663330078125, 3.91259765625, 4.08856201171875, 4.2645263671875, 4.44049072265625, 4.616455078125, 4.79241943359375, 4.9683837890625, 5.14434814453125, 5.3203125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 16.0, 72.0, 251.0, 535.0, 92.0, 23.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-100.04877471923828, -98.23719787597656, -96.42562103271484, -94.6140365600586, -92.80245971679688, -90.99088287353516, -89.17930603027344, -87.36772918701172, -85.55615234375, -83.74457550048828, -81.93299865722656, -80.12141418457031, -78.3098373413086, -76.49826049804688, -74.68668365478516, -72.87510681152344, -71.06352233886719, -69.25194549560547, -67.44036865234375, -65.6287841796875, -63.81720733642578, -62.00563049316406, -60.194053649902344, -58.382476806640625, -56.57089614868164, -54.75931930541992, -52.94773864746094, -51.13616180419922, -49.3245849609375, -47.513004302978516, -45.7014274597168, -43.88984680175781, -42.07827377319336, -40.26669692993164, -38.455116271972656, -36.64353942871094, -34.83196258544922, -33.020381927490234, -31.208805084228516, -29.397226333618164, -27.585647583007812, -25.77406883239746, -23.96249008178711, -22.15091323852539, -20.33933448791504, -18.527755737304688, -16.71617889404297, -14.904600143432617, -13.093021392822266, -11.281442642211914, -9.469864845275879, -7.6582865715026855, -5.846708297729492, -4.035129547119141, -2.2235517501831055, -0.4119739532470703, 1.3996047973632812, 3.2111830711364746, 5.022761344909668, 6.834339618682861, 8.645917892456055, 10.457496643066406, 12.269074440002441, 14.080652236938477, 15.892230987548828]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 5.0, 5.0, 7.0, 13.0, 22.0, 14.0, 19.0, 32.0, 27.0, 29.0, 27.0, 38.0, 45.0, 43.0, 38.0, 41.0, 54.0, 49.0, 46.0, 33.0, 59.0, 43.0, 37.0, 41.0, 44.0, 22.0, 28.0, 26.0, 22.0, 28.0, 17.0, 14.0, 9.0, 8.0, 7.0, 3.0, 1.0, 8.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.205036163330078, -8.905710220336914, -8.60638427734375, -8.307058334350586, -8.007732391357422, -7.708406925201416, -7.409080982208252, -7.109755516052246, -6.810429573059082, -6.511103630065918, -6.211777687072754, -5.91245174407959, -5.613126277923584, -5.31380033493042, -5.014474391937256, -4.71514892578125, -4.415822505950928, -4.116496562957764, -3.8171708583831787, -3.5178449153900146, -3.2185192108154297, -2.9191932678222656, -2.6198673248291016, -2.3205416202545166, -2.0212156772613525, -1.721889853477478, -1.4225640296936035, -1.1232380867004395, -0.8239122629165649, -0.5245864391326904, -0.22526049613952637, 0.0740652084350586, 0.37339115142822266, 0.6727169752120972, 0.9720428586006165, 1.2713687419891357, 1.5706945657730103, 1.8700203895568848, 2.169346332550049, 2.468672037124634, 2.767997980117798, 3.067323923110962, 3.366649627685547, 3.665975570678711, 3.965301513671875, 4.264627456665039, 4.563953399658203, 4.863278865814209, 5.162604808807373, 5.461930751800537, 5.761256694793701, 6.060582160949707, 6.359908103942871, 6.659234046936035, 6.958559989929199, 7.257885932922363, 7.557211875915527, 7.856537818908691, 8.155863761901855, 8.45518970489502, 8.754515647888184, 9.053840637207031, 9.353166580200195, 9.65249252319336, 9.951818466186523]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 5.0, 5.0, 6.0, 5.0, 8.0, 14.0, 19.0, 23.0, 26.0, 45.0, 59.0, 79.0, 144.0, 223.0, 348.0, 572.0, 959.0, 1741.0, 3219.0, 7224.0, 21686.0, 3264130.0, 858073.0, 22007.0, 7435.0, 3115.0, 1447.0, 696.0, 360.0, 210.0, 139.0, 74.0, 51.0, 33.0, 28.0, 21.0, 14.0, 9.0, 4.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.035125732421875, -0.03412199020385742, -0.033118247985839844, -0.032114505767822266, -0.031110763549804688, -0.03010702133178711, -0.02910327911376953, -0.028099536895751953, -0.027095794677734375, -0.026092052459716797, -0.02508831024169922, -0.02408456802368164, -0.023080825805664062, -0.022077083587646484, -0.021073341369628906, -0.020069599151611328, -0.01906585693359375, -0.018062114715576172, -0.017058372497558594, -0.016054630279541016, -0.015050888061523438, -0.01404714584350586, -0.013043403625488281, -0.012039661407470703, -0.011035919189453125, -0.010032176971435547, -0.009028434753417969, -0.00802469253540039, -0.0070209503173828125, -0.006017208099365234, -0.005013465881347656, -0.004009723663330078, -0.0030059814453125, -0.002002239227294922, -0.0009984970092773438, 5.245208740234375e-06, 0.0010089874267578125, 0.0020127296447753906, 0.0030164718627929688, 0.004020214080810547, 0.005023956298828125, 0.006027698516845703, 0.007031440734863281, 0.00803518295288086, 0.009038925170898438, 0.010042667388916016, 0.011046409606933594, 0.012050151824951172, 0.01305389404296875, 0.014057636260986328, 0.015061378479003906, 0.016065120697021484, 0.017068862915039062, 0.01807260513305664, 0.01907634735107422, 0.020080089569091797, 0.021083831787109375, 0.022087574005126953, 0.02309131622314453, 0.02409505844116211, 0.025098800659179688, 0.026102542877197266, 0.027106285095214844, 0.028110027313232422, 0.02911376953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 5.0, 7.0, 6.0, 10.0, 6.0, 10.0, 6.0, 11.0, 14.0, 79.0, 499.0, 223.0, 23.0, 8.0, 9.0, 8.0, 10.0, 5.0, 11.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0016803741455078125, -0.0016288608312606812, -0.0015773475170135498, -0.0015258342027664185, -0.0014743208885192871, -0.0014228075742721558, -0.0013712942600250244, -0.001319780945777893, -0.0012682676315307617, -0.0012167543172836304, -0.001165241003036499, -0.0011137276887893677, -0.0010622143745422363, -0.001010701060295105, -0.0009591877460479736, -0.0009076744318008423, -0.0008561611175537109, -0.0008046478033065796, -0.0007531344890594482, -0.0007016211748123169, -0.0006501078605651855, -0.0005985945463180542, -0.0005470812320709229, -0.0004955679178237915, -0.00044405460357666016, -0.0003925412893295288, -0.00034102797508239746, -0.0002895146608352661, -0.00023800134658813477, -0.00018648803234100342, -0.00013497471809387207, -8.346140384674072e-05, -3.1948089599609375e-05, 1.9565224647521973e-05, 7.107853889465332e-05, 0.00012259185314178467, 0.00017410516738891602, 0.00022561848163604736, 0.0002771317958831787, 0.00032864511013031006, 0.0003801584243774414, 0.00043167173862457275, 0.0004831850528717041, 0.0005346983671188354, 0.0005862116813659668, 0.0006377249956130981, 0.0006892383098602295, 0.0007407516241073608, 0.0007922649383544922, 0.0008437782526016235, 0.0008952915668487549, 0.0009468048810958862, 0.0009983181953430176, 0.001049831509590149, 0.0011013448238372803, 0.0011528581380844116, 0.001204371452331543, 0.0012558847665786743, 0.0013073980808258057, 0.001358911395072937, 0.0014104247093200684, 0.0014619380235671997, 0.001513451337814331, 0.0015649646520614624, 0.0016164779663085938]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 14.0, 11.0, 9.0, 11.0, 19.0, 20.0, 31.0, 48.0, 78.0, 144.0, 213.0, 374.0, 689.0, 1334.0, 3684.0, 16811.0, 771253.0, 3372090.0, 20338.0, 3981.0, 1446.0, 680.0, 393.0, 217.0, 129.0, 75.0, 64.0, 34.0, 31.0, 13.0, 13.0, 9.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043060302734375, -0.041407108306884766, -0.03975391387939453, -0.0381007194519043, -0.03644752502441406, -0.03479433059692383, -0.033141136169433594, -0.03148794174194336, -0.029834747314453125, -0.02818155288696289, -0.026528358459472656, -0.024875164031982422, -0.023221969604492188, -0.021568775177001953, -0.01991558074951172, -0.018262386322021484, -0.01660919189453125, -0.014955997467041016, -0.013302803039550781, -0.011649608612060547, -0.009996414184570312, -0.008343219757080078, -0.006690025329589844, -0.005036830902099609, -0.003383636474609375, -0.0017304420471191406, -7.724761962890625e-05, 0.0015759468078613281, 0.0032291412353515625, 0.004882335662841797, 0.006535530090332031, 0.008188724517822266, 0.0098419189453125, 0.011495113372802734, 0.013148307800292969, 0.014801502227783203, 0.016454696655273438, 0.018107891082763672, 0.019761085510253906, 0.02141427993774414, 0.023067474365234375, 0.02472066879272461, 0.026373863220214844, 0.028027057647705078, 0.029680252075195312, 0.03133344650268555, 0.03298664093017578, 0.034639835357666016, 0.03629302978515625, 0.037946224212646484, 0.03959941864013672, 0.04125261306762695, 0.04290580749511719, 0.04455900192260742, 0.046212196350097656, 0.04786539077758789, 0.049518585205078125, 0.05117177963256836, 0.052824974060058594, 0.05447816848754883, 0.05613136291503906, 0.0577845573425293, 0.05943775177001953, 0.061090946197509766, 0.062744140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 11.0, 15.0, 20.0, 24.0, 23.0, 41.0, 44.0, 54.0, 68.0, 99.0, 128.0, 175.0, 298.0, 1478.0, 699.0, 233.0, 166.0, 122.0, 71.0, 66.0, 59.0, 33.0, 29.0, 28.0, 16.0, 12.0, 17.0, 9.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0033664703369140625, -0.0032411515712738037, -0.003115832805633545, -0.002990514039993286, -0.0028651952743530273, -0.0027398765087127686, -0.0026145577430725098, -0.002489238977432251, -0.002363920211791992, -0.0022386014461517334, -0.0021132826805114746, -0.001987963914871216, -0.001862645149230957, -0.0017373263835906982, -0.0016120076179504395, -0.0014866888523101807, -0.0013613700866699219, -0.001236051321029663, -0.0011107325553894043, -0.0009854137897491455, -0.0008600950241088867, -0.0007347762584686279, -0.0006094574928283691, -0.00048413872718811035, -0.00035881996154785156, -0.00023350119590759277, -0.00010818243026733398, 1.7136335372924805e-05, 0.0001424551010131836, 0.0002677738666534424, 0.00039309263229370117, 0.00051841139793396, 0.0006437301635742188, 0.0007690489292144775, 0.0008943676948547363, 0.0010196864604949951, 0.001145005226135254, 0.0012703239917755127, 0.0013956427574157715, 0.0015209615230560303, 0.001646280288696289, 0.0017715990543365479, 0.0018969178199768066, 0.0020222365856170654, 0.0021475553512573242, 0.002272874116897583, 0.002398192882537842, 0.0025235116481781006, 0.0026488304138183594, 0.002774149179458618, 0.002899467945098877, 0.0030247867107391357, 0.0031501054763793945, 0.0032754242420196533, 0.003400743007659912, 0.003526061773300171, 0.0036513805389404297, 0.0037766993045806885, 0.0039020180702209473, 0.004027336835861206, 0.004152655601501465, 0.004277974367141724, 0.004403293132781982, 0.004528611898422241, 0.0046539306640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 10.0, 18.0, 66.0, 231.0, 472.0, 136.0, 39.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0440877303481102, -0.04168759286403656, -0.03928745537996292, -0.03688731789588928, -0.03448718041181564, -0.032087042927742004, -0.029686905443668365, -0.027286767959594727, -0.024886630475521088, -0.02248649299144745, -0.02008635550737381, -0.01768621802330017, -0.015286080539226532, -0.012885943055152893, -0.010485805571079254, -0.008085668087005615, -0.005685530602931976, -0.0032853931188583374, -0.0008852556347846985, 0.0015148818492889404, 0.003915019333362579, 0.006315156817436218, 0.008715294301509857, 0.011115431785583496, 0.013515569269657135, 0.015915706753730774, 0.018315844237804413, 0.020715981721878052, 0.02311611920595169, 0.02551625669002533, 0.02791639417409897, 0.030316531658172607, 0.03271667659282684, 0.03511681407690048, 0.03751695156097412, 0.03991708904504776, 0.0423172265291214, 0.04471736401319504, 0.04711750149726868, 0.049517638981342316, 0.051917776465415955, 0.054317913949489594, 0.05671805143356323, 0.05911818891763687, 0.06151832640171051, 0.06391846388578415, 0.06631860136985779, 0.06871873885393143, 0.07111887633800507, 0.0735190138220787, 0.07591915130615234, 0.07831928879022598, 0.08071942627429962, 0.08311956375837326, 0.0855197012424469, 0.08791983872652054, 0.09031997621059418, 0.09272011369466782, 0.09512025117874146, 0.0975203886628151, 0.09992052614688873, 0.10232066363096237, 0.10472080111503601, 0.10712093859910965, 0.10952107608318329]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 13.0, 9.0, 21.0, 24.0, 33.0, 25.0, 35.0, 37.0, 53.0, 45.0, 47.0, 54.0, 61.0, 43.0, 60.0, 36.0, 48.0, 45.0, 55.0, 44.0, 29.0, 31.0, 28.0, 20.0, 21.0, 12.0, 15.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.013874709606170654, -0.013360245153307915, -0.012845780700445175, -0.012331316247582436, -0.011816851794719696, -0.011302387341856956, -0.010787922888994217, -0.010273458436131477, -0.009758993983268738, -0.009244529530405998, -0.008730065077543259, -0.008215600624680519, -0.0077011361718177795, -0.00718667171895504, -0.0066722072660923, -0.006157742813229561, -0.005643278360366821, -0.005128813907504082, -0.004614349454641342, -0.004099885001778603, -0.003585420548915863, -0.0030709560960531235, -0.002556491643190384, -0.0020420271903276443, -0.0015275627374649048, -0.0010130982846021652, -0.0004986338317394257, 1.5830621123313904e-05, 0.0005302950739860535, 0.001044759526848793, 0.0015592239797115326, 0.002073688432574272, 0.0025881528854370117, 0.0031026173382997513, 0.003617081791162491, 0.00413154624402523, 0.00464601069688797, 0.0051604751497507095, 0.005674939602613449, 0.006189404055476189, 0.006703868508338928, 0.007218332961201668, 0.007732797414064407, 0.008247261866927147, 0.008761726319789886, 0.009276190772652626, 0.009790655225515366, 0.010305119678378105, 0.010819584131240845, 0.011334048584103584, 0.011848513036966324, 0.012362977489829063, 0.012877441942691803, 0.013391906395554543, 0.013906370848417282, 0.014420835301280022, 0.014935299754142761, 0.0154497642070055, 0.01596422865986824, 0.01647869311273098, 0.01699315756559372, 0.01750762201845646, 0.0180220864713192, 0.018536550924181938, 0.019051015377044678]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 12.0, 20.0, 23.0, 19.0, 32.0, 43.0, 57.0, 80.0, 89.0, 141.0, 195.0, 277.0, 333.0, 544.0, 732.0, 1039.0, 1465.0, 2224.0, 3380.0, 5384.0, 8461.0, 15292.0, 34971.0, 819884.0, 100946.0, 21920.0, 11352.0, 6620.0, 4237.0, 2709.0, 1807.0, 1241.0, 843.0, 604.0, 420.0, 284.0, 232.0, 166.0, 138.0, 95.0, 62.0, 36.0, 38.0, 24.0, 17.0, 17.0, 9.0, 7.0, 8.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0], "bins": [-0.01934814453125, -0.018757343292236328, -0.018166542053222656, -0.017575740814208984, -0.016984939575195312, -0.01639413833618164, -0.01580333709716797, -0.015212535858154297, -0.014621734619140625, -0.014030933380126953, -0.013440132141113281, -0.01284933090209961, -0.012258529663085938, -0.011667728424072266, -0.011076927185058594, -0.010486125946044922, -0.00989532470703125, -0.009304523468017578, -0.008713722229003906, -0.008122920989990234, -0.0075321197509765625, -0.006941318511962891, -0.006350517272949219, -0.005759716033935547, -0.005168914794921875, -0.004578113555908203, -0.003987312316894531, -0.0033965110778808594, -0.0028057098388671875, -0.0022149085998535156, -0.0016241073608398438, -0.0010333061218261719, -0.0004425048828125, 0.00014829635620117188, 0.0007390975952148438, 0.0013298988342285156, 0.0019207000732421875, 0.0025115013122558594, 0.0031023025512695312, 0.003693103790283203, 0.004283905029296875, 0.004874706268310547, 0.005465507507324219, 0.006056308746337891, 0.0066471099853515625, 0.007237911224365234, 0.007828712463378906, 0.008419513702392578, 0.00901031494140625, 0.009601116180419922, 0.010191917419433594, 0.010782718658447266, 0.011373519897460938, 0.01196432113647461, 0.012555122375488281, 0.013145923614501953, 0.013736724853515625, 0.014327526092529297, 0.014918327331542969, 0.01550912857055664, 0.016099929809570312, 0.016690731048583984, 0.017281532287597656, 0.017872333526611328, 0.018463134765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 9.0, 7.0, 9.0, 13.0, 11.0, 65.0, 333.0, 341.0, 72.0, 19.0, 7.0, 11.0, 7.0, 9.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0017604827880859375, -0.001710057258605957, -0.0016596317291259766, -0.001609206199645996, -0.0015587806701660156, -0.0015083551406860352, -0.0014579296112060547, -0.0014075040817260742, -0.0013570785522460938, -0.0013066530227661133, -0.0012562274932861328, -0.0012058019638061523, -0.0011553764343261719, -0.0011049509048461914, -0.001054525375366211, -0.0010040998458862305, -0.00095367431640625, -0.0009032487869262695, -0.0008528232574462891, -0.0008023977279663086, -0.0007519721984863281, -0.0007015466690063477, -0.0006511211395263672, -0.0006006956100463867, -0.0005502700805664062, -0.0004998445510864258, -0.0004494190216064453, -0.00039899349212646484, -0.0003485679626464844, -0.0002981424331665039, -0.00024771690368652344, -0.00019729137420654297, -0.0001468658447265625, -9.644031524658203e-05, -4.601478576660156e-05, 4.410743713378906e-06, 5.4836273193359375e-05, 0.00010526180267333984, 0.0001556873321533203, 0.00020611286163330078, 0.00025653839111328125, 0.0003069639205932617, 0.0003573894500732422, 0.00040781497955322266, 0.0004582405090332031, 0.0005086660385131836, 0.0005590915679931641, 0.0006095170974731445, 0.000659942626953125, 0.0007103681564331055, 0.0007607936859130859, 0.0008112192153930664, 0.0008616447448730469, 0.0009120702743530273, 0.0009624958038330078, 0.0010129213333129883, 0.0010633468627929688, 0.0011137723922729492, 0.0011641979217529297, 0.0012146234512329102, 0.0012650489807128906, 0.001315474510192871, 0.0013659000396728516, 0.001416325569152832, 0.0014667510986328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 4.0, 3.0, 7.0, 5.0, 5.0, 16.0, 9.0, 19.0, 25.0, 24.0, 40.0, 39.0, 67.0, 66.0, 107.0, 188.0, 253.0, 307.0, 511.0, 791.0, 1293.0, 2166.0, 4475.0, 11437.0, 57456.0, 854643.0, 88800.0, 14125.0, 5240.0, 2424.0, 1380.0, 849.0, 517.0, 331.0, 233.0, 206.0, 133.0, 79.0, 71.0, 53.0, 43.0, 29.0, 19.0, 19.0, 10.0, 15.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.0357666015625, -0.034668922424316406, -0.03357124328613281, -0.03247356414794922, -0.031375885009765625, -0.03027820587158203, -0.029180526733398438, -0.028082847595214844, -0.02698516845703125, -0.025887489318847656, -0.024789810180664062, -0.02369213104248047, -0.022594451904296875, -0.02149677276611328, -0.020399093627929688, -0.019301414489746094, -0.0182037353515625, -0.017106056213378906, -0.016008377075195312, -0.014910697937011719, -0.013813018798828125, -0.012715339660644531, -0.011617660522460938, -0.010519981384277344, -0.00942230224609375, -0.008324623107910156, -0.0072269439697265625, -0.006129264831542969, -0.005031585693359375, -0.003933906555175781, -0.0028362274169921875, -0.0017385482788085938, -0.000640869140625, 0.00045680999755859375, 0.0015544891357421875, 0.0026521682739257812, 0.003749847412109375, 0.004847526550292969, 0.0059452056884765625, 0.007042884826660156, 0.00814056396484375, 0.009238243103027344, 0.010335922241210938, 0.011433601379394531, 0.012531280517578125, 0.013628959655761719, 0.014726638793945312, 0.015824317932128906, 0.0169219970703125, 0.018019676208496094, 0.019117355346679688, 0.02021503448486328, 0.021312713623046875, 0.02241039276123047, 0.023508071899414062, 0.024605751037597656, 0.02570343017578125, 0.026801109313964844, 0.027898788452148438, 0.02899646759033203, 0.030094146728515625, 0.03119182586669922, 0.03228950500488281, 0.033387184143066406, 0.03448486328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 6.0, 14.0, 11.0, 9.0, 12.0, 11.0, 18.0, 21.0, 28.0, 26.0, 30.0, 23.0, 41.0, 39.0, 37.0, 40.0, 46.0, 42.0, 39.0, 40.0, 37.0, 34.0, 47.0, 42.0, 41.0, 30.0, 26.0, 31.0, 40.0, 21.0, 18.0, 15.0, 17.0, 13.0, 7.0, 10.0, 6.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007640838623046875, -0.00741344690322876, -0.0071860551834106445, -0.006958663463592529, -0.006731271743774414, -0.006503880023956299, -0.006276488304138184, -0.006049096584320068, -0.005821704864501953, -0.005594313144683838, -0.005366921424865723, -0.005139529705047607, -0.004912137985229492, -0.004684746265411377, -0.004457354545593262, -0.0042299628257751465, -0.004002571105957031, -0.003775179386138916, -0.0035477876663208008, -0.0033203959465026855, -0.0030930042266845703, -0.002865612506866455, -0.00263822078704834, -0.0024108290672302246, -0.0021834373474121094, -0.001956045627593994, -0.001728653907775879, -0.0015012621879577637, -0.0012738704681396484, -0.0010464787483215332, -0.000819087028503418, -0.0005916953086853027, -0.0003643035888671875, -0.00013691186904907227, 9.047985076904297e-05, 0.0003178715705871582, 0.0005452632904052734, 0.0007726550102233887, 0.001000046730041504, 0.0012274384498596191, 0.0014548301696777344, 0.0016822218894958496, 0.0019096136093139648, 0.00213700532913208, 0.0023643970489501953, 0.0025917887687683105, 0.0028191804885864258, 0.003046572208404541, 0.0032739639282226562, 0.0035013556480407715, 0.0037287473678588867, 0.003956139087677002, 0.004183530807495117, 0.004410922527313232, 0.004638314247131348, 0.004865705966949463, 0.005093097686767578, 0.005320489406585693, 0.005547881126403809, 0.005775272846221924, 0.006002664566040039, 0.006230056285858154, 0.0064574480056762695, 0.006684839725494385, 0.0069122314453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 4.0, 9.0, 10.0, 8.0, 21.0, 42.0, 44.0, 86.0, 208.0, 671.0, 4318.0, 896820.0, 142225.0, 3062.0, 609.0, 164.0, 86.0, 39.0, 23.0, 12.0, 20.0, 12.0, 5.0, 10.0, 11.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0294189453125, -0.02868199348449707, -0.02794504165649414, -0.02720808982849121, -0.02647113800048828, -0.02573418617248535, -0.024997234344482422, -0.024260282516479492, -0.023523330688476562, -0.022786378860473633, -0.022049427032470703, -0.021312475204467773, -0.020575523376464844, -0.019838571548461914, -0.019101619720458984, -0.018364667892456055, -0.017627716064453125, -0.016890764236450195, -0.016153812408447266, -0.015416860580444336, -0.014679908752441406, -0.013942956924438477, -0.013206005096435547, -0.012469053268432617, -0.011732101440429688, -0.010995149612426758, -0.010258197784423828, -0.009521245956420898, -0.008784294128417969, -0.008047342300415039, -0.007310390472412109, -0.00657343864440918, -0.00583648681640625, -0.00509953498840332, -0.004362583160400391, -0.003625631332397461, -0.0028886795043945312, -0.0021517276763916016, -0.0014147758483886719, -0.0006778240203857422, 5.91278076171875e-05, 0.0007960796356201172, 0.0015330314636230469, 0.0022699832916259766, 0.0030069351196289062, 0.003743886947631836, 0.004480838775634766, 0.005217790603637695, 0.005954742431640625, 0.006691694259643555, 0.007428646087646484, 0.008165597915649414, 0.008902549743652344, 0.009639501571655273, 0.010376453399658203, 0.011113405227661133, 0.011850357055664062, 0.012587308883666992, 0.013324260711669922, 0.014061212539672852, 0.014798164367675781, 0.015535116195678711, 0.01627206802368164, 0.01700901985168457, 0.0177459716796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 14.0, 10.0, 16.0, 24.0, 37.0, 57.0, 89.0, 110.0, 125.0, 124.0, 114.0, 77.0, 63.0, 30.0, 35.0, 22.0, 7.0, 10.0, 13.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0471553802490234e-05, -3.940518945455551e-05, -3.833882510662079e-05, -3.7272460758686066e-05, -3.620609641075134e-05, -3.513973206281662e-05, -3.40733677148819e-05, -3.3007003366947174e-05, -3.194063901901245e-05, -3.087427467107773e-05, -2.9807910323143005e-05, -2.8741545975208282e-05, -2.767518162727356e-05, -2.6608817279338837e-05, -2.5542452931404114e-05, -2.447608858346939e-05, -2.3409724235534668e-05, -2.2343359887599945e-05, -2.1276995539665222e-05, -2.02106311917305e-05, -1.9144266843795776e-05, -1.8077902495861053e-05, -1.701153814792633e-05, -1.5945173799991608e-05, -1.4878809452056885e-05, -1.3812445104122162e-05, -1.2746080756187439e-05, -1.1679716408252716e-05, -1.0613352060317993e-05, -9.54698771238327e-06, -8.480623364448547e-06, -7.4142590165138245e-06, -6.3478946685791016e-06, -5.281530320644379e-06, -4.215165972709656e-06, -3.148801624774933e-06, -2.08243727684021e-06, -1.016072928905487e-06, 5.029141902923584e-08, 1.1166557669639587e-06, 2.1830201148986816e-06, 3.2493844628334045e-06, 4.3157488107681274e-06, 5.38211315870285e-06, 6.448477506637573e-06, 7.514841854572296e-06, 8.581206202507019e-06, 9.647570550441742e-06, 1.0713934898376465e-05, 1.1780299246311188e-05, 1.284666359424591e-05, 1.3913027942180634e-05, 1.4979392290115356e-05, 1.604575663805008e-05, 1.7112120985984802e-05, 1.8178485333919525e-05, 1.9244849681854248e-05, 2.031121402978897e-05, 2.1377578377723694e-05, 2.2443942725658417e-05, 2.351030707359314e-05, 2.4576671421527863e-05, 2.5643035769462585e-05, 2.670940011739731e-05, 2.777576446533203e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 4.0, 6.0, 11.0, 12.0, 15.0, 44.0, 57.0, 81.0, 111.0, 179.0, 293.0, 496.0, 993.0, 2428.0, 9335.0, 769458.0, 252584.0, 8059.0, 2137.0, 934.0, 508.0, 288.0, 157.0, 92.0, 69.0, 51.0, 42.0, 31.0, 13.0, 18.0, 7.0, 8.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0278778076171875, -0.027005434036254883, -0.026133060455322266, -0.02526068687438965, -0.02438831329345703, -0.023515939712524414, -0.022643566131591797, -0.02177119255065918, -0.020898818969726562, -0.020026445388793945, -0.019154071807861328, -0.01828169822692871, -0.017409324645996094, -0.016536951065063477, -0.01566457748413086, -0.014792203903198242, -0.013919830322265625, -0.013047456741333008, -0.01217508316040039, -0.011302709579467773, -0.010430335998535156, -0.009557962417602539, -0.008685588836669922, -0.007813215255737305, -0.0069408416748046875, -0.00606846809387207, -0.005196094512939453, -0.004323720932006836, -0.0034513473510742188, -0.0025789737701416016, -0.0017066001892089844, -0.0008342266082763672, 3.814697265625e-05, 0.0009105205535888672, 0.0017828941345214844, 0.0026552677154541016, 0.0035276412963867188, 0.004400014877319336, 0.005272388458251953, 0.00614476203918457, 0.0070171356201171875, 0.007889509201049805, 0.008761882781982422, 0.009634256362915039, 0.010506629943847656, 0.011379003524780273, 0.01225137710571289, 0.013123750686645508, 0.013996124267578125, 0.014868497848510742, 0.01574087142944336, 0.016613245010375977, 0.017485618591308594, 0.01835799217224121, 0.019230365753173828, 0.020102739334106445, 0.020975112915039062, 0.02184748649597168, 0.022719860076904297, 0.023592233657836914, 0.02446460723876953, 0.02533698081970215, 0.026209354400634766, 0.027081727981567383, 0.0279541015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 12.0, 12.0, 14.0, 22.0, 23.0, 34.0, 51.0, 74.0, 141.0, 195.0, 162.0, 81.0, 33.0, 32.0, 28.0, 17.0, 11.0, 7.0, 7.0, 6.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00684356689453125, -0.006638944149017334, -0.006434321403503418, -0.006229698657989502, -0.006025075912475586, -0.00582045316696167, -0.005615830421447754, -0.005411207675933838, -0.005206584930419922, -0.005001962184906006, -0.00479733943939209, -0.004592716693878174, -0.004388093948364258, -0.004183471202850342, -0.003978848457336426, -0.0037742257118225098, -0.0035696029663085938, -0.0033649802207946777, -0.0031603574752807617, -0.0029557347297668457, -0.0027511119842529297, -0.0025464892387390137, -0.0023418664932250977, -0.0021372437477111816, -0.0019326210021972656, -0.0017279982566833496, -0.0015233755111694336, -0.0013187527656555176, -0.0011141300201416016, -0.0009095072746276855, -0.0007048845291137695, -0.0005002617835998535, -0.0002956390380859375, -9.101629257202148e-05, 0.00011360645294189453, 0.00031822919845581055, 0.0005228519439697266, 0.0007274746894836426, 0.0009320974349975586, 0.0011367201805114746, 0.0013413429260253906, 0.0015459656715393066, 0.0017505884170532227, 0.0019552111625671387, 0.0021598339080810547, 0.0023644566535949707, 0.0025690793991088867, 0.0027737021446228027, 0.0029783248901367188, 0.0031829476356506348, 0.0033875703811645508, 0.003592193126678467, 0.003796815872192383, 0.004001438617706299, 0.004206061363220215, 0.004410684108734131, 0.004615306854248047, 0.004819929599761963, 0.005024552345275879, 0.005229175090789795, 0.005433797836303711, 0.005638420581817627, 0.005843043327331543, 0.006047666072845459, 0.006252288818359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 9.0, 8.0, 23.0, 154.0, 666.0, 63.0, 23.0, 21.0, 13.0, 3.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3244737386703491, -0.3105740547180176, -0.29667437076568604, -0.2827746570110321, -0.26887497305870056, -0.254975289106369, -0.24107559025287628, -0.22717589139938354, -0.213276207447052, -0.19937652349472046, -0.18547682464122772, -0.17157712578773499, -0.15767744183540344, -0.1437777578830719, -0.12987805902957916, -0.11597836762666702, -0.10207867622375488, -0.08817898482084274, -0.0742792934179306, -0.06037960201501846, -0.04647991061210632, -0.03258021920919418, -0.018680527806282043, -0.0047808364033699036, 0.009118854999542236, 0.023018546402454376, 0.036918237805366516, 0.050817929208278656, 0.0647176206111908, 0.07861731201410294, 0.09251700341701508, 0.10641669481992722, 0.12031638622283936, 0.1342160701751709, 0.14811576902866364, 0.16201546788215637, 0.17591515183448792, 0.18981483578681946, 0.2037145346403122, 0.21761423349380493, 0.23151391744613647, 0.24541360139846802, 0.25931328535079956, 0.2732129991054535, 0.28711268305778503, 0.3010123670101166, 0.3149120807647705, 0.32881176471710205, 0.3427114486694336, 0.35661113262176514, 0.3705108165740967, 0.3844105303287506, 0.39831021428108215, 0.4122098982334137, 0.4261096119880676, 0.44000929594039917, 0.4539089798927307, 0.46780866384506226, 0.4817083477973938, 0.49560806155204773, 0.5095077753067017, 0.5234074592590332, 0.5373071432113647, 0.5512068271636963, 0.5651065111160278]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 5.0, 8.0, 7.0, 7.0, 9.0, 20.0, 30.0, 53.0, 107.0, 126.0, 179.0, 150.0, 108.0, 60.0, 32.0, 18.0, 14.0, 11.0, 6.0, 5.0, 5.0, 9.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12328165769577026, -0.11845885217189789, -0.11363604664802551, -0.10881324112415314, -0.10399043560028076, -0.09916763007640839, -0.09434483200311661, -0.08952202647924423, -0.08469922095537186, -0.07987641543149948, -0.0750536099076271, -0.07023080438375473, -0.06540800631046295, -0.06058519706130028, -0.0557623952627182, -0.050939589738845825, -0.04611678421497345, -0.041293978691101074, -0.0364711731672287, -0.03164837136864662, -0.026825565844774246, -0.02200276032090187, -0.017179956659674644, -0.012357152998447418, -0.007534347474575043, -0.002711542882025242, 0.002111261710524559, 0.00693406630307436, 0.01175687089562416, 0.016579676419496536, 0.021402480080723763, 0.02622528374195099, 0.031048089265823364, 0.03587089478969574, 0.040693700313568115, 0.04551650211215019, 0.05033930763602257, 0.05516211315989494, 0.05998491495847702, 0.0648077204823494, 0.06963052600622177, 0.07445333153009415, 0.07927613705396652, 0.0840989425778389, 0.08892174065113068, 0.09374454617500305, 0.09856735169887543, 0.1033901572227478, 0.10821296274662018, 0.11303576827049255, 0.11785857379436493, 0.1226813793182373, 0.12750418484210968, 0.13232699036598206, 0.13714979588985443, 0.1419726014137268, 0.146795392036438, 0.15161819756031036, 0.15644100308418274, 0.16126380860805511, 0.1660866141319275, 0.17090941965579987, 0.17573222517967224, 0.18055501580238342, 0.185377836227417]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 10.0, 14.0, 18.0, 17.0, 20.0, 34.0, 58.0, 147.0, 1190.0, 50004.0, 4139548.0, 2817.0, 150.0, 50.0, 38.0, 26.0, 23.0, 21.0, 14.0, 13.0, 6.0, 3.0, 5.0, 10.0, 1.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.90625, -2.8321075439453125, -2.757965087890625, -2.6838226318359375, -2.60968017578125, -2.5355377197265625, -2.461395263671875, -2.3872528076171875, -2.3131103515625, -2.2389678955078125, -2.164825439453125, -2.0906829833984375, -2.01654052734375, -1.9423980712890625, -1.868255615234375, -1.7941131591796875, -1.719970703125, -1.6458282470703125, -1.571685791015625, -1.4975433349609375, -1.42340087890625, -1.3492584228515625, -1.275115966796875, -1.2009735107421875, -1.1268310546875, -1.0526885986328125, -0.978546142578125, -0.9044036865234375, -0.83026123046875, -0.7561187744140625, -0.681976318359375, -0.6078338623046875, -0.53369140625, -0.4595489501953125, -0.385406494140625, -0.3112640380859375, -0.23712158203125, -0.1629791259765625, -0.088836669921875, -0.0146942138671875, 0.0594482421875, 0.1335906982421875, 0.207733154296875, 0.2818756103515625, 0.35601806640625, 0.4301605224609375, 0.504302978515625, 0.5784454345703125, 0.652587890625, 0.7267303466796875, 0.800872802734375, 0.8750152587890625, 0.94915771484375, 1.0233001708984375, 1.097442626953125, 1.1715850830078125, 1.2457275390625, 1.3198699951171875, 1.394012451171875, 1.4681549072265625, 1.54229736328125, 1.6164398193359375, 1.690582275390625, 1.7647247314453125, 1.8388671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 5.0, 4.0, 9.0, 7.0, 9.0, 9.0, 24.0, 84.0, 283.0, 323.0, 97.0, 24.0, 15.0, 7.0, 7.0, 11.0, 7.0, 9.0, 7.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0014324188232421875, -0.0013889670372009277, -0.001345515251159668, -0.0013020634651184082, -0.0012586116790771484, -0.0012151598930358887, -0.001171708106994629, -0.0011282563209533691, -0.0010848045349121094, -0.0010413527488708496, -0.0009979009628295898, -0.0009544491767883301, -0.0009109973907470703, -0.0008675456047058105, -0.0008240938186645508, -0.000780642032623291, -0.0007371902465820312, -0.0006937384605407715, -0.0006502866744995117, -0.000606834888458252, -0.0005633831024169922, -0.0005199313163757324, -0.00047647953033447266, -0.0004330277442932129, -0.0003895759582519531, -0.00034612417221069336, -0.0003026723861694336, -0.00025922060012817383, -0.00021576881408691406, -0.0001723170280456543, -0.00012886524200439453, -8.541345596313477e-05, -4.1961669921875e-05, 1.4901161193847656e-06, 4.494190216064453e-05, 8.83936882019043e-05, 0.00013184547424316406, 0.00017529726028442383, 0.0002187490463256836, 0.00026220083236694336, 0.0003056526184082031, 0.0003491044044494629, 0.00039255619049072266, 0.0004360079765319824, 0.0004794597625732422, 0.000522911548614502, 0.0005663633346557617, 0.0006098151206970215, 0.0006532669067382812, 0.000696718692779541, 0.0007401704788208008, 0.0007836222648620605, 0.0008270740509033203, 0.0008705258369445801, 0.0009139776229858398, 0.0009574294090270996, 0.0010008811950683594, 0.0010443329811096191, 0.001087784767150879, 0.0011312365531921387, 0.0011746883392333984, 0.0012181401252746582, 0.001261591911315918, 0.0013050436973571777, 0.0013484954833984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 1.0, 18.0, 14.0, 36.0, 45.0, 78.0, 128.0, 208.0, 350.0, 106355.0, 4085870.0, 459.0, 233.0, 184.0, 120.0, 75.0, 49.0, 30.0, 22.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3667106628417969, -0.33864593505859375, -0.3105812072753906, -0.2825164794921875, -0.2544517517089844, -0.22638702392578125, -0.19832229614257812, -0.170257568359375, -0.14219284057617188, -0.11412811279296875, -0.08606338500976562, -0.0579986572265625, -0.029933929443359375, -0.00186920166015625, 0.026195526123046875, 0.05426025390625, 0.08232498168945312, 0.11038970947265625, 0.13845443725585938, 0.1665191650390625, 0.19458389282226562, 0.22264862060546875, 0.2507133483886719, 0.278778076171875, 0.3068428039550781, 0.33490753173828125, 0.3629722595214844, 0.3910369873046875, 0.4191017150878906, 0.44716644287109375, 0.4752311706542969, 0.5032958984375, 0.5313606262207031, 0.5594253540039062, 0.5874900817871094, 0.6155548095703125, 0.6436195373535156, 0.6716842651367188, 0.6997489929199219, 0.727813720703125, 0.7558784484863281, 0.7839431762695312, 0.8120079040527344, 0.8400726318359375, 0.8681373596191406, 0.8962020874023438, 0.9242668151855469, 0.95233154296875, 0.9803962707519531, 1.0084609985351562, 1.0365257263183594, 1.0645904541015625, 1.0926551818847656, 1.1207199096679688, 1.1487846374511719, 1.176849365234375, 1.2049140930175781, 1.2329788208007812, 1.2610435485839844, 1.2891082763671875, 1.3171730041503906, 1.3452377319335938, 1.3733024597167969, 1.4013671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 8.0, 15.0, 22.0, 36.0, 48.0, 100.0, 144.0, 236.0, 380.0, 1459.0, 581.0, 321.0, 234.0, 188.0, 111.0, 82.0, 48.0, 29.0, 21.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027332305908203125, -0.002521008253097534, -0.002308785915374756, -0.0020965635776519775, -0.0018843412399291992, -0.001672118902206421, -0.0014598965644836426, -0.0012476742267608643, -0.001035451889038086, -0.0008232295513153076, -0.0006110072135925293, -0.000398784875869751, -0.00018656253814697266, 2.5659799575805664e-05, 0.00023788213729858398, 0.0004501044750213623, 0.0006623268127441406, 0.0008745491504669189, 0.0010867714881896973, 0.0012989938259124756, 0.001511216163635254, 0.0017234385013580322, 0.0019356608390808105, 0.002147883176803589, 0.002360105514526367, 0.0025723278522491455, 0.002784550189971924, 0.002996772527694702, 0.0032089948654174805, 0.003421217203140259, 0.003633439540863037, 0.0038456618785858154, 0.004057884216308594, 0.004270106554031372, 0.00448232889175415, 0.004694551229476929, 0.004906773567199707, 0.005118995904922485, 0.005331218242645264, 0.005543440580368042, 0.00575566291809082, 0.005967885255813599, 0.006180107593536377, 0.006392329931259155, 0.006604552268981934, 0.006816774606704712, 0.00702899694442749, 0.0072412192821502686, 0.007453441619873047, 0.007665663957595825, 0.007877886295318604, 0.008090108633041382, 0.00830233097076416, 0.008514553308486938, 0.008726775646209717, 0.008938997983932495, 0.009151220321655273, 0.009363442659378052, 0.00957566499710083, 0.009787887334823608, 0.010000109672546387, 0.010212332010269165, 0.010424554347991943, 0.010636776685714722, 0.0108489990234375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [616.0, 389.0, 17.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0585235059261322, 0.003385651856660843, 0.06529480963945389, 0.12720397114753723, 0.18911312520503998, 0.2510222792625427, 0.31293144822120667, 0.3748405873775482, 0.43674975633621216, 0.4986589252948761, 0.56056809425354, 0.6224772334098816, 0.6843863725662231, 0.7462955713272095, 0.808204710483551, 0.8701138496398926, 0.9320230484008789, 0.9939321875572205, 1.055841326713562, 1.1177505254745483, 1.1796597242355347, 1.2415688037872314, 1.3034780025482178, 1.365387201309204, 1.4272962808609009, 1.4892054796218872, 1.551114559173584, 1.6130237579345703, 1.6749329566955566, 1.7368420362472534, 1.7987512350082397, 1.8606603145599365, 1.9225696325302124, 1.9844788312911987, 2.0463879108428955, 2.108297109603882, 2.170206308364868, 2.2321155071258545, 2.2940244674682617, 2.355933666229248, 2.4178428649902344, 2.4797520637512207, 2.541661262512207, 2.6035704612731934, 2.6654794216156006, 2.727388620376587, 2.7892978191375732, 2.8512070178985596, 2.913116216659546, 2.9750254154205322, 3.0369346141815186, 3.098843574523926, 3.160752773284912, 3.2226619720458984, 3.2845711708068848, 3.346480369567871, 3.4083893299102783, 3.4702985286712646, 3.532207727432251, 3.594116687774658, 3.6560258865356445, 3.717935085296631, 3.779844284057617, 3.8417534828186035, 3.90366268157959]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 40.0, 84.0, 118.0, 157.0, 179.0, 160.0, 119.0, 59.0, 35.0, 13.0, 12.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05067789554595947, -0.04592546075582504, -0.04117302596569061, -0.03642059490084648, -0.03166816011071205, -0.02691572532057762, -0.02216329239308834, -0.01741085946559906, -0.01265842467546463, -0.007905990816652775, -0.0031535569578409195, 0.0015988769009709358, 0.006351310759782791, 0.011103745549917221, 0.015856178477406502, 0.020608611404895782, 0.025361046195030212, 0.030113480985164642, 0.03486591577529907, 0.039618346840143204, 0.044370781630277634, 0.049123216420412064, 0.053875647485256195, 0.058628082275390625, 0.06338051706552505, 0.06813295185565948, 0.07288538664579391, 0.07763782143592834, 0.08239024877548218, 0.0871426910161972, 0.09189511835575104, 0.09664755314588547, 0.1013999879360199, 0.10615242272615433, 0.11090485751628876, 0.11565729230642319, 0.12040972709655762, 0.12516215443611145, 0.12991459667682648, 0.1346670240163803, 0.13941946625709534, 0.14417189359664917, 0.1489243358373642, 0.15367676317691803, 0.15842920541763306, 0.1631816327571869, 0.16793407499790192, 0.17268650233745575, 0.17743892967700958, 0.18219135701656342, 0.18694379925727844, 0.19169622659683228, 0.1964486688375473, 0.20120109617710114, 0.20595353841781616, 0.21070596575737, 0.21545839309692383, 0.22021082043647766, 0.2249632626771927, 0.22971569001674652, 0.23446813225746155, 0.23922055959701538, 0.2439730018377304, 0.24872542917728424, 0.25347787141799927]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 3.0, 9.0, 10.0, 24.0, 21.0, 46.0, 57.0, 86.0, 91.0, 131.0, 150.0, 206.0, 313.0, 452.0, 593.0, 799.0, 1159.0, 1507.0, 2261.0, 3063.0, 4583.0, 6814.0, 10889.0, 20465.0, 87547.0, 771677.0, 82316.0, 20096.0, 10755.0, 6754.0, 4612.0, 3134.0, 2187.0, 1515.0, 1180.0, 817.0, 567.0, 478.0, 283.0, 226.0, 173.0, 123.0, 97.0, 85.0, 51.0, 41.0, 26.0, 28.0, 18.0, 9.0, 15.0, 2.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.023101806640625, -0.022368192672729492, -0.021634578704833984, -0.020900964736938477, -0.02016735076904297, -0.01943373680114746, -0.018700122833251953, -0.017966508865356445, -0.017232894897460938, -0.01649928092956543, -0.015765666961669922, -0.015032052993774414, -0.014298439025878906, -0.013564825057983398, -0.01283121109008789, -0.012097597122192383, -0.011363983154296875, -0.010630369186401367, -0.00989675521850586, -0.009163141250610352, -0.008429527282714844, -0.007695913314819336, -0.006962299346923828, -0.00622868537902832, -0.0054950714111328125, -0.004761457443237305, -0.004027843475341797, -0.003294229507446289, -0.0025606155395507812, -0.0018270015716552734, -0.0010933876037597656, -0.0003597736358642578, 0.00037384033203125, 0.0011074542999267578, 0.0018410682678222656, 0.0025746822357177734, 0.0033082962036132812, 0.004041910171508789, 0.004775524139404297, 0.005509138107299805, 0.0062427520751953125, 0.00697636604309082, 0.007709980010986328, 0.008443593978881836, 0.009177207946777344, 0.009910821914672852, 0.01064443588256836, 0.011378049850463867, 0.012111663818359375, 0.012845277786254883, 0.01357889175415039, 0.014312505722045898, 0.015046119689941406, 0.015779733657836914, 0.016513347625732422, 0.01724696159362793, 0.017980575561523438, 0.018714189529418945, 0.019447803497314453, 0.02018141746520996, 0.02091503143310547, 0.021648645401000977, 0.022382259368896484, 0.023115873336791992, 0.0238494873046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 4.0, 3.0, 5.0, 6.0, 11.0, 3.0, 7.0, 8.0, 7.0, 18.0, 26.0, 88.0, 201.0, 246.0, 183.0, 74.0, 20.0, 11.0, 10.0, 8.0, 9.0, 7.0, 9.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014486312866210938, -0.0014037638902664185, -0.0013588964939117432, -0.0013140290975570679, -0.0012691617012023926, -0.0012242943048477173, -0.001179426908493042, -0.0011345595121383667, -0.0010896921157836914, -0.0010448247194290161, -0.0009999573230743408, -0.0009550899267196655, -0.0009102225303649902, -0.0008653551340103149, -0.0008204877376556396, -0.0007756203413009644, -0.0007307529449462891, -0.0006858855485916138, -0.0006410181522369385, -0.0005961507558822632, -0.0005512833595275879, -0.0005064159631729126, -0.0004615485668182373, -0.000416681170463562, -0.0003718137741088867, -0.0003269463777542114, -0.00028207898139953613, -0.00023721158504486084, -0.00019234418869018555, -0.00014747679233551025, -0.00010260939598083496, -5.774199962615967e-05, -1.2874603271484375e-05, 3.199279308319092e-05, 7.686018943786621e-05, 0.0001217275857925415, 0.0001665949821472168, 0.0002114623785018921, 0.0002563297748565674, 0.0003011971712112427, 0.00034606456756591797, 0.00039093196392059326, 0.00043579936027526855, 0.00048066675662994385, 0.0005255341529846191, 0.0005704015493392944, 0.0006152689456939697, 0.000660136342048645, 0.0007050037384033203, 0.0007498711347579956, 0.0007947385311126709, 0.0008396059274673462, 0.0008844733238220215, 0.0009293407201766968, 0.0009742081165313721, 0.0010190755128860474, 0.0010639429092407227, 0.001108810305595398, 0.0011536777019500732, 0.0011985450983047485, 0.0012434124946594238, 0.0012882798910140991, 0.0013331472873687744, 0.0013780146837234497, 0.001422882080078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 3.0, 7.0, 7.0, 9.0, 10.0, 12.0, 20.0, 14.0, 12.0, 13.0, 16.0, 21.0, 22.0, 20.0, 33.0, 30.0, 33.0, 52.0, 87.0, 259.0, 1271.0, 10789.0, 949243.0, 81908.0, 3709.0, 489.0, 106.0, 52.0, 29.0, 26.0, 32.0, 20.0, 32.0, 19.0, 17.0, 21.0, 14.0, 10.0, 18.0, 12.0, 13.0, 7.0, 5.0, 6.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.07745361328125, -0.07509040832519531, -0.07272720336914062, -0.07036399841308594, -0.06800079345703125, -0.06563758850097656, -0.06327438354492188, -0.06091117858886719, -0.0585479736328125, -0.05618476867675781, -0.053821563720703125, -0.05145835876464844, -0.04909515380859375, -0.04673194885253906, -0.044368743896484375, -0.04200553894042969, -0.039642333984375, -0.03727912902832031, -0.034915924072265625, -0.03255271911621094, -0.03018951416015625, -0.027826309204101562, -0.025463104248046875, -0.023099899291992188, -0.0207366943359375, -0.018373489379882812, -0.016010284423828125, -0.013647079467773438, -0.01128387451171875, -0.008920669555664062, -0.006557464599609375, -0.0041942596435546875, -0.0018310546875, 0.0005321502685546875, 0.002895355224609375, 0.0052585601806640625, 0.00762176513671875, 0.009984970092773438, 0.012348175048828125, 0.014711380004882812, 0.0170745849609375, 0.019437789916992188, 0.021800994873046875, 0.024164199829101562, 0.02652740478515625, 0.028890609741210938, 0.031253814697265625, 0.03361701965332031, 0.035980224609375, 0.03834342956542969, 0.040706634521484375, 0.04306983947753906, 0.04543304443359375, 0.04779624938964844, 0.050159454345703125, 0.05252265930175781, 0.0548858642578125, 0.05724906921386719, 0.059612274169921875, 0.06197547912597656, 0.06433868408203125, 0.06670188903808594, 0.06906509399414062, 0.07142829895019531, 0.07379150390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 2.0, 5.0, 3.0, 5.0, 6.0, 9.0, 12.0, 12.0, 12.0, 13.0, 15.0, 16.0, 18.0, 23.0, 35.0, 27.0, 31.0, 35.0, 32.0, 35.0, 41.0, 38.0, 45.0, 38.0, 41.0, 26.0, 36.0, 39.0, 42.0, 28.0, 39.0, 28.0, 25.0, 27.0, 25.0, 13.0, 20.0, 13.0, 13.0, 13.0, 18.0, 9.0, 7.0, 9.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004245758056640625, -0.0041138529777526855, -0.003981947898864746, -0.0038500428199768066, -0.003718137741088867, -0.0035862326622009277, -0.0034543275833129883, -0.003322422504425049, -0.0031905174255371094, -0.00305861234664917, -0.0029267072677612305, -0.002794802188873291, -0.0026628971099853516, -0.002530992031097412, -0.0023990869522094727, -0.002267181873321533, -0.0021352767944335938, -0.0020033717155456543, -0.0018714666366577148, -0.0017395615577697754, -0.001607656478881836, -0.0014757513999938965, -0.001343846321105957, -0.0012119412422180176, -0.0010800361633300781, -0.0009481310844421387, -0.0008162260055541992, -0.0006843209266662598, -0.0005524158477783203, -0.00042051076889038086, -0.0002886056900024414, -0.00015670061111450195, -2.47955322265625e-05, 0.00010710954666137695, 0.0002390146255493164, 0.00037091970443725586, 0.0005028247833251953, 0.0006347298622131348, 0.0007666349411010742, 0.0008985400199890137, 0.0010304450988769531, 0.0011623501777648926, 0.001294255256652832, 0.0014261603355407715, 0.001558065414428711, 0.0016899704933166504, 0.0018218755722045898, 0.0019537806510925293, 0.0020856857299804688, 0.002217590808868408, 0.0023494958877563477, 0.002481400966644287, 0.0026133060455322266, 0.002745211124420166, 0.0028771162033081055, 0.003009021282196045, 0.0031409263610839844, 0.003272831439971924, 0.0034047365188598633, 0.0035366415977478027, 0.003668546676635742, 0.0038004517555236816, 0.003932356834411621, 0.0040642619132995605, 0.0041961669921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 20.0, 23.0, 58.0, 146.0, 899.0, 967740.0, 78803.0, 610.0, 99.0, 58.0, 31.0, 12.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0650634765625, -0.06364703178405762, -0.062230587005615234, -0.06081414222717285, -0.05939769744873047, -0.057981252670288086, -0.0565648078918457, -0.05514836311340332, -0.05373191833496094, -0.052315473556518555, -0.05089902877807617, -0.04948258399963379, -0.048066139221191406, -0.04664969444274902, -0.04523324966430664, -0.04381680488586426, -0.042400360107421875, -0.04098391532897949, -0.03956747055053711, -0.03815102577209473, -0.036734580993652344, -0.03531813621520996, -0.03390169143676758, -0.032485246658325195, -0.031068801879882812, -0.02965235710144043, -0.028235912322998047, -0.026819467544555664, -0.02540302276611328, -0.0239865779876709, -0.022570133209228516, -0.021153688430786133, -0.01973724365234375, -0.018320798873901367, -0.016904354095458984, -0.015487909317016602, -0.014071464538574219, -0.012655019760131836, -0.011238574981689453, -0.00982213020324707, -0.008405685424804688, -0.006989240646362305, -0.005572795867919922, -0.004156351089477539, -0.0027399063110351562, -0.0013234615325927734, 9.298324584960938e-05, 0.0015094280242919922, 0.002925872802734375, 0.004342317581176758, 0.005758762359619141, 0.0071752071380615234, 0.008591651916503906, 0.010008096694946289, 0.011424541473388672, 0.012840986251831055, 0.014257431030273438, 0.01567387580871582, 0.017090320587158203, 0.018506765365600586, 0.01992321014404297, 0.02133965492248535, 0.022756099700927734, 0.024172544479370117, 0.0255889892578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 11.0, 21.0, 72.0, 415.0, 369.0, 58.0, 18.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002791881561279297, -0.0002709701657295227, -0.0002627521753311157, -0.00025453418493270874, -0.00024631619453430176, -0.00023809820413589478, -0.0002298802137374878, -0.0002216622233390808, -0.00021344423294067383, -0.00020522624254226685, -0.00019700825214385986, -0.00018879026174545288, -0.0001805722713470459, -0.00017235428094863892, -0.00016413629055023193, -0.00015591830015182495, -0.00014770030975341797, -0.00013948231935501099, -0.000131264328956604, -0.00012304633855819702, -0.00011482834815979004, -0.00010661035776138306, -9.839236736297607e-05, -9.017437696456909e-05, -8.195638656616211e-05, -7.373839616775513e-05, -6.552040576934814e-05, -5.730241537094116e-05, -4.908442497253418e-05, -4.08664345741272e-05, -3.2648444175720215e-05, -2.4430453777313232e-05, -1.621246337890625e-05, -7.994472980499268e-06, 2.2351741790771484e-07, 8.441507816314697e-06, 1.665949821472168e-05, 2.4877488613128662e-05, 3.3095479011535645e-05, 4.131346940994263e-05, 4.953145980834961e-05, 5.774945020675659e-05, 6.596744060516357e-05, 7.418543100357056e-05, 8.240342140197754e-05, 9.062141180038452e-05, 9.88394021987915e-05, 0.00010705739259719849, 0.00011527538299560547, 0.00012349337339401245, 0.00013171136379241943, 0.00013992935419082642, 0.0001481473445892334, 0.00015636533498764038, 0.00016458332538604736, 0.00017280131578445435, 0.00018101930618286133, 0.0001892372965812683, 0.0001974552869796753, 0.00020567327737808228, 0.00021389126777648926, 0.00022210925817489624, 0.00023032724857330322, 0.0002385452389717102, 0.0002467632293701172]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 3.0, 13.0, 17.0, 29.0, 61.0, 231.0, 1288.0, 36434.0, 1006640.0, 3276.0, 373.0, 99.0, 37.0, 11.0, 13.0, 10.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048492431640625, -0.04703187942504883, -0.045571327209472656, -0.044110774993896484, -0.04265022277832031, -0.04118967056274414, -0.03972911834716797, -0.0382685661315918, -0.036808013916015625, -0.03534746170043945, -0.03388690948486328, -0.03242635726928711, -0.030965805053710938, -0.029505252838134766, -0.028044700622558594, -0.026584148406982422, -0.02512359619140625, -0.023663043975830078, -0.022202491760253906, -0.020741939544677734, -0.019281387329101562, -0.01782083511352539, -0.01636028289794922, -0.014899730682373047, -0.013439178466796875, -0.011978626251220703, -0.010518074035644531, -0.00905752182006836, -0.0075969696044921875, -0.006136417388916016, -0.004675865173339844, -0.003215312957763672, -0.0017547607421875, -0.0002942085266113281, 0.0011663436889648438, 0.0026268959045410156, 0.0040874481201171875, 0.005548000335693359, 0.007008552551269531, 0.008469104766845703, 0.009929656982421875, 0.011390209197998047, 0.012850761413574219, 0.01431131362915039, 0.015771865844726562, 0.017232418060302734, 0.018692970275878906, 0.020153522491455078, 0.02161407470703125, 0.023074626922607422, 0.024535179138183594, 0.025995731353759766, 0.027456283569335938, 0.02891683578491211, 0.03037738800048828, 0.03183794021606445, 0.033298492431640625, 0.0347590446472168, 0.03621959686279297, 0.03768014907836914, 0.03914070129394531, 0.040601253509521484, 0.042061805725097656, 0.04352235794067383, 0.04498291015625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 15.0, 16.0, 42.0, 81.0, 148.0, 452.0, 93.0, 38.0, 25.0, 14.0, 19.0, 10.0, 10.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00852203369140625, -0.00831061601638794, -0.008099198341369629, -0.007887780666351318, -0.007676362991333008, -0.007464945316314697, -0.007253527641296387, -0.007042109966278076, -0.006830692291259766, -0.006619274616241455, -0.0064078569412231445, -0.006196439266204834, -0.0059850215911865234, -0.005773603916168213, -0.005562186241149902, -0.005350768566131592, -0.005139350891113281, -0.004927933216094971, -0.00471651554107666, -0.00450509786605835, -0.004293680191040039, -0.0040822625160217285, -0.003870844841003418, -0.0036594271659851074, -0.003448009490966797, -0.0032365918159484863, -0.0030251741409301758, -0.0028137564659118652, -0.0026023387908935547, -0.002390921115875244, -0.0021795034408569336, -0.001968085765838623, -0.0017566680908203125, -0.001545250415802002, -0.0013338327407836914, -0.0011224150657653809, -0.0009109973907470703, -0.0006995797157287598, -0.0004881620407104492, -0.00027674436569213867, -6.532669067382812e-05, 0.00014609098434448242, 0.00035750865936279297, 0.0005689263343811035, 0.0007803440093994141, 0.0009917616844177246, 0.0012031793594360352, 0.0014145970344543457, 0.0016260147094726562, 0.0018374323844909668, 0.0020488500595092773, 0.002260267734527588, 0.0024716854095458984, 0.002683103084564209, 0.0028945207595825195, 0.00310593843460083, 0.0033173561096191406, 0.003528773784637451, 0.0037401914596557617, 0.003951609134674072, 0.004163026809692383, 0.004374444484710693, 0.004585862159729004, 0.0047972798347473145, 0.005008697509765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 8.0, 10.0, 11.0, 13.0, 30.0, 86.0, 339.0, 326.0, 88.0, 27.0, 15.0, 13.0, 7.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08528926968574524, -0.08200879395008087, -0.07872831076383591, -0.07544783502817154, -0.07216735929250717, -0.06888687610626221, -0.06560640037059784, -0.06232592463493347, -0.059045445173978806, -0.05576496571302414, -0.05248448997735977, -0.049204010516405106, -0.04592353105545044, -0.04264305531978607, -0.039362575858831406, -0.03608209639787674, -0.03280162066221237, -0.029521143063902855, -0.026240665465593338, -0.022960186004638672, -0.019679708406329155, -0.016399230808019638, -0.013118751347064972, -0.009838273748755455, -0.006557796150445938, -0.003277318086475134, 3.1599774956703186e-06, 0.003283638507127762, 0.006564116105437279, 0.009844593703746796, 0.013125073164701462, 0.01640555076301098, 0.0196860209107399, 0.022966498509049416, 0.026246976107358932, 0.0295274555683136, 0.032807931303977966, 0.03608841076493263, 0.0393688902258873, 0.042649365961551666, 0.04592984542250633, 0.049210324883461, 0.052490800619125366, 0.05577128008008003, 0.0590517595410347, 0.062332235276699066, 0.06561271846294403, 0.0688931941986084, 0.07217366993427277, 0.07545414566993713, 0.0787346288561821, 0.08201510459184647, 0.08529558032751083, 0.0885760635137558, 0.09185653924942017, 0.09513701498508453, 0.0984174907207489, 0.10169796645641327, 0.10497844964265823, 0.1082589253783226, 0.11153940111398697, 0.11481988430023193, 0.1181003600358963, 0.12138083577156067, 0.12466131895780563]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 2.0, 5.0, 3.0, 8.0, 16.0, 21.0, 18.0, 36.0, 27.0, 47.0, 67.0, 66.0, 92.0, 89.0, 90.0, 72.0, 61.0, 70.0, 43.0, 36.0, 29.0, 24.0, 24.0, 11.0, 5.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0361018180847168, -0.03461151570081711, -0.03312121331691742, -0.03163091093301773, -0.030140608549118042, -0.028650306165218353, -0.027160003781318665, -0.025669701397418976, -0.024179399013519287, -0.0226890966296196, -0.02119879424571991, -0.01970849186182022, -0.018218189477920532, -0.016727887094020844, -0.015237584710121155, -0.013747282326221466, -0.012256979942321777, -0.010766677558422089, -0.0092763751745224, -0.007786072790622711, -0.0062957704067230225, -0.004805468022823334, -0.003315165638923645, -0.0018248632550239563, -0.0003345608711242676, 0.0011557415127754211, 0.00264604389667511, 0.004136346280574799, 0.005626648664474487, 0.007116951048374176, 0.008607253432273865, 0.010097555816173553, 0.011587858200073242, 0.013078160583972931, 0.01456846296787262, 0.01605876535177231, 0.017549067735671997, 0.019039370119571686, 0.020529672503471375, 0.022019974887371063, 0.023510277271270752, 0.02500057965517044, 0.02649088203907013, 0.027981184422969818, 0.029471486806869507, 0.030961789190769196, 0.032452091574668884, 0.03394239395856857, 0.03543269634246826, 0.03692299872636795, 0.03841330111026764, 0.03990360349416733, 0.04139390587806702, 0.042884208261966705, 0.044374510645866394, 0.04586481302976608, 0.04735511541366577, 0.04884541779756546, 0.05033572018146515, 0.05182602256536484, 0.053316324949264526, 0.054806627333164215, 0.056296929717063904, 0.05778723210096359, 0.05927753448486328]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 6.0, 8.0, 6.0, 6.0, 8.0, 4.0, 14.0, 7.0, 13.0, 12.0, 10.0, 12.0, 10.0, 34.0, 24.0, 112.0, 1803.0, 4191749.0, 220.0, 38.0, 30.0, 14.0, 8.0, 12.0, 14.0, 16.0, 12.0, 0.0, 4.0, 10.0, 6.0, 2.0, 16.0, 6.0, 2.0, 8.0, 4.0, 0.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.9111328125, -1.8597412109375, -1.808349609375, -1.7569580078125, -1.70556640625, -1.6541748046875, -1.602783203125, -1.5513916015625, -1.5, -1.4486083984375, -1.397216796875, -1.3458251953125, -1.29443359375, -1.2430419921875, -1.191650390625, -1.1402587890625, -1.0888671875, -1.0374755859375, -0.986083984375, -0.9346923828125, -0.88330078125, -0.8319091796875, -0.780517578125, -0.7291259765625, -0.677734375, -0.6263427734375, -0.574951171875, -0.5235595703125, -0.47216796875, -0.4207763671875, -0.369384765625, -0.3179931640625, -0.2666015625, -0.2152099609375, -0.163818359375, -0.1124267578125, -0.06103515625, -0.0096435546875, 0.041748046875, 0.0931396484375, 0.14453125, 0.1959228515625, 0.247314453125, 0.2987060546875, 0.35009765625, 0.4014892578125, 0.452880859375, 0.5042724609375, 0.5556640625, 0.6070556640625, 0.658447265625, 0.7098388671875, 0.76123046875, 0.8126220703125, 0.864013671875, 0.9154052734375, 0.966796875, 1.0181884765625, 1.069580078125, 1.1209716796875, 1.17236328125, 1.2237548828125, 1.275146484375, 1.3265380859375, 1.3779296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 5.0, 2.0, 6.0, 3.0, 5.0, 4.0, 11.0, 4.0, 6.0, 9.0, 14.0, 21.0, 49.0, 118.0, 175.0, 230.0, 147.0, 65.0, 32.0, 14.0, 10.0, 7.0, 8.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012407302856445312, -0.0012008696794509888, -0.0011610090732574463, -0.0011211484670639038, -0.0010812878608703613, -0.0010414272546768188, -0.0010015666484832764, -0.0009617060422897339, -0.0009218454360961914, -0.0008819848299026489, -0.0008421242237091064, -0.000802263617515564, -0.0007624030113220215, -0.000722542405128479, -0.0006826817989349365, -0.000642821192741394, -0.0006029605865478516, -0.0005630999803543091, -0.0005232393741607666, -0.0004833787679672241, -0.00044351816177368164, -0.00040365755558013916, -0.0003637969493865967, -0.0003239363431930542, -0.0002840757369995117, -0.00024421513080596924, -0.00020435452461242676, -0.00016449391841888428, -0.0001246333122253418, -8.477270603179932e-05, -4.4912099838256836e-05, -5.0514936447143555e-06, 3.4809112548828125e-05, 7.46697187423706e-05, 0.00011453032493591309, 0.00015439093112945557, 0.00019425153732299805, 0.00023411214351654053, 0.000273972749710083, 0.0003138333559036255, 0.00035369396209716797, 0.00039355456829071045, 0.00043341517448425293, 0.0004732757806777954, 0.0005131363868713379, 0.0005529969930648804, 0.0005928575992584229, 0.0006327182054519653, 0.0006725788116455078, 0.0007124394178390503, 0.0007523000240325928, 0.0007921606302261353, 0.0008320212364196777, 0.0008718818426132202, 0.0009117424488067627, 0.0009516030550003052, 0.0009914636611938477, 0.0010313242673873901, 0.0010711848735809326, 0.001111045479774475, 0.0011509060859680176, 0.00119076669216156, 0.0012306272983551025, 0.001270487904548645, 0.0013103485107421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 10.0, 19.0, 35.0, 88.0, 199.0, 883.0, 4192156.0, 642.0, 143.0, 46.0, 30.0, 16.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.982421875, -1.94384765625, -1.9052734375, -1.86669921875, -1.828125, -1.78955078125, -1.7509765625, -1.71240234375, -1.673828125, -1.63525390625, -1.5966796875, -1.55810546875, -1.51953125, -1.48095703125, -1.4423828125, -1.40380859375, -1.365234375, -1.32666015625, -1.2880859375, -1.24951171875, -1.2109375, -1.17236328125, -1.1337890625, -1.09521484375, -1.056640625, -1.01806640625, -0.9794921875, -0.94091796875, -0.90234375, -0.86376953125, -0.8251953125, -0.78662109375, -0.748046875, -0.70947265625, -0.6708984375, -0.63232421875, -0.59375, -0.55517578125, -0.5166015625, -0.47802734375, -0.439453125, -0.40087890625, -0.3623046875, -0.32373046875, -0.28515625, -0.24658203125, -0.2080078125, -0.16943359375, -0.130859375, -0.09228515625, -0.0537109375, -0.01513671875, 0.0234375, 0.06201171875, 0.1005859375, 0.13916015625, 0.177734375, 0.21630859375, 0.2548828125, 0.29345703125, 0.33203125, 0.37060546875, 0.4091796875, 0.44775390625, 0.486328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 15.0, 18.0, 38.0, 92.0, 126.0, 297.0, 974.0, 1818.0, 371.0, 166.0, 73.0, 34.0, 23.0, 15.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0030727386474609375, -0.0028822720050811768, -0.002691805362701416, -0.0025013387203216553, -0.0023108720779418945, -0.002120405435562134, -0.001929938793182373, -0.0017394721508026123, -0.0015490055084228516, -0.0013585388660430908, -0.00116807222366333, -0.0009776055812835693, -0.0007871389389038086, -0.0005966722965240479, -0.0004062056541442871, -0.00021573901176452637, -2.5272369384765625e-05, 0.00016519427299499512, 0.00035566091537475586, 0.0005461275577545166, 0.0007365942001342773, 0.0009270608425140381, 0.0011175274848937988, 0.0013079941272735596, 0.0014984607696533203, 0.001688927412033081, 0.0018793940544128418, 0.0020698606967926025, 0.0022603273391723633, 0.002450793981552124, 0.0026412606239318848, 0.0028317272663116455, 0.0030221939086914062, 0.003212660551071167, 0.0034031271934509277, 0.0035935938358306885, 0.0037840604782104492, 0.00397452712059021, 0.004164993762969971, 0.0043554604053497314, 0.004545927047729492, 0.004736393690109253, 0.004926860332489014, 0.005117326974868774, 0.005307793617248535, 0.005498260259628296, 0.005688726902008057, 0.005879193544387817, 0.006069660186767578, 0.006260126829147339, 0.0064505934715271, 0.00664106011390686, 0.006831526756286621, 0.007021993398666382, 0.007212460041046143, 0.007402926683425903, 0.007593393325805664, 0.007783859968185425, 0.007974326610565186, 0.008164793252944946, 0.008355259895324707, 0.008545726537704468, 0.008736193180084229, 0.00892665982246399, 0.00911712646484375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 1007.0, 1.0, 0.0, 2.0], "bins": [-4.851652145385742, -4.771372318267822, -4.691092491149902, -4.610812664031982, -4.5305328369140625, -4.450253009796143, -4.369973182678223, -4.2896928787231445, -4.209413051605225, -4.129133224487305, -4.048853397369385, -3.968573570251465, -3.888293504714966, -3.808013677597046, -3.727733850479126, -3.647454023361206, -3.5671744346618652, -3.4868946075439453, -3.4066147804260254, -3.3263349533081055, -3.2460548877716064, -3.1657750606536865, -3.0854952335357666, -3.0052154064178467, -2.9249353408813477, -2.8446555137634277, -2.764375686645508, -2.684095859527588, -2.603815793991089, -2.523535966873169, -2.443256139755249, -2.362976312637329, -2.2826967239379883, -2.2024168968200684, -2.1221370697021484, -2.0418572425842285, -1.961577296257019, -1.8812973499298096, -1.8010175228118896, -1.7207376956939697, -1.6404577493667603, -1.5601779222488403, -1.4798979759216309, -1.399618148803711, -1.319338321685791, -1.239058494567871, -1.1587785482406616, -1.0784987211227417, -0.9982188940048218, -0.9179390072822571, -0.8376591801643372, -0.7573792934417725, -0.6770994663238525, -0.5968195796012878, -0.5165396928787231, -0.4362598657608032, -0.35597994923591614, -0.27570009231567383, -0.19542022049427032, -0.11514034867286682, -0.03486049175262451, 0.0454193651676178, 0.1256992518901825, 0.20597907900810242, 0.2862589657306671]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 19.0, 56.0, 104.0, 201.0, 248.0, 186.0, 117.0, 43.0, 18.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04269814491271973, -0.03907020390033722, -0.03544226661324501, -0.0318143293261528, -0.028186388313770294, -0.024558449164032936, -0.020930510014295578, -0.01730257086455822, -0.013674631714820862, -0.010046692565083504, -0.006418753415346146, -0.0027908142656087875, 0.0008371248841285706, 0.004465064033865929, 0.008093003183603287, 0.011720942333340645, 0.015348881483078003, 0.01897682063281536, 0.02260475978255272, 0.026232698932290077, 0.029860638082027435, 0.03348857909440994, 0.03711651638150215, 0.04074445366859436, 0.04437239468097687, 0.048000335693359375, 0.051628272980451584, 0.05525621026754379, 0.0588841512799263, 0.06251209229230881, 0.06614002585411072, 0.06976796686649323, 0.07339590787887573, 0.07702384889125824, 0.08065178990364075, 0.08427972346544266, 0.08790766447782516, 0.09153560549020767, 0.09516353905200958, 0.09879148006439209, 0.1024194210767746, 0.1060473620891571, 0.10967530310153961, 0.11330323666334152, 0.11693117767572403, 0.12055911868810654, 0.12418705224990845, 0.12781499326229095, 0.13144293427467346, 0.13507087528705597, 0.13869881629943848, 0.14232675731182098, 0.1459546983242035, 0.1495826244354248, 0.1532105654478073, 0.15683850646018982, 0.16046644747257233, 0.16409438848495483, 0.16772232949733734, 0.17135027050971985, 0.17497819662094116, 0.17860613763332367, 0.18223407864570618, 0.18586201965808868, 0.1894899606704712]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 6.0, 6.0, 16.0, 8.0, 15.0, 18.0, 12.0, 17.0, 17.0, 18.0, 13.0, 21.0, 31.0, 41.0, 37.0, 36.0, 36.0, 37.0, 72.0, 249.0, 219949.0, 826988.0, 413.0, 92.0, 67.0, 33.0, 34.0, 33.0, 16.0, 27.0, 28.0, 29.0, 23.0, 18.0, 10.0, 21.0, 10.0, 10.0, 9.0, 5.0, 7.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.58935546875, -0.5720596313476562, -0.5547637939453125, -0.5374679565429688, -0.520172119140625, -0.5028762817382812, -0.4855804443359375, -0.46828460693359375, -0.45098876953125, -0.43369293212890625, -0.4163970947265625, -0.39910125732421875, -0.381805419921875, -0.36450958251953125, -0.3472137451171875, -0.32991790771484375, -0.3126220703125, -0.29532623291015625, -0.2780303955078125, -0.26073455810546875, -0.243438720703125, -0.22614288330078125, -0.2088470458984375, -0.19155120849609375, -0.17425537109375, -0.15695953369140625, -0.1396636962890625, -0.12236785888671875, -0.105072021484375, -0.08777618408203125, -0.0704803466796875, -0.05318450927734375, -0.035888671875, -0.01859283447265625, -0.0012969970703125, 0.01599884033203125, 0.033294677734375, 0.05059051513671875, 0.0678863525390625, 0.08518218994140625, 0.10247802734375, 0.11977386474609375, 0.1370697021484375, 0.15436553955078125, 0.171661376953125, 0.18895721435546875, 0.2062530517578125, 0.22354888916015625, 0.2408447265625, 0.25814056396484375, 0.2754364013671875, 0.29273223876953125, 0.310028076171875, 0.32732391357421875, 0.3446197509765625, 0.36191558837890625, 0.37921142578125, 0.39650726318359375, 0.4138031005859375, 0.43109893798828125, 0.448394775390625, 0.46569061279296875, 0.4829864501953125, 0.5002822875976562, 0.517578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [27.0, 273.0, 590.0, 121.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004947662353515625, -0.0028790831565856934, -0.0008105039596557617, 0.00125807523727417, 0.0033266544342041016, 0.005395233631134033, 0.007463812828063965, 0.009532392024993896, 0.011600971221923828, 0.01366955041885376, 0.01573812961578369, 0.017806708812713623, 0.019875288009643555, 0.021943867206573486, 0.024012446403503418, 0.02608102560043335, 0.02814960479736328, 0.030218183994293213, 0.032286763191223145, 0.034355342388153076, 0.03642392158508301, 0.03849250078201294, 0.04056107997894287, 0.0426296591758728, 0.044698238372802734, 0.046766817569732666, 0.0488353967666626, 0.05090397596359253, 0.05297255516052246, 0.05504113435745239, 0.057109713554382324, 0.059178292751312256, 0.06124687194824219, 0.06331545114517212, 0.06538403034210205, 0.06745260953903198, 0.06952118873596191, 0.07158976793289185, 0.07365834712982178, 0.07572692632675171, 0.07779550552368164, 0.07986408472061157, 0.0819326639175415, 0.08400124311447144, 0.08606982231140137, 0.0881384015083313, 0.09020698070526123, 0.09227555990219116, 0.0943441390991211, 0.09641271829605103, 0.09848129749298096, 0.10054987668991089, 0.10261845588684082, 0.10468703508377075, 0.10675561428070068, 0.10882419347763062, 0.11089277267456055, 0.11296135187149048, 0.11502993106842041, 0.11709851026535034, 0.11916708946228027, 0.1212356686592102, 0.12330424785614014, 0.12537282705307007, 0.12744140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 4.0, 7.0, 8.0, 16.0, 15.0, 24.0, 31.0, 27.0, 49.0, 64.0, 123.0, 202.0, 503.0, 1448.0, 5697.0, 32482.0, 381129.0, 570476.0, 45758.0, 7334.0, 1860.0, 640.0, 265.0, 122.0, 70.0, 35.0, 32.0, 28.0, 18.0, 14.0, 6.0, 16.0, 12.0, 7.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2357177734375, -0.22837066650390625, -0.2210235595703125, -0.21367645263671875, -0.206329345703125, -0.19898223876953125, -0.1916351318359375, -0.18428802490234375, -0.17694091796875, -0.16959381103515625, -0.1622467041015625, -0.15489959716796875, -0.147552490234375, -0.14020538330078125, -0.1328582763671875, -0.12551116943359375, -0.1181640625, -0.11081695556640625, -0.1034698486328125, -0.09612274169921875, -0.088775634765625, -0.08142852783203125, -0.0740814208984375, -0.06673431396484375, -0.05938720703125, -0.05204010009765625, -0.0446929931640625, -0.03734588623046875, -0.029998779296875, -0.02265167236328125, -0.0153045654296875, -0.00795745849609375, -0.0006103515625, 0.00673675537109375, 0.0140838623046875, 0.02143096923828125, 0.028778076171875, 0.03612518310546875, 0.0434722900390625, 0.05081939697265625, 0.05816650390625, 0.06551361083984375, 0.0728607177734375, 0.08020782470703125, 0.087554931640625, 0.09490203857421875, 0.1022491455078125, 0.10959625244140625, 0.116943359375, 0.12429046630859375, 0.1316375732421875, 0.13898468017578125, 0.146331787109375, 0.15367889404296875, 0.1610260009765625, 0.16837310791015625, 0.17572021484375, 0.18306732177734375, 0.1904144287109375, 0.19776153564453125, 0.205108642578125, 0.21245574951171875, 0.2198028564453125, 0.22714996337890625, 0.2344970703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 7.0, 12.0, 13.0, 15.0, 20.0, 26.0, 27.0, 29.0, 38.0, 45.0, 49.0, 52.0, 50.0, 65.0, 55.0, 73.0, 53.0, 51.0, 54.0, 38.0, 39.0, 33.0, 21.0, 25.0, 24.0, 12.0, 14.0, 11.0, 1.0, 4.0, 13.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.1256103515625, -0.12235069274902344, -0.11909103393554688, -0.11583137512207031, -0.11257171630859375, -0.10931205749511719, -0.10605239868164062, -0.10279273986816406, -0.0995330810546875, -0.09627342224121094, -0.09301376342773438, -0.08975410461425781, -0.08649444580078125, -0.08323478698730469, -0.07997512817382812, -0.07671546936035156, -0.073455810546875, -0.07019615173339844, -0.06693649291992188, -0.06367683410644531, -0.06041717529296875, -0.05715751647949219, -0.053897857666015625, -0.05063819885253906, -0.0473785400390625, -0.04411888122558594, -0.040859222412109375, -0.03759956359863281, -0.03433990478515625, -0.031080245971679688, -0.027820587158203125, -0.024560928344726562, -0.02130126953125, -0.018041610717773438, -0.014781951904296875, -0.011522293090820312, -0.00826263427734375, -0.0050029754638671875, -0.001743316650390625, 0.0015163421630859375, 0.0047760009765625, 0.008035659790039062, 0.011295318603515625, 0.014554977416992188, 0.01781463623046875, 0.021074295043945312, 0.024333953857421875, 0.027593612670898438, 0.030853271484375, 0.03411293029785156, 0.037372589111328125, 0.04063224792480469, 0.04389190673828125, 0.04715156555175781, 0.050411224365234375, 0.05367088317871094, 0.0569305419921875, 0.06019020080566406, 0.06344985961914062, 0.06670951843261719, 0.06996917724609375, 0.07322883605957031, 0.07648849487304688, 0.07974815368652344, 0.0830078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 2.0, 5.0, 7.0, 10.0, 15.0, 26.0, 27.0, 46.0, 85.0, 135.0, 295.0, 574.0, 1525.0, 4876.0, 24841.0, 591626.0, 397082.0, 20427.0, 4345.0, 1428.0, 541.0, 273.0, 124.0, 71.0, 47.0, 34.0, 25.0, 24.0, 11.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22418975830078125, -0.2164459228515625, -0.20870208740234375, -0.200958251953125, -0.19321441650390625, -0.1854705810546875, -0.17772674560546875, -0.16998291015625, -0.16223907470703125, -0.1544952392578125, -0.14675140380859375, -0.139007568359375, -0.13126373291015625, -0.1235198974609375, -0.11577606201171875, -0.1080322265625, -0.10028839111328125, -0.0925445556640625, -0.08480072021484375, -0.077056884765625, -0.06931304931640625, -0.0615692138671875, -0.05382537841796875, -0.04608154296875, -0.03833770751953125, -0.0305938720703125, -0.02285003662109375, -0.015106201171875, -0.00736236572265625, 0.0003814697265625, 0.00812530517578125, 0.015869140625, 0.02361297607421875, 0.0313568115234375, 0.03910064697265625, 0.046844482421875, 0.05458831787109375, 0.0623321533203125, 0.07007598876953125, 0.07781982421875, 0.08556365966796875, 0.0933074951171875, 0.10105133056640625, 0.108795166015625, 0.11653900146484375, 0.1242828369140625, 0.13202667236328125, 0.1397705078125, 0.14751434326171875, 0.1552581787109375, 0.16300201416015625, 0.170745849609375, 0.17848968505859375, 0.1862335205078125, 0.19397735595703125, 0.20172119140625, 0.20946502685546875, 0.2172088623046875, 0.22495269775390625, 0.232696533203125, 0.24044036865234375, 0.2481842041015625, 0.25592803955078125, 0.263671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 6.0, 8.0, 10.0, 13.0, 18.0, 18.0, 37.0, 45.0, 68.0, 105.0, 156.0, 102.0, 112.0, 88.0, 58.0, 31.0, 23.0, 23.0, 19.0, 6.0, 9.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7702579498291016e-05, -1.7132610082626343e-05, -1.656264066696167e-05, -1.5992671251296997e-05, -1.5422701835632324e-05, -1.4852732419967651e-05, -1.4282763004302979e-05, -1.3712793588638306e-05, -1.3142824172973633e-05, -1.257285475730896e-05, -1.2002885341644287e-05, -1.1432915925979614e-05, -1.0862946510314941e-05, -1.0292977094650269e-05, -9.723007678985596e-06, -9.153038263320923e-06, -8.58306884765625e-06, -8.013099431991577e-06, -7.443130016326904e-06, -6.8731606006622314e-06, -6.303191184997559e-06, -5.733221769332886e-06, -5.163252353668213e-06, -4.59328293800354e-06, -4.023313522338867e-06, -3.4533441066741943e-06, -2.8833746910095215e-06, -2.3134052753448486e-06, -1.7434358596801758e-06, -1.173466444015503e-06, -6.034970283508301e-07, -3.3527612686157227e-08, 5.364418029785156e-07, 1.1064112186431885e-06, 1.6763806343078613e-06, 2.246350049972534e-06, 2.816319465637207e-06, 3.38628888130188e-06, 3.956258296966553e-06, 4.526227712631226e-06, 5.0961971282958984e-06, 5.666166543960571e-06, 6.236135959625244e-06, 6.806105375289917e-06, 7.37607479095459e-06, 7.946044206619263e-06, 8.516013622283936e-06, 9.085983037948608e-06, 9.655952453613281e-06, 1.0225921869277954e-05, 1.0795891284942627e-05, 1.13658607006073e-05, 1.1935830116271973e-05, 1.2505799531936646e-05, 1.3075768947601318e-05, 1.3645738363265991e-05, 1.4215707778930664e-05, 1.4785677194595337e-05, 1.535564661026001e-05, 1.5925616025924683e-05, 1.6495585441589355e-05, 1.706555485725403e-05, 1.76355242729187e-05, 1.8205493688583374e-05, 1.8775463104248047e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 13.0, 16.0, 36.0, 54.0, 86.0, 252.0, 995.0, 13498.0, 997796.0, 33814.0, 1510.0, 279.0, 89.0, 45.0, 23.0, 11.0, 13.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68408203125, -0.6676445007324219, -0.6512069702148438, -0.6347694396972656, -0.6183319091796875, -0.6018943786621094, -0.5854568481445312, -0.5690193176269531, -0.552581787109375, -0.5361442565917969, -0.5197067260742188, -0.5032691955566406, -0.4868316650390625, -0.4703941345214844, -0.45395660400390625, -0.4375190734863281, -0.42108154296875, -0.4046440124511719, -0.38820648193359375, -0.3717689514160156, -0.3553314208984375, -0.3388938903808594, -0.32245635986328125, -0.3060188293457031, -0.289581298828125, -0.2731437683105469, -0.25670623779296875, -0.24026870727539062, -0.2238311767578125, -0.20739364624023438, -0.19095611572265625, -0.17451858520507812, -0.1580810546875, -0.14164352416992188, -0.12520599365234375, -0.10876846313476562, -0.0923309326171875, -0.07589340209960938, -0.05945587158203125, -0.043018341064453125, -0.026580810546875, -0.010143280029296875, 0.00629425048828125, 0.022731781005859375, 0.0391693115234375, 0.055606842041015625, 0.07204437255859375, 0.08848190307617188, 0.10491943359375, 0.12135696411132812, 0.13779449462890625, 0.15423202514648438, 0.1706695556640625, 0.18710708618164062, 0.20354461669921875, 0.21998214721679688, 0.236419677734375, 0.2528572082519531, 0.26929473876953125, 0.2857322692871094, 0.3021697998046875, 0.3186073303222656, 0.33504486083984375, 0.3514823913574219, 0.367919921875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 0.0, 5.0, 9.0, 9.0, 10.0, 20.0, 20.0, 28.0, 66.0, 129.0, 285.0, 209.0, 92.0, 45.0, 30.0, 11.0, 9.0, 9.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275390625, -0.268951416015625, -0.26251220703125, -0.256072998046875, -0.2496337890625, -0.243194580078125, -0.23675537109375, -0.230316162109375, -0.223876953125, -0.217437744140625, -0.21099853515625, -0.204559326171875, -0.1981201171875, -0.191680908203125, -0.18524169921875, -0.178802490234375, -0.17236328125, -0.165924072265625, -0.15948486328125, -0.153045654296875, -0.1466064453125, -0.140167236328125, -0.13372802734375, -0.127288818359375, -0.120849609375, -0.114410400390625, -0.10797119140625, -0.101531982421875, -0.0950927734375, -0.088653564453125, -0.08221435546875, -0.075775146484375, -0.0693359375, -0.062896728515625, -0.05645751953125, -0.050018310546875, -0.0435791015625, -0.037139892578125, -0.03070068359375, -0.024261474609375, -0.017822265625, -0.011383056640625, -0.00494384765625, 0.001495361328125, 0.0079345703125, 0.014373779296875, 0.02081298828125, 0.027252197265625, 0.03369140625, 0.040130615234375, 0.04656982421875, 0.053009033203125, 0.0594482421875, 0.065887451171875, 0.07232666015625, 0.078765869140625, 0.085205078125, 0.091644287109375, 0.09808349609375, 0.104522705078125, 0.1109619140625, 0.117401123046875, 0.12384033203125, 0.130279541015625, 0.13671875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 12.0, 186.0, 814.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9015557765960693, -2.4335384368896484, -1.9655213356018066, -1.4975041151046753, -1.029486894607544, -0.5614697933197021, -0.09345245361328125, 0.37456488609313965, 0.8425819873809814, 1.3105992078781128, 1.7786164283752441, 2.246633529663086, 2.714650869369507, 3.1826679706573486, 3.6506853103637695, 4.1187028884887695, 4.586719512939453, 5.054736614227295, 5.522753715515137, 5.990771293640137, 6.4587883949279785, 6.92680549621582, 7.39482307434082, 7.862840175628662, 8.330857276916504, 8.798874855041504, 9.266891479492188, 9.734909057617188, 10.202926635742188, 10.670943260192871, 11.138960838317871, 11.606977462768555, 12.074995040893555, 12.543012619018555, 13.011029243469238, 13.479046821594238, 13.947063446044922, 14.415081024169922, 14.883098602294922, 15.351116180419922, 15.819132804870605, 16.28714942932129, 16.75516700744629, 17.22318458557129, 17.69120216369629, 18.159217834472656, 18.627235412597656, 19.095252990722656, 19.563270568847656, 20.031288146972656, 20.499305725097656, 20.967321395874023, 21.435338973999023, 21.903356552124023, 22.371374130249023, 22.839391708374023, 23.30740737915039, 23.77542495727539, 24.24344253540039, 24.711458206176758, 25.179475784301758, 25.647493362426758, 26.115510940551758, 26.583528518676758, 27.051546096801758]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 3.0, 26.0, 30.0, 49.0, 59.0, 71.0, 102.0, 96.0, 105.0, 101.0, 94.0, 90.0, 71.0, 40.0, 27.0, 19.0, 9.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.814208984375, -0.7695979475975037, -0.7249868512153625, -0.6803758144378662, -0.6357647180557251, -0.5911536812782288, -0.5465426445007324, -0.5019315481185913, -0.45732051134109497, -0.41270944476127625, -0.3680983781814575, -0.3234873414039612, -0.27887627482414246, -0.23426520824432373, -0.1896541714668274, -0.14504310488700867, -0.10043203830718994, -0.05582097917795181, -0.011209920048713684, 0.03340113162994385, 0.07801219820976257, 0.1226232647895813, 0.16723430156707764, 0.21184536814689636, 0.2564564347267151, 0.3010675013065338, 0.34567856788635254, 0.3902896046638489, 0.4349006712436676, 0.47951173782348633, 0.5241227746009827, 0.568733811378479, 0.6133449077606201, 0.6579559445381165, 0.7025670409202576, 0.7471780776977539, 0.791789174079895, 0.8364002108573914, 0.8810112476348877, 0.9256223440170288, 0.9702333807945251, 1.0148444175720215, 1.0594555139541626, 1.1040666103363037, 1.1486775875091553, 1.1932886838912964, 1.2378997802734375, 1.282510757446289, 1.3271218538284302, 1.3717329502105713, 1.4163439273834229, 1.460955023765564, 1.505566120147705, 1.5501770973205566, 1.5947881937026978, 1.6393992900848389, 1.6840102672576904, 1.7286213636398315, 1.773232340812683, 1.8178434371948242, 1.8624545335769653, 1.9070656299591064, 1.951676607131958, 1.9962877035140991, 2.0408987998962402]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 12.0, 50.0, 265.0, 16782.0, 4175799.0, 907.0, 230.0, 102.0, 59.0, 44.0, 20.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.54974365234375, -0.4432373046875, -0.33673095703125, -0.230224609375, -0.12371826171875, -0.0172119140625, 0.08929443359375, 0.19580078125, 0.30230712890625, 0.4088134765625, 0.51531982421875, 0.621826171875, 0.72833251953125, 0.8348388671875, 0.94134521484375, 1.0478515625, 1.15435791015625, 1.2608642578125, 1.36737060546875, 1.473876953125, 1.58038330078125, 1.6868896484375, 1.79339599609375, 1.89990234375, 2.00640869140625, 2.1129150390625, 2.21942138671875, 2.325927734375, 2.43243408203125, 2.5389404296875, 2.64544677734375, 2.751953125, 2.85845947265625, 2.9649658203125, 3.07147216796875, 3.177978515625, 3.28448486328125, 3.3909912109375, 3.49749755859375, 3.60400390625, 3.71051025390625, 3.8170166015625, 3.92352294921875, 4.030029296875, 4.13653564453125, 4.2430419921875, 4.34954833984375, 4.4560546875, 4.56256103515625, 4.6690673828125, 4.77557373046875, 4.882080078125, 4.98858642578125, 5.0950927734375, 5.20159912109375, 5.30810546875, 5.41461181640625, 5.5211181640625, 5.62762451171875, 5.734130859375, 5.84063720703125, 5.9471435546875, 6.05364990234375, 6.16015625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 10.0, 59.0, 141.0, 284.0, 304.0, 157.0, 37.0, 22.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0188446044921875, -0.016173601150512695, -0.01350259780883789, -0.010831594467163086, -0.008160591125488281, -0.0054895877838134766, -0.002818584442138672, -0.0001475811004638672, 0.0025234222412109375, 0.005194425582885742, 0.007865428924560547, 0.010536432266235352, 0.013207435607910156, 0.01587843894958496, 0.018549442291259766, 0.02122044563293457, 0.023891448974609375, 0.02656245231628418, 0.029233455657958984, 0.03190445899963379, 0.034575462341308594, 0.0372464656829834, 0.0399174690246582, 0.04258847236633301, 0.04525947570800781, 0.04793047904968262, 0.05060148239135742, 0.05327248573303223, 0.05594348907470703, 0.058614492416381836, 0.06128549575805664, 0.06395649909973145, 0.06662750244140625, 0.06929850578308105, 0.07196950912475586, 0.07464051246643066, 0.07731151580810547, 0.07998251914978027, 0.08265352249145508, 0.08532452583312988, 0.08799552917480469, 0.09066653251647949, 0.0933375358581543, 0.0960085391998291, 0.0986795425415039, 0.10135054588317871, 0.10402154922485352, 0.10669255256652832, 0.10936355590820312, 0.11203455924987793, 0.11470556259155273, 0.11737656593322754, 0.12004756927490234, 0.12271857261657715, 0.12538957595825195, 0.12806057929992676, 0.13073158264160156, 0.13340258598327637, 0.13607358932495117, 0.13874459266662598, 0.14141559600830078, 0.14408659934997559, 0.1467576026916504, 0.1494286060333252, 0.152099609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 8.0, 23.0, 62.0, 92.0, 120.0, 219.0, 497.0, 96348.0, 4095591.0, 537.0, 247.0, 170.0, 132.0, 76.0, 57.0, 39.0, 33.0, 8.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.326385498046875, -3.18206787109375, -3.037750244140625, -2.8934326171875, -2.749114990234375, -2.60479736328125, -2.460479736328125, -2.316162109375, -2.171844482421875, -2.02752685546875, -1.883209228515625, -1.7388916015625, -1.594573974609375, -1.45025634765625, -1.305938720703125, -1.16162109375, -1.017303466796875, -0.87298583984375, -0.728668212890625, -0.5843505859375, -0.440032958984375, -0.29571533203125, -0.151397705078125, -0.007080078125, 0.137237548828125, 0.28155517578125, 0.425872802734375, 0.5701904296875, 0.714508056640625, 0.85882568359375, 1.003143310546875, 1.1474609375, 1.291778564453125, 1.43609619140625, 1.580413818359375, 1.7247314453125, 1.869049072265625, 2.01336669921875, 2.157684326171875, 2.302001953125, 2.446319580078125, 2.59063720703125, 2.734954833984375, 2.8792724609375, 3.023590087890625, 3.16790771484375, 3.312225341796875, 3.45654296875, 3.600860595703125, 3.74517822265625, 3.889495849609375, 4.0338134765625, 4.178131103515625, 4.32244873046875, 4.466766357421875, 4.611083984375, 4.755401611328125, 4.89971923828125, 5.044036865234375, 5.1883544921875, 5.332672119140625, 5.47698974609375, 5.621307373046875, 5.765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 24.0, 131.0, 3686.0, 226.0, 10.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12420654296875, -0.10988330841064453, -0.09556007385253906, -0.0812368392944336, -0.06691360473632812, -0.052590370178222656, -0.03826713562011719, -0.02394390106201172, -0.00962066650390625, 0.004702568054199219, 0.019025802612304688, 0.033349037170410156, 0.047672271728515625, 0.061995506286621094, 0.07631874084472656, 0.09064197540283203, 0.1049652099609375, 0.11928844451904297, 0.13361167907714844, 0.1479349136352539, 0.16225814819335938, 0.17658138275146484, 0.1909046173095703, 0.20522785186767578, 0.21955108642578125, 0.23387432098388672, 0.2481975555419922, 0.26252079010009766, 0.2768440246582031, 0.2911672592163086, 0.30549049377441406, 0.31981372833251953, 0.334136962890625, 0.34846019744873047, 0.36278343200683594, 0.3771066665649414, 0.3914299011230469, 0.40575313568115234, 0.4200763702392578, 0.4343996047973633, 0.44872283935546875, 0.4630460739135742, 0.4773693084716797, 0.49169254302978516, 0.5060157775878906, 0.5203390121459961, 0.5346622467041016, 0.548985481262207, 0.5633087158203125, 0.577631950378418, 0.5919551849365234, 0.6062784194946289, 0.6206016540527344, 0.6349248886108398, 0.6492481231689453, 0.6635713577270508, 0.6778945922851562, 0.6922178268432617, 0.7065410614013672, 0.7208642959594727, 0.7351875305175781, 0.7495107650756836, 0.7638339996337891, 0.7781572341918945, 0.79248046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 12.0, 55.0, 476.0, 428.0, 32.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884055137634277, -0.9903718829154968, -0.7923382520675659, -0.594304621219635, -0.3962709903717041, -0.1982373595237732, -0.00020372867584228516, 0.1978299617767334, 0.39586353302001953, 0.5938971638679504, 0.7919307947158813, 0.9899644255638123, 1.1879980564117432, 1.3860316276550293, 1.584065318107605, 1.7820990085601807, 1.9801325798034668, 2.178166151046753, 2.376199722290039, 2.5742335319519043, 2.7722671031951904, 2.9703006744384766, 3.168334484100342, 3.366368055343628, 3.564401626586914, 3.7624351978302, 3.9604687690734863, 4.158502578735352, 4.356535911560059, 4.554569721221924, 4.752603530883789, 4.950636863708496, 5.148670196533203, 5.346704006195068, 5.544737339019775, 5.742771148681641, 5.940804481506348, 6.138838291168213, 6.336872100830078, 6.534905433654785, 6.73293924331665, 6.930973052978516, 7.129006385803223, 7.327040195465088, 7.525074005126953, 7.72310733795166, 7.921141147613525, 8.11917495727539, 8.317208290100098, 8.515241622924805, 8.713275909423828, 8.911309242248535, 9.109342575073242, 9.307376861572266, 9.505410194396973, 9.70344352722168, 9.901477813720703, 10.09951114654541, 10.297545433044434, 10.49557876586914, 10.693612098693848, 10.891646385192871, 11.089679718017578, 11.287713050842285, 11.485746383666992]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 14.0, 17.0, 65.0, 80.0, 96.0, 150.0, 169.0, 143.0, 105.0, 74.0, 39.0, 25.0, 13.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.661320686340332, -2.579507827758789, -2.497695207595825, -2.4158823490142822, -2.3340697288513184, -2.2522568702697754, -2.1704442501068115, -2.0886313915252686, -2.0068187713623047, -1.9250060319900513, -1.8431932926177979, -1.7613805532455444, -1.679567813873291, -1.597754955291748, -1.5159422159194946, -1.4341294765472412, -1.3523166179656982, -1.2705038785934448, -1.1886911392211914, -1.106878399848938, -1.0250656604766846, -0.9432528614997864, -0.8614400625228882, -0.7796273231506348, -0.6978145837783813, -0.6160018444061279, -0.5341891050338745, -0.4523763060569763, -0.3705635666847229, -0.2887508273124695, -0.20693805813789368, -0.12512528896331787, -0.04331254959106445, 0.03850020468235016, 0.12031295895576477, 0.20212571322917938, 0.283938467502594, 0.3657512068748474, 0.4475639760494232, 0.529376745223999, 0.6111894845962524, 0.6930022239685059, 0.7748149633407593, 0.8566277623176575, 0.9384405016899109, 1.0202531814575195, 1.1020660400390625, 1.183878779411316, 1.2656915187835693, 1.3475042581558228, 1.4293169975280762, 1.5111297369003296, 1.592942476272583, 1.674755334854126, 1.7565680742263794, 1.8383808135986328, 1.9201935529708862, 2.0020062923431396, 2.0838191509246826, 2.1656317710876465, 2.2474446296691895, 2.3292572498321533, 2.4110701084136963, 2.49288272857666, 2.574695587158203]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 16.0, 26.0, 18.0, 22.0, 41.0, 69.0, 97.0, 235.0, 468.0, 1264.0, 4637.0, 54883.0, 909519.0, 69523.0, 5327.0, 1327.0, 508.0, 231.0, 102.0, 76.0, 38.0, 28.0, 20.0, 19.0, 12.0, 15.0, 7.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.07464599609375, -1.0369873046875, -0.99932861328125, -0.961669921875, -0.92401123046875, -0.8863525390625, -0.84869384765625, -0.81103515625, -0.77337646484375, -0.7357177734375, -0.69805908203125, -0.660400390625, -0.62274169921875, -0.5850830078125, -0.54742431640625, -0.509765625, -0.47210693359375, -0.4344482421875, -0.39678955078125, -0.359130859375, -0.32147216796875, -0.2838134765625, -0.24615478515625, -0.20849609375, -0.17083740234375, -0.1331787109375, -0.09552001953125, -0.057861328125, -0.02020263671875, 0.0174560546875, 0.05511474609375, 0.0927734375, 0.13043212890625, 0.1680908203125, 0.20574951171875, 0.243408203125, 0.28106689453125, 0.3187255859375, 0.35638427734375, 0.39404296875, 0.43170166015625, 0.4693603515625, 0.50701904296875, 0.544677734375, 0.58233642578125, 0.6199951171875, 0.65765380859375, 0.6953125, 0.73297119140625, 0.7706298828125, 0.80828857421875, 0.845947265625, 0.88360595703125, 0.9212646484375, 0.95892333984375, 0.99658203125, 1.03424072265625, 1.0718994140625, 1.10955810546875, 1.147216796875, 1.18487548828125, 1.2225341796875, 1.26019287109375, 1.2978515625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 14.0, 33.0, 49.0, 86.0, 128.0, 190.0, 162.0, 136.0, 94.0, 56.0, 34.0, 14.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.101806640625, -0.09648704528808594, -0.09116744995117188, -0.08584785461425781, -0.08052825927734375, -0.07520866394042969, -0.06988906860351562, -0.06456947326660156, -0.0592498779296875, -0.05393028259277344, -0.048610687255859375, -0.04329109191894531, -0.03797149658203125, -0.03265190124511719, -0.027332305908203125, -0.022012710571289062, -0.016693115234375, -0.011373519897460938, -0.006053924560546875, -0.0007343292236328125, 0.00458526611328125, 0.009904861450195312, 0.015224456787109375, 0.020544052124023438, 0.0258636474609375, 0.031183242797851562, 0.036502838134765625, 0.04182243347167969, 0.04714202880859375, 0.05246162414550781, 0.057781219482421875, 0.06310081481933594, 0.06842041015625, 0.07374000549316406, 0.07905960083007812, 0.08437919616699219, 0.08969879150390625, 0.09501838684082031, 0.10033798217773438, 0.10565757751464844, 0.1109771728515625, 0.11629676818847656, 0.12161636352539062, 0.1269359588623047, 0.13225555419921875, 0.1375751495361328, 0.14289474487304688, 0.14821434020996094, 0.153533935546875, 0.15885353088378906, 0.16417312622070312, 0.1694927215576172, 0.17481231689453125, 0.1801319122314453, 0.18545150756835938, 0.19077110290527344, 0.1960906982421875, 0.20141029357910156, 0.20672988891601562, 0.2120494842529297, 0.21736907958984375, 0.2226886749267578, 0.22800827026367188, 0.23332786560058594, 0.2386474609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 11.0, 9.0, 13.0, 24.0, 20.0, 42.0, 60.0, 80.0, 163.0, 395.0, 1140.0, 4874.0, 36280.0, 717816.0, 265930.0, 17211.0, 2912.0, 836.0, 320.0, 139.0, 83.0, 59.0, 26.0, 22.0, 20.0, 22.0, 7.0, 2.0, 11.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5893630981445312, -0.5673980712890625, -0.5454330444335938, -0.523468017578125, -0.5015029907226562, -0.4795379638671875, -0.45757293701171875, -0.43560791015625, -0.41364288330078125, -0.3916778564453125, -0.36971282958984375, -0.347747802734375, -0.32578277587890625, -0.3038177490234375, -0.28185272216796875, -0.2598876953125, -0.23792266845703125, -0.2159576416015625, -0.19399261474609375, -0.172027587890625, -0.15006256103515625, -0.1280975341796875, -0.10613250732421875, -0.08416748046875, -0.06220245361328125, -0.0402374267578125, -0.01827239990234375, 0.003692626953125, 0.02565765380859375, 0.0476226806640625, 0.06958770751953125, 0.091552734375, 0.11351776123046875, 0.1354827880859375, 0.15744781494140625, 0.179412841796875, 0.20137786865234375, 0.2233428955078125, 0.24530792236328125, 0.26727294921875, 0.28923797607421875, 0.3112030029296875, 0.33316802978515625, 0.355133056640625, 0.37709808349609375, 0.3990631103515625, 0.42102813720703125, 0.4429931640625, 0.46495819091796875, 0.4869232177734375, 0.5088882446289062, 0.530853271484375, 0.5528182983398438, 0.5747833251953125, 0.5967483520507812, 0.61871337890625, 0.6406784057617188, 0.6626434326171875, 0.6846084594726562, 0.706573486328125, 0.7285385131835938, 0.7505035400390625, 0.7724685668945312, 0.79443359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 16.0, 17.0, 14.0, 26.0, 28.0, 26.0, 30.0, 52.0, 47.0, 64.0, 69.0, 52.0, 60.0, 66.0, 66.0, 61.0, 51.0, 47.0, 44.0, 26.0, 27.0, 20.0, 16.0, 10.0, 7.0, 8.0, 6.0, 10.0, 1.0, 5.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.27091217041015625, -0.2613067626953125, -0.25170135498046875, -0.242095947265625, -0.23249053955078125, -0.2228851318359375, -0.21327972412109375, -0.20367431640625, -0.19406890869140625, -0.1844635009765625, -0.17485809326171875, -0.165252685546875, -0.15564727783203125, -0.1460418701171875, -0.13643646240234375, -0.1268310546875, -0.11722564697265625, -0.1076202392578125, -0.09801483154296875, -0.088409423828125, -0.07880401611328125, -0.0691986083984375, -0.05959320068359375, -0.04998779296875, -0.04038238525390625, -0.0307769775390625, -0.02117156982421875, -0.011566162109375, -0.00196075439453125, 0.0076446533203125, 0.01725006103515625, 0.02685546875, 0.03646087646484375, 0.0460662841796875, 0.05567169189453125, 0.065277099609375, 0.07488250732421875, 0.0844879150390625, 0.09409332275390625, 0.10369873046875, 0.11330413818359375, 0.1229095458984375, 0.13251495361328125, 0.142120361328125, 0.15172576904296875, 0.1613311767578125, 0.17093658447265625, 0.1805419921875, 0.19014739990234375, 0.1997528076171875, 0.20935821533203125, 0.218963623046875, 0.22856903076171875, 0.2381744384765625, 0.24777984619140625, 0.25738525390625, 0.26699066162109375, 0.2765960693359375, 0.28620147705078125, 0.295806884765625, 0.30541229248046875, 0.3150177001953125, 0.32462310791015625, 0.334228515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 15.0, 26.0, 55.0, 121.0, 357.0, 1336.0, 11917.0, 968466.0, 62416.0, 2901.0, 593.0, 201.0, 75.0, 35.0, 21.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451416015625, -0.4331474304199219, -0.41487884521484375, -0.3966102600097656, -0.3783416748046875, -0.3600730895996094, -0.34180450439453125, -0.3235359191894531, -0.305267333984375, -0.2869987487792969, -0.26873016357421875, -0.2504615783691406, -0.2321929931640625, -0.21392440795898438, -0.19565582275390625, -0.17738723754882812, -0.15911865234375, -0.14085006713867188, -0.12258148193359375, -0.10431289672851562, -0.0860443115234375, -0.06777572631835938, -0.04950714111328125, -0.031238555908203125, -0.012969970703125, 0.005298614501953125, 0.02356719970703125, 0.041835784912109375, 0.0601043701171875, 0.07837295532226562, 0.09664154052734375, 0.11491012573242188, 0.1331787109375, 0.15144729614257812, 0.16971588134765625, 0.18798446655273438, 0.2062530517578125, 0.22452163696289062, 0.24279022216796875, 0.2610588073730469, 0.279327392578125, 0.2975959777832031, 0.31586456298828125, 0.3341331481933594, 0.3524017333984375, 0.3706703186035156, 0.38893890380859375, 0.4072074890136719, 0.42547607421875, 0.4437446594238281, 0.46201324462890625, 0.4802818298339844, 0.4985504150390625, 0.5168190002441406, 0.5350875854492188, 0.5533561706542969, 0.571624755859375, 0.5898933410644531, 0.6081619262695312, 0.6264305114746094, 0.6446990966796875, 0.6629676818847656, 0.6812362670898438, 0.6995048522949219, 0.7177734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 18.0, 12.0, 24.0, 21.0, 34.0, 53.0, 58.0, 82.0, 88.0, 97.0, 103.0, 87.0, 78.0, 59.0, 47.0, 38.0, 17.0, 19.0, 16.0, 9.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.823902130126953e-05, -1.7666257917881012e-05, -1.7093494534492493e-05, -1.6520731151103973e-05, -1.5947967767715454e-05, -1.5375204384326935e-05, -1.4802441000938416e-05, -1.4229677617549896e-05, -1.3656914234161377e-05, -1.3084150850772858e-05, -1.2511387467384338e-05, -1.1938624083995819e-05, -1.13658607006073e-05, -1.079309731721878e-05, -1.0220333933830261e-05, -9.647570550441742e-06, -9.074807167053223e-06, -8.502043783664703e-06, -7.929280400276184e-06, -7.356517016887665e-06, -6.7837536334991455e-06, -6.210990250110626e-06, -5.638226866722107e-06, -5.065463483333588e-06, -4.492700099945068e-06, -3.919936716556549e-06, -3.3471733331680298e-06, -2.7744099497795105e-06, -2.201646566390991e-06, -1.628883183002472e-06, -1.0561197996139526e-06, -4.833564162254333e-07, 8.940696716308594e-08, 6.621703505516052e-07, 1.2349337339401245e-06, 1.8076971173286438e-06, 2.380460500717163e-06, 2.9532238841056824e-06, 3.5259872674942017e-06, 4.098750650882721e-06, 4.67151403427124e-06, 5.2442774176597595e-06, 5.817040801048279e-06, 6.389804184436798e-06, 6.962567567825317e-06, 7.535330951213837e-06, 8.108094334602356e-06, 8.680857717990875e-06, 9.253621101379395e-06, 9.826384484767914e-06, 1.0399147868156433e-05, 1.0971911251544952e-05, 1.1544674634933472e-05, 1.2117438018321991e-05, 1.269020140171051e-05, 1.326296478509903e-05, 1.3835728168487549e-05, 1.4408491551876068e-05, 1.4981254935264587e-05, 1.5554018318653107e-05, 1.6126781702041626e-05, 1.6699545085430145e-05, 1.7272308468818665e-05, 1.7845071852207184e-05, 1.8417835235595703e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 11.0, 20.0, 13.0, 29.0, 56.0, 104.0, 183.0, 574.0, 2249.0, 35003.0, 977870.0, 29338.0, 2050.0, 544.0, 235.0, 105.0, 59.0, 36.0, 23.0, 12.0, 15.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.3297882080078125, -0.316314697265625, -0.3028411865234375, -0.28936767578125, -0.2758941650390625, -0.262420654296875, -0.2489471435546875, -0.2354736328125, -0.2220001220703125, -0.208526611328125, -0.1950531005859375, -0.18157958984375, -0.1681060791015625, -0.154632568359375, -0.1411590576171875, -0.127685546875, -0.1142120361328125, -0.100738525390625, -0.0872650146484375, -0.07379150390625, -0.0603179931640625, -0.046844482421875, -0.0333709716796875, -0.0198974609375, -0.0064239501953125, 0.007049560546875, 0.0205230712890625, 0.03399658203125, 0.0474700927734375, 0.060943603515625, 0.0744171142578125, 0.087890625, 0.1013641357421875, 0.114837646484375, 0.1283111572265625, 0.14178466796875, 0.1552581787109375, 0.168731689453125, 0.1822052001953125, 0.1956787109375, 0.2091522216796875, 0.222625732421875, 0.2360992431640625, 0.24957275390625, 0.2630462646484375, 0.276519775390625, 0.2899932861328125, 0.303466796875, 0.3169403076171875, 0.330413818359375, 0.3438873291015625, 0.35736083984375, 0.3708343505859375, 0.384307861328125, 0.3977813720703125, 0.4112548828125, 0.4247283935546875, 0.438201904296875, 0.4516754150390625, 0.46514892578125, 0.4786224365234375, 0.492095947265625, 0.5055694580078125, 0.51904296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 5.0, 12.0, 20.0, 16.0, 32.0, 60.0, 96.0, 155.0, 183.0, 140.0, 90.0, 57.0, 35.0, 31.0, 12.0, 12.0, 16.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10589599609375, -0.10045719146728516, -0.09501838684082031, -0.08957958221435547, -0.08414077758789062, -0.07870197296142578, -0.07326316833496094, -0.0678243637084961, -0.06238555908203125, -0.056946754455566406, -0.05150794982910156, -0.04606914520263672, -0.040630340576171875, -0.03519153594970703, -0.029752731323242188, -0.024313926696777344, -0.0188751220703125, -0.013436317443847656, -0.007997512817382812, -0.0025587081909179688, 0.002880096435546875, 0.008318901062011719, 0.013757705688476562, 0.019196510314941406, 0.02463531494140625, 0.030074119567871094, 0.03551292419433594, 0.04095172882080078, 0.046390533447265625, 0.05182933807373047, 0.05726814270019531, 0.06270694732666016, 0.068145751953125, 0.07358455657958984, 0.07902336120605469, 0.08446216583251953, 0.08990097045898438, 0.09533977508544922, 0.10077857971191406, 0.1062173843383789, 0.11165618896484375, 0.1170949935913086, 0.12253379821777344, 0.12797260284423828, 0.13341140747070312, 0.13885021209716797, 0.1442890167236328, 0.14972782135009766, 0.1551666259765625, 0.16060543060302734, 0.1660442352294922, 0.17148303985595703, 0.17692184448242188, 0.18236064910888672, 0.18779945373535156, 0.1932382583618164, 0.19867706298828125, 0.2041158676147461, 0.20955467224121094, 0.21499347686767578, 0.22043228149414062, 0.22587108612060547, 0.2313098907470703, 0.23674869537353516, 0.2421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 54.0, 904.0, 54.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.636589050292969, -8.08128833770752, -7.525986671447754, -6.970685958862305, -6.415384292602539, -5.86008358001709, -5.304782390594482, -4.749481201171875, -4.194180011749268, -3.63887882232666, -3.0835776329040527, -2.5282766819000244, -1.972975492477417, -1.4176743030548096, -0.8623733520507812, -0.30707216262817383, 0.2482290267944336, 0.8035301566123962, 1.3588312864303589, 1.9141323566436768, 2.469433546066284, 3.0247347354888916, 3.58003568649292, 4.135336875915527, 4.690638065338135, 5.245939254760742, 5.80124044418335, 6.356541633605957, 6.911842346191406, 7.467144012451172, 8.022444725036621, 8.57774543762207, 9.133047103881836, 9.688347816467285, 10.24364948272705, 10.7989501953125, 11.354251861572266, 11.909552574157715, 12.464853286743164, 13.02015495300293, 13.575456619262695, 14.130757331848145, 14.68605899810791, 15.24135971069336, 15.796661376953125, 16.35196304321289, 16.907262802124023, 17.46256446838379, 18.017864227294922, 18.573165893554688, 19.12846565246582, 19.683767318725586, 20.23906898498535, 20.794370651245117, 21.34967041015625, 21.904972076416016, 22.46027374267578, 23.015575408935547, 23.57087516784668, 24.126176834106445, 24.68147850036621, 25.236780166625977, 25.79207992553711, 26.347381591796875, 26.90268325805664]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 11.0, 8.0, 17.0, 23.0, 28.0, 42.0, 41.0, 41.0, 61.0, 64.0, 62.0, 69.0, 61.0, 62.0, 57.0, 59.0, 49.0, 57.0, 47.0, 35.0, 21.0, 19.0, 19.0, 6.0, 8.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1347343921661377, -2.068380117416382, -2.002025604248047, -1.9356712102890015, -1.869316816329956, -1.8029624223709106, -1.7366080284118652, -1.6702537536621094, -1.6038992404937744, -1.537544846534729, -1.4711904525756836, -1.4048360586166382, -1.3384816646575928, -1.2721272706985474, -1.205772876739502, -1.139418601989746, -1.0730642080307007, -1.0067098140716553, -0.9403554201126099, -0.8740010261535645, -0.807646632194519, -0.7412922382354736, -0.674937903881073, -0.6085835099220276, -0.5422291159629822, -0.47587472200393677, -0.40952032804489136, -0.34316596388816833, -0.2768115699291229, -0.21045717597007751, -0.1441028118133545, -0.07774841785430908, -0.011394023895263672, 0.05496036261320114, 0.12131474912166595, 0.18766912817955017, 0.2540235221385956, 0.320377916097641, 0.386732280254364, 0.4530866742134094, 0.5194410681724548, 0.5857954621315002, 0.6521498560905457, 0.7185041904449463, 0.7848585844039917, 0.8512129783630371, 0.9175673723220825, 0.9839217662811279, 1.0502761602401733, 1.1166305541992188, 1.1829849481582642, 1.2493393421173096, 1.315693736076355, 1.3820481300354004, 1.4484024047851562, 1.5147569179534912, 1.581111192703247, 1.6474655866622925, 1.713819980621338, 1.7801743745803833, 1.8465287685394287, 1.9128831624984741, 1.9792375564575195, 2.0455918312072754, 2.1119463443756104]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 3.0, 4.0, 11.0, 14.0, 35.0, 107.0, 196.0, 504.0, 1500.0, 5215.0, 22996.0, 585576.0, 3537854.0, 30744.0, 6015.0, 1758.0, 721.0, 362.0, 205.0, 127.0, 67.0, 58.0, 40.0, 36.0, 21.0, 15.0, 13.0, 13.0, 9.0, 8.0, 8.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44482421875, -0.41082000732421875, -0.3768157958984375, -0.34281158447265625, -0.308807373046875, -0.27480316162109375, -0.2407989501953125, -0.20679473876953125, -0.17279052734375, -0.13878631591796875, -0.1047821044921875, -0.07077789306640625, -0.036773681640625, -0.00276947021484375, 0.0312347412109375, 0.06523895263671875, 0.0992431640625, 0.13324737548828125, 0.1672515869140625, 0.20125579833984375, 0.235260009765625, 0.26926422119140625, 0.3032684326171875, 0.33727264404296875, 0.37127685546875, 0.40528106689453125, 0.4392852783203125, 0.47328948974609375, 0.507293701171875, 0.5412979125976562, 0.5753021240234375, 0.6093063354492188, 0.643310546875, 0.6773147583007812, 0.7113189697265625, 0.7453231811523438, 0.779327392578125, 0.8133316040039062, 0.8473358154296875, 0.8813400268554688, 0.91534423828125, 0.9493484497070312, 0.9833526611328125, 1.0173568725585938, 1.051361083984375, 1.0853652954101562, 1.1193695068359375, 1.1533737182617188, 1.1873779296875, 1.2213821411132812, 1.2553863525390625, 1.2893905639648438, 1.323394775390625, 1.3573989868164062, 1.3914031982421875, 1.4254074096679688, 1.45941162109375, 1.4934158325195312, 1.5274200439453125, 1.5614242553710938, 1.595428466796875, 1.6294326782226562, 1.6634368896484375, 1.6974411010742188, 1.7314453125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 14.0, 21.0, 29.0, 49.0, 61.0, 116.0, 129.0, 154.0, 123.0, 104.0, 77.0, 60.0, 31.0, 14.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06976318359375, -0.0649557113647461, -0.06014823913574219, -0.05534076690673828, -0.050533294677734375, -0.04572582244873047, -0.04091835021972656, -0.036110877990722656, -0.03130340576171875, -0.026495933532714844, -0.021688461303710938, -0.01688098907470703, -0.012073516845703125, -0.007266044616699219, -0.0024585723876953125, 0.0023488998413085938, 0.0071563720703125, 0.011963844299316406, 0.016771316528320312, 0.02157878875732422, 0.026386260986328125, 0.03119373321533203, 0.03600120544433594, 0.040808677673339844, 0.04561614990234375, 0.050423622131347656, 0.05523109436035156, 0.06003856658935547, 0.06484603881835938, 0.06965351104736328, 0.07446098327636719, 0.0792684555053711, 0.084075927734375, 0.0888833999633789, 0.09369087219238281, 0.09849834442138672, 0.10330581665039062, 0.10811328887939453, 0.11292076110839844, 0.11772823333740234, 0.12253570556640625, 0.12734317779541016, 0.13215065002441406, 0.13695812225341797, 0.14176559448242188, 0.14657306671142578, 0.1513805389404297, 0.1561880111694336, 0.1609954833984375, 0.1658029556274414, 0.1706104278564453, 0.17541790008544922, 0.18022537231445312, 0.18503284454345703, 0.18984031677246094, 0.19464778900146484, 0.19945526123046875, 0.20426273345947266, 0.20907020568847656, 0.21387767791748047, 0.21868515014648438, 0.22349262237548828, 0.2283000946044922, 0.2331075668334961, 0.2379150390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 12.0, 19.0, 46.0, 113.0, 586.0, 4132447.0, 59990.0, 702.0, 224.0, 73.0, 41.0, 24.0, 12.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.837158203125, -3.59619140625, -3.355224609375, -3.1142578125, -2.873291015625, -2.63232421875, -2.391357421875, -2.150390625, -1.909423828125, -1.66845703125, -1.427490234375, -1.1865234375, -0.945556640625, -0.70458984375, -0.463623046875, -0.22265625, 0.018310546875, 0.25927734375, 0.500244140625, 0.7412109375, 0.982177734375, 1.22314453125, 1.464111328125, 1.705078125, 1.946044921875, 2.18701171875, 2.427978515625, 2.6689453125, 2.909912109375, 3.15087890625, 3.391845703125, 3.6328125, 3.873779296875, 4.11474609375, 4.355712890625, 4.5966796875, 4.837646484375, 5.07861328125, 5.319580078125, 5.560546875, 5.801513671875, 6.04248046875, 6.283447265625, 6.5244140625, 6.765380859375, 7.00634765625, 7.247314453125, 7.48828125, 7.729248046875, 7.97021484375, 8.211181640625, 8.4521484375, 8.693115234375, 8.93408203125, 9.175048828125, 9.416015625, 9.656982421875, 9.89794921875, 10.138916015625, 10.3798828125, 10.620849609375, 10.86181640625, 11.102783203125, 11.34375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 10.0, 28.0, 117.0, 3439.0, 402.0, 54.0, 17.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1568603515625, -0.13651084899902344, -0.11616134643554688, -0.09581184387207031, -0.07546234130859375, -0.05511283874511719, -0.034763336181640625, -0.014413833618164062, 0.0059356689453125, 0.026285171508789062, 0.046634674072265625, 0.06698417663574219, 0.08733367919921875, 0.10768318176269531, 0.12803268432617188, 0.14838218688964844, 0.168731689453125, 0.18908119201660156, 0.20943069458007812, 0.2297801971435547, 0.25012969970703125, 0.2704792022705078, 0.2908287048339844, 0.31117820739746094, 0.3315277099609375, 0.35187721252441406, 0.3722267150878906, 0.3925762176513672, 0.41292572021484375, 0.4332752227783203, 0.4536247253417969, 0.47397422790527344, 0.49432373046875, 0.5146732330322266, 0.5350227355957031, 0.5553722381591797, 0.5757217407226562, 0.5960712432861328, 0.6164207458496094, 0.6367702484130859, 0.6571197509765625, 0.6774692535400391, 0.6978187561035156, 0.7181682586669922, 0.7385177612304688, 0.7588672637939453, 0.7792167663574219, 0.7995662689208984, 0.819915771484375, 0.8402652740478516, 0.8606147766113281, 0.8809642791748047, 0.9013137817382812, 0.9216632843017578, 0.9420127868652344, 0.9623622894287109, 0.9827117919921875, 1.003061294555664, 1.0234107971191406, 1.0437602996826172, 1.0641098022460938, 1.0844593048095703, 1.1048088073730469, 1.1251583099365234, 1.1455078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 9.0, 19.0, 206.0, 676.0, 69.0, 15.0, 6.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.629086971282959, -5.429607391357422, -5.230128288269043, -5.030648708343506, -4.831169128417969, -4.63169002532959, -4.432210445404053, -4.232730865478516, -4.033251762390137, -3.8337724208831787, -3.6342928409576416, -3.4348134994506836, -3.2353339195251465, -3.0358545780181885, -2.8363752365112305, -2.6368956565856934, -2.4374160766601562, -2.2379367351531982, -2.038457155227661, -1.8389778137207031, -1.6394983530044556, -1.440018892288208, -1.24053955078125, -1.0410600900650024, -0.8415806293487549, -0.6421011686325073, -0.44262176752090454, -0.24314236640930176, -0.0436629056930542, 0.15581655502319336, 0.35529589653015137, 0.5547753572463989, 0.7542543411254883, 0.9537338018417358, 1.1532132625579834, 1.3526926040649414, 1.552172064781189, 1.7516515254974365, 1.9511308670043945, 2.1506104469299316, 2.3500897884368896, 2.5495691299438477, 2.7490487098693848, 2.9485280513763428, 3.148007392883301, 3.347486972808838, 3.546966314315796, 3.746445655822754, 3.945925235748291, 4.145404815673828, 4.344883918762207, 4.544363498687744, 4.743843078613281, 4.94332218170166, 5.142801761627197, 5.342281341552734, 5.541760444641113, 5.74124002456665, 5.940719127655029, 6.140198707580566, 6.3396782875061035, 6.539157867431641, 6.7386369705200195, 6.938116550445557, 7.137596130371094]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 14.0, 26.0, 33.0, 57.0, 72.0, 79.0, 84.0, 97.0, 101.0, 122.0, 78.0, 62.0, 49.0, 48.0, 37.0, 10.0, 13.0, 6.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9486967325210571, -1.88349449634552, -1.818292260169983, -1.7530900239944458, -1.6878877878189087, -1.6226855516433716, -1.557483434677124, -1.492281198501587, -1.4270789623260498, -1.3618767261505127, -1.2966744899749756, -1.2314722537994385, -1.1662700176239014, -1.1010677814483643, -1.0358655452728271, -0.9706633687019348, -0.9054610729217529, -0.8402588367462158, -0.7750566005706787, -0.7098543643951416, -0.6446521282196045, -0.5794498920440674, -0.514247715473175, -0.44904547929763794, -0.38384324312210083, -0.3186410069465637, -0.2534387707710266, -0.1882365643978119, -0.12303432822227478, -0.05783209204673767, 0.007370114326477051, 0.07257235050201416, 0.13777470588684082, 0.20297694206237793, 0.26817917823791504, 0.33338138461112976, 0.39858362078666687, 0.463785856962204, 0.5289880633354187, 0.5941902995109558, 0.6593925356864929, 0.72459477186203, 0.7897970080375671, 0.8549991846084595, 0.9202014207839966, 0.9854036569595337, 1.0506058931350708, 1.115808129310608, 1.181010365486145, 1.2462126016616821, 1.3114148378372192, 1.3766170740127563, 1.4418193101882935, 1.5070215463638306, 1.5722236633300781, 1.6374258995056152, 1.7026281356811523, 1.7678303718566895, 1.8330326080322266, 1.8982348442077637, 1.9634370803833008, 2.028639316558838, 2.093841552734375, 2.159043788909912, 2.224246025085449]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 5.0, 10.0, 19.0, 21.0, 22.0, 27.0, 42.0, 50.0, 73.0, 102.0, 134.0, 194.0, 347.0, 654.0, 1207.0, 2839.0, 8151.0, 32208.0, 192188.0, 667237.0, 110906.0, 21350.0, 5985.0, 2221.0, 995.0, 519.0, 307.0, 222.0, 144.0, 103.0, 68.0, 59.0, 31.0, 27.0, 11.0, 13.0, 9.0, 5.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.697265625, -0.6743011474609375, -0.651336669921875, -0.6283721923828125, -0.60540771484375, -0.5824432373046875, -0.559478759765625, -0.5365142822265625, -0.5135498046875, -0.4905853271484375, -0.467620849609375, -0.4446563720703125, -0.42169189453125, -0.3987274169921875, -0.375762939453125, -0.3527984619140625, -0.329833984375, -0.3068695068359375, -0.283905029296875, -0.2609405517578125, -0.23797607421875, -0.2150115966796875, -0.192047119140625, -0.1690826416015625, -0.1461181640625, -0.1231536865234375, -0.100189208984375, -0.0772247314453125, -0.05426025390625, -0.0312957763671875, -0.008331298828125, 0.0146331787109375, 0.03759765625, 0.0605621337890625, 0.083526611328125, 0.1064910888671875, 0.12945556640625, 0.1524200439453125, 0.175384521484375, 0.1983489990234375, 0.2213134765625, 0.2442779541015625, 0.267242431640625, 0.2902069091796875, 0.31317138671875, 0.3361358642578125, 0.359100341796875, 0.3820648193359375, 0.405029296875, 0.4279937744140625, 0.450958251953125, 0.4739227294921875, 0.49688720703125, 0.5198516845703125, 0.542816162109375, 0.5657806396484375, 0.5887451171875, 0.6117095947265625, 0.634674072265625, 0.6576385498046875, 0.68060302734375, 0.7035675048828125, 0.726531982421875, 0.7494964599609375, 0.7724609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 12.0, 18.0, 31.0, 31.0, 66.0, 64.0, 87.0, 91.0, 101.0, 106.0, 94.0, 72.0, 68.0, 44.0, 44.0, 34.0, 13.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11504077911376953, -0.10929298400878906, -0.1035451889038086, -0.09779739379882812, -0.09204959869384766, -0.08630180358886719, -0.08055400848388672, -0.07480621337890625, -0.06905841827392578, -0.06331062316894531, -0.057562828063964844, -0.051815032958984375, -0.046067237854003906, -0.04031944274902344, -0.03457164764404297, -0.0288238525390625, -0.02307605743408203, -0.017328262329101562, -0.011580467224121094, -0.005832672119140625, -8.487701416015625e-05, 0.0056629180908203125, 0.011410713195800781, 0.01715850830078125, 0.02290630340576172, 0.028654098510742188, 0.034401893615722656, 0.040149688720703125, 0.045897483825683594, 0.05164527893066406, 0.05739307403564453, 0.063140869140625, 0.06888866424560547, 0.07463645935058594, 0.0803842544555664, 0.08613204956054688, 0.09187984466552734, 0.09762763977050781, 0.10337543487548828, 0.10912322998046875, 0.11487102508544922, 0.12061882019042969, 0.12636661529541016, 0.13211441040039062, 0.1378622055053711, 0.14361000061035156, 0.14935779571533203, 0.1551055908203125, 0.16085338592529297, 0.16660118103027344, 0.1723489761352539, 0.17809677124023438, 0.18384456634521484, 0.1895923614501953, 0.19534015655517578, 0.20108795166015625, 0.20683574676513672, 0.2125835418701172, 0.21833133697509766, 0.22407913208007812, 0.2298269271850586, 0.23557472229003906, 0.24132251739501953, 0.2470703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 6.0, 7.0, 15.0, 15.0, 23.0, 35.0, 47.0, 77.0, 119.0, 246.0, 491.0, 1025.0, 2864.0, 9099.0, 40351.0, 322658.0, 584789.0, 66704.0, 13451.0, 3846.0, 1360.0, 594.0, 286.0, 143.0, 95.0, 66.0, 36.0, 29.0, 12.0, 16.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.66015625, -0.639617919921875, -0.61907958984375, -0.598541259765625, -0.5780029296875, -0.557464599609375, -0.53692626953125, -0.516387939453125, -0.495849609375, -0.475311279296875, -0.45477294921875, -0.434234619140625, -0.4136962890625, -0.393157958984375, -0.37261962890625, -0.352081298828125, -0.33154296875, -0.311004638671875, -0.29046630859375, -0.269927978515625, -0.2493896484375, -0.228851318359375, -0.20831298828125, -0.187774658203125, -0.167236328125, -0.146697998046875, -0.12615966796875, -0.105621337890625, -0.0850830078125, -0.064544677734375, -0.04400634765625, -0.023468017578125, -0.0029296875, 0.017608642578125, 0.03814697265625, 0.058685302734375, 0.0792236328125, 0.099761962890625, 0.12030029296875, 0.140838623046875, 0.161376953125, 0.181915283203125, 0.20245361328125, 0.222991943359375, 0.2435302734375, 0.264068603515625, 0.28460693359375, 0.305145263671875, 0.32568359375, 0.346221923828125, 0.36676025390625, 0.387298583984375, 0.4078369140625, 0.428375244140625, 0.44891357421875, 0.469451904296875, 0.489990234375, 0.510528564453125, 0.53106689453125, 0.551605224609375, 0.5721435546875, 0.592681884765625, 0.61322021484375, 0.633758544921875, 0.654296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 4.0, 10.0, 21.0, 11.0, 21.0, 24.0, 35.0, 43.0, 41.0, 53.0, 52.0, 62.0, 64.0, 62.0, 46.0, 71.0, 45.0, 54.0, 41.0, 53.0, 33.0, 26.0, 30.0, 16.0, 12.0, 10.0, 10.0, 10.0, 4.0, 9.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49951171875, -0.48384857177734375, -0.4681854248046875, -0.45252227783203125, -0.436859130859375, -0.42119598388671875, -0.4055328369140625, -0.38986968994140625, -0.37420654296875, -0.35854339599609375, -0.3428802490234375, -0.32721710205078125, -0.311553955078125, -0.29589080810546875, -0.2802276611328125, -0.26456451416015625, -0.2489013671875, -0.23323822021484375, -0.2175750732421875, -0.20191192626953125, -0.186248779296875, -0.17058563232421875, -0.1549224853515625, -0.13925933837890625, -0.12359619140625, -0.10793304443359375, -0.0922698974609375, -0.07660675048828125, -0.060943603515625, -0.04528045654296875, -0.0296173095703125, -0.01395416259765625, 0.001708984375, 0.01737213134765625, 0.0330352783203125, 0.04869842529296875, 0.064361572265625, 0.08002471923828125, 0.0956878662109375, 0.11135101318359375, 0.12701416015625, 0.14267730712890625, 0.1583404541015625, 0.17400360107421875, 0.189666748046875, 0.20532989501953125, 0.2209930419921875, 0.23665618896484375, 0.2523193359375, 0.26798248291015625, 0.2836456298828125, 0.29930877685546875, 0.314971923828125, 0.33063507080078125, 0.3462982177734375, 0.36196136474609375, 0.37762451171875, 0.39328765869140625, 0.4089508056640625, 0.42461395263671875, 0.440277099609375, 0.45594024658203125, 0.4716033935546875, 0.48726654052734375, 0.5029296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 11.0, 12.0, 16.0, 28.0, 38.0, 47.0, 90.0, 169.0, 420.0, 1284.0, 5783.0, 92392.0, 909461.0, 33629.0, 3640.0, 890.0, 298.0, 117.0, 81.0, 40.0, 30.0, 25.0, 19.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337646484375, -0.3265266418457031, -0.31540679931640625, -0.3042869567871094, -0.2931671142578125, -0.2820472717285156, -0.27092742919921875, -0.2598075866699219, -0.248687744140625, -0.23756790161132812, -0.22644805908203125, -0.21532821655273438, -0.2042083740234375, -0.19308853149414062, -0.18196868896484375, -0.17084884643554688, -0.15972900390625, -0.14860916137695312, -0.13748931884765625, -0.12636947631835938, -0.1152496337890625, -0.10412979125976562, -0.09300994873046875, -0.08189010620117188, -0.070770263671875, -0.059650421142578125, -0.04853057861328125, -0.037410736083984375, -0.0262908935546875, -0.015171051025390625, -0.00405120849609375, 0.007068634033203125, 0.0181884765625, 0.029308319091796875, 0.04042816162109375, 0.051548004150390625, 0.0626678466796875, 0.07378768920898438, 0.08490753173828125, 0.09602737426757812, 0.107147216796875, 0.11826705932617188, 0.12938690185546875, 0.14050674438476562, 0.1516265869140625, 0.16274642944335938, 0.17386627197265625, 0.18498611450195312, 0.19610595703125, 0.20722579956054688, 0.21834564208984375, 0.22946548461914062, 0.2405853271484375, 0.2517051696777344, 0.26282501220703125, 0.2739448547363281, 0.285064697265625, 0.2961845397949219, 0.30730438232421875, 0.3184242248535156, 0.3295440673828125, 0.3406639099121094, 0.35178375244140625, 0.3629035949707031, 0.3740234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 11.0, 11.0, 9.0, 16.0, 17.0, 23.0, 29.0, 32.0, 42.0, 43.0, 63.0, 68.0, 65.0, 66.0, 77.0, 76.0, 61.0, 51.0, 35.0, 37.0, 39.0, 23.0, 18.0, 27.0, 8.0, 8.0, 7.0, 5.0, 3.0, 5.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4781951904296875e-05, -1.433398574590683e-05, -1.3886019587516785e-05, -1.343805342912674e-05, -1.2990087270736694e-05, -1.254212111234665e-05, -1.2094154953956604e-05, -1.1646188795566559e-05, -1.1198222637176514e-05, -1.0750256478786469e-05, -1.0302290320396423e-05, -9.854324162006378e-06, -9.406358003616333e-06, -8.958391845226288e-06, -8.510425686836243e-06, -8.062459528446198e-06, -7.614493370056152e-06, -7.166527211666107e-06, -6.718561053276062e-06, -6.270594894886017e-06, -5.822628736495972e-06, -5.3746625781059265e-06, -4.926696419715881e-06, -4.478730261325836e-06, -4.030764102935791e-06, -3.582797944545746e-06, -3.1348317861557007e-06, -2.6868656277656555e-06, -2.2388994693756104e-06, -1.7909333109855652e-06, -1.34296715259552e-06, -8.950009942054749e-07, -4.470348358154297e-07, 9.313225746154785e-10, 4.4889748096466064e-07, 8.968636393547058e-07, 1.344829797744751e-06, 1.7927959561347961e-06, 2.2407621145248413e-06, 2.6887282729148865e-06, 3.1366944313049316e-06, 3.584660589694977e-06, 4.032626748085022e-06, 4.480592906475067e-06, 4.928559064865112e-06, 5.3765252232551575e-06, 5.824491381645203e-06, 6.272457540035248e-06, 6.720423698425293e-06, 7.168389856815338e-06, 7.616356015205383e-06, 8.064322173595428e-06, 8.512288331985474e-06, 8.960254490375519e-06, 9.408220648765564e-06, 9.856186807155609e-06, 1.0304152965545654e-05, 1.07521191239357e-05, 1.1200085282325745e-05, 1.164805144071579e-05, 1.2096017599105835e-05, 1.254398375749588e-05, 1.2991949915885925e-05, 1.343991607427597e-05, 1.3887882232666016e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 11.0, 8.0, 21.0, 28.0, 29.0, 80.0, 104.0, 192.0, 474.0, 1109.0, 3620.0, 17935.0, 297673.0, 682779.0, 36124.0, 5563.0, 1597.0, 590.0, 252.0, 134.0, 77.0, 43.0, 33.0, 20.0, 6.0, 4.0, 7.0, 5.0, 2.0, 7.0, 5.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.228759765625, -0.2214183807373047, -0.21407699584960938, -0.20673561096191406, -0.19939422607421875, -0.19205284118652344, -0.18471145629882812, -0.1773700714111328, -0.1700286865234375, -0.1626873016357422, -0.15534591674804688, -0.14800453186035156, -0.14066314697265625, -0.13332176208496094, -0.12598037719726562, -0.11863899230957031, -0.111297607421875, -0.10395622253417969, -0.09661483764648438, -0.08927345275878906, -0.08193206787109375, -0.07459068298339844, -0.06724929809570312, -0.05990791320800781, -0.0525665283203125, -0.04522514343261719, -0.037883758544921875, -0.030542373657226562, -0.02320098876953125, -0.015859603881835938, -0.008518218994140625, -0.0011768341064453125, 0.00616455078125, 0.013505935668945312, 0.020847320556640625, 0.028188705444335938, 0.03553009033203125, 0.04287147521972656, 0.050212860107421875, 0.05755424499511719, 0.0648956298828125, 0.07223701477050781, 0.07957839965820312, 0.08691978454589844, 0.09426116943359375, 0.10160255432128906, 0.10894393920898438, 0.11628532409667969, 0.123626708984375, 0.1309680938720703, 0.13830947875976562, 0.14565086364746094, 0.15299224853515625, 0.16033363342285156, 0.16767501831054688, 0.1750164031982422, 0.1823577880859375, 0.1896991729736328, 0.19704055786132812, 0.20438194274902344, 0.21172332763671875, 0.21906471252441406, 0.22640609741210938, 0.2337474822998047, 0.2410888671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 13.0, 10.0, 23.0, 18.0, 34.0, 56.0, 79.0, 96.0, 121.0, 148.0, 121.0, 80.0, 55.0, 38.0, 27.0, 25.0, 13.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.162841796875, -0.1579151153564453, -0.15298843383789062, -0.14806175231933594, -0.14313507080078125, -0.13820838928222656, -0.13328170776367188, -0.1283550262451172, -0.1234283447265625, -0.11850166320800781, -0.11357498168945312, -0.10864830017089844, -0.10372161865234375, -0.09879493713378906, -0.09386825561523438, -0.08894157409667969, -0.084014892578125, -0.07908821105957031, -0.07416152954101562, -0.06923484802246094, -0.06430816650390625, -0.05938148498535156, -0.054454803466796875, -0.04952812194824219, -0.0446014404296875, -0.03967475891113281, -0.034748077392578125, -0.029821395874023438, -0.02489471435546875, -0.019968032836914062, -0.015041351318359375, -0.010114669799804688, -0.00518798828125, -0.0002613067626953125, 0.004665374755859375, 0.009592056274414062, 0.01451873779296875, 0.019445419311523438, 0.024372100830078125, 0.029298782348632812, 0.0342254638671875, 0.03915214538574219, 0.044078826904296875, 0.04900550842285156, 0.05393218994140625, 0.05885887145996094, 0.06378555297851562, 0.06871223449707031, 0.073638916015625, 0.07856559753417969, 0.08349227905273438, 0.08841896057128906, 0.09334564208984375, 0.09827232360839844, 0.10319900512695312, 0.10812568664550781, 0.1130523681640625, 0.11797904968261719, 0.12290573120117188, 0.12783241271972656, 0.13275909423828125, 0.13768577575683594, 0.14261245727539062, 0.1475391387939453, 0.1524658203125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 9.0, 14.0, 25.0, 58.0, 101.0, 244.0, 301.0, 134.0, 55.0, 30.0, 12.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.129291534423828, -1.997900366783142, -1.8665093183517456, -1.7351181507110596, -1.603727102279663, -1.472335934638977, -1.340944766998291, -1.2095537185668945, -1.0781625509262085, -0.9467714428901672, -0.815380334854126, -0.6839891672134399, -0.5525980591773987, -0.4212069511413574, -0.2898157835006714, -0.15842467546463013, -0.027033567428588867, 0.10435755550861359, 0.23574867844581604, 0.3671398162841797, 0.49853092432022095, 0.6299220323562622, 0.7613131999969482, 0.8927043080329895, 1.0240954160690308, 1.1554865837097168, 1.2868776321411133, 1.4182687997817993, 1.5496599674224854, 1.6810510158538818, 1.8124421834945679, 1.943833351135254, 2.0752243995666504, 2.206615447998047, 2.3380067348480225, 2.469397783279419, 2.6007888317108154, 2.732180118560791, 2.8635711669921875, 2.994962215423584, 3.1263532638549805, 3.257744312286377, 3.3891355991363525, 3.520526647567749, 3.6519176959991455, 3.783308982849121, 3.9147000312805176, 4.046091079711914, 4.177482604980469, 4.308873653411865, 4.440264701843262, 4.571656227111816, 4.703047275543213, 4.834438323974609, 4.965829372406006, 5.097220420837402, 5.228611469268799, 5.360002517700195, 5.491393566131592, 5.622784614562988, 5.754176139831543, 5.8855671882629395, 6.016958236694336, 6.148349285125732, 6.279740333557129]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 5.0, 7.0, 16.0, 22.0, 19.0, 26.0, 31.0, 24.0, 30.0, 45.0, 39.0, 49.0, 37.0, 65.0, 61.0, 48.0, 69.0, 59.0, 35.0, 40.0, 40.0, 33.0, 30.0, 29.0, 25.0, 18.0, 10.0, 11.0, 8.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2502613067626953, -2.168671131134033, -2.087080955505371, -2.005490779876709, -1.9239004850387573, -1.8423101902008057, -1.7607200145721436, -1.6791298389434814, -1.5975396633148193, -1.5159494876861572, -1.4343591928482056, -1.3527690172195435, -1.2711788415908813, -1.1895885467529297, -1.1079983711242676, -1.0264081954956055, -0.9448179006576538, -0.8632276654243469, -0.7816374897956848, -0.7000472545623779, -0.6184570789337158, -0.5368668437004089, -0.45527660846710205, -0.37368643283843994, -0.29209619760513306, -0.21050599217414856, -0.12891577184200287, -0.04732555150985718, 0.03426465392112732, 0.11585485935211182, 0.1974450945854187, 0.2790352702140808, 0.3606255054473877, 0.4422157108783722, 0.5238059163093567, 0.6053961515426636, 0.6869863271713257, 0.7685765624046326, 0.8501667976379395, 0.9317569732666016, 1.0133471488952637, 1.0949373245239258, 1.1765276193618774, 1.2581177949905396, 1.3397079706192017, 1.4212982654571533, 1.5028884410858154, 1.5844786167144775, 1.6660689115524292, 1.7476590871810913, 1.829249382019043, 1.910839557647705, 1.9924297332763672, 2.0740199089050293, 2.1556100845336914, 2.2372002601623535, 2.3187906742095947, 2.400380849838257, 2.481971025466919, 2.56356143951416, 2.6451516151428223, 2.7267417907714844, 2.8083319664001465, 2.8899221420288086, 2.9715123176574707]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 6.0, 9.0, 8.0, 5.0, 23.0, 9.0, 34.0, 66.0, 130.0, 204.0, 436.0, 827.0, 1890.0, 5315.0, 21035.0, 215583.0, 3864410.0, 66281.0, 11279.0, 3431.0, 1450.0, 684.0, 390.0, 215.0, 157.0, 115.0, 60.0, 59.0, 42.0, 31.0, 27.0, 14.0, 7.0, 8.0, 8.0, 9.0, 1.0, 9.0, 4.0, 0.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.61083984375, -0.5846328735351562, -0.5584259033203125, -0.5322189331054688, -0.506011962890625, -0.47980499267578125, -0.4535980224609375, -0.42739105224609375, -0.40118408203125, -0.37497711181640625, -0.3487701416015625, -0.32256317138671875, -0.296356201171875, -0.27014923095703125, -0.2439422607421875, -0.21773529052734375, -0.1915283203125, -0.16532135009765625, -0.1391143798828125, -0.11290740966796875, -0.086700439453125, -0.06049346923828125, -0.0342864990234375, -0.00807952880859375, 0.01812744140625, 0.04433441162109375, 0.0705413818359375, 0.09674835205078125, 0.122955322265625, 0.14916229248046875, 0.1753692626953125, 0.20157623291015625, 0.227783203125, 0.25399017333984375, 0.2801971435546875, 0.30640411376953125, 0.332611083984375, 0.35881805419921875, 0.3850250244140625, 0.41123199462890625, 0.43743896484375, 0.46364593505859375, 0.4898529052734375, 0.5160598754882812, 0.542266845703125, 0.5684738159179688, 0.5946807861328125, 0.6208877563476562, 0.6470947265625, 0.6733016967773438, 0.6995086669921875, 0.7257156372070312, 0.751922607421875, 0.7781295776367188, 0.8043365478515625, 0.8305435180664062, 0.85675048828125, 0.8829574584960938, 0.9091644287109375, 0.9353713989257812, 0.961578369140625, 0.9877853393554688, 1.0139923095703125, 1.0401992797851562, 1.06640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 13.0, 12.0, 34.0, 29.0, 49.0, 63.0, 59.0, 91.0, 96.0, 86.0, 99.0, 87.0, 69.0, 65.0, 44.0, 37.0, 26.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12211418151855469, -0.11617660522460938, -0.11023902893066406, -0.10430145263671875, -0.09836387634277344, -0.09242630004882812, -0.08648872375488281, -0.0805511474609375, -0.07461357116699219, -0.06867599487304688, -0.06273841857910156, -0.05680084228515625, -0.05086326599121094, -0.044925689697265625, -0.03898811340332031, -0.033050537109375, -0.027112960815429688, -0.021175384521484375, -0.015237808227539062, -0.00930023193359375, -0.0033626556396484375, 0.002574920654296875, 0.008512496948242188, 0.0144500732421875, 0.020387649536132812, 0.026325225830078125, 0.03226280212402344, 0.03820037841796875, 0.04413795471191406, 0.050075531005859375, 0.05601310729980469, 0.06195068359375, 0.06788825988769531, 0.07382583618164062, 0.07976341247558594, 0.08570098876953125, 0.09163856506347656, 0.09757614135742188, 0.10351371765136719, 0.1094512939453125, 0.11538887023925781, 0.12132644653320312, 0.12726402282714844, 0.13320159912109375, 0.13913917541503906, 0.14507675170898438, 0.1510143280029297, 0.156951904296875, 0.1628894805908203, 0.16882705688476562, 0.17476463317871094, 0.18070220947265625, 0.18663978576660156, 0.19257736206054688, 0.1985149383544922, 0.2044525146484375, 0.2103900909423828, 0.21632766723632812, 0.22226524353027344, 0.22820281982421875, 0.23414039611816406, 0.24007797241210938, 0.2460155487060547, 0.251953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 3.0, 6.0, 5.0, 9.0, 15.0, 18.0, 20.0, 21.0, 20.0, 47.0, 56.0, 76.0, 96.0, 183.0, 355.0, 1676.0, 3465489.0, 723890.0, 1417.0, 319.0, 174.0, 107.0, 76.0, 52.0, 44.0, 22.0, 21.0, 8.0, 9.0, 12.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.244140625, -3.156402587890625, -3.06866455078125, -2.980926513671875, -2.8931884765625, -2.805450439453125, -2.71771240234375, -2.629974365234375, -2.542236328125, -2.454498291015625, -2.36676025390625, -2.279022216796875, -2.1912841796875, -2.103546142578125, -2.01580810546875, -1.928070068359375, -1.84033203125, -1.752593994140625, -1.66485595703125, -1.577117919921875, -1.4893798828125, -1.401641845703125, -1.31390380859375, -1.226165771484375, -1.138427734375, -1.050689697265625, -0.96295166015625, -0.875213623046875, -0.7874755859375, -0.699737548828125, -0.61199951171875, -0.524261474609375, -0.4365234375, -0.348785400390625, -0.26104736328125, -0.173309326171875, -0.0855712890625, 0.002166748046875, 0.08990478515625, 0.177642822265625, 0.265380859375, 0.353118896484375, 0.44085693359375, 0.528594970703125, 0.6163330078125, 0.704071044921875, 0.79180908203125, 0.879547119140625, 0.96728515625, 1.055023193359375, 1.14276123046875, 1.230499267578125, 1.3182373046875, 1.405975341796875, 1.49371337890625, 1.581451416015625, 1.669189453125, 1.756927490234375, 1.84466552734375, 1.932403564453125, 2.0201416015625, 2.107879638671875, 2.19561767578125, 2.283355712890625, 2.37109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 16.0, 44.0, 151.0, 3057.0, 671.0, 92.0, 31.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64306640625, -0.6273002624511719, -0.6115341186523438, -0.5957679748535156, -0.5800018310546875, -0.5642356872558594, -0.5484695434570312, -0.5327033996582031, -0.516937255859375, -0.5011711120605469, -0.48540496826171875, -0.4696388244628906, -0.4538726806640625, -0.4381065368652344, -0.42234039306640625, -0.4065742492675781, -0.39080810546875, -0.3750419616699219, -0.35927581787109375, -0.3435096740722656, -0.3277435302734375, -0.3119773864746094, -0.29621124267578125, -0.2804450988769531, -0.264678955078125, -0.24891281127929688, -0.23314666748046875, -0.21738052368164062, -0.2016143798828125, -0.18584823608398438, -0.17008209228515625, -0.15431594848632812, -0.1385498046875, -0.12278366088867188, -0.10701751708984375, -0.09125137329101562, -0.0754852294921875, -0.059719085693359375, -0.04395294189453125, -0.028186798095703125, -0.012420654296875, 0.003345489501953125, 0.01911163330078125, 0.034877777099609375, 0.0506439208984375, 0.06641006469726562, 0.08217620849609375, 0.09794235229492188, 0.11370849609375, 0.12947463989257812, 0.14524078369140625, 0.16100692749023438, 0.1767730712890625, 0.19253921508789062, 0.20830535888671875, 0.22407150268554688, 0.239837646484375, 0.2556037902832031, 0.27136993408203125, 0.2871360778808594, 0.3029022216796875, 0.3186683654785156, 0.33443450927734375, 0.3502006530761719, 0.365966796875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 51.0, 877.0, 69.0, 5.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.579231262207031, -9.342940330505371, -9.106649398803711, -8.870357513427734, -8.634066581726074, -8.397775650024414, -8.161483764648438, -7.925192832946777, -7.688901901245117, -7.452610969543457, -7.216319561004639, -6.98002815246582, -6.74373722076416, -6.5074462890625, -6.271154880523682, -6.034863471984863, -5.798572540283203, -5.562281608581543, -5.325990200042725, -5.089698791503906, -4.853407859802246, -4.617116928100586, -4.380825519561768, -4.144534111022949, -3.908243179321289, -3.67195200920105, -3.4356608390808105, -3.1993696689605713, -2.963078498840332, -2.7267873287200928, -2.4904961585998535, -2.2542049884796143, -2.017913818359375, -1.7816226482391357, -1.5453314781188965, -1.3090403079986572, -1.072749137878418, -0.8364579677581787, -0.6001667976379395, -0.3638756275177002, -0.12758445739746094, 0.10870671272277832, 0.3449978828430176, 0.5812890529632568, 0.8175802230834961, 1.0538713932037354, 1.2901625633239746, 1.5264537334442139, 1.7627449035644531, 1.9990360736846924, 2.2353272438049316, 2.471618413925171, 2.70790958404541, 2.9442007541656494, 3.1804919242858887, 3.416783094406128, 3.653074264526367, 3.8893654346466064, 4.125656604766846, 4.361948013305664, 4.598238945007324, 4.834529876708984, 5.070821285247803, 5.307112693786621, 5.543403625488281]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 11.0, 16.0, 22.0, 31.0, 42.0, 67.0, 77.0, 72.0, 80.0, 80.0, 87.0, 79.0, 77.0, 69.0, 54.0, 36.0, 38.0, 27.0, 16.0, 9.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7951920628547668, -0.7656492590904236, -0.7361063957214355, -0.7065635919570923, -0.677020788192749, -0.6474779844284058, -0.6179351806640625, -0.5883923172950745, -0.5588495135307312, -0.5293067097663879, -0.4997638761997223, -0.47022104263305664, -0.4406782388687134, -0.4111354351043701, -0.38159260153770447, -0.3520497679710388, -0.32250696420669556, -0.2929641604423523, -0.26342132687568665, -0.2338785082101822, -0.20433568954467773, -0.17479287087917328, -0.14525005221366882, -0.11570723354816437, -0.08616441488265991, -0.05662159621715546, -0.027078777551651, 0.0024640411138534546, 0.03200685977935791, 0.061549678444862366, 0.09109249711036682, 0.12063531577587128, 0.1501781940460205, 0.17972101271152496, 0.20926383137702942, 0.23880665004253387, 0.26834946870803833, 0.2978922724723816, 0.32743510603904724, 0.3569779396057129, 0.38652074337005615, 0.4160635471343994, 0.44560638070106506, 0.4751492142677307, 0.504692018032074, 0.5342348217964172, 0.5637776851654053, 0.5933204889297485, 0.6228632926940918, 0.6524060964584351, 0.6819489002227783, 0.7114917635917664, 0.7410345673561096, 0.7705773711204529, 0.8001202344894409, 0.8296630382537842, 0.8592058420181274, 0.8887486457824707, 0.918291449546814, 0.947834312915802, 0.9773771166801453, 1.0069199800491333, 1.0364627838134766, 1.0660055875778198, 1.095548391342163]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 16.0, 15.0, 18.0, 37.0, 36.0, 42.0, 65.0, 89.0, 149.0, 238.0, 390.0, 655.0, 1145.0, 2503.0, 7058.0, 23284.0, 100318.0, 575891.0, 268951.0, 46848.0, 12754.0, 4262.0, 1685.0, 801.0, 487.0, 279.0, 173.0, 102.0, 92.0, 39.0, 35.0, 28.0, 20.0, 12.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.472900390625, -0.4545402526855469, -0.43618011474609375, -0.4178199768066406, -0.3994598388671875, -0.3810997009277344, -0.36273956298828125, -0.3443794250488281, -0.326019287109375, -0.3076591491699219, -0.28929901123046875, -0.2709388732910156, -0.2525787353515625, -0.23421859741210938, -0.21585845947265625, -0.19749832153320312, -0.17913818359375, -0.16077804565429688, -0.14241790771484375, -0.12405776977539062, -0.1056976318359375, -0.08733749389648438, -0.06897735595703125, -0.050617218017578125, -0.032257080078125, -0.013896942138671875, 0.00446319580078125, 0.022823333740234375, 0.0411834716796875, 0.059543609619140625, 0.07790374755859375, 0.09626388549804688, 0.1146240234375, 0.13298416137695312, 0.15134429931640625, 0.16970443725585938, 0.1880645751953125, 0.20642471313476562, 0.22478485107421875, 0.24314498901367188, 0.261505126953125, 0.2798652648925781, 0.29822540283203125, 0.3165855407714844, 0.3349456787109375, 0.3533058166503906, 0.37166595458984375, 0.3900260925292969, 0.40838623046875, 0.4267463684082031, 0.44510650634765625, 0.4634666442871094, 0.4818267822265625, 0.5001869201660156, 0.5185470581054688, 0.5369071960449219, 0.555267333984375, 0.5736274719238281, 0.5919876098632812, 0.6103477478027344, 0.6287078857421875, 0.6470680236816406, 0.6654281616210938, 0.6837882995605469, 0.7021484375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 8.0, 6.0, 13.0, 27.0, 22.0, 25.0, 50.0, 57.0, 54.0, 60.0, 82.0, 85.0, 92.0, 80.0, 65.0, 55.0, 55.0, 45.0, 28.0, 32.0, 25.0, 5.0, 16.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10821533203125, -0.10307979583740234, -0.09794425964355469, -0.09280872344970703, -0.08767318725585938, -0.08253765106201172, -0.07740211486816406, -0.0722665786743164, -0.06713104248046875, -0.061995506286621094, -0.05685997009277344, -0.05172443389892578, -0.046588897705078125, -0.04145336151123047, -0.03631782531738281, -0.031182289123535156, -0.0260467529296875, -0.020911216735839844, -0.015775680541992188, -0.010640144348144531, -0.005504608154296875, -0.00036907196044921875, 0.0047664642333984375, 0.009902000427246094, 0.01503753662109375, 0.020173072814941406, 0.025308609008789062, 0.03044414520263672, 0.035579681396484375, 0.04071521759033203, 0.04585075378417969, 0.050986289978027344, 0.056121826171875, 0.061257362365722656, 0.06639289855957031, 0.07152843475341797, 0.07666397094726562, 0.08179950714111328, 0.08693504333496094, 0.0920705795288086, 0.09720611572265625, 0.1023416519165039, 0.10747718811035156, 0.11261272430419922, 0.11774826049804688, 0.12288379669189453, 0.1280193328857422, 0.13315486907958984, 0.1382904052734375, 0.14342594146728516, 0.1485614776611328, 0.15369701385498047, 0.15883255004882812, 0.16396808624267578, 0.16910362243652344, 0.1742391586303711, 0.17937469482421875, 0.1845102310180664, 0.18964576721191406, 0.19478130340576172, 0.19991683959960938, 0.20505237579345703, 0.2101879119873047, 0.21532344818115234, 0.220458984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 6.0, 14.0, 17.0, 22.0, 29.0, 56.0, 80.0, 107.0, 237.0, 431.0, 982.0, 2425.0, 7258.0, 28649.0, 207456.0, 686674.0, 89642.0, 16478.0, 4666.0, 1689.0, 760.0, 352.0, 188.0, 109.0, 64.0, 35.0, 29.0, 25.0, 14.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67333984375, -0.6495590209960938, -0.6257781982421875, -0.6019973754882812, -0.578216552734375, -0.5544357299804688, -0.5306549072265625, -0.5068740844726562, -0.48309326171875, -0.45931243896484375, -0.4355316162109375, -0.41175079345703125, -0.387969970703125, -0.36418914794921875, -0.3404083251953125, -0.31662750244140625, -0.2928466796875, -0.26906585693359375, -0.2452850341796875, -0.22150421142578125, -0.197723388671875, -0.17394256591796875, -0.1501617431640625, -0.12638092041015625, -0.10260009765625, -0.07881927490234375, -0.0550384521484375, -0.03125762939453125, -0.007476806640625, 0.01630401611328125, 0.0400848388671875, 0.06386566162109375, 0.087646484375, 0.11142730712890625, 0.1352081298828125, 0.15898895263671875, 0.182769775390625, 0.20655059814453125, 0.2303314208984375, 0.25411224365234375, 0.27789306640625, 0.30167388916015625, 0.3254547119140625, 0.34923553466796875, 0.373016357421875, 0.39679718017578125, 0.4205780029296875, 0.44435882568359375, 0.4681396484375, 0.49192047119140625, 0.5157012939453125, 0.5394821166992188, 0.563262939453125, 0.5870437622070312, 0.6108245849609375, 0.6346054077148438, 0.65838623046875, 0.6821670532226562, 0.7059478759765625, 0.7297286987304688, 0.753509521484375, 0.7772903442382812, 0.8010711669921875, 0.8248519897460938, 0.8486328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 9.0, 8.0, 15.0, 14.0, 19.0, 31.0, 30.0, 43.0, 49.0, 49.0, 55.0, 59.0, 78.0, 76.0, 60.0, 75.0, 51.0, 55.0, 43.0, 31.0, 22.0, 27.0, 16.0, 17.0, 9.0, 9.0, 4.0, 10.0, 6.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57421875, -0.5531234741210938, -0.5320281982421875, -0.5109329223632812, -0.489837646484375, -0.46874237060546875, -0.4476470947265625, -0.42655181884765625, -0.40545654296875, -0.38436126708984375, -0.3632659912109375, -0.34217071533203125, -0.321075439453125, -0.29998016357421875, -0.2788848876953125, -0.25778961181640625, -0.2366943359375, -0.21559906005859375, -0.1945037841796875, -0.17340850830078125, -0.152313232421875, -0.13121795654296875, -0.1101226806640625, -0.08902740478515625, -0.06793212890625, -0.04683685302734375, -0.0257415771484375, -0.00464630126953125, 0.016448974609375, 0.03754425048828125, 0.0586395263671875, 0.07973480224609375, 0.100830078125, 0.12192535400390625, 0.1430206298828125, 0.16411590576171875, 0.185211181640625, 0.20630645751953125, 0.2274017333984375, 0.24849700927734375, 0.26959228515625, 0.29068756103515625, 0.3117828369140625, 0.33287811279296875, 0.353973388671875, 0.37506866455078125, 0.3961639404296875, 0.41725921630859375, 0.4383544921875, 0.45944976806640625, 0.4805450439453125, 0.5016403198242188, 0.522735595703125, 0.5438308715820312, 0.5649261474609375, 0.5860214233398438, 0.60711669921875, 0.6282119750976562, 0.6493072509765625, 0.6704025268554688, 0.691497802734375, 0.7125930786132812, 0.7336883544921875, 0.7547836303710938, 0.77587890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 11.0, 9.0, 23.0, 33.0, 60.0, 104.0, 154.0, 311.0, 792.0, 2363.0, 12536.0, 424421.0, 588699.0, 14799.0, 2571.0, 818.0, 383.0, 168.0, 109.0, 60.0, 39.0, 21.0, 17.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.398193359375, -0.3853645324707031, -0.37253570556640625, -0.3597068786621094, -0.3468780517578125, -0.3340492248535156, -0.32122039794921875, -0.3083915710449219, -0.295562744140625, -0.2827339172363281, -0.26990509033203125, -0.2570762634277344, -0.2442474365234375, -0.23141860961914062, -0.21858978271484375, -0.20576095581054688, -0.19293212890625, -0.18010330200195312, -0.16727447509765625, -0.15444564819335938, -0.1416168212890625, -0.12878799438476562, -0.11595916748046875, -0.10313034057617188, -0.090301513671875, -0.07747268676757812, -0.06464385986328125, -0.051815032958984375, -0.0389862060546875, -0.026157379150390625, -0.01332855224609375, -0.000499725341796875, 0.0123291015625, 0.025157928466796875, 0.03798675537109375, 0.050815582275390625, 0.0636444091796875, 0.07647323608398438, 0.08930206298828125, 0.10213088989257812, 0.114959716796875, 0.12778854370117188, 0.14061737060546875, 0.15344619750976562, 0.1662750244140625, 0.17910385131835938, 0.19193267822265625, 0.20476150512695312, 0.21759033203125, 0.23041915893554688, 0.24324798583984375, 0.2560768127441406, 0.2689056396484375, 0.2817344665527344, 0.29456329345703125, 0.3073921203613281, 0.320220947265625, 0.3330497741699219, 0.34587860107421875, 0.3587074279785156, 0.3715362548828125, 0.3843650817871094, 0.39719390869140625, 0.4100227355957031, 0.4228515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 14.0, 15.0, 30.0, 44.0, 73.0, 121.0, 157.0, 150.0, 111.0, 92.0, 72.0, 43.0, 24.0, 14.0, 9.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.89354133605957e-05, -4.780478775501251e-05, -4.667416214942932e-05, -4.554353654384613e-05, -4.441291093826294e-05, -4.328228533267975e-05, -4.215165972709656e-05, -4.102103412151337e-05, -3.9890408515930176e-05, -3.8759782910346985e-05, -3.7629157304763794e-05, -3.64985316991806e-05, -3.536790609359741e-05, -3.423728048801422e-05, -3.310665488243103e-05, -3.197602927684784e-05, -3.084540367126465e-05, -2.9714778065681458e-05, -2.8584152460098267e-05, -2.7453526854515076e-05, -2.6322901248931885e-05, -2.5192275643348694e-05, -2.4061650037765503e-05, -2.2931024432182312e-05, -2.180039882659912e-05, -2.066977322101593e-05, -1.953914761543274e-05, -1.840852200984955e-05, -1.7277896404266357e-05, -1.6147270798683167e-05, -1.5016645193099976e-05, -1.3886019587516785e-05, -1.2755393981933594e-05, -1.1624768376350403e-05, -1.0494142770767212e-05, -9.363517165184021e-06, -8.23289155960083e-06, -7.102265954017639e-06, -5.971640348434448e-06, -4.841014742851257e-06, -3.7103891372680664e-06, -2.5797635316848755e-06, -1.4491379261016846e-06, -3.1851232051849365e-07, 8.121132850646973e-07, 1.942738890647888e-06, 3.073364496231079e-06, 4.20399010181427e-06, 5.334615707397461e-06, 6.465241312980652e-06, 7.595866918563843e-06, 8.726492524147034e-06, 9.857118129730225e-06, 1.0987743735313416e-05, 1.2118369340896606e-05, 1.3248994946479797e-05, 1.4379620552062988e-05, 1.551024615764618e-05, 1.664087176322937e-05, 1.777149736881256e-05, 1.8902122974395752e-05, 2.0032748579978943e-05, 2.1163374185562134e-05, 2.2293999791145325e-05, 2.3424625396728516e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 15.0, 20.0, 18.0, 42.0, 73.0, 129.0, 311.0, 815.0, 3148.0, 28623.0, 914507.0, 93365.0, 5518.0, 1178.0, 412.0, 179.0, 77.0, 42.0, 24.0, 16.0, 15.0, 5.0, 7.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.484130859375, -0.471923828125, -0.459716796875, -0.447509765625, -0.435302734375, -0.423095703125, -0.410888671875, -0.398681640625, -0.386474609375, -0.374267578125, -0.362060546875, -0.349853515625, -0.337646484375, -0.325439453125, -0.313232421875, -0.301025390625, -0.288818359375, -0.276611328125, -0.264404296875, -0.252197265625, -0.239990234375, -0.227783203125, -0.215576171875, -0.203369140625, -0.191162109375, -0.178955078125, -0.166748046875, -0.154541015625, -0.142333984375, -0.130126953125, -0.117919921875, -0.105712890625, -0.093505859375, -0.081298828125, -0.069091796875, -0.056884765625, -0.044677734375, -0.032470703125, -0.020263671875, -0.008056640625, 0.004150390625, 0.016357421875, 0.028564453125, 0.040771484375, 0.052978515625, 0.065185546875, 0.077392578125, 0.089599609375, 0.101806640625, 0.114013671875, 0.126220703125, 0.138427734375, 0.150634765625, 0.162841796875, 0.175048828125, 0.187255859375, 0.199462890625, 0.211669921875, 0.223876953125, 0.236083984375, 0.248291015625, 0.260498046875, 0.272705078125, 0.284912109375, 0.297119140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 12.0, 13.0, 27.0, 34.0, 55.0, 116.0, 193.0, 206.0, 145.0, 89.0, 46.0, 23.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.413818359375, -0.4048786163330078, -0.3959388732910156, -0.38699913024902344, -0.37805938720703125, -0.36911964416503906, -0.3601799011230469, -0.3512401580810547, -0.3423004150390625, -0.3333606719970703, -0.3244209289550781, -0.31548118591308594, -0.30654144287109375, -0.29760169982910156, -0.2886619567871094, -0.2797222137451172, -0.270782470703125, -0.2618427276611328, -0.2529029846191406, -0.24396324157714844, -0.23502349853515625, -0.22608375549316406, -0.21714401245117188, -0.2082042694091797, -0.1992645263671875, -0.1903247833251953, -0.18138504028320312, -0.17244529724121094, -0.16350555419921875, -0.15456581115722656, -0.14562606811523438, -0.1366863250732422, -0.12774658203125, -0.11880683898925781, -0.10986709594726562, -0.10092735290527344, -0.09198760986328125, -0.08304786682128906, -0.07410812377929688, -0.06516838073730469, -0.0562286376953125, -0.04728889465332031, -0.038349151611328125, -0.029409408569335938, -0.02046966552734375, -0.011529922485351562, -0.002590179443359375, 0.0063495635986328125, 0.015289306640625, 0.024229049682617188, 0.033168792724609375, 0.04210853576660156, 0.05104827880859375, 0.05998802185058594, 0.06892776489257812, 0.07786750793457031, 0.0868072509765625, 0.09574699401855469, 0.10468673706054688, 0.11362648010253906, 0.12256622314453125, 0.13150596618652344, 0.14044570922851562, 0.1493854522705078, 0.1583251953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 17.0, 47.0, 176.0, 471.0, 203.0, 56.0, 17.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7482404708862305, -3.4502804279327393, -3.152320384979248, -2.854360342025757, -2.5564002990722656, -2.2584402561187744, -1.9604802131652832, -1.662520170211792, -1.3645601272583008, -1.0666000843048096, -0.7686400413513184, -0.47067999839782715, -0.17271995544433594, 0.12524008750915527, 0.4232001304626465, 0.7211601734161377, 1.019120216369629, 1.3170802593231201, 1.6150403022766113, 1.9130003452301025, 2.2109603881835938, 2.508920431137085, 2.806880474090576, 3.1048405170440674, 3.4028005599975586, 3.70076060295105, 3.998720645904541, 4.296680450439453, 4.594640731811523, 4.892601013183594, 5.190560817718506, 5.488520622253418, 5.786481857299805, 6.084442138671875, 6.382401943206787, 6.680361747741699, 6.9783220291137695, 7.27628231048584, 7.574242115020752, 7.872201919555664, 8.170162200927734, 8.468122482299805, 8.766082763671875, 9.064042091369629, 9.3620023727417, 9.65996265411377, 9.957921981811523, 10.255882263183594, 10.553842544555664, 10.851802825927734, 11.149763107299805, 11.447722434997559, 11.745682716369629, 12.0436429977417, 12.341602325439453, 12.639562606811523, 12.937522888183594, 13.235483169555664, 13.533443450927734, 13.831402778625488, 14.129363059997559, 14.427323341369629, 14.725282669067383, 15.023242950439453, 15.321203231811523]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 7.0, 10.0, 13.0, 6.0, 11.0, 10.0, 24.0, 22.0, 26.0, 23.0, 31.0, 27.0, 37.0, 45.0, 54.0, 44.0, 47.0, 53.0, 47.0, 52.0, 53.0, 54.0, 41.0, 29.0, 41.0, 26.0, 31.0, 24.0, 12.0, 14.0, 19.0, 13.0, 5.0, 8.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0459728240966797, -2.943551778793335, -2.8411309719085693, -2.7387099266052246, -2.636289119720459, -2.5338680744171143, -2.4314470291137695, -2.329026222229004, -2.226605176925659, -2.1241841316223145, -2.021763324737549, -1.919342279434204, -1.816921353340149, -1.7145004272460938, -1.6120795011520386, -1.5096585750579834, -1.4072376489639282, -1.304816722869873, -1.2023957967758179, -1.0999748706817627, -0.997553825378418, -0.8951328992843628, -0.7927119731903076, -0.6902909874916077, -0.5878700613975525, -0.4854491055011749, -0.38302814960479736, -0.2806072235107422, -0.17818626761436462, -0.07576531171798706, 0.026655614376068115, 0.12907660007476807, 0.23149752616882324, 0.3339184820652008, 0.43633943796157837, 0.5387603640556335, 0.6411813497543335, 0.7436022758483887, 0.8460232019424438, 0.9484441876411438, 1.0508651733398438, 1.153286099433899, 1.255707025527954, 1.3581280708312988, 1.460548996925354, 1.5629699230194092, 1.6653908491134644, 1.7678117752075195, 1.8702327013015747, 1.9726536273956299, 2.0750746726989746, 2.1774954795837402, 2.279916524887085, 2.3823375701904297, 2.4847583770751953, 2.58717942237854, 2.6896002292633057, 2.7920212745666504, 2.894442081451416, 2.9968631267547607, 3.0992839336395264, 3.201704978942871, 3.3041257858276367, 3.4065468311309814, 3.508967876434326]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 14.0, 11.0, 28.0, 38.0, 60.0, 89.0, 152.0, 271.0, 512.0, 956.0, 2053.0, 4815.0, 14754.0, 74741.0, 3726191.0, 325265.0, 29724.0, 8209.0, 3077.0, 1470.0, 754.0, 416.0, 208.0, 139.0, 101.0, 60.0, 44.0, 29.0, 26.0, 18.0, 10.0, 5.0, 6.0, 7.0, 1.0, 6.0, 8.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6582183837890625, -0.627960205078125, -0.5977020263671875, -0.56744384765625, -0.5371856689453125, -0.506927490234375, -0.4766693115234375, -0.4464111328125, -0.4161529541015625, -0.385894775390625, -0.3556365966796875, -0.32537841796875, -0.2951202392578125, -0.264862060546875, -0.2346038818359375, -0.204345703125, -0.1740875244140625, -0.143829345703125, -0.1135711669921875, -0.08331298828125, -0.0530548095703125, -0.022796630859375, 0.0074615478515625, 0.0377197265625, 0.0679779052734375, 0.098236083984375, 0.1284942626953125, 0.15875244140625, 0.1890106201171875, 0.219268798828125, 0.2495269775390625, 0.27978515625, 0.3100433349609375, 0.340301513671875, 0.3705596923828125, 0.40081787109375, 0.4310760498046875, 0.461334228515625, 0.4915924072265625, 0.5218505859375, 0.5521087646484375, 0.582366943359375, 0.6126251220703125, 0.64288330078125, 0.6731414794921875, 0.703399658203125, 0.7336578369140625, 0.763916015625, 0.7941741943359375, 0.824432373046875, 0.8546905517578125, 0.88494873046875, 0.9152069091796875, 0.945465087890625, 0.9757232666015625, 1.0059814453125, 1.0362396240234375, 1.066497802734375, 1.0967559814453125, 1.12701416015625, 1.1572723388671875, 1.187530517578125, 1.2177886962890625, 1.248046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 13.0, 11.0, 23.0, 21.0, 24.0, 45.0, 53.0, 61.0, 53.0, 80.0, 88.0, 75.0, 84.0, 62.0, 56.0, 50.0, 44.0, 44.0, 30.0, 28.0, 19.0, 8.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11968994140625, -0.11406803131103516, -0.10844612121582031, -0.10282421112060547, -0.09720230102539062, -0.09158039093017578, -0.08595848083496094, -0.0803365707397461, -0.07471466064453125, -0.0690927505493164, -0.06347084045410156, -0.05784893035888672, -0.052227020263671875, -0.04660511016845703, -0.04098320007324219, -0.035361289978027344, -0.0297393798828125, -0.024117469787597656, -0.018495559692382812, -0.012873649597167969, -0.007251739501953125, -0.0016298294067382812, 0.0039920806884765625, 0.009613990783691406, 0.01523590087890625, 0.020857810974121094, 0.026479721069335938, 0.03210163116455078, 0.037723541259765625, 0.04334545135498047, 0.04896736145019531, 0.054589271545410156, 0.060211181640625, 0.06583309173583984, 0.07145500183105469, 0.07707691192626953, 0.08269882202148438, 0.08832073211669922, 0.09394264221191406, 0.0995645523071289, 0.10518646240234375, 0.1108083724975586, 0.11643028259277344, 0.12205219268798828, 0.12767410278320312, 0.13329601287841797, 0.1389179229736328, 0.14453983306884766, 0.1501617431640625, 0.15578365325927734, 0.1614055633544922, 0.16702747344970703, 0.17264938354492188, 0.17827129364013672, 0.18389320373535156, 0.1895151138305664, 0.19513702392578125, 0.2007589340209961, 0.20638084411621094, 0.21200275421142578, 0.21762466430664062, 0.22324657440185547, 0.2288684844970703, 0.23449039459228516, 0.2401123046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 6.0, 15.0, 28.0, 19.0, 45.0, 91.0, 232.0, 569.0, 2152.0, 15763.0, 4073019.0, 94952.0, 5309.0, 1204.0, 423.0, 175.0, 85.0, 62.0, 47.0, 31.0, 17.0, 10.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.242279052734375, -1.17596435546875, -1.109649658203125, -1.0433349609375, -0.977020263671875, -0.91070556640625, -0.844390869140625, -0.778076171875, -0.711761474609375, -0.64544677734375, -0.579132080078125, -0.5128173828125, -0.446502685546875, -0.38018798828125, -0.313873291015625, -0.24755859375, -0.181243896484375, -0.11492919921875, -0.048614501953125, 0.0177001953125, 0.084014892578125, 0.15032958984375, 0.216644287109375, 0.282958984375, 0.349273681640625, 0.41558837890625, 0.481903076171875, 0.5482177734375, 0.614532470703125, 0.68084716796875, 0.747161865234375, 0.8134765625, 0.879791259765625, 0.94610595703125, 1.012420654296875, 1.0787353515625, 1.145050048828125, 1.21136474609375, 1.277679443359375, 1.343994140625, 1.410308837890625, 1.47662353515625, 1.542938232421875, 1.6092529296875, 1.675567626953125, 1.74188232421875, 1.808197021484375, 1.87451171875, 1.940826416015625, 2.00714111328125, 2.073455810546875, 2.1397705078125, 2.206085205078125, 2.27239990234375, 2.338714599609375, 2.405029296875, 2.471343994140625, 2.53765869140625, 2.603973388671875, 2.6702880859375, 2.736602783203125, 2.80291748046875, 2.869232177734375, 2.935546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 17.0, 27.0, 79.0, 230.0, 2730.0, 723.0, 126.0, 58.0, 21.0, 15.0, 12.0, 10.0, 7.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298828125, -0.27716064453125, -0.2554931640625, -0.23382568359375, -0.212158203125, -0.19049072265625, -0.1688232421875, -0.14715576171875, -0.12548828125, -0.10382080078125, -0.0821533203125, -0.06048583984375, -0.038818359375, -0.01715087890625, 0.0045166015625, 0.02618408203125, 0.0478515625, 0.06951904296875, 0.0911865234375, 0.11285400390625, 0.134521484375, 0.15618896484375, 0.1778564453125, 0.19952392578125, 0.22119140625, 0.24285888671875, 0.2645263671875, 0.28619384765625, 0.307861328125, 0.32952880859375, 0.3511962890625, 0.37286376953125, 0.39453125, 0.41619873046875, 0.4378662109375, 0.45953369140625, 0.481201171875, 0.50286865234375, 0.5245361328125, 0.54620361328125, 0.56787109375, 0.58953857421875, 0.6112060546875, 0.63287353515625, 0.654541015625, 0.67620849609375, 0.6978759765625, 0.71954345703125, 0.7412109375, 0.76287841796875, 0.7845458984375, 0.80621337890625, 0.827880859375, 0.84954833984375, 0.8712158203125, 0.89288330078125, 0.91455078125, 0.93621826171875, 0.9578857421875, 0.97955322265625, 1.001220703125, 1.02288818359375, 1.0445556640625, 1.06622314453125, 1.087890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 37.0, 74.0, 187.0, 335.0, 206.0, 79.0, 38.0, 16.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.143627882003784, -2.0527660846710205, -1.9619044065475464, -1.8710427284240723, -1.7801809310913086, -1.689319133758545, -1.5984574556350708, -1.5075957775115967, -1.416733980178833, -1.3258721828460693, -1.2350105047225952, -1.144148826599121, -1.0532870292663574, -0.9624252915382385, -0.8715635538101196, -0.7807018160820007, -0.6898400783538818, -0.5989783406257629, -0.508116602897644, -0.41725486516952515, -0.32639312744140625, -0.23553138971328735, -0.14466965198516846, -0.05380791425704956, 0.037053823471069336, 0.12791556119918823, 0.21877729892730713, 0.309639036655426, 0.4005007743835449, 0.4913625121116638, 0.5822242498397827, 0.6730859875679016, 0.7639479637145996, 0.8548097014427185, 0.9456714391708374, 1.0365331172943115, 1.1273949146270752, 1.2182567119598389, 1.309118390083313, 1.399980068206787, 1.4908418655395508, 1.5817036628723145, 1.6725653409957886, 1.7634270191192627, 1.8542888164520264, 1.94515061378479, 2.0360121726989746, 2.1268739700317383, 2.217735767364502, 2.3085975646972656, 2.3994593620300293, 2.490320920944214, 2.5811827182769775, 2.672044515609741, 2.762906074523926, 2.8537678718566895, 2.944629669189453, 3.035491466522217, 3.1263532638549805, 3.217214822769165, 3.3080766201019287, 3.3989384174346924, 3.489799976348877, 3.5806617736816406, 3.6715235710144043]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 20.0, 35.0, 39.0, 64.0, 90.0, 96.0, 104.0, 104.0, 111.0, 107.0, 72.0, 49.0, 48.0, 20.0, 5.0, 10.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.661919593811035, -2.5783746242523193, -2.4948296546936035, -2.4112846851348877, -2.327739715576172, -2.244194746017456, -2.1606497764587402, -2.0771048069000244, -1.9935598373413086, -1.9100148677825928, -1.826469898223877, -1.7429249286651611, -1.6593799591064453, -1.5758349895477295, -1.4922900199890137, -1.4087450504302979, -1.3252002000808716, -1.2416552305221558, -1.15811026096344, -1.0745652914047241, -0.9910203218460083, -0.9074753522872925, -0.8239304423332214, -0.7403854727745056, -0.6568405032157898, -0.573295533657074, -0.48975056409835815, -0.4062056243419647, -0.3226606547832489, -0.23911568522453308, -0.15557074546813965, -0.07202577590942383, 0.011519193649291992, 0.09506415575742722, 0.17860911786556244, 0.26215407252311707, 0.3456990420818329, 0.4292440116405487, 0.5127889513969421, 0.596333920955658, 0.6798788905143738, 0.7634238600730896, 0.8469688296318054, 0.9305137395858765, 1.0140587091445923, 1.097603678703308, 1.181148648262024, 1.2646936178207397, 1.3482385873794556, 1.4317835569381714, 1.5153285264968872, 1.598873496055603, 1.6824184656143188, 1.7659634351730347, 1.849508285522461, 1.9330532550811768, 2.0165982246398926, 2.1001431941986084, 2.183688163757324, 2.26723313331604, 2.350778102874756, 2.4343230724334717, 2.5178680419921875, 2.6014130115509033, 2.684957981109619]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 9.0, 5.0, 9.0, 17.0, 17.0, 13.0, 25.0, 41.0, 41.0, 70.0, 111.0, 166.0, 288.0, 526.0, 959.0, 2240.0, 6322.0, 23412.0, 119175.0, 641237.0, 204378.0, 35157.0, 8615.0, 2933.0, 1269.0, 615.0, 335.0, 183.0, 122.0, 68.0, 42.0, 38.0, 25.0, 33.0, 20.0, 15.0, 4.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7980499267578125, -0.774322509765625, -0.7505950927734375, -0.72686767578125, -0.7031402587890625, -0.679412841796875, -0.6556854248046875, -0.6319580078125, -0.6082305908203125, -0.584503173828125, -0.5607757568359375, -0.53704833984375, -0.5133209228515625, -0.489593505859375, -0.4658660888671875, -0.442138671875, -0.4184112548828125, -0.394683837890625, -0.3709564208984375, -0.34722900390625, -0.3235015869140625, -0.299774169921875, -0.2760467529296875, -0.2523193359375, -0.2285919189453125, -0.204864501953125, -0.1811370849609375, -0.15740966796875, -0.1336822509765625, -0.109954833984375, -0.0862274169921875, -0.0625, -0.0387725830078125, -0.015045166015625, 0.0086822509765625, 0.03240966796875, 0.0561370849609375, 0.079864501953125, 0.1035919189453125, 0.1273193359375, 0.1510467529296875, 0.174774169921875, 0.1985015869140625, 0.22222900390625, 0.2459564208984375, 0.269683837890625, 0.2934112548828125, 0.317138671875, 0.3408660888671875, 0.364593505859375, 0.3883209228515625, 0.41204833984375, 0.4357757568359375, 0.459503173828125, 0.4832305908203125, 0.5069580078125, 0.5306854248046875, 0.554412841796875, 0.5781402587890625, 0.60186767578125, 0.6255950927734375, 0.649322509765625, 0.6730499267578125, 0.69677734375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 8.0, 24.0, 20.0, 43.0, 54.0, 68.0, 93.0, 98.0, 119.0, 95.0, 88.0, 78.0, 55.0, 58.0, 42.0, 21.0, 10.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14321517944335938, -0.13555145263671875, -0.12788772583007812, -0.1202239990234375, -0.11256027221679688, -0.10489654541015625, -0.09723281860351562, -0.089569091796875, -0.08190536499023438, -0.07424163818359375, -0.06657791137695312, -0.0589141845703125, -0.051250457763671875, -0.04358673095703125, -0.035923004150390625, -0.02825927734375, -0.020595550537109375, -0.01293182373046875, -0.005268096923828125, 0.0023956298828125, 0.010059356689453125, 0.01772308349609375, 0.025386810302734375, 0.033050537109375, 0.040714263916015625, 0.04837799072265625, 0.056041717529296875, 0.0637054443359375, 0.07136917114257812, 0.07903289794921875, 0.08669662475585938, 0.0943603515625, 0.10202407836914062, 0.10968780517578125, 0.11735153198242188, 0.1250152587890625, 0.13267898559570312, 0.14034271240234375, 0.14800643920898438, 0.155670166015625, 0.16333389282226562, 0.17099761962890625, 0.17866134643554688, 0.1863250732421875, 0.19398880004882812, 0.20165252685546875, 0.20931625366210938, 0.21697998046875, 0.22464370727539062, 0.23230743408203125, 0.23997116088867188, 0.2476348876953125, 0.2552986145019531, 0.26296234130859375, 0.2706260681152344, 0.278289794921875, 0.2859535217285156, 0.29361724853515625, 0.3012809753417969, 0.3089447021484375, 0.3166084289550781, 0.32427215576171875, 0.3319358825683594, 0.339599609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 17.0, 10.0, 38.0, 43.0, 51.0, 71.0, 127.0, 176.0, 294.0, 515.0, 945.0, 1918.0, 3986.0, 9265.0, 22677.0, 63959.0, 230935.0, 471991.0, 160876.0, 48394.0, 18034.0, 7456.0, 3210.0, 1578.0, 822.0, 422.0, 258.0, 154.0, 123.0, 60.0, 44.0, 31.0, 15.0, 9.0, 9.0, 8.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38623046875, -0.3726158142089844, -0.35900115966796875, -0.3453865051269531, -0.3317718505859375, -0.3181571960449219, -0.30454254150390625, -0.2909278869628906, -0.277313232421875, -0.2636985778808594, -0.25008392333984375, -0.23646926879882812, -0.2228546142578125, -0.20923995971679688, -0.19562530517578125, -0.18201065063476562, -0.16839599609375, -0.15478134155273438, -0.14116668701171875, -0.12755203247070312, -0.1139373779296875, -0.10032272338867188, -0.08670806884765625, -0.07309341430664062, -0.059478759765625, -0.045864105224609375, -0.03224945068359375, -0.018634796142578125, -0.0050201416015625, 0.008594512939453125, 0.02220916748046875, 0.035823822021484375, 0.0494384765625, 0.06305313110351562, 0.07666778564453125, 0.09028244018554688, 0.1038970947265625, 0.11751174926757812, 0.13112640380859375, 0.14474105834960938, 0.158355712890625, 0.17197036743164062, 0.18558502197265625, 0.19919967651367188, 0.2128143310546875, 0.22642898559570312, 0.24004364013671875, 0.2536582946777344, 0.26727294921875, 0.2808876037597656, 0.29450225830078125, 0.3081169128417969, 0.3217315673828125, 0.3353462219238281, 0.34896087646484375, 0.3625755310058594, 0.376190185546875, 0.3898048400878906, 0.40341949462890625, 0.4170341491699219, 0.4306488037109375, 0.4442634582519531, 0.45787811279296875, 0.4714927673339844, 0.485107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 9.0, 9.0, 11.0, 14.0, 12.0, 15.0, 19.0, 19.0, 26.0, 35.0, 42.0, 33.0, 50.0, 46.0, 54.0, 36.0, 49.0, 52.0, 40.0, 58.0, 46.0, 61.0, 35.0, 30.0, 25.0, 16.0, 28.0, 23.0, 27.0, 14.0, 14.0, 10.0, 5.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.474853515625, -0.4575767517089844, -0.44029998779296875, -0.4230232238769531, -0.4057464599609375, -0.3884696960449219, -0.37119293212890625, -0.3539161682128906, -0.336639404296875, -0.3193626403808594, -0.30208587646484375, -0.2848091125488281, -0.2675323486328125, -0.2502555847167969, -0.23297882080078125, -0.21570205688476562, -0.19842529296875, -0.18114852905273438, -0.16387176513671875, -0.14659500122070312, -0.1293182373046875, -0.11204147338867188, -0.09476470947265625, -0.07748794555664062, -0.060211181640625, -0.042934417724609375, -0.02565765380859375, -0.008380889892578125, 0.0088958740234375, 0.026172637939453125, 0.04344940185546875, 0.060726165771484375, 0.0780029296875, 0.09527969360351562, 0.11255645751953125, 0.12983322143554688, 0.1471099853515625, 0.16438674926757812, 0.18166351318359375, 0.19894027709960938, 0.216217041015625, 0.23349380493164062, 0.25077056884765625, 0.2680473327636719, 0.2853240966796875, 0.3026008605957031, 0.31987762451171875, 0.3371543884277344, 0.35443115234375, 0.3717079162597656, 0.38898468017578125, 0.4062614440917969, 0.4235382080078125, 0.4408149719238281, 0.45809173583984375, 0.4753684997558594, 0.492645263671875, 0.5099220275878906, 0.5271987915039062, 0.5444755554199219, 0.5617523193359375, 0.5790290832519531, 0.5963058471679688, 0.6135826110839844, 0.630859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 12.0, 15.0, 19.0, 25.0, 41.0, 36.0, 63.0, 107.0, 143.0, 283.0, 431.0, 858.0, 1700.0, 3952.0, 12598.0, 72772.0, 540012.0, 359060.0, 41346.0, 8915.0, 3100.0, 1346.0, 727.0, 371.0, 197.0, 147.0, 76.0, 50.0, 32.0, 13.0, 20.0, 18.0, 11.0, 13.0, 7.0, 5.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158203125, -0.1520862579345703, -0.14596939086914062, -0.13985252380371094, -0.13373565673828125, -0.12761878967285156, -0.12150192260742188, -0.11538505554199219, -0.1092681884765625, -0.10315132141113281, -0.09703445434570312, -0.09091758728027344, -0.08480072021484375, -0.07868385314941406, -0.07256698608398438, -0.06645011901855469, -0.060333251953125, -0.05421638488769531, -0.048099517822265625, -0.04198265075683594, -0.03586578369140625, -0.029748916625976562, -0.023632049560546875, -0.017515182495117188, -0.0113983154296875, -0.0052814483642578125, 0.000835418701171875, 0.0069522857666015625, 0.01306915283203125, 0.019186019897460938, 0.025302886962890625, 0.03141975402832031, 0.03753662109375, 0.04365348815917969, 0.049770355224609375, 0.05588722229003906, 0.06200408935546875, 0.06812095642089844, 0.07423782348632812, 0.08035469055175781, 0.0864715576171875, 0.09258842468261719, 0.09870529174804688, 0.10482215881347656, 0.11093902587890625, 0.11705589294433594, 0.12317276000976562, 0.1292896270751953, 0.135406494140625, 0.1415233612060547, 0.14764022827148438, 0.15375709533691406, 0.15987396240234375, 0.16599082946777344, 0.17210769653320312, 0.1782245635986328, 0.1843414306640625, 0.1904582977294922, 0.19657516479492188, 0.20269203186035156, 0.20880889892578125, 0.21492576599121094, 0.22104263305664062, 0.2271595001220703, 0.2332763671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 6.0, 8.0, 11.0, 17.0, 18.0, 29.0, 39.0, 49.0, 47.0, 53.0, 58.0, 83.0, 77.0, 66.0, 79.0, 59.0, 60.0, 48.0, 47.0, 25.0, 30.0, 19.0, 15.0, 12.0, 9.0, 10.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.4705583453178406e-05, -1.4092773199081421e-05, -1.3479962944984436e-05, -1.2867152690887451e-05, -1.2254342436790466e-05, -1.1641532182693481e-05, -1.1028721928596497e-05, -1.0415911674499512e-05, -9.803101420402527e-06, -9.190291166305542e-06, -8.577480912208557e-06, -7.964670658111572e-06, -7.351860404014587e-06, -6.7390501499176025e-06, -6.126239895820618e-06, -5.513429641723633e-06, -4.900619387626648e-06, -4.287809133529663e-06, -3.6749988794326782e-06, -3.0621886253356934e-06, -2.4493783712387085e-06, -1.8365681171417236e-06, -1.2237578630447388e-06, -6.109476089477539e-07, 1.862645149230957e-09, 6.146728992462158e-07, 1.2274831533432007e-06, 1.8402934074401855e-06, 2.4531036615371704e-06, 3.0659139156341553e-06, 3.67872416973114e-06, 4.291534423828125e-06, 4.90434467792511e-06, 5.517154932022095e-06, 6.12996518611908e-06, 6.7427754402160645e-06, 7.355585694313049e-06, 7.968395948410034e-06, 8.581206202507019e-06, 9.194016456604004e-06, 9.806826710700989e-06, 1.0419636964797974e-05, 1.1032447218894958e-05, 1.1645257472991943e-05, 1.2258067727088928e-05, 1.2870877981185913e-05, 1.3483688235282898e-05, 1.4096498489379883e-05, 1.4709308743476868e-05, 1.5322118997573853e-05, 1.5934929251670837e-05, 1.6547739505767822e-05, 1.7160549759864807e-05, 1.7773360013961792e-05, 1.8386170268058777e-05, 1.8998980522155762e-05, 1.9611790776252747e-05, 2.022460103034973e-05, 2.0837411284446716e-05, 2.14502215385437e-05, 2.2063031792640686e-05, 2.267584204673767e-05, 2.3288652300834656e-05, 2.390146255493164e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 14.0, 13.0, 19.0, 36.0, 45.0, 68.0, 127.0, 234.0, 473.0, 1032.0, 2690.0, 8247.0, 34322.0, 235640.0, 598235.0, 135681.0, 22117.0, 5816.0, 1946.0, 852.0, 408.0, 214.0, 108.0, 68.0, 41.0, 35.0, 15.0, 8.0, 16.0, 5.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1793212890625, -0.17394638061523438, -0.16857147216796875, -0.16319656372070312, -0.1578216552734375, -0.15244674682617188, -0.14707183837890625, -0.14169692993164062, -0.136322021484375, -0.13094711303710938, -0.12557220458984375, -0.12019729614257812, -0.1148223876953125, -0.10944747924804688, -0.10407257080078125, -0.09869766235351562, -0.09332275390625, -0.08794784545898438, -0.08257293701171875, -0.07719802856445312, -0.0718231201171875, -0.06644821166992188, -0.06107330322265625, -0.055698394775390625, -0.050323486328125, -0.044948577880859375, -0.03957366943359375, -0.034198760986328125, -0.0288238525390625, -0.023448944091796875, -0.01807403564453125, -0.012699127197265625, -0.00732421875, -0.001949310302734375, 0.00342559814453125, 0.008800506591796875, 0.0141754150390625, 0.019550323486328125, 0.02492523193359375, 0.030300140380859375, 0.035675048828125, 0.041049957275390625, 0.04642486572265625, 0.051799774169921875, 0.0571746826171875, 0.06254959106445312, 0.06792449951171875, 0.07329940795898438, 0.07867431640625, 0.08404922485351562, 0.08942413330078125, 0.09479904174804688, 0.1001739501953125, 0.10554885864257812, 0.11092376708984375, 0.11629867553710938, 0.121673583984375, 0.12704849243164062, 0.13242340087890625, 0.13779830932617188, 0.1431732177734375, 0.14854812622070312, 0.15392303466796875, 0.15929794311523438, 0.1646728515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 7.0, 8.0, 5.0, 13.0, 16.0, 28.0, 34.0, 41.0, 67.0, 92.0, 91.0, 113.0, 110.0, 88.0, 87.0, 45.0, 46.0, 29.0, 20.0, 12.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.211181640625, -0.2049388885498047, -0.19869613647460938, -0.19245338439941406, -0.18621063232421875, -0.17996788024902344, -0.17372512817382812, -0.1674823760986328, -0.1612396240234375, -0.1549968719482422, -0.14875411987304688, -0.14251136779785156, -0.13626861572265625, -0.13002586364746094, -0.12378311157226562, -0.11754035949707031, -0.111297607421875, -0.10505485534667969, -0.09881210327148438, -0.09256935119628906, -0.08632659912109375, -0.08008384704589844, -0.07384109497070312, -0.06759834289550781, -0.0613555908203125, -0.05511283874511719, -0.048870086669921875, -0.04262733459472656, -0.03638458251953125, -0.030141830444335938, -0.023899078369140625, -0.017656326293945312, -0.01141357421875, -0.0051708221435546875, 0.001071929931640625, 0.0073146820068359375, 0.01355743408203125, 0.019800186157226562, 0.026042938232421875, 0.03228569030761719, 0.0385284423828125, 0.04477119445800781, 0.051013946533203125, 0.05725669860839844, 0.06349945068359375, 0.06974220275878906, 0.07598495483398438, 0.08222770690917969, 0.088470458984375, 0.09471321105957031, 0.10095596313476562, 0.10719871520996094, 0.11344146728515625, 0.11968421936035156, 0.12592697143554688, 0.1321697235107422, 0.1384124755859375, 0.1446552276611328, 0.15089797973632812, 0.15714073181152344, 0.16338348388671875, 0.16962623596191406, 0.17586898803710938, 0.1821117401123047, 0.1883544921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 8.0, 17.0, 37.0, 78.0, 187.0, 347.0, 207.0, 78.0, 16.0, 18.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.164790153503418, -6.9453654289245605, -6.725940704345703, -6.506516456604004, -6.2870917320251465, -6.067667007446289, -5.848242282867432, -5.628817558288574, -5.409393310546875, -5.189968585968018, -4.97054386138916, -4.751119613647461, -4.5316948890686035, -4.312270164489746, -4.092845439910889, -3.8734207153320312, -3.653995990753174, -3.4345712661743164, -3.215146780014038, -2.9957220554351807, -2.7762975692749023, -2.556872844696045, -2.3374481201171875, -2.11802339553833, -1.8985989093780518, -1.6791743040084839, -1.459749698638916, -1.2403249740600586, -1.0209003686904907, -0.8014757633209229, -0.5820510387420654, -0.36262643337249756, -0.1432023048400879, 0.07622233033180237, 0.2956469655036926, 0.5150716304779053, 0.7344962358474731, 0.953920841217041, 1.1733455657958984, 1.3927701711654663, 1.6121947765350342, 1.831619381904602, 2.05104398727417, 2.2704687118530273, 2.4898934364318848, 2.709317922592163, 2.9287426471710205, 3.148167133331299, 3.3675918579101562, 3.5870165824890137, 3.806441068649292, 4.02586555480957, 4.245290279388428, 4.464715003967285, 4.684139728546143, 4.903564453125, 5.122988700866699, 5.342413425445557, 5.561838150024414, 5.781262397766113, 6.000687122344971, 6.220111846923828, 6.4395365715026855, 6.658961296081543, 6.8783860206604]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 11.0, 7.0, 11.0, 13.0, 20.0, 30.0, 26.0, 30.0, 46.0, 54.0, 58.0, 55.0, 53.0, 59.0, 67.0, 52.0, 56.0, 53.0, 51.0, 36.0, 50.0, 36.0, 26.0, 24.0, 15.0, 17.0, 11.0, 10.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.710875988006592, -3.5751142501831055, -3.43935227394104, -3.3035905361175537, -3.1678285598754883, -3.032066822052002, -2.8963050842285156, -2.7605433464050293, -2.624781370162964, -2.4890196323394775, -2.353257656097412, -2.217495918273926, -2.0817341804504395, -1.945972204208374, -1.8102104663848877, -1.6744486093521118, -1.538686752319336, -1.40292489528656, -1.2671630382537842, -1.1314013004302979, -0.995639443397522, -0.8598775863647461, -0.724115788936615, -0.5883539915084839, -0.452592134475708, -0.3168303072452545, -0.18106848001480103, -0.045306652784347534, 0.09045517444610596, 0.22621703147888184, 0.36197882890701294, 0.49774062633514404, 0.6335020065307617, 0.7692638635635376, 0.9050256609916687, 1.0407874584197998, 1.1765493154525757, 1.3123111724853516, 1.448072910308838, 1.5838347673416138, 1.7195966243743896, 1.8553584814071655, 1.9911203384399414, 2.1268820762634277, 2.262643814086914, 2.3984057903289795, 2.534167528152466, 2.6699295043945312, 2.8056912422180176, 2.941452980041504, 3.0772149562835693, 3.2129766941070557, 3.348738670349121, 3.4845004081726074, 3.6202621459960938, 3.75602388381958, 3.8917858600616455, 4.027547836303711, 4.163309574127197, 4.299071311950684, 4.43483304977417, 4.570594787597656, 4.706357002258301, 4.842118740081787, 4.977880477905273]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 10.0, 11.0, 16.0, 10.0, 21.0, 29.0, 71.0, 116.0, 221.0, 474.0, 950.0, 2753.0, 10563.0, 88091.0, 3967664.0, 106046.0, 12001.0, 2939.0, 1120.0, 490.0, 260.0, 151.0, 82.0, 53.0, 41.0, 33.0, 21.0, 14.0, 7.0, 3.0, 11.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5185546875, -0.494476318359375, -0.47039794921875, -0.446319580078125, -0.4222412109375, -0.398162841796875, -0.37408447265625, -0.350006103515625, -0.325927734375, -0.301849365234375, -0.27777099609375, -0.253692626953125, -0.2296142578125, -0.205535888671875, -0.18145751953125, -0.157379150390625, -0.13330078125, -0.109222412109375, -0.08514404296875, -0.061065673828125, -0.0369873046875, -0.012908935546875, 0.01116943359375, 0.035247802734375, 0.059326171875, 0.083404541015625, 0.10748291015625, 0.131561279296875, 0.1556396484375, 0.179718017578125, 0.20379638671875, 0.227874755859375, 0.251953125, 0.276031494140625, 0.30010986328125, 0.324188232421875, 0.3482666015625, 0.372344970703125, 0.39642333984375, 0.420501708984375, 0.444580078125, 0.468658447265625, 0.49273681640625, 0.516815185546875, 0.5408935546875, 0.564971923828125, 0.58905029296875, 0.613128662109375, 0.63720703125, 0.661285400390625, 0.68536376953125, 0.709442138671875, 0.7335205078125, 0.757598876953125, 0.78167724609375, 0.805755615234375, 0.829833984375, 0.853912353515625, 0.87799072265625, 0.902069091796875, 0.9261474609375, 0.950225830078125, 0.97430419921875, 0.998382568359375, 1.0224609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 7.0, 3.0, 16.0, 25.0, 33.0, 37.0, 78.0, 64.0, 84.0, 101.0, 93.0, 96.0, 79.0, 72.0, 65.0, 48.0, 39.0, 25.0, 13.0, 9.0, 6.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146484375, -0.13861465454101562, -0.13074493408203125, -0.12287521362304688, -0.1150054931640625, -0.10713577270507812, -0.09926605224609375, -0.09139633178710938, -0.083526611328125, -0.07565689086914062, -0.06778717041015625, -0.059917449951171875, -0.0520477294921875, -0.044178009033203125, -0.03630828857421875, -0.028438568115234375, -0.02056884765625, -0.012699127197265625, -0.00482940673828125, 0.003040313720703125, 0.0109100341796875, 0.018779754638671875, 0.02664947509765625, 0.034519195556640625, 0.042388916015625, 0.050258636474609375, 0.05812835693359375, 0.06599807739257812, 0.0738677978515625, 0.08173751831054688, 0.08960723876953125, 0.09747695922851562, 0.1053466796875, 0.11321640014648438, 0.12108612060546875, 0.12895584106445312, 0.1368255615234375, 0.14469528198242188, 0.15256500244140625, 0.16043472290039062, 0.168304443359375, 0.17617416381835938, 0.18404388427734375, 0.19191360473632812, 0.1997833251953125, 0.20765304565429688, 0.21552276611328125, 0.22339248657226562, 0.23126220703125, 0.23913192749023438, 0.24700164794921875, 0.2548713684082031, 0.2627410888671875, 0.2706108093261719, 0.27848052978515625, 0.2863502502441406, 0.294219970703125, 0.3020896911621094, 0.30995941162109375, 0.3178291320800781, 0.3256988525390625, 0.3335685729980469, 0.34143829345703125, 0.3493080139160156, 0.357177734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 7.0, 19.0, 46.0, 85.0, 132.0, 213.0, 378.0, 736.0, 1646.0, 5044.0, 32228.0, 3855073.0, 280317.0, 13150.0, 2823.0, 1136.0, 520.0, 287.0, 159.0, 92.0, 55.0, 46.0, 25.0, 23.0, 12.0, 10.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0390625, -1.0115737915039062, -0.9840850830078125, -0.9565963745117188, -0.929107666015625, -0.9016189575195312, -0.8741302490234375, -0.8466415405273438, -0.81915283203125, -0.7916641235351562, -0.7641754150390625, -0.7366867065429688, -0.709197998046875, -0.6817092895507812, -0.6542205810546875, -0.6267318725585938, -0.5992431640625, -0.5717544555664062, -0.5442657470703125, -0.5167770385742188, -0.489288330078125, -0.46179962158203125, -0.4343109130859375, -0.40682220458984375, -0.37933349609375, -0.35184478759765625, -0.3243560791015625, -0.29686737060546875, -0.269378662109375, -0.24188995361328125, -0.2144012451171875, -0.18691253662109375, -0.159423828125, -0.13193511962890625, -0.1044464111328125, -0.07695770263671875, -0.049468994140625, -0.02198028564453125, 0.0055084228515625, 0.03299713134765625, 0.06048583984375, 0.08797454833984375, 0.1154632568359375, 0.14295196533203125, 0.170440673828125, 0.19792938232421875, 0.2254180908203125, 0.25290679931640625, 0.2803955078125, 0.30788421630859375, 0.3353729248046875, 0.36286163330078125, 0.390350341796875, 0.41783905029296875, 0.4453277587890625, 0.47281646728515625, 0.50030517578125, 0.5277938842773438, 0.5552825927734375, 0.5827713012695312, 0.610260009765625, 0.6377487182617188, 0.6652374267578125, 0.6927261352539062, 0.72021484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 6.0, 4.0, 4.0, 5.0, 10.0, 13.0, 28.0, 45.0, 100.0, 346.0, 2676.0, 595.0, 117.0, 58.0, 21.0, 23.0, 10.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.294921875, -0.2842674255371094, -0.27361297607421875, -0.2629585266113281, -0.2523040771484375, -0.24164962768554688, -0.23099517822265625, -0.22034072875976562, -0.209686279296875, -0.19903182983398438, -0.18837738037109375, -0.17772293090820312, -0.1670684814453125, -0.15641403198242188, -0.14575958251953125, -0.13510513305664062, -0.12445068359375, -0.11379623413085938, -0.10314178466796875, -0.09248733520507812, -0.0818328857421875, -0.07117843627929688, -0.06052398681640625, -0.049869537353515625, -0.039215087890625, -0.028560638427734375, -0.01790618896484375, -0.007251739501953125, 0.0034027099609375, 0.014057159423828125, 0.02471160888671875, 0.035366058349609375, 0.0460205078125, 0.056674957275390625, 0.06732940673828125, 0.07798385620117188, 0.0886383056640625, 0.09929275512695312, 0.10994720458984375, 0.12060165405273438, 0.131256103515625, 0.14191055297851562, 0.15256500244140625, 0.16321945190429688, 0.1738739013671875, 0.18452835083007812, 0.19518280029296875, 0.20583724975585938, 0.21649169921875, 0.22714614868164062, 0.23780059814453125, 0.24845504760742188, 0.2591094970703125, 0.2697639465332031, 0.28041839599609375, 0.2910728454589844, 0.301727294921875, 0.3123817443847656, 0.32303619384765625, 0.3336906433105469, 0.3443450927734375, 0.3549995422363281, 0.36565399169921875, 0.3763084411621094, 0.386962890625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 23.0, 48.0, 141.0, 278.0, 293.0, 140.0, 37.0, 15.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8432812690734863, -2.777459144592285, -2.711637020111084, -2.645815134048462, -2.5799930095672607, -2.5141708850860596, -2.4483487606048584, -2.3825266361236572, -2.316704750061035, -2.250882625579834, -2.185060501098633, -2.1192386150360107, -2.0534164905548096, -1.9875943660736084, -1.9217722415924072, -1.855950117111206, -1.7901279926300049, -1.7243058681488037, -1.658483862876892, -1.592661738395691, -1.5268397331237793, -1.4610176086425781, -1.395195484161377, -1.3293733596801758, -1.2635513544082642, -1.197729229927063, -1.1319072246551514, -1.0660851001739502, -1.000262975692749, -0.9344409704208374, -0.8686188459396362, -0.8027967810630798, -0.7369744777679443, -0.6711524128913879, -0.6053303480148315, -0.5395082235336304, -0.473686158657074, -0.4078640937805176, -0.3420419991016388, -0.27621990442276, -0.2103978395462036, -0.14457575976848602, -0.07875367999076843, -0.012931600213050842, 0.05289047956466675, 0.11871254444122314, 0.18453463912010193, 0.2503567337989807, 0.3161787986755371, 0.3820008635520935, 0.4478229582309723, 0.5136450529098511, 0.5794671177864075, 0.6452891826629639, 0.711111307144165, 0.7769333720207214, 0.8427554368972778, 0.9085775017738342, 0.9743995666503906, 1.0402216911315918, 1.106043815612793, 1.1718658208847046, 1.2376879453659058, 1.3035099506378174, 1.3693320751190186]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 11.0, 17.0, 20.0, 26.0, 26.0, 34.0, 59.0, 71.0, 70.0, 109.0, 75.0, 83.0, 85.0, 82.0, 60.0, 59.0, 36.0, 23.0, 21.0, 11.0, 13.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1679142713546753, -1.1222763061523438, -1.0766383409500122, -1.0310003757476807, -0.9853624105453491, -0.9397244453430176, -0.8940865397453308, -0.8484485745429993, -0.8028106093406677, -0.7571726441383362, -0.7115346789360046, -0.6658967733383179, -0.6202588081359863, -0.5746208429336548, -0.5289828777313232, -0.4833449125289917, -0.43770694732666016, -0.3920689821243286, -0.34643101692199707, -0.3007930815219879, -0.25515511631965637, -0.20951715111732483, -0.16387921571731567, -0.11824125051498413, -0.07260328531265259, -0.026965327560901642, 0.018672630190849304, 0.06431058049201965, 0.1099485456943512, 0.15558651089668274, 0.2012244462966919, 0.24686241149902344, 0.29250025749206543, 0.338138222694397, 0.3837761878967285, 0.42941412329673767, 0.4750520884990692, 0.5206900835037231, 0.5663279891014099, 0.6119659543037415, 0.657603919506073, 0.7032418847084045, 0.7488798499107361, 0.7945177555084229, 0.8401557207107544, 0.8857936859130859, 0.9314316511154175, 0.977069616317749, 1.0227075815200806, 1.068345546722412, 1.1139835119247437, 1.1596214771270752, 1.2052594423294067, 1.2508974075317383, 1.2965352535247803, 1.3421733379364014, 1.3878111839294434, 1.433449149131775, 1.4790871143341064, 1.524725079536438, 1.5703630447387695, 1.616001009941101, 1.6616389751434326, 1.7072768211364746, 1.7529149055480957]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 9.0, 15.0, 20.0, 24.0, 35.0, 42.0, 72.0, 111.0, 183.0, 312.0, 636.0, 1369.0, 3224.0, 8501.0, 26132.0, 97755.0, 446157.0, 354888.0, 75699.0, 20943.0, 7089.0, 2803.0, 1172.0, 522.0, 308.0, 170.0, 104.0, 66.0, 48.0, 31.0, 23.0, 9.0, 18.0, 4.0, 5.0, 5.0, 6.0, 3.0, 5.0, 4.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.626953125, -0.6079025268554688, -0.5888519287109375, -0.5698013305664062, -0.550750732421875, -0.5317001342773438, -0.5126495361328125, -0.49359893798828125, -0.47454833984375, -0.45549774169921875, -0.4364471435546875, -0.41739654541015625, -0.398345947265625, -0.37929534912109375, -0.3602447509765625, -0.34119415283203125, -0.3221435546875, -0.30309295654296875, -0.2840423583984375, -0.26499176025390625, -0.245941162109375, -0.22689056396484375, -0.2078399658203125, -0.18878936767578125, -0.16973876953125, -0.15068817138671875, -0.1316375732421875, -0.11258697509765625, -0.093536376953125, -0.07448577880859375, -0.0554351806640625, -0.03638458251953125, -0.017333984375, 0.00171661376953125, 0.0207672119140625, 0.03981781005859375, 0.058868408203125, 0.07791900634765625, 0.0969696044921875, 0.11602020263671875, 0.13507080078125, 0.15412139892578125, 0.1731719970703125, 0.19222259521484375, 0.211273193359375, 0.23032379150390625, 0.2493743896484375, 0.26842498779296875, 0.2874755859375, 0.30652618408203125, 0.3255767822265625, 0.34462738037109375, 0.363677978515625, 0.38272857666015625, 0.4017791748046875, 0.42082977294921875, 0.43988037109375, 0.45893096923828125, 0.4779815673828125, 0.49703216552734375, 0.516082763671875, 0.5351333618164062, 0.5541839599609375, 0.5732345581054688, 0.59228515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 2.0, 10.0, 10.0, 10.0, 39.0, 44.0, 64.0, 63.0, 56.0, 80.0, 109.0, 82.0, 99.0, 71.0, 65.0, 51.0, 39.0, 37.0, 26.0, 13.0, 12.0, 7.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14599609375, -0.13876724243164062, -0.13153839111328125, -0.12430953979492188, -0.1170806884765625, -0.10985183715820312, -0.10262298583984375, -0.09539413452148438, -0.088165283203125, -0.08093643188476562, -0.07370758056640625, -0.06647872924804688, -0.0592498779296875, -0.052021026611328125, -0.04479217529296875, -0.037563323974609375, -0.03033447265625, -0.023105621337890625, -0.01587677001953125, -0.008647918701171875, -0.0014190673828125, 0.005809783935546875, 0.01303863525390625, 0.020267486572265625, 0.027496337890625, 0.034725189208984375, 0.04195404052734375, 0.049182891845703125, 0.0564117431640625, 0.06364059448242188, 0.07086944580078125, 0.07809829711914062, 0.0853271484375, 0.09255599975585938, 0.09978485107421875, 0.10701370239257812, 0.1142425537109375, 0.12147140502929688, 0.12870025634765625, 0.13592910766601562, 0.143157958984375, 0.15038681030273438, 0.15761566162109375, 0.16484451293945312, 0.1720733642578125, 0.17930221557617188, 0.18653106689453125, 0.19375991821289062, 0.20098876953125, 0.20821762084960938, 0.21544647216796875, 0.22267532348632812, 0.2299041748046875, 0.23713302612304688, 0.24436187744140625, 0.2515907287597656, 0.258819580078125, 0.2660484313964844, 0.27327728271484375, 0.2805061340332031, 0.2877349853515625, 0.2949638366699219, 0.30219268798828125, 0.3094215393066406, 0.316650390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 8.0, 5.0, 13.0, 24.0, 26.0, 41.0, 67.0, 106.0, 124.0, 237.0, 290.0, 578.0, 901.0, 1601.0, 2987.0, 5597.0, 11595.0, 25743.0, 63298.0, 180797.0, 404174.0, 218566.0, 74688.0, 29811.0, 13179.0, 6362.0, 3307.0, 1827.0, 952.0, 584.0, 355.0, 248.0, 120.0, 100.0, 70.0, 57.0, 40.0, 15.0, 9.0, 9.0, 10.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.345703125, -0.3344001770019531, -0.32309722900390625, -0.3117942810058594, -0.3004913330078125, -0.2891883850097656, -0.27788543701171875, -0.2665824890136719, -0.255279541015625, -0.24397659301757812, -0.23267364501953125, -0.22137069702148438, -0.2100677490234375, -0.19876480102539062, -0.18746185302734375, -0.17615890502929688, -0.16485595703125, -0.15355300903320312, -0.14225006103515625, -0.13094711303710938, -0.1196441650390625, -0.10834121704101562, -0.09703826904296875, -0.08573532104492188, -0.074432373046875, -0.06312942504882812, -0.05182647705078125, -0.040523529052734375, -0.0292205810546875, -0.017917633056640625, -0.00661468505859375, 0.004688262939453125, 0.0159912109375, 0.027294158935546875, 0.03859710693359375, 0.049900054931640625, 0.0612030029296875, 0.07250595092773438, 0.08380889892578125, 0.09511184692382812, 0.106414794921875, 0.11771774291992188, 0.12902069091796875, 0.14032363891601562, 0.1516265869140625, 0.16292953491210938, 0.17423248291015625, 0.18553543090820312, 0.19683837890625, 0.20814132690429688, 0.21944427490234375, 0.23074722290039062, 0.2420501708984375, 0.2533531188964844, 0.26465606689453125, 0.2759590148925781, 0.287261962890625, 0.2985649108886719, 0.30986785888671875, 0.3211708068847656, 0.3324737548828125, 0.3437767028808594, 0.35507965087890625, 0.3663825988769531, 0.377685546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 5.0, 8.0, 12.0, 5.0, 16.0, 17.0, 17.0, 19.0, 28.0, 28.0, 36.0, 39.0, 32.0, 35.0, 46.0, 46.0, 52.0, 48.0, 42.0, 47.0, 57.0, 43.0, 45.0, 39.0, 26.0, 36.0, 28.0, 32.0, 25.0, 17.0, 20.0, 17.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.542205810546875, -0.52386474609375, -0.505523681640625, -0.4871826171875, -0.468841552734375, -0.45050048828125, -0.432159423828125, -0.413818359375, -0.395477294921875, -0.37713623046875, -0.358795166015625, -0.3404541015625, -0.322113037109375, -0.30377197265625, -0.285430908203125, -0.26708984375, -0.248748779296875, -0.23040771484375, -0.212066650390625, -0.1937255859375, -0.175384521484375, -0.15704345703125, -0.138702392578125, -0.120361328125, -0.102020263671875, -0.08367919921875, -0.065338134765625, -0.0469970703125, -0.028656005859375, -0.01031494140625, 0.008026123046875, 0.0263671875, 0.044708251953125, 0.06304931640625, 0.081390380859375, 0.0997314453125, 0.118072509765625, 0.13641357421875, 0.154754638671875, 0.173095703125, 0.191436767578125, 0.20977783203125, 0.228118896484375, 0.2464599609375, 0.264801025390625, 0.28314208984375, 0.301483154296875, 0.31982421875, 0.338165283203125, 0.35650634765625, 0.374847412109375, 0.3931884765625, 0.411529541015625, 0.42987060546875, 0.448211669921875, 0.466552734375, 0.484893798828125, 0.50323486328125, 0.521575927734375, 0.5399169921875, 0.558258056640625, 0.57659912109375, 0.594940185546875, 0.61328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 12.0, 7.0, 15.0, 24.0, 51.0, 67.0, 139.0, 276.0, 575.0, 1470.0, 4763.0, 27533.0, 357622.0, 594042.0, 51391.0, 7161.0, 1968.0, 750.0, 306.0, 184.0, 74.0, 49.0, 27.0, 19.0, 9.0, 9.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2093505859375, -0.20163536071777344, -0.19392013549804688, -0.1862049102783203, -0.17848968505859375, -0.1707744598388672, -0.16305923461914062, -0.15534400939941406, -0.1476287841796875, -0.13991355895996094, -0.13219833374023438, -0.12448310852050781, -0.11676788330078125, -0.10905265808105469, -0.10133743286132812, -0.09362220764160156, -0.085906982421875, -0.07819175720214844, -0.07047653198242188, -0.06276130676269531, -0.05504608154296875, -0.04733085632324219, -0.039615631103515625, -0.03190040588378906, -0.0241851806640625, -0.016469955444335938, -0.008754730224609375, -0.0010395050048828125, 0.00667572021484375, 0.014390945434570312, 0.022106170654296875, 0.029821395874023438, 0.03753662109375, 0.04525184631347656, 0.052967071533203125, 0.06068229675292969, 0.06839752197265625, 0.07611274719238281, 0.08382797241210938, 0.09154319763183594, 0.0992584228515625, 0.10697364807128906, 0.11468887329101562, 0.12240409851074219, 0.13011932373046875, 0.1378345489501953, 0.14554977416992188, 0.15326499938964844, 0.160980224609375, 0.16869544982910156, 0.17641067504882812, 0.1841259002685547, 0.19184112548828125, 0.1995563507080078, 0.20727157592773438, 0.21498680114746094, 0.2227020263671875, 0.23041725158691406, 0.23813247680664062, 0.2458477020263672, 0.25356292724609375, 0.2612781524658203, 0.2689933776855469, 0.27670860290527344, 0.284423828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 21.0, 38.0, 53.0, 135.0, 178.0, 202.0, 160.0, 114.0, 54.0, 26.0, 14.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849102020263672e-05, -2.675037831068039e-05, -2.500973641872406e-05, -2.326909452676773e-05, -2.15284526348114e-05, -1.9787810742855072e-05, -1.8047168850898743e-05, -1.6306526958942413e-05, -1.4565885066986084e-05, -1.2825243175029755e-05, -1.1084601283073425e-05, -9.343959391117096e-06, -7.603317499160767e-06, -5.862675607204437e-06, -4.122033715248108e-06, -2.3813918232917786e-06, -6.407499313354492e-07, 1.0998919606208801e-06, 2.8405338525772095e-06, 4.581175744533539e-06, 6.321817636489868e-06, 8.062459528446198e-06, 9.803101420402527e-06, 1.1543743312358856e-05, 1.3284385204315186e-05, 1.5025027096271515e-05, 1.6765668988227844e-05, 1.8506310880184174e-05, 2.0246952772140503e-05, 2.1987594664096832e-05, 2.372823655605316e-05, 2.546887844800949e-05, 2.720952033996582e-05, 2.895016223192215e-05, 3.069080412387848e-05, 3.243144601583481e-05, 3.417208790779114e-05, 3.591272979974747e-05, 3.7653371691703796e-05, 3.9394013583660126e-05, 4.1134655475616455e-05, 4.2875297367572784e-05, 4.4615939259529114e-05, 4.635658115148544e-05, 4.809722304344177e-05, 4.98378649353981e-05, 5.157850682735443e-05, 5.331914871931076e-05, 5.505979061126709e-05, 5.680043250322342e-05, 5.854107439517975e-05, 6.028171628713608e-05, 6.202235817909241e-05, 6.376300007104874e-05, 6.550364196300507e-05, 6.72442838549614e-05, 6.898492574691772e-05, 7.072556763887405e-05, 7.246620953083038e-05, 7.420685142278671e-05, 7.594749331474304e-05, 7.768813520669937e-05, 7.94287770986557e-05, 8.116941899061203e-05, 8.291006088256836e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 18.0, 15.0, 48.0, 59.0, 91.0, 214.0, 527.0, 1468.0, 5365.0, 30572.0, 386623.0, 565807.0, 47647.0, 7081.0, 1790.0, 606.0, 249.0, 143.0, 68.0, 41.0, 32.0, 18.0, 17.0, 13.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2769584655761719, -0.26949310302734375, -0.2620277404785156, -0.2545623779296875, -0.24709701538085938, -0.23963165283203125, -0.23216629028320312, -0.224700927734375, -0.21723556518554688, -0.20977020263671875, -0.20230484008789062, -0.1948394775390625, -0.18737411499023438, -0.17990875244140625, -0.17244338989257812, -0.16497802734375, -0.15751266479492188, -0.15004730224609375, -0.14258193969726562, -0.1351165771484375, -0.12765121459960938, -0.12018585205078125, -0.11272048950195312, -0.105255126953125, -0.09778976440429688, -0.09032440185546875, -0.08285903930664062, -0.0753936767578125, -0.06792831420898438, -0.06046295166015625, -0.052997589111328125, -0.0455322265625, -0.038066864013671875, -0.03060150146484375, -0.023136138916015625, -0.0156707763671875, -0.008205413818359375, -0.00074005126953125, 0.006725311279296875, 0.014190673828125, 0.021656036376953125, 0.02912139892578125, 0.036586761474609375, 0.0440521240234375, 0.051517486572265625, 0.05898284912109375, 0.06644821166992188, 0.07391357421875, 0.08137893676757812, 0.08884429931640625, 0.09630966186523438, 0.1037750244140625, 0.11124038696289062, 0.11870574951171875, 0.12617111206054688, 0.133636474609375, 0.14110183715820312, 0.14856719970703125, 0.15603256225585938, 0.1634979248046875, 0.17096328735351562, 0.17842864990234375, 0.18589401245117188, 0.193359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 10.0, 17.0, 22.0, 36.0, 45.0, 74.0, 85.0, 88.0, 110.0, 118.0, 86.0, 69.0, 75.0, 28.0, 30.0, 21.0, 25.0, 15.0, 9.0, 5.0, 5.0, 3.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1976318359375, -0.19101715087890625, -0.1844024658203125, -0.17778778076171875, -0.171173095703125, -0.16455841064453125, -0.1579437255859375, -0.15132904052734375, -0.14471435546875, -0.13809967041015625, -0.1314849853515625, -0.12487030029296875, -0.118255615234375, -0.11164093017578125, -0.1050262451171875, -0.09841156005859375, -0.091796875, -0.08518218994140625, -0.0785675048828125, -0.07195281982421875, -0.065338134765625, -0.05872344970703125, -0.0521087646484375, -0.04549407958984375, -0.03887939453125, -0.03226470947265625, -0.0256500244140625, -0.01903533935546875, -0.012420654296875, -0.00580596923828125, 0.0008087158203125, 0.00742340087890625, 0.0140380859375, 0.02065277099609375, 0.0272674560546875, 0.03388214111328125, 0.040496826171875, 0.04711151123046875, 0.0537261962890625, 0.06034088134765625, 0.06695556640625, 0.07357025146484375, 0.0801849365234375, 0.08679962158203125, 0.093414306640625, 0.10002899169921875, 0.1066436767578125, 0.11325836181640625, 0.119873046875, 0.12648773193359375, 0.1331024169921875, 0.13971710205078125, 0.146331787109375, 0.15294647216796875, 0.1595611572265625, 0.16617584228515625, 0.17279052734375, 0.17940521240234375, 0.1860198974609375, 0.19263458251953125, 0.199249267578125, 0.20586395263671875, 0.2124786376953125, 0.21909332275390625, 0.2257080078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 21.0, 80.0, 295.0, 459.0, 107.0, 32.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.836428642272949, -6.480191707611084, -6.123955249786377, -5.767718315124512, -5.411481857299805, -5.0552449226379395, -4.699007987976074, -4.342771530151367, -3.986534833908081, -3.630298137664795, -3.274061441421509, -2.9178247451782227, -2.5615878105163574, -2.2053513526916504, -1.8491144180297852, -1.492877721786499, -1.136641025543213, -0.7804043292999268, -0.42416757345199585, -0.06793081760406494, 0.2883058786392212, 0.6445425748825073, 1.000779390335083, 1.3570160865783691, 1.7132527828216553, 2.0694894790649414, 2.4257261753082275, 2.7819628715515137, 3.138199806213379, 3.494436264038086, 3.850673198699951, 4.206910133361816, 4.563146591186523, 4.919383525848389, 5.275619983673096, 5.631856918334961, 5.988093376159668, 6.344330310821533, 6.700567245483398, 7.0568037033081055, 7.4130401611328125, 7.769277095794678, 8.125514030456543, 8.48175048828125, 8.837986946105957, 9.194223403930664, 9.550460815429688, 9.906697273254395, 10.262933731079102, 10.619170188903809, 10.975407600402832, 11.331644058227539, 11.687880516052246, 12.044116973876953, 12.400354385375977, 12.756590843200684, 13.112828254699707, 13.469064712524414, 13.825302124023438, 14.181538581848145, 14.537775039672852, 14.894011497497559, 15.250248908996582, 15.606485366821289, 15.962721824645996]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 12.0, 17.0, 16.0, 24.0, 14.0, 30.0, 28.0, 29.0, 42.0, 32.0, 44.0, 47.0, 51.0, 66.0, 37.0, 42.0, 59.0, 48.0, 54.0, 36.0, 42.0, 33.0, 28.0, 24.0, 20.0, 22.0, 18.0, 18.0, 9.0, 9.0, 8.0, 6.0, 7.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7749481201171875, -3.656970500946045, -3.5389928817749023, -3.421015501022339, -3.3030378818511963, -3.1850602626800537, -3.067082643508911, -2.9491052627563477, -2.831127643585205, -2.7131500244140625, -2.59517240524292, -2.4771950244903564, -2.359217405319214, -2.2412397861480713, -2.1232621669769287, -2.0052847862243652, -1.887307047843933, -1.7693294286727905, -1.6513519287109375, -1.533374309539795, -1.415396809577942, -1.2974191904067993, -1.1794416904449463, -1.0614640712738037, -0.9434865117073059, -0.8255089521408081, -0.7075313925743103, -0.5895538330078125, -0.4715762436389923, -0.3535986542701721, -0.23562109470367432, -0.11764353513717651, 0.00033402442932128906, 0.11831159144639969, 0.2362891584634781, 0.3542667329311371, 0.4722442924976349, 0.5902218818664551, 0.7081994414329529, 0.8261770009994507, 0.9441545605659485, 1.0621321201324463, 1.1801097393035889, 1.298087239265442, 1.4160648584365845, 1.5340423583984375, 1.65201997756958, 1.7699975967407227, 1.8879750967025757, 2.0059525966644287, 2.1239302158355713, 2.241907835006714, 2.3598854541778564, 2.47786283493042, 2.5958404541015625, 2.713818073272705, 2.8317956924438477, 2.9497733116149902, 3.067750930786133, 3.1857283115386963, 3.303705930709839, 3.4216835498809814, 3.539661169052124, 3.6576385498046875, 3.77561616897583]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 17.0, 18.0, 43.0, 59.0, 100.0, 165.0, 368.0, 945.0, 2746.0, 15327.0, 3808720.0, 351967.0, 9937.0, 2220.0, 823.0, 362.0, 176.0, 100.0, 65.0, 31.0, 25.0, 14.0, 15.0, 9.0, 8.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88134765625, -0.8370437622070312, -0.7927398681640625, -0.7484359741210938, -0.704132080078125, -0.6598281860351562, -0.6155242919921875, -0.5712203979492188, -0.52691650390625, -0.48261260986328125, -0.4383087158203125, -0.39400482177734375, -0.349700927734375, -0.30539703369140625, -0.2610931396484375, -0.21678924560546875, -0.1724853515625, -0.12818145751953125, -0.0838775634765625, -0.03957366943359375, 0.004730224609375, 0.04903411865234375, 0.0933380126953125, 0.13764190673828125, 0.18194580078125, 0.22624969482421875, 0.2705535888671875, 0.31485748291015625, 0.359161376953125, 0.40346527099609375, 0.4477691650390625, 0.49207305908203125, 0.536376953125, 0.5806808471679688, 0.6249847412109375, 0.6692886352539062, 0.713592529296875, 0.7578964233398438, 0.8022003173828125, 0.8465042114257812, 0.89080810546875, 0.9351119995117188, 0.9794158935546875, 1.0237197875976562, 1.068023681640625, 1.1123275756835938, 1.1566314697265625, 1.2009353637695312, 1.2452392578125, 1.2895431518554688, 1.3338470458984375, 1.3781509399414062, 1.422454833984375, 1.4667587280273438, 1.5110626220703125, 1.5553665161132812, 1.59967041015625, 1.6439743041992188, 1.6882781982421875, 1.7325820922851562, 1.776885986328125, 1.8211898803710938, 1.8654937744140625, 1.9097976684570312, 1.9541015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 10.0, 9.0, 16.0, 29.0, 28.0, 37.0, 44.0, 50.0, 62.0, 67.0, 73.0, 85.0, 63.0, 61.0, 63.0, 67.0, 59.0, 32.0, 32.0, 24.0, 24.0, 23.0, 14.0, 10.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.14116477966308594, -0.13376998901367188, -0.1263751983642578, -0.11898040771484375, -0.11158561706542969, -0.10419082641601562, -0.09679603576660156, -0.0894012451171875, -0.08200645446777344, -0.07461166381835938, -0.06721687316894531, -0.05982208251953125, -0.05242729187011719, -0.045032501220703125, -0.03763771057128906, -0.030242919921875, -0.022848129272460938, -0.015453338623046875, -0.008058547973632812, -0.00066375732421875, 0.0067310333251953125, 0.014125823974609375, 0.021520614624023438, 0.0289154052734375, 0.03631019592285156, 0.043704986572265625, 0.05109977722167969, 0.05849456787109375, 0.06588935852050781, 0.07328414916992188, 0.08067893981933594, 0.08807373046875, 0.09546852111816406, 0.10286331176757812, 0.11025810241699219, 0.11765289306640625, 0.1250476837158203, 0.13244247436523438, 0.13983726501464844, 0.1472320556640625, 0.15462684631347656, 0.16202163696289062, 0.1694164276123047, 0.17681121826171875, 0.1842060089111328, 0.19160079956054688, 0.19899559020996094, 0.206390380859375, 0.21378517150878906, 0.22117996215820312, 0.2285747528076172, 0.23596954345703125, 0.2433643341064453, 0.2507591247558594, 0.25815391540527344, 0.2655487060546875, 0.27294349670410156, 0.2803382873535156, 0.2877330780029297, 0.29512786865234375, 0.3025226593017578, 0.3099174499511719, 0.31731224060058594, 0.32470703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 13.0, 20.0, 46.0, 102.0, 197.0, 383.0, 929.0, 3065.0, 20925.0, 3953860.0, 203971.0, 7952.0, 1615.0, 599.0, 272.0, 150.0, 75.0, 58.0, 26.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0278778076171875, -0.986419677734375, -0.9449615478515625, -0.90350341796875, -0.8620452880859375, -0.820587158203125, -0.7791290283203125, -0.7376708984375, -0.6962127685546875, -0.654754638671875, -0.6132965087890625, -0.57183837890625, -0.5303802490234375, -0.488922119140625, -0.4474639892578125, -0.406005859375, -0.3645477294921875, -0.323089599609375, -0.2816314697265625, -0.24017333984375, -0.1987152099609375, -0.157257080078125, -0.1157989501953125, -0.0743408203125, -0.0328826904296875, 0.008575439453125, 0.0500335693359375, 0.09149169921875, 0.1329498291015625, 0.174407958984375, 0.2158660888671875, 0.25732421875, 0.2987823486328125, 0.340240478515625, 0.3816986083984375, 0.42315673828125, 0.4646148681640625, 0.506072998046875, 0.5475311279296875, 0.5889892578125, 0.6304473876953125, 0.671905517578125, 0.7133636474609375, 0.75482177734375, 0.7962799072265625, 0.837738037109375, 0.8791961669921875, 0.920654296875, 0.9621124267578125, 1.003570556640625, 1.0450286865234375, 1.08648681640625, 1.1279449462890625, 1.169403076171875, 1.2108612060546875, 1.2523193359375, 1.2937774658203125, 1.335235595703125, 1.3766937255859375, 1.41815185546875, 1.4596099853515625, 1.501068115234375, 1.5425262451171875, 1.583984375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 13.0, 22.0, 26.0, 65.0, 203.0, 2129.0, 1280.0, 172.0, 58.0, 36.0, 23.0, 14.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5027847290039062, -0.4865264892578125, -0.47026824951171875, -0.454010009765625, -0.43775177001953125, -0.4214935302734375, -0.40523529052734375, -0.38897705078125, -0.37271881103515625, -0.3564605712890625, -0.34020233154296875, -0.323944091796875, -0.30768585205078125, -0.2914276123046875, -0.27516937255859375, -0.2589111328125, -0.24265289306640625, -0.2263946533203125, -0.21013641357421875, -0.193878173828125, -0.17761993408203125, -0.1613616943359375, -0.14510345458984375, -0.12884521484375, -0.11258697509765625, -0.0963287353515625, -0.08007049560546875, -0.063812255859375, -0.04755401611328125, -0.0312957763671875, -0.01503753662109375, 0.001220703125, 0.01747894287109375, 0.0337371826171875, 0.04999542236328125, 0.066253662109375, 0.08251190185546875, 0.0987701416015625, 0.11502838134765625, 0.13128662109375, 0.14754486083984375, 0.1638031005859375, 0.18006134033203125, 0.196319580078125, 0.21257781982421875, 0.2288360595703125, 0.24509429931640625, 0.2613525390625, 0.27761077880859375, 0.2938690185546875, 0.31012725830078125, 0.326385498046875, 0.34264373779296875, 0.3589019775390625, 0.37516021728515625, 0.39141845703125, 0.40767669677734375, 0.4239349365234375, 0.44019317626953125, 0.456451416015625, 0.47270965576171875, 0.4889678955078125, 0.5052261352539062, 0.521484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 28.0, 201.0, 637.0, 116.0, 16.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-11.237338066101074, -11.038126945495605, -10.838916778564453, -10.639705657958984, -10.440495491027832, -10.241284370422363, -10.042074203491211, -9.842863082885742, -9.643651962280273, -9.444440841674805, -9.245230674743652, -9.046019554138184, -8.846809387207031, -8.647598266601562, -8.44838809967041, -8.249176979064941, -8.049966812133789, -7.8507561683654785, -7.651545524597168, -7.452334880828857, -7.253124237060547, -7.053913116455078, -6.854702472686768, -6.655491828918457, -6.4562811851501465, -6.257070541381836, -6.057859897613525, -5.858649253845215, -5.659438133239746, -5.4602274894714355, -5.261016845703125, -5.0618062019348145, -4.862595081329346, -4.663384437561035, -4.464173793792725, -4.264963150024414, -4.065752029418945, -3.866541624069214, -3.667330741882324, -3.4681200981140137, -3.268909454345703, -3.0696988105773926, -2.870488166809082, -2.6712772846221924, -2.472066640853882, -2.2728559970855713, -2.0736451148986816, -1.874434471130371, -1.6752238273620605, -1.47601318359375, -1.27680242061615, -1.0775916576385498, -0.8783810138702393, -0.6791703104972839, -0.4799596071243286, -0.2807488441467285, -0.08153820037841797, 0.11767250299453735, 0.3168832063674927, 0.516093909740448, 0.7153046131134033, 0.9145153164863586, 1.113726019859314, 1.312936782836914, 1.5121474266052246]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 10.0, 6.0, 23.0, 21.0, 24.0, 34.0, 24.0, 31.0, 42.0, 51.0, 46.0, 64.0, 52.0, 60.0, 58.0, 50.0, 56.0, 50.0, 51.0, 46.0, 32.0, 28.0, 26.0, 27.0, 17.0, 18.0, 9.0, 8.0, 10.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.520456075668335, -1.4812712669372559, -1.4420864582061768, -1.4029016494750977, -1.3637168407440186, -1.3245320320129395, -1.2853472232818604, -1.2461625337600708, -1.2069777250289917, -1.1677929162979126, -1.1286081075668335, -1.0894232988357544, -1.0502384901046753, -1.0110538005828857, -0.9718689322471619, -0.9326841831207275, -0.8934993147850037, -0.8543145060539246, -0.8151296973228455, -0.7759449481964111, -0.736760139465332, -0.6975753307342529, -0.6583905220031738, -0.6192057132720947, -0.5800209045410156, -0.5408360958099365, -0.5016512870788574, -0.4624665081501007, -0.423281729221344, -0.3840969204902649, -0.3449121117591858, -0.3057273328304291, -0.26654261350631714, -0.22735781967639923, -0.18817302584648132, -0.14898821711540222, -0.10980342328548431, -0.0706186294555664, -0.031433820724487305, 0.007750958204269409, 0.04693576693534851, 0.08612056076526642, 0.12530535459518433, 0.16449016332626343, 0.20367495715618134, 0.24285975098609924, 0.28204455971717834, 0.32122933864593506, 0.36041414737701416, 0.39959895610809326, 0.43878373503685, 0.4779685437679291, 0.5171533226966858, 0.5563381314277649, 0.595522940158844, 0.6347076892852783, 0.6738924980163574, 0.7130773067474365, 0.7522621154785156, 0.7914469242095947, 0.830631673336029, 0.8698164820671082, 0.9090012907981873, 0.9481860399246216, 0.9873709082603455]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 11.0, 11.0, 23.0, 27.0, 44.0, 84.0, 115.0, 179.0, 251.0, 468.0, 890.0, 1895.0, 4348.0, 10882.0, 33016.0, 120173.0, 529693.0, 258169.0, 58105.0, 18112.0, 6599.0, 2611.0, 1290.0, 661.0, 347.0, 207.0, 106.0, 74.0, 42.0, 34.0, 35.0, 14.0, 12.0, 13.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5654296875, -0.54345703125, -0.521484375, -0.49951171875, -0.4775390625, -0.45556640625, -0.43359375, -0.41162109375, -0.3896484375, -0.36767578125, -0.345703125, -0.32373046875, -0.3017578125, -0.27978515625, -0.2578125, -0.23583984375, -0.2138671875, -0.19189453125, -0.169921875, -0.14794921875, -0.1259765625, -0.10400390625, -0.08203125, -0.06005859375, -0.0380859375, -0.01611328125, 0.005859375, 0.02783203125, 0.0498046875, 0.07177734375, 0.09375, 0.11572265625, 0.1376953125, 0.15966796875, 0.181640625, 0.20361328125, 0.2255859375, 0.24755859375, 0.26953125, 0.29150390625, 0.3134765625, 0.33544921875, 0.357421875, 0.37939453125, 0.4013671875, 0.42333984375, 0.4453125, 0.46728515625, 0.4892578125, 0.51123046875, 0.533203125, 0.55517578125, 0.5771484375, 0.59912109375, 0.62109375, 0.64306640625, 0.6650390625, 0.68701171875, 0.708984375, 0.73095703125, 0.7529296875, 0.77490234375, 0.796875, 0.81884765625, 0.8408203125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 14.0, 22.0, 34.0, 25.0, 23.0, 28.0, 35.0, 35.0, 40.0, 59.0, 52.0, 55.0, 55.0, 62.0, 56.0, 58.0, 57.0, 39.0, 35.0, 45.0, 29.0, 32.0, 17.0, 13.0, 20.0, 9.0, 13.0, 8.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.151611328125, -0.14554595947265625, -0.1394805908203125, -0.13341522216796875, -0.127349853515625, -0.12128448486328125, -0.1152191162109375, -0.10915374755859375, -0.10308837890625, -0.09702301025390625, -0.0909576416015625, -0.08489227294921875, -0.078826904296875, -0.07276153564453125, -0.0666961669921875, -0.06063079833984375, -0.0545654296875, -0.04850006103515625, -0.0424346923828125, -0.03636932373046875, -0.030303955078125, -0.02423858642578125, -0.0181732177734375, -0.01210784912109375, -0.00604248046875, 2.288818359375e-05, 0.0060882568359375, 0.01215362548828125, 0.018218994140625, 0.02428436279296875, 0.0303497314453125, 0.03641510009765625, 0.04248046875, 0.04854583740234375, 0.0546112060546875, 0.06067657470703125, 0.066741943359375, 0.07280731201171875, 0.0788726806640625, 0.08493804931640625, 0.09100341796875, 0.09706878662109375, 0.1031341552734375, 0.10919952392578125, 0.115264892578125, 0.12133026123046875, 0.1273956298828125, 0.13346099853515625, 0.1395263671875, 0.14559173583984375, 0.1516571044921875, 0.15772247314453125, 0.163787841796875, 0.16985321044921875, 0.1759185791015625, 0.18198394775390625, 0.18804931640625, 0.19411468505859375, 0.2001800537109375, 0.20624542236328125, 0.212310791015625, 0.21837615966796875, 0.2244415283203125, 0.23050689697265625, 0.236572265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 3.0, 7.0, 7.0, 7.0, 14.0, 7.0, 12.0, 23.0, 30.0, 40.0, 58.0, 77.0, 118.0, 255.0, 414.0, 785.0, 1736.0, 4224.0, 12335.0, 43323.0, 217363.0, 600549.0, 124059.0, 28368.0, 8643.0, 3155.0, 1398.0, 639.0, 317.0, 207.0, 135.0, 76.0, 40.0, 34.0, 15.0, 14.0, 14.0, 13.0, 8.0, 7.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67578125, -0.6535110473632812, -0.6312408447265625, -0.6089706420898438, -0.586700439453125, -0.5644302368164062, -0.5421600341796875, -0.5198898315429688, -0.49761962890625, -0.47534942626953125, -0.4530792236328125, -0.43080902099609375, -0.408538818359375, -0.38626861572265625, -0.3639984130859375, -0.34172821044921875, -0.3194580078125, -0.29718780517578125, -0.2749176025390625, -0.25264739990234375, -0.230377197265625, -0.20810699462890625, -0.1858367919921875, -0.16356658935546875, -0.14129638671875, -0.11902618408203125, -0.0967559814453125, -0.07448577880859375, -0.052215576171875, -0.02994537353515625, -0.0076751708984375, 0.01459503173828125, 0.036865234375, 0.05913543701171875, 0.0814056396484375, 0.10367584228515625, 0.125946044921875, 0.14821624755859375, 0.1704864501953125, 0.19275665283203125, 0.21502685546875, 0.23729705810546875, 0.2595672607421875, 0.28183746337890625, 0.304107666015625, 0.32637786865234375, 0.3486480712890625, 0.37091827392578125, 0.3931884765625, 0.41545867919921875, 0.4377288818359375, 0.45999908447265625, 0.482269287109375, 0.5045394897460938, 0.5268096923828125, 0.5490798950195312, 0.57135009765625, 0.5936203002929688, 0.6158905029296875, 0.6381607055664062, 0.660430908203125, 0.6827011108398438, 0.7049713134765625, 0.7272415161132812, 0.74951171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 10.0, 11.0, 13.0, 18.0, 24.0, 16.0, 25.0, 28.0, 37.0, 41.0, 43.0, 59.0, 39.0, 48.0, 57.0, 55.0, 51.0, 51.0, 40.0, 40.0, 38.0, 45.0, 33.0, 31.0, 22.0, 18.0, 24.0, 12.0, 8.0, 7.0, 10.0, 9.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.78955078125, -0.7642898559570312, -0.7390289306640625, -0.7137680053710938, -0.688507080078125, -0.6632461547851562, -0.6379852294921875, -0.6127243041992188, -0.58746337890625, -0.5622024536132812, -0.5369415283203125, -0.5116806030273438, -0.486419677734375, -0.46115875244140625, -0.4358978271484375, -0.41063690185546875, -0.3853759765625, -0.36011505126953125, -0.3348541259765625, -0.30959320068359375, -0.284332275390625, -0.25907135009765625, -0.2338104248046875, -0.20854949951171875, -0.18328857421875, -0.15802764892578125, -0.1327667236328125, -0.10750579833984375, -0.082244873046875, -0.05698394775390625, -0.0317230224609375, -0.00646209716796875, 0.018798828125, 0.04405975341796875, 0.0693206787109375, 0.09458160400390625, 0.119842529296875, 0.14510345458984375, 0.1703643798828125, 0.19562530517578125, 0.22088623046875, 0.24614715576171875, 0.2714080810546875, 0.29666900634765625, 0.321929931640625, 0.34719085693359375, 0.3724517822265625, 0.39771270751953125, 0.4229736328125, 0.44823455810546875, 0.4734954833984375, 0.49875640869140625, 0.524017333984375, 0.5492782592773438, 0.5745391845703125, 0.5998001098632812, 0.62506103515625, 0.6503219604492188, 0.6755828857421875, 0.7008438110351562, 0.726104736328125, 0.7513656616210938, 0.7766265869140625, 0.8018875122070312, 0.8271484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 5.0, 12.0, 13.0, 45.0, 145.0, 375.0, 1438.0, 20299.0, 1013143.0, 11538.0, 1061.0, 278.0, 120.0, 43.0, 14.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.230377197265625, -1.19122314453125, -1.152069091796875, -1.1129150390625, -1.073760986328125, -1.03460693359375, -0.995452880859375, -0.956298828125, -0.917144775390625, -0.87799072265625, -0.838836669921875, -0.7996826171875, -0.760528564453125, -0.72137451171875, -0.682220458984375, -0.64306640625, -0.603912353515625, -0.56475830078125, -0.525604248046875, -0.4864501953125, -0.447296142578125, -0.40814208984375, -0.368988037109375, -0.329833984375, -0.290679931640625, -0.25152587890625, -0.212371826171875, -0.1732177734375, -0.134063720703125, -0.09490966796875, -0.055755615234375, -0.0166015625, 0.022552490234375, 0.06170654296875, 0.100860595703125, 0.1400146484375, 0.179168701171875, 0.21832275390625, 0.257476806640625, 0.296630859375, 0.335784912109375, 0.37493896484375, 0.414093017578125, 0.4532470703125, 0.492401123046875, 0.53155517578125, 0.570709228515625, 0.60986328125, 0.649017333984375, 0.68817138671875, 0.727325439453125, 0.7664794921875, 0.805633544921875, 0.84478759765625, 0.883941650390625, 0.923095703125, 0.962249755859375, 1.00140380859375, 1.040557861328125, 1.0797119140625, 1.118865966796875, 1.15802001953125, 1.197174072265625, 1.236328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 8.0, 26.0, 37.0, 48.0, 88.0, 135.0, 168.0, 166.0, 104.0, 78.0, 51.0, 20.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1975250244140625e-05, -5.034264177083969e-05, -4.871003329753876e-05, -4.7077424824237823e-05, -4.544481635093689e-05, -4.3812207877635956e-05, -4.217959940433502e-05, -4.054699093103409e-05, -3.8914382457733154e-05, -3.728177398443222e-05, -3.564916551113129e-05, -3.401655703783035e-05, -3.238394856452942e-05, -3.0751340091228485e-05, -2.911873161792755e-05, -2.7486123144626617e-05, -2.5853514671325684e-05, -2.422090619802475e-05, -2.2588297724723816e-05, -2.0955689251422882e-05, -1.9323080778121948e-05, -1.7690472304821014e-05, -1.605786383152008e-05, -1.4425255358219147e-05, -1.2792646884918213e-05, -1.1160038411617279e-05, -9.527429938316345e-06, -7.894821465015411e-06, -6.2622129917144775e-06, -4.629604518413544e-06, -2.99699604511261e-06, -1.364387571811676e-06, 2.682209014892578e-07, 1.9008293747901917e-06, 3.5334378480911255e-06, 5.166046321392059e-06, 6.798654794692993e-06, 8.431263267993927e-06, 1.006387174129486e-05, 1.1696480214595795e-05, 1.3329088687896729e-05, 1.4961697161197662e-05, 1.6594305634498596e-05, 1.822691410779953e-05, 1.9859522581100464e-05, 2.1492131054401398e-05, 2.312473952770233e-05, 2.4757348001003265e-05, 2.63899564743042e-05, 2.8022564947605133e-05, 2.9655173420906067e-05, 3.1287781894207e-05, 3.2920390367507935e-05, 3.455299884080887e-05, 3.61856073141098e-05, 3.7818215787410736e-05, 3.945082426071167e-05, 4.1083432734012604e-05, 4.271604120731354e-05, 4.434864968061447e-05, 4.5981258153915405e-05, 4.761386662721634e-05, 4.924647510051727e-05, 5.087908357381821e-05, 5.251169204711914e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 19.0, 35.0, 60.0, 94.0, 159.0, 282.0, 1059.0, 31374.0, 1009323.0, 5096.0, 505.0, 211.0, 117.0, 86.0, 41.0, 24.0, 23.0, 11.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.115234375, -1.0758209228515625, -1.036407470703125, -0.9969940185546875, -0.95758056640625, -0.9181671142578125, -0.878753662109375, -0.8393402099609375, -0.7999267578125, -0.7605133056640625, -0.721099853515625, -0.6816864013671875, -0.64227294921875, -0.6028594970703125, -0.563446044921875, -0.5240325927734375, -0.484619140625, -0.4452056884765625, -0.405792236328125, -0.3663787841796875, -0.32696533203125, -0.2875518798828125, -0.248138427734375, -0.2087249755859375, -0.1693115234375, -0.1298980712890625, -0.090484619140625, -0.0510711669921875, -0.01165771484375, 0.0277557373046875, 0.067169189453125, 0.1065826416015625, 0.14599609375, 0.1854095458984375, 0.224822998046875, 0.2642364501953125, 0.30364990234375, 0.3430633544921875, 0.382476806640625, 0.4218902587890625, 0.4613037109375, 0.5007171630859375, 0.540130615234375, 0.5795440673828125, 0.61895751953125, 0.6583709716796875, 0.697784423828125, 0.7371978759765625, 0.776611328125, 0.8160247802734375, 0.855438232421875, 0.8948516845703125, 0.93426513671875, 0.9736785888671875, 1.013092041015625, 1.0525054931640625, 1.0919189453125, 1.1313323974609375, 1.170745849609375, 1.2101593017578125, 1.24957275390625, 1.2889862060546875, 1.328399658203125, 1.3678131103515625, 1.4072265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 35.0, 212.0, 530.0, 171.0, 35.0, 8.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.172760009765625, -1.12677001953125, -1.080780029296875, -1.0347900390625, -0.988800048828125, -0.94281005859375, -0.896820068359375, -0.850830078125, -0.804840087890625, -0.75885009765625, -0.712860107421875, -0.6668701171875, -0.620880126953125, -0.57489013671875, -0.528900146484375, -0.48291015625, -0.436920166015625, -0.39093017578125, -0.344940185546875, -0.2989501953125, -0.252960205078125, -0.20697021484375, -0.160980224609375, -0.114990234375, -0.069000244140625, -0.02301025390625, 0.022979736328125, 0.0689697265625, 0.114959716796875, 0.16094970703125, 0.206939697265625, 0.2529296875, 0.298919677734375, 0.34490966796875, 0.390899658203125, 0.4368896484375, 0.482879638671875, 0.52886962890625, 0.574859619140625, 0.620849609375, 0.666839599609375, 0.71282958984375, 0.758819580078125, 0.8048095703125, 0.850799560546875, 0.89678955078125, 0.942779541015625, 0.98876953125, 1.034759521484375, 1.08074951171875, 1.126739501953125, 1.1727294921875, 1.218719482421875, 1.26470947265625, 1.310699462890625, 1.356689453125, 1.402679443359375, 1.44866943359375, 1.494659423828125, 1.5406494140625, 1.586639404296875, 1.63262939453125, 1.678619384765625, 1.724609375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 19.0, 39.0, 93.0, 336.0, 335.0, 134.0, 33.0, 10.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6794753074645996, -3.3204543590545654, -2.9614334106445312, -2.602412223815918, -2.243391275405884, -1.8843703269958496, -1.5253491401672363, -1.1663281917572021, -0.807307243347168, -0.448286235332489, -0.08926522731781006, 0.26975584030151367, 0.6287767887115479, 0.987797737121582, 1.3468189239501953, 1.7058398723602295, 2.0648608207702637, 2.423881769180298, 2.782902717590332, 3.1419239044189453, 3.5009448528289795, 3.8599658012390137, 4.218986988067627, 4.578007698059082, 4.937028884887695, 5.296050071716309, 5.655070781707764, 6.014091968536377, 6.373112678527832, 6.732133865356445, 7.091155052185059, 7.450176239013672, 7.809196472167969, 8.168217658996582, 8.527238845825195, 8.886259078979492, 9.245280265808105, 9.604301452636719, 9.963322639465332, 10.322343826293945, 10.681364059448242, 11.040385246276855, 11.399406433105469, 11.758426666259766, 12.117447853088379, 12.476469039916992, 12.835490226745605, 13.194511413574219, 13.553532600402832, 13.912553787231445, 14.271574974060059, 14.630596160888672, 14.989616394042969, 15.348637580871582, 15.707658767700195, 16.066679000854492, 16.425701141357422, 16.78472137451172, 17.14374351501465, 17.502763748168945, 17.861785888671875, 18.220806121826172, 18.57982635498047, 18.9388484954834, 19.297868728637695]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 3.0, 9.0, 9.0, 11.0, 13.0, 15.0, 13.0, 14.0, 20.0, 36.0, 33.0, 41.0, 39.0, 32.0, 43.0, 37.0, 57.0, 46.0, 47.0, 42.0, 39.0, 41.0, 50.0, 30.0, 33.0, 28.0, 21.0, 39.0, 25.0, 25.0, 17.0, 21.0, 13.0, 10.0, 3.0, 8.0, 3.0, 2.0, 6.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.138191223144531, -4.019832134246826, -3.901472806930542, -3.783113479614258, -3.6647541522979736, -3.5463948249816895, -3.4280357360839844, -3.3096764087677, -3.191317081451416, -3.072957754135132, -2.9545986652374268, -2.8362393379211426, -2.7178800106048584, -2.599520683288574, -2.481161594390869, -2.362802267074585, -2.24444317817688, -2.1260838508605957, -2.0077247619628906, -1.8893654346466064, -1.7710061073303223, -1.6526468992233276, -1.534287691116333, -1.4159283638000488, -1.2975691556930542, -1.1792099475860596, -1.0608506202697754, -0.9424914121627808, -0.8241321444511414, -0.705772876739502, -0.5874136686325073, -0.4690544009208679, -0.3506953716278076, -0.2323361188173294, -0.1139768660068512, 0.00438237190246582, 0.12274163961410522, 0.24110090732574463, 0.35946011543273926, 0.47781938314437866, 0.5961786508560181, 0.7145379185676575, 0.8328971862792969, 0.9512563943862915, 1.0696156024932861, 1.1879749298095703, 1.306334137916565, 1.4246933460235596, 1.5430526733398438, 1.6614118814468384, 1.7797712087631226, 1.8981304168701172, 2.0164897441864014, 2.1348490715026855, 2.2532081604003906, 2.371567487716675, 2.489926815032959, 2.608286142349243, 2.7266452312469482, 2.8450045585632324, 2.9633638858795166, 3.081723213195801, 3.200082302093506, 3.31844162940979, 3.436800718307495]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 10.0, 8.0, 16.0, 19.0, 35.0, 56.0, 56.0, 78.0, 132.0, 169.0, 290.0, 436.0, 732.0, 1358.0, 2491.0, 5211.0, 13318.0, 43272.0, 374223.0, 3620227.0, 93592.0, 22271.0, 8065.0, 3622.0, 1888.0, 1034.0, 554.0, 347.0, 247.0, 159.0, 107.0, 67.0, 59.0, 34.0, 24.0, 19.0, 15.0, 11.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.5380859375, -0.5228157043457031, -0.5075454711914062, -0.4922752380371094, -0.4770050048828125, -0.4617347717285156, -0.44646453857421875, -0.4311943054199219, -0.415924072265625, -0.4006538391113281, -0.38538360595703125, -0.3701133728027344, -0.3548431396484375, -0.3395729064941406, -0.32430267333984375, -0.3090324401855469, -0.29376220703125, -0.2784919738769531, -0.26322174072265625, -0.24795150756835938, -0.2326812744140625, -0.21741104125976562, -0.20214080810546875, -0.18687057495117188, -0.171600341796875, -0.15633010864257812, -0.14105987548828125, -0.12578964233398438, -0.1105194091796875, -0.09524917602539062, -0.07997894287109375, -0.06470870971679688, -0.0494384765625, -0.034168243408203125, -0.01889801025390625, -0.003627777099609375, 0.0116424560546875, 0.026912689208984375, 0.04218292236328125, 0.057453155517578125, 0.072723388671875, 0.08799362182617188, 0.10326385498046875, 0.11853408813476562, 0.1338043212890625, 0.14907455444335938, 0.16434478759765625, 0.17961502075195312, 0.19488525390625, 0.21015548706054688, 0.22542572021484375, 0.24069595336914062, 0.2559661865234375, 0.2712364196777344, 0.28650665283203125, 0.3017768859863281, 0.317047119140625, 0.3323173522949219, 0.34758758544921875, 0.3628578186035156, 0.3781280517578125, 0.3933982849121094, 0.40866851806640625, 0.4239387512207031, 0.439208984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 6.0, 11.0, 14.0, 22.0, 24.0, 29.0, 36.0, 36.0, 42.0, 62.0, 55.0, 45.0, 48.0, 56.0, 39.0, 62.0, 51.0, 34.0, 43.0, 36.0, 33.0, 42.0, 32.0, 25.0, 15.0, 17.0, 14.0, 15.0, 7.0, 11.0, 14.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.15790748596191406, -0.15114212036132812, -0.1443767547607422, -0.13761138916015625, -0.1308460235595703, -0.12408065795898438, -0.11731529235839844, -0.1105499267578125, -0.10378456115722656, -0.09701919555664062, -0.09025382995605469, -0.08348846435546875, -0.07672309875488281, -0.06995773315429688, -0.06319236755371094, -0.056427001953125, -0.04966163635253906, -0.042896270751953125, -0.03613090515136719, -0.02936553955078125, -0.022600173950195312, -0.015834808349609375, -0.009069442749023438, -0.0023040771484375, 0.0044612884521484375, 0.011226654052734375, 0.017992019653320312, 0.02475738525390625, 0.03152275085449219, 0.038288116455078125, 0.04505348205566406, 0.05181884765625, 0.05858421325683594, 0.06534957885742188, 0.07211494445800781, 0.07888031005859375, 0.08564567565917969, 0.09241104125976562, 0.09917640686035156, 0.1059417724609375, 0.11270713806152344, 0.11947250366210938, 0.1262378692626953, 0.13300323486328125, 0.1397686004638672, 0.14653396606445312, 0.15329933166503906, 0.160064697265625, 0.16683006286621094, 0.17359542846679688, 0.1803607940673828, 0.18712615966796875, 0.1938915252685547, 0.20065689086914062, 0.20742225646972656, 0.2141876220703125, 0.22095298767089844, 0.22771835327148438, 0.2344837188720703, 0.24124908447265625, 0.2480144500732422, 0.2547798156738281, 0.26154518127441406, 0.268310546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 11.0, 22.0, 17.0, 27.0, 35.0, 62.0, 76.0, 122.0, 235.0, 391.0, 962.0, 3668.0, 30723.0, 4049555.0, 99334.0, 6509.0, 1340.0, 474.0, 242.0, 145.0, 83.0, 75.0, 63.0, 38.0, 23.0, 14.0, 7.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0830078125, -1.039093017578125, -0.99517822265625, -0.951263427734375, -0.9073486328125, -0.863433837890625, -0.81951904296875, -0.775604248046875, -0.731689453125, -0.687774658203125, -0.64385986328125, -0.599945068359375, -0.5560302734375, -0.512115478515625, -0.46820068359375, -0.424285888671875, -0.38037109375, -0.336456298828125, -0.29254150390625, -0.248626708984375, -0.2047119140625, -0.160797119140625, -0.11688232421875, -0.072967529296875, -0.029052734375, 0.014862060546875, 0.05877685546875, 0.102691650390625, 0.1466064453125, 0.190521240234375, 0.23443603515625, 0.278350830078125, 0.322265625, 0.366180419921875, 0.41009521484375, 0.454010009765625, 0.4979248046875, 0.541839599609375, 0.58575439453125, 0.629669189453125, 0.673583984375, 0.717498779296875, 0.76141357421875, 0.805328369140625, 0.8492431640625, 0.893157958984375, 0.93707275390625, 0.980987548828125, 1.02490234375, 1.068817138671875, 1.11273193359375, 1.156646728515625, 1.2005615234375, 1.244476318359375, 1.28839111328125, 1.332305908203125, 1.376220703125, 1.420135498046875, 1.46405029296875, 1.507965087890625, 1.5518798828125, 1.595794677734375, 1.63970947265625, 1.683624267578125, 1.7275390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 15.0, 26.0, 64.0, 430.0, 3240.0, 198.0, 52.0, 18.0, 12.0, 9.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5309219360351562, -0.5071563720703125, -0.48339080810546875, -0.459625244140625, -0.43585968017578125, -0.4120941162109375, -0.38832855224609375, -0.36456298828125, -0.34079742431640625, -0.3170318603515625, -0.29326629638671875, -0.269500732421875, -0.24573516845703125, -0.2219696044921875, -0.19820404052734375, -0.1744384765625, -0.15067291259765625, -0.1269073486328125, -0.10314178466796875, -0.079376220703125, -0.05561065673828125, -0.0318450927734375, -0.00807952880859375, 0.01568603515625, 0.03945159912109375, 0.0632171630859375, 0.08698272705078125, 0.110748291015625, 0.13451385498046875, 0.1582794189453125, 0.18204498291015625, 0.205810546875, 0.22957611083984375, 0.2533416748046875, 0.27710723876953125, 0.300872802734375, 0.32463836669921875, 0.3484039306640625, 0.37216949462890625, 0.39593505859375, 0.41970062255859375, 0.4434661865234375, 0.46723175048828125, 0.490997314453125, 0.5147628784179688, 0.5385284423828125, 0.5622940063476562, 0.5860595703125, 0.6098251342773438, 0.6335906982421875, 0.6573562622070312, 0.681121826171875, 0.7048873901367188, 0.7286529541015625, 0.7524185180664062, 0.77618408203125, 0.7999496459960938, 0.8237152099609375, 0.8474807739257812, 0.871246337890625, 0.8950119018554688, 0.9187774658203125, 0.9425430297851562, 0.96630859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 27.0, 138.0, 365.0, 346.0, 84.0, 18.0, 10.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.105861186981201, -5.992343425750732, -5.8788251876831055, -5.765307426452637, -5.651789665222168, -5.538271903991699, -5.424753665924072, -5.3112359046936035, -5.197718143463135, -5.084200382232666, -4.970682144165039, -4.85716438293457, -4.743646621704102, -4.630128860473633, -4.516610622406006, -4.403092861175537, -4.28957462310791, -4.176056861877441, -4.0625386238098145, -3.9490208625793457, -3.835503101348877, -3.721985101699829, -3.6084671020507812, -3.4949493408203125, -3.3814315795898438, -3.267913579940796, -3.154395818710327, -3.0408778190612793, -2.9273600578308105, -2.8138420581817627, -2.700324058532715, -2.586806297302246, -2.4732885360717773, -2.3597705364227295, -2.2462527751922607, -2.132734775543213, -2.019217014312744, -1.9056990146636963, -1.792181134223938, -1.6786632537841797, -1.5651453733444214, -1.451627492904663, -1.3381096124649048, -1.2245917320251465, -1.1110737323760986, -0.9975559115409851, -0.884037971496582, -0.7705200910568237, -0.6570022106170654, -0.5434843301773071, -0.42996641993522644, -0.31644850969314575, -0.20293062925338745, -0.08941274881362915, 0.024105191230773926, 0.13762307167053223, 0.2511409521102905, 0.36465883255004883, 0.4781767427921295, 0.5916946530342102, 0.7052125334739685, 0.8187304139137268, 0.9322483539581299, 1.0457662343978882, 1.1592841148376465]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 2.0, 2.0, 6.0, 8.0, 11.0, 9.0, 19.0, 23.0, 22.0, 27.0, 37.0, 41.0, 40.0, 48.0, 52.0, 51.0, 64.0, 62.0, 51.0, 73.0, 43.0, 43.0, 43.0, 43.0, 50.0, 21.0, 22.0, 20.0, 17.0, 10.0, 10.0, 7.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.045449137687683, -1.0140300989151, -0.9826111197471619, -0.9511920809745789, -0.9197731018066406, -0.8883540630340576, -0.8569350242614746, -0.8255160450935364, -0.7940970659255981, -0.7626780271530151, -0.7312590479850769, -0.6998400092124939, -0.6684210300445557, -0.6370019912719727, -0.6055829524993896, -0.5741639733314514, -0.5427449345588684, -0.5113258957862854, -0.47990691661834717, -0.44848787784576416, -0.4170688986778259, -0.3856498599052429, -0.3542308509349823, -0.3228118419647217, -0.29139283299446106, -0.25997382402420044, -0.22855481505393982, -0.197135791182518, -0.16571678221225739, -0.13429777324199677, -0.10287874937057495, -0.07145974040031433, -0.040040671825408936, -0.008621659129858017, 0.0227973535656929, 0.05421636998653412, 0.08563537895679474, 0.11705438792705536, 0.14847341179847717, 0.1798924207687378, 0.2113114297389984, 0.24273043870925903, 0.27414944767951965, 0.3055684566497803, 0.3369874954223633, 0.3684064745903015, 0.3998255133628845, 0.43124452233314514, 0.46266353130340576, 0.4940825402736664, 0.525501549243927, 0.55692058801651, 0.5883395671844482, 0.6197586059570312, 0.6511776447296143, 0.6825966238975525, 0.7140156030654907, 0.7454346418380737, 0.776853621006012, 0.808272659778595, 0.8396916389465332, 0.8711106777191162, 0.9025297164916992, 0.9339486956596375, 0.9653677344322205]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 12.0, 9.0, 12.0, 18.0, 21.0, 41.0, 49.0, 94.0, 158.0, 271.0, 465.0, 913.0, 1873.0, 4215.0, 10009.0, 26018.0, 80193.0, 301120.0, 435571.0, 125442.0, 37700.0, 13792.0, 5429.0, 2516.0, 1142.0, 614.0, 327.0, 170.0, 116.0, 70.0, 45.0, 40.0, 16.0, 19.0, 11.0, 17.0, 3.0, 12.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6953125, -0.6755447387695312, -0.6557769775390625, -0.6360092163085938, -0.616241455078125, -0.5964736938476562, -0.5767059326171875, -0.5569381713867188, -0.53717041015625, -0.5174026489257812, -0.4976348876953125, -0.47786712646484375, -0.458099365234375, -0.43833160400390625, -0.4185638427734375, -0.39879608154296875, -0.3790283203125, -0.35926055908203125, -0.3394927978515625, -0.31972503662109375, -0.299957275390625, -0.28018951416015625, -0.2604217529296875, -0.24065399169921875, -0.22088623046875, -0.20111846923828125, -0.1813507080078125, -0.16158294677734375, -0.141815185546875, -0.12204742431640625, -0.1022796630859375, -0.08251190185546875, -0.062744140625, -0.04297637939453125, -0.0232086181640625, -0.00344085693359375, 0.016326904296875, 0.03609466552734375, 0.0558624267578125, 0.07563018798828125, 0.09539794921875, 0.11516571044921875, 0.1349334716796875, 0.15470123291015625, 0.174468994140625, 0.19423675537109375, 0.2140045166015625, 0.23377227783203125, 0.2535400390625, 0.27330780029296875, 0.2930755615234375, 0.31284332275390625, 0.332611083984375, 0.35237884521484375, 0.3721466064453125, 0.39191436767578125, 0.41168212890625, 0.43144989013671875, 0.4512176513671875, 0.47098541259765625, 0.490753173828125, 0.5105209350585938, 0.5302886962890625, 0.5500564575195312, 0.56982421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 1.0, 5.0, 2.0, 3.0, 9.0, 11.0, 18.0, 18.0, 30.0, 32.0, 32.0, 37.0, 52.0, 49.0, 50.0, 54.0, 49.0, 49.0, 43.0, 51.0, 47.0, 36.0, 49.0, 37.0, 32.0, 29.0, 31.0, 28.0, 18.0, 26.0, 9.0, 11.0, 12.0, 11.0, 8.0, 5.0, 9.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1771240234375, -0.17061233520507812, -0.16410064697265625, -0.15758895874023438, -0.1510772705078125, -0.14456558227539062, -0.13805389404296875, -0.13154220581054688, -0.125030517578125, -0.11851882934570312, -0.11200714111328125, -0.10549545288085938, -0.0989837646484375, -0.09247207641601562, -0.08596038818359375, -0.07944869995117188, -0.07293701171875, -0.06642532348632812, -0.05991363525390625, -0.053401947021484375, -0.0468902587890625, -0.040378570556640625, -0.03386688232421875, -0.027355194091796875, -0.020843505859375, -0.014331817626953125, -0.00782012939453125, -0.001308441162109375, 0.0052032470703125, 0.011714935302734375, 0.01822662353515625, 0.024738311767578125, 0.03125, 0.037761688232421875, 0.04427337646484375, 0.050785064697265625, 0.0572967529296875, 0.06380844116210938, 0.07032012939453125, 0.07683181762695312, 0.083343505859375, 0.08985519409179688, 0.09636688232421875, 0.10287857055664062, 0.1093902587890625, 0.11590194702148438, 0.12241363525390625, 0.12892532348632812, 0.13543701171875, 0.14194869995117188, 0.14846038818359375, 0.15497207641601562, 0.1614837646484375, 0.16799545288085938, 0.17450714111328125, 0.18101882934570312, 0.187530517578125, 0.19404220581054688, 0.20055389404296875, 0.20706558227539062, 0.2135772705078125, 0.22008895874023438, 0.22660064697265625, 0.23311233520507812, 0.2396240234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 8.0, 12.0, 17.0, 31.0, 23.0, 41.0, 69.0, 79.0, 148.0, 246.0, 484.0, 1146.0, 2982.0, 9075.0, 32433.0, 147508.0, 574759.0, 216300.0, 44788.0, 11868.0, 3782.0, 1422.0, 596.0, 289.0, 142.0, 95.0, 45.0, 40.0, 37.0, 17.0, 14.0, 13.0, 8.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.693359375, -0.6699447631835938, -0.6465301513671875, -0.6231155395507812, -0.599700927734375, -0.5762863159179688, -0.5528717041015625, -0.5294570922851562, -0.50604248046875, -0.48262786865234375, -0.4592132568359375, -0.43579864501953125, -0.412384033203125, -0.38896942138671875, -0.3655548095703125, -0.34214019775390625, -0.3187255859375, -0.29531097412109375, -0.2718963623046875, -0.24848175048828125, -0.225067138671875, -0.20165252685546875, -0.1782379150390625, -0.15482330322265625, -0.13140869140625, -0.10799407958984375, -0.0845794677734375, -0.06116485595703125, -0.037750244140625, -0.01433563232421875, 0.0090789794921875, 0.03249359130859375, 0.055908203125, 0.07932281494140625, 0.1027374267578125, 0.12615203857421875, 0.149566650390625, 0.17298126220703125, 0.1963958740234375, 0.21981048583984375, 0.24322509765625, 0.26663970947265625, 0.2900543212890625, 0.31346893310546875, 0.336883544921875, 0.36029815673828125, 0.3837127685546875, 0.40712738037109375, 0.4305419921875, 0.45395660400390625, 0.4773712158203125, 0.5007858276367188, 0.524200439453125, 0.5476150512695312, 0.5710296630859375, 0.5944442749023438, 0.61785888671875, 0.6412734985351562, 0.6646881103515625, 0.6881027221679688, 0.711517333984375, 0.7349319458007812, 0.7583465576171875, 0.7817611694335938, 0.80517578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 10.0, 8.0, 17.0, 15.0, 28.0, 20.0, 27.0, 31.0, 34.0, 31.0, 31.0, 44.0, 54.0, 47.0, 46.0, 46.0, 38.0, 45.0, 40.0, 44.0, 37.0, 34.0, 31.0, 30.0, 31.0, 29.0, 21.0, 15.0, 15.0, 16.0, 23.0, 7.0, 5.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7900390625, -0.7654495239257812, -0.7408599853515625, -0.7162704467773438, -0.691680908203125, -0.6670913696289062, -0.6425018310546875, -0.6179122924804688, -0.59332275390625, -0.5687332153320312, -0.5441436767578125, -0.5195541381835938, -0.494964599609375, -0.47037506103515625, -0.4457855224609375, -0.42119598388671875, -0.3966064453125, -0.37201690673828125, -0.3474273681640625, -0.32283782958984375, -0.298248291015625, -0.27365875244140625, -0.2490692138671875, -0.22447967529296875, -0.19989013671875, -0.17530059814453125, -0.1507110595703125, -0.12612152099609375, -0.101531982421875, -0.07694244384765625, -0.0523529052734375, -0.02776336669921875, -0.003173828125, 0.02141571044921875, 0.0460052490234375, 0.07059478759765625, 0.095184326171875, 0.11977386474609375, 0.1443634033203125, 0.16895294189453125, 0.19354248046875, 0.21813201904296875, 0.2427215576171875, 0.26731109619140625, 0.291900634765625, 0.31649017333984375, 0.3410797119140625, 0.36566925048828125, 0.3902587890625, 0.41484832763671875, 0.4394378662109375, 0.46402740478515625, 0.488616943359375, 0.5132064819335938, 0.5377960205078125, 0.5623855590820312, 0.58697509765625, 0.6115646362304688, 0.6361541748046875, 0.6607437133789062, 0.685333251953125, 0.7099227905273438, 0.7345123291015625, 0.7591018676757812, 0.78369140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 6.0, 17.0, 17.0, 28.0, 32.0, 47.0, 106.0, 176.0, 266.0, 601.0, 1358.0, 3752.0, 14470.0, 92496.0, 581781.0, 303688.0, 37969.0, 7517.0, 2215.0, 943.0, 408.0, 247.0, 125.0, 91.0, 51.0, 40.0, 22.0, 23.0, 12.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23232078552246094, -0.22330856323242188, -0.2142963409423828, -0.20528411865234375, -0.1962718963623047, -0.18725967407226562, -0.17824745178222656, -0.1692352294921875, -0.16022300720214844, -0.15121078491210938, -0.1421985626220703, -0.13318634033203125, -0.12417411804199219, -0.11516189575195312, -0.10614967346191406, -0.097137451171875, -0.08812522888183594, -0.07911300659179688, -0.07010078430175781, -0.06108856201171875, -0.05207633972167969, -0.043064117431640625, -0.03405189514160156, -0.0250396728515625, -0.016027450561523438, -0.007015228271484375, 0.0019969940185546875, 0.01100921630859375, 0.020021438598632812, 0.029033660888671875, 0.03804588317871094, 0.04705810546875, 0.05607032775878906, 0.06508255004882812, 0.07409477233886719, 0.08310699462890625, 0.09211921691894531, 0.10113143920898438, 0.11014366149902344, 0.1191558837890625, 0.12816810607910156, 0.13718032836914062, 0.1461925506591797, 0.15520477294921875, 0.1642169952392578, 0.17322921752929688, 0.18224143981933594, 0.191253662109375, 0.20026588439941406, 0.20927810668945312, 0.2182903289794922, 0.22730255126953125, 0.2363147735595703, 0.24532699584960938, 0.25433921813964844, 0.2633514404296875, 0.27236366271972656, 0.2813758850097656, 0.2903881072998047, 0.29940032958984375, 0.3084125518798828, 0.3174247741699219, 0.32643699645996094, 0.33544921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 7.0, 20.0, 17.0, 22.0, 42.0, 59.0, 100.0, 124.0, 123.0, 129.0, 111.0, 69.0, 60.0, 32.0, 22.0, 14.0, 8.0, 15.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849102020263672e-05, -2.6963651180267334e-05, -2.543628215789795e-05, -2.3908913135528564e-05, -2.238154411315918e-05, -2.0854175090789795e-05, -1.932680606842041e-05, -1.7799437046051025e-05, -1.627206802368164e-05, -1.4744699001312256e-05, -1.3217329978942871e-05, -1.1689960956573486e-05, -1.0162591934204102e-05, -8.635222911834717e-06, -7.107853889465332e-06, -5.580484867095947e-06, -4.0531158447265625e-06, -2.5257468223571777e-06, -9.98377799987793e-07, 5.289912223815918e-07, 2.0563602447509766e-06, 3.5837292671203613e-06, 5.111098289489746e-06, 6.638467311859131e-06, 8.165836334228516e-06, 9.6932053565979e-06, 1.1220574378967285e-05, 1.274794340133667e-05, 1.4275312423706055e-05, 1.580268144607544e-05, 1.7330050468444824e-05, 1.885741949081421e-05, 2.0384788513183594e-05, 2.191215753555298e-05, 2.3439526557922363e-05, 2.4966895580291748e-05, 2.6494264602661133e-05, 2.8021633625030518e-05, 2.9549002647399902e-05, 3.107637166976929e-05, 3.260374069213867e-05, 3.413110971450806e-05, 3.565847873687744e-05, 3.7185847759246826e-05, 3.871321678161621e-05, 4.0240585803985596e-05, 4.176795482635498e-05, 4.3295323848724365e-05, 4.482269287109375e-05, 4.6350061893463135e-05, 4.787743091583252e-05, 4.9404799938201904e-05, 5.093216896057129e-05, 5.2459537982940674e-05, 5.398690700531006e-05, 5.551427602767944e-05, 5.704164505004883e-05, 5.856901407241821e-05, 6.00963830947876e-05, 6.162375211715698e-05, 6.315112113952637e-05, 6.467849016189575e-05, 6.620585918426514e-05, 6.773322820663452e-05, 6.92605972290039e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 6.0, 13.0, 21.0, 21.0, 40.0, 71.0, 138.0, 332.0, 910.0, 3882.0, 27952.0, 410564.0, 558445.0, 39473.0, 4929.0, 1028.0, 346.0, 187.0, 91.0, 42.0, 26.0, 12.0, 11.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.442626953125, -0.43068695068359375, -0.4187469482421875, -0.40680694580078125, -0.394866943359375, -0.38292694091796875, -0.3709869384765625, -0.35904693603515625, -0.34710693359375, -0.33516693115234375, -0.3232269287109375, -0.31128692626953125, -0.299346923828125, -0.28740692138671875, -0.2754669189453125, -0.26352691650390625, -0.2515869140625, -0.23964691162109375, -0.2277069091796875, -0.21576690673828125, -0.203826904296875, -0.19188690185546875, -0.1799468994140625, -0.16800689697265625, -0.15606689453125, -0.14412689208984375, -0.1321868896484375, -0.12024688720703125, -0.108306884765625, -0.09636688232421875, -0.0844268798828125, -0.07248687744140625, -0.060546875, -0.04860687255859375, -0.0366668701171875, -0.02472686767578125, -0.012786865234375, -0.00084686279296875, 0.0110931396484375, 0.02303314208984375, 0.03497314453125, 0.04691314697265625, 0.0588531494140625, 0.07079315185546875, 0.082733154296875, 0.09467315673828125, 0.1066131591796875, 0.11855316162109375, 0.1304931640625, 0.14243316650390625, 0.1543731689453125, 0.16631317138671875, 0.178253173828125, 0.19019317626953125, 0.2021331787109375, 0.21407318115234375, 0.22601318359375, 0.23795318603515625, 0.2498931884765625, 0.26183319091796875, 0.273773193359375, 0.28571319580078125, 0.2976531982421875, 0.30959320068359375, 0.321533203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 14.0, 15.0, 25.0, 38.0, 49.0, 63.0, 95.0, 115.0, 122.0, 120.0, 92.0, 76.0, 68.0, 31.0, 29.0, 18.0, 11.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4931640625, -0.4816303253173828, -0.4700965881347656, -0.45856285095214844, -0.44702911376953125, -0.43549537658691406, -0.4239616394042969, -0.4124279022216797, -0.4008941650390625, -0.3893604278564453, -0.3778266906738281, -0.36629295349121094, -0.35475921630859375, -0.34322547912597656, -0.3316917419433594, -0.3201580047607422, -0.308624267578125, -0.2970905303955078, -0.2855567932128906, -0.27402305603027344, -0.26248931884765625, -0.25095558166503906, -0.23942184448242188, -0.2278881072998047, -0.2163543701171875, -0.2048206329345703, -0.19328689575195312, -0.18175315856933594, -0.17021942138671875, -0.15868568420410156, -0.14715194702148438, -0.1356182098388672, -0.12408447265625, -0.11255073547363281, -0.10101699829101562, -0.08948326110839844, -0.07794952392578125, -0.06641578674316406, -0.054882049560546875, -0.04334831237792969, -0.0318145751953125, -0.020280838012695312, -0.008747100830078125, 0.0027866363525390625, 0.01432037353515625, 0.025854110717773438, 0.037387847900390625, 0.04892158508300781, 0.060455322265625, 0.07198905944824219, 0.08352279663085938, 0.09505653381347656, 0.10659027099609375, 0.11812400817871094, 0.12965774536132812, 0.1411914825439453, 0.1527252197265625, 0.1642589569091797, 0.17579269409179688, 0.18732643127441406, 0.19886016845703125, 0.21039390563964844, 0.22192764282226562, 0.2334613800048828, 0.2449951171875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 14.0, 14.0, 29.0, 64.0, 135.0, 270.0, 237.0, 146.0, 51.0, 23.0, 13.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.018630027770996, -11.787850379943848, -11.557071685791016, -11.326292037963867, -11.095513343811035, -10.864733695983887, -10.633955001831055, -10.403175354003906, -10.172395706176758, -9.94161605834961, -9.710837364196777, -9.480057716369629, -9.249279022216797, -9.018499374389648, -8.787720680236816, -8.556941032409668, -8.326162338256836, -8.095382690429688, -7.8646039962768555, -7.633824825286865, -7.403045654296875, -7.172266006469727, -6.941486835479736, -6.710707664489746, -6.479928493499756, -6.249149322509766, -6.018370151519775, -5.787590980529785, -5.556811332702637, -5.326032638549805, -5.095252990722656, -4.864473819732666, -4.633694171905518, -4.402915000915527, -4.172135829925537, -3.9413564205169678, -3.7105772495269775, -3.4797980785369873, -3.249018669128418, -3.0182394981384277, -2.7874603271484375, -2.5566811561584473, -2.325901985168457, -2.0951225757598877, -1.8643434047698975, -1.6335642337799072, -1.4027849435806274, -1.1720056533813477, -0.9412264823913574, -0.7104472517967224, -0.4796680212020874, -0.2488887906074524, -0.018109560012817383, 0.21266961097717285, 0.44344890117645264, 0.6742281913757324, 0.9050073623657227, 1.135786533355713, 1.3665658235549927, 1.5973451137542725, 1.8281242847442627, 2.058903455734253, 2.2896828651428223, 2.5204620361328125, 2.7512412071228027]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 9.0, 11.0, 11.0, 15.0, 13.0, 21.0, 15.0, 25.0, 28.0, 30.0, 31.0, 39.0, 45.0, 48.0, 50.0, 52.0, 51.0, 36.0, 45.0, 60.0, 47.0, 44.0, 38.0, 41.0, 42.0, 27.0, 21.0, 26.0, 9.0, 15.0, 13.0, 8.0, 4.0, 3.0, 7.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.715194225311279, -4.5851969718933105, -4.455199241638184, -4.325201988220215, -4.195204734802246, -4.065207481384277, -3.9352097511291504, -3.8052124977111816, -3.675215005874634, -3.545217514038086, -3.415220260620117, -3.2852227687835693, -3.1552252769470215, -3.0252280235290527, -2.895230531692505, -2.765233039855957, -2.6352357864379883, -2.5052382946014404, -2.3752410411834717, -2.245243549346924, -2.115246295928955, -1.9852488040924072, -1.8552513122558594, -1.725253939628601, -1.5952565670013428, -1.4652591943740845, -1.3352618217468262, -1.2052643299102783, -1.07526695728302, -0.9452695846557617, -0.8152721524238586, -0.6852747201919556, -0.5552773475646973, -0.4252799451351166, -0.2952825427055359, -0.1652851402759552, -0.03528773784637451, 0.09470963478088379, 0.22470706701278687, 0.35470449924468994, 0.48470187187194824, 0.6146992444992065, 0.7446966767311096, 0.8746941089630127, 1.004691481590271, 1.1346888542175293, 1.2646863460540771, 1.3946837186813354, 1.5246810913085938, 1.654678463935852, 1.7846758365631104, 1.9146733283996582, 2.044670581817627, 2.174668073654175, 2.3046655654907227, 2.4346628189086914, 2.5646603107452393, 2.694657802581787, 2.824655055999756, 2.9546525478363037, 3.0846500396728516, 3.2146472930908203, 3.344644784927368, 3.474642276763916, 3.6046395301818848]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 9.0, 9.0, 8.0, 16.0, 17.0, 32.0, 35.0, 52.0, 73.0, 110.0, 165.0, 235.0, 349.0, 517.0, 868.0, 1490.0, 2905.0, 6534.0, 18435.0, 131393.0, 3931024.0, 74163.0, 14468.0, 5376.0, 2470.0, 1404.0, 776.0, 438.0, 290.0, 206.0, 134.0, 81.0, 45.0, 45.0, 34.0, 19.0, 20.0, 12.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.0478515625, -1.0198287963867188, -0.9918060302734375, -0.9637832641601562, -0.935760498046875, -0.9077377319335938, -0.8797149658203125, -0.8516921997070312, -0.82366943359375, -0.7956466674804688, -0.7676239013671875, -0.7396011352539062, -0.711578369140625, -0.6835556030273438, -0.6555328369140625, -0.6275100708007812, -0.5994873046875, -0.5714645385742188, -0.5434417724609375, -0.5154190063476562, -0.487396240234375, -0.45937347412109375, -0.4313507080078125, -0.40332794189453125, -0.37530517578125, -0.34728240966796875, -0.3192596435546875, -0.29123687744140625, -0.263214111328125, -0.23519134521484375, -0.2071685791015625, -0.17914581298828125, -0.151123046875, -0.12310028076171875, -0.0950775146484375, -0.06705474853515625, -0.039031982421875, -0.01100921630859375, 0.0170135498046875, 0.04503631591796875, 0.07305908203125, 0.10108184814453125, 0.1291046142578125, 0.15712738037109375, 0.185150146484375, 0.21317291259765625, 0.2411956787109375, 0.26921844482421875, 0.2972412109375, 0.32526397705078125, 0.3532867431640625, 0.38130950927734375, 0.409332275390625, 0.43735504150390625, 0.4653778076171875, 0.49340057373046875, 0.52142333984375, 0.5494461059570312, 0.5774688720703125, 0.6054916381835938, 0.633514404296875, 0.6615371704101562, 0.6895599365234375, 0.7175827026367188, 0.74560546875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 9.0, 1.0, 4.0, 12.0, 11.0, 10.0, 20.0, 17.0, 24.0, 34.0, 33.0, 36.0, 39.0, 40.0, 48.0, 34.0, 47.0, 46.0, 53.0, 47.0, 48.0, 46.0, 42.0, 35.0, 42.0, 32.0, 24.0, 39.0, 24.0, 27.0, 15.0, 14.0, 11.0, 9.0, 7.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.246337890625, -0.23920059204101562, -0.23206329345703125, -0.22492599487304688, -0.2177886962890625, -0.21065139770507812, -0.20351409912109375, -0.19637680053710938, -0.189239501953125, -0.18210220336914062, -0.17496490478515625, -0.16782760620117188, -0.1606903076171875, -0.15355300903320312, -0.14641571044921875, -0.13927841186523438, -0.13214111328125, -0.12500381469726562, -0.11786651611328125, -0.11072921752929688, -0.1035919189453125, -0.09645462036132812, -0.08931732177734375, -0.08218002319335938, -0.075042724609375, -0.06790542602539062, -0.06076812744140625, -0.053630828857421875, -0.0464935302734375, -0.039356231689453125, -0.03221893310546875, -0.025081634521484375, -0.0179443359375, -0.010807037353515625, -0.00366973876953125, 0.003467559814453125, 0.0106048583984375, 0.017742156982421875, 0.02487945556640625, 0.032016754150390625, 0.039154052734375, 0.046291351318359375, 0.05342864990234375, 0.060565948486328125, 0.0677032470703125, 0.07484054565429688, 0.08197784423828125, 0.08911514282226562, 0.09625244140625, 0.10338973999023438, 0.11052703857421875, 0.11766433715820312, 0.1248016357421875, 0.13193893432617188, 0.13907623291015625, 0.14621353149414062, 0.153350830078125, 0.16048812866210938, 0.16762542724609375, 0.17476272583007812, 0.1819000244140625, 0.18903732299804688, 0.19617462158203125, 0.20331192016601562, 0.21044921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 13.0, 18.0, 20.0, 37.0, 43.0, 46.0, 73.0, 114.0, 164.0, 297.0, 1068.0, 8642.0, 4046995.0, 131870.0, 3483.0, 718.0, 259.0, 120.0, 62.0, 69.0, 47.0, 30.0, 34.0, 24.0, 11.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.0960235595703125, -3.016265869140625, -2.9365081787109375, -2.85675048828125, -2.7769927978515625, -2.697235107421875, -2.6174774169921875, -2.5377197265625, -2.4579620361328125, -2.378204345703125, -2.2984466552734375, -2.21868896484375, -2.1389312744140625, -2.059173583984375, -1.9794158935546875, -1.899658203125, -1.8199005126953125, -1.740142822265625, -1.6603851318359375, -1.58062744140625, -1.5008697509765625, -1.421112060546875, -1.3413543701171875, -1.2615966796875, -1.1818389892578125, -1.102081298828125, -1.0223236083984375, -0.94256591796875, -0.8628082275390625, -0.783050537109375, -0.7032928466796875, -0.62353515625, -0.5437774658203125, -0.464019775390625, -0.3842620849609375, -0.30450439453125, -0.2247467041015625, -0.144989013671875, -0.0652313232421875, 0.0145263671875, 0.0942840576171875, 0.174041748046875, 0.2537994384765625, 0.33355712890625, 0.4133148193359375, 0.493072509765625, 0.5728302001953125, 0.652587890625, 0.7323455810546875, 0.812103271484375, 0.8918609619140625, 0.97161865234375, 1.0513763427734375, 1.131134033203125, 1.2108917236328125, 1.2906494140625, 1.3704071044921875, 1.450164794921875, 1.5299224853515625, 1.60968017578125, 1.6894378662109375, 1.769195556640625, 1.8489532470703125, 1.9287109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 14.0, 29.0, 170.0, 3608.0, 197.0, 36.0, 10.0, 9.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.7155685424804688, -1.6743011474609375, -1.6330337524414062, -1.591766357421875, -1.5504989624023438, -1.5092315673828125, -1.4679641723632812, -1.42669677734375, -1.3854293823242188, -1.3441619873046875, -1.3028945922851562, -1.261627197265625, -1.2203598022460938, -1.1790924072265625, -1.1378250122070312, -1.0965576171875, -1.0552902221679688, -1.0140228271484375, -0.9727554321289062, -0.931488037109375, -0.8902206420898438, -0.8489532470703125, -0.8076858520507812, -0.76641845703125, -0.7251510620117188, -0.6838836669921875, -0.6426162719726562, -0.601348876953125, -0.5600814819335938, -0.5188140869140625, -0.47754669189453125, -0.436279296875, -0.39501190185546875, -0.3537445068359375, -0.31247711181640625, -0.271209716796875, -0.22994232177734375, -0.1886749267578125, -0.14740753173828125, -0.10614013671875, -0.06487274169921875, -0.0236053466796875, 0.01766204833984375, 0.058929443359375, 0.10019683837890625, 0.1414642333984375, 0.18273162841796875, 0.2239990234375, 0.26526641845703125, 0.3065338134765625, 0.34780120849609375, 0.389068603515625, 0.43033599853515625, 0.4716033935546875, 0.5128707885742188, 0.55413818359375, 0.5954055786132812, 0.6366729736328125, 0.6779403686523438, 0.719207763671875, 0.7604751586914062, 0.8017425537109375, 0.8430099487304688, 0.88427734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 14.0, 25.0, 81.0, 233.0, 374.0, 184.0, 51.0, 18.0, 13.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.567192077636719, -5.452269077301025, -5.33734655380249, -5.222423553466797, -5.1075005531311035, -4.99257755279541, -4.877655029296875, -4.762732028961182, -4.647809028625488, -4.532886028289795, -4.41796350479126, -4.303040504455566, -4.188117504119873, -4.07319450378418, -3.9582719802856445, -3.843348979949951, -3.728426218032837, -3.6135034561157227, -3.4985804557800293, -3.383657693862915, -3.2687346935272217, -3.1538119316101074, -3.038888931274414, -2.9239661693573, -2.8090434074401855, -2.6941206455230713, -2.579197645187378, -2.4642748832702637, -2.3493518829345703, -2.234429121017456, -2.119506359100342, -2.0045833587646484, -1.8896605968475342, -1.7747377157211304, -1.6598148345947266, -1.5448920726776123, -1.429969072341919, -1.3150463104248047, -1.2001234292984009, -1.085200548171997, -0.9702776670455933, -0.8553547859191895, -0.7404319047927856, -0.6255090832710266, -0.5105862021446228, -0.395663321018219, -0.28074049949645996, -0.16581761837005615, -0.050894737243652344, 0.06402812898159027, 0.17895099520683289, 0.2938738465309143, 0.4087967276573181, 0.5237196087837219, 0.638642430305481, 0.7535653114318848, 0.8684881925582886, 0.9834110736846924, 1.0983339548110962, 1.2132568359375, 1.3281795978546143, 1.4431025981903076, 1.5580253601074219, 1.6729482412338257, 1.7878711223602295]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 5.0, 13.0, 18.0, 16.0, 22.0, 27.0, 33.0, 49.0, 43.0, 42.0, 53.0, 53.0, 59.0, 61.0, 68.0, 65.0, 46.0, 55.0, 44.0, 39.0, 34.0, 34.0, 25.0, 22.0, 16.0, 11.0, 9.0, 12.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7369763851165771, -1.688307523727417, -1.6396386623382568, -1.5909698009490967, -1.542301058769226, -1.493632197380066, -1.4449633359909058, -1.3962944746017456, -1.347625732421875, -1.2989568710327148, -1.2502880096435547, -1.2016191482543945, -1.152950406074524, -1.1042815446853638, -1.0556126832962036, -1.0069438219070435, -0.9582749605178833, -0.9096060991287231, -0.8609372973442078, -0.8122684359550476, -0.7635996341705322, -0.7149307727813721, -0.6662619113922119, -0.6175930500030518, -0.5689242482185364, -0.5202553868293762, -0.47158658504486084, -0.4229177236557007, -0.3742488920688629, -0.32558006048202515, -0.276911199092865, -0.22824236750602722, -0.17957353591918945, -0.13090470433235168, -0.08223585784435272, -0.03356701135635376, 0.015101820230484009, 0.06377065181732178, 0.11243951320648193, 0.1611083447933197, 0.20977717638015747, 0.25844600796699524, 0.307114839553833, 0.35578370094299316, 0.40445253252983093, 0.4531213641166687, 0.5017902255058289, 0.5504590272903442, 0.5991278886795044, 0.6477967500686646, 0.6964655518531799, 0.7451344132423401, 0.7938032150268555, 0.8424720764160156, 0.8911409378051758, 0.9398097991943359, 0.9884786009788513, 1.0371474027633667, 1.0858162641525269, 1.134485125541687, 1.1831539869308472, 1.2318227291107178, 1.280491590499878, 1.329160451889038, 1.3778293132781982]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 8.0, 6.0, 5.0, 14.0, 25.0, 27.0, 42.0, 62.0, 101.0, 157.0, 198.0, 305.0, 469.0, 749.0, 1106.0, 1860.0, 3004.0, 5051.0, 8424.0, 14055.0, 24676.0, 45371.0, 88630.0, 182522.0, 278690.0, 190445.0, 93278.0, 46930.0, 25539.0, 14580.0, 8642.0, 5055.0, 3179.0, 1929.0, 1154.0, 824.0, 490.0, 310.0, 213.0, 143.0, 103.0, 58.0, 35.0, 29.0, 22.0, 11.0, 11.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4019508361816406, -0.38959503173828125, -0.3772392272949219, -0.3648834228515625, -0.3525276184082031, -0.34017181396484375, -0.3278160095214844, -0.315460205078125, -0.3031044006347656, -0.29074859619140625, -0.2783927917480469, -0.2660369873046875, -0.2536811828613281, -0.24132537841796875, -0.22896957397460938, -0.21661376953125, -0.20425796508789062, -0.19190216064453125, -0.17954635620117188, -0.1671905517578125, -0.15483474731445312, -0.14247894287109375, -0.13012313842773438, -0.117767333984375, -0.10541152954101562, -0.09305572509765625, -0.08069992065429688, -0.0683441162109375, -0.055988311767578125, -0.04363250732421875, -0.031276702880859375, -0.0189208984375, -0.006565093994140625, 0.00579071044921875, 0.018146514892578125, 0.0305023193359375, 0.042858123779296875, 0.05521392822265625, 0.06756973266601562, 0.079925537109375, 0.09228134155273438, 0.10463714599609375, 0.11699295043945312, 0.1293487548828125, 0.14170455932617188, 0.15406036376953125, 0.16641616821289062, 0.17877197265625, 0.19112777709960938, 0.20348358154296875, 0.21583938598632812, 0.2281951904296875, 0.24055099487304688, 0.25290679931640625, 0.2652626037597656, 0.277618408203125, 0.2899742126464844, 0.30233001708984375, 0.3146858215332031, 0.3270416259765625, 0.3393974304199219, 0.35175323486328125, 0.3641090393066406, 0.37646484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 11.0, 5.0, 9.0, 4.0, 14.0, 18.0, 12.0, 16.0, 16.0, 23.0, 28.0, 35.0, 25.0, 26.0, 53.0, 56.0, 55.0, 52.0, 42.0, 37.0, 47.0, 43.0, 40.0, 57.0, 36.0, 40.0, 24.0, 27.0, 28.0, 26.0, 22.0, 15.0, 17.0, 15.0, 11.0, 3.0, 7.0, 5.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.26850128173828125, -0.2608795166015625, -0.25325775146484375, -0.245635986328125, -0.23801422119140625, -0.2303924560546875, -0.22277069091796875, -0.21514892578125, -0.20752716064453125, -0.1999053955078125, -0.19228363037109375, -0.184661865234375, -0.17704010009765625, -0.1694183349609375, -0.16179656982421875, -0.1541748046875, -0.14655303955078125, -0.1389312744140625, -0.13130950927734375, -0.123687744140625, -0.11606597900390625, -0.1084442138671875, -0.10082244873046875, -0.09320068359375, -0.08557891845703125, -0.0779571533203125, -0.07033538818359375, -0.062713623046875, -0.05509185791015625, -0.0474700927734375, -0.03984832763671875, -0.0322265625, -0.02460479736328125, -0.0169830322265625, -0.00936126708984375, -0.001739501953125, 0.00588226318359375, 0.0135040283203125, 0.02112579345703125, 0.02874755859375, 0.03636932373046875, 0.0439910888671875, 0.05161285400390625, 0.059234619140625, 0.06685638427734375, 0.0744781494140625, 0.08209991455078125, 0.0897216796875, 0.09734344482421875, 0.1049652099609375, 0.11258697509765625, 0.120208740234375, 0.12783050537109375, 0.1354522705078125, 0.14307403564453125, 0.15069580078125, 0.15831756591796875, 0.1659393310546875, 0.17356109619140625, 0.181182861328125, 0.18880462646484375, 0.1964263916015625, 0.20404815673828125, 0.211669921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 11.0, 28.0, 27.0, 54.0, 56.0, 113.0, 168.0, 231.0, 400.0, 689.0, 1268.0, 2467.0, 5210.0, 12077.0, 32922.0, 112516.0, 426444.0, 328512.0, 81379.0, 25347.0, 9715.0, 4175.0, 2035.0, 1103.0, 582.0, 392.0, 225.0, 137.0, 92.0, 47.0, 31.0, 25.0, 20.0, 10.0, 5.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.6753921508789062, -0.6535186767578125, -0.6316452026367188, -0.609771728515625, -0.5878982543945312, -0.5660247802734375, -0.5441513061523438, -0.52227783203125, -0.5004043579101562, -0.4785308837890625, -0.45665740966796875, -0.434783935546875, -0.41291046142578125, -0.3910369873046875, -0.36916351318359375, -0.3472900390625, -0.32541656494140625, -0.3035430908203125, -0.28166961669921875, -0.259796142578125, -0.23792266845703125, -0.2160491943359375, -0.19417572021484375, -0.17230224609375, -0.15042877197265625, -0.1285552978515625, -0.10668182373046875, -0.084808349609375, -0.06293487548828125, -0.0410614013671875, -0.01918792724609375, 0.002685546875, 0.02455902099609375, 0.0464324951171875, 0.06830596923828125, 0.090179443359375, 0.11205291748046875, 0.1339263916015625, 0.15579986572265625, 0.17767333984375, 0.19954681396484375, 0.2214202880859375, 0.24329376220703125, 0.265167236328125, 0.28704071044921875, 0.3089141845703125, 0.33078765869140625, 0.3526611328125, 0.37453460693359375, 0.3964080810546875, 0.41828155517578125, 0.440155029296875, 0.46202850341796875, 0.4839019775390625, 0.5057754516601562, 0.52764892578125, 0.5495223999023438, 0.5713958740234375, 0.5932693481445312, 0.615142822265625, 0.6370162963867188, 0.6588897705078125, 0.6807632446289062, 0.70263671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 7.0, 15.0, 8.0, 10.0, 14.0, 19.0, 19.0, 34.0, 45.0, 47.0, 50.0, 52.0, 51.0, 56.0, 54.0, 60.0, 56.0, 60.0, 71.0, 47.0, 37.0, 43.0, 25.0, 26.0, 19.0, 18.0, 18.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4541015625, -1.409881591796875, -1.36566162109375, -1.321441650390625, -1.2772216796875, -1.233001708984375, -1.18878173828125, -1.144561767578125, -1.100341796875, -1.056121826171875, -1.01190185546875, -0.967681884765625, -0.9234619140625, -0.879241943359375, -0.83502197265625, -0.790802001953125, -0.74658203125, -0.702362060546875, -0.65814208984375, -0.613922119140625, -0.5697021484375, -0.525482177734375, -0.48126220703125, -0.437042236328125, -0.392822265625, -0.348602294921875, -0.30438232421875, -0.260162353515625, -0.2159423828125, -0.171722412109375, -0.12750244140625, -0.083282470703125, -0.0390625, 0.005157470703125, 0.04937744140625, 0.093597412109375, 0.1378173828125, 0.182037353515625, 0.22625732421875, 0.270477294921875, 0.314697265625, 0.358917236328125, 0.40313720703125, 0.447357177734375, 0.4915771484375, 0.535797119140625, 0.58001708984375, 0.624237060546875, 0.66845703125, 0.712677001953125, 0.75689697265625, 0.801116943359375, 0.8453369140625, 0.889556884765625, 0.93377685546875, 0.977996826171875, 1.022216796875, 1.066436767578125, 1.11065673828125, 1.154876708984375, 1.1990966796875, 1.243316650390625, 1.28753662109375, 1.331756591796875, 1.3759765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 10.0, 14.0, 20.0, 36.0, 58.0, 123.0, 224.0, 537.0, 1238.0, 3678.0, 17622.0, 189456.0, 722939.0, 96710.0, 11240.0, 2732.0, 1005.0, 442.0, 220.0, 101.0, 60.0, 32.0, 18.0, 14.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4705238342285156, -0.45886993408203125, -0.4472160339355469, -0.4355621337890625, -0.4239082336425781, -0.41225433349609375, -0.4006004333496094, -0.388946533203125, -0.3772926330566406, -0.36563873291015625, -0.3539848327636719, -0.3423309326171875, -0.3306770324707031, -0.31902313232421875, -0.3073692321777344, -0.29571533203125, -0.2840614318847656, -0.27240753173828125, -0.2607536315917969, -0.2490997314453125, -0.23744583129882812, -0.22579193115234375, -0.21413803100585938, -0.202484130859375, -0.19083023071289062, -0.17917633056640625, -0.16752243041992188, -0.1558685302734375, -0.14421463012695312, -0.13256072998046875, -0.12090682983398438, -0.1092529296875, -0.09759902954101562, -0.08594512939453125, -0.07429122924804688, -0.0626373291015625, -0.050983428955078125, -0.03932952880859375, -0.027675628662109375, -0.016021728515625, -0.004367828369140625, 0.00728607177734375, 0.018939971923828125, 0.0305938720703125, 0.042247772216796875, 0.05390167236328125, 0.06555557250976562, 0.07720947265625, 0.08886337280273438, 0.10051727294921875, 0.11217117309570312, 0.1238250732421875, 0.13547897338867188, 0.14713287353515625, 0.15878677368164062, 0.170440673828125, 0.18209457397460938, 0.19374847412109375, 0.20540237426757812, 0.2170562744140625, 0.22871017456054688, 0.24036407470703125, 0.2520179748535156, 0.263671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 6.0, 5.0, 12.0, 18.0, 15.0, 28.0, 58.0, 57.0, 83.0, 115.0, 109.0, 122.0, 93.0, 79.0, 53.0, 41.0, 33.0, 15.0, 15.0, 11.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.023313522338867e-05, -3.877934068441391e-05, -3.732554614543915e-05, -3.5871751606464386e-05, -3.4417957067489624e-05, -3.296416252851486e-05, -3.15103679895401e-05, -3.0056573450565338e-05, -2.8602778911590576e-05, -2.7148984372615814e-05, -2.5695189833641052e-05, -2.424139529466629e-05, -2.278760075569153e-05, -2.1333806216716766e-05, -1.9880011677742004e-05, -1.8426217138767242e-05, -1.697242259979248e-05, -1.551862806081772e-05, -1.4064833521842957e-05, -1.2611038982868195e-05, -1.1157244443893433e-05, -9.70344990491867e-06, -8.249655365943909e-06, -6.795860826969147e-06, -5.342066287994385e-06, -3.888271749019623e-06, -2.434477210044861e-06, -9.806826710700989e-07, 4.731118679046631e-07, 1.926906406879425e-06, 3.380700945854187e-06, 4.834495484828949e-06, 6.288290023803711e-06, 7.742084562778473e-06, 9.195879101753235e-06, 1.0649673640727997e-05, 1.2103468179702759e-05, 1.355726271867752e-05, 1.5011057257652283e-05, 1.6464851796627045e-05, 1.7918646335601807e-05, 1.937244087457657e-05, 2.082623541355133e-05, 2.2280029952526093e-05, 2.3733824491500854e-05, 2.5187619030475616e-05, 2.664141356945038e-05, 2.809520810842514e-05, 2.9549002647399902e-05, 3.1002797186374664e-05, 3.2456591725349426e-05, 3.391038626432419e-05, 3.536418080329895e-05, 3.681797534227371e-05, 3.8271769881248474e-05, 3.9725564420223236e-05, 4.1179358959198e-05, 4.263315349817276e-05, 4.408694803714752e-05, 4.5540742576122284e-05, 4.6994537115097046e-05, 4.844833165407181e-05, 4.990212619304657e-05, 5.135592073202133e-05, 5.2809715270996094e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 11.0, 23.0, 27.0, 46.0, 59.0, 99.0, 142.0, 283.0, 477.0, 943.0, 2229.0, 6490.0, 25430.0, 131253.0, 491219.0, 309384.0, 60746.0, 12963.0, 3784.0, 1384.0, 638.0, 363.0, 214.0, 126.0, 72.0, 44.0, 27.0, 19.0, 9.0, 8.0, 11.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2508888244628906, -0.24323272705078125, -0.23557662963867188, -0.2279205322265625, -0.22026443481445312, -0.21260833740234375, -0.20495223999023438, -0.197296142578125, -0.18964004516601562, -0.18198394775390625, -0.17432785034179688, -0.1666717529296875, -0.15901565551757812, -0.15135955810546875, -0.14370346069335938, -0.13604736328125, -0.12839126586914062, -0.12073516845703125, -0.11307907104492188, -0.1054229736328125, -0.09776687622070312, -0.09011077880859375, -0.08245468139648438, -0.074798583984375, -0.06714248657226562, -0.05948638916015625, -0.051830291748046875, -0.0441741943359375, -0.036518096923828125, -0.02886199951171875, -0.021205902099609375, -0.0135498046875, -0.005893707275390625, 0.00176239013671875, 0.009418487548828125, 0.0170745849609375, 0.024730682373046875, 0.03238677978515625, 0.040042877197265625, 0.047698974609375, 0.055355072021484375, 0.06301116943359375, 0.07066726684570312, 0.0783233642578125, 0.08597946166992188, 0.09363555908203125, 0.10129165649414062, 0.10894775390625, 0.11660385131835938, 0.12425994873046875, 0.13191604614257812, 0.1395721435546875, 0.14722824096679688, 0.15488433837890625, 0.16254043579101562, 0.170196533203125, 0.17785263061523438, 0.18550872802734375, 0.19316482543945312, 0.2008209228515625, 0.20847702026367188, 0.21613311767578125, 0.22378921508789062, 0.2314453125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 5.0, 13.0, 15.0, 23.0, 36.0, 58.0, 54.0, 84.0, 99.0, 93.0, 104.0, 98.0, 79.0, 69.0, 44.0, 37.0, 24.0, 16.0, 12.0, 11.0, 8.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.449951171875, -0.43747711181640625, -0.4250030517578125, -0.41252899169921875, -0.400054931640625, -0.38758087158203125, -0.3751068115234375, -0.36263275146484375, -0.35015869140625, -0.33768463134765625, -0.3252105712890625, -0.31273651123046875, -0.300262451171875, -0.28778839111328125, -0.2753143310546875, -0.26284027099609375, -0.2503662109375, -0.23789215087890625, -0.2254180908203125, -0.21294403076171875, -0.200469970703125, -0.18799591064453125, -0.1755218505859375, -0.16304779052734375, -0.15057373046875, -0.13809967041015625, -0.1256256103515625, -0.11315155029296875, -0.100677490234375, -0.08820343017578125, -0.0757293701171875, -0.06325531005859375, -0.05078125, -0.03830718994140625, -0.0258331298828125, -0.01335906982421875, -0.000885009765625, 0.01158905029296875, 0.0240631103515625, 0.03653717041015625, 0.04901123046875, 0.06148529052734375, 0.0739593505859375, 0.08643341064453125, 0.098907470703125, 0.11138153076171875, 0.1238555908203125, 0.13632965087890625, 0.1488037109375, 0.16127777099609375, 0.1737518310546875, 0.18622589111328125, 0.198699951171875, 0.21117401123046875, 0.2236480712890625, 0.23612213134765625, 0.24859619140625, 0.26107025146484375, 0.2735443115234375, 0.28601837158203125, 0.298492431640625, 0.31096649169921875, 0.3234405517578125, 0.33591461181640625, 0.348388671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 17.0, 29.0, 61.0, 134.0, 216.0, 278.0, 161.0, 50.0, 28.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.122644901275635, -6.786108493804932, -6.449572563171387, -6.113036155700684, -5.776500225067139, -5.4399638175964355, -5.103427886962891, -4.7668914794921875, -4.430355072021484, -4.093818664550781, -3.7572827339172363, -3.420746326446533, -3.0842103958129883, -2.747673988342285, -2.411137819290161, -2.074601650238037, -1.7380657196044922, -1.4015295505523682, -1.0649933815002441, -0.7284570932388306, -0.39192092418670654, -0.05538475513458252, 0.28115153312683105, 0.6176877021789551, 0.9542238712310791, 1.2907600402832031, 1.6272962093353271, 1.9638324975967407, 2.3003687858581543, 2.636904716491699, 2.9734411239624023, 3.3099772930145264, 3.646512985229492, 3.983049154281616, 4.31958532333374, 4.656121730804443, 4.992657661437988, 5.329194068908691, 5.6657304763793945, 6.0022664070129395, 6.338802337646484, 6.6753387451171875, 7.011874675750732, 7.3484110832214355, 7.6849470138549805, 8.021483421325684, 8.358019828796387, 8.694555282592773, 9.031091690063477, 9.36762809753418, 9.704164505004883, 10.04069995880127, 10.377236366271973, 10.713772773742676, 11.050309181213379, 11.386844635009766, 11.723381996154785, 12.059918403625488, 12.396454811096191, 12.732990264892578, 13.069526672363281, 13.406063079833984, 13.742599487304688, 14.07913589477539, 14.415671348571777]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 14.0, 5.0, 8.0, 17.0, 29.0, 13.0, 23.0, 22.0, 17.0, 25.0, 29.0, 39.0, 22.0, 41.0, 39.0, 51.0, 38.0, 39.0, 34.0, 49.0, 31.0, 34.0, 44.0, 37.0, 31.0, 35.0, 25.0, 12.0, 23.0, 23.0, 10.0, 19.0, 18.0, 14.0, 8.0, 10.0, 7.0, 11.0, 8.0, 1.0, 8.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0], "bins": [-5.70883321762085, -5.541421413421631, -5.374009132385254, -5.206597328186035, -5.039185047149658, -4.8717732429504395, -4.7043609619140625, -4.536949157714844, -4.369537353515625, -4.202125549316406, -4.034713268280029, -3.8673014640808105, -3.6998894214630127, -3.532477378845215, -3.365065336227417, -3.197653293609619, -3.0302412509918213, -2.8628292083740234, -2.6954171657562256, -2.5280051231384277, -2.360593318939209, -2.193181276321411, -2.0257692337036133, -1.858357310295105, -1.6909452676773071, -1.5235332250595093, -1.356121301651001, -1.1887092590332031, -1.0212972164154053, -0.853885293006897, -0.6864732503890991, -0.5190613269805908, -0.35164928436279297, -0.1842372864484787, -0.01682528853416443, 0.15058672428131104, 0.3179987072944641, 0.4854106903076172, 0.652822732925415, 0.8202346563339233, 0.9876466989517212, 1.155058741569519, 1.3224706649780273, 1.4898827075958252, 1.657294750213623, 1.8247066736221313, 1.9921187162399292, 2.1595306396484375, 2.3269426822662354, 2.494354724884033, 2.661766767501831, 2.829178810119629, 2.9965906143188477, 3.1640026569366455, 3.3314146995544434, 3.498826503753662, 3.666238784790039, 3.833650827407837, 4.001062870025635, 4.1684746742248535, 4.3358869552612305, 4.503298759460449, 4.670710563659668, 4.838122844696045, 5.005534648895264]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 3.0, 7.0, 6.0, 8.0, 7.0, 12.0, 28.0, 44.0, 31.0, 58.0, 82.0, 105.0, 132.0, 215.0, 317.0, 431.0, 599.0, 985.0, 1446.0, 2431.0, 4020.0, 7956.0, 18302.0, 68608.0, 3794607.0, 236065.0, 31690.0, 11480.0, 5830.0, 3123.0, 1941.0, 1229.0, 804.0, 536.0, 351.0, 238.0, 178.0, 109.0, 85.0, 63.0, 30.0, 30.0, 21.0, 14.0, 7.0, 5.0, 9.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8818359375, -0.8557052612304688, -0.8295745849609375, -0.8034439086914062, -0.777313232421875, -0.7511825561523438, -0.7250518798828125, -0.6989212036132812, -0.67279052734375, -0.6466598510742188, -0.6205291748046875, -0.5943984985351562, -0.568267822265625, -0.5421371459960938, -0.5160064697265625, -0.48987579345703125, -0.4637451171875, -0.43761444091796875, -0.4114837646484375, -0.38535308837890625, -0.359222412109375, -0.33309173583984375, -0.3069610595703125, -0.28083038330078125, -0.25469970703125, -0.22856903076171875, -0.2024383544921875, -0.17630767822265625, -0.150177001953125, -0.12404632568359375, -0.0979156494140625, -0.07178497314453125, -0.045654296875, -0.01952362060546875, 0.0066070556640625, 0.03273773193359375, 0.058868408203125, 0.08499908447265625, 0.1111297607421875, 0.13726043701171875, 0.16339111328125, 0.18952178955078125, 0.2156524658203125, 0.24178314208984375, 0.267913818359375, 0.29404449462890625, 0.3201751708984375, 0.34630584716796875, 0.3724365234375, 0.39856719970703125, 0.4246978759765625, 0.45082855224609375, 0.476959228515625, 0.5030899047851562, 0.5292205810546875, 0.5553512573242188, 0.58148193359375, 0.6076126098632812, 0.6337432861328125, 0.6598739624023438, 0.686004638671875, 0.7121353149414062, 0.7382659912109375, 0.7643966674804688, 0.79052734375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 4.0, 8.0, 13.0, 9.0, 16.0, 23.0, 23.0, 29.0, 24.0, 37.0, 39.0, 38.0, 35.0, 52.0, 48.0, 52.0, 54.0, 47.0, 38.0, 41.0, 50.0, 38.0, 36.0, 29.0, 32.0, 35.0, 25.0, 26.0, 11.0, 12.0, 14.0, 20.0, 8.0, 7.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3349609375, -0.32505035400390625, -0.3151397705078125, -0.30522918701171875, -0.295318603515625, -0.28540802001953125, -0.2754974365234375, -0.26558685302734375, -0.25567626953125, -0.24576568603515625, -0.2358551025390625, -0.22594451904296875, -0.216033935546875, -0.20612335205078125, -0.1962127685546875, -0.18630218505859375, -0.1763916015625, -0.16648101806640625, -0.1565704345703125, -0.14665985107421875, -0.136749267578125, -0.12683868408203125, -0.1169281005859375, -0.10701751708984375, -0.09710693359375, -0.08719635009765625, -0.0772857666015625, -0.06737518310546875, -0.057464599609375, -0.04755401611328125, -0.0376434326171875, -0.02773284912109375, -0.017822265625, -0.00791168212890625, 0.0019989013671875, 0.01190948486328125, 0.021820068359375, 0.03173065185546875, 0.0416412353515625, 0.05155181884765625, 0.06146240234375, 0.07137298583984375, 0.0812835693359375, 0.09119415283203125, 0.101104736328125, 0.11101531982421875, 0.1209259033203125, 0.13083648681640625, 0.1407470703125, 0.15065765380859375, 0.1605682373046875, 0.17047882080078125, 0.180389404296875, 0.19029998779296875, 0.2002105712890625, 0.21012115478515625, 0.22003173828125, 0.22994232177734375, 0.2398529052734375, 0.24976348876953125, 0.259674072265625, 0.26958465576171875, 0.2794952392578125, 0.28940582275390625, 0.29931640625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 8.0, 12.0, 23.0, 20.0, 23.0, 39.0, 43.0, 79.0, 95.0, 156.0, 252.0, 436.0, 944.0, 2410.0, 7841.0, 34619.0, 821932.0, 3270736.0, 40730.0, 8878.0, 2709.0, 1062.0, 477.0, 233.0, 138.0, 109.0, 59.0, 46.0, 35.0, 35.0, 16.0, 22.0, 17.0, 11.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.359375, -1.320587158203125, -1.28179931640625, -1.243011474609375, -1.2042236328125, -1.165435791015625, -1.12664794921875, -1.087860107421875, -1.049072265625, -1.010284423828125, -0.97149658203125, -0.932708740234375, -0.8939208984375, -0.855133056640625, -0.81634521484375, -0.777557373046875, -0.73876953125, -0.699981689453125, -0.66119384765625, -0.622406005859375, -0.5836181640625, -0.544830322265625, -0.50604248046875, -0.467254638671875, -0.428466796875, -0.389678955078125, -0.35089111328125, -0.312103271484375, -0.2733154296875, -0.234527587890625, -0.19573974609375, -0.156951904296875, -0.1181640625, -0.079376220703125, -0.04058837890625, -0.001800537109375, 0.0369873046875, 0.075775146484375, 0.11456298828125, 0.153350830078125, 0.192138671875, 0.230926513671875, 0.26971435546875, 0.308502197265625, 0.3472900390625, 0.386077880859375, 0.42486572265625, 0.463653564453125, 0.50244140625, 0.541229248046875, 0.58001708984375, 0.618804931640625, 0.6575927734375, 0.696380615234375, 0.73516845703125, 0.773956298828125, 0.812744140625, 0.851531982421875, 0.89031982421875, 0.929107666015625, 0.9678955078125, 1.006683349609375, 1.04547119140625, 1.084259033203125, 1.123046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 13.0, 20.0, 29.0, 44.0, 108.0, 681.0, 2889.0, 135.0, 60.0, 37.0, 23.0, 8.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2293243408203125, -1.197906494140625, -1.1664886474609375, -1.13507080078125, -1.1036529541015625, -1.072235107421875, -1.0408172607421875, -1.0093994140625, -0.9779815673828125, -0.946563720703125, -0.9151458740234375, -0.88372802734375, -0.8523101806640625, -0.820892333984375, -0.7894744873046875, -0.758056640625, -0.7266387939453125, -0.695220947265625, -0.6638031005859375, -0.63238525390625, -0.6009674072265625, -0.569549560546875, -0.5381317138671875, -0.5067138671875, -0.4752960205078125, -0.443878173828125, -0.4124603271484375, -0.38104248046875, -0.3496246337890625, -0.318206787109375, -0.2867889404296875, -0.25537109375, -0.2239532470703125, -0.192535400390625, -0.1611175537109375, -0.12969970703125, -0.0982818603515625, -0.066864013671875, -0.0354461669921875, -0.0040283203125, 0.0273895263671875, 0.058807373046875, 0.0902252197265625, 0.12164306640625, 0.1530609130859375, 0.184478759765625, 0.2158966064453125, 0.247314453125, 0.2787322998046875, 0.310150146484375, 0.3415679931640625, 0.37298583984375, 0.4044036865234375, 0.435821533203125, 0.4672393798828125, 0.4986572265625, 0.5300750732421875, 0.561492919921875, 0.5929107666015625, 0.62432861328125, 0.6557464599609375, 0.687164306640625, 0.7185821533203125, 0.75]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 23.0, 48.0, 131.0, 276.0, 283.0, 148.0, 50.0, 15.0, 11.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9765621423721313, -1.8348950147628784, -1.693228006362915, -1.551560878753662, -1.4098937511444092, -1.2682267427444458, -1.1265596151351929, -0.9848925471305847, -0.8432254791259766, -0.7015584111213684, -0.5598913431167603, -0.4182242155075073, -0.27655714750289917, -0.13489007949829102, 0.006777048110961914, 0.14844411611557007, 0.2901111841201782, 0.4317782521247864, 0.5734453201293945, 0.7151124477386475, 0.8567795157432556, 0.9984465837478638, 1.1401137113571167, 1.28178071975708, 1.423447847366333, 1.565114974975586, 1.7067819833755493, 1.8484491109848022, 1.9901161193847656, 2.1317832469940186, 2.2734503746032715, 2.4151175022125244, 2.5567846298217773, 2.6984517574310303, 2.840118885040283, 2.981785774230957, 3.12345290184021, 3.265120029449463, 3.406787157058716, 3.5484542846679688, 3.6901211738586426, 3.8317883014678955, 3.9734554290771484, 4.115122318267822, 4.256789684295654, 4.398456573486328, 4.54012393951416, 4.681790828704834, 4.823457717895508, 4.965124607086182, 5.106791973114014, 5.2484588623046875, 5.3901262283325195, 5.531793117523193, 5.673460006713867, 5.815127372741699, 5.956794738769531, 6.098461627960205, 6.240128993988037, 6.381795883178711, 6.523463249206543, 6.665130138397217, 6.806797027587891, 6.948464393615723, 7.0901312828063965]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 11.0, 14.0, 16.0, 17.0, 23.0, 14.0, 25.0, 29.0, 39.0, 46.0, 49.0, 40.0, 53.0, 48.0, 40.0, 51.0, 47.0, 60.0, 46.0, 49.0, 41.0, 37.0, 41.0, 22.0, 16.0, 20.0, 18.0, 17.0, 12.0, 7.0, 6.0, 13.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4657471179962158, -1.4160938262939453, -1.3664405345916748, -1.3167871236801147, -1.2671338319778442, -1.2174805402755737, -1.1678271293640137, -1.1181738376617432, -1.0685205459594727, -1.0188672542572021, -0.9692139029502869, -0.9195605516433716, -0.8699072599411011, -0.8202539682388306, -0.7706006169319153, -0.720947265625, -0.6712939739227295, -0.621640682220459, -0.5719873309135437, -0.5223339796066284, -0.4726806879043579, -0.423027366399765, -0.3733740448951721, -0.3237207233905792, -0.27406740188598633, -0.22441408038139343, -0.17476075887680054, -0.12510743737220764, -0.07545411586761475, -0.02580079436302185, 0.023852527141571045, 0.07350584864616394, 0.12315917015075684, 0.17281249165534973, 0.22246581315994263, 0.2721191346645355, 0.3217724561691284, 0.3714257776737213, 0.4210790991783142, 0.4707324206829071, 0.5203857421875, 0.5700390338897705, 0.6196923851966858, 0.6693457365036011, 0.7189990282058716, 0.7686523199081421, 0.8183056712150574, 0.8679590225219727, 0.9176123142242432, 0.9672656059265137, 1.0169188976287842, 1.0665723085403442, 1.1162256002426147, 1.1658788919448853, 1.2155323028564453, 1.2651855945587158, 1.3148388862609863, 1.3644921779632568, 1.4141454696655273, 1.4637988805770874, 1.513452172279358, 1.5631054639816284, 1.6127588748931885, 1.662412166595459, 1.7120654582977295]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 5.0, 11.0, 9.0, 12.0, 20.0, 30.0, 36.0, 47.0, 66.0, 72.0, 120.0, 187.0, 307.0, 477.0, 855.0, 1560.0, 3109.0, 6440.0, 13781.0, 32801.0, 91299.0, 312042.0, 392365.0, 119401.0, 41268.0, 16610.0, 7623.0, 3635.0, 1806.0, 982.0, 547.0, 325.0, 206.0, 147.0, 93.0, 64.0, 46.0, 35.0, 32.0, 16.0, 18.0, 14.0, 8.0, 8.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.9971389770507812, -0.9679107666015625, -0.9386825561523438, -0.909454345703125, -0.8802261352539062, -0.8509979248046875, -0.8217697143554688, -0.79254150390625, -0.7633132934570312, -0.7340850830078125, -0.7048568725585938, -0.675628662109375, -0.6464004516601562, -0.6171722412109375, -0.5879440307617188, -0.5587158203125, -0.5294876098632812, -0.5002593994140625, -0.47103118896484375, -0.441802978515625, -0.41257476806640625, -0.3833465576171875, -0.35411834716796875, -0.32489013671875, -0.29566192626953125, -0.2664337158203125, -0.23720550537109375, -0.207977294921875, -0.17874908447265625, -0.1495208740234375, -0.12029266357421875, -0.091064453125, -0.06183624267578125, -0.0326080322265625, -0.00337982177734375, 0.025848388671875, 0.05507659912109375, 0.0843048095703125, 0.11353302001953125, 0.14276123046875, 0.17198944091796875, 0.2012176513671875, 0.23044586181640625, 0.259674072265625, 0.28890228271484375, 0.3181304931640625, 0.34735870361328125, 0.3765869140625, 0.40581512451171875, 0.4350433349609375, 0.46427154541015625, 0.493499755859375, 0.5227279663085938, 0.5519561767578125, 0.5811843872070312, 0.61041259765625, 0.6396408081054688, 0.6688690185546875, 0.6980972290039062, 0.727325439453125, 0.7565536499023438, 0.7857818603515625, 0.8150100708007812, 0.84423828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 6.0, 8.0, 6.0, 5.0, 13.0, 15.0, 18.0, 18.0, 25.0, 19.0, 35.0, 27.0, 34.0, 44.0, 41.0, 49.0, 45.0, 45.0, 51.0, 48.0, 54.0, 49.0, 32.0, 47.0, 38.0, 37.0, 38.0, 27.0, 29.0, 20.0, 12.0, 12.0, 8.0, 17.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3818359375, -0.37113189697265625, -0.3604278564453125, -0.34972381591796875, -0.339019775390625, -0.32831573486328125, -0.3176116943359375, -0.30690765380859375, -0.29620361328125, -0.28549957275390625, -0.2747955322265625, -0.26409149169921875, -0.253387451171875, -0.24268341064453125, -0.2319793701171875, -0.22127532958984375, -0.2105712890625, -0.19986724853515625, -0.1891632080078125, -0.17845916748046875, -0.167755126953125, -0.15705108642578125, -0.1463470458984375, -0.13564300537109375, -0.12493896484375, -0.11423492431640625, -0.1035308837890625, -0.09282684326171875, -0.082122802734375, -0.07141876220703125, -0.0607147216796875, -0.05001068115234375, -0.039306640625, -0.02860260009765625, -0.0178985595703125, -0.00719451904296875, 0.003509521484375, 0.01421356201171875, 0.0249176025390625, 0.03562164306640625, 0.04632568359375, 0.05702972412109375, 0.0677337646484375, 0.07843780517578125, 0.089141845703125, 0.09984588623046875, 0.1105499267578125, 0.12125396728515625, 0.1319580078125, 0.14266204833984375, 0.1533660888671875, 0.16407012939453125, 0.174774169921875, 0.18547821044921875, 0.1961822509765625, 0.20688629150390625, 0.21759033203125, 0.22829437255859375, 0.2389984130859375, 0.24970245361328125, 0.260406494140625, 0.27111053466796875, 0.2818145751953125, 0.29251861572265625, 0.30322265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 16.0, 21.0, 28.0, 32.0, 82.0, 166.0, 295.0, 630.0, 1471.0, 3809.0, 11562.0, 43396.0, 300229.0, 585061.0, 75343.0, 17160.0, 5560.0, 1979.0, 867.0, 390.0, 196.0, 93.0, 56.0, 30.0, 24.0, 13.0, 15.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.73828125, -1.6915130615234375, -1.644744873046875, -1.5979766845703125, -1.55120849609375, -1.5044403076171875, -1.457672119140625, -1.4109039306640625, -1.3641357421875, -1.3173675537109375, -1.270599365234375, -1.2238311767578125, -1.17706298828125, -1.1302947998046875, -1.083526611328125, -1.0367584228515625, -0.989990234375, -0.9432220458984375, -0.896453857421875, -0.8496856689453125, -0.80291748046875, -0.7561492919921875, -0.709381103515625, -0.6626129150390625, -0.6158447265625, -0.5690765380859375, -0.522308349609375, -0.4755401611328125, -0.42877197265625, -0.3820037841796875, -0.335235595703125, -0.2884674072265625, -0.24169921875, -0.1949310302734375, -0.148162841796875, -0.1013946533203125, -0.05462646484375, -0.0078582763671875, 0.038909912109375, 0.0856781005859375, 0.1324462890625, 0.1792144775390625, 0.225982666015625, 0.2727508544921875, 0.31951904296875, 0.3662872314453125, 0.413055419921875, 0.4598236083984375, 0.506591796875, 0.5533599853515625, 0.600128173828125, 0.6468963623046875, 0.69366455078125, 0.7404327392578125, 0.787200927734375, 0.8339691162109375, 0.8807373046875, 0.9275054931640625, 0.974273681640625, 1.0210418701171875, 1.06781005859375, 1.1145782470703125, 1.161346435546875, 1.2081146240234375, 1.2548828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 8.0, 6.0, 10.0, 18.0, 17.0, 29.0, 30.0, 30.0, 27.0, 32.0, 40.0, 50.0, 55.0, 46.0, 53.0, 55.0, 68.0, 55.0, 45.0, 55.0, 42.0, 39.0, 29.0, 27.0, 30.0, 21.0, 17.0, 16.0, 16.0, 9.0, 3.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.86328125, -1.802642822265625, -1.74200439453125, -1.681365966796875, -1.6207275390625, -1.560089111328125, -1.49945068359375, -1.438812255859375, -1.378173828125, -1.317535400390625, -1.25689697265625, -1.196258544921875, -1.1356201171875, -1.074981689453125, -1.01434326171875, -0.953704833984375, -0.89306640625, -0.832427978515625, -0.77178955078125, -0.711151123046875, -0.6505126953125, -0.589874267578125, -0.52923583984375, -0.468597412109375, -0.407958984375, -0.347320556640625, -0.28668212890625, -0.226043701171875, -0.1654052734375, -0.104766845703125, -0.04412841796875, 0.016510009765625, 0.0771484375, 0.137786865234375, 0.19842529296875, 0.259063720703125, 0.3197021484375, 0.380340576171875, 0.44097900390625, 0.501617431640625, 0.562255859375, 0.622894287109375, 0.68353271484375, 0.744171142578125, 0.8048095703125, 0.865447998046875, 0.92608642578125, 0.986724853515625, 1.04736328125, 1.108001708984375, 1.16864013671875, 1.229278564453125, 1.2899169921875, 1.350555419921875, 1.41119384765625, 1.471832275390625, 1.532470703125, 1.593109130859375, 1.65374755859375, 1.714385986328125, 1.7750244140625, 1.835662841796875, 1.89630126953125, 1.956939697265625, 2.017578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 14.0, 23.0, 26.0, 32.0, 46.0, 72.0, 124.0, 172.0, 256.0, 546.0, 926.0, 1984.0, 5488.0, 29126.0, 722163.0, 264476.0, 15608.0, 3946.0, 1615.0, 764.0, 393.0, 264.0, 161.0, 96.0, 59.0, 51.0, 30.0, 18.0, 15.0, 12.0, 9.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9462890625, -0.9191360473632812, -0.8919830322265625, -0.8648300170898438, -0.837677001953125, -0.8105239868164062, -0.7833709716796875, -0.7562179565429688, -0.72906494140625, -0.7019119262695312, -0.6747589111328125, -0.6476058959960938, -0.620452880859375, -0.5932998657226562, -0.5661468505859375, -0.5389938354492188, -0.5118408203125, -0.48468780517578125, -0.4575347900390625, -0.43038177490234375, -0.403228759765625, -0.37607574462890625, -0.3489227294921875, -0.32176971435546875, -0.29461669921875, -0.26746368408203125, -0.2403106689453125, -0.21315765380859375, -0.186004638671875, -0.15885162353515625, -0.1316986083984375, -0.10454559326171875, -0.077392578125, -0.05023956298828125, -0.0230865478515625, 0.00406646728515625, 0.031219482421875, 0.05837249755859375, 0.0855255126953125, 0.11267852783203125, 0.13983154296875, 0.16698455810546875, 0.1941375732421875, 0.22129058837890625, 0.248443603515625, 0.27559661865234375, 0.3027496337890625, 0.32990264892578125, 0.3570556640625, 0.38420867919921875, 0.4113616943359375, 0.43851470947265625, 0.465667724609375, 0.49282073974609375, 0.5199737548828125, 0.5471267700195312, 0.57427978515625, 0.6014328002929688, 0.6285858154296875, 0.6557388305664062, 0.682891845703125, 0.7100448608398438, 0.7371978759765625, 0.7643508911132812, 0.79150390625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 9.0, 9.0, 13.0, 24.0, 58.0, 124.0, 259.0, 247.0, 143.0, 58.0, 28.0, 15.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.249243885278702e-05, -8.765049278736115e-05, -8.280854672193527e-05, -7.79666006565094e-05, -7.312465459108353e-05, -6.828270852565765e-05, -6.344076246023178e-05, -5.859881639480591e-05, -5.3756870329380035e-05, -4.891492426395416e-05, -4.407297819852829e-05, -3.923103213310242e-05, -3.4389086067676544e-05, -2.954714000225067e-05, -2.47051939368248e-05, -1.9863247871398926e-05, -1.5021301805973053e-05, -1.017935574054718e-05, -5.337409675121307e-06, -4.954636096954346e-07, 4.346482455730438e-06, 9.188428521156311e-06, 1.4030374586582184e-05, 1.8872320652008057e-05, 2.371426671743393e-05, 2.8556212782859802e-05, 3.3398158848285675e-05, 3.824010491371155e-05, 4.308205097913742e-05, 4.7923997044563293e-05, 5.2765943109989166e-05, 5.760788917541504e-05, 6.244983524084091e-05, 6.729178130626678e-05, 7.213372737169266e-05, 7.697567343711853e-05, 8.18176195025444e-05, 8.665956556797028e-05, 9.150151163339615e-05, 9.634345769882202e-05, 0.0001011854037642479, 0.00010602734982967377, 0.00011086929589509964, 0.00011571124196052551, 0.00012055318802595139, 0.00012539513409137726, 0.00013023708015680313, 0.000135079026222229, 0.00013992097228765488, 0.00014476291835308075, 0.00014960486441850662, 0.0001544468104839325, 0.00015928875654935837, 0.00016413070261478424, 0.0001689726486802101, 0.00017381459474563599, 0.00017865654081106186, 0.00018349848687648773, 0.0001883404329419136, 0.00019318237900733948, 0.00019802432507276535, 0.00020286627113819122, 0.0002077082172036171, 0.00021255016326904297]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 16.0, 21.0, 22.0, 31.0, 51.0, 77.0, 132.0, 209.0, 415.0, 727.0, 1610.0, 4331.0, 26443.0, 823529.0, 176325.0, 9458.0, 2589.0, 1141.0, 599.0, 329.0, 181.0, 113.0, 61.0, 50.0, 25.0, 18.0, 14.0, 14.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.884765625, -0.85504150390625, -0.8253173828125, -0.79559326171875, -0.765869140625, -0.73614501953125, -0.7064208984375, -0.67669677734375, -0.64697265625, -0.61724853515625, -0.5875244140625, -0.55780029296875, -0.528076171875, -0.49835205078125, -0.4686279296875, -0.43890380859375, -0.4091796875, -0.37945556640625, -0.3497314453125, -0.32000732421875, -0.290283203125, -0.26055908203125, -0.2308349609375, -0.20111083984375, -0.17138671875, -0.14166259765625, -0.1119384765625, -0.08221435546875, -0.052490234375, -0.02276611328125, 0.0069580078125, 0.03668212890625, 0.06640625, 0.09613037109375, 0.1258544921875, 0.15557861328125, 0.185302734375, 0.21502685546875, 0.2447509765625, 0.27447509765625, 0.30419921875, 0.33392333984375, 0.3636474609375, 0.39337158203125, 0.423095703125, 0.45281982421875, 0.4825439453125, 0.51226806640625, 0.5419921875, 0.57171630859375, 0.6014404296875, 0.63116455078125, 0.660888671875, 0.69061279296875, 0.7203369140625, 0.75006103515625, 0.77978515625, 0.80950927734375, 0.8392333984375, 0.86895751953125, 0.898681640625, 0.92840576171875, 0.9581298828125, 0.98785400390625, 1.017578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 8.0, 13.0, 15.0, 32.0, 94.0, 213.0, 281.0, 176.0, 88.0, 34.0, 15.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.8074569702148438, -0.7609100341796875, -0.7143630981445312, -0.667816162109375, -0.6212692260742188, -0.5747222900390625, -0.5281753540039062, -0.48162841796875, -0.43508148193359375, -0.3885345458984375, -0.34198760986328125, -0.295440673828125, -0.24889373779296875, -0.2023468017578125, -0.15579986572265625, -0.1092529296875, -0.06270599365234375, -0.0161590576171875, 0.03038787841796875, 0.076934814453125, 0.12348175048828125, 0.1700286865234375, 0.21657562255859375, 0.26312255859375, 0.30966949462890625, 0.3562164306640625, 0.40276336669921875, 0.449310302734375, 0.49585723876953125, 0.5424041748046875, 0.5889511108398438, 0.635498046875, 0.6820449829101562, 0.7285919189453125, 0.7751388549804688, 0.821685791015625, 0.8682327270507812, 0.9147796630859375, 0.9613265991210938, 1.00787353515625, 1.0544204711914062, 1.1009674072265625, 1.1475143432617188, 1.194061279296875, 1.2406082153320312, 1.2871551513671875, 1.3337020874023438, 1.3802490234375, 1.4267959594726562, 1.4733428955078125, 1.5198898315429688, 1.566436767578125, 1.6129837036132812, 1.6595306396484375, 1.7060775756835938, 1.75262451171875, 1.7991714477539062, 1.8457183837890625, 1.8922653198242188, 1.938812255859375, 1.9853591918945312, 2.0319061279296875, 2.0784530639648438, 2.125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 19.0, 45.0, 88.0, 215.0, 259.0, 172.0, 112.0, 47.0, 10.0, 13.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.22579574584961, -17.72553062438965, -17.225263595581055, -16.724998474121094, -16.224733352661133, -15.724466323852539, -15.224201202392578, -14.7239351272583, -14.223669052124023, -13.723402976989746, -13.223137855529785, -12.722871780395508, -12.22260570526123, -11.722339630126953, -11.222074508666992, -10.721808433532715, -10.221543312072754, -9.721277236938477, -9.221012115478516, -8.720746040344238, -8.220479965209961, -7.720214366912842, -7.219948768615723, -6.719682693481445, -6.219417095184326, -5.719151496887207, -5.21888542175293, -4.7186198234558105, -4.218354225158691, -3.718088150024414, -3.217822551727295, -2.7175567150115967, -2.2172908782958984, -1.7170250415802002, -1.2167593240737915, -0.7164936065673828, -0.21622776985168457, 0.28403806686401367, 0.7843036651611328, 1.284569501876831, 1.7848353385925293, 2.2851011753082275, 2.785367012023926, 3.285632610321045, 3.785898447036743, 4.286164283752441, 4.7864298820495605, 5.28669548034668, 5.786961555480957, 6.287227153778076, 6.7874932289123535, 7.287758827209473, 7.78802490234375, 8.288290023803711, 8.788556098937988, 9.288822174072266, 9.789087295532227, 10.289353370666504, 10.789618492126465, 11.289884567260742, 11.79015064239502, 12.290416717529297, 12.790681838989258, 13.290947914123535, 13.791213989257812]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 10.0, 10.0, 10.0, 14.0, 10.0, 11.0, 18.0, 20.0, 28.0, 29.0, 36.0, 28.0, 37.0, 55.0, 51.0, 51.0, 40.0, 33.0, 51.0, 38.0, 37.0, 44.0, 47.0, 38.0, 30.0, 26.0, 29.0, 34.0, 16.0, 26.0, 20.0, 16.0, 17.0, 6.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0], "bins": [-10.728023529052734, -10.451824188232422, -10.17562484741211, -9.899425506591797, -9.6232271194458, -9.347027778625488, -9.070828437805176, -8.794629096984863, -8.51842975616455, -8.242230415344238, -7.966031551361084, -7.6898322105407715, -7.413632869720459, -7.137434005737305, -6.861234664916992, -6.58503532409668, -6.308836460113525, -6.032637119293213, -5.756438255310059, -5.480238914489746, -5.204039573669434, -4.927840232849121, -4.651641368865967, -4.375442028045654, -4.0992431640625, -3.8230440616607666, -3.546844720840454, -3.2706456184387207, -2.994446277618408, -2.718247175216675, -2.4420480728149414, -2.165848731994629, -1.8896493911743164, -1.6134501695632935, -1.3372509479522705, -1.061051845550537, -0.7848526239395142, -0.5086534023284912, -0.2324542999267578, 0.04374492168426514, 0.3199441432952881, 0.596143364906311, 0.8723425269126892, 1.1485416889190674, 1.4247409105300903, 1.7009401321411133, 1.9771392345428467, 2.25333833694458, 2.5295376777648926, 2.805736780166626, 3.0819361209869385, 3.358135223388672, 3.6343345642089844, 3.9105336666107178, 4.186732769012451, 4.462932109832764, 4.739130973815918, 5.0153303146362305, 5.291529178619385, 5.567728519439697, 5.84392786026001, 6.120126724243164, 6.396326065063477, 6.672525405883789, 6.948724746704102]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 3.0, 5.0, 7.0, 7.0, 12.0, 14.0, 12.0, 20.0, 22.0, 36.0, 42.0, 48.0, 54.0, 83.0, 97.0, 137.0, 141.0, 195.0, 297.0, 425.0, 669.0, 1185.0, 2582.0, 14315.0, 4146562.0, 20518.0, 3103.0, 1244.0, 710.0, 431.0, 345.0, 239.0, 161.0, 102.0, 106.0, 83.0, 72.0, 41.0, 34.0, 27.0, 21.0, 25.0, 7.0, 10.0, 13.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.52734375, -2.4542236328125, -2.381103515625, -2.3079833984375, -2.23486328125, -2.1617431640625, -2.088623046875, -2.0155029296875, -1.9423828125, -1.8692626953125, -1.796142578125, -1.7230224609375, -1.64990234375, -1.5767822265625, -1.503662109375, -1.4305419921875, -1.357421875, -1.2843017578125, -1.211181640625, -1.1380615234375, -1.06494140625, -0.9918212890625, -0.918701171875, -0.8455810546875, -0.7724609375, -0.6993408203125, -0.626220703125, -0.5531005859375, -0.47998046875, -0.4068603515625, -0.333740234375, -0.2606201171875, -0.1875, -0.1143798828125, -0.041259765625, 0.0318603515625, 0.10498046875, 0.1781005859375, 0.251220703125, 0.3243408203125, 0.3974609375, 0.4705810546875, 0.543701171875, 0.6168212890625, 0.68994140625, 0.7630615234375, 0.836181640625, 0.9093017578125, 0.982421875, 1.0555419921875, 1.128662109375, 1.2017822265625, 1.27490234375, 1.3480224609375, 1.421142578125, 1.4942626953125, 1.5673828125, 1.6405029296875, 1.713623046875, 1.7867431640625, 1.85986328125, 1.9329833984375, 2.006103515625, 2.0792236328125, 2.15234375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 13.0, 13.0, 14.0, 15.0, 20.0, 14.0, 23.0, 21.0, 33.0, 36.0, 27.0, 38.0, 42.0, 45.0, 44.0, 51.0, 39.0, 41.0, 42.0, 53.0, 23.0, 44.0, 24.0, 33.0, 32.0, 30.0, 21.0, 29.0, 18.0, 20.0, 16.0, 9.0, 9.0, 10.0, 7.0, 5.0, 6.0, 3.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.431640625, -0.4192352294921875, -0.406829833984375, -0.3944244384765625, -0.38201904296875, -0.3696136474609375, -0.357208251953125, -0.3448028564453125, -0.3323974609375, -0.3199920654296875, -0.307586669921875, -0.2951812744140625, -0.28277587890625, -0.2703704833984375, -0.257965087890625, -0.2455596923828125, -0.233154296875, -0.2207489013671875, -0.208343505859375, -0.1959381103515625, -0.18353271484375, -0.1711273193359375, -0.158721923828125, -0.1463165283203125, -0.1339111328125, -0.1215057373046875, -0.109100341796875, -0.0966949462890625, -0.08428955078125, -0.0718841552734375, -0.059478759765625, -0.0470733642578125, -0.03466796875, -0.0222625732421875, -0.009857177734375, 0.0025482177734375, 0.01495361328125, 0.0273590087890625, 0.039764404296875, 0.0521697998046875, 0.0645751953125, 0.0769805908203125, 0.089385986328125, 0.1017913818359375, 0.11419677734375, 0.1266021728515625, 0.139007568359375, 0.1514129638671875, 0.163818359375, 0.1762237548828125, 0.188629150390625, 0.2010345458984375, 0.21343994140625, 0.2258453369140625, 0.238250732421875, 0.2506561279296875, 0.2630615234375, 0.2754669189453125, 0.287872314453125, 0.3002777099609375, 0.31268310546875, 0.3250885009765625, 0.337493896484375, 0.3498992919921875, 0.3623046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 7.0, 11.0, 13.0, 10.0, 15.0, 20.0, 32.0, 34.0, 53.0, 60.0, 107.0, 120.0, 142.0, 211.0, 279.0, 377.0, 561.0, 828.0, 1255.0, 2232.0, 5159.0, 17769.0, 4053889.0, 92173.0, 10007.0, 3560.0, 1786.0, 1064.0, 734.0, 453.0, 339.0, 254.0, 181.0, 148.0, 104.0, 67.0, 62.0, 39.0, 39.0, 23.0, 18.0, 10.0, 13.0, 11.0, 12.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.857421875, -1.7990264892578125, -1.740631103515625, -1.6822357177734375, -1.62384033203125, -1.5654449462890625, -1.507049560546875, -1.4486541748046875, -1.3902587890625, -1.3318634033203125, -1.273468017578125, -1.2150726318359375, -1.15667724609375, -1.0982818603515625, -1.039886474609375, -0.9814910888671875, -0.923095703125, -0.8647003173828125, -0.806304931640625, -0.7479095458984375, -0.68951416015625, -0.6311187744140625, -0.572723388671875, -0.5143280029296875, -0.4559326171875, -0.3975372314453125, -0.339141845703125, -0.2807464599609375, -0.22235107421875, -0.1639556884765625, -0.105560302734375, -0.0471649169921875, 0.01123046875, 0.0696258544921875, 0.128021240234375, 0.1864166259765625, 0.24481201171875, 0.3032073974609375, 0.361602783203125, 0.4199981689453125, 0.4783935546875, 0.5367889404296875, 0.595184326171875, 0.6535797119140625, 0.71197509765625, 0.7703704833984375, 0.828765869140625, 0.8871612548828125, 0.945556640625, 1.0039520263671875, 1.062347412109375, 1.1207427978515625, 1.17913818359375, 1.2375335693359375, 1.295928955078125, 1.3543243408203125, 1.4127197265625, 1.4711151123046875, 1.529510498046875, 1.5879058837890625, 1.64630126953125, 1.7046966552734375, 1.763092041015625, 1.8214874267578125, 1.8798828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 22.0, 141.0, 3818.0, 41.0, 16.0, 12.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7828445434570312, -0.7585601806640625, -0.7342758178710938, -0.709991455078125, -0.6857070922851562, -0.6614227294921875, -0.6371383666992188, -0.61285400390625, -0.5885696411132812, -0.5642852783203125, -0.5400009155273438, -0.515716552734375, -0.49143218994140625, -0.4671478271484375, -0.44286346435546875, -0.4185791015625, -0.39429473876953125, -0.3700103759765625, -0.34572601318359375, -0.321441650390625, -0.29715728759765625, -0.2728729248046875, -0.24858856201171875, -0.22430419921875, -0.20001983642578125, -0.1757354736328125, -0.15145111083984375, -0.127166748046875, -0.10288238525390625, -0.0785980224609375, -0.05431365966796875, -0.030029296875, -0.00574493408203125, 0.0185394287109375, 0.04282379150390625, 0.067108154296875, 0.09139251708984375, 0.1156768798828125, 0.13996124267578125, 0.16424560546875, 0.18852996826171875, 0.2128143310546875, 0.23709869384765625, 0.261383056640625, 0.28566741943359375, 0.3099517822265625, 0.33423614501953125, 0.3585205078125, 0.38280487060546875, 0.4070892333984375, 0.43137359619140625, 0.455657958984375, 0.47994232177734375, 0.5042266845703125, 0.5285110473632812, 0.55279541015625, 0.5770797729492188, 0.6013641357421875, 0.6256484985351562, 0.649932861328125, 0.6742172241210938, 0.6985015869140625, 0.7227859497070312, 0.7470703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 23.0, 18.0, 38.0, 64.0, 81.0, 121.0, 162.0, 160.0, 126.0, 73.0, 51.0, 25.0, 14.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1238667964935303, -1.0766856670379639, -1.029504418373108, -0.9823232889175415, -0.9351420998573303, -0.8879609107971191, -0.8407797813415527, -0.7935985922813416, -0.7464174032211304, -0.6992362141609192, -0.652055025100708, -0.6048738956451416, -0.5576927065849304, -0.5105115175247192, -0.46333035826683044, -0.41614919900894165, -0.36896800994873047, -0.3217868208885193, -0.2746056616306305, -0.2274244874715805, -0.18024331331253052, -0.13306213915348053, -0.08588096499443054, -0.03869980573654175, 0.008481383323669434, 0.05566255748271942, 0.10284373164176941, 0.1500249058008194, 0.19720607995986938, 0.24438725411891937, 0.29156842827796936, 0.33874958753585815, 0.3859308958053589, 0.43311208486557007, 0.48029324412345886, 0.5274744033813477, 0.5746555924415588, 0.62183678150177, 0.6690179109573364, 0.7161991000175476, 0.7633802890777588, 0.81056147813797, 0.8577426671981812, 0.9049237966537476, 0.9521049857139587, 0.9992861747741699, 1.0464673042297363, 1.0936484336853027, 1.1408296823501587, 1.188010811805725, 1.235192060470581, 1.2823731899261475, 1.3295543193817139, 1.3767355680465698, 1.4239166975021362, 1.4710979461669922, 1.5182790756225586, 1.565460205078125, 1.612641453742981, 1.6598225831985474, 1.7070038318634033, 1.7541849613189697, 1.8013660907745361, 1.8485472202301025, 1.8957284688949585]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 8.0, 12.0, 10.0, 21.0, 19.0, 21.0, 22.0, 30.0, 43.0, 45.0, 39.0, 38.0, 57.0, 48.0, 51.0, 62.0, 51.0, 42.0, 47.0, 39.0, 33.0, 43.0, 33.0, 35.0, 25.0, 27.0, 22.0, 16.0, 11.0, 10.0, 12.0, 4.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0886290073394775, -1.0520042181015015, -1.0153794288635254, -0.9787546396255493, -0.9421297907829285, -0.9055050015449524, -0.8688802123069763, -0.8322553634643555, -0.7956305742263794, -0.7590057849884033, -0.7223809957504272, -0.6857562065124512, -0.6491313576698303, -0.6125065684318542, -0.5758817791938782, -0.5392569303512573, -0.502632200717926, -0.46600741147994995, -0.4293825924396515, -0.3927578032016754, -0.35613298416137695, -0.3195081949234009, -0.2828834056854248, -0.24625858664512634, -0.20963379740715027, -0.173008993268013, -0.13638418912887573, -0.09975939989089966, -0.06313459575176239, -0.026509791612625122, 0.010114997625350952, 0.046739816665649414, 0.08336460590362549, 0.11998941004276276, 0.15661421418190002, 0.1932390034198761, 0.22986380755901337, 0.26648861169815063, 0.3031134009361267, 0.33973821997642517, 0.37636300921440125, 0.4129877984523773, 0.4496126174926758, 0.48623740673065186, 0.5228621959686279, 0.559486985206604, 0.5961117744445801, 0.6327366232872009, 0.669361412525177, 0.7059862017631531, 0.7426109910011292, 0.77923583984375, 0.8158606290817261, 0.8524854183197021, 0.8891102075576782, 0.9257349967956543, 0.9623597860336304, 0.9989845752716064, 1.0356093645095825, 1.0722341537475586, 1.1088589429855347, 1.1454837322235107, 1.1821086406707764, 1.2187334299087524, 1.2553582191467285]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 10.0, 4.0, 12.0, 8.0, 18.0, 30.0, 32.0, 63.0, 84.0, 102.0, 171.0, 203.0, 369.0, 525.0, 864.0, 1235.0, 1960.0, 3221.0, 5181.0, 8589.0, 14497.0, 25269.0, 46626.0, 92741.0, 202872.0, 298189.0, 170851.0, 78779.0, 40597.0, 22292.0, 12845.0, 7558.0, 4728.0, 2787.0, 1804.0, 1145.0, 756.0, 509.0, 334.0, 211.0, 145.0, 100.0, 72.0, 54.0, 31.0, 24.0, 20.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 3.0], "bins": [-0.70458984375, -0.6834869384765625, -0.662384033203125, -0.6412811279296875, -0.62017822265625, -0.5990753173828125, -0.577972412109375, -0.5568695068359375, -0.5357666015625, -0.5146636962890625, -0.493560791015625, -0.4724578857421875, -0.45135498046875, -0.4302520751953125, -0.409149169921875, -0.3880462646484375, -0.366943359375, -0.3458404541015625, -0.324737548828125, -0.3036346435546875, -0.28253173828125, -0.2614288330078125, -0.240325927734375, -0.2192230224609375, -0.1981201171875, -0.1770172119140625, -0.155914306640625, -0.1348114013671875, -0.11370849609375, -0.0926055908203125, -0.071502685546875, -0.0503997802734375, -0.029296875, -0.0081939697265625, 0.012908935546875, 0.0340118408203125, 0.05511474609375, 0.0762176513671875, 0.097320556640625, 0.1184234619140625, 0.1395263671875, 0.1606292724609375, 0.181732177734375, 0.2028350830078125, 0.22393798828125, 0.2450408935546875, 0.266143798828125, 0.2872467041015625, 0.308349609375, 0.3294525146484375, 0.350555419921875, 0.3716583251953125, 0.39276123046875, 0.4138641357421875, 0.434967041015625, 0.4560699462890625, 0.4771728515625, 0.4982757568359375, 0.519378662109375, 0.5404815673828125, 0.56158447265625, 0.5826873779296875, 0.603790283203125, 0.6248931884765625, 0.64599609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 7.0, 5.0, 7.0, 9.0, 14.0, 16.0, 12.0, 17.0, 20.0, 15.0, 35.0, 35.0, 30.0, 31.0, 45.0, 37.0, 52.0, 44.0, 55.0, 50.0, 34.0, 32.0, 44.0, 40.0, 34.0, 36.0, 24.0, 28.0, 30.0, 23.0, 17.0, 21.0, 20.0, 16.0, 8.0, 12.0, 9.0, 5.0, 7.0, 3.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5107421875, -0.495849609375, -0.48095703125, -0.466064453125, -0.451171875, -0.436279296875, -0.42138671875, -0.406494140625, -0.3916015625, -0.376708984375, -0.36181640625, -0.346923828125, -0.33203125, -0.317138671875, -0.30224609375, -0.287353515625, -0.2724609375, -0.257568359375, -0.24267578125, -0.227783203125, -0.212890625, -0.197998046875, -0.18310546875, -0.168212890625, -0.1533203125, -0.138427734375, -0.12353515625, -0.108642578125, -0.09375, -0.078857421875, -0.06396484375, -0.049072265625, -0.0341796875, -0.019287109375, -0.00439453125, 0.010498046875, 0.025390625, 0.040283203125, 0.05517578125, 0.070068359375, 0.0849609375, 0.099853515625, 0.11474609375, 0.129638671875, 0.14453125, 0.159423828125, 0.17431640625, 0.189208984375, 0.2041015625, 0.218994140625, 0.23388671875, 0.248779296875, 0.263671875, 0.278564453125, 0.29345703125, 0.308349609375, 0.3232421875, 0.338134765625, 0.35302734375, 0.367919921875, 0.3828125, 0.397705078125, 0.41259765625, 0.427490234375, 0.4423828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 13.0, 13.0, 20.0, 35.0, 37.0, 39.0, 58.0, 125.0, 212.0, 409.0, 917.0, 2196.0, 6318.0, 21465.0, 91138.0, 546609.0, 304387.0, 53108.0, 14038.0, 4383.0, 1544.0, 684.0, 318.0, 174.0, 82.0, 61.0, 47.0, 26.0, 28.0, 18.0, 8.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.001953125, -1.946075439453125, -1.89019775390625, -1.834320068359375, -1.7784423828125, -1.722564697265625, -1.66668701171875, -1.610809326171875, -1.554931640625, -1.499053955078125, -1.44317626953125, -1.387298583984375, -1.3314208984375, -1.275543212890625, -1.21966552734375, -1.163787841796875, -1.10791015625, -1.052032470703125, -0.99615478515625, -0.940277099609375, -0.8843994140625, -0.828521728515625, -0.77264404296875, -0.716766357421875, -0.660888671875, -0.605010986328125, -0.54913330078125, -0.493255615234375, -0.4373779296875, -0.381500244140625, -0.32562255859375, -0.269744873046875, -0.2138671875, -0.157989501953125, -0.10211181640625, -0.046234130859375, 0.0096435546875, 0.065521240234375, 0.12139892578125, 0.177276611328125, 0.233154296875, 0.289031982421875, 0.34490966796875, 0.400787353515625, 0.4566650390625, 0.512542724609375, 0.56842041015625, 0.624298095703125, 0.68017578125, 0.736053466796875, 0.79193115234375, 0.847808837890625, 0.9036865234375, 0.959564208984375, 1.01544189453125, 1.071319580078125, 1.127197265625, 1.183074951171875, 1.23895263671875, 1.294830322265625, 1.3507080078125, 1.406585693359375, 1.46246337890625, 1.518341064453125, 1.57421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 4.0, 9.0, 11.0, 18.0, 17.0, 23.0, 23.0, 29.0, 23.0, 30.0, 47.0, 40.0, 49.0, 39.0, 57.0, 45.0, 45.0, 31.0, 52.0, 48.0, 54.0, 46.0, 41.0, 37.0, 33.0, 23.0, 19.0, 16.0, 18.0, 12.0, 9.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.103515625, -3.010284423828125, -2.91705322265625, -2.823822021484375, -2.7305908203125, -2.637359619140625, -2.54412841796875, -2.450897216796875, -2.357666015625, -2.264434814453125, -2.17120361328125, -2.077972412109375, -1.9847412109375, -1.891510009765625, -1.79827880859375, -1.705047607421875, -1.61181640625, -1.518585205078125, -1.42535400390625, -1.332122802734375, -1.2388916015625, -1.145660400390625, -1.05242919921875, -0.959197998046875, -0.865966796875, -0.772735595703125, -0.67950439453125, -0.586273193359375, -0.4930419921875, -0.399810791015625, -0.30657958984375, -0.213348388671875, -0.1201171875, -0.026885986328125, 0.06634521484375, 0.159576416015625, 0.2528076171875, 0.346038818359375, 0.43927001953125, 0.532501220703125, 0.625732421875, 0.718963623046875, 0.81219482421875, 0.905426025390625, 0.9986572265625, 1.091888427734375, 1.18511962890625, 1.278350830078125, 1.37158203125, 1.464813232421875, 1.55804443359375, 1.651275634765625, 1.7445068359375, 1.837738037109375, 1.93096923828125, 2.024200439453125, 2.117431640625, 2.210662841796875, 2.30389404296875, 2.397125244140625, 2.4903564453125, 2.583587646484375, 2.67681884765625, 2.770050048828125, 2.86328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 12.0, 14.0, 19.0, 46.0, 85.0, 265.0, 720.0, 2837.0, 24508.0, 737815.0, 268202.0, 11408.0, 1827.0, 451.0, 155.0, 78.0, 41.0, 21.0, 14.0, 13.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8729629516601562, -0.8391876220703125, -0.8054122924804688, -0.771636962890625, -0.7378616333007812, -0.7040863037109375, -0.6703109741210938, -0.63653564453125, -0.6027603149414062, -0.5689849853515625, -0.5352096557617188, -0.501434326171875, -0.46765899658203125, -0.4338836669921875, -0.40010833740234375, -0.3663330078125, -0.33255767822265625, -0.2987823486328125, -0.26500701904296875, -0.231231689453125, -0.19745635986328125, -0.1636810302734375, -0.12990570068359375, -0.09613037109375, -0.06235504150390625, -0.0285797119140625, 0.00519561767578125, 0.038970947265625, 0.07274627685546875, 0.1065216064453125, 0.14029693603515625, 0.174072265625, 0.20784759521484375, 0.2416229248046875, 0.27539825439453125, 0.309173583984375, 0.34294891357421875, 0.3767242431640625, 0.41049957275390625, 0.44427490234375, 0.47805023193359375, 0.5118255615234375, 0.5456008911132812, 0.579376220703125, 0.6131515502929688, 0.6469268798828125, 0.6807022094726562, 0.7144775390625, 0.7482528686523438, 0.7820281982421875, 0.8158035278320312, 0.849578857421875, 0.8833541870117188, 0.9171295166015625, 0.9509048461914062, 0.98468017578125, 1.0184555053710938, 1.0522308349609375, 1.0860061645507812, 1.119781494140625, 1.1535568237304688, 1.1873321533203125, 1.2211074829101562, 1.2548828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 6.0, 9.0, 26.0, 26.0, 63.0, 95.0, 117.0, 146.0, 155.0, 118.0, 89.0, 57.0, 33.0, 24.0, 13.0, 9.0, 8.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010907649993896484, -0.0001053251326084137, -0.00010157376527786255, -9.78223979473114e-05, -9.407103061676025e-05, -9.03196632862091e-05, -8.656829595565796e-05, -8.281692862510681e-05, -7.906556129455566e-05, -7.531419396400452e-05, -7.156282663345337e-05, -6.781145930290222e-05, -6.406009197235107e-05, -6.030872464179993e-05, -5.655735731124878e-05, -5.280598998069763e-05, -4.9054622650146484e-05, -4.530325531959534e-05, -4.155188798904419e-05, -3.780052065849304e-05, -3.4049153327941895e-05, -3.0297785997390747e-05, -2.65464186668396e-05, -2.2795051336288452e-05, -1.9043684005737305e-05, -1.5292316675186157e-05, -1.154094934463501e-05, -7.789582014083862e-06, -4.038214683532715e-06, -2.868473529815674e-07, 3.46451997756958e-06, 7.2158873081207275e-06, 1.0967254638671875e-05, 1.4718621969223022e-05, 1.846998929977417e-05, 2.2221356630325317e-05, 2.5972723960876465e-05, 2.9724091291427612e-05, 3.347545862197876e-05, 3.722682595252991e-05, 4.0978193283081055e-05, 4.47295606136322e-05, 4.848092794418335e-05, 5.22322952747345e-05, 5.5983662605285645e-05, 5.973502993583679e-05, 6.348639726638794e-05, 6.723776459693909e-05, 7.098913192749023e-05, 7.474049925804138e-05, 7.849186658859253e-05, 8.224323391914368e-05, 8.599460124969482e-05, 8.974596858024597e-05, 9.349733591079712e-05, 9.724870324134827e-05, 0.00010100007057189941, 0.00010475143790245056, 0.00010850280523300171, 0.00011225417256355286, 0.000116005539894104, 0.00011975690722465515, 0.0001235082745552063, 0.00012725964188575745, 0.0001310110092163086]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 10.0, 7.0, 9.0, 27.0, 43.0, 54.0, 122.0, 304.0, 904.0, 4352.0, 37119.0, 608022.0, 370969.0, 22481.0, 2976.0, 685.0, 231.0, 101.0, 57.0, 36.0, 23.0, 9.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45458984375, -0.43053436279296875, -0.4064788818359375, -0.38242340087890625, -0.358367919921875, -0.33431243896484375, -0.3102569580078125, -0.28620147705078125, -0.26214599609375, -0.23809051513671875, -0.2140350341796875, -0.18997955322265625, -0.165924072265625, -0.14186859130859375, -0.1178131103515625, -0.09375762939453125, -0.0697021484375, -0.04564666748046875, -0.0215911865234375, 0.00246429443359375, 0.026519775390625, 0.05057525634765625, 0.0746307373046875, 0.09868621826171875, 0.12274169921875, 0.14679718017578125, 0.1708526611328125, 0.19490814208984375, 0.218963623046875, 0.24301910400390625, 0.2670745849609375, 0.29113006591796875, 0.315185546875, 0.33924102783203125, 0.3632965087890625, 0.38735198974609375, 0.411407470703125, 0.43546295166015625, 0.4595184326171875, 0.48357391357421875, 0.50762939453125, 0.5316848754882812, 0.5557403564453125, 0.5797958374023438, 0.603851318359375, 0.6279067993164062, 0.6519622802734375, 0.6760177612304688, 0.7000732421875, 0.7241287231445312, 0.7481842041015625, 0.7722396850585938, 0.796295166015625, 0.8203506469726562, 0.8444061279296875, 0.8684616088867188, 0.89251708984375, 0.9165725708007812, 0.9406280517578125, 0.9646835327148438, 0.988739013671875, 1.0127944946289062, 1.0368499755859375, 1.0609054565429688, 1.0849609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 8.0, 22.0, 26.0, 38.0, 43.0, 50.0, 73.0, 89.0, 91.0, 105.0, 80.0, 97.0, 59.0, 44.0, 38.0, 39.0, 19.0, 10.0, 9.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.462646484375, -0.4397773742675781, -0.41690826416015625, -0.3940391540527344, -0.3711700439453125, -0.3483009338378906, -0.32543182373046875, -0.3025627136230469, -0.279693603515625, -0.2568244934082031, -0.23395538330078125, -0.21108627319335938, -0.1882171630859375, -0.16534805297851562, -0.14247894287109375, -0.11960983276367188, -0.09674072265625, -0.07387161254882812, -0.05100250244140625, -0.028133392333984375, -0.0052642822265625, 0.017604827880859375, 0.04047393798828125, 0.06334304809570312, 0.086212158203125, 0.10908126831054688, 0.13195037841796875, 0.15481948852539062, 0.1776885986328125, 0.20055770874023438, 0.22342681884765625, 0.24629592895507812, 0.2691650390625, 0.2920341491699219, 0.31490325927734375, 0.3377723693847656, 0.3606414794921875, 0.3835105895996094, 0.40637969970703125, 0.4292488098144531, 0.452117919921875, 0.4749870300292969, 0.49785614013671875, 0.5207252502441406, 0.5435943603515625, 0.5664634704589844, 0.5893325805664062, 0.6122016906738281, 0.63507080078125, 0.6579399108886719, 0.6808090209960938, 0.7036781311035156, 0.7265472412109375, 0.7494163513183594, 0.7722854614257812, 0.7951545715332031, 0.818023681640625, 0.8408927917480469, 0.8637619018554688, 0.8866310119628906, 0.9095001220703125, 0.9323692321777344, 0.9552383422851562, 0.9781074523925781, 1.0009765625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 10.0, 18.0, 34.0, 65.0, 179.0, 327.0, 221.0, 77.0, 49.0, 18.0, 9.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.836753845214844, -6.047939777374268, -5.259125709533691, -4.470311164855957, -3.68149733543396, -2.892683267593384, -2.1038689613342285, -1.3150548934936523, -0.5262408256530762, 0.2625733017921448, 1.0513874292373657, 1.8402016162872314, 2.6290156841278076, 3.417829751968384, 4.206644058227539, 4.995458126068115, 5.784272193908691, 6.573086261749268, 7.361900329589844, 8.150714874267578, 8.939528465270996, 9.72834300994873, 10.517156600952148, 11.305971145629883, 12.094785690307617, 12.883600234985352, 13.67241382598877, 14.461228370666504, 15.250041961669922, 16.038856506347656, 16.82767105102539, 17.616485595703125, 18.405298233032227, 19.19411277770996, 19.982927322387695, 20.771739959716797, 21.56055450439453, 22.349369049072266, 23.13818359375, 23.926998138427734, 24.715810775756836, 25.50462532043457, 26.293439865112305, 27.082252502441406, 27.87106704711914, 28.659881591796875, 29.44869613647461, 30.237510681152344, 31.026325225830078, 31.815139770507812, 32.60395431518555, 33.39276885986328, 34.181583404541016, 34.970394134521484, 35.75920867919922, 36.54802322387695, 37.33683776855469, 38.12565231323242, 38.914466857910156, 39.70328140258789, 40.492095947265625, 41.280906677246094, 42.06972122192383, 42.85853576660156, 43.6473503112793]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 6.0, 7.0, 11.0, 15.0, 21.0, 18.0, 16.0, 28.0, 30.0, 54.0, 42.0, 36.0, 54.0, 71.0, 65.0, 62.0, 62.0, 56.0, 43.0, 35.0, 44.0, 34.0, 22.0, 20.0, 28.0, 24.0, 18.0, 19.0, 5.0, 11.0, 5.0, 5.0, 11.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.14488983154297, -15.629015922546387, -15.113142967224121, -14.597269058227539, -14.081395149230957, -13.565521240234375, -13.04964828491211, -12.533774375915527, -12.017900466918945, -11.502026557922363, -10.986153602600098, -10.470279693603516, -9.954405784606934, -9.438531875610352, -8.922658920288086, -8.406785011291504, -7.890912055969238, -7.3750386238098145, -6.859164714813232, -6.343291282653809, -5.827417373657227, -5.311543941497803, -4.795670509338379, -4.279796600341797, -3.763923168182373, -3.24804949760437, -2.732175827026367, -2.2163023948669434, -1.7004287242889404, -1.1845550537109375, -0.6686816215515137, -0.15280795097351074, 0.3630657196044922, 0.8789393305778503, 1.3948129415512085, 1.9106864929199219, 2.426560163497925, 2.9424338340759277, 3.4583072662353516, 3.9741809368133545, 4.490054607391357, 5.005928039550781, 5.521801948547363, 6.037675380706787, 6.553548812866211, 7.069422721862793, 7.585296154022217, 8.10116958618164, 8.617043495178223, 9.132917404174805, 9.64879035949707, 10.164664268493652, 10.680538177490234, 11.1964111328125, 11.712285041809082, 12.228158950805664, 12.74403190612793, 13.259905815124512, 13.775778770446777, 14.29165267944336, 14.807526588439941, 15.323400497436523, 15.839273452758789, 16.355146408081055, 16.871021270751953]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 12.0, 11.0, 16.0, 32.0, 26.0, 36.0, 48.0, 75.0, 110.0, 151.0, 248.0, 346.0, 570.0, 943.0, 1746.0, 3912.0, 11646.0, 264044.0, 3888578.0, 13006.0, 3973.0, 1892.0, 1013.0, 594.0, 407.0, 225.0, 189.0, 112.0, 87.0, 51.0, 34.0, 31.0, 19.0, 19.0, 15.0, 23.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.3076171875, -1.2667999267578125, -1.225982666015625, -1.1851654052734375, -1.14434814453125, -1.1035308837890625, -1.062713623046875, -1.0218963623046875, -0.9810791015625, -0.9402618408203125, -0.899444580078125, -0.8586273193359375, -0.81781005859375, -0.7769927978515625, -0.736175537109375, -0.6953582763671875, -0.654541015625, -0.6137237548828125, -0.572906494140625, -0.5320892333984375, -0.49127197265625, -0.4504547119140625, -0.409637451171875, -0.3688201904296875, -0.3280029296875, -0.2871856689453125, -0.246368408203125, -0.2055511474609375, -0.16473388671875, -0.1239166259765625, -0.083099365234375, -0.0422821044921875, -0.00146484375, 0.0393524169921875, 0.080169677734375, 0.1209869384765625, 0.16180419921875, 0.2026214599609375, 0.243438720703125, 0.2842559814453125, 0.3250732421875, 0.3658905029296875, 0.406707763671875, 0.4475250244140625, 0.48834228515625, 0.5291595458984375, 0.569976806640625, 0.6107940673828125, 0.651611328125, 0.6924285888671875, 0.733245849609375, 0.7740631103515625, 0.81488037109375, 0.8556976318359375, 0.896514892578125, 0.9373321533203125, 0.9781494140625, 1.0189666748046875, 1.059783935546875, 1.1006011962890625, 1.14141845703125, 1.1822357177734375, 1.223052978515625, 1.2638702392578125, 1.3046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 9.0, 11.0, 16.0, 11.0, 12.0, 15.0, 32.0, 21.0, 27.0, 51.0, 37.0, 38.0, 49.0, 56.0, 59.0, 57.0, 66.0, 66.0, 57.0, 47.0, 33.0, 34.0, 39.0, 31.0, 19.0, 20.0, 9.0, 10.0, 20.0, 5.0, 6.0, 7.0, 8.0, 6.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7090606689453125, -0.685211181640625, -0.6613616943359375, -0.63751220703125, -0.6136627197265625, -0.589813232421875, -0.5659637451171875, -0.5421142578125, -0.5182647705078125, -0.494415283203125, -0.4705657958984375, -0.44671630859375, -0.4228668212890625, -0.399017333984375, -0.3751678466796875, -0.351318359375, -0.3274688720703125, -0.303619384765625, -0.2797698974609375, -0.25592041015625, -0.2320709228515625, -0.208221435546875, -0.1843719482421875, -0.1605224609375, -0.1366729736328125, -0.112823486328125, -0.0889739990234375, -0.06512451171875, -0.0412750244140625, -0.017425537109375, 0.0064239501953125, 0.0302734375, 0.0541229248046875, 0.077972412109375, 0.1018218994140625, 0.12567138671875, 0.1495208740234375, 0.173370361328125, 0.1972198486328125, 0.2210693359375, 0.2449188232421875, 0.268768310546875, 0.2926177978515625, 0.31646728515625, 0.3403167724609375, 0.364166259765625, 0.3880157470703125, 0.411865234375, 0.4357147216796875, 0.459564208984375, 0.4834136962890625, 0.50726318359375, 0.5311126708984375, 0.554962158203125, 0.5788116455078125, 0.6026611328125, 0.6265106201171875, 0.650360107421875, 0.6742095947265625, 0.69805908203125, 0.7219085693359375, 0.745758056640625, 0.7696075439453125, 0.79345703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 10.0, 5.0, 5.0, 7.0, 17.0, 13.0, 23.0, 34.0, 41.0, 45.0, 69.0, 97.0, 130.0, 145.0, 207.0, 319.0, 408.0, 590.0, 1049.0, 1736.0, 3353.0, 8608.0, 36344.0, 4031026.0, 86530.0, 13033.0, 4525.0, 2129.0, 1183.0, 777.0, 530.0, 326.0, 254.0, 194.0, 123.0, 105.0, 77.0, 66.0, 41.0, 33.0, 25.0, 17.0, 10.0, 7.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2587890625, -1.2148895263671875, -1.170989990234375, -1.1270904541015625, -1.08319091796875, -1.0392913818359375, -0.995391845703125, -0.9514923095703125, -0.9075927734375, -0.8636932373046875, -0.819793701171875, -0.7758941650390625, -0.73199462890625, -0.6880950927734375, -0.644195556640625, -0.6002960205078125, -0.556396484375, -0.5124969482421875, -0.468597412109375, -0.4246978759765625, -0.38079833984375, -0.3368988037109375, -0.292999267578125, -0.2490997314453125, -0.2052001953125, -0.1613006591796875, -0.117401123046875, -0.0735015869140625, -0.02960205078125, 0.0142974853515625, 0.058197021484375, 0.1020965576171875, 0.14599609375, 0.1898956298828125, 0.233795166015625, 0.2776947021484375, 0.32159423828125, 0.3654937744140625, 0.409393310546875, 0.4532928466796875, 0.4971923828125, 0.5410919189453125, 0.584991455078125, 0.6288909912109375, 0.67279052734375, 0.7166900634765625, 0.760589599609375, 0.8044891357421875, 0.848388671875, 0.8922882080078125, 0.936187744140625, 0.9800872802734375, 1.02398681640625, 1.0678863525390625, 1.111785888671875, 1.1556854248046875, 1.1995849609375, 1.2434844970703125, 1.287384033203125, 1.3312835693359375, 1.37518310546875, 1.4190826416015625, 1.462982177734375, 1.5068817138671875, 1.55078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 20.0, 62.0, 3318.0, 530.0, 58.0, 21.0, 21.0, 9.0, 1.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5976524353027344, -0.5805587768554688, -0.5634651184082031, -0.5463714599609375, -0.5292778015136719, -0.5121841430664062, -0.4950904846191406, -0.477996826171875, -0.4609031677246094, -0.44380950927734375, -0.4267158508300781, -0.4096221923828125, -0.3925285339355469, -0.37543487548828125, -0.3583412170410156, -0.34124755859375, -0.3241539001464844, -0.30706024169921875, -0.2899665832519531, -0.2728729248046875, -0.2557792663574219, -0.23868560791015625, -0.22159194946289062, -0.204498291015625, -0.18740463256835938, -0.17031097412109375, -0.15321731567382812, -0.1361236572265625, -0.11902999877929688, -0.10193634033203125, -0.08484268188476562, -0.0677490234375, -0.050655364990234375, -0.03356170654296875, -0.016468048095703125, 0.0006256103515625, 0.017719268798828125, 0.03481292724609375, 0.051906585693359375, 0.069000244140625, 0.08609390258789062, 0.10318756103515625, 0.12028121948242188, 0.1373748779296875, 0.15446853637695312, 0.17156219482421875, 0.18865585327148438, 0.20574951171875, 0.22284317016601562, 0.23993682861328125, 0.2570304870605469, 0.2741241455078125, 0.2912178039550781, 0.30831146240234375, 0.3254051208496094, 0.342498779296875, 0.3595924377441406, 0.37668609619140625, 0.3937797546386719, 0.4108734130859375, 0.4279670715332031, 0.44506072998046875, 0.4621543884277344, 0.479248046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 8.0, 33.0, 87.0, 179.0, 280.0, 242.0, 105.0, 42.0, 18.0, 13.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7683079242706299, -1.677186131477356, -1.586064338684082, -1.4949424266815186, -1.4038207530975342, -1.3126988410949707, -1.2215770483016968, -1.1304552555084229, -1.039333462715149, -0.948211669921875, -0.8570898771286011, -0.7659680247306824, -0.6748462319374084, -0.5837244391441345, -0.4926025867462158, -0.4014807939529419, -0.31035900115966797, -0.21923719346523285, -0.12811538577079773, -0.036993563175201416, 0.05412822961807251, 0.14525002241134644, 0.23637187480926514, 0.32749366760253906, 0.418615460395813, 0.5097372531890869, 0.6008590459823608, 0.6919808983802795, 0.7831026911735535, 0.8742244839668274, 0.9653463363647461, 1.05646812915802, 1.147590160369873, 1.238711953163147, 1.329833745956421, 1.4209556579589844, 1.5120773315429688, 1.6031992435455322, 1.6943210363388062, 1.78544282913208, 1.876564621925354, 1.967686414718628, 2.0588083267211914, 2.149930000305176, 2.2410519123077393, 2.3321735858917236, 2.423295497894287, 2.5144171714782715, 2.605539083480835, 2.6966609954833984, 2.787782669067383, 2.8789045810699463, 2.9700262546539307, 3.061148166656494, 3.1522698402404785, 3.243391752243042, 3.3345136642456055, 3.425635576248169, 3.5167572498321533, 3.607879161834717, 3.699000835418701, 3.7901227474212646, 3.881244659423828, 3.9723663330078125, 4.063488006591797]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 15.0, 3.0, 12.0, 10.0, 13.0, 15.0, 22.0, 21.0, 40.0, 23.0, 31.0, 41.0, 40.0, 35.0, 54.0, 39.0, 56.0, 55.0, 53.0, 52.0, 38.0, 51.0, 41.0, 31.0, 35.0, 31.0, 22.0, 22.0, 15.0, 16.0, 16.0, 10.0, 10.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8254018425941467, -0.7982668876647949, -0.7711318731307983, -0.7439968585968018, -0.71686190366745, -0.6897269487380981, -0.6625919342041016, -0.635456919670105, -0.6083219647407532, -0.5811870098114014, -0.5540519952774048, -0.5269169807434082, -0.4997820258140564, -0.4726470410823822, -0.445512056350708, -0.4183770716190338, -0.3912420868873596, -0.3641071021556854, -0.33697211742401123, -0.30983713269233704, -0.28270214796066284, -0.25556716322898865, -0.22843217849731445, -0.20129719376564026, -0.17416220903396606, -0.14702722430229187, -0.11989223957061768, -0.09275725483894348, -0.06562227010726929, -0.03848728537559509, -0.011352300643920898, 0.015782684087753296, 0.042917728424072266, 0.07005271315574646, 0.09718769788742065, 0.12432268261909485, 0.15145766735076904, 0.17859265208244324, 0.20572763681411743, 0.23286262154579163, 0.2599976062774658, 0.28713259100914, 0.3142675757408142, 0.3414025604724884, 0.3685375452041626, 0.3956725299358368, 0.422807514667511, 0.4499424993991852, 0.4770774841308594, 0.504212498664856, 0.5313474535942078, 0.5584824085235596, 0.5856174230575562, 0.6127524375915527, 0.6398873925209045, 0.6670223474502563, 0.6941573619842529, 0.7212923765182495, 0.7484273314476013, 0.7755622863769531, 0.8026973009109497, 0.8298323154449463, 0.8569672703742981, 0.8841022253036499, 0.9112372398376465]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 8.0, 8.0, 6.0, 6.0, 16.0, 18.0, 29.0, 45.0, 58.0, 63.0, 130.0, 157.0, 195.0, 363.0, 551.0, 836.0, 1379.0, 2377.0, 4430.0, 8048.0, 16741.0, 37775.0, 101033.0, 321511.0, 357503.0, 114955.0, 41939.0, 18208.0, 8847.0, 4687.0, 2511.0, 1451.0, 905.0, 576.0, 378.0, 246.0, 158.0, 117.0, 83.0, 58.0, 42.0, 37.0, 18.0, 16.0, 11.0, 6.0, 8.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.0625, -1.028289794921875, -0.99407958984375, -0.959869384765625, -0.9256591796875, -0.891448974609375, -0.85723876953125, -0.823028564453125, -0.788818359375, -0.754608154296875, -0.72039794921875, -0.686187744140625, -0.6519775390625, -0.617767333984375, -0.58355712890625, -0.549346923828125, -0.51513671875, -0.480926513671875, -0.44671630859375, -0.412506103515625, -0.3782958984375, -0.344085693359375, -0.30987548828125, -0.275665283203125, -0.241455078125, -0.207244873046875, -0.17303466796875, -0.138824462890625, -0.1046142578125, -0.070404052734375, -0.03619384765625, -0.001983642578125, 0.0322265625, 0.066436767578125, 0.10064697265625, 0.134857177734375, 0.1690673828125, 0.203277587890625, 0.23748779296875, 0.271697998046875, 0.305908203125, 0.340118408203125, 0.37432861328125, 0.408538818359375, 0.4427490234375, 0.476959228515625, 0.51116943359375, 0.545379638671875, 0.57958984375, 0.613800048828125, 0.64801025390625, 0.682220458984375, 0.7164306640625, 0.750640869140625, 0.78485107421875, 0.819061279296875, 0.853271484375, 0.887481689453125, 0.92169189453125, 0.955902099609375, 0.9901123046875, 1.024322509765625, 1.05853271484375, 1.092742919921875, 1.126953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 8.0, 6.0, 12.0, 13.0, 7.0, 15.0, 25.0, 23.0, 29.0, 29.0, 36.0, 35.0, 33.0, 49.0, 63.0, 56.0, 51.0, 63.0, 71.0, 50.0, 53.0, 46.0, 28.0, 42.0, 29.0, 14.0, 18.0, 17.0, 11.0, 10.0, 14.0, 9.0, 4.0, 5.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.763671875, -0.739715576171875, -0.71575927734375, -0.691802978515625, -0.6678466796875, -0.643890380859375, -0.61993408203125, -0.595977783203125, -0.572021484375, -0.548065185546875, -0.52410888671875, -0.500152587890625, -0.4761962890625, -0.452239990234375, -0.42828369140625, -0.404327392578125, -0.38037109375, -0.356414794921875, -0.33245849609375, -0.308502197265625, -0.2845458984375, -0.260589599609375, -0.23663330078125, -0.212677001953125, -0.188720703125, -0.164764404296875, -0.14080810546875, -0.116851806640625, -0.0928955078125, -0.068939208984375, -0.04498291015625, -0.021026611328125, 0.0029296875, 0.026885986328125, 0.05084228515625, 0.074798583984375, 0.0987548828125, 0.122711181640625, 0.14666748046875, 0.170623779296875, 0.194580078125, 0.218536376953125, 0.24249267578125, 0.266448974609375, 0.2904052734375, 0.314361572265625, 0.33831787109375, 0.362274169921875, 0.38623046875, 0.410186767578125, 0.43414306640625, 0.458099365234375, 0.4820556640625, 0.506011962890625, 0.52996826171875, 0.553924560546875, 0.577880859375, 0.601837158203125, 0.62579345703125, 0.649749755859375, 0.6737060546875, 0.697662353515625, 0.72161865234375, 0.745574951171875, 0.76953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 7.0, 10.0, 16.0, 16.0, 38.0, 52.0, 77.0, 148.0, 259.0, 515.0, 1262.0, 3791.0, 17940.0, 218053.0, 747979.0, 47726.0, 7227.0, 1891.0, 750.0, 352.0, 179.0, 110.0, 48.0, 42.0, 24.0, 14.0, 8.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.2064208984375, -3.100341796875, -2.9942626953125, -2.88818359375, -2.7821044921875, -2.676025390625, -2.5699462890625, -2.4638671875, -2.3577880859375, -2.251708984375, -2.1456298828125, -2.03955078125, -1.9334716796875, -1.827392578125, -1.7213134765625, -1.615234375, -1.5091552734375, -1.403076171875, -1.2969970703125, -1.19091796875, -1.0848388671875, -0.978759765625, -0.8726806640625, -0.7666015625, -0.6605224609375, -0.554443359375, -0.4483642578125, -0.34228515625, -0.2362060546875, -0.130126953125, -0.0240478515625, 0.08203125, 0.1881103515625, 0.294189453125, 0.4002685546875, 0.50634765625, 0.6124267578125, 0.718505859375, 0.8245849609375, 0.9306640625, 1.0367431640625, 1.142822265625, 1.2489013671875, 1.35498046875, 1.4610595703125, 1.567138671875, 1.6732177734375, 1.779296875, 1.8853759765625, 1.991455078125, 2.0975341796875, 2.20361328125, 2.3096923828125, 2.415771484375, 2.5218505859375, 2.6279296875, 2.7340087890625, 2.840087890625, 2.9461669921875, 3.05224609375, 3.1583251953125, 3.264404296875, 3.3704833984375, 3.4765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 13.0, 22.0, 39.0, 48.0, 64.0, 65.0, 82.0, 76.0, 81.0, 98.0, 71.0, 71.0, 59.0, 58.0, 38.0, 24.0, 22.0, 11.0, 11.0, 11.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.258544921875, -5.07177734375, -4.885009765625, -4.6982421875, -4.511474609375, -4.32470703125, -4.137939453125, -3.951171875, -3.764404296875, -3.57763671875, -3.390869140625, -3.2041015625, -3.017333984375, -2.83056640625, -2.643798828125, -2.45703125, -2.270263671875, -2.08349609375, -1.896728515625, -1.7099609375, -1.523193359375, -1.33642578125, -1.149658203125, -0.962890625, -0.776123046875, -0.58935546875, -0.402587890625, -0.2158203125, -0.029052734375, 0.15771484375, 0.344482421875, 0.53125, 0.718017578125, 0.90478515625, 1.091552734375, 1.2783203125, 1.465087890625, 1.65185546875, 1.838623046875, 2.025390625, 2.212158203125, 2.39892578125, 2.585693359375, 2.7724609375, 2.959228515625, 3.14599609375, 3.332763671875, 3.51953125, 3.706298828125, 3.89306640625, 4.079833984375, 4.2666015625, 4.453369140625, 4.64013671875, 4.826904296875, 5.013671875, 5.200439453125, 5.38720703125, 5.573974609375, 5.7607421875, 5.947509765625, 6.13427734375, 6.321044921875, 6.5078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 3.0, 7.0, 14.0, 15.0, 23.0, 37.0, 65.0, 162.0, 365.0, 1022.0, 3618.0, 31385.0, 991660.0, 15999.0, 2682.0, 858.0, 320.0, 149.0, 67.0, 36.0, 22.0, 17.0, 11.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8115234375, -1.7268524169921875, -1.642181396484375, -1.5575103759765625, -1.47283935546875, -1.3881683349609375, -1.303497314453125, -1.2188262939453125, -1.1341552734375, -1.0494842529296875, -0.964813232421875, -0.8801422119140625, -0.79547119140625, -0.7108001708984375, -0.626129150390625, -0.5414581298828125, -0.456787109375, -0.3721160888671875, -0.287445068359375, -0.2027740478515625, -0.11810302734375, -0.0334320068359375, 0.051239013671875, 0.1359100341796875, 0.2205810546875, 0.3052520751953125, 0.389923095703125, 0.4745941162109375, 0.55926513671875, 0.6439361572265625, 0.728607177734375, 0.8132781982421875, 0.89794921875, 0.9826202392578125, 1.067291259765625, 1.1519622802734375, 1.23663330078125, 1.3213043212890625, 1.405975341796875, 1.4906463623046875, 1.5753173828125, 1.6599884033203125, 1.744659423828125, 1.8293304443359375, 1.91400146484375, 1.9986724853515625, 2.083343505859375, 2.1680145263671875, 2.252685546875, 2.3373565673828125, 2.422027587890625, 2.5066986083984375, 2.59136962890625, 2.6760406494140625, 2.760711669921875, 2.8453826904296875, 2.9300537109375, 3.0147247314453125, 3.099395751953125, 3.1840667724609375, 3.26873779296875, 3.3534088134765625, 3.438079833984375, 3.5227508544921875, 3.607421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 11.0, 9.0, 21.0, 29.0, 29.0, 32.0, 76.0, 138.0, 190.0, 148.0, 112.0, 63.0, 45.0, 23.0, 14.0, 11.0, 9.0, 3.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001690387725830078, -0.00016478542238473892, -0.00016053207218647003, -0.00015627872198820114, -0.00015202537178993225, -0.00014777202159166336, -0.00014351867139339447, -0.00013926532119512558, -0.0001350119709968567, -0.0001307586207985878, -0.0001265052706003189, -0.00012225192040205002, -0.00011799857020378113, -0.00011374522000551224, -0.00010949186980724335, -0.00010523851960897446, -0.00010098516941070557, -9.673181921243668e-05, -9.247846901416779e-05, -8.82251188158989e-05, -8.397176861763e-05, -7.971841841936111e-05, -7.546506822109222e-05, -7.121171802282333e-05, -6.695836782455444e-05, -6.270501762628555e-05, -5.845166742801666e-05, -5.419831722974777e-05, -4.994496703147888e-05, -4.569161683320999e-05, -4.14382666349411e-05, -3.718491643667221e-05, -3.293156623840332e-05, -2.867821604013443e-05, -2.442486584186554e-05, -2.017151564359665e-05, -1.591816544532776e-05, -1.1664815247058868e-05, -7.411465048789978e-06, -3.1581148505210876e-06, 1.0952353477478027e-06, 5.348585546016693e-06, 9.601935744285583e-06, 1.3855285942554474e-05, 1.8108636140823364e-05, 2.2361986339092255e-05, 2.6615336537361145e-05, 3.0868686735630035e-05, 3.5122036933898926e-05, 3.9375387132167816e-05, 4.3628737330436707e-05, 4.78820875287056e-05, 5.213543772697449e-05, 5.638878792524338e-05, 6.064213812351227e-05, 6.489548832178116e-05, 6.914883852005005e-05, 7.340218871831894e-05, 7.765553891658783e-05, 8.190888911485672e-05, 8.616223931312561e-05, 9.04155895113945e-05, 9.466893970966339e-05, 9.892228990793228e-05, 0.00010317564010620117]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 9.0, 6.0, 12.0, 18.0, 43.0, 48.0, 78.0, 141.0, 392.0, 1563.0, 16920.0, 1017246.0, 10140.0, 1238.0, 336.0, 148.0, 72.0, 40.0, 34.0, 18.0, 13.0, 11.0, 10.0, 5.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.224884033203125, -4.11773681640625, -4.010589599609375, -3.9034423828125, -3.796295166015625, -3.68914794921875, -3.582000732421875, -3.474853515625, -3.367706298828125, -3.26055908203125, -3.153411865234375, -3.0462646484375, -2.939117431640625, -2.83197021484375, -2.724822998046875, -2.61767578125, -2.510528564453125, -2.40338134765625, -2.296234130859375, -2.1890869140625, -2.081939697265625, -1.97479248046875, -1.867645263671875, -1.760498046875, -1.653350830078125, -1.54620361328125, -1.439056396484375, -1.3319091796875, -1.224761962890625, -1.11761474609375, -1.010467529296875, -0.9033203125, -0.796173095703125, -0.68902587890625, -0.581878662109375, -0.4747314453125, -0.367584228515625, -0.26043701171875, -0.153289794921875, -0.046142578125, 0.061004638671875, 0.16815185546875, 0.275299072265625, 0.3824462890625, 0.489593505859375, 0.59674072265625, 0.703887939453125, 0.81103515625, 0.918182373046875, 1.02532958984375, 1.132476806640625, 1.2396240234375, 1.346771240234375, 1.45391845703125, 1.561065673828125, 1.668212890625, 1.775360107421875, 1.88250732421875, 1.989654541015625, 2.0968017578125, 2.203948974609375, 2.31109619140625, 2.418243408203125, 2.525390625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 43.0, 271.0, 569.0, 77.0, 21.0, 10.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4453125, -9.260955810546875, -9.07659912109375, -8.892242431640625, -8.7078857421875, -8.523529052734375, -8.33917236328125, -8.154815673828125, -7.970458984375, -7.786102294921875, -7.60174560546875, -7.417388916015625, -7.2330322265625, -7.048675537109375, -6.86431884765625, -6.679962158203125, -6.49560546875, -6.311248779296875, -6.12689208984375, -5.942535400390625, -5.7581787109375, -5.573822021484375, -5.38946533203125, -5.205108642578125, -5.020751953125, -4.836395263671875, -4.65203857421875, -4.467681884765625, -4.2833251953125, -4.098968505859375, -3.91461181640625, -3.730255126953125, -3.5458984375, -3.361541748046875, -3.17718505859375, -2.992828369140625, -2.8084716796875, -2.624114990234375, -2.43975830078125, -2.255401611328125, -2.071044921875, -1.886688232421875, -1.70233154296875, -1.517974853515625, -1.3336181640625, -1.149261474609375, -0.96490478515625, -0.780548095703125, -0.59619140625, -0.411834716796875, -0.22747802734375, -0.043121337890625, 0.1412353515625, 0.325592041015625, 0.50994873046875, 0.694305419921875, 0.878662109375, 1.063018798828125, 1.24737548828125, 1.431732177734375, 1.6160888671875, 1.800445556640625, 1.98480224609375, 2.169158935546875, 2.353515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 29.0, 51.0, 123.0, 256.0, 279.0, 156.0, 55.0, 23.0, 7.0, 5.0, 5.0, 0.0, 0.0, 1.0], "bins": [-61.468017578125, -60.33716583251953, -59.2063102722168, -58.07545852661133, -56.944602966308594, -55.813751220703125, -54.68289566040039, -53.55204391479492, -52.42118835449219, -51.29033660888672, -50.159481048583984, -49.028629302978516, -47.89777374267578, -46.76692199707031, -45.63606643676758, -44.50521469116211, -43.37436294555664, -42.24351119995117, -41.11265563964844, -39.98180389404297, -38.850948333740234, -37.720096588134766, -36.58924102783203, -35.45838928222656, -34.327537536621094, -33.196685791015625, -32.06583023071289, -30.93497657775879, -29.804122924804688, -28.67327117919922, -27.542417526245117, -26.411563873291016, -25.280712127685547, -24.149858474731445, -23.019004821777344, -21.888151168823242, -20.75729751586914, -19.626445770263672, -18.49559211730957, -17.36473846435547, -16.233882904052734, -15.103029251098633, -13.972175598144531, -12.841322898864746, -11.710469245910645, -10.579615592956543, -9.448762893676758, -8.317909240722656, -7.187056541442871, -6.0562028884887695, -4.925349712371826, -3.7944962978363037, -2.6636428833007812, -1.5327892303466797, -0.40193605422973633, 0.728917121887207, 1.8597707748413086, 2.990624189376831, 4.1214776039123535, 5.252330780029297, 6.383184432983398, 7.5140380859375, 8.644891738891602, 9.775744438171387, 10.906598091125488]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 9.0, 7.0, 8.0, 12.0, 20.0, 8.0, 14.0, 21.0, 23.0, 29.0, 32.0, 36.0, 49.0, 42.0, 52.0, 43.0, 54.0, 59.0, 59.0, 47.0, 37.0, 42.0, 36.0, 45.0, 35.0, 30.0, 29.0, 19.0, 26.0, 23.0, 14.0, 6.0, 9.0, 3.0, 2.0, 5.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.26739501953125, -16.66203498840332, -16.056676864624023, -15.451316833496094, -14.84595775604248, -14.240598678588867, -13.635239601135254, -13.02988052368164, -12.424520492553711, -11.819161415100098, -11.213802337646484, -10.608442306518555, -10.003083229064941, -9.397724151611328, -8.792365074157715, -8.187005996704102, -7.581646919250488, -6.976287841796875, -6.3709282875061035, -5.76556921005249, -5.160209655761719, -4.5548505783081055, -3.949491500854492, -3.3441319465637207, -2.7387728691101074, -2.133413553237915, -1.5280543565750122, -0.9226951599121094, -0.317335844039917, 0.2880234718322754, 0.8933825492858887, 1.4987421035766602, 2.1041011810302734, 2.709460496902466, 3.314819812774658, 3.9201788902282715, 4.525538444519043, 5.130897521972656, 5.7362565994262695, 6.341616153717041, 6.946975231170654, 7.552334308624268, 8.157693862915039, 8.763052940368652, 9.368412017822266, 9.973772048950195, 10.579130172729492, 11.184490203857422, 11.789849281311035, 12.395208358764648, 13.000567436218262, 13.605926513671875, 14.211286544799805, 14.816645622253418, 15.422004699707031, 16.02736473083496, 16.632722854614258, 17.238082885742188, 17.843441009521484, 18.448801040649414, 19.05415916442871, 19.65951919555664, 20.264877319335938, 20.870237350463867, 21.475597381591797]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 14.0, 13.0, 22.0, 31.0, 44.0, 66.0, 85.0, 111.0, 196.0, 312.0, 620.0, 1389.0, 5572.0, 4092387.0, 86698.0, 4083.0, 1232.0, 497.0, 293.0, 169.0, 124.0, 85.0, 63.0, 38.0, 39.0, 23.0, 18.0, 7.0, 15.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3671875, -3.27838134765625, -3.1895751953125, -3.10076904296875, -3.011962890625, -2.92315673828125, -2.8343505859375, -2.74554443359375, -2.65673828125, -2.56793212890625, -2.4791259765625, -2.39031982421875, -2.301513671875, -2.21270751953125, -2.1239013671875, -2.03509521484375, -1.9462890625, -1.85748291015625, -1.7686767578125, -1.67987060546875, -1.591064453125, -1.50225830078125, -1.4134521484375, -1.32464599609375, -1.23583984375, -1.14703369140625, -1.0582275390625, -0.96942138671875, -0.880615234375, -0.79180908203125, -0.7030029296875, -0.61419677734375, -0.525390625, -0.43658447265625, -0.3477783203125, -0.25897216796875, -0.170166015625, -0.08135986328125, 0.0074462890625, 0.09625244140625, 0.18505859375, 0.27386474609375, 0.3626708984375, 0.45147705078125, 0.540283203125, 0.62908935546875, 0.7178955078125, 0.80670166015625, 0.8955078125, 0.98431396484375, 1.0731201171875, 1.16192626953125, 1.250732421875, 1.33953857421875, 1.4283447265625, 1.51715087890625, 1.60595703125, 1.69476318359375, 1.7835693359375, 1.87237548828125, 1.961181640625, 2.04998779296875, 2.1387939453125, 2.22760009765625, 2.31640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 8.0, 7.0, 7.0, 16.0, 6.0, 19.0, 24.0, 39.0, 34.0, 57.0, 55.0, 82.0, 70.0, 87.0, 71.0, 74.0, 55.0, 68.0, 49.0, 34.0, 16.0, 22.0, 25.0, 11.0, 16.0, 13.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2237472534179688, -1.1887054443359375, -1.1536636352539062, -1.118621826171875, -1.0835800170898438, -1.0485382080078125, -1.0134963989257812, -0.97845458984375, -0.9434127807617188, -0.9083709716796875, -0.8733291625976562, -0.838287353515625, -0.8032455444335938, -0.7682037353515625, -0.7331619262695312, -0.6981201171875, -0.6630783081054688, -0.6280364990234375, -0.5929946899414062, -0.557952880859375, -0.5229110717773438, -0.4878692626953125, -0.45282745361328125, -0.41778564453125, -0.38274383544921875, -0.3477020263671875, -0.31266021728515625, -0.277618408203125, -0.24257659912109375, -0.2075347900390625, -0.17249298095703125, -0.137451171875, -0.10240936279296875, -0.0673675537109375, -0.03232574462890625, 0.002716064453125, 0.03775787353515625, 0.0727996826171875, 0.10784149169921875, 0.14288330078125, 0.17792510986328125, 0.2129669189453125, 0.24800872802734375, 0.283050537109375, 0.31809234619140625, 0.3531341552734375, 0.38817596435546875, 0.4232177734375, 0.45825958251953125, 0.4933013916015625, 0.5283432006835938, 0.563385009765625, 0.5984268188476562, 0.6334686279296875, 0.6685104370117188, 0.70355224609375, 0.7385940551757812, 0.7736358642578125, 0.8086776733398438, 0.843719482421875, 0.8787612915039062, 0.9138031005859375, 0.9488449096679688, 0.98388671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 13.0, 13.0, 32.0, 26.0, 34.0, 52.0, 88.0, 92.0, 133.0, 203.0, 357.0, 586.0, 1422.0, 3668.0, 14786.0, 4081463.0, 78034.0, 8327.0, 2480.0, 1009.0, 461.0, 272.0, 185.0, 143.0, 100.0, 78.0, 67.0, 42.0, 28.0, 23.0, 16.0, 8.0, 5.0, 5.0, 5.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.07159423828125, -2.0064697265625, -1.94134521484375, -1.876220703125, -1.81109619140625, -1.7459716796875, -1.68084716796875, -1.61572265625, -1.55059814453125, -1.4854736328125, -1.42034912109375, -1.355224609375, -1.29010009765625, -1.2249755859375, -1.15985107421875, -1.0947265625, -1.02960205078125, -0.9644775390625, -0.89935302734375, -0.834228515625, -0.76910400390625, -0.7039794921875, -0.63885498046875, -0.57373046875, -0.50860595703125, -0.4434814453125, -0.37835693359375, -0.313232421875, -0.24810791015625, -0.1829833984375, -0.11785888671875, -0.052734375, 0.01239013671875, 0.0775146484375, 0.14263916015625, 0.207763671875, 0.27288818359375, 0.3380126953125, 0.40313720703125, 0.46826171875, 0.53338623046875, 0.5985107421875, 0.66363525390625, 0.728759765625, 0.79388427734375, 0.8590087890625, 0.92413330078125, 0.9892578125, 1.05438232421875, 1.1195068359375, 1.18463134765625, 1.249755859375, 1.31488037109375, 1.3800048828125, 1.44512939453125, 1.51025390625, 1.57537841796875, 1.6405029296875, 1.70562744140625, 1.770751953125, 1.83587646484375, 1.9010009765625, 1.96612548828125, 2.03125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 23.0, 77.0, 3817.0, 85.0, 27.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23583984375, -0.2169342041015625, -0.198028564453125, -0.1791229248046875, -0.16021728515625, -0.1413116455078125, -0.122406005859375, -0.1035003662109375, -0.0845947265625, -0.0656890869140625, -0.046783447265625, -0.0278778076171875, -0.00897216796875, 0.0099334716796875, 0.028839111328125, 0.0477447509765625, 0.066650390625, 0.0855560302734375, 0.104461669921875, 0.1233673095703125, 0.14227294921875, 0.1611785888671875, 0.180084228515625, 0.1989898681640625, 0.2178955078125, 0.2368011474609375, 0.255706787109375, 0.2746124267578125, 0.29351806640625, 0.3124237060546875, 0.331329345703125, 0.3502349853515625, 0.369140625, 0.3880462646484375, 0.406951904296875, 0.4258575439453125, 0.44476318359375, 0.4636688232421875, 0.482574462890625, 0.5014801025390625, 0.5203857421875, 0.5392913818359375, 0.558197021484375, 0.5771026611328125, 0.59600830078125, 0.6149139404296875, 0.633819580078125, 0.6527252197265625, 0.671630859375, 0.6905364990234375, 0.709442138671875, 0.7283477783203125, 0.74725341796875, 0.7661590576171875, 0.785064697265625, 0.8039703369140625, 0.8228759765625, 0.8417816162109375, 0.860687255859375, 0.8795928955078125, 0.89849853515625, 0.9174041748046875, 0.936309814453125, 0.9552154541015625, 0.97412109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 130.0, 745.0, 118.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.236989974975586, -9.93779468536377, -9.638599395751953, -9.339405059814453, -9.040209770202637, -8.74101448059082, -8.441819190979004, -8.142623901367188, -7.843428611755371, -7.544233322143555, -7.2450385093688965, -6.94584321975708, -6.646647930145264, -6.3474531173706055, -6.048257827758789, -5.749062538146973, -5.4498677253723145, -5.150672435760498, -4.85147762298584, -4.552282333374023, -4.253087043762207, -3.9538919925689697, -3.6546969413757324, -3.355501651763916, -3.0563066005706787, -2.7571115493774414, -2.457916259765625, -2.1587212085723877, -1.8595260381698608, -1.560330867767334, -1.2611358165740967, -0.9619405269622803, -0.662745475769043, -0.3635503351688385, -0.06435519456863403, 0.23483991622924805, 0.5340350866317749, 0.8332302570343018, 1.132425308227539, 1.4316205978393555, 1.7308156490325928, 2.03001070022583, 2.3292059898376465, 2.628401041030884, 2.927596092224121, 3.2267913818359375, 3.525986433029175, 3.825181722640991, 4.1243767738342285, 4.423572063446045, 4.722766876220703, 5.0219621658325195, 5.321157455444336, 5.620352745056152, 5.9195475578308105, 6.218742847442627, 6.517937660217285, 6.817132949829102, 7.11632776260376, 7.415523052215576, 7.714718341827393, 8.01391315460205, 8.313108444213867, 8.612303733825684, 8.9114990234375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 9.0, 5.0, 8.0, 11.0, 18.0, 16.0, 21.0, 27.0, 25.0, 30.0, 37.0, 36.0, 43.0, 40.0, 44.0, 54.0, 49.0, 54.0, 57.0, 51.0, 39.0, 40.0, 34.0, 35.0, 28.0, 35.0, 25.0, 26.0, 20.0, 11.0, 26.0, 14.0, 16.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9321097731590271, -0.8937767744064331, -0.8554438352584839, -0.8171108365058899, -0.7787778973579407, -0.7404448986053467, -0.7021119594573975, -0.6637789607048035, -0.6254459619522095, -0.5871129631996155, -0.5487800240516663, -0.5104470252990723, -0.47211408615112305, -0.43378108739852905, -0.39544811844825745, -0.35711514949798584, -0.3187822103500366, -0.280449241399765, -0.2421162724494934, -0.2037832885980606, -0.165450319647789, -0.1271173506975174, -0.0887843668460846, -0.05045139789581299, -0.012118428945541382, 0.026214543730020523, 0.06454751640558243, 0.10288049280643463, 0.14121346175670624, 0.17954643070697784, 0.21787941455841064, 0.25621238350868225, 0.29454541206359863, 0.33287838101387024, 0.37121134996414185, 0.40954434871673584, 0.44787728786468506, 0.48621028661727905, 0.524543285369873, 0.5628762245178223, 0.6012091636657715, 0.6395421624183655, 0.6778751015663147, 0.7162081003189087, 0.7545410394668579, 0.7928740382194519, 0.8312070369720459, 0.8695399761199951, 0.9078729748725891, 0.9462059736251831, 0.9845389127731323, 1.0228718519210815, 1.0612049102783203, 1.0995378494262695, 1.1378707885742188, 1.176203727722168, 1.2145367860794067, 1.252869725227356, 1.2912027835845947, 1.329535722732544, 1.3678686618804932, 1.4062016010284424, 1.4445346593856812, 1.4828675985336304, 1.5212005376815796]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 7.0, 6.0, 13.0, 19.0, 30.0, 40.0, 59.0, 67.0, 132.0, 199.0, 289.0, 474.0, 860.0, 1676.0, 3304.0, 7881.0, 21945.0, 83774.0, 503186.0, 337929.0, 57257.0, 16906.0, 6379.0, 2828.0, 1319.0, 749.0, 454.0, 254.0, 160.0, 101.0, 76.0, 62.0, 34.0, 19.0, 22.0, 10.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.16796875, -2.103973388671875, -2.03997802734375, -1.975982666015625, -1.9119873046875, -1.847991943359375, -1.78399658203125, -1.720001220703125, -1.656005859375, -1.592010498046875, -1.52801513671875, -1.464019775390625, -1.4000244140625, -1.336029052734375, -1.27203369140625, -1.208038330078125, -1.14404296875, -1.080047607421875, -1.01605224609375, -0.952056884765625, -0.8880615234375, -0.824066162109375, -0.76007080078125, -0.696075439453125, -0.632080078125, -0.568084716796875, -0.50408935546875, -0.440093994140625, -0.3760986328125, -0.312103271484375, -0.24810791015625, -0.184112548828125, -0.1201171875, -0.056121826171875, 0.00787353515625, 0.071868896484375, 0.1358642578125, 0.199859619140625, 0.26385498046875, 0.327850341796875, 0.391845703125, 0.455841064453125, 0.51983642578125, 0.583831787109375, 0.6478271484375, 0.711822509765625, 0.77581787109375, 0.839813232421875, 0.90380859375, 0.967803955078125, 1.03179931640625, 1.095794677734375, 1.1597900390625, 1.223785400390625, 1.28778076171875, 1.351776123046875, 1.415771484375, 1.479766845703125, 1.54376220703125, 1.607757568359375, 1.6717529296875, 1.735748291015625, 1.79974365234375, 1.863739013671875, 1.927734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 10.0, 7.0, 5.0, 20.0, 18.0, 27.0, 26.0, 30.0, 52.0, 55.0, 67.0, 72.0, 77.0, 73.0, 67.0, 68.0, 60.0, 55.0, 44.0, 30.0, 21.0, 25.0, 14.0, 19.0, 11.0, 13.0, 10.0, 2.0, 2.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2147293090820312, -1.1804351806640625, -1.1461410522460938, -1.111846923828125, -1.0775527954101562, -1.0432586669921875, -1.0089645385742188, -0.97467041015625, -0.9403762817382812, -0.9060821533203125, -0.8717880249023438, -0.837493896484375, -0.8031997680664062, -0.7689056396484375, -0.7346115112304688, -0.7003173828125, -0.6660232543945312, -0.6317291259765625, -0.5974349975585938, -0.563140869140625, -0.5288467407226562, -0.4945526123046875, -0.46025848388671875, -0.42596435546875, -0.39167022705078125, -0.3573760986328125, -0.32308197021484375, -0.288787841796875, -0.25449371337890625, -0.2201995849609375, -0.18590545654296875, -0.151611328125, -0.11731719970703125, -0.0830230712890625, -0.04872894287109375, -0.014434814453125, 0.01985931396484375, 0.0541534423828125, 0.08844757080078125, 0.12274169921875, 0.15703582763671875, 0.1913299560546875, 0.22562408447265625, 0.259918212890625, 0.29421234130859375, 0.3285064697265625, 0.36280059814453125, 0.3970947265625, 0.43138885498046875, 0.4656829833984375, 0.49997711181640625, 0.534271240234375, 0.5685653686523438, 0.6028594970703125, 0.6371536254882812, 0.67144775390625, 0.7057418823242188, 0.7400360107421875, 0.7743301391601562, 0.808624267578125, 0.8429183959960938, 0.8772125244140625, 0.9115066528320312, 0.94580078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 15.0, 27.0, 38.0, 70.0, 124.0, 235.0, 432.0, 789.0, 1716.0, 4406.0, 19612.0, 333780.0, 649232.0, 28537.0, 5559.0, 1958.0, 901.0, 470.0, 247.0, 133.0, 86.0, 64.0, 37.0, 16.0, 13.0, 9.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.619903564453125, -3.50347900390625, -3.387054443359375, -3.2706298828125, -3.154205322265625, -3.03778076171875, -2.921356201171875, -2.804931640625, -2.688507080078125, -2.57208251953125, -2.455657958984375, -2.3392333984375, -2.222808837890625, -2.10638427734375, -1.989959716796875, -1.87353515625, -1.757110595703125, -1.64068603515625, -1.524261474609375, -1.4078369140625, -1.291412353515625, -1.17498779296875, -1.058563232421875, -0.942138671875, -0.825714111328125, -0.70928955078125, -0.592864990234375, -0.4764404296875, -0.360015869140625, -0.24359130859375, -0.127166748046875, -0.0107421875, 0.105682373046875, 0.22210693359375, 0.338531494140625, 0.4549560546875, 0.571380615234375, 0.68780517578125, 0.804229736328125, 0.920654296875, 1.037078857421875, 1.15350341796875, 1.269927978515625, 1.3863525390625, 1.502777099609375, 1.61920166015625, 1.735626220703125, 1.85205078125, 1.968475341796875, 2.08489990234375, 2.201324462890625, 2.3177490234375, 2.434173583984375, 2.55059814453125, 2.667022705078125, 2.783447265625, 2.899871826171875, 3.01629638671875, 3.132720947265625, 3.2491455078125, 3.365570068359375, 3.48199462890625, 3.598419189453125, 3.71484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 5.0, 10.0, 7.0, 15.0, 18.0, 23.0, 32.0, 38.0, 41.0, 62.0, 57.0, 53.0, 64.0, 63.0, 79.0, 63.0, 62.0, 62.0, 44.0, 49.0, 36.0, 35.0, 20.0, 16.0, 12.0, 6.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.62005615234375, -4.4471435546875, -4.27423095703125, -4.101318359375, -3.92840576171875, -3.7554931640625, -3.58258056640625, -3.40966796875, -3.23675537109375, -3.0638427734375, -2.89093017578125, -2.718017578125, -2.54510498046875, -2.3721923828125, -2.19927978515625, -2.0263671875, -1.85345458984375, -1.6805419921875, -1.50762939453125, -1.334716796875, -1.16180419921875, -0.9888916015625, -0.81597900390625, -0.64306640625, -0.47015380859375, -0.2972412109375, -0.12432861328125, 0.048583984375, 0.22149658203125, 0.3944091796875, 0.56732177734375, 0.740234375, 0.91314697265625, 1.0860595703125, 1.25897216796875, 1.431884765625, 1.60479736328125, 1.7777099609375, 1.95062255859375, 2.12353515625, 2.29644775390625, 2.4693603515625, 2.64227294921875, 2.815185546875, 2.98809814453125, 3.1610107421875, 3.33392333984375, 3.5068359375, 3.67974853515625, 3.8526611328125, 4.02557373046875, 4.198486328125, 4.37139892578125, 4.5443115234375, 4.71722412109375, 4.89013671875, 5.06304931640625, 5.2359619140625, 5.40887451171875, 5.581787109375, 5.75469970703125, 5.9276123046875, 6.10052490234375, 6.2734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 11.0, 14.0, 32.0, 102.0, 341.0, 1446.0, 13347.0, 1020230.0, 11188.0, 1394.0, 271.0, 92.0, 50.0, 13.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.53125, -6.36578369140625, -6.2003173828125, -6.03485107421875, -5.869384765625, -5.70391845703125, -5.5384521484375, -5.37298583984375, -5.20751953125, -5.04205322265625, -4.8765869140625, -4.71112060546875, -4.545654296875, -4.38018798828125, -4.2147216796875, -4.04925537109375, -3.8837890625, -3.71832275390625, -3.5528564453125, -3.38739013671875, -3.221923828125, -3.05645751953125, -2.8909912109375, -2.72552490234375, -2.56005859375, -2.39459228515625, -2.2291259765625, -2.06365966796875, -1.898193359375, -1.73272705078125, -1.5672607421875, -1.40179443359375, -1.236328125, -1.07086181640625, -0.9053955078125, -0.73992919921875, -0.574462890625, -0.40899658203125, -0.2435302734375, -0.07806396484375, 0.08740234375, 0.25286865234375, 0.4183349609375, 0.58380126953125, 0.749267578125, 0.91473388671875, 1.0802001953125, 1.24566650390625, 1.4111328125, 1.57659912109375, 1.7420654296875, 1.90753173828125, 2.072998046875, 2.23846435546875, 2.4039306640625, 2.56939697265625, 2.73486328125, 2.90032958984375, 3.0657958984375, 3.23126220703125, 3.396728515625, 3.56219482421875, 3.7276611328125, 3.89312744140625, 4.05859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 9.0, 7.0, 16.0, 33.0, 70.0, 189.0, 274.0, 205.0, 112.0, 45.0, 12.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022149085998535156, -0.0002125091850757599, -0.0002035275101661682, -0.00019454583525657654, -0.00018556416034698486, -0.0001765824854373932, -0.00016760081052780151, -0.00015861913561820984, -0.00014963746070861816, -0.0001406557857990265, -0.00013167411088943481, -0.00012269243597984314, -0.00011371076107025146, -0.00010472908616065979, -9.574741125106812e-05, -8.676573634147644e-05, -7.778406143188477e-05, -6.880238652229309e-05, -5.9820711612701416e-05, -5.083903670310974e-05, -4.1857361793518066e-05, -3.287568688392639e-05, -2.3894011974334717e-05, -1.4912337064743042e-05, -5.930662155151367e-06, 3.0510127544403076e-06, 1.2032687664031982e-05, 2.1014362573623657e-05, 2.9996037483215332e-05, 3.897771239280701e-05, 4.795938730239868e-05, 5.6941062211990356e-05, 6.592273712158203e-05, 7.49044120311737e-05, 8.388608694076538e-05, 9.286776185035706e-05, 0.00010184943675994873, 0.0001108311116695404, 0.00011981278657913208, 0.00012879446148872375, 0.00013777613639831543, 0.0001467578113079071, 0.00015573948621749878, 0.00016472116112709045, 0.00017370283603668213, 0.0001826845109462738, 0.00019166618585586548, 0.00020064786076545715, 0.00020962953567504883, 0.0002186112105846405, 0.00022759288549423218, 0.00023657456040382385, 0.00024555623531341553, 0.0002545379102230072, 0.0002635195851325989, 0.00027250126004219055, 0.0002814829349517822, 0.0002904646098613739, 0.0002994462847709656, 0.00030842795968055725, 0.0003174096345901489, 0.0003263913094997406, 0.0003353729844093323, 0.00034435465931892395, 0.0003533363342285156]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 11.0, 4.0, 13.0, 12.0, 16.0, 39.0, 46.0, 73.0, 144.0, 279.0, 543.0, 1326.0, 3478.0, 12171.0, 778799.0, 237282.0, 9244.0, 2793.0, 1156.0, 551.0, 234.0, 128.0, 63.0, 59.0, 27.0, 21.0, 13.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.9482421875, -1.873046875, -1.7978515625, -1.72265625, -1.6474609375, -1.572265625, -1.4970703125, -1.421875, -1.3466796875, -1.271484375, -1.1962890625, -1.12109375, -1.0458984375, -0.970703125, -0.8955078125, -0.8203125, -0.7451171875, -0.669921875, -0.5947265625, -0.51953125, -0.4443359375, -0.369140625, -0.2939453125, -0.21875, -0.1435546875, -0.068359375, 0.0068359375, 0.08203125, 0.1572265625, 0.232421875, 0.3076171875, 0.3828125, 0.4580078125, 0.533203125, 0.6083984375, 0.68359375, 0.7587890625, 0.833984375, 0.9091796875, 0.984375, 1.0595703125, 1.134765625, 1.2099609375, 1.28515625, 1.3603515625, 1.435546875, 1.5107421875, 1.5859375, 1.6611328125, 1.736328125, 1.8115234375, 1.88671875, 1.9619140625, 2.037109375, 2.1123046875, 2.1875, 2.2626953125, 2.337890625, 2.4130859375, 2.48828125, 2.5634765625, 2.638671875, 2.7138671875, 2.7890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 9.0, 23.0, 92.0, 354.0, 331.0, 94.0, 19.0, 12.0, 9.0, 5.0, 3.0, 2.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.859222412109375, -2.70867919921875, -2.558135986328125, -2.4075927734375, -2.257049560546875, -2.10650634765625, -1.955963134765625, -1.805419921875, -1.654876708984375, -1.50433349609375, -1.353790283203125, -1.2032470703125, -1.052703857421875, -0.90216064453125, -0.751617431640625, -0.60107421875, -0.450531005859375, -0.29998779296875, -0.149444580078125, 0.0010986328125, 0.151641845703125, 0.30218505859375, 0.452728271484375, 0.603271484375, 0.753814697265625, 0.90435791015625, 1.054901123046875, 1.2054443359375, 1.355987548828125, 1.50653076171875, 1.657073974609375, 1.8076171875, 1.958160400390625, 2.10870361328125, 2.259246826171875, 2.4097900390625, 2.560333251953125, 2.71087646484375, 2.861419677734375, 3.011962890625, 3.162506103515625, 3.31304931640625, 3.463592529296875, 3.6141357421875, 3.764678955078125, 3.91522216796875, 4.065765380859375, 4.21630859375, 4.366851806640625, 4.51739501953125, 4.667938232421875, 4.8184814453125, 4.969024658203125, 5.11956787109375, 5.270111083984375, 5.420654296875, 5.571197509765625, 5.72174072265625, 5.872283935546875, 6.0228271484375, 6.173370361328125, 6.32391357421875, 6.474456787109375, 6.625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 12.0, 41.0, 132.0, 289.0, 278.0, 128.0, 70.0, 29.0, 19.0, 9.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.160404205322266, -25.91027069091797, -24.660137176513672, -23.410003662109375, -22.159870147705078, -20.90973663330078, -19.659605026245117, -18.40947151184082, -17.159337997436523, -15.909204483032227, -14.65907096862793, -13.40893840789795, -12.158804893493652, -10.908671379089355, -9.658538818359375, -8.408405303955078, -7.158271789550781, -5.908138275146484, -4.658005237579346, -3.407871961593628, -2.15773868560791, -0.9076051712036133, 0.3425278663635254, 1.592660903930664, 2.842794418334961, 4.092927932739258, 5.3430609703063965, 6.593194007873535, 7.843327522277832, 9.093461036682129, 10.34359359741211, 11.593727111816406, 12.843864440917969, 14.093997955322266, 15.344131469726562, 16.59426498413086, 17.844398498535156, 19.094532012939453, 20.344663619995117, 21.594797134399414, 22.84493064880371, 24.095064163208008, 25.345197677612305, 26.5953311920166, 27.845462799072266, 29.095596313476562, 30.34572982788086, 31.595863342285156, 32.84599685668945, 34.09613037109375, 35.34626388549805, 36.596397399902344, 37.84653091430664, 39.09666442871094, 40.346797943115234, 41.59693145751953, 42.84706115722656, 44.09719467163086, 45.347328186035156, 46.59746170043945, 47.84759521484375, 49.09772872924805, 50.347862243652344, 51.597991943359375, 52.84812927246094]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 7.0, 6.0, 12.0, 10.0, 17.0, 8.0, 17.0, 12.0, 19.0, 18.0, 24.0, 24.0, 21.0, 31.0, 22.0, 50.0, 42.0, 45.0, 40.0, 42.0, 30.0, 44.0, 47.0, 45.0, 40.0, 44.0, 37.0, 31.0, 30.0, 28.0, 31.0, 13.0, 16.0, 21.0, 18.0, 18.0, 10.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.617327690124512, -15.052301406860352, -14.487274169921875, -13.922247886657715, -13.357221603393555, -12.792194366455078, -12.227168083190918, -11.662141799926758, -11.097114562988281, -10.532088279724121, -9.967061042785645, -9.402034759521484, -8.837007522583008, -8.271981239318848, -7.7069549560546875, -7.141928195953369, -6.576901435852051, -6.011874675750732, -5.446847915649414, -4.881821632385254, -4.3167948722839355, -3.751768112182617, -3.186741590499878, -2.6217150688171387, -2.0566883087158203, -1.4916616678237915, -0.9266350269317627, -0.3616083860397339, 0.20341825485229492, 0.7684450149536133, 1.3334715366363525, 1.8984980583190918, 2.4635257720947266, 3.028552532196045, 3.593579053878784, 4.158605575561523, 4.723632335662842, 5.28865909576416, 5.85368537902832, 6.418712139129639, 6.983738899230957, 7.548765659332275, 8.113792419433594, 8.678818702697754, 9.243844985961914, 9.80887222290039, 10.37389850616455, 10.938924789428711, 11.503952026367188, 12.068978309631348, 12.634005546569824, 13.199031829833984, 13.764059066772461, 14.329085350036621, 14.894111633300781, 15.459138870239258, 16.024166107177734, 16.58919334411621, 17.154218673706055, 17.71924591064453, 18.284273147583008, 18.849300384521484, 19.414325714111328, 19.979352951049805, 20.54437828063965]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 9.0, 6.0, 4.0, 9.0, 13.0, 10.0, 18.0, 26.0, 39.0, 54.0, 81.0, 136.0, 233.0, 425.0, 1018.0, 3183.0, 28463.0, 4143983.0, 12394.0, 2365.0, 814.0, 367.0, 212.0, 131.0, 86.0, 55.0, 25.0, 21.0, 18.0, 19.0, 17.0, 6.0, 15.0, 10.0, 3.0, 4.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.88714599609375, -3.7547607421875, -3.62237548828125, -3.489990234375, -3.35760498046875, -3.2252197265625, -3.09283447265625, -2.96044921875, -2.82806396484375, -2.6956787109375, -2.56329345703125, -2.430908203125, -2.29852294921875, -2.1661376953125, -2.03375244140625, -1.9013671875, -1.76898193359375, -1.6365966796875, -1.50421142578125, -1.371826171875, -1.23944091796875, -1.1070556640625, -0.97467041015625, -0.84228515625, -0.70989990234375, -0.5775146484375, -0.44512939453125, -0.312744140625, -0.18035888671875, -0.0479736328125, 0.08441162109375, 0.216796875, 0.34918212890625, 0.4815673828125, 0.61395263671875, 0.746337890625, 0.87872314453125, 1.0111083984375, 1.14349365234375, 1.27587890625, 1.40826416015625, 1.5406494140625, 1.67303466796875, 1.805419921875, 1.93780517578125, 2.0701904296875, 2.20257568359375, 2.3349609375, 2.46734619140625, 2.5997314453125, 2.73211669921875, 2.864501953125, 2.99688720703125, 3.1292724609375, 3.26165771484375, 3.39404296875, 3.52642822265625, 3.6588134765625, 3.79119873046875, 3.923583984375, 4.05596923828125, 4.1883544921875, 4.32073974609375, 4.453125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 8.0, 14.0, 16.0, 27.0, 34.0, 34.0, 51.0, 48.0, 59.0, 78.0, 67.0, 70.0, 81.0, 73.0, 63.0, 54.0, 42.0, 34.0, 30.0, 22.0, 12.0, 16.0, 11.0, 9.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8544921875, -0.81842041015625, -0.7823486328125, -0.74627685546875, -0.710205078125, -0.67413330078125, -0.6380615234375, -0.60198974609375, -0.56591796875, -0.52984619140625, -0.4937744140625, -0.45770263671875, -0.421630859375, -0.38555908203125, -0.3494873046875, -0.31341552734375, -0.27734375, -0.24127197265625, -0.2052001953125, -0.16912841796875, -0.133056640625, -0.09698486328125, -0.0609130859375, -0.02484130859375, 0.01123046875, 0.04730224609375, 0.0833740234375, 0.11944580078125, 0.155517578125, 0.19158935546875, 0.2276611328125, 0.26373291015625, 0.2998046875, 0.33587646484375, 0.3719482421875, 0.40802001953125, 0.444091796875, 0.48016357421875, 0.5162353515625, 0.55230712890625, 0.58837890625, 0.62445068359375, 0.6605224609375, 0.69659423828125, 0.732666015625, 0.76873779296875, 0.8048095703125, 0.84088134765625, 0.876953125, 0.91302490234375, 0.9490966796875, 0.98516845703125, 1.021240234375, 1.05731201171875, 1.0933837890625, 1.12945556640625, 1.16552734375, 1.20159912109375, 1.2376708984375, 1.27374267578125, 1.309814453125, 1.34588623046875, 1.3819580078125, 1.41802978515625, 1.4541015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 9.0, 7.0, 15.0, 18.0, 17.0, 37.0, 34.0, 38.0, 60.0, 69.0, 105.0, 117.0, 191.0, 247.0, 299.0, 385.0, 897.0, 10436.0, 4175136.0, 4050.0, 650.0, 328.0, 256.0, 181.0, 184.0, 106.0, 87.0, 80.0, 60.0, 39.0, 28.0, 22.0, 22.0, 18.0, 10.0, 11.0, 11.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.63671875, -11.265625, -10.89453125, -10.5234375, -10.15234375, -9.78125, -9.41015625, -9.0390625, -8.66796875, -8.296875, -7.92578125, -7.5546875, -7.18359375, -6.8125, -6.44140625, -6.0703125, -5.69921875, -5.328125, -4.95703125, -4.5859375, -4.21484375, -3.84375, -3.47265625, -3.1015625, -2.73046875, -2.359375, -1.98828125, -1.6171875, -1.24609375, -0.875, -0.50390625, -0.1328125, 0.23828125, 0.609375, 0.98046875, 1.3515625, 1.72265625, 2.09375, 2.46484375, 2.8359375, 3.20703125, 3.578125, 3.94921875, 4.3203125, 4.69140625, 5.0625, 5.43359375, 5.8046875, 6.17578125, 6.546875, 6.91796875, 7.2890625, 7.66015625, 8.03125, 8.40234375, 8.7734375, 9.14453125, 9.515625, 9.88671875, 10.2578125, 10.62890625, 11.0, 11.37109375, 11.7421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 25.0, 4003.0, 40.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.640625, -13.37078857421875, -13.1009521484375, -12.83111572265625, -12.561279296875, -12.29144287109375, -12.0216064453125, -11.75177001953125, -11.48193359375, -11.21209716796875, -10.9422607421875, -10.67242431640625, -10.402587890625, -10.13275146484375, -9.8629150390625, -9.59307861328125, -9.3232421875, -9.05340576171875, -8.7835693359375, -8.51373291015625, -8.243896484375, -7.97406005859375, -7.7042236328125, -7.43438720703125, -7.16455078125, -6.89471435546875, -6.6248779296875, -6.35504150390625, -6.085205078125, -5.81536865234375, -5.5455322265625, -5.27569580078125, -5.005859375, -4.73602294921875, -4.4661865234375, -4.19635009765625, -3.926513671875, -3.65667724609375, -3.3868408203125, -3.11700439453125, -2.84716796875, -2.57733154296875, -2.3074951171875, -2.03765869140625, -1.767822265625, -1.49798583984375, -1.2281494140625, -0.95831298828125, -0.6884765625, -0.41864013671875, -0.1488037109375, 0.12103271484375, 0.390869140625, 0.66070556640625, 0.9305419921875, 1.20037841796875, 1.47021484375, 1.74005126953125, 2.0098876953125, 2.27972412109375, 2.549560546875, 2.81939697265625, 3.0892333984375, 3.35906982421875, 3.62890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 24.0, 55.0, 184.0, 438.0, 212.0, 62.0, 12.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.379966735839844, -33.69788360595703, -33.01579666137695, -32.33371353149414, -31.651628494262695, -30.96954345703125, -30.287460327148438, -29.605375289916992, -28.923290252685547, -28.2412052154541, -27.55912208557129, -26.877037048339844, -26.1949520111084, -25.512866973876953, -24.83078384399414, -24.148698806762695, -23.466615676879883, -22.784530639648438, -22.102447509765625, -21.42036247253418, -20.738277435302734, -20.056194305419922, -19.374109268188477, -18.69202423095703, -18.00994110107422, -17.327856063842773, -16.64577293395996, -15.963687896728516, -15.28160285949707, -14.599518775939941, -13.917434692382812, -13.235349655151367, -12.553266525268555, -11.871182441711426, -11.18909740447998, -10.507013320922852, -9.824928283691406, -9.142844200134277, -8.460760116577148, -7.778675556182861, -7.096590995788574, -6.414506435394287, -5.732421875, -5.050337791442871, -4.368253231048584, -3.686168670654297, -3.004084587097168, -2.322000026702881, -1.6399154663085938, -0.9578310251235962, -0.27574658393859863, 0.4063377380371094, 1.0884222984313965, 1.7705068588256836, 2.4525909423828125, 3.1346755027770996, 3.8167600631713867, 4.498844623565674, 5.180929183959961, 5.86301326751709, 6.545097827911377, 7.227182388305664, 7.909266471862793, 8.591350555419922, 9.273435592651367]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 17.0, 20.0, 38.0, 64.0, 90.0, 123.0, 163.0, 140.0, 114.0, 69.0, 49.0, 41.0, 20.0, 17.0, 5.0, 9.0, 0.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28121566772461, -20.547666549682617, -19.814117431640625, -19.08056640625, -18.347017288208008, -17.613468170166016, -16.879919052124023, -16.14636993408203, -15.412819862365723, -14.67927074432373, -13.945720672607422, -13.21217155456543, -12.478622436523438, -11.745072364807129, -11.011523246765137, -10.277973175048828, -9.544424057006836, -8.810874938964844, -8.077324867248535, -7.343775749206543, -6.610226154327393, -5.876676559448242, -5.14312744140625, -4.4095778465271, -3.676028251647949, -2.942478656768799, -2.2089293003082275, -1.4753799438476562, -0.7418303489685059, -0.008280754089355469, 0.7252683639526367, 1.458817958831787, 2.1923694610595703, 2.9259190559387207, 3.659468412399292, 4.393017768859863, 5.126567363739014, 5.860116958618164, 6.593666076660156, 7.327215671539307, 8.060765266418457, 8.79431438446045, 9.527864456176758, 10.26141357421875, 10.994962692260742, 11.72851276397705, 12.462061882019043, 13.195611953735352, 13.929161071777344, 14.662710189819336, 15.396260261535645, 16.129810333251953, 16.863359451293945, 17.596908569335938, 18.33045768737793, 19.064006805419922, 19.797557830810547, 20.53110694885254, 21.26465606689453, 21.998207092285156, 22.73175621032715, 23.46530532836914, 24.198854446411133, 24.932403564453125, 25.665952682495117]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 18.0, 19.0, 40.0, 55.0, 107.0, 178.0, 336.0, 652.0, 1696.0, 5319.0, 22103.0, 151814.0, 714412.0, 124756.0, 19520.0, 4613.0, 1502.0, 676.0, 306.0, 157.0, 102.0, 62.0, 32.0, 22.0, 19.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.9449462890625, -2.844970703125, -2.7449951171875, -2.64501953125, -2.5450439453125, -2.445068359375, -2.3450927734375, -2.2451171875, -2.1451416015625, -2.045166015625, -1.9451904296875, -1.84521484375, -1.7452392578125, -1.645263671875, -1.5452880859375, -1.4453125, -1.3453369140625, -1.245361328125, -1.1453857421875, -1.04541015625, -0.9454345703125, -0.845458984375, -0.7454833984375, -0.6455078125, -0.5455322265625, -0.445556640625, -0.3455810546875, -0.24560546875, -0.1456298828125, -0.045654296875, 0.0543212890625, 0.154296875, 0.2542724609375, 0.354248046875, 0.4542236328125, 0.55419921875, 0.6541748046875, 0.754150390625, 0.8541259765625, 0.9541015625, 1.0540771484375, 1.154052734375, 1.2540283203125, 1.35400390625, 1.4539794921875, 1.553955078125, 1.6539306640625, 1.75390625, 1.8538818359375, 1.953857421875, 2.0538330078125, 2.15380859375, 2.2537841796875, 2.353759765625, 2.4537353515625, 2.5537109375, 2.6536865234375, 2.753662109375, 2.8536376953125, 2.95361328125, 3.0535888671875, 3.153564453125, 3.2535400390625, 3.353515625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 8.0, 18.0, 18.0, 21.0, 35.0, 39.0, 55.0, 66.0, 79.0, 100.0, 96.0, 97.0, 90.0, 75.0, 46.0, 45.0, 22.0, 16.0, 20.0, 12.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.876953125, -1.8171234130859375, -1.757293701171875, -1.6974639892578125, -1.63763427734375, -1.5778045654296875, -1.517974853515625, -1.4581451416015625, -1.3983154296875, -1.3384857177734375, -1.278656005859375, -1.2188262939453125, -1.15899658203125, -1.0991668701171875, -1.039337158203125, -0.9795074462890625, -0.919677734375, -0.8598480224609375, -0.800018310546875, -0.7401885986328125, -0.68035888671875, -0.6205291748046875, -0.560699462890625, -0.5008697509765625, -0.4410400390625, -0.3812103271484375, -0.321380615234375, -0.2615509033203125, -0.20172119140625, -0.1418914794921875, -0.082061767578125, -0.0222320556640625, 0.03759765625, 0.0974273681640625, 0.157257080078125, 0.2170867919921875, 0.27691650390625, 0.3367462158203125, 0.396575927734375, 0.4564056396484375, 0.5162353515625, 0.5760650634765625, 0.635894775390625, 0.6957244873046875, 0.75555419921875, 0.8153839111328125, 0.875213623046875, 0.9350433349609375, 0.994873046875, 1.0547027587890625, 1.114532470703125, 1.1743621826171875, 1.23419189453125, 1.2940216064453125, 1.353851318359375, 1.4136810302734375, 1.4735107421875, 1.5333404541015625, 1.593170166015625, 1.6529998779296875, 1.71282958984375, 1.7726593017578125, 1.832489013671875, 1.8923187255859375, 1.9521484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 14.0, 18.0, 20.0, 36.0, 48.0, 90.0, 147.0, 276.0, 717.0, 3284.0, 110577.0, 921293.0, 9946.0, 1177.0, 411.0, 192.0, 118.0, 78.0, 41.0, 23.0, 7.0, 11.0, 10.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69921875, -7.43572998046875, -7.1722412109375, -6.90875244140625, -6.645263671875, -6.38177490234375, -6.1182861328125, -5.85479736328125, -5.59130859375, -5.32781982421875, -5.0643310546875, -4.80084228515625, -4.537353515625, -4.27386474609375, -4.0103759765625, -3.74688720703125, -3.4833984375, -3.21990966796875, -2.9564208984375, -2.69293212890625, -2.429443359375, -2.16595458984375, -1.9024658203125, -1.63897705078125, -1.37548828125, -1.11199951171875, -0.8485107421875, -0.58502197265625, -0.321533203125, -0.05804443359375, 0.2054443359375, 0.46893310546875, 0.732421875, 0.99591064453125, 1.2593994140625, 1.52288818359375, 1.786376953125, 2.04986572265625, 2.3133544921875, 2.57684326171875, 2.84033203125, 3.10382080078125, 3.3673095703125, 3.63079833984375, 3.894287109375, 4.15777587890625, 4.4212646484375, 4.68475341796875, 4.9482421875, 5.21173095703125, 5.4752197265625, 5.73870849609375, 6.002197265625, 6.26568603515625, 6.5291748046875, 6.79266357421875, 7.05615234375, 7.31964111328125, 7.5831298828125, 7.84661865234375, 8.110107421875, 8.37359619140625, 8.6370849609375, 8.90057373046875, 9.1640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 39.0, 68.0, 112.0, 168.0, 184.0, 158.0, 122.0, 92.0, 30.0, 13.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.880859375, -21.35546875, -20.830078125, -20.3046875, -19.779296875, -19.25390625, -18.728515625, -18.203125, -17.677734375, -17.15234375, -16.626953125, -16.1015625, -15.576171875, -15.05078125, -14.525390625, -14.0, -13.474609375, -12.94921875, -12.423828125, -11.8984375, -11.373046875, -10.84765625, -10.322265625, -9.796875, -9.271484375, -8.74609375, -8.220703125, -7.6953125, -7.169921875, -6.64453125, -6.119140625, -5.59375, -5.068359375, -4.54296875, -4.017578125, -3.4921875, -2.966796875, -2.44140625, -1.916015625, -1.390625, -0.865234375, -0.33984375, 0.185546875, 0.7109375, 1.236328125, 1.76171875, 2.287109375, 2.8125, 3.337890625, 3.86328125, 4.388671875, 4.9140625, 5.439453125, 5.96484375, 6.490234375, 7.015625, 7.541015625, 8.06640625, 8.591796875, 9.1171875, 9.642578125, 10.16796875, 10.693359375, 11.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 13.0, 16.0, 20.0, 24.0, 45.0, 87.0, 169.0, 515.0, 1960.0, 13064.0, 646920.0, 372543.0, 10619.0, 1718.0, 463.0, 166.0, 68.0, 27.0, 39.0, 12.0, 9.0, 7.0, 12.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.173828125, -2.119415283203125, -2.06500244140625, -2.010589599609375, -1.9561767578125, -1.901763916015625, -1.84735107421875, -1.792938232421875, -1.738525390625, -1.684112548828125, -1.62969970703125, -1.575286865234375, -1.5208740234375, -1.466461181640625, -1.41204833984375, -1.357635498046875, -1.30322265625, -1.248809814453125, -1.19439697265625, -1.139984130859375, -1.0855712890625, -1.031158447265625, -0.97674560546875, -0.922332763671875, -0.867919921875, -0.813507080078125, -0.75909423828125, -0.704681396484375, -0.6502685546875, -0.595855712890625, -0.54144287109375, -0.487030029296875, -0.4326171875, -0.378204345703125, -0.32379150390625, -0.269378662109375, -0.2149658203125, -0.160552978515625, -0.10614013671875, -0.051727294921875, 0.002685546875, 0.057098388671875, 0.11151123046875, 0.165924072265625, 0.2203369140625, 0.274749755859375, 0.32916259765625, 0.383575439453125, 0.43798828125, 0.492401123046875, 0.54681396484375, 0.601226806640625, 0.6556396484375, 0.710052490234375, 0.76446533203125, 0.818878173828125, 0.873291015625, 0.927703857421875, 0.98211669921875, 1.036529541015625, 1.0909423828125, 1.145355224609375, 1.19976806640625, 1.254180908203125, 1.30859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 8.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 16.0, 12.0, 25.0, 49.0, 57.0, 72.0, 117.0, 127.0, 124.0, 101.0, 77.0, 46.0, 30.0, 24.0, 18.0, 15.0, 11.0, 10.0, 6.0, 5.0, 7.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011783838272094727, -0.0001134360209107399, -0.00010903365910053253, -0.00010463129729032516, -0.0001002289354801178, -9.582657366991043e-05, -9.142421185970306e-05, -8.70218500494957e-05, -8.261948823928833e-05, -7.821712642908096e-05, -7.38147646188736e-05, -6.941240280866623e-05, -6.501004099845886e-05, -6.0607679188251495e-05, -5.620531737804413e-05, -5.180295556783676e-05, -4.7400593757629395e-05, -4.299823194742203e-05, -3.859587013721466e-05, -3.4193508327007294e-05, -2.9791146516799927e-05, -2.538878470659256e-05, -2.0986422896385193e-05, -1.6584061086177826e-05, -1.2181699275970459e-05, -7.779337465763092e-06, -3.376975655555725e-06, 1.0253861546516418e-06, 5.427747964859009e-06, 9.830109775066376e-06, 1.4232471585273743e-05, 1.863483339548111e-05, 2.3037195205688477e-05, 2.7439557015895844e-05, 3.184191882610321e-05, 3.624428063631058e-05, 4.0646642446517944e-05, 4.504900425672531e-05, 4.945136606693268e-05, 5.3853727877140045e-05, 5.825608968734741e-05, 6.265845149755478e-05, 6.706081330776215e-05, 7.146317511796951e-05, 7.586553692817688e-05, 8.026789873838425e-05, 8.467026054859161e-05, 8.907262235879898e-05, 9.347498416900635e-05, 9.787734597921371e-05, 0.00010227970778942108, 0.00010668206959962845, 0.00011108443140983582, 0.00011548679322004318, 0.00011988915503025055, 0.00012429151684045792, 0.00012869387865066528, 0.00013309624046087265, 0.00013749860227108002, 0.00014190096408128738, 0.00014630332589149475, 0.00015070568770170212, 0.00015510804951190948, 0.00015951041132211685, 0.00016391277313232422]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 9.0, 12.0, 8.0, 32.0, 62.0, 117.0, 240.0, 650.0, 2354.0, 21714.0, 986760.0, 32660.0, 2666.0, 732.0, 275.0, 105.0, 59.0, 36.0, 19.0, 11.0, 8.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -2.007232666015625, -1.93438720703125, -1.861541748046875, -1.7886962890625, -1.715850830078125, -1.64300537109375, -1.570159912109375, -1.497314453125, -1.424468994140625, -1.35162353515625, -1.278778076171875, -1.2059326171875, -1.133087158203125, -1.06024169921875, -0.987396240234375, -0.91455078125, -0.841705322265625, -0.76885986328125, -0.696014404296875, -0.6231689453125, -0.550323486328125, -0.47747802734375, -0.404632568359375, -0.331787109375, -0.258941650390625, -0.18609619140625, -0.113250732421875, -0.0404052734375, 0.032440185546875, 0.10528564453125, 0.178131103515625, 0.2509765625, 0.323822021484375, 0.39666748046875, 0.469512939453125, 0.5423583984375, 0.615203857421875, 0.68804931640625, 0.760894775390625, 0.833740234375, 0.906585693359375, 0.97943115234375, 1.052276611328125, 1.1251220703125, 1.197967529296875, 1.27081298828125, 1.343658447265625, 1.41650390625, 1.489349365234375, 1.56219482421875, 1.635040283203125, 1.7078857421875, 1.780731201171875, 1.85357666015625, 1.926422119140625, 1.999267578125, 2.072113037109375, 2.14495849609375, 2.217803955078125, 2.2906494140625, 2.363494873046875, 2.43634033203125, 2.509185791015625, 2.58203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 12.0, 8.0, 14.0, 19.0, 44.0, 88.0, 133.0, 160.0, 184.0, 136.0, 78.0, 44.0, 26.0, 15.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33203125, -1.278717041015625, -1.22540283203125, -1.172088623046875, -1.1187744140625, -1.065460205078125, -1.01214599609375, -0.958831787109375, -0.905517578125, -0.852203369140625, -0.79888916015625, -0.745574951171875, -0.6922607421875, -0.638946533203125, -0.58563232421875, -0.532318115234375, -0.47900390625, -0.425689697265625, -0.37237548828125, -0.319061279296875, -0.2657470703125, -0.212432861328125, -0.15911865234375, -0.105804443359375, -0.052490234375, 0.000823974609375, 0.05413818359375, 0.107452392578125, 0.1607666015625, 0.214080810546875, 0.26739501953125, 0.320709228515625, 0.3740234375, 0.427337646484375, 0.48065185546875, 0.533966064453125, 0.5872802734375, 0.640594482421875, 0.69390869140625, 0.747222900390625, 0.800537109375, 0.853851318359375, 0.90716552734375, 0.960479736328125, 1.0137939453125, 1.067108154296875, 1.12042236328125, 1.173736572265625, 1.22705078125, 1.280364990234375, 1.33367919921875, 1.386993408203125, 1.4403076171875, 1.493621826171875, 1.54693603515625, 1.600250244140625, 1.653564453125, 1.706878662109375, 1.76019287109375, 1.813507080078125, 1.8668212890625, 1.920135498046875, 1.97344970703125, 2.026763916015625, 2.080078125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 17.0, 122.0, 653.0, 203.0, 16.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.2798309326172, -128.9432373046875, -124.60664367675781, -120.27005004882812, -115.93345642089844, -111.59686279296875, -107.26026916503906, -102.92367553710938, -98.58708190917969, -94.25048828125, -89.91389465332031, -85.57730102539062, -81.24070739746094, -76.90411376953125, -72.56752014160156, -68.23092651367188, -63.89433288574219, -59.5577392578125, -55.22114562988281, -50.884552001953125, -46.54795837402344, -42.21136474609375, -37.87477111816406, -33.538177490234375, -29.201583862304688, -24.864990234375, -20.528396606445312, -16.191802978515625, -11.855209350585938, -7.51861572265625, -3.1820220947265625, 1.154571533203125, 5.49114990234375, 9.827743530273438, 14.164337158203125, 18.500930786132812, 22.8375244140625, 27.174118041992188, 31.510711669921875, 35.84730529785156, 40.18389892578125, 44.52049255371094, 48.857086181640625, 53.19367980957031, 57.5302734375, 61.86686706542969, 66.20346069335938, 70.54005432128906, 74.87664794921875, 79.21324157714844, 83.54983520507812, 87.88642883300781, 92.2230224609375, 96.55961608886719, 100.89620971679688, 105.23280334472656, 109.56939697265625, 113.90599060058594, 118.24258422851562, 122.57917785644531, 126.915771484375, 131.2523651123047, 135.58895874023438, 139.92555236816406, 144.26214599609375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 16.0, 16.0, 17.0, 21.0, 30.0, 23.0, 43.0, 29.0, 37.0, 58.0, 54.0, 59.0, 60.0, 67.0, 60.0, 55.0, 52.0, 47.0, 38.0, 43.0, 27.0, 32.0, 23.0, 18.0, 7.0, 12.0, 20.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.70851135253906, -40.5550422668457, -39.401573181152344, -38.248104095458984, -37.094635009765625, -35.941165924072266, -34.787696838378906, -33.63422775268555, -32.48075866699219, -31.327289581298828, -30.17382049560547, -29.02035140991211, -27.86688232421875, -26.71341323852539, -25.55994415283203, -24.406475067138672, -23.253005981445312, -22.099536895751953, -20.946067810058594, -19.792598724365234, -18.639129638671875, -17.485660552978516, -16.332191467285156, -15.178722381591797, -14.025253295898438, -12.871784210205078, -11.718315124511719, -10.56484603881836, -9.411376953125, -8.25790786743164, -7.104438781738281, -5.950969696044922, -4.797496795654297, -3.6440277099609375, -2.490558624267578, -1.3370895385742188, -0.18362045288085938, 0.9698486328125, 2.1233177185058594, 3.2767868041992188, 4.430255889892578, 5.5837249755859375, 6.737194061279297, 7.890663146972656, 9.044132232666016, 10.197601318359375, 11.351070404052734, 12.504539489746094, 13.658008575439453, 14.811477661132812, 15.964946746826172, 17.11841583251953, 18.27188491821289, 19.42535400390625, 20.57882308959961, 21.73229217529297, 22.885761260986328, 24.039230346679688, 25.192699432373047, 26.346168518066406, 27.499637603759766, 28.653106689453125, 29.806575775146484, 30.960044860839844, 32.1135139465332]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 12.0, 9.0, 20.0, 26.0, 33.0, 55.0, 58.0, 114.0, 123.0, 205.0, 270.0, 402.0, 620.0, 1033.0, 1720.0, 2806.0, 4930.0, 10407.0, 26163.0, 109223.0, 1439583.0, 2415902.0, 128950.0, 26415.0, 10630.0, 5546.0, 3159.0, 1944.0, 1219.0, 788.0, 575.0, 376.0, 267.0, 202.0, 146.0, 92.0, 62.0, 55.0, 40.0, 28.0, 17.0, 14.0, 11.0, 6.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9634246826171875, -0.927825927734375, -0.8922271728515625, -0.85662841796875, -0.8210296630859375, -0.785430908203125, -0.7498321533203125, -0.7142333984375, -0.6786346435546875, -0.643035888671875, -0.6074371337890625, -0.57183837890625, -0.5362396240234375, -0.500640869140625, -0.4650421142578125, -0.429443359375, -0.3938446044921875, -0.358245849609375, -0.3226470947265625, -0.28704833984375, -0.2514495849609375, -0.215850830078125, -0.1802520751953125, -0.1446533203125, -0.1090545654296875, -0.073455810546875, -0.0378570556640625, -0.00225830078125, 0.0333404541015625, 0.068939208984375, 0.1045379638671875, 0.14013671875, 0.1757354736328125, 0.211334228515625, 0.2469329833984375, 0.28253173828125, 0.3181304931640625, 0.353729248046875, 0.3893280029296875, 0.4249267578125, 0.4605255126953125, 0.496124267578125, 0.5317230224609375, 0.56732177734375, 0.6029205322265625, 0.638519287109375, 0.6741180419921875, 0.709716796875, 0.7453155517578125, 0.780914306640625, 0.8165130615234375, 0.85211181640625, 0.8877105712890625, 0.923309326171875, 0.9589080810546875, 0.9945068359375, 1.0301055908203125, 1.065704345703125, 1.1013031005859375, 1.13690185546875, 1.1725006103515625, 1.208099365234375, 1.2436981201171875, 1.279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 7.0, 16.0, 10.0, 15.0, 26.0, 26.0, 24.0, 27.0, 36.0, 44.0, 58.0, 57.0, 53.0, 56.0, 58.0, 61.0, 56.0, 60.0, 42.0, 37.0, 41.0, 35.0, 26.0, 17.0, 18.0, 23.0, 13.0, 9.0, 5.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9189453125, -0.8869171142578125, -0.854888916015625, -0.8228607177734375, -0.79083251953125, -0.7588043212890625, -0.726776123046875, -0.6947479248046875, -0.6627197265625, -0.6306915283203125, -0.598663330078125, -0.5666351318359375, -0.53460693359375, -0.5025787353515625, -0.470550537109375, -0.4385223388671875, -0.406494140625, -0.3744659423828125, -0.342437744140625, -0.3104095458984375, -0.27838134765625, -0.2463531494140625, -0.214324951171875, -0.1822967529296875, -0.1502685546875, -0.1182403564453125, -0.086212158203125, -0.0541839599609375, -0.02215576171875, 0.0098724365234375, 0.041900634765625, 0.0739288330078125, 0.10595703125, 0.1379852294921875, 0.170013427734375, 0.2020416259765625, 0.23406982421875, 0.2660980224609375, 0.298126220703125, 0.3301544189453125, 0.3621826171875, 0.3942108154296875, 0.426239013671875, 0.4582672119140625, 0.49029541015625, 0.5223236083984375, 0.554351806640625, 0.5863800048828125, 0.618408203125, 0.6504364013671875, 0.682464599609375, 0.7144927978515625, 0.74652099609375, 0.7785491943359375, 0.810577392578125, 0.8426055908203125, 0.8746337890625, 0.9066619873046875, 0.938690185546875, 0.9707183837890625, 1.00274658203125, 1.0347747802734375, 1.066802978515625, 1.0988311767578125, 1.130859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 5.0, 9.0, 19.0, 16.0, 31.0, 50.0, 103.0, 221.0, 395.0, 999.0, 3259.0, 18390.0, 611125.0, 3525401.0, 27485.0, 4352.0, 1245.0, 490.0, 266.0, 141.0, 88.0, 36.0, 28.0, 17.0, 17.0, 13.0, 7.0, 3.0, 6.0, 7.0, 2.0, 4.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.7000732421875, -3.591552734375, -3.4830322265625, -3.37451171875, -3.2659912109375, -3.157470703125, -3.0489501953125, -2.9404296875, -2.8319091796875, -2.723388671875, -2.6148681640625, -2.50634765625, -2.3978271484375, -2.289306640625, -2.1807861328125, -2.072265625, -1.9637451171875, -1.855224609375, -1.7467041015625, -1.63818359375, -1.5296630859375, -1.421142578125, -1.3126220703125, -1.2041015625, -1.0955810546875, -0.987060546875, -0.8785400390625, -0.77001953125, -0.6614990234375, -0.552978515625, -0.4444580078125, -0.3359375, -0.2274169921875, -0.118896484375, -0.0103759765625, 0.09814453125, 0.2066650390625, 0.315185546875, 0.4237060546875, 0.5322265625, 0.6407470703125, 0.749267578125, 0.8577880859375, 0.96630859375, 1.0748291015625, 1.183349609375, 1.2918701171875, 1.400390625, 1.5089111328125, 1.617431640625, 1.7259521484375, 1.83447265625, 1.9429931640625, 2.051513671875, 2.1600341796875, 2.2685546875, 2.3770751953125, 2.485595703125, 2.5941162109375, 2.70263671875, 2.8111572265625, 2.919677734375, 3.0281982421875, 3.13671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 8.0, 10.0, 10.0, 14.0, 24.0, 23.0, 32.0, 58.0, 183.0, 784.0, 1964.0, 623.0, 140.0, 61.0, 35.0, 21.0, 26.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.044921875, -1.949798583984375, -1.85467529296875, -1.759552001953125, -1.6644287109375, -1.569305419921875, -1.47418212890625, -1.379058837890625, -1.283935546875, -1.188812255859375, -1.09368896484375, -0.998565673828125, -0.9034423828125, -0.808319091796875, -0.71319580078125, -0.618072509765625, -0.52294921875, -0.427825927734375, -0.33270263671875, -0.237579345703125, -0.1424560546875, -0.047332763671875, 0.04779052734375, 0.142913818359375, 0.238037109375, 0.333160400390625, 0.42828369140625, 0.523406982421875, 0.6185302734375, 0.713653564453125, 0.80877685546875, 0.903900146484375, 0.9990234375, 1.094146728515625, 1.18927001953125, 1.284393310546875, 1.3795166015625, 1.474639892578125, 1.56976318359375, 1.664886474609375, 1.760009765625, 1.855133056640625, 1.95025634765625, 2.045379638671875, 2.1405029296875, 2.235626220703125, 2.33074951171875, 2.425872802734375, 2.52099609375, 2.616119384765625, 2.71124267578125, 2.806365966796875, 2.9014892578125, 2.996612548828125, 3.09173583984375, 3.186859130859375, 3.281982421875, 3.377105712890625, 3.47222900390625, 3.567352294921875, 3.6624755859375, 3.757598876953125, 3.85272216796875, 3.947845458984375, 4.04296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 4.0, 18.0, 19.0, 26.0, 47.0, 91.0, 129.0, 140.0, 154.0, 119.0, 90.0, 56.0, 31.0, 12.0, 18.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.957306861877441, -12.5669584274292, -12.176609992980957, -11.786261558532715, -11.395913124084473, -11.00556468963623, -10.615216255187988, -10.224867820739746, -9.834519386291504, -9.444170951843262, -9.05382251739502, -8.663474082946777, -8.273125648498535, -7.882777214050293, -7.492428779602051, -7.102080345153809, -6.711731910705566, -6.321383476257324, -5.931035041809082, -5.54068660736084, -5.150338172912598, -4.7599897384643555, -4.369641304016113, -3.979292869567871, -3.588944435119629, -3.1985960006713867, -2.8082475662231445, -2.4178991317749023, -2.02755069732666, -1.637202262878418, -1.2468538284301758, -0.8565053939819336, -0.466156005859375, -0.07580757141113281, 0.3145408630371094, 0.7048892974853516, 1.0952377319335938, 1.485586166381836, 1.8759346008300781, 2.2662830352783203, 2.6566314697265625, 3.0469799041748047, 3.437328338623047, 3.827676773071289, 4.218025207519531, 4.608373641967773, 4.998722076416016, 5.389070510864258, 5.7794189453125, 6.169767379760742, 6.560115814208984, 6.950464248657227, 7.340812683105469, 7.731161117553711, 8.121509552001953, 8.511857986450195, 8.902206420898438, 9.29255485534668, 9.682903289794922, 10.073251724243164, 10.463600158691406, 10.853948593139648, 11.24429702758789, 11.634645462036133, 12.024993896484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 12.0, 9.0, 19.0, 29.0, 20.0, 21.0, 28.0, 33.0, 40.0, 45.0, 41.0, 52.0, 54.0, 82.0, 64.0, 71.0, 52.0, 34.0, 57.0, 39.0, 31.0, 38.0, 26.0, 23.0, 14.0, 17.0, 13.0, 7.0, 4.0, 5.0, 1.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.359330177307129, -9.958972930908203, -9.558615684509277, -9.158258438110352, -8.757902145385742, -8.3575439453125, -7.957187652587891, -7.556830406188965, -7.156473159790039, -6.756115913391113, -6.3557586669921875, -5.95540189743042, -5.555044651031494, -5.154687404632568, -4.754330635070801, -4.353973388671875, -3.953616142272949, -3.5532588958740234, -3.1529018878936768, -2.75254487991333, -2.3521876335144043, -1.9518303871154785, -1.5514733791351318, -1.1511163711547852, -0.7507591247558594, -0.35040199756622314, 0.049955129623413086, 0.4503122568130493, 0.8506693840026855, 1.2510266304016113, 1.651383638381958, 2.0517406463623047, 2.4520978927612305, 2.8524551391601562, 3.252812147140503, 3.6531691551208496, 4.053526401519775, 4.453883647918701, 4.854240417480469, 5.2545976638793945, 5.65495491027832, 6.055312156677246, 6.455669403076172, 6.8560261726379395, 7.256383419036865, 7.656740665435791, 8.057097434997559, 8.457454681396484, 8.85781192779541, 9.258169174194336, 9.658526420593262, 10.058883666992188, 10.459239959716797, 10.859598159790039, 11.259954452514648, 11.660311698913574, 12.0606689453125, 12.461026191711426, 12.861383438110352, 13.261740684509277, 13.662097930908203, 14.062454223632812, 14.462811470031738, 14.863168716430664, 15.26352596282959]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 17.0, 22.0, 24.0, 52.0, 63.0, 91.0, 136.0, 194.0, 291.0, 446.0, 683.0, 1125.0, 1674.0, 2910.0, 4910.0, 8425.0, 15237.0, 28004.0, 54273.0, 111025.0, 217306.0, 271049.0, 162404.0, 79597.0, 39851.0, 20718.0, 11697.0, 6468.0, 3677.0, 2260.0, 1412.0, 881.0, 577.0, 377.0, 232.0, 142.0, 94.0, 64.0, 47.0, 34.0, 20.0, 13.0, 11.0, 11.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.6571121215820312, -0.6320953369140625, -0.6070785522460938, -0.582061767578125, -0.5570449829101562, -0.5320281982421875, -0.5070114135742188, -0.48199462890625, -0.45697784423828125, -0.4319610595703125, -0.40694427490234375, -0.381927490234375, -0.35691070556640625, -0.3318939208984375, -0.30687713623046875, -0.2818603515625, -0.25684356689453125, -0.2318267822265625, -0.20680999755859375, -0.181793212890625, -0.15677642822265625, -0.1317596435546875, -0.10674285888671875, -0.08172607421875, -0.05670928955078125, -0.0316925048828125, -0.00667572021484375, 0.018341064453125, 0.04335784912109375, 0.0683746337890625, 0.09339141845703125, 0.118408203125, 0.14342498779296875, 0.1684417724609375, 0.19345855712890625, 0.218475341796875, 0.24349212646484375, 0.2685089111328125, 0.29352569580078125, 0.31854248046875, 0.34355926513671875, 0.3685760498046875, 0.39359283447265625, 0.418609619140625, 0.44362640380859375, 0.4686431884765625, 0.49365997314453125, 0.5186767578125, 0.5436935424804688, 0.5687103271484375, 0.5937271118164062, 0.618743896484375, 0.6437606811523438, 0.6687774658203125, 0.6937942504882812, 0.71881103515625, 0.7438278198242188, 0.7688446044921875, 0.7938613891601562, 0.818878173828125, 0.8438949584960938, 0.8689117431640625, 0.8939285278320312, 0.9189453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 22.0, 18.0, 13.0, 19.0, 20.0, 29.0, 27.0, 42.0, 32.0, 38.0, 51.0, 46.0, 53.0, 47.0, 70.0, 59.0, 54.0, 60.0, 39.0, 36.0, 29.0, 22.0, 33.0, 31.0, 25.0, 15.0, 11.0, 10.0, 10.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.7779388427734375, -0.748260498046875, -0.7185821533203125, -0.68890380859375, -0.6592254638671875, -0.629547119140625, -0.5998687744140625, -0.5701904296875, -0.5405120849609375, -0.510833740234375, -0.4811553955078125, -0.45147705078125, -0.4217987060546875, -0.392120361328125, -0.3624420166015625, -0.332763671875, -0.3030853271484375, -0.273406982421875, -0.2437286376953125, -0.21405029296875, -0.1843719482421875, -0.154693603515625, -0.1250152587890625, -0.0953369140625, -0.0656585693359375, -0.035980224609375, -0.0063018798828125, 0.02337646484375, 0.0530548095703125, 0.082733154296875, 0.1124114990234375, 0.14208984375, 0.1717681884765625, 0.201446533203125, 0.2311248779296875, 0.26080322265625, 0.2904815673828125, 0.320159912109375, 0.3498382568359375, 0.3795166015625, 0.4091949462890625, 0.438873291015625, 0.4685516357421875, 0.49822998046875, 0.5279083251953125, 0.557586669921875, 0.5872650146484375, 0.616943359375, 0.6466217041015625, 0.676300048828125, 0.7059783935546875, 0.73565673828125, 0.7653350830078125, 0.795013427734375, 0.8246917724609375, 0.8543701171875, 0.8840484619140625, 0.913726806640625, 0.9434051513671875, 0.97308349609375, 1.0027618408203125, 1.032440185546875, 1.0621185302734375, 1.091796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 7.0, 12.0, 16.0, 22.0, 51.0, 71.0, 121.0, 180.0, 301.0, 573.0, 1171.0, 3068.0, 13614.0, 165124.0, 796046.0, 57059.0, 7296.0, 2016.0, 791.0, 419.0, 221.0, 122.0, 86.0, 51.0, 35.0, 24.0, 16.0, 8.0, 4.0, 6.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.784820556640625, -2.67901611328125, -2.573211669921875, -2.4674072265625, -2.361602783203125, -2.25579833984375, -2.149993896484375, -2.044189453125, -1.938385009765625, -1.83258056640625, -1.726776123046875, -1.6209716796875, -1.515167236328125, -1.40936279296875, -1.303558349609375, -1.19775390625, -1.091949462890625, -0.98614501953125, -0.880340576171875, -0.7745361328125, -0.668731689453125, -0.56292724609375, -0.457122802734375, -0.351318359375, -0.245513916015625, -0.13970947265625, -0.033905029296875, 0.0718994140625, 0.177703857421875, 0.28350830078125, 0.389312744140625, 0.4951171875, 0.600921630859375, 0.70672607421875, 0.812530517578125, 0.9183349609375, 1.024139404296875, 1.12994384765625, 1.235748291015625, 1.341552734375, 1.447357177734375, 1.55316162109375, 1.658966064453125, 1.7647705078125, 1.870574951171875, 1.97637939453125, 2.082183837890625, 2.18798828125, 2.293792724609375, 2.39959716796875, 2.505401611328125, 2.6112060546875, 2.717010498046875, 2.82281494140625, 2.928619384765625, 3.034423828125, 3.140228271484375, 3.24603271484375, 3.351837158203125, 3.4576416015625, 3.563446044921875, 3.66925048828125, 3.775054931640625, 3.880859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 10.0, 7.0, 12.0, 15.0, 27.0, 24.0, 22.0, 32.0, 43.0, 36.0, 45.0, 46.0, 49.0, 57.0, 50.0, 45.0, 40.0, 76.0, 47.0, 39.0, 36.0, 37.0, 33.0, 32.0, 27.0, 15.0, 16.0, 13.0, 9.0, 11.0, 6.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.767578125, -3.635955810546875, -3.50433349609375, -3.372711181640625, -3.2410888671875, -3.109466552734375, -2.97784423828125, -2.846221923828125, -2.714599609375, -2.582977294921875, -2.45135498046875, -2.319732666015625, -2.1881103515625, -2.056488037109375, -1.92486572265625, -1.793243408203125, -1.66162109375, -1.529998779296875, -1.39837646484375, -1.266754150390625, -1.1351318359375, -1.003509521484375, -0.87188720703125, -0.740264892578125, -0.608642578125, -0.477020263671875, -0.34539794921875, -0.213775634765625, -0.0821533203125, 0.049468994140625, 0.18109130859375, 0.312713623046875, 0.4443359375, 0.575958251953125, 0.70758056640625, 0.839202880859375, 0.9708251953125, 1.102447509765625, 1.23406982421875, 1.365692138671875, 1.497314453125, 1.628936767578125, 1.76055908203125, 1.892181396484375, 2.0238037109375, 2.155426025390625, 2.28704833984375, 2.418670654296875, 2.55029296875, 2.681915283203125, 2.81353759765625, 2.945159912109375, 3.0767822265625, 3.208404541015625, 3.34002685546875, 3.471649169921875, 3.603271484375, 3.734893798828125, 3.86651611328125, 3.998138427734375, 4.1297607421875, 4.261383056640625, 4.39300537109375, 4.524627685546875, 4.65625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 15.0, 19.0, 23.0, 35.0, 55.0, 98.0, 169.0, 299.0, 577.0, 1441.0, 3695.0, 16382.0, 423640.0, 576819.0, 18406.0, 3983.0, 1438.0, 650.0, 297.0, 172.0, 112.0, 56.0, 44.0, 23.0, 14.0, 8.0, 9.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1591796875, -1.120574951171875, -1.08197021484375, -1.043365478515625, -1.0047607421875, -0.966156005859375, -0.92755126953125, -0.888946533203125, -0.850341796875, -0.811737060546875, -0.77313232421875, -0.734527587890625, -0.6959228515625, -0.657318115234375, -0.61871337890625, -0.580108642578125, -0.54150390625, -0.502899169921875, -0.46429443359375, -0.425689697265625, -0.3870849609375, -0.348480224609375, -0.30987548828125, -0.271270751953125, -0.232666015625, -0.194061279296875, -0.15545654296875, -0.116851806640625, -0.0782470703125, -0.039642333984375, -0.00103759765625, 0.037567138671875, 0.076171875, 0.114776611328125, 0.15338134765625, 0.191986083984375, 0.2305908203125, 0.269195556640625, 0.30780029296875, 0.346405029296875, 0.385009765625, 0.423614501953125, 0.46221923828125, 0.500823974609375, 0.5394287109375, 0.578033447265625, 0.61663818359375, 0.655242919921875, 0.69384765625, 0.732452392578125, 0.77105712890625, 0.809661865234375, 0.8482666015625, 0.886871337890625, 0.92547607421875, 0.964080810546875, 1.002685546875, 1.041290283203125, 1.07989501953125, 1.118499755859375, 1.1571044921875, 1.195709228515625, 1.23431396484375, 1.272918701171875, 1.3115234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 9.0, 6.0, 13.0, 14.0, 31.0, 53.0, 88.0, 131.0, 184.0, 183.0, 108.0, 69.0, 37.0, 31.0, 11.0, 14.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00027108192443847656, -0.00026389583945274353, -0.0002567097544670105, -0.00024952366948127747, -0.00024233758449554443, -0.0002351514995098114, -0.00022796541452407837, -0.00022077932953834534, -0.0002135932445526123, -0.00020640715956687927, -0.00019922107458114624, -0.0001920349895954132, -0.00018484890460968018, -0.00017766281962394714, -0.0001704767346382141, -0.00016329064965248108, -0.00015610456466674805, -0.00014891847968101501, -0.00014173239469528198, -0.00013454630970954895, -0.00012736022472381592, -0.00012017413973808289, -0.00011298805475234985, -0.00010580196976661682, -9.861588478088379e-05, -9.142979979515076e-05, -8.424371480941772e-05, -7.705762982368469e-05, -6.987154483795166e-05, -6.268545985221863e-05, -5.5499374866485596e-05, -4.8313289880752563e-05, -4.112720489501953e-05, -3.39411199092865e-05, -2.6755034923553467e-05, -1.9568949937820435e-05, -1.2382864952087402e-05, -5.19677996635437e-06, 1.989305019378662e-06, 9.175390005111694e-06, 1.6361474990844727e-05, 2.354755997657776e-05, 3.073364496231079e-05, 3.791972994804382e-05, 4.5105814933776855e-05, 5.229189991950989e-05, 5.947798490524292e-05, 6.666406989097595e-05, 7.385015487670898e-05, 8.103623986244202e-05, 8.822232484817505e-05, 9.540840983390808e-05, 0.00010259449481964111, 0.00010978057980537415, 0.00011696666479110718, 0.0001241527497768402, 0.00013133883476257324, 0.00013852491974830627, 0.0001457110047340393, 0.00015289708971977234, 0.00016008317470550537, 0.0001672692596912384, 0.00017445534467697144, 0.00018164142966270447, 0.0001888275146484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 3.0, 5.0, 13.0, 12.0, 13.0, 28.0, 30.0, 48.0, 71.0, 107.0, 194.0, 387.0, 904.0, 2658.0, 11446.0, 250725.0, 754746.0, 21049.0, 3770.0, 1238.0, 476.0, 216.0, 123.0, 87.0, 57.0, 29.0, 26.0, 17.0, 11.0, 7.0, 10.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3076171875, -1.266937255859375, -1.22625732421875, -1.185577392578125, -1.1448974609375, -1.104217529296875, -1.06353759765625, -1.022857666015625, -0.982177734375, -0.941497802734375, -0.90081787109375, -0.860137939453125, -0.8194580078125, -0.778778076171875, -0.73809814453125, -0.697418212890625, -0.65673828125, -0.616058349609375, -0.57537841796875, -0.534698486328125, -0.4940185546875, -0.453338623046875, -0.41265869140625, -0.371978759765625, -0.331298828125, -0.290618896484375, -0.24993896484375, -0.209259033203125, -0.1685791015625, -0.127899169921875, -0.08721923828125, -0.046539306640625, -0.005859375, 0.034820556640625, 0.07550048828125, 0.116180419921875, 0.1568603515625, 0.197540283203125, 0.23822021484375, 0.278900146484375, 0.319580078125, 0.360260009765625, 0.40093994140625, 0.441619873046875, 0.4822998046875, 0.522979736328125, 0.56365966796875, 0.604339599609375, 0.64501953125, 0.685699462890625, 0.72637939453125, 0.767059326171875, 0.8077392578125, 0.848419189453125, 0.88909912109375, 0.929779052734375, 0.970458984375, 1.011138916015625, 1.05181884765625, 1.092498779296875, 1.1331787109375, 1.173858642578125, 1.21453857421875, 1.255218505859375, 1.2958984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 14.0, 12.0, 21.0, 38.0, 49.0, 60.0, 88.0, 116.0, 117.0, 107.0, 82.0, 73.0, 64.0, 39.0, 31.0, 26.0, 10.0, 6.0, 4.0, 5.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.173828125, -1.1358489990234375, -1.097869873046875, -1.0598907470703125, -1.02191162109375, -0.9839324951171875, -0.945953369140625, -0.9079742431640625, -0.8699951171875, -0.8320159912109375, -0.794036865234375, -0.7560577392578125, -0.71807861328125, -0.6800994873046875, -0.642120361328125, -0.6041412353515625, -0.566162109375, -0.5281829833984375, -0.490203857421875, -0.4522247314453125, -0.41424560546875, -0.3762664794921875, -0.338287353515625, -0.3003082275390625, -0.2623291015625, -0.2243499755859375, -0.186370849609375, -0.1483917236328125, -0.11041259765625, -0.0724334716796875, -0.034454345703125, 0.0035247802734375, 0.04150390625, 0.0794830322265625, 0.117462158203125, 0.1554412841796875, 0.19342041015625, 0.2313995361328125, 0.269378662109375, 0.3073577880859375, 0.3453369140625, 0.3833160400390625, 0.421295166015625, 0.4592742919921875, 0.49725341796875, 0.5352325439453125, 0.573211669921875, 0.6111907958984375, 0.649169921875, 0.6871490478515625, 0.725128173828125, 0.7631072998046875, 0.80108642578125, 0.8390655517578125, 0.877044677734375, 0.9150238037109375, 0.9530029296875, 0.9909820556640625, 1.028961181640625, 1.0669403076171875, 1.10491943359375, 1.1428985595703125, 1.180877685546875, 1.2188568115234375, 1.2568359375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 21.0, 230.0, 561.0, 145.0, 23.0, 8.0, 10.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-101.09318542480469, -99.19454956054688, -97.2959213256836, -95.39728546142578, -93.4986572265625, -91.60002136230469, -89.7013931274414, -87.8027572631836, -85.90412902832031, -84.0054931640625, -82.10686492919922, -80.2082290649414, -78.30960083007812, -76.41096496582031, -74.51233673095703, -72.61370086669922, -70.71507263183594, -68.81643676757812, -66.91780853271484, -65.01917266845703, -63.12054443359375, -61.2219123840332, -59.323280334472656, -57.424644470214844, -55.52600860595703, -53.627376556396484, -51.72874450683594, -49.83011245727539, -47.931480407714844, -46.0328483581543, -44.13421630859375, -42.23558044433594, -40.336952209472656, -38.43832015991211, -36.53968811035156, -34.641056060791016, -32.74242401123047, -30.843791961669922, -28.945158004760742, -27.046525955200195, -25.14789581298828, -23.249263763427734, -21.350631713867188, -19.45199966430664, -17.553367614746094, -15.65473461151123, -13.756101608276367, -11.85746955871582, -9.958837509155273, -8.060205459594727, -6.1615729331970215, -4.262940406799316, -2.3643083572387695, -0.46567630767822266, 1.4329566955566406, 3.3315887451171875, 5.230220794677734, 7.128852844238281, 9.027484893798828, 10.926117897033691, 12.824749946594238, 14.723381996154785, 16.62201499938965, 18.520647048950195, 20.419279098510742]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 3.0, 8.0, 18.0, 22.0, 11.0, 18.0, 17.0, 32.0, 24.0, 34.0, 35.0, 35.0, 40.0, 47.0, 56.0, 54.0, 66.0, 48.0, 51.0, 44.0, 41.0, 28.0, 34.0, 28.0, 32.0, 30.0, 21.0, 21.0, 28.0, 19.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.727006912231445, -15.239923477172852, -14.752840042114258, -14.265755653381348, -13.778672218322754, -13.29158878326416, -12.804505348205566, -12.317420959472656, -11.830337524414062, -11.343254089355469, -10.856170654296875, -10.369086265563965, -9.882002830505371, -9.394919395446777, -8.907835960388184, -8.420751571655273, -7.933668613433838, -7.446585178375244, -6.959501266479492, -6.472417831420898, -5.9853339195251465, -5.498250484466553, -5.011166572570801, -4.524083137512207, -4.036999702453613, -3.5499160289764404, -3.0628323554992676, -2.575748920440674, -2.088665008544922, -1.6015815734863281, -1.1144979000091553, -0.6274142265319824, -0.14033031463623047, 0.34675332903862, 0.8338369727134705, 1.3209205865859985, 1.8080042600631714, 2.2950878143310547, 2.7821714878082275, 3.2692551612854004, 3.7563388347625732, 4.243422508239746, 4.73050594329834, 5.217589855194092, 5.7046732902526855, 6.1917572021484375, 6.678840637207031, 7.165924072265625, 7.653007984161377, 8.140091896057129, 8.627175331115723, 9.114258766174316, 9.60134220123291, 10.08842658996582, 10.575510025024414, 11.062593460083008, 11.549676895141602, 12.036760330200195, 12.523843765258789, 13.0109281539917, 13.498011589050293, 13.985095024108887, 14.47217845916748, 14.95926284790039, 15.446346282958984]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 4.0, 10.0, 12.0, 19.0, 36.0, 51.0, 87.0, 179.0, 413.0, 1385.0, 6620.0, 79166.0, 4022893.0, 75163.0, 5772.0, 1374.0, 500.0, 220.0, 129.0, 72.0, 42.0, 39.0, 20.0, 16.0, 12.0, 12.0, 10.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.412109375, -3.32989501953125, -3.2476806640625, -3.16546630859375, -3.083251953125, -3.00103759765625, -2.9188232421875, -2.83660888671875, -2.75439453125, -2.67218017578125, -2.5899658203125, -2.50775146484375, -2.425537109375, -2.34332275390625, -2.2611083984375, -2.17889404296875, -2.0966796875, -2.01446533203125, -1.9322509765625, -1.85003662109375, -1.767822265625, -1.68560791015625, -1.6033935546875, -1.52117919921875, -1.43896484375, -1.35675048828125, -1.2745361328125, -1.19232177734375, -1.110107421875, -1.02789306640625, -0.9456787109375, -0.86346435546875, -0.78125, -0.69903564453125, -0.6168212890625, -0.53460693359375, -0.452392578125, -0.37017822265625, -0.2879638671875, -0.20574951171875, -0.12353515625, -0.04132080078125, 0.0408935546875, 0.12310791015625, 0.205322265625, 0.28753662109375, 0.3697509765625, 0.45196533203125, 0.5341796875, 0.61639404296875, 0.6986083984375, 0.78082275390625, 0.863037109375, 0.94525146484375, 1.0274658203125, 1.10968017578125, 1.19189453125, 1.27410888671875, 1.3563232421875, 1.43853759765625, 1.520751953125, 1.60296630859375, 1.6851806640625, 1.76739501953125, 1.849609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 7.0, 9.0, 15.0, 15.0, 18.0, 33.0, 44.0, 46.0, 60.0, 67.0, 76.0, 70.0, 81.0, 84.0, 88.0, 68.0, 62.0, 35.0, 34.0, 27.0, 21.0, 9.0, 12.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8896484375, -0.847930908203125, -0.80621337890625, -0.764495849609375, -0.7227783203125, -0.681060791015625, -0.63934326171875, -0.597625732421875, -0.555908203125, -0.514190673828125, -0.47247314453125, -0.430755615234375, -0.3890380859375, -0.347320556640625, -0.30560302734375, -0.263885498046875, -0.22216796875, -0.180450439453125, -0.13873291015625, -0.097015380859375, -0.0552978515625, -0.013580322265625, 0.02813720703125, 0.069854736328125, 0.111572265625, 0.153289794921875, 0.19500732421875, 0.236724853515625, 0.2784423828125, 0.320159912109375, 0.36187744140625, 0.403594970703125, 0.4453125, 0.487030029296875, 0.52874755859375, 0.570465087890625, 0.6121826171875, 0.653900146484375, 0.69561767578125, 0.737335205078125, 0.779052734375, 0.820770263671875, 0.86248779296875, 0.904205322265625, 0.9459228515625, 0.987640380859375, 1.02935791015625, 1.071075439453125, 1.11279296875, 1.154510498046875, 1.19622802734375, 1.237945556640625, 1.2796630859375, 1.321380615234375, 1.36309814453125, 1.404815673828125, 1.446533203125, 1.488250732421875, 1.52996826171875, 1.571685791015625, 1.6134033203125, 1.655120849609375, 1.69683837890625, 1.738555908203125, 1.7802734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 13.0, 19.0, 44.0, 102.0, 165.0, 414.0, 1618.0, 12416.0, 1715599.0, 2449847.0, 11654.0, 1506.0, 418.0, 215.0, 112.0, 60.0, 38.0, 18.0, 15.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.29595947265625, -3.1739501953125, -3.05194091796875, -2.929931640625, -2.80792236328125, -2.6859130859375, -2.56390380859375, -2.44189453125, -2.31988525390625, -2.1978759765625, -2.07586669921875, -1.953857421875, -1.83184814453125, -1.7098388671875, -1.58782958984375, -1.4658203125, -1.34381103515625, -1.2218017578125, -1.09979248046875, -0.977783203125, -0.85577392578125, -0.7337646484375, -0.61175537109375, -0.48974609375, -0.36773681640625, -0.2457275390625, -0.12371826171875, -0.001708984375, 0.12030029296875, 0.2423095703125, 0.36431884765625, 0.486328125, 0.60833740234375, 0.7303466796875, 0.85235595703125, 0.974365234375, 1.09637451171875, 1.2183837890625, 1.34039306640625, 1.46240234375, 1.58441162109375, 1.7064208984375, 1.82843017578125, 1.950439453125, 2.07244873046875, 2.1944580078125, 2.31646728515625, 2.4384765625, 2.56048583984375, 2.6824951171875, 2.80450439453125, 2.926513671875, 3.04852294921875, 3.1705322265625, 3.29254150390625, 3.41455078125, 3.53656005859375, 3.6585693359375, 3.78057861328125, 3.902587890625, 4.02459716796875, 4.1466064453125, 4.26861572265625, 4.390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 8.0, 8.0, 10.0, 13.0, 24.0, 45.0, 60.0, 181.0, 851.0, 1971.0, 612.0, 156.0, 59.0, 34.0, 17.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.283203125, -2.19342041015625, -2.1036376953125, -2.01385498046875, -1.924072265625, -1.83428955078125, -1.7445068359375, -1.65472412109375, -1.56494140625, -1.47515869140625, -1.3853759765625, -1.29559326171875, -1.205810546875, -1.11602783203125, -1.0262451171875, -0.93646240234375, -0.8466796875, -0.75689697265625, -0.6671142578125, -0.57733154296875, -0.487548828125, -0.39776611328125, -0.3079833984375, -0.21820068359375, -0.12841796875, -0.03863525390625, 0.0511474609375, 0.14093017578125, 0.230712890625, 0.32049560546875, 0.4102783203125, 0.50006103515625, 0.58984375, 0.67962646484375, 0.7694091796875, 0.85919189453125, 0.948974609375, 1.03875732421875, 1.1285400390625, 1.21832275390625, 1.30810546875, 1.39788818359375, 1.4876708984375, 1.57745361328125, 1.667236328125, 1.75701904296875, 1.8468017578125, 1.93658447265625, 2.0263671875, 2.11614990234375, 2.2059326171875, 2.29571533203125, 2.385498046875, 2.47528076171875, 2.5650634765625, 2.65484619140625, 2.74462890625, 2.83441162109375, 2.9241943359375, 3.01397705078125, 3.103759765625, 3.19354248046875, 3.2833251953125, 3.37310791015625, 3.462890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 10.0, 33.0, 105.0, 238.0, 272.0, 160.0, 85.0, 30.0, 24.0, 9.0, 12.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.11816120147705, -12.63796615600586, -12.157770156860352, -11.67757511138916, -11.197380065917969, -10.717184066772461, -10.23698902130127, -9.756793975830078, -9.27659797668457, -8.796402931213379, -8.316206932067871, -7.83601188659668, -7.35581636428833, -6.8756208419799805, -6.395425796508789, -5.9152302742004395, -5.43503475189209, -4.95483922958374, -4.474643707275391, -3.994448661804199, -3.5142531394958496, -3.0340576171875, -2.5538623332977295, -2.073667049407959, -1.5934715270996094, -1.1132761240005493, -0.6330807209014893, -0.1528853178024292, 0.32731008529663086, 0.8075056076049805, 1.287700891494751, 1.7678961753845215, 2.2480926513671875, 2.728288173675537, 3.2084834575653076, 3.688678741455078, 4.168874263763428, 4.649069786071777, 5.129264831542969, 5.609460353851318, 6.089655876159668, 6.569851398468018, 7.050046920776367, 7.530241966247559, 8.01043701171875, 8.490633010864258, 8.97082805633545, 9.45102310180664, 9.931219100952148, 10.41141414642334, 10.891610145568848, 11.371805191040039, 11.852001190185547, 12.332196235656738, 12.81239128112793, 13.292587280273438, 13.772782325744629, 14.25297737121582, 14.733173370361328, 15.21336841583252, 15.693563461303711, 16.17375946044922, 16.653955459594727, 17.1341495513916, 17.61434555053711]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 5.0, 10.0, 8.0, 14.0, 13.0, 24.0, 17.0, 30.0, 27.0, 26.0, 42.0, 44.0, 50.0, 48.0, 62.0, 59.0, 58.0, 59.0, 53.0, 70.0, 50.0, 47.0, 38.0, 28.0, 24.0, 27.0, 14.0, 16.0, 5.0, 6.0, 3.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.063533782958984, -7.807955265045166, -7.552376747131348, -7.2967987060546875, -7.041220188140869, -6.785641670227051, -6.530063629150391, -6.274485111236572, -6.018906593322754, -5.7633280754089355, -5.507749557495117, -5.252171516418457, -4.996592998504639, -4.74101448059082, -4.48543643951416, -4.229857921600342, -3.9742794036865234, -3.718700885772705, -3.463122606277466, -3.2075443267822266, -2.951965808868408, -2.69638729095459, -2.4408090114593506, -2.1852307319641113, -1.929652214050293, -1.6740738153457642, -1.4184954166412354, -1.1629170179367065, -0.9073386192321777, -0.6517602205276489, -0.3961818218231201, -0.1406034231185913, 0.1149740219116211, 0.3705524206161499, 0.6261308193206787, 0.8817092180252075, 1.1372876167297363, 1.3928660154342651, 1.648444414138794, 1.9040228128433228, 2.1596012115478516, 2.41517972946167, 2.670758008956909, 2.9263362884521484, 3.181914806365967, 3.437493324279785, 3.6930716037750244, 3.9486498832702637, 4.204228401184082, 4.4598069190979, 4.715385437011719, 4.970963478088379, 5.226541996002197, 5.482120513916016, 5.737698554992676, 5.993277072906494, 6.2488555908203125, 6.504434108734131, 6.760012626647949, 7.015590667724609, 7.271169185638428, 7.526747703552246, 7.782325744628906, 8.037904739379883, 8.293482780456543]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 6.0, 20.0, 29.0, 49.0, 60.0, 98.0, 170.0, 331.0, 548.0, 1008.0, 2010.0, 4301.0, 9109.0, 21604.0, 53445.0, 143826.0, 334642.0, 288602.0, 113434.0, 42865.0, 17406.0, 7700.0, 3463.0, 1763.0, 883.0, 485.0, 254.0, 150.0, 82.0, 71.0, 57.0, 19.0, 17.0, 7.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96875, -0.9340057373046875, -0.899261474609375, -0.8645172119140625, -0.82977294921875, -0.7950286865234375, -0.760284423828125, -0.7255401611328125, -0.6907958984375, -0.6560516357421875, -0.621307373046875, -0.5865631103515625, -0.55181884765625, -0.5170745849609375, -0.482330322265625, -0.4475860595703125, -0.412841796875, -0.3780975341796875, -0.343353271484375, -0.3086090087890625, -0.27386474609375, -0.2391204833984375, -0.204376220703125, -0.1696319580078125, -0.1348876953125, -0.1001434326171875, -0.065399169921875, -0.0306549072265625, 0.00408935546875, 0.0388336181640625, 0.073577880859375, 0.1083221435546875, 0.14306640625, 0.1778106689453125, 0.212554931640625, 0.2472991943359375, 0.28204345703125, 0.3167877197265625, 0.351531982421875, 0.3862762451171875, 0.4210205078125, 0.4557647705078125, 0.490509033203125, 0.5252532958984375, 0.55999755859375, 0.5947418212890625, 0.629486083984375, 0.6642303466796875, 0.698974609375, 0.7337188720703125, 0.768463134765625, 0.8032073974609375, 0.83795166015625, 0.8726959228515625, 0.907440185546875, 0.9421844482421875, 0.9769287109375, 1.0116729736328125, 1.046417236328125, 1.0811614990234375, 1.11590576171875, 1.1506500244140625, 1.185394287109375, 1.2201385498046875, 1.2548828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 0.0, 2.0, 4.0, 8.0, 4.0, 15.0, 6.0, 12.0, 13.0, 16.0, 14.0, 15.0, 29.0, 25.0, 36.0, 33.0, 42.0, 48.0, 46.0, 46.0, 40.0, 45.0, 34.0, 48.0, 60.0, 49.0, 56.0, 38.0, 27.0, 33.0, 27.0, 34.0, 17.0, 9.0, 14.0, 17.0, 8.0, 15.0, 2.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6422576904296875, -0.616546630859375, -0.5908355712890625, -0.56512451171875, -0.5394134521484375, -0.513702392578125, -0.4879913330078125, -0.4622802734375, -0.4365692138671875, -0.410858154296875, -0.3851470947265625, -0.35943603515625, -0.3337249755859375, -0.308013916015625, -0.2823028564453125, -0.256591796875, -0.2308807373046875, -0.205169677734375, -0.1794586181640625, -0.15374755859375, -0.1280364990234375, -0.102325439453125, -0.0766143798828125, -0.0509033203125, -0.0251922607421875, 0.000518798828125, 0.0262298583984375, 0.05194091796875, 0.0776519775390625, 0.103363037109375, 0.1290740966796875, 0.15478515625, 0.1804962158203125, 0.206207275390625, 0.2319183349609375, 0.25762939453125, 0.2833404541015625, 0.309051513671875, 0.3347625732421875, 0.3604736328125, 0.3861846923828125, 0.411895751953125, 0.4376068115234375, 0.46331787109375, 0.4890289306640625, 0.514739990234375, 0.5404510498046875, 0.566162109375, 0.5918731689453125, 0.617584228515625, 0.6432952880859375, 0.66900634765625, 0.6947174072265625, 0.720428466796875, 0.7461395263671875, 0.7718505859375, 0.7975616455078125, 0.823272705078125, 0.8489837646484375, 0.87469482421875, 0.9004058837890625, 0.926116943359375, 0.9518280029296875, 0.9775390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 8.0, 12.0, 16.0, 18.0, 24.0, 39.0, 70.0, 95.0, 131.0, 243.0, 399.0, 853.0, 2248.0, 9028.0, 80321.0, 789538.0, 146809.0, 13571.0, 2859.0, 1005.0, 481.0, 273.0, 161.0, 103.0, 60.0, 50.0, 34.0, 26.0, 22.0, 16.0, 9.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.62109375, -3.524810791015625, -3.42852783203125, -3.332244873046875, -3.2359619140625, -3.139678955078125, -3.04339599609375, -2.947113037109375, -2.850830078125, -2.754547119140625, -2.65826416015625, -2.561981201171875, -2.4656982421875, -2.369415283203125, -2.27313232421875, -2.176849365234375, -2.08056640625, -1.984283447265625, -1.88800048828125, -1.791717529296875, -1.6954345703125, -1.599151611328125, -1.50286865234375, -1.406585693359375, -1.310302734375, -1.214019775390625, -1.11773681640625, -1.021453857421875, -0.9251708984375, -0.828887939453125, -0.73260498046875, -0.636322021484375, -0.5400390625, -0.443756103515625, -0.34747314453125, -0.251190185546875, -0.1549072265625, -0.058624267578125, 0.03765869140625, 0.133941650390625, 0.230224609375, 0.326507568359375, 0.42279052734375, 0.519073486328125, 0.6153564453125, 0.711639404296875, 0.80792236328125, 0.904205322265625, 1.00048828125, 1.096771240234375, 1.19305419921875, 1.289337158203125, 1.3856201171875, 1.481903076171875, 1.57818603515625, 1.674468994140625, 1.770751953125, 1.867034912109375, 1.96331787109375, 2.059600830078125, 2.1558837890625, 2.252166748046875, 2.34844970703125, 2.444732666015625, 2.541015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 13.0, 12.0, 16.0, 26.0, 34.0, 54.0, 40.0, 68.0, 53.0, 76.0, 81.0, 93.0, 79.0, 65.0, 51.0, 55.0, 44.0, 43.0, 23.0, 19.0, 15.0, 6.0, 7.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.5625, -6.40203857421875, -6.2415771484375, -6.08111572265625, -5.920654296875, -5.76019287109375, -5.5997314453125, -5.43927001953125, -5.27880859375, -5.11834716796875, -4.9578857421875, -4.79742431640625, -4.636962890625, -4.47650146484375, -4.3160400390625, -4.15557861328125, -3.9951171875, -3.83465576171875, -3.6741943359375, -3.51373291015625, -3.353271484375, -3.19281005859375, -3.0323486328125, -2.87188720703125, -2.71142578125, -2.55096435546875, -2.3905029296875, -2.23004150390625, -2.069580078125, -1.90911865234375, -1.7486572265625, -1.58819580078125, -1.427734375, -1.26727294921875, -1.1068115234375, -0.94635009765625, -0.785888671875, -0.62542724609375, -0.4649658203125, -0.30450439453125, -0.14404296875, 0.01641845703125, 0.1768798828125, 0.33734130859375, 0.497802734375, 0.65826416015625, 0.8187255859375, 0.97918701171875, 1.1396484375, 1.30010986328125, 1.4605712890625, 1.62103271484375, 1.781494140625, 1.94195556640625, 2.1024169921875, 2.26287841796875, 2.42333984375, 2.58380126953125, 2.7442626953125, 2.90472412109375, 3.065185546875, 3.22564697265625, 3.3861083984375, 3.54656982421875, 3.70703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 1.0, 6.0, 17.0, 19.0, 44.0, 62.0, 104.0, 231.0, 492.0, 1541.0, 8684.0, 251693.0, 766552.0, 15680.0, 2248.0, 617.0, 276.0, 119.0, 70.0, 32.0, 24.0, 14.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.064453125, -2.0039520263671875, -1.943450927734375, -1.8829498291015625, -1.82244873046875, -1.7619476318359375, -1.701446533203125, -1.6409454345703125, -1.5804443359375, -1.5199432373046875, -1.459442138671875, -1.3989410400390625, -1.33843994140625, -1.2779388427734375, -1.217437744140625, -1.1569366455078125, -1.096435546875, -1.0359344482421875, -0.975433349609375, -0.9149322509765625, -0.85443115234375, -0.7939300537109375, -0.733428955078125, -0.6729278564453125, -0.6124267578125, -0.5519256591796875, -0.491424560546875, -0.4309234619140625, -0.37042236328125, -0.3099212646484375, -0.249420166015625, -0.1889190673828125, -0.12841796875, -0.0679168701171875, -0.007415771484375, 0.0530853271484375, 0.11358642578125, 0.1740875244140625, 0.234588623046875, 0.2950897216796875, 0.3555908203125, 0.4160919189453125, 0.476593017578125, 0.5370941162109375, 0.59759521484375, 0.6580963134765625, 0.718597412109375, 0.7790985107421875, 0.839599609375, 0.9001007080078125, 0.960601806640625, 1.0211029052734375, 1.08160400390625, 1.1421051025390625, 1.202606201171875, 1.2631072998046875, 1.3236083984375, 1.3841094970703125, 1.444610595703125, 1.5051116943359375, 1.56561279296875, 1.6261138916015625, 1.686614990234375, 1.7471160888671875, 1.8076171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 31.0, 70.0, 133.0, 208.0, 244.0, 140.0, 64.0, 47.0, 21.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033402442932128906, -0.00032171234488487244, -0.0003094002604484558, -0.0002970881760120392, -0.00028477609157562256, -0.00027246400713920593, -0.0002601519227027893, -0.0002478398382663727, -0.00023552775382995605, -0.00022321566939353943, -0.0002109035849571228, -0.00019859150052070618, -0.00018627941608428955, -0.00017396733164787292, -0.0001616552472114563, -0.00014934316277503967, -0.00013703107833862305, -0.00012471899390220642, -0.0001124069094657898, -0.00010009482502937317, -8.778274059295654e-05, -7.547065615653992e-05, -6.315857172012329e-05, -5.0846487283706665e-05, -3.853440284729004e-05, -2.6222318410873413e-05, -1.3910233974456787e-05, -1.5981495380401611e-06, 1.0713934898376465e-05, 2.302601933479309e-05, 3.533810377120972e-05, 4.765018820762634e-05, 5.996227264404297e-05, 7.22743570804596e-05, 8.458644151687622e-05, 9.689852595329285e-05, 0.00010921061038970947, 0.0001215226948261261, 0.00013383477926254272, 0.00014614686369895935, 0.00015845894813537598, 0.0001707710325717926, 0.00018308311700820923, 0.00019539520144462585, 0.00020770728588104248, 0.0002200193703174591, 0.00023233145475387573, 0.00024464353919029236, 0.000256955623626709, 0.0002692677080631256, 0.00028157979249954224, 0.00029389187693595886, 0.0003062039613723755, 0.0003185160458087921, 0.00033082813024520874, 0.00034314021468162537, 0.000355452299118042, 0.0003677643835544586, 0.00038007646799087524, 0.00039238855242729187, 0.0004047006368637085, 0.0004170127213001251, 0.00042932480573654175, 0.0004416368901729584, 0.000453948974609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 13.0, 11.0, 17.0, 28.0, 27.0, 42.0, 79.0, 118.0, 161.0, 265.0, 513.0, 1096.0, 2633.0, 9249.0, 52057.0, 595036.0, 341491.0, 34315.0, 6984.0, 2249.0, 931.0, 454.0, 258.0, 148.0, 94.0, 73.0, 40.0, 41.0, 27.0, 15.0, 12.0, 13.0, 9.0, 9.0, 9.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.95849609375, -0.9310302734375, -0.903564453125, -0.8760986328125, -0.8486328125, -0.8211669921875, -0.793701171875, -0.7662353515625, -0.73876953125, -0.7113037109375, -0.683837890625, -0.6563720703125, -0.62890625, -0.6014404296875, -0.573974609375, -0.5465087890625, -0.51904296875, -0.4915771484375, -0.464111328125, -0.4366455078125, -0.4091796875, -0.3817138671875, -0.354248046875, -0.3267822265625, -0.29931640625, -0.2718505859375, -0.244384765625, -0.2169189453125, -0.189453125, -0.1619873046875, -0.134521484375, -0.1070556640625, -0.07958984375, -0.0521240234375, -0.024658203125, 0.0028076171875, 0.0302734375, 0.0577392578125, 0.085205078125, 0.1126708984375, 0.14013671875, 0.1676025390625, 0.195068359375, 0.2225341796875, 0.25, 0.2774658203125, 0.304931640625, 0.3323974609375, 0.35986328125, 0.3873291015625, 0.414794921875, 0.4422607421875, 0.4697265625, 0.4971923828125, 0.524658203125, 0.5521240234375, 0.57958984375, 0.6070556640625, 0.634521484375, 0.6619873046875, 0.689453125, 0.7169189453125, 0.744384765625, 0.7718505859375, 0.79931640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 4.0, 8.0, 15.0, 12.0, 17.0, 29.0, 41.0, 46.0, 57.0, 64.0, 82.0, 72.0, 87.0, 86.0, 68.0, 56.0, 54.0, 44.0, 38.0, 28.0, 20.0, 8.0, 13.0, 13.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.738555908203125, -0.71148681640625, -0.684417724609375, -0.6573486328125, -0.630279541015625, -0.60321044921875, -0.576141357421875, -0.549072265625, -0.522003173828125, -0.49493408203125, -0.467864990234375, -0.4407958984375, -0.413726806640625, -0.38665771484375, -0.359588623046875, -0.33251953125, -0.305450439453125, -0.27838134765625, -0.251312255859375, -0.2242431640625, -0.197174072265625, -0.17010498046875, -0.143035888671875, -0.115966796875, -0.088897705078125, -0.06182861328125, -0.034759521484375, -0.0076904296875, 0.019378662109375, 0.04644775390625, 0.073516845703125, 0.1005859375, 0.127655029296875, 0.15472412109375, 0.181793212890625, 0.2088623046875, 0.235931396484375, 0.26300048828125, 0.290069580078125, 0.317138671875, 0.344207763671875, 0.37127685546875, 0.398345947265625, 0.4254150390625, 0.452484130859375, 0.47955322265625, 0.506622314453125, 0.53369140625, 0.560760498046875, 0.58782958984375, 0.614898681640625, 0.6419677734375, 0.669036865234375, 0.69610595703125, 0.723175048828125, 0.750244140625, 0.777313232421875, 0.80438232421875, 0.831451416015625, 0.8585205078125, 0.885589599609375, 0.91265869140625, 0.939727783203125, 0.966796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 25.0, 71.0, 310.0, 467.0, 104.0, 9.0, 11.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.674224853515625, -58.15066909790039, -56.62711715698242, -55.10356140136719, -53.58000946044922, -52.056453704833984, -50.53289794921875, -49.00934600830078, -47.48579025268555, -45.96223449707031, -44.438682556152344, -42.91512680053711, -41.391571044921875, -39.868019104003906, -38.34446334838867, -36.82090759277344, -35.29735565185547, -33.773799896240234, -32.250247955322266, -30.72669219970703, -29.20313835144043, -27.679584503173828, -26.156028747558594, -24.632474899291992, -23.10892105102539, -21.58536720275879, -20.061813354492188, -18.538257598876953, -17.01470375061035, -15.49114990234375, -13.967595100402832, -12.444040298461914, -10.920482635498047, -9.396928787231445, -7.873373985290527, -6.349819660186768, -4.826265335083008, -3.302711009979248, -1.7791566848754883, -0.2556018829345703, 1.2679519653320312, 2.791506290435791, 4.315060615539551, 5.8386149406433105, 7.36216926574707, 8.885723114013672, 10.40927791595459, 11.932832717895508, 13.45638656616211, 14.979940414428711, 16.503494262695312, 18.027050018310547, 19.55060386657715, 21.07415771484375, 22.597713470458984, 24.121267318725586, 25.644821166992188, 27.16837501525879, 28.69192886352539, 30.215484619140625, 31.739038467407227, 33.26259231567383, 34.78614807128906, 36.30970001220703, 37.833255767822266]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 5.0, 12.0, 13.0, 14.0, 20.0, 20.0, 29.0, 29.0, 37.0, 49.0, 65.0, 55.0, 65.0, 66.0, 76.0, 65.0, 60.0, 44.0, 34.0, 46.0, 31.0, 30.0, 29.0, 20.0, 15.0, 10.0, 18.0, 15.0, 4.0, 3.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.69677734375, -13.10966682434082, -12.522557258605957, -11.935446739196777, -11.348337173461914, -10.761226654052734, -10.174116134643555, -9.587005615234375, -8.999896049499512, -8.412785530090332, -7.825675964355469, -7.238565444946289, -6.651455402374268, -6.064345359802246, -5.477234840393066, -4.890124797821045, -4.303014755249023, -3.715904712677002, -3.1287944316864014, -2.541684150695801, -1.9545741081237793, -1.3674640655517578, -0.7803537845611572, -0.19324350357055664, 0.39386653900146484, 0.9809767007827759, 1.568086862564087, 2.1551971435546875, 2.742307186126709, 3.3294172286987305, 3.916527509689331, 4.503637790679932, 5.090749740600586, 5.677859783172607, 6.264969825744629, 6.852080345153809, 7.43919038772583, 8.026300430297852, 8.613410949707031, 9.200521469116211, 9.787631034851074, 10.374741554260254, 10.961851119995117, 11.548961639404297, 12.136072158813477, 12.72318172454834, 13.31029224395752, 13.897401809692383, 14.484512329101562, 15.071622848510742, 15.658732414245605, 16.24584197998047, 16.83295249938965, 17.420063018798828, 18.007173538208008, 18.594284057617188, 19.181392669677734, 19.768503189086914, 20.355613708496094, 20.94272232055664, 21.52983283996582, 22.116943359375, 22.70405387878418, 23.29116439819336, 23.87827491760254]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 12.0, 7.0, 19.0, 43.0, 74.0, 84.0, 154.0, 288.0, 501.0, 992.0, 2029.0, 4975.0, 14202.0, 50340.0, 423179.0, 2995062.0, 617424.0, 61539.0, 13585.0, 4993.0, 2175.0, 1099.0, 600.0, 366.0, 185.0, 102.0, 87.0, 53.0, 29.0, 20.0, 16.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7802734375, -0.747161865234375, -0.71405029296875, -0.680938720703125, -0.6478271484375, -0.614715576171875, -0.58160400390625, -0.548492431640625, -0.515380859375, -0.482269287109375, -0.44915771484375, -0.416046142578125, -0.3829345703125, -0.349822998046875, -0.31671142578125, -0.283599853515625, -0.25048828125, -0.217376708984375, -0.18426513671875, -0.151153564453125, -0.1180419921875, -0.084930419921875, -0.05181884765625, -0.018707275390625, 0.014404296875, 0.047515869140625, 0.08062744140625, 0.113739013671875, 0.1468505859375, 0.179962158203125, 0.21307373046875, 0.246185302734375, 0.279296875, 0.312408447265625, 0.34552001953125, 0.378631591796875, 0.4117431640625, 0.444854736328125, 0.47796630859375, 0.511077880859375, 0.544189453125, 0.577301025390625, 0.61041259765625, 0.643524169921875, 0.6766357421875, 0.709747314453125, 0.74285888671875, 0.775970458984375, 0.80908203125, 0.842193603515625, 0.87530517578125, 0.908416748046875, 0.9415283203125, 0.974639892578125, 1.00775146484375, 1.040863037109375, 1.073974609375, 1.107086181640625, 1.14019775390625, 1.173309326171875, 1.2064208984375, 1.239532470703125, 1.27264404296875, 1.305755615234375, 1.3388671875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 3.0, 9.0, 4.0, 8.0, 12.0, 10.0, 14.0, 15.0, 17.0, 18.0, 30.0, 24.0, 28.0, 41.0, 48.0, 41.0, 49.0, 63.0, 57.0, 68.0, 41.0, 64.0, 54.0, 53.0, 40.0, 39.0, 35.0, 31.0, 18.0, 19.0, 14.0, 6.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.60888671875, -0.5812759399414062, -0.5536651611328125, -0.5260543823242188, -0.498443603515625, -0.47083282470703125, -0.4432220458984375, -0.41561126708984375, -0.38800048828125, -0.36038970947265625, -0.3327789306640625, -0.30516815185546875, -0.277557373046875, -0.24994659423828125, -0.2223358154296875, -0.19472503662109375, -0.1671142578125, -0.13950347900390625, -0.1118927001953125, -0.08428192138671875, -0.056671142578125, -0.02906036376953125, -0.0014495849609375, 0.02616119384765625, 0.05377197265625, 0.08138275146484375, 0.1089935302734375, 0.13660430908203125, 0.164215087890625, 0.19182586669921875, 0.2194366455078125, 0.24704742431640625, 0.274658203125, 0.30226898193359375, 0.3298797607421875, 0.35749053955078125, 0.385101318359375, 0.41271209716796875, 0.4403228759765625, 0.46793365478515625, 0.49554443359375, 0.5231552124023438, 0.5507659912109375, 0.5783767700195312, 0.605987548828125, 0.6335983276367188, 0.6612091064453125, 0.6888198852539062, 0.7164306640625, 0.7440414428710938, 0.7716522216796875, 0.7992630004882812, 0.826873779296875, 0.8544845581054688, 0.8820953369140625, 0.9097061157226562, 0.93731689453125, 0.9649276733398438, 0.9925384521484375, 1.0201492309570312, 1.047760009765625, 1.0753707885742188, 1.1029815673828125, 1.1305923461914062, 1.158203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 11.0, 22.0, 35.0, 43.0, 57.0, 124.0, 237.0, 514.0, 1250.0, 5052.0, 31882.0, 948313.0, 3146846.0, 49956.0, 7245.0, 1637.0, 533.0, 212.0, 107.0, 45.0, 35.0, 34.0, 25.0, 16.0, 10.0, 12.0, 8.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7578125, -2.687286376953125, -2.61676025390625, -2.546234130859375, -2.4757080078125, -2.405181884765625, -2.33465576171875, -2.264129638671875, -2.193603515625, -2.123077392578125, -2.05255126953125, -1.982025146484375, -1.9114990234375, -1.840972900390625, -1.77044677734375, -1.699920654296875, -1.62939453125, -1.558868408203125, -1.48834228515625, -1.417816162109375, -1.3472900390625, -1.276763916015625, -1.20623779296875, -1.135711669921875, -1.065185546875, -0.994659423828125, -0.92413330078125, -0.853607177734375, -0.7830810546875, -0.712554931640625, -0.64202880859375, -0.571502685546875, -0.5009765625, -0.430450439453125, -0.35992431640625, -0.289398193359375, -0.2188720703125, -0.148345947265625, -0.07781982421875, -0.007293701171875, 0.063232421875, 0.133758544921875, 0.20428466796875, 0.274810791015625, 0.3453369140625, 0.415863037109375, 0.48638916015625, 0.556915283203125, 0.62744140625, 0.697967529296875, 0.76849365234375, 0.839019775390625, 0.9095458984375, 0.980072021484375, 1.05059814453125, 1.121124267578125, 1.191650390625, 1.262176513671875, 1.33270263671875, 1.403228759765625, 1.4737548828125, 1.544281005859375, 1.61480712890625, 1.685333251953125, 1.755859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 6.0, 10.0, 4.0, 8.0, 12.0, 15.0, 27.0, 27.0, 36.0, 59.0, 101.0, 157.0, 317.0, 712.0, 1028.0, 753.0, 350.0, 157.0, 88.0, 44.0, 43.0, 18.0, 18.0, 13.0, 11.0, 15.0, 8.0, 6.0, 5.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.16796875, -2.1130828857421875, -2.058197021484375, -2.0033111572265625, -1.94842529296875, -1.8935394287109375, -1.838653564453125, -1.7837677001953125, -1.7288818359375, -1.6739959716796875, -1.619110107421875, -1.5642242431640625, -1.50933837890625, -1.4544525146484375, -1.399566650390625, -1.3446807861328125, -1.289794921875, -1.2349090576171875, -1.180023193359375, -1.1251373291015625, -1.07025146484375, -1.0153656005859375, -0.960479736328125, -0.9055938720703125, -0.8507080078125, -0.7958221435546875, -0.740936279296875, -0.6860504150390625, -0.63116455078125, -0.5762786865234375, -0.521392822265625, -0.4665069580078125, -0.41162109375, -0.3567352294921875, -0.301849365234375, -0.2469635009765625, -0.19207763671875, -0.1371917724609375, -0.082305908203125, -0.0274200439453125, 0.0274658203125, 0.0823516845703125, 0.137237548828125, 0.1921234130859375, 0.24700927734375, 0.3018951416015625, 0.356781005859375, 0.4116668701171875, 0.466552734375, 0.5214385986328125, 0.576324462890625, 0.6312103271484375, 0.68609619140625, 0.7409820556640625, 0.795867919921875, 0.8507537841796875, 0.9056396484375, 0.9605255126953125, 1.015411376953125, 1.0702972412109375, 1.12518310546875, 1.1800689697265625, 1.234954833984375, 1.2898406982421875, 1.3447265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 16.0, 56.0, 116.0, 241.0, 269.0, 175.0, 63.0, 18.0, 12.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4849853515625, -19.87091636657715, -19.256847381591797, -18.642778396606445, -18.028709411621094, -17.414640426635742, -16.80057144165039, -16.18650245666504, -15.572433471679688, -14.958364486694336, -14.344295501708984, -13.730226516723633, -13.116157531738281, -12.50208854675293, -11.888019561767578, -11.273950576782227, -10.659881591796875, -10.045812606811523, -9.431743621826172, -8.81767463684082, -8.203605651855469, -7.589536666870117, -6.975467681884766, -6.361398696899414, -5.7473297119140625, -5.133260726928711, -4.519191741943359, -3.905122756958008, -3.2910537719726562, -2.6769847869873047, -2.062915802001953, -1.4488468170166016, -0.8347797393798828, -0.22071075439453125, 0.3933582305908203, 1.0074272155761719, 1.6214962005615234, 2.235565185546875, 2.8496341705322266, 3.463703155517578, 4.07777214050293, 4.691841125488281, 5.305910110473633, 5.919979095458984, 6.534048080444336, 7.1481170654296875, 7.762186050415039, 8.37625503540039, 8.990324020385742, 9.604393005371094, 10.218461990356445, 10.832530975341797, 11.446599960327148, 12.0606689453125, 12.674737930297852, 13.288806915283203, 13.902875900268555, 14.516944885253906, 15.131013870239258, 15.74508285522461, 16.35915184020996, 16.973220825195312, 17.587289810180664, 18.201358795166016, 18.815427780151367]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 19.0, 11.0, 5.0, 19.0, 14.0, 24.0, 23.0, 23.0, 22.0, 31.0, 40.0, 39.0, 37.0, 61.0, 47.0, 59.0, 46.0, 47.0, 58.0, 47.0, 65.0, 40.0, 43.0, 31.0, 28.0, 20.0, 22.0, 14.0, 15.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.67354965209961, -8.42505931854248, -8.176568031311035, -7.928077220916748, -7.679586410522461, -7.431096076965332, -7.182604789733887, -6.934114456176758, -6.685623645782471, -6.437132835388184, -6.1886420249938965, -5.940151214599609, -5.691660404205322, -5.443169593811035, -5.194679260253906, -4.946188449859619, -4.697697639465332, -4.449206829071045, -4.200716018676758, -3.9522252082824707, -3.7037346363067627, -3.4552438259124756, -3.2067530155181885, -2.9582624435424805, -2.709771156311035, -2.461280345916748, -2.212789535522461, -1.9642988443374634, -1.7158081531524658, -1.4673173427581787, -1.2188265323638916, -0.970335841178894, -0.7218451499938965, -0.47335439920425415, -0.22486361861228943, 0.023627161979675293, 0.2721179127693176, 0.52060866355896, 0.7690994739532471, 1.0175901651382446, 1.2660809755325317, 1.5145717859268188, 1.7630624771118164, 2.0115532875061035, 2.2600440979003906, 2.5085349082946777, 2.757025718688965, 3.005516290664673, 3.25400710105896, 3.502497911453247, 3.750988721847534, 3.999479293823242, 4.247970104217529, 4.496460914611816, 4.7449517250061035, 4.993442535400391, 5.241933345794678, 5.490424156188965, 5.738914966583252, 5.987405776977539, 6.235896587371826, 6.484387397766113, 6.732877731323242, 6.981368541717529, 7.229859352111816]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 20.0, 26.0, 40.0, 62.0, 86.0, 160.0, 266.0, 414.0, 659.0, 1326.0, 2510.0, 5295.0, 11824.0, 29277.0, 75233.0, 192931.0, 340281.0, 231265.0, 93445.0, 36044.0, 14661.0, 6303.0, 2845.0, 1547.0, 811.0, 493.0, 276.0, 169.0, 89.0, 59.0, 44.0, 26.0, 27.0, 8.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8629074096679688, -0.8327484130859375, -0.8025894165039062, -0.772430419921875, -0.7422714233398438, -0.7121124267578125, -0.6819534301757812, -0.65179443359375, -0.6216354370117188, -0.5914764404296875, -0.5613174438476562, -0.531158447265625, -0.5009994506835938, -0.4708404541015625, -0.44068145751953125, -0.4105224609375, -0.38036346435546875, -0.3502044677734375, -0.32004547119140625, -0.289886474609375, -0.25972747802734375, -0.2295684814453125, -0.19940948486328125, -0.16925048828125, -0.13909149169921875, -0.1089324951171875, -0.07877349853515625, -0.048614501953125, -0.01845550537109375, 0.0117034912109375, 0.04186248779296875, 0.072021484375, 0.10218048095703125, 0.1323394775390625, 0.16249847412109375, 0.192657470703125, 0.22281646728515625, 0.2529754638671875, 0.28313446044921875, 0.31329345703125, 0.34345245361328125, 0.3736114501953125, 0.40377044677734375, 0.433929443359375, 0.46408843994140625, 0.4942474365234375, 0.5244064331054688, 0.5545654296875, 0.5847244262695312, 0.6148834228515625, 0.6450424194335938, 0.675201416015625, 0.7053604125976562, 0.7355194091796875, 0.7656784057617188, 0.79583740234375, 0.8259963989257812, 0.8561553955078125, 0.8863143920898438, 0.916473388671875, 0.9466323852539062, 0.9767913818359375, 1.0069503784179688, 1.037109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 11.0, 4.0, 9.0, 6.0, 15.0, 17.0, 15.0, 20.0, 31.0, 23.0, 38.0, 27.0, 41.0, 62.0, 58.0, 60.0, 54.0, 51.0, 63.0, 57.0, 66.0, 40.0, 43.0, 41.0, 33.0, 25.0, 26.0, 17.0, 17.0, 10.0, 9.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68359375, -0.65625, -0.62890625, -0.6015625, -0.57421875, -0.546875, -0.51953125, -0.4921875, -0.46484375, -0.4375, -0.41015625, -0.3828125, -0.35546875, -0.328125, -0.30078125, -0.2734375, -0.24609375, -0.21875, -0.19140625, -0.1640625, -0.13671875, -0.109375, -0.08203125, -0.0546875, -0.02734375, 0.0, 0.02734375, 0.0546875, 0.08203125, 0.109375, 0.13671875, 0.1640625, 0.19140625, 0.21875, 0.24609375, 0.2734375, 0.30078125, 0.328125, 0.35546875, 0.3828125, 0.41015625, 0.4375, 0.46484375, 0.4921875, 0.51953125, 0.546875, 0.57421875, 0.6015625, 0.62890625, 0.65625, 0.68359375, 0.7109375, 0.73828125, 0.765625, 0.79296875, 0.8203125, 0.84765625, 0.875, 0.90234375, 0.9296875, 0.95703125, 0.984375, 1.01171875, 1.0390625, 1.06640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 0.0, 4.0, 6.0, 11.0, 7.0, 11.0, 24.0, 17.0, 28.0, 46.0, 40.0, 52.0, 63.0, 87.0, 132.0, 159.0, 183.0, 278.0, 398.0, 608.0, 904.0, 1759.0, 4255.0, 15313.0, 91048.0, 660537.0, 228063.0, 31364.0, 7044.0, 2453.0, 1149.0, 703.0, 454.0, 335.0, 237.0, 179.0, 147.0, 93.0, 85.0, 58.0, 40.0, 39.0, 33.0, 28.0, 22.0, 18.0, 10.0, 12.0, 4.0, 4.0, 4.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-1.978515625, -1.9180450439453125, -1.857574462890625, -1.7971038818359375, -1.73663330078125, -1.6761627197265625, -1.615692138671875, -1.5552215576171875, -1.4947509765625, -1.4342803955078125, -1.373809814453125, -1.3133392333984375, -1.25286865234375, -1.1923980712890625, -1.131927490234375, -1.0714569091796875, -1.010986328125, -0.9505157470703125, -0.890045166015625, -0.8295745849609375, -0.76910400390625, -0.7086334228515625, -0.648162841796875, -0.5876922607421875, -0.5272216796875, -0.4667510986328125, -0.406280517578125, -0.3458099365234375, -0.28533935546875, -0.2248687744140625, -0.164398193359375, -0.1039276123046875, -0.04345703125, 0.0170135498046875, 0.077484130859375, 0.1379547119140625, 0.19842529296875, 0.2588958740234375, 0.319366455078125, 0.3798370361328125, 0.4403076171875, 0.5007781982421875, 0.561248779296875, 0.6217193603515625, 0.68218994140625, 0.7426605224609375, 0.803131103515625, 0.8636016845703125, 0.924072265625, 0.9845428466796875, 1.045013427734375, 1.1054840087890625, 1.16595458984375, 1.2264251708984375, 1.286895751953125, 1.3473663330078125, 1.4078369140625, 1.4683074951171875, 1.528778076171875, 1.5892486572265625, 1.64971923828125, 1.7101898193359375, 1.770660400390625, 1.8311309814453125, 1.8916015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 9.0, 5.0, 8.0, 4.0, 8.0, 12.0, 11.0, 6.0, 19.0, 15.0, 21.0, 23.0, 27.0, 26.0, 51.0, 44.0, 36.0, 41.0, 47.0, 51.0, 61.0, 46.0, 34.0, 44.0, 49.0, 36.0, 43.0, 33.0, 27.0, 25.0, 26.0, 23.0, 12.0, 15.0, 9.0, 18.0, 4.0, 7.0, 12.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.83203125, -2.734161376953125, -2.63629150390625, -2.538421630859375, -2.4405517578125, -2.342681884765625, -2.24481201171875, -2.146942138671875, -2.049072265625, -1.951202392578125, -1.85333251953125, -1.755462646484375, -1.6575927734375, -1.559722900390625, -1.46185302734375, -1.363983154296875, -1.26611328125, -1.168243408203125, -1.07037353515625, -0.972503662109375, -0.8746337890625, -0.776763916015625, -0.67889404296875, -0.581024169921875, -0.483154296875, -0.385284423828125, -0.28741455078125, -0.189544677734375, -0.0916748046875, 0.006195068359375, 0.10406494140625, 0.201934814453125, 0.2998046875, 0.397674560546875, 0.49554443359375, 0.593414306640625, 0.6912841796875, 0.789154052734375, 0.88702392578125, 0.984893798828125, 1.082763671875, 1.180633544921875, 1.27850341796875, 1.376373291015625, 1.4742431640625, 1.572113037109375, 1.66998291015625, 1.767852783203125, 1.86572265625, 1.963592529296875, 2.06146240234375, 2.159332275390625, 2.2572021484375, 2.355072021484375, 2.45294189453125, 2.550811767578125, 2.648681640625, 2.746551513671875, 2.84442138671875, 2.942291259765625, 3.0401611328125, 3.138031005859375, 3.23590087890625, 3.333770751953125, 3.431640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 17.0, 24.0, 29.0, 53.0, 70.0, 151.0, 365.0, 1019.0, 4580.0, 48778.0, 956226.0, 31871.0, 3793.0, 870.0, 302.0, 155.0, 68.0, 52.0, 36.0, 11.0, 16.0, 14.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.46484375, -1.416717529296875, -1.36859130859375, -1.320465087890625, -1.2723388671875, -1.224212646484375, -1.17608642578125, -1.127960205078125, -1.079833984375, -1.031707763671875, -0.98358154296875, -0.935455322265625, -0.8873291015625, -0.839202880859375, -0.79107666015625, -0.742950439453125, -0.69482421875, -0.646697998046875, -0.59857177734375, -0.550445556640625, -0.5023193359375, -0.454193115234375, -0.40606689453125, -0.357940673828125, -0.309814453125, -0.261688232421875, -0.21356201171875, -0.165435791015625, -0.1173095703125, -0.069183349609375, -0.02105712890625, 0.027069091796875, 0.0751953125, 0.123321533203125, 0.17144775390625, 0.219573974609375, 0.2677001953125, 0.315826416015625, 0.36395263671875, 0.412078857421875, 0.460205078125, 0.508331298828125, 0.55645751953125, 0.604583740234375, 0.6527099609375, 0.700836181640625, 0.74896240234375, 0.797088623046875, 0.84521484375, 0.893341064453125, 0.94146728515625, 0.989593505859375, 1.0377197265625, 1.085845947265625, 1.13397216796875, 1.182098388671875, 1.230224609375, 1.278350830078125, 1.32647705078125, 1.374603271484375, 1.4227294921875, 1.470855712890625, 1.51898193359375, 1.567108154296875, 1.615234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 5.0, 7.0, 23.0, 20.0, 36.0, 56.0, 109.0, 158.0, 200.0, 124.0, 88.0, 63.0, 30.0, 22.0, 10.0, 8.0, 9.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024127960205078125, -0.00023337453603744507, -0.0002254694700241089, -0.0002175644040107727, -0.00020965933799743652, -0.00020175427198410034, -0.00019384920597076416, -0.00018594413995742798, -0.0001780390739440918, -0.00017013400793075562, -0.00016222894191741943, -0.00015432387590408325, -0.00014641880989074707, -0.0001385137438774109, -0.0001306086778640747, -0.00012270361185073853, -0.00011479854583740234, -0.00010689347982406616, -9.898841381072998e-05, -9.10833477973938e-05, -8.317828178405762e-05, -7.527321577072144e-05, -6.736814975738525e-05, -5.946308374404907e-05, -5.155801773071289e-05, -4.365295171737671e-05, -3.574788570404053e-05, -2.7842819690704346e-05, -1.9937753677368164e-05, -1.2032687664031982e-05, -4.127621650695801e-06, 3.777444362640381e-06, 1.1682510375976562e-05, 1.9587576389312744e-05, 2.7492642402648926e-05, 3.539770841598511e-05, 4.330277442932129e-05, 5.120784044265747e-05, 5.911290645599365e-05, 6.701797246932983e-05, 7.492303848266602e-05, 8.28281044960022e-05, 9.073317050933838e-05, 9.863823652267456e-05, 0.00010654330253601074, 0.00011444836854934692, 0.0001223534345626831, 0.0001302585005760193, 0.00013816356658935547, 0.00014606863260269165, 0.00015397369861602783, 0.00016187876462936401, 0.0001697838306427002, 0.00017768889665603638, 0.00018559396266937256, 0.00019349902868270874, 0.00020140409469604492, 0.0002093091607093811, 0.00021721422672271729, 0.00022511929273605347, 0.00023302435874938965, 0.00024092942476272583, 0.000248834490776062, 0.0002567395567893982, 0.0002646446228027344]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 14.0, 21.0, 23.0, 43.0, 60.0, 83.0, 138.0, 339.0, 906.0, 3032.0, 17444.0, 789835.0, 222703.0, 10377.0, 2173.0, 684.0, 299.0, 121.0, 75.0, 51.0, 24.0, 24.0, 16.0, 14.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3416900634765625, -1.299591064453125, -1.2574920654296875, -1.21539306640625, -1.1732940673828125, -1.131195068359375, -1.0890960693359375, -1.0469970703125, -1.0048980712890625, -0.962799072265625, -0.9207000732421875, -0.87860107421875, -0.8365020751953125, -0.794403076171875, -0.7523040771484375, -0.710205078125, -0.6681060791015625, -0.626007080078125, -0.5839080810546875, -0.54180908203125, -0.4997100830078125, -0.457611083984375, -0.4155120849609375, -0.3734130859375, -0.3313140869140625, -0.289215087890625, -0.2471160888671875, -0.20501708984375, -0.1629180908203125, -0.120819091796875, -0.0787200927734375, -0.03662109375, 0.0054779052734375, 0.047576904296875, 0.0896759033203125, 0.13177490234375, 0.1738739013671875, 0.215972900390625, 0.2580718994140625, 0.3001708984375, 0.3422698974609375, 0.384368896484375, 0.4264678955078125, 0.46856689453125, 0.5106658935546875, 0.552764892578125, 0.5948638916015625, 0.636962890625, 0.6790618896484375, 0.721160888671875, 0.7632598876953125, 0.80535888671875, 0.8474578857421875, 0.889556884765625, 0.9316558837890625, 0.9737548828125, 1.0158538818359375, 1.057952880859375, 1.1000518798828125, 1.14215087890625, 1.1842498779296875, 1.226348876953125, 1.2684478759765625, 1.310546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 8.0, 8.0, 9.0, 16.0, 19.0, 19.0, 26.0, 40.0, 49.0, 61.0, 76.0, 94.0, 131.0, 90.0, 83.0, 59.0, 53.0, 38.0, 29.0, 15.0, 17.0, 11.0, 11.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7275390625, -0.705535888671875, -0.68353271484375, -0.661529541015625, -0.6395263671875, -0.617523193359375, -0.59552001953125, -0.573516845703125, -0.551513671875, -0.529510498046875, -0.50750732421875, -0.485504150390625, -0.4635009765625, -0.441497802734375, -0.41949462890625, -0.397491455078125, -0.37548828125, -0.353485107421875, -0.33148193359375, -0.309478759765625, -0.2874755859375, -0.265472412109375, -0.24346923828125, -0.221466064453125, -0.199462890625, -0.177459716796875, -0.15545654296875, -0.133453369140625, -0.1114501953125, -0.089447021484375, -0.06744384765625, -0.045440673828125, -0.0234375, -0.001434326171875, 0.02056884765625, 0.042572021484375, 0.0645751953125, 0.086578369140625, 0.10858154296875, 0.130584716796875, 0.152587890625, 0.174591064453125, 0.19659423828125, 0.218597412109375, 0.2406005859375, 0.262603759765625, 0.28460693359375, 0.306610107421875, 0.32861328125, 0.350616455078125, 0.37261962890625, 0.394622802734375, 0.4166259765625, 0.438629150390625, 0.46063232421875, 0.482635498046875, 0.504638671875, 0.526641845703125, 0.54864501953125, 0.570648193359375, 0.5926513671875, 0.614654541015625, 0.63665771484375, 0.658660888671875, 0.6806640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 13.0, 9.0, 40.0, 83.0, 142.0, 272.0, 244.0, 95.0, 55.0, 23.0, 12.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.1849308013916, -23.5288028717041, -22.8726749420166, -22.216548919677734, -21.560420989990234, -20.904293060302734, -20.248165130615234, -19.592037200927734, -18.935909271240234, -18.279781341552734, -17.623653411865234, -16.967527389526367, -16.311399459838867, -15.655271530151367, -14.999143600463867, -14.343015670776367, -13.6868896484375, -13.03076171875, -12.374634742736816, -11.718506813049316, -11.062379837036133, -10.406251907348633, -9.750123977661133, -9.093996047973633, -8.43786907196045, -7.781741619110107, -7.125614166259766, -6.469486236572266, -5.813358783721924, -5.157231330871582, -4.501103401184082, -3.8449759483337402, -3.1888465881347656, -2.532719135284424, -1.876591444015503, -1.2204638719558716, -0.5643362998962402, 0.09179115295410156, 0.7479188442230225, 1.4040465354919434, 2.060173988342285, 2.716301441192627, 3.372429132461548, 4.028556823730469, 4.6846842765808105, 5.340811729431152, 5.996939659118652, 6.653067111968994, 7.309194564819336, 7.965322017669678, 8.62144947052002, 9.27757740020752, 9.933704376220703, 10.589832305908203, 11.245960235595703, 11.902088165283203, 12.558215141296387, 13.214343070983887, 13.87047004699707, 14.52659797668457, 15.18272590637207, 15.838852882385254, 16.494979858398438, 17.151107788085938, 17.807235717773438]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 11.0, 22.0, 13.0, 14.0, 21.0, 22.0, 22.0, 20.0, 28.0, 34.0, 19.0, 35.0, 57.0, 55.0, 57.0, 75.0, 77.0, 51.0, 35.0, 38.0, 43.0, 36.0, 24.0, 32.0, 27.0, 16.0, 14.0, 17.0, 17.0, 13.0, 9.0, 12.0, 4.0, 6.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0], "bins": [-16.52168083190918, -16.101119995117188, -15.680558204650879, -15.259997367858887, -14.839435577392578, -14.418874740600586, -13.998313903808594, -13.577753067016602, -13.157191276550293, -12.7366304397583, -12.316068649291992, -11.8955078125, -11.474946975708008, -11.0543851852417, -10.633824348449707, -10.213262557983398, -9.792701721191406, -9.372140884399414, -8.951579093933105, -8.531018257141113, -8.110456466674805, -7.6898956298828125, -7.26933479309082, -6.84877347946167, -6.4282121658325195, -6.007650852203369, -5.587089538574219, -5.166528701782227, -4.745967388153076, -4.325406074523926, -3.9048449993133545, -3.484283924102783, -3.0637216567993164, -2.643160343170166, -2.2225992679595947, -1.8020380735397339, -1.381476879119873, -0.9609155654907227, -0.5403544902801514, -0.11979341506958008, 0.3007678985595703, 0.7213290929794312, 1.141890287399292, 1.5624514818191528, 1.9830126762390137, 2.403573989868164, 2.8241350650787354, 3.2446961402893066, 3.665257453918457, 4.085818767547607, 4.506380081176758, 4.92694091796875, 5.3475022315979, 5.768063545227051, 6.188624382019043, 6.609185695648193, 7.029747009277344, 7.450308322906494, 7.8708696365356445, 8.291430473327637, 8.711992263793945, 9.132553100585938, 9.55311393737793, 9.973674774169922, 10.39423656463623]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 11.0, 14.0, 10.0, 12.0, 27.0, 37.0, 43.0, 56.0, 70.0, 124.0, 182.0, 340.0, 611.0, 1235.0, 2556.0, 6729.0, 23107.0, 123401.0, 867678.0, 2411322.0, 636301.0, 89584.0, 18707.0, 6430.0, 2833.0, 1294.0, 632.0, 349.0, 184.0, 146.0, 66.0, 45.0, 48.0, 28.0, 23.0, 12.0, 12.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6026763916015625, -0.579864501953125, -0.5570526123046875, -0.53424072265625, -0.5114288330078125, -0.488616943359375, -0.4658050537109375, -0.4429931640625, -0.4201812744140625, -0.397369384765625, -0.3745574951171875, -0.35174560546875, -0.3289337158203125, -0.306121826171875, -0.2833099365234375, -0.260498046875, -0.2376861572265625, -0.214874267578125, -0.1920623779296875, -0.16925048828125, -0.1464385986328125, -0.123626708984375, -0.1008148193359375, -0.0780029296875, -0.0551910400390625, -0.032379150390625, -0.0095672607421875, 0.01324462890625, 0.0360565185546875, 0.058868408203125, 0.0816802978515625, 0.1044921875, 0.1273040771484375, 0.150115966796875, 0.1729278564453125, 0.19573974609375, 0.2185516357421875, 0.241363525390625, 0.2641754150390625, 0.2869873046875, 0.3097991943359375, 0.332611083984375, 0.3554229736328125, 0.37823486328125, 0.4010467529296875, 0.423858642578125, 0.4466705322265625, 0.469482421875, 0.4922943115234375, 0.515106201171875, 0.5379180908203125, 0.56072998046875, 0.5835418701171875, 0.606353759765625, 0.6291656494140625, 0.6519775390625, 0.6747894287109375, 0.697601318359375, 0.7204132080078125, 0.74322509765625, 0.7660369873046875, 0.788848876953125, 0.8116607666015625, 0.83447265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 5.0, 7.0, 12.0, 21.0, 26.0, 24.0, 27.0, 36.0, 60.0, 41.0, 63.0, 62.0, 80.0, 73.0, 66.0, 62.0, 59.0, 56.0, 46.0, 38.0, 34.0, 32.0, 23.0, 12.0, 10.0, 8.0, 6.0, 10.0, 6.0, 2.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3820114135742188, -1.3509368896484375, -1.3198623657226562, -1.288787841796875, -1.2577133178710938, -1.2266387939453125, -1.1955642700195312, -1.16448974609375, -1.1334152221679688, -1.1023406982421875, -1.0712661743164062, -1.040191650390625, -1.0091171264648438, -0.9780426025390625, -0.9469680786132812, -0.9158935546875, -0.8848190307617188, -0.8537445068359375, -0.8226699829101562, -0.791595458984375, -0.7605209350585938, -0.7294464111328125, -0.6983718872070312, -0.66729736328125, -0.6362228393554688, -0.6051483154296875, -0.5740737915039062, -0.542999267578125, -0.5119247436523438, -0.4808502197265625, -0.44977569580078125, -0.418701171875, -0.38762664794921875, -0.3565521240234375, -0.32547760009765625, -0.294403076171875, -0.26332855224609375, -0.2322540283203125, -0.20117950439453125, -0.17010498046875, -0.13903045654296875, -0.1079559326171875, -0.07688140869140625, -0.045806884765625, -0.01473236083984375, 0.0163421630859375, 0.04741668701171875, 0.0784912109375, 0.10956573486328125, 0.1406402587890625, 0.17171478271484375, 0.202789306640625, 0.23386383056640625, 0.2649383544921875, 0.29601287841796875, 0.32708740234375, 0.35816192626953125, 0.3892364501953125, 0.42031097412109375, 0.451385498046875, 0.48246002197265625, 0.5135345458984375, 0.5446090698242188, 0.57568359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 9.0, 4.0, 15.0, 15.0, 20.0, 42.0, 62.0, 112.0, 213.0, 342.0, 678.0, 1551.0, 4548.0, 18603.0, 148192.0, 3584400.0, 390295.0, 33145.0, 7320.0, 2482.0, 1028.0, 524.0, 263.0, 167.0, 74.0, 70.0, 28.0, 21.0, 12.0, 8.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.5927734375, -1.5467987060546875, -1.500823974609375, -1.4548492431640625, -1.40887451171875, -1.3628997802734375, -1.316925048828125, -1.2709503173828125, -1.2249755859375, -1.1790008544921875, -1.133026123046875, -1.0870513916015625, -1.04107666015625, -0.9951019287109375, -0.949127197265625, -0.9031524658203125, -0.857177734375, -0.8112030029296875, -0.765228271484375, -0.7192535400390625, -0.67327880859375, -0.6273040771484375, -0.581329345703125, -0.5353546142578125, -0.4893798828125, -0.4434051513671875, -0.397430419921875, -0.3514556884765625, -0.30548095703125, -0.2595062255859375, -0.213531494140625, -0.1675567626953125, -0.12158203125, -0.0756072998046875, -0.029632568359375, 0.0163421630859375, 0.06231689453125, 0.1082916259765625, 0.154266357421875, 0.2002410888671875, 0.2462158203125, 0.2921905517578125, 0.338165283203125, 0.3841400146484375, 0.43011474609375, 0.4760894775390625, 0.522064208984375, 0.5680389404296875, 0.614013671875, 0.6599884033203125, 0.705963134765625, 0.7519378662109375, 0.79791259765625, 0.8438873291015625, 0.889862060546875, 0.9358367919921875, 0.9818115234375, 1.0277862548828125, 1.073760986328125, 1.1197357177734375, 1.16571044921875, 1.2116851806640625, 1.257659912109375, 1.3036346435546875, 1.349609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 6.0, 2.0, 18.0, 26.0, 61.0, 69.0, 149.0, 355.0, 709.0, 1054.0, 851.0, 361.0, 160.0, 81.0, 44.0, 32.0, 22.0, 16.0, 12.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.342803955078125, -1.28326416015625, -1.223724365234375, -1.1641845703125, -1.104644775390625, -1.04510498046875, -0.985565185546875, -0.926025390625, -0.866485595703125, -0.80694580078125, -0.747406005859375, -0.6878662109375, -0.628326416015625, -0.56878662109375, -0.509246826171875, -0.44970703125, -0.390167236328125, -0.33062744140625, -0.271087646484375, -0.2115478515625, -0.152008056640625, -0.09246826171875, -0.032928466796875, 0.026611328125, 0.086151123046875, 0.14569091796875, 0.205230712890625, 0.2647705078125, 0.324310302734375, 0.38385009765625, 0.443389892578125, 0.5029296875, 0.562469482421875, 0.62200927734375, 0.681549072265625, 0.7410888671875, 0.800628662109375, 0.86016845703125, 0.919708251953125, 0.979248046875, 1.038787841796875, 1.09832763671875, 1.157867431640625, 1.2174072265625, 1.276947021484375, 1.33648681640625, 1.396026611328125, 1.45556640625, 1.515106201171875, 1.57464599609375, 1.634185791015625, 1.6937255859375, 1.753265380859375, 1.81280517578125, 1.872344970703125, 1.931884765625, 1.991424560546875, 2.05096435546875, 2.110504150390625, 2.1700439453125, 2.229583740234375, 2.28912353515625, 2.348663330078125, 2.408203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 9.0, 17.0, 59.0, 124.0, 255.0, 280.0, 147.0, 59.0, 17.0, 13.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.396169662475586, -11.836724281311035, -11.277278900146484, -10.71783447265625, -10.1583890914917, -9.598943710327148, -9.039499282836914, -8.480053901672363, -7.9206085205078125, -7.361163139343262, -6.801718235015869, -6.242273330688477, -5.682827949523926, -5.123382568359375, -4.563937664031982, -4.00449275970459, -3.445047378540039, -2.8856022357940674, -2.3261570930480957, -1.766711950302124, -1.2072668075561523, -0.6478216648101807, -0.08837652206420898, 0.4710686206817627, 1.0305137634277344, 1.589958906173706, 2.1494040489196777, 2.7088491916656494, 3.268294334411621, 3.8277394771575928, 4.3871846199035645, 4.946629524230957, 5.506076812744141, 6.065522193908691, 6.624967098236084, 7.184412002563477, 7.743857383728027, 8.303302764892578, 8.862747192382812, 9.422192573547363, 9.981637954711914, 10.541083335876465, 11.100528717041016, 11.65997314453125, 12.2194185256958, 12.778863906860352, 13.338308334350586, 13.897753715515137, 14.457199096679688, 15.016644477844238, 15.576089859008789, 16.135534286499023, 16.69498062133789, 17.254425048828125, 17.81386947631836, 18.373315811157227, 18.93276023864746, 19.492204666137695, 20.051651000976562, 20.611095428466797, 21.17053985595703, 21.7299861907959, 22.289430618286133, 22.848876953125, 23.408321380615234]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 6.0, 5.0, 2.0, 9.0, 14.0, 20.0, 25.0, 33.0, 38.0, 52.0, 59.0, 70.0, 84.0, 85.0, 79.0, 80.0, 69.0, 58.0, 64.0, 35.0, 33.0, 26.0, 15.0, 16.0, 9.0, 5.0, 9.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.438441753387451, -6.079217433929443, -5.7199931144714355, -5.360769271850586, -5.001544952392578, -4.64232063293457, -4.2830963134765625, -3.9238719940185547, -3.564647674560547, -3.205423355102539, -2.8461990356445312, -2.4869749546051025, -2.1277506351470947, -1.768526315689087, -1.4093022346496582, -1.0500779151916504, -0.6908535957336426, -0.33162933588027954, 0.027594923973083496, 0.38681912422180176, 0.7460434436798096, 1.1052677631378174, 1.464491844177246, 1.823716163635254, 2.1829404830932617, 2.5421648025512695, 2.9013891220092773, 3.260613203048706, 3.619837522506714, 3.9790618419647217, 4.33828592300415, 4.697510242462158, 5.056734085083008, 5.415958404541016, 5.775182723999023, 6.134407043457031, 6.493631362915039, 6.852855682373047, 7.2120795249938965, 7.571303844451904, 7.930528163909912, 8.289752006530762, 8.64897632598877, 9.008200645446777, 9.367424964904785, 9.726649284362793, 10.0858736038208, 10.445097923278809, 10.804322242736816, 11.163546562194824, 11.522770881652832, 11.88199520111084, 12.241219520568848, 12.600443840026855, 12.959667205810547, 13.318891525268555, 13.678115844726562, 14.03734016418457, 14.396564483642578, 14.755788803100586, 15.115013122558594, 15.474237442016602, 15.83346176147461, 16.192686080932617, 16.551910400390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 1.0, 5.0, 13.0, 20.0, 25.0, 40.0, 73.0, 91.0, 181.0, 366.0, 595.0, 1205.0, 2368.0, 5045.0, 11011.0, 26206.0, 63823.0, 157310.0, 320730.0, 264593.0, 114039.0, 45595.0, 19181.0, 8205.0, 3842.0, 1857.0, 951.0, 491.0, 293.0, 186.0, 80.0, 48.0, 25.0, 17.0, 10.0, 9.0, 11.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98974609375, -0.960479736328125, -0.93121337890625, -0.901947021484375, -0.8726806640625, -0.843414306640625, -0.81414794921875, -0.784881591796875, -0.755615234375, -0.726348876953125, -0.69708251953125, -0.667816162109375, -0.6385498046875, -0.609283447265625, -0.58001708984375, -0.550750732421875, -0.521484375, -0.492218017578125, -0.46295166015625, -0.433685302734375, -0.4044189453125, -0.375152587890625, -0.34588623046875, -0.316619873046875, -0.287353515625, -0.258087158203125, -0.22882080078125, -0.199554443359375, -0.1702880859375, -0.141021728515625, -0.11175537109375, -0.082489013671875, -0.05322265625, -0.023956298828125, 0.00531005859375, 0.034576416015625, 0.0638427734375, 0.093109130859375, 0.12237548828125, 0.151641845703125, 0.180908203125, 0.210174560546875, 0.23944091796875, 0.268707275390625, 0.2979736328125, 0.327239990234375, 0.35650634765625, 0.385772705078125, 0.4150390625, 0.444305419921875, 0.47357177734375, 0.502838134765625, 0.5321044921875, 0.561370849609375, 0.59063720703125, 0.619903564453125, 0.649169921875, 0.678436279296875, 0.70770263671875, 0.736968994140625, 0.7662353515625, 0.795501708984375, 0.82476806640625, 0.854034423828125, 0.88330078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 8.0, 5.0, 10.0, 17.0, 12.0, 13.0, 11.0, 10.0, 21.0, 27.0, 18.0, 26.0, 35.0, 32.0, 38.0, 56.0, 41.0, 37.0, 33.0, 38.0, 39.0, 43.0, 35.0, 40.0, 36.0, 44.0, 36.0, 29.0, 27.0, 27.0, 17.0, 25.0, 21.0, 19.0, 15.0, 16.0, 4.0, 11.0, 9.0, 5.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.630859375, -0.6124343872070312, -0.5940093994140625, -0.5755844116210938, -0.557159423828125, -0.5387344360351562, -0.5203094482421875, -0.5018844604492188, -0.48345947265625, -0.46503448486328125, -0.4466094970703125, -0.42818450927734375, -0.409759521484375, -0.39133453369140625, -0.3729095458984375, -0.35448455810546875, -0.3360595703125, -0.31763458251953125, -0.2992095947265625, -0.28078460693359375, -0.262359619140625, -0.24393463134765625, -0.2255096435546875, -0.20708465576171875, -0.18865966796875, -0.17023468017578125, -0.1518096923828125, -0.13338470458984375, -0.114959716796875, -0.09653472900390625, -0.0781097412109375, -0.05968475341796875, -0.041259765625, -0.02283477783203125, -0.0044097900390625, 0.01401519775390625, 0.032440185546875, 0.05086517333984375, 0.0692901611328125, 0.08771514892578125, 0.10614013671875, 0.12456512451171875, 0.1429901123046875, 0.16141510009765625, 0.179840087890625, 0.19826507568359375, 0.2166900634765625, 0.23511505126953125, 0.2535400390625, 0.27196502685546875, 0.2903900146484375, 0.30881500244140625, 0.327239990234375, 0.34566497802734375, 0.3640899658203125, 0.38251495361328125, 0.40093994140625, 0.41936492919921875, 0.4377899169921875, 0.45621490478515625, 0.474639892578125, 0.49306488037109375, 0.5114898681640625, 0.5299148559570312, 0.54833984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 11.0, 24.0, 27.0, 49.0, 48.0, 47.0, 71.0, 113.0, 169.0, 235.0, 297.0, 473.0, 709.0, 1247.0, 2608.0, 8269.0, 42291.0, 324050.0, 589704.0, 60451.0, 10541.0, 3255.0, 1362.0, 770.0, 510.0, 347.0, 228.0, 178.0, 118.0, 92.0, 60.0, 50.0, 47.0, 23.0, 22.0, 17.0, 5.0, 2.0, 8.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.216796875, -2.15362548828125, -2.0904541015625, -2.02728271484375, -1.964111328125, -1.90093994140625, -1.8377685546875, -1.77459716796875, -1.71142578125, -1.64825439453125, -1.5850830078125, -1.52191162109375, -1.458740234375, -1.39556884765625, -1.3323974609375, -1.26922607421875, -1.2060546875, -1.14288330078125, -1.0797119140625, -1.01654052734375, -0.953369140625, -0.89019775390625, -0.8270263671875, -0.76385498046875, -0.70068359375, -0.63751220703125, -0.5743408203125, -0.51116943359375, -0.447998046875, -0.38482666015625, -0.3216552734375, -0.25848388671875, -0.1953125, -0.13214111328125, -0.0689697265625, -0.00579833984375, 0.057373046875, 0.12054443359375, 0.1837158203125, 0.24688720703125, 0.31005859375, 0.37322998046875, 0.4364013671875, 0.49957275390625, 0.562744140625, 0.62591552734375, 0.6890869140625, 0.75225830078125, 0.8154296875, 0.87860107421875, 0.9417724609375, 1.00494384765625, 1.068115234375, 1.13128662109375, 1.1944580078125, 1.25762939453125, 1.32080078125, 1.38397216796875, 1.4471435546875, 1.51031494140625, 1.573486328125, 1.63665771484375, 1.6998291015625, 1.76300048828125, 1.826171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 9.0, 11.0, 14.0, 20.0, 12.0, 22.0, 28.0, 27.0, 26.0, 35.0, 47.0, 47.0, 54.0, 50.0, 53.0, 51.0, 43.0, 54.0, 47.0, 35.0, 45.0, 34.0, 30.0, 29.0, 22.0, 21.0, 15.0, 18.0, 20.0, 12.0, 6.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.572265625, -2.49383544921875, -2.4154052734375, -2.33697509765625, -2.258544921875, -2.18011474609375, -2.1016845703125, -2.02325439453125, -1.94482421875, -1.86639404296875, -1.7879638671875, -1.70953369140625, -1.631103515625, -1.55267333984375, -1.4742431640625, -1.39581298828125, -1.3173828125, -1.23895263671875, -1.1605224609375, -1.08209228515625, -1.003662109375, -0.92523193359375, -0.8468017578125, -0.76837158203125, -0.68994140625, -0.61151123046875, -0.5330810546875, -0.45465087890625, -0.376220703125, -0.29779052734375, -0.2193603515625, -0.14093017578125, -0.0625, 0.01593017578125, 0.0943603515625, 0.17279052734375, 0.251220703125, 0.32965087890625, 0.4080810546875, 0.48651123046875, 0.56494140625, 0.64337158203125, 0.7218017578125, 0.80023193359375, 0.878662109375, 0.95709228515625, 1.0355224609375, 1.11395263671875, 1.1923828125, 1.27081298828125, 1.3492431640625, 1.42767333984375, 1.506103515625, 1.58453369140625, 1.6629638671875, 1.74139404296875, 1.81982421875, 1.89825439453125, 1.9766845703125, 2.05511474609375, 2.133544921875, 2.21197509765625, 2.2904052734375, 2.36883544921875, 2.447265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 8.0, 7.0, 11.0, 13.0, 16.0, 33.0, 52.0, 67.0, 114.0, 170.0, 251.0, 474.0, 772.0, 1543.0, 3033.0, 6460.0, 18591.0, 86268.0, 694176.0, 188944.0, 29762.0, 9516.0, 3901.0, 1900.0, 970.0, 557.0, 340.0, 206.0, 124.0, 87.0, 53.0, 42.0, 24.0, 18.0, 14.0, 10.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7421875, -0.72015380859375, -0.6981201171875, -0.67608642578125, -0.654052734375, -0.63201904296875, -0.6099853515625, -0.58795166015625, -0.56591796875, -0.54388427734375, -0.5218505859375, -0.49981689453125, -0.477783203125, -0.45574951171875, -0.4337158203125, -0.41168212890625, -0.3896484375, -0.36761474609375, -0.3455810546875, -0.32354736328125, -0.301513671875, -0.27947998046875, -0.2574462890625, -0.23541259765625, -0.21337890625, -0.19134521484375, -0.1693115234375, -0.14727783203125, -0.125244140625, -0.10321044921875, -0.0811767578125, -0.05914306640625, -0.037109375, -0.01507568359375, 0.0069580078125, 0.02899169921875, 0.051025390625, 0.07305908203125, 0.0950927734375, 0.11712646484375, 0.13916015625, 0.16119384765625, 0.1832275390625, 0.20526123046875, 0.227294921875, 0.24932861328125, 0.2713623046875, 0.29339599609375, 0.3154296875, 0.33746337890625, 0.3594970703125, 0.38153076171875, 0.403564453125, 0.42559814453125, 0.4476318359375, 0.46966552734375, 0.49169921875, 0.51373291015625, 0.5357666015625, 0.55780029296875, 0.579833984375, 0.60186767578125, 0.6239013671875, 0.64593505859375, 0.66796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 6.0, 8.0, 21.0, 42.0, 164.0, 401.0, 203.0, 64.0, 25.0, 16.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004868507385253906, -0.00046428292989730835, -0.0004417151212692261, -0.0004191473126411438, -0.0003965795040130615, -0.00037401169538497925, -0.00035144388675689697, -0.0003288760781288147, -0.0003063082695007324, -0.00028374046087265015, -0.00026117265224456787, -0.0002386048436164856, -0.00021603703498840332, -0.00019346922636032104, -0.00017090141773223877, -0.0001483336091041565, -0.00012576580047607422, -0.00010319799184799194, -8.063018321990967e-05, -5.806237459182739e-05, -3.549456596374512e-05, -1.2926757335662842e-05, 9.641051292419434e-06, 3.220885992050171e-05, 5.4776668548583984e-05, 7.734447717666626e-05, 9.991228580474854e-05, 0.0001224800944328308, 0.00014504790306091309, 0.00016761571168899536, 0.00019018352031707764, 0.0002127513289451599, 0.0002353191375732422, 0.00025788694620132446, 0.00028045475482940674, 0.000303022563457489, 0.0003255903720855713, 0.00034815818071365356, 0.00037072598934173584, 0.0003932937979698181, 0.0004158616065979004, 0.00043842941522598267, 0.00046099722385406494, 0.0004835650324821472, 0.0005061328411102295, 0.0005287006497383118, 0.000551268458366394, 0.0005738362669944763, 0.0005964040756225586, 0.0006189718842506409, 0.0006415396928787231, 0.0006641075015068054, 0.0006866753101348877, 0.00070924311876297, 0.0007318109273910522, 0.0007543787360191345, 0.0007769465446472168, 0.0007995143532752991, 0.0008220821619033813, 0.0008446499705314636, 0.0008672177791595459, 0.0008897855877876282, 0.0009123533964157104, 0.0009349212050437927, 0.000957489013671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 8.0, 10.0, 26.0, 27.0, 65.0, 105.0, 247.0, 504.0, 1648.0, 8827.0, 237929.0, 779079.0, 16374.0, 2425.0, 699.0, 284.0, 121.0, 74.0, 42.0, 20.0, 8.0, 13.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.7332763671875, -1.685302734375, -1.6373291015625, -1.58935546875, -1.5413818359375, -1.493408203125, -1.4454345703125, -1.3974609375, -1.3494873046875, -1.301513671875, -1.2535400390625, -1.20556640625, -1.1575927734375, -1.109619140625, -1.0616455078125, -1.013671875, -0.9656982421875, -0.917724609375, -0.8697509765625, -0.82177734375, -0.7738037109375, -0.725830078125, -0.6778564453125, -0.6298828125, -0.5819091796875, -0.533935546875, -0.4859619140625, -0.43798828125, -0.3900146484375, -0.342041015625, -0.2940673828125, -0.24609375, -0.1981201171875, -0.150146484375, -0.1021728515625, -0.05419921875, -0.0062255859375, 0.041748046875, 0.0897216796875, 0.1376953125, 0.1856689453125, 0.233642578125, 0.2816162109375, 0.32958984375, 0.3775634765625, 0.425537109375, 0.4735107421875, 0.521484375, 0.5694580078125, 0.617431640625, 0.6654052734375, 0.71337890625, 0.7613525390625, 0.809326171875, 0.8572998046875, 0.9052734375, 0.9532470703125, 1.001220703125, 1.0491943359375, 1.09716796875, 1.1451416015625, 1.193115234375, 1.2410888671875, 1.2890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 9.0, 3.0, 6.0, 7.0, 11.0, 13.0, 21.0, 20.0, 22.0, 31.0, 36.0, 47.0, 62.0, 44.0, 60.0, 63.0, 71.0, 75.0, 60.0, 52.0, 45.0, 34.0, 28.0, 21.0, 37.0, 17.0, 11.0, 13.0, 13.0, 11.0, 8.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.494384765625, -0.47887420654296875, -0.4633636474609375, -0.44785308837890625, -0.432342529296875, -0.41683197021484375, -0.4013214111328125, -0.38581085205078125, -0.37030029296875, -0.35478973388671875, -0.3392791748046875, -0.32376861572265625, -0.308258056640625, -0.29274749755859375, -0.2772369384765625, -0.26172637939453125, -0.2462158203125, -0.23070526123046875, -0.2151947021484375, -0.19968414306640625, -0.184173583984375, -0.16866302490234375, -0.1531524658203125, -0.13764190673828125, -0.12213134765625, -0.10662078857421875, -0.0911102294921875, -0.07559967041015625, -0.060089111328125, -0.04457855224609375, -0.0290679931640625, -0.01355743408203125, 0.001953125, 0.01746368408203125, 0.0329742431640625, 0.04848480224609375, 0.063995361328125, 0.07950592041015625, 0.0950164794921875, 0.11052703857421875, 0.12603759765625, 0.14154815673828125, 0.1570587158203125, 0.17256927490234375, 0.188079833984375, 0.20359039306640625, 0.2191009521484375, 0.23461151123046875, 0.2501220703125, 0.26563262939453125, 0.2811431884765625, 0.29665374755859375, 0.312164306640625, 0.32767486572265625, 0.3431854248046875, 0.35869598388671875, 0.37420654296875, 0.38971710205078125, 0.4052276611328125, 0.42073822021484375, 0.436248779296875, 0.45175933837890625, 0.4672698974609375, 0.48278045654296875, 0.498291015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 20.0, 51.0, 155.0, 334.0, 275.0, 102.0, 32.0, 8.0, 12.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.361270904541016, -33.52109146118164, -32.680908203125, -31.840726852416992, -31.000545501708984, -30.160364151000977, -29.32018280029297, -28.480003356933594, -27.639820098876953, -26.799638748168945, -25.959457397460938, -25.11927604675293, -24.279094696044922, -23.438913345336914, -22.598731994628906, -21.75855255126953, -20.918371200561523, -20.078189849853516, -19.238008499145508, -18.3978271484375, -17.557645797729492, -16.717464447021484, -15.877284049987793, -15.037102699279785, -14.196921348571777, -13.35673999786377, -12.516558647155762, -11.67637825012207, -10.836196899414062, -9.996015548706055, -9.155834197998047, -8.315652847290039, -7.475473403930664, -6.635292053222656, -5.795110702514648, -4.954929828643799, -4.114748477935791, -3.274567127227783, -2.4343862533569336, -1.5942049026489258, -0.754023551940918, 0.08615767955780029, 0.9263389110565186, 1.7665200233459473, 2.606701374053955, 3.446882724761963, 4.2870635986328125, 5.12724494934082, 5.967426300048828, 6.807607650756836, 7.647789001464844, 8.487970352172852, 9.32815170288086, 10.168333053588867, 11.008513450622559, 11.848694801330566, 12.688876152038574, 13.529057502746582, 14.36923885345459, 15.209419250488281, 16.04960060119629, 16.889781951904297, 17.729963302612305, 18.570144653320312, 19.41032600402832]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 8.0, 9.0, 16.0, 16.0, 12.0, 20.0, 14.0, 34.0, 34.0, 25.0, 31.0, 32.0, 34.0, 40.0, 47.0, 72.0, 82.0, 57.0, 49.0, 58.0, 26.0, 32.0, 28.0, 28.0, 25.0, 18.0, 27.0, 19.0, 21.0, 13.0, 10.0, 15.0, 8.0, 6.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.247876167297363, -7.950588703155518, -7.65330171585083, -7.356014251708984, -7.058727264404297, -6.761439800262451, -6.4641523361206055, -6.166865348815918, -5.869577884674072, -5.572290420532227, -5.275003433227539, -4.977715969085693, -4.680428504943848, -4.38314151763916, -4.0858540534973145, -3.788566827774048, -3.4912796020507812, -3.1939923763275146, -2.896705150604248, -2.5994176864624023, -2.3021304607391357, -2.004843235015869, -1.707555890083313, -1.4102685451507568, -1.1129813194274902, -0.8156940340995789, -0.5184067487716675, -0.2211194634437561, 0.07616782188415527, 0.3734550476074219, 0.670742392539978, 0.9680297374725342, 1.2653179168701172, 1.5626051425933838, 1.85989248752594, 2.157179832458496, 2.4544670581817627, 2.7517542839050293, 3.049041748046875, 3.3463289737701416, 3.643616199493408, 3.940903425216675, 4.238190650939941, 4.535478115081787, 4.832765579223633, 5.13005256652832, 5.427340030670166, 5.724627494812012, 6.021914482116699, 6.319201946258545, 6.616488933563232, 6.913776397705078, 7.211063385009766, 7.508350849151611, 7.805638313293457, 8.102925300598145, 8.400213241577148, 8.697500228881836, 8.99478816986084, 9.292075157165527, 9.589362144470215, 9.886650085449219, 10.183937072753906, 10.481224060058594, 10.778511047363281]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 14.0, 12.0, 16.0, 24.0, 27.0, 46.0, 48.0, 100.0, 146.0, 217.0, 409.0, 763.0, 1796.0, 5694.0, 27704.0, 366074.0, 2889491.0, 834415.0, 54204.0, 8441.0, 2437.0, 992.0, 457.0, 256.0, 164.0, 105.0, 75.0, 45.0, 33.0, 24.0, 18.0, 13.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84375, -0.813232421875, -0.78271484375, -0.752197265625, -0.7216796875, -0.691162109375, -0.66064453125, -0.630126953125, -0.599609375, -0.569091796875, -0.53857421875, -0.508056640625, -0.4775390625, -0.447021484375, -0.41650390625, -0.385986328125, -0.35546875, -0.324951171875, -0.29443359375, -0.263916015625, -0.2333984375, -0.202880859375, -0.17236328125, -0.141845703125, -0.111328125, -0.080810546875, -0.05029296875, -0.019775390625, 0.0107421875, 0.041259765625, 0.07177734375, 0.102294921875, 0.1328125, 0.163330078125, 0.19384765625, 0.224365234375, 0.2548828125, 0.285400390625, 0.31591796875, 0.346435546875, 0.376953125, 0.407470703125, 0.43798828125, 0.468505859375, 0.4990234375, 0.529541015625, 0.56005859375, 0.590576171875, 0.62109375, 0.651611328125, 0.68212890625, 0.712646484375, 0.7431640625, 0.773681640625, 0.80419921875, 0.834716796875, 0.865234375, 0.895751953125, 0.92626953125, 0.956787109375, 0.9873046875, 1.017822265625, 1.04833984375, 1.078857421875, 1.109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 7.0, 12.0, 9.0, 15.0, 18.0, 17.0, 11.0, 24.0, 29.0, 27.0, 26.0, 29.0, 46.0, 34.0, 47.0, 37.0, 49.0, 48.0, 46.0, 43.0, 51.0, 30.0, 38.0, 35.0, 38.0, 24.0, 27.0, 22.0, 23.0, 32.0, 20.0, 18.0, 12.0, 8.0, 6.0, 3.0, 9.0, 6.0, 10.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58984375, -0.5720291137695312, -0.5542144775390625, -0.5363998413085938, -0.518585205078125, -0.5007705688476562, -0.4829559326171875, -0.46514129638671875, -0.44732666015625, -0.42951202392578125, -0.4116973876953125, -0.39388275146484375, -0.376068115234375, -0.35825347900390625, -0.3404388427734375, -0.32262420654296875, -0.3048095703125, -0.28699493408203125, -0.2691802978515625, -0.25136566162109375, -0.233551025390625, -0.21573638916015625, -0.1979217529296875, -0.18010711669921875, -0.16229248046875, -0.14447784423828125, -0.1266632080078125, -0.10884857177734375, -0.091033935546875, -0.07321929931640625, -0.0554046630859375, -0.03759002685546875, -0.019775390625, -0.00196075439453125, 0.0158538818359375, 0.03366851806640625, 0.051483154296875, 0.06929779052734375, 0.0871124267578125, 0.10492706298828125, 0.12274169921875, 0.14055633544921875, 0.1583709716796875, 0.17618560791015625, 0.194000244140625, 0.21181488037109375, 0.2296295166015625, 0.24744415283203125, 0.2652587890625, 0.28307342529296875, 0.3008880615234375, 0.31870269775390625, 0.336517333984375, 0.35433197021484375, 0.3721466064453125, 0.38996124267578125, 0.40777587890625, 0.42559051513671875, 0.4434051513671875, 0.46121978759765625, 0.479034423828125, 0.49684906005859375, 0.5146636962890625, 0.5324783325195312, 0.55029296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 17.0, 26.0, 52.0, 85.0, 145.0, 341.0, 941.0, 3757.0, 330410.0, 3849428.0, 7079.0, 1142.0, 441.0, 209.0, 91.0, 44.0, 28.0, 14.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.243072509765625, -4.11505126953125, -3.987030029296875, -3.8590087890625, -3.730987548828125, -3.60296630859375, -3.474945068359375, -3.346923828125, -3.218902587890625, -3.09088134765625, -2.962860107421875, -2.8348388671875, -2.706817626953125, -2.57879638671875, -2.450775146484375, -2.32275390625, -2.194732666015625, -2.06671142578125, -1.938690185546875, -1.8106689453125, -1.682647705078125, -1.55462646484375, -1.426605224609375, -1.298583984375, -1.170562744140625, -1.04254150390625, -0.914520263671875, -0.7864990234375, -0.658477783203125, -0.53045654296875, -0.402435302734375, -0.2744140625, -0.146392822265625, -0.01837158203125, 0.109649658203125, 0.2376708984375, 0.365692138671875, 0.49371337890625, 0.621734619140625, 0.749755859375, 0.877777099609375, 1.00579833984375, 1.133819580078125, 1.2618408203125, 1.389862060546875, 1.51788330078125, 1.645904541015625, 1.77392578125, 1.901947021484375, 2.02996826171875, 2.157989501953125, 2.2860107421875, 2.414031982421875, 2.54205322265625, 2.670074462890625, 2.798095703125, 2.926116943359375, 3.05413818359375, 3.182159423828125, 3.3101806640625, 3.438201904296875, 3.56622314453125, 3.694244384765625, 3.822265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 20.0, 62.0, 179.0, 843.0, 2180.0, 595.0, 120.0, 42.0, 19.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.204864501953125, -3.08355712890625, -2.962249755859375, -2.8409423828125, -2.719635009765625, -2.59832763671875, -2.477020263671875, -2.355712890625, -2.234405517578125, -2.11309814453125, -1.991790771484375, -1.8704833984375, -1.749176025390625, -1.62786865234375, -1.506561279296875, -1.38525390625, -1.263946533203125, -1.14263916015625, -1.021331787109375, -0.9000244140625, -0.778717041015625, -0.65740966796875, -0.536102294921875, -0.414794921875, -0.293487548828125, -0.17218017578125, -0.050872802734375, 0.0704345703125, 0.191741943359375, 0.31304931640625, 0.434356689453125, 0.5556640625, 0.676971435546875, 0.79827880859375, 0.919586181640625, 1.0408935546875, 1.162200927734375, 1.28350830078125, 1.404815673828125, 1.526123046875, 1.647430419921875, 1.76873779296875, 1.890045166015625, 2.0113525390625, 2.132659912109375, 2.25396728515625, 2.375274658203125, 2.49658203125, 2.617889404296875, 2.73919677734375, 2.860504150390625, 2.9818115234375, 3.103118896484375, 3.22442626953125, 3.345733642578125, 3.467041015625, 3.588348388671875, 3.70965576171875, 3.830963134765625, 3.9522705078125, 4.073577880859375, 4.19488525390625, 4.316192626953125, 4.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 19.0, 76.0, 518.0, 316.0, 50.0, 13.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8726806640625, -36.564170837402344, -35.25566482543945, -33.9471549987793, -32.63864517211914, -31.33013916015625, -30.021629333496094, -28.71312141418457, -27.404613494873047, -26.096105575561523, -24.787595748901367, -23.479087829589844, -22.17057991027832, -20.862071990966797, -19.55356216430664, -18.245054244995117, -16.93654441833496, -15.628035545349121, -14.319527626037598, -13.011018753051758, -11.702510833740234, -10.394001960754395, -9.085493087768555, -7.776985168457031, -6.468476295471191, -5.15996789932251, -3.851459264755249, -2.5429506301879883, -1.2344422340393066, 0.074066162109375, 1.3825750350952148, 2.6910829544067383, 3.999591827392578, 5.30810022354126, 6.616608619689941, 7.925117492675781, 9.233625411987305, 10.542134284973145, 11.850643157958984, 13.159151077270508, 14.467659950256348, 15.776168823242188, 17.08467674255371, 18.393184661865234, 19.70169448852539, 21.010202407836914, 22.318710327148438, 23.627220153808594, 24.935728073120117, 26.24423599243164, 27.552745819091797, 28.86125373840332, 30.169761657714844, 31.478271484375, 32.786781311035156, 34.09528732299805, 35.4037971496582, 36.71230697631836, 38.02081298828125, 39.329322814941406, 40.63783264160156, 41.94633865356445, 43.25484848022461, 44.5633544921875, 45.871864318847656]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 8.0, 5.0, 10.0, 15.0, 19.0, 15.0, 30.0, 53.0, 58.0, 54.0, 69.0, 71.0, 66.0, 88.0, 82.0, 72.0, 72.0, 40.0, 53.0, 37.0, 24.0, 25.0, 13.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.154629707336426, -11.825424194335938, -11.496219635009766, -11.167014122009277, -10.837809562683105, -10.508604049682617, -10.179399490356445, -9.850193977355957, -9.520989418029785, -9.191783905029297, -8.862579345703125, -8.533373832702637, -8.204169273376465, -7.874964237213135, -7.545759201049805, -7.216553688049316, -6.887348651885986, -6.558143615722656, -6.228938579559326, -5.899733543395996, -5.570528507232666, -5.241323471069336, -4.912117958068848, -4.582913398742676, -4.2537078857421875, -3.9245028495788574, -3.5952978134155273, -3.2660927772521973, -2.936887741088867, -2.607682704925537, -2.278477430343628, -1.9492723941802979, -1.6200675964355469, -1.2908625602722168, -0.9616574645042419, -0.6324523687362671, -0.303247332572937, 0.025957703590393066, 0.3551628589630127, 0.6843678951263428, 1.0135729312896729, 1.342777967453003, 1.671983003616333, 2.001188278198242, 2.3303933143615723, 2.6595983505249023, 2.9888033866882324, 3.3180084228515625, 3.6472134590148926, 3.9764184951782227, 4.305623531341553, 4.634828567504883, 4.964033603668213, 5.293238639831543, 5.622444152832031, 5.951648712158203, 6.280854225158691, 6.6100592613220215, 6.939264297485352, 7.268469333648682, 7.597674369812012, 7.926879405975342, 8.256084442138672, 8.58528995513916, 8.914494514465332]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 14.0, 17.0, 33.0, 47.0, 69.0, 99.0, 133.0, 204.0, 324.0, 540.0, 807.0, 1376.0, 2203.0, 3802.0, 6388.0, 11755.0, 21255.0, 39957.0, 73637.0, 132276.0, 205250.0, 215048.0, 148445.0, 83963.0, 44925.0, 24604.0, 13351.0, 7380.0, 4181.0, 2481.0, 1449.0, 875.0, 561.0, 374.0, 273.0, 148.0, 96.0, 69.0, 45.0, 33.0, 14.0, 9.0, 12.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5776214599609375, -0.559051513671875, -0.5404815673828125, -0.52191162109375, -0.5033416748046875, -0.484771728515625, -0.4662017822265625, -0.4476318359375, -0.4290618896484375, -0.410491943359375, -0.3919219970703125, -0.37335205078125, -0.3547821044921875, -0.336212158203125, -0.3176422119140625, -0.299072265625, -0.2805023193359375, -0.261932373046875, -0.2433624267578125, -0.22479248046875, -0.2062225341796875, -0.187652587890625, -0.1690826416015625, -0.1505126953125, -0.1319427490234375, -0.113372802734375, -0.0948028564453125, -0.07623291015625, -0.0576629638671875, -0.039093017578125, -0.0205230712890625, -0.001953125, 0.0166168212890625, 0.035186767578125, 0.0537567138671875, 0.07232666015625, 0.0908966064453125, 0.109466552734375, 0.1280364990234375, 0.1466064453125, 0.1651763916015625, 0.183746337890625, 0.2023162841796875, 0.22088623046875, 0.2394561767578125, 0.258026123046875, 0.2765960693359375, 0.295166015625, 0.3137359619140625, 0.332305908203125, 0.3508758544921875, 0.36944580078125, 0.3880157470703125, 0.406585693359375, 0.4251556396484375, 0.4437255859375, 0.4622955322265625, 0.480865478515625, 0.4994354248046875, 0.51800537109375, 0.5365753173828125, 0.555145263671875, 0.5737152099609375, 0.59228515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 23.0, 26.0, 25.0, 33.0, 36.0, 39.0, 35.0, 50.0, 49.0, 49.0, 69.0, 33.0, 47.0, 51.0, 38.0, 42.0, 37.0, 37.0, 27.0, 30.0, 35.0, 25.0, 21.0, 14.0, 16.0, 15.0, 9.0, 4.0, 8.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5880661010742188, -0.5667572021484375, -0.5454483032226562, -0.524139404296875, -0.5028305053710938, -0.4815216064453125, -0.46021270751953125, -0.43890380859375, -0.41759490966796875, -0.3962860107421875, -0.37497711181640625, -0.353668212890625, -0.33235931396484375, -0.3110504150390625, -0.28974151611328125, -0.2684326171875, -0.24712371826171875, -0.2258148193359375, -0.20450592041015625, -0.183197021484375, -0.16188812255859375, -0.1405792236328125, -0.11927032470703125, -0.09796142578125, -0.07665252685546875, -0.0553436279296875, -0.03403472900390625, -0.012725830078125, 0.00858306884765625, 0.0298919677734375, 0.05120086669921875, 0.072509765625, 0.09381866455078125, 0.1151275634765625, 0.13643646240234375, 0.157745361328125, 0.17905426025390625, 0.2003631591796875, 0.22167205810546875, 0.24298095703125, 0.26428985595703125, 0.2855987548828125, 0.30690765380859375, 0.328216552734375, 0.34952545166015625, 0.3708343505859375, 0.39214324951171875, 0.4134521484375, 0.43476104736328125, 0.4560699462890625, 0.47737884521484375, 0.498687744140625, 0.5199966430664062, 0.5413055419921875, 0.5626144409179688, 0.58392333984375, 0.6052322387695312, 0.6265411376953125, 0.6478500366210938, 0.669158935546875, 0.6904678344726562, 0.7117767333984375, 0.7330856323242188, 0.75439453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 13.0, 4.0, 16.0, 15.0, 21.0, 25.0, 19.0, 51.0, 44.0, 76.0, 100.0, 151.0, 210.0, 346.0, 595.0, 1274.0, 3341.0, 10992.0, 44089.0, 203993.0, 601373.0, 138409.0, 30312.0, 7985.0, 2550.0, 1047.0, 490.0, 305.0, 204.0, 123.0, 121.0, 58.0, 40.0, 40.0, 25.0, 28.0, 23.0, 17.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.61328125, -1.56634521484375, -1.5194091796875, -1.47247314453125, -1.425537109375, -1.37860107421875, -1.3316650390625, -1.28472900390625, -1.23779296875, -1.19085693359375, -1.1439208984375, -1.09698486328125, -1.050048828125, -1.00311279296875, -0.9561767578125, -0.90924072265625, -0.8623046875, -0.81536865234375, -0.7684326171875, -0.72149658203125, -0.674560546875, -0.62762451171875, -0.5806884765625, -0.53375244140625, -0.48681640625, -0.43988037109375, -0.3929443359375, -0.34600830078125, -0.299072265625, -0.25213623046875, -0.2052001953125, -0.15826416015625, -0.111328125, -0.06439208984375, -0.0174560546875, 0.02947998046875, 0.076416015625, 0.12335205078125, 0.1702880859375, 0.21722412109375, 0.26416015625, 0.31109619140625, 0.3580322265625, 0.40496826171875, 0.451904296875, 0.49884033203125, 0.5457763671875, 0.59271240234375, 0.6396484375, 0.68658447265625, 0.7335205078125, 0.78045654296875, 0.827392578125, 0.87432861328125, 0.9212646484375, 0.96820068359375, 1.01513671875, 1.06207275390625, 1.1090087890625, 1.15594482421875, 1.202880859375, 1.24981689453125, 1.2967529296875, 1.34368896484375, 1.390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 7.0, 6.0, 4.0, 7.0, 9.0, 17.0, 15.0, 17.0, 22.0, 19.0, 31.0, 27.0, 35.0, 48.0, 44.0, 38.0, 39.0, 44.0, 44.0, 62.0, 50.0, 54.0, 44.0, 49.0, 42.0, 52.0, 31.0, 34.0, 19.0, 25.0, 15.0, 15.0, 12.0, 4.0, 7.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.338134765625, -2.26025390625, -2.182373046875, -2.1044921875, -2.026611328125, -1.94873046875, -1.870849609375, -1.79296875, -1.715087890625, -1.63720703125, -1.559326171875, -1.4814453125, -1.403564453125, -1.32568359375, -1.247802734375, -1.169921875, -1.092041015625, -1.01416015625, -0.936279296875, -0.8583984375, -0.780517578125, -0.70263671875, -0.624755859375, -0.546875, -0.468994140625, -0.39111328125, -0.313232421875, -0.2353515625, -0.157470703125, -0.07958984375, -0.001708984375, 0.076171875, 0.154052734375, 0.23193359375, 0.309814453125, 0.3876953125, 0.465576171875, 0.54345703125, 0.621337890625, 0.69921875, 0.777099609375, 0.85498046875, 0.932861328125, 1.0107421875, 1.088623046875, 1.16650390625, 1.244384765625, 1.322265625, 1.400146484375, 1.47802734375, 1.555908203125, 1.6337890625, 1.711669921875, 1.78955078125, 1.867431640625, 1.9453125, 2.023193359375, 2.10107421875, 2.178955078125, 2.2568359375, 2.334716796875, 2.41259765625, 2.490478515625, 2.568359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 6.0, 13.0, 18.0, 39.0, 77.0, 103.0, 164.0, 349.0, 659.0, 1552.0, 3636.0, 11490.0, 40641.0, 177124.0, 623349.0, 140857.0, 32800.0, 9559.0, 3360.0, 1372.0, 621.0, 343.0, 171.0, 106.0, 46.0, 32.0, 24.0, 8.0, 8.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52099609375, -0.5054092407226562, -0.4898223876953125, -0.47423553466796875, -0.458648681640625, -0.44306182861328125, -0.4274749755859375, -0.41188812255859375, -0.39630126953125, -0.38071441650390625, -0.3651275634765625, -0.34954071044921875, -0.333953857421875, -0.31836700439453125, -0.3027801513671875, -0.28719329833984375, -0.2716064453125, -0.25601959228515625, -0.2404327392578125, -0.22484588623046875, -0.209259033203125, -0.19367218017578125, -0.1780853271484375, -0.16249847412109375, -0.14691162109375, -0.13132476806640625, -0.1157379150390625, -0.10015106201171875, -0.084564208984375, -0.06897735595703125, -0.0533905029296875, -0.03780364990234375, -0.022216796875, -0.00662994384765625, 0.0089569091796875, 0.02454376220703125, 0.040130615234375, 0.05571746826171875, 0.0713043212890625, 0.08689117431640625, 0.10247802734375, 0.11806488037109375, 0.1336517333984375, 0.14923858642578125, 0.164825439453125, 0.18041229248046875, 0.1959991455078125, 0.21158599853515625, 0.2271728515625, 0.24275970458984375, 0.2583465576171875, 0.27393341064453125, 0.289520263671875, 0.30510711669921875, 0.3206939697265625, 0.33628082275390625, 0.35186767578125, 0.36745452880859375, 0.3830413818359375, 0.39862823486328125, 0.414215087890625, 0.42980194091796875, 0.4453887939453125, 0.46097564697265625, 0.4765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 13.0, 20.0, 35.0, 34.0, 55.0, 77.0, 120.0, 145.0, 131.0, 109.0, 89.0, 38.0, 31.0, 18.0, 19.0, 7.0, 9.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015581771731376648, -0.00014831870794296265, -0.0001408196985721588, -0.00013332068920135498, -0.00012582167983055115, -0.00011832267045974731, -0.00011082366108894348, -0.00010332465171813965, -9.582564234733582e-05, -8.832663297653198e-05, -8.082762360572815e-05, -7.332861423492432e-05, -6.582960486412048e-05, -5.833059549331665e-05, -5.083158612251282e-05, -4.3332576751708984e-05, -3.583356738090515e-05, -2.833455801010132e-05, -2.0835548639297485e-05, -1.3336539268493652e-05, -5.837529897689819e-06, 1.6614794731140137e-06, 9.160488843917847e-06, 1.665949821472168e-05, 2.4158507585525513e-05, 3.1657516956329346e-05, 3.915652632713318e-05, 4.665553569793701e-05, 5.4154545068740845e-05, 6.165355443954468e-05, 6.915256381034851e-05, 7.665157318115234e-05, 8.415058255195618e-05, 9.164959192276001e-05, 9.914860129356384e-05, 0.00010664761066436768, 0.00011414662003517151, 0.00012164562940597534, 0.00012914463877677917, 0.000136643648147583, 0.00014414265751838684, 0.00015164166688919067, 0.0001591406762599945, 0.00016663968563079834, 0.00017413869500160217, 0.000181637704372406, 0.00018913671374320984, 0.00019663572311401367, 0.0002041347324848175, 0.00021163374185562134, 0.00021913275122642517, 0.000226631760597229, 0.00023413076996803284, 0.00024162977933883667, 0.0002491287887096405, 0.00025662779808044434, 0.00026412680745124817, 0.000271625816822052, 0.00027912482619285583, 0.00028662383556365967, 0.0002941228449344635, 0.00030162185430526733, 0.00030912086367607117, 0.000316619873046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 14.0, 19.0, 33.0, 46.0, 78.0, 111.0, 223.0, 502.0, 1108.0, 3182.0, 11661.0, 58034.0, 343031.0, 543389.0, 68014.0, 13261.0, 3539.0, 1196.0, 495.0, 238.0, 132.0, 78.0, 52.0, 28.0, 21.0, 22.0, 13.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5162582397460938, -0.4978485107421875, -0.47943878173828125, -0.461029052734375, -0.44261932373046875, -0.4242095947265625, -0.40579986572265625, -0.38739013671875, -0.36898040771484375, -0.3505706787109375, -0.33216094970703125, -0.313751220703125, -0.29534149169921875, -0.2769317626953125, -0.25852203369140625, -0.2401123046875, -0.22170257568359375, -0.2032928466796875, -0.18488311767578125, -0.166473388671875, -0.14806365966796875, -0.1296539306640625, -0.11124420166015625, -0.09283447265625, -0.07442474365234375, -0.0560150146484375, -0.03760528564453125, -0.019195556640625, -0.00078582763671875, 0.0176239013671875, 0.03603363037109375, 0.054443359375, 0.07285308837890625, 0.0912628173828125, 0.10967254638671875, 0.128082275390625, 0.14649200439453125, 0.1649017333984375, 0.18331146240234375, 0.20172119140625, 0.22013092041015625, 0.2385406494140625, 0.25695037841796875, 0.275360107421875, 0.29376983642578125, 0.3121795654296875, 0.33058929443359375, 0.3489990234375, 0.36740875244140625, 0.3858184814453125, 0.40422821044921875, 0.422637939453125, 0.44104766845703125, 0.4594573974609375, 0.47786712646484375, 0.49627685546875, 0.5146865844726562, 0.5330963134765625, 0.5515060424804688, 0.569915771484375, 0.5883255004882812, 0.6067352294921875, 0.6251449584960938, 0.6435546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 11.0, 11.0, 15.0, 29.0, 27.0, 29.0, 42.0, 39.0, 73.0, 83.0, 91.0, 91.0, 80.0, 77.0, 53.0, 66.0, 41.0, 29.0, 27.0, 19.0, 18.0, 12.0, 9.0, 4.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.6296157836914062, -0.6107940673828125, -0.5919723510742188, -0.573150634765625, -0.5543289184570312, -0.5355072021484375, -0.5166854858398438, -0.49786376953125, -0.47904205322265625, -0.4602203369140625, -0.44139862060546875, -0.422576904296875, -0.40375518798828125, -0.3849334716796875, -0.36611175537109375, -0.3472900390625, -0.32846832275390625, -0.3096466064453125, -0.29082489013671875, -0.272003173828125, -0.25318145751953125, -0.2343597412109375, -0.21553802490234375, -0.19671630859375, -0.17789459228515625, -0.1590728759765625, -0.14025115966796875, -0.121429443359375, -0.10260772705078125, -0.0837860107421875, -0.06496429443359375, -0.046142578125, -0.02732086181640625, -0.0084991455078125, 0.01032257080078125, 0.029144287109375, 0.04796600341796875, 0.0667877197265625, 0.08560943603515625, 0.10443115234375, 0.12325286865234375, 0.1420745849609375, 0.16089630126953125, 0.179718017578125, 0.19853973388671875, 0.2173614501953125, 0.23618316650390625, 0.2550048828125, 0.27382659912109375, 0.2926483154296875, 0.31147003173828125, 0.330291748046875, 0.34911346435546875, 0.3679351806640625, 0.38675689697265625, 0.40557861328125, 0.42440032958984375, 0.4432220458984375, 0.46204376220703125, 0.480865478515625, 0.49968719482421875, 0.5185089111328125, 0.5373306274414062, 0.55615234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 19.0, 33.0, 74.0, 159.0, 325.0, 200.0, 103.0, 39.0, 21.0, 11.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.74115753173828, -17.211669921875, -16.68218421936035, -16.15269660949707, -15.623208999633789, -15.093722343444824, -14.56423568725586, -14.034748077392578, -13.505261421203613, -12.975774765014648, -12.446287155151367, -11.916800498962402, -11.387313842773438, -10.857826232910156, -10.328339576721191, -9.798852920532227, -9.269365310668945, -8.73987865447998, -8.2103910446167, -7.680904388427734, -7.151417255401611, -6.621930122375488, -6.092443466186523, -5.5629563331604, -5.033469200134277, -4.503982067108154, -3.9744951725006104, -3.4450082778930664, -2.9155211448669434, -2.3860340118408203, -1.8565471172332764, -1.3270602226257324, -0.7975730895996094, -0.2680860757827759, 0.2614009380340576, 0.7908879518508911, 1.3203749656677246, 1.8498620986938477, 2.3793489933013916, 2.9088358879089355, 3.4383230209350586, 3.9678101539611816, 4.497297286987305, 5.0267839431762695, 5.556271076202393, 6.085758209228516, 6.6152448654174805, 7.1447319984436035, 7.674219131469727, 8.203705787658691, 8.733193397521973, 9.262680053710938, 9.792167663574219, 10.321654319763184, 10.851140975952148, 11.38062858581543, 11.910115242004395, 12.43960189819336, 12.96908950805664, 13.498576164245605, 14.02806282043457, 14.557550430297852, 15.087037086486816, 15.616523742675781, 16.146011352539062]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 5.0, 9.0, 8.0, 17.0, 12.0, 13.0, 16.0, 19.0, 22.0, 28.0, 30.0, 29.0, 30.0, 29.0, 35.0, 50.0, 55.0, 88.0, 76.0, 61.0, 37.0, 31.0, 34.0, 22.0, 33.0, 30.0, 16.0, 18.0, 31.0, 19.0, 15.0, 10.0, 7.0, 8.0, 9.0, 4.0, 7.0, 8.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-8.921832084655762, -8.66435432434082, -8.406875610351562, -8.149396896362305, -7.891919136047363, -7.634440898895264, -7.376962661743164, -7.1194844245910645, -6.862006187438965, -6.604527950286865, -6.347049713134766, -6.089571475982666, -5.832093238830566, -5.574615001678467, -5.317136764526367, -5.059658527374268, -4.802180290222168, -4.544702053070068, -4.287223815917969, -4.029745578765869, -3.7722673416137695, -3.51478910446167, -3.2573108673095703, -2.9998326301574707, -2.742354393005371, -2.4848761558532715, -2.227397918701172, -1.9699196815490723, -1.7124414443969727, -1.454963207244873, -1.1974849700927734, -0.9400067329406738, -0.6825294494628906, -0.425051212310791, -0.1675729751586914, 0.0899052619934082, 0.3473834991455078, 0.6048617362976074, 0.862339973449707, 1.1198182106018066, 1.3772964477539062, 1.6347746849060059, 1.8922529220581055, 2.149731159210205, 2.4072093963623047, 2.6646876335144043, 2.922165870666504, 3.1796441078186035, 3.437122344970703, 3.6946005821228027, 3.9520788192749023, 4.209557056427002, 4.467035293579102, 4.724513530731201, 4.981991767883301, 5.2394700050354, 5.4969482421875, 5.7544264793396, 6.011904716491699, 6.269382953643799, 6.526861190795898, 6.784339427947998, 7.041817665100098, 7.299295902252197, 7.556774139404297]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 12.0, 12.0, 9.0, 18.0, 31.0, 51.0, 46.0, 80.0, 109.0, 163.0, 259.0, 390.0, 568.0, 889.0, 1470.0, 2514.0, 4951.0, 11363.0, 37048.0, 169603.0, 830838.0, 2041584.0, 870289.0, 163108.0, 35892.0, 11395.0, 4943.0, 2540.0, 1415.0, 875.0, 558.0, 388.0, 253.0, 177.0, 130.0, 101.0, 63.0, 45.0, 28.0, 19.0, 14.0, 13.0, 5.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5108871459960938, -0.4929656982421875, -0.47504425048828125, -0.457122802734375, -0.43920135498046875, -0.4212799072265625, -0.40335845947265625, -0.38543701171875, -0.36751556396484375, -0.3495941162109375, -0.33167266845703125, -0.313751220703125, -0.29582977294921875, -0.2779083251953125, -0.25998687744140625, -0.2420654296875, -0.22414398193359375, -0.2062225341796875, -0.18830108642578125, -0.170379638671875, -0.15245819091796875, -0.1345367431640625, -0.11661529541015625, -0.09869384765625, -0.08077239990234375, -0.0628509521484375, -0.04492950439453125, -0.027008056640625, -0.00908660888671875, 0.0088348388671875, 0.02675628662109375, 0.044677734375, 0.06259918212890625, 0.0805206298828125, 0.09844207763671875, 0.116363525390625, 0.13428497314453125, 0.1522064208984375, 0.17012786865234375, 0.18804931640625, 0.20597076416015625, 0.2238922119140625, 0.24181365966796875, 0.259735107421875, 0.27765655517578125, 0.2955780029296875, 0.31349945068359375, 0.3314208984375, 0.34934234619140625, 0.3672637939453125, 0.38518524169921875, 0.403106689453125, 0.42102813720703125, 0.4389495849609375, 0.45687103271484375, 0.47479248046875, 0.49271392822265625, 0.5106353759765625, 0.5285568237304688, 0.546478271484375, 0.5643997192382812, 0.5823211669921875, 0.6002426147460938, 0.6181640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 1.0, 4.0, 8.0, 10.0, 10.0, 7.0, 15.0, 29.0, 23.0, 30.0, 40.0, 31.0, 42.0, 35.0, 47.0, 45.0, 50.0, 58.0, 49.0, 42.0, 47.0, 44.0, 37.0, 42.0, 21.0, 35.0, 32.0, 25.0, 19.0, 20.0, 26.0, 24.0, 15.0, 4.0, 12.0, 7.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61376953125, -0.5949630737304688, -0.5761566162109375, -0.5573501586914062, -0.538543701171875, -0.5197372436523438, -0.5009307861328125, -0.48212432861328125, -0.46331787109375, -0.44451141357421875, -0.4257049560546875, -0.40689849853515625, -0.388092041015625, -0.36928558349609375, -0.3504791259765625, -0.33167266845703125, -0.3128662109375, -0.29405975341796875, -0.2752532958984375, -0.25644683837890625, -0.237640380859375, -0.21883392333984375, -0.2000274658203125, -0.18122100830078125, -0.16241455078125, -0.14360809326171875, -0.1248016357421875, -0.10599517822265625, -0.087188720703125, -0.06838226318359375, -0.0495758056640625, -0.03076934814453125, -0.011962890625, 0.00684356689453125, 0.0256500244140625, 0.04445648193359375, 0.063262939453125, 0.08206939697265625, 0.1008758544921875, 0.11968231201171875, 0.13848876953125, 0.15729522705078125, 0.1761016845703125, 0.19490814208984375, 0.213714599609375, 0.23252105712890625, 0.2513275146484375, 0.27013397216796875, 0.2889404296875, 0.30774688720703125, 0.3265533447265625, 0.34535980224609375, 0.364166259765625, 0.38297271728515625, 0.4017791748046875, 0.42058563232421875, 0.43939208984375, 0.45819854736328125, 0.4770050048828125, 0.49581146240234375, 0.514617919921875, 0.5334243774414062, 0.5522308349609375, 0.5710372924804688, 0.58984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 16.0, 25.0, 52.0, 162.0, 404.0, 2203.0, 317807.0, 3867955.0, 4624.0, 654.0, 209.0, 86.0, 41.0, 24.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.658935546875, -4.50927734375, -4.359619140625, -4.2099609375, -4.060302734375, -3.91064453125, -3.760986328125, -3.611328125, -3.461669921875, -3.31201171875, -3.162353515625, -3.0126953125, -2.863037109375, -2.71337890625, -2.563720703125, -2.4140625, -2.264404296875, -2.11474609375, -1.965087890625, -1.8154296875, -1.665771484375, -1.51611328125, -1.366455078125, -1.216796875, -1.067138671875, -0.91748046875, -0.767822265625, -0.6181640625, -0.468505859375, -0.31884765625, -0.169189453125, -0.01953125, 0.130126953125, 0.27978515625, 0.429443359375, 0.5791015625, 0.728759765625, 0.87841796875, 1.028076171875, 1.177734375, 1.327392578125, 1.47705078125, 1.626708984375, 1.7763671875, 1.926025390625, 2.07568359375, 2.225341796875, 2.375, 2.524658203125, 2.67431640625, 2.823974609375, 2.9736328125, 3.123291015625, 3.27294921875, 3.422607421875, 3.572265625, 3.721923828125, 3.87158203125, 4.021240234375, 4.1708984375, 4.320556640625, 4.47021484375, 4.619873046875, 4.76953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 10.0, 24.0, 14.0, 40.0, 84.0, 145.0, 339.0, 804.0, 1085.0, 787.0, 364.0, 182.0, 78.0, 44.0, 31.0, 15.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1865234375, -1.1287078857421875, -1.070892333984375, -1.0130767822265625, -0.95526123046875, -0.8974456787109375, -0.839630126953125, -0.7818145751953125, -0.7239990234375, -0.6661834716796875, -0.608367919921875, -0.5505523681640625, -0.49273681640625, -0.4349212646484375, -0.377105712890625, -0.3192901611328125, -0.261474609375, -0.2036590576171875, -0.145843505859375, -0.0880279541015625, -0.03021240234375, 0.0276031494140625, 0.085418701171875, 0.1432342529296875, 0.2010498046875, 0.2588653564453125, 0.316680908203125, 0.3744964599609375, 0.43231201171875, 0.4901275634765625, 0.547943115234375, 0.6057586669921875, 0.66357421875, 0.7213897705078125, 0.779205322265625, 0.8370208740234375, 0.89483642578125, 0.9526519775390625, 1.010467529296875, 1.0682830810546875, 1.1260986328125, 1.1839141845703125, 1.241729736328125, 1.2995452880859375, 1.35736083984375, 1.4151763916015625, 1.472991943359375, 1.5308074951171875, 1.588623046875, 1.6464385986328125, 1.704254150390625, 1.7620697021484375, 1.81988525390625, 1.8777008056640625, 1.935516357421875, 1.9933319091796875, 2.0511474609375, 2.1089630126953125, 2.166778564453125, 2.2245941162109375, 2.28240966796875, 2.3402252197265625, 2.398040771484375, 2.4558563232421875, 2.513671875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 13.0, 22.0, 55.0, 204.0, 299.0, 256.0, 99.0, 28.0, 16.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.188379287719727, -12.54666519165039, -11.904952049255371, -11.263237953186035, -10.6215238571167, -9.97981071472168, -9.338096618652344, -8.696382522583008, -8.054668426513672, -7.412954807281494, -6.771240711212158, -6.1295270919799805, -5.4878129959106445, -4.846099376678467, -4.204385757446289, -3.562671661376953, -2.9209585189819336, -2.2792446613311768, -1.6375309228897095, -0.9958171844482422, -0.35410332679748535, 0.2876105308532715, 0.9293241500854492, 1.5710382461547852, 2.212751865386963, 2.8544657230377197, 3.4961795806884766, 4.137893199920654, 4.779606819152832, 5.421320915222168, 6.063034534454346, 6.704748630523682, 7.346462249755859, 7.988175868988037, 8.629889488220215, 9.27160358428955, 9.913317680358887, 10.555030822753906, 11.196744918823242, 11.838459014892578, 12.480173110961914, 13.12188720703125, 13.76360034942627, 14.405314445495605, 15.047028541564941, 15.688741683959961, 16.330455780029297, 16.972169876098633, 17.61388397216797, 18.255598068237305, 18.89731216430664, 19.539024353027344, 20.18073844909668, 20.822452545166016, 21.46416664123535, 22.105880737304688, 22.74759292602539, 23.389307022094727, 24.031021118164062, 24.672733306884766, 25.3144474029541, 25.956161499023438, 26.597875595092773, 27.23958969116211, 27.881303787231445]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 6.0, 10.0, 7.0, 10.0, 12.0, 20.0, 21.0, 20.0, 22.0, 51.0, 38.0, 39.0, 51.0, 56.0, 56.0, 49.0, 50.0, 43.0, 66.0, 53.0, 41.0, 31.0, 55.0, 38.0, 38.0, 21.0, 20.0, 17.0, 12.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.450509548187256, -7.235997200012207, -7.021484851837158, -6.806972503662109, -6.592460632324219, -6.377947807312012, -6.163435935974121, -5.948923587799072, -5.734411239624023, -5.519898891448975, -5.305386543273926, -5.090874195098877, -4.876361846923828, -4.6618499755859375, -4.447337627410889, -4.23282527923584, -4.018312931060791, -3.803800582885742, -3.5892882347106934, -3.3747761249542236, -3.160263776779175, -2.945751428604126, -2.7312393188476562, -2.5167269706726074, -2.3022146224975586, -2.0877022743225098, -1.8731900453567505, -1.6586778163909912, -1.4441654682159424, -1.2296531200408936, -1.0151408910751343, -0.800628662109375, -0.5861167907714844, -0.3716045022010803, -0.15709221363067627, 0.05742007493972778, 0.27193236351013184, 0.48644471168518066, 0.7009569406509399, 0.9154691696166992, 1.129981517791748, 1.3444938659667969, 1.5590060949325562, 1.7735183238983154, 1.9880306720733643, 2.202543020248413, 2.417055130004883, 2.6315674781799316, 2.8460798263549805, 3.0605921745300293, 3.275104522705078, 3.489616632461548, 3.7041289806365967, 3.9186413288116455, 4.133153438568115, 4.347665786743164, 4.562178134918213, 4.776690483093262, 4.9912028312683105, 5.205715179443359, 5.42022705078125, 5.634739875793457, 5.849251747131348, 6.0637640953063965, 6.278276443481445]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 14.0, 20.0, 35.0, 38.0, 70.0, 72.0, 154.0, 213.0, 291.0, 508.0, 725.0, 1230.0, 2042.0, 3146.0, 5205.0, 9251.0, 15775.0, 27693.0, 49693.0, 89325.0, 156435.0, 223943.0, 193733.0, 117800.0, 65269.0, 36076.0, 20480.0, 11829.0, 6909.0, 4027.0, 2445.0, 1504.0, 929.0, 568.0, 369.0, 233.0, 164.0, 88.0, 79.0, 64.0, 27.0, 31.0, 13.0, 12.0, 4.0, 10.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.467041015625, -0.4507865905761719, -0.43453216552734375, -0.4182777404785156, -0.4020233154296875, -0.3857688903808594, -0.36951446533203125, -0.3532600402832031, -0.337005615234375, -0.3207511901855469, -0.30449676513671875, -0.2882423400878906, -0.2719879150390625, -0.2557334899902344, -0.23947906494140625, -0.22322463989257812, -0.20697021484375, -0.19071578979492188, -0.17446136474609375, -0.15820693969726562, -0.1419525146484375, -0.12569808959960938, -0.10944366455078125, -0.09318923950195312, -0.076934814453125, -0.060680389404296875, -0.04442596435546875, -0.028171539306640625, -0.0119171142578125, 0.004337310791015625, 0.02059173583984375, 0.036846160888671875, 0.0531005859375, 0.06935501098632812, 0.08560943603515625, 0.10186386108398438, 0.1181182861328125, 0.13437271118164062, 0.15062713623046875, 0.16688156127929688, 0.183135986328125, 0.19939041137695312, 0.21564483642578125, 0.23189926147460938, 0.2481536865234375, 0.2644081115722656, 0.28066253662109375, 0.2969169616699219, 0.31317138671875, 0.3294258117675781, 0.34568023681640625, 0.3619346618652344, 0.3781890869140625, 0.3944435119628906, 0.41069793701171875, 0.4269523620605469, 0.443206787109375, 0.4594612121582031, 0.47571563720703125, 0.4919700622558594, 0.5082244873046875, 0.5244789123535156, 0.5407333374023438, 0.5569877624511719, 0.5732421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 7.0, 5.0, 9.0, 10.0, 8.0, 19.0, 25.0, 18.0, 17.0, 26.0, 41.0, 36.0, 47.0, 40.0, 44.0, 52.0, 46.0, 45.0, 37.0, 54.0, 36.0, 48.0, 48.0, 24.0, 26.0, 38.0, 28.0, 29.0, 20.0, 24.0, 15.0, 19.0, 14.0, 6.0, 4.0, 7.0, 6.0, 3.0, 7.0, 0.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5100021362304688, -0.4911956787109375, -0.47238922119140625, -0.453582763671875, -0.43477630615234375, -0.4159698486328125, -0.39716339111328125, -0.37835693359375, -0.35955047607421875, -0.3407440185546875, -0.32193756103515625, -0.303131103515625, -0.28432464599609375, -0.2655181884765625, -0.24671173095703125, -0.2279052734375, -0.20909881591796875, -0.1902923583984375, -0.17148590087890625, -0.152679443359375, -0.13387298583984375, -0.1150665283203125, -0.09626007080078125, -0.07745361328125, -0.05864715576171875, -0.0398406982421875, -0.02103424072265625, -0.002227783203125, 0.01657867431640625, 0.0353851318359375, 0.05419158935546875, 0.072998046875, 0.09180450439453125, 0.1106109619140625, 0.12941741943359375, 0.148223876953125, 0.16703033447265625, 0.1858367919921875, 0.20464324951171875, 0.22344970703125, 0.24225616455078125, 0.2610626220703125, 0.27986907958984375, 0.298675537109375, 0.31748199462890625, 0.3362884521484375, 0.35509490966796875, 0.3739013671875, 0.39270782470703125, 0.4115142822265625, 0.43032073974609375, 0.449127197265625, 0.46793365478515625, 0.4867401123046875, 0.5055465698242188, 0.52435302734375, 0.5431594848632812, 0.5619659423828125, 0.5807723999023438, 0.599578857421875, 0.6183853149414062, 0.6371917724609375, 0.6559982299804688, 0.6748046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 9.0, 8.0, 11.0, 18.0, 22.0, 25.0, 69.0, 73.0, 127.0, 205.0, 378.0, 770.0, 2221.0, 11783.0, 132598.0, 821244.0, 68295.0, 7373.0, 1735.0, 688.0, 357.0, 178.0, 129.0, 80.0, 47.0, 32.0, 27.0, 16.0, 14.0, 3.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.589935302734375, -2.50994873046875, -2.429962158203125, -2.3499755859375, -2.269989013671875, -2.19000244140625, -2.110015869140625, -2.030029296875, -1.950042724609375, -1.87005615234375, -1.790069580078125, -1.7100830078125, -1.630096435546875, -1.55010986328125, -1.470123291015625, -1.39013671875, -1.310150146484375, -1.23016357421875, -1.150177001953125, -1.0701904296875, -0.990203857421875, -0.91021728515625, -0.830230712890625, -0.750244140625, -0.670257568359375, -0.59027099609375, -0.510284423828125, -0.4302978515625, -0.350311279296875, -0.27032470703125, -0.190338134765625, -0.1103515625, -0.030364990234375, 0.04962158203125, 0.129608154296875, 0.2095947265625, 0.289581298828125, 0.36956787109375, 0.449554443359375, 0.529541015625, 0.609527587890625, 0.68951416015625, 0.769500732421875, 0.8494873046875, 0.929473876953125, 1.00946044921875, 1.089447021484375, 1.16943359375, 1.249420166015625, 1.32940673828125, 1.409393310546875, 1.4893798828125, 1.569366455078125, 1.64935302734375, 1.729339599609375, 1.809326171875, 1.889312744140625, 1.96929931640625, 2.049285888671875, 2.1292724609375, 2.209259033203125, 2.28924560546875, 2.369232177734375, 2.44921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 13.0, 9.0, 11.0, 17.0, 21.0, 18.0, 26.0, 29.0, 31.0, 33.0, 38.0, 45.0, 37.0, 57.0, 50.0, 66.0, 52.0, 57.0, 36.0, 44.0, 36.0, 35.0, 29.0, 26.0, 37.0, 21.0, 20.0, 15.0, 11.0, 4.0, 18.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.171875, -2.10394287109375, -2.0360107421875, -1.96807861328125, -1.900146484375, -1.83221435546875, -1.7642822265625, -1.69635009765625, -1.62841796875, -1.56048583984375, -1.4925537109375, -1.42462158203125, -1.356689453125, -1.28875732421875, -1.2208251953125, -1.15289306640625, -1.0849609375, -1.01702880859375, -0.9490966796875, -0.88116455078125, -0.813232421875, -0.74530029296875, -0.6773681640625, -0.60943603515625, -0.54150390625, -0.47357177734375, -0.4056396484375, -0.33770751953125, -0.269775390625, -0.20184326171875, -0.1339111328125, -0.06597900390625, 0.001953125, 0.06988525390625, 0.1378173828125, 0.20574951171875, 0.273681640625, 0.34161376953125, 0.4095458984375, 0.47747802734375, 0.54541015625, 0.61334228515625, 0.6812744140625, 0.74920654296875, 0.817138671875, 0.88507080078125, 0.9530029296875, 1.02093505859375, 1.0888671875, 1.15679931640625, 1.2247314453125, 1.29266357421875, 1.360595703125, 1.42852783203125, 1.4964599609375, 1.56439208984375, 1.63232421875, 1.70025634765625, 1.7681884765625, 1.83612060546875, 1.904052734375, 1.97198486328125, 2.0399169921875, 2.10784912109375, 2.17578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 14.0, 13.0, 30.0, 45.0, 77.0, 109.0, 245.0, 671.0, 2086.0, 8020.0, 54119.0, 796102.0, 164318.0, 17108.0, 3666.0, 1099.0, 415.0, 149.0, 92.0, 51.0, 31.0, 18.0, 23.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.77880859375, -0.7534561157226562, -0.7281036376953125, -0.7027511596679688, -0.677398681640625, -0.6520462036132812, -0.6266937255859375, -0.6013412475585938, -0.57598876953125, -0.5506362915039062, -0.5252838134765625, -0.49993133544921875, -0.474578857421875, -0.44922637939453125, -0.4238739013671875, -0.39852142333984375, -0.3731689453125, -0.34781646728515625, -0.3224639892578125, -0.29711151123046875, -0.271759033203125, -0.24640655517578125, -0.2210540771484375, -0.19570159912109375, -0.17034912109375, -0.14499664306640625, -0.1196441650390625, -0.09429168701171875, -0.068939208984375, -0.04358673095703125, -0.0182342529296875, 0.00711822509765625, 0.032470703125, 0.05782318115234375, 0.0831756591796875, 0.10852813720703125, 0.133880615234375, 0.15923309326171875, 0.1845855712890625, 0.20993804931640625, 0.23529052734375, 0.26064300537109375, 0.2859954833984375, 0.31134796142578125, 0.336700439453125, 0.36205291748046875, 0.3874053955078125, 0.41275787353515625, 0.4381103515625, 0.46346282958984375, 0.4888153076171875, 0.5141677856445312, 0.539520263671875, 0.5648727416992188, 0.5902252197265625, 0.6155776977539062, 0.64093017578125, 0.6662826538085938, 0.6916351318359375, 0.7169876098632812, 0.742340087890625, 0.7676925659179688, 0.7930450439453125, 0.8183975219726562, 0.84375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 30.0, 37.0, 52.0, 85.0, 148.0, 177.0, 166.0, 118.0, 65.0, 39.0, 23.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003266334533691406, -0.000317256897687912, -0.00030788034200668335, -0.0002985037863254547, -0.0002891272306442261, -0.00027975067496299744, -0.0002703741192817688, -0.00026099756360054016, -0.0002516210079193115, -0.00024224445223808289, -0.00023286789655685425, -0.0002234913408756256, -0.00021411478519439697, -0.00020473822951316833, -0.0001953616738319397, -0.00018598511815071106, -0.00017660856246948242, -0.00016723200678825378, -0.00015785545110702515, -0.0001484788954257965, -0.00013910233974456787, -0.00012972578406333923, -0.0001203492283821106, -0.00011097267270088196, -0.00010159611701965332, -9.221956133842468e-05, -8.284300565719604e-05, -7.346644997596741e-05, -6.408989429473877e-05, -5.471333861351013e-05, -4.5336782932281494e-05, -3.5960227251052856e-05, -2.658367156982422e-05, -1.720711588859558e-05, -7.830560207366943e-06, 1.5459954738616943e-06, 1.0922551155090332e-05, 2.029910683631897e-05, 2.9675662517547607e-05, 3.9052218198776245e-05, 4.842877388000488e-05, 5.780532956123352e-05, 6.718188524246216e-05, 7.65584409236908e-05, 8.593499660491943e-05, 9.531155228614807e-05, 0.00010468810796737671, 0.00011406466364860535, 0.00012344121932983398, 0.00013281777501106262, 0.00014219433069229126, 0.0001515708863735199, 0.00016094744205474854, 0.00017032399773597717, 0.0001797005534172058, 0.00018907710909843445, 0.00019845366477966309, 0.00020783022046089172, 0.00021720677614212036, 0.000226583331823349, 0.00023595988750457764, 0.0002453364431858063, 0.0002547129988670349, 0.00026408955454826355, 0.0002734661102294922]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 5.0, 8.0, 10.0, 34.0, 44.0, 100.0, 327.0, 1349.0, 26678.0, 1004701.0, 13735.0, 1089.0, 284.0, 93.0, 36.0, 33.0, 8.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.247100830078125, -2.17779541015625, -2.108489990234375, -2.0391845703125, -1.969879150390625, -1.90057373046875, -1.831268310546875, -1.761962890625, -1.692657470703125, -1.62335205078125, -1.554046630859375, -1.4847412109375, -1.415435791015625, -1.34613037109375, -1.276824951171875, -1.20751953125, -1.138214111328125, -1.06890869140625, -0.999603271484375, -0.9302978515625, -0.860992431640625, -0.79168701171875, -0.722381591796875, -0.653076171875, -0.583770751953125, -0.51446533203125, -0.445159912109375, -0.3758544921875, -0.306549072265625, -0.23724365234375, -0.167938232421875, -0.0986328125, -0.029327392578125, 0.03997802734375, 0.109283447265625, 0.1785888671875, 0.247894287109375, 0.31719970703125, 0.386505126953125, 0.455810546875, 0.525115966796875, 0.59442138671875, 0.663726806640625, 0.7330322265625, 0.802337646484375, 0.87164306640625, 0.940948486328125, 1.01025390625, 1.079559326171875, 1.14886474609375, 1.218170166015625, 1.2874755859375, 1.356781005859375, 1.42608642578125, 1.495391845703125, 1.564697265625, 1.634002685546875, 1.70330810546875, 1.772613525390625, 1.8419189453125, 1.911224365234375, 1.98052978515625, 2.049835205078125, 2.119140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 13.0, 27.0, 90.0, 186.0, 266.0, 195.0, 119.0, 50.0, 17.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6279296875, -1.579620361328125, -1.53131103515625, -1.483001708984375, -1.4346923828125, -1.386383056640625, -1.33807373046875, -1.289764404296875, -1.241455078125, -1.193145751953125, -1.14483642578125, -1.096527099609375, -1.0482177734375, -0.999908447265625, -0.95159912109375, -0.903289794921875, -0.85498046875, -0.806671142578125, -0.75836181640625, -0.710052490234375, -0.6617431640625, -0.613433837890625, -0.56512451171875, -0.516815185546875, -0.468505859375, -0.420196533203125, -0.37188720703125, -0.323577880859375, -0.2752685546875, -0.226959228515625, -0.17864990234375, -0.130340576171875, -0.08203125, -0.033721923828125, 0.01458740234375, 0.062896728515625, 0.1112060546875, 0.159515380859375, 0.20782470703125, 0.256134033203125, 0.304443359375, 0.352752685546875, 0.40106201171875, 0.449371337890625, 0.4976806640625, 0.545989990234375, 0.59429931640625, 0.642608642578125, 0.69091796875, 0.739227294921875, 0.78753662109375, 0.835845947265625, 0.8841552734375, 0.932464599609375, 0.98077392578125, 1.029083251953125, 1.077392578125, 1.125701904296875, 1.17401123046875, 1.222320556640625, 1.2706298828125, 1.318939208984375, 1.36724853515625, 1.415557861328125, 1.4638671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 12.0, 27.0, 72.0, 119.0, 317.0, 283.0, 101.0, 43.0, 15.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.00189971923828, -29.363317489624023, -28.724735260009766, -28.086153030395508, -27.44757080078125, -26.80898666381836, -26.1704044342041, -25.531822204589844, -24.893239974975586, -24.254657745361328, -23.61607551574707, -22.977493286132812, -22.338909149169922, -21.700326919555664, -21.061744689941406, -20.42316246032715, -19.78458023071289, -19.145998001098633, -18.507415771484375, -17.868833541870117, -17.23025131225586, -16.59166717529297, -15.953084945678711, -15.314502716064453, -14.675920486450195, -14.037338256835938, -13.39875602722168, -12.760172843933105, -12.121590614318848, -11.48300838470459, -10.844425201416016, -10.205842971801758, -9.5672607421875, -8.928678512573242, -8.290096282958984, -7.65151309967041, -7.012930870056152, -6.3743486404418945, -5.7357659339904785, -5.0971832275390625, -4.458600997924805, -3.8200185298919678, -3.181436061859131, -2.542853593826294, -1.904271125793457, -1.2656886577606201, -0.6271061897277832, 0.011476516723632812, 0.6500587463378906, 1.2886412143707275, 1.9272236824035645, 2.5658061504364014, 3.2043886184692383, 3.842971086502075, 4.481553554534912, 5.120136260986328, 5.758718490600586, 6.397300720214844, 7.03588342666626, 7.674466133117676, 8.313048362731934, 8.951630592346191, 9.590213775634766, 10.228796005249023, 10.867378234863281]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 4.0, 13.0, 11.0, 7.0, 16.0, 17.0, 16.0, 17.0, 18.0, 18.0, 28.0, 37.0, 23.0, 26.0, 32.0, 42.0, 48.0, 103.0, 102.0, 66.0, 32.0, 27.0, 26.0, 32.0, 30.0, 33.0, 25.0, 14.0, 18.0, 7.0, 5.0, 10.0, 8.0, 12.0, 9.0, 6.0, 12.0, 2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.52434778213501, -7.28047513961792, -7.03660249710083, -6.79272985458374, -6.54885721206665, -6.3049845695495605, -6.0611114501953125, -5.817238807678223, -5.573366165161133, -5.329493522644043, -5.085620880126953, -4.841748237609863, -4.597875595092773, -4.354002952575684, -4.110130310058594, -3.866257429122925, -3.622385025024414, -3.378512382507324, -3.1346397399902344, -2.8907670974731445, -2.6468944549560547, -2.403021812438965, -2.159148931503296, -1.915276288986206, -1.6714036464691162, -1.4275310039520264, -1.1836583614349365, -0.9397855997085571, -0.6959129571914673, -0.45204031467437744, -0.20816755294799805, 0.0357050895690918, 0.27957820892333984, 0.5234508514404297, 0.7673235535621643, 1.011196255683899, 1.2550688982009888, 1.4989415407180786, 1.742814302444458, 1.9866869449615479, 2.2305595874786377, 2.4744322299957275, 2.7183048725128174, 2.9621777534484863, 3.206050395965576, 3.449923038482666, 3.693795680999756, 3.9376683235168457, 4.1815409660339355, 4.425413608551025, 4.669286251068115, 4.913158893585205, 5.157031536102295, 5.400904178619385, 5.644777297973633, 5.888649940490723, 6.1325225830078125, 6.376395225524902, 6.620267868041992, 6.864140510559082, 7.108013153076172, 7.351885795593262, 7.595758438110352, 7.839631080627441, 8.083503723144531]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 12.0, 14.0, 27.0, 30.0, 62.0, 68.0, 113.0, 152.0, 253.0, 453.0, 821.0, 1372.0, 2826.0, 6271.0, 17395.0, 64374.0, 282624.0, 1158681.0, 1865685.0, 612018.0, 130787.0, 31826.0, 9844.0, 4040.0, 1927.0, 1059.0, 554.0, 357.0, 215.0, 129.0, 93.0, 54.0, 40.0, 25.0, 20.0, 17.0, 7.0, 10.0, 5.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.60693359375, -0.58868408203125, -0.5704345703125, -0.55218505859375, -0.533935546875, -0.51568603515625, -0.4974365234375, -0.47918701171875, -0.4609375, -0.44268798828125, -0.4244384765625, -0.40618896484375, -0.387939453125, -0.36968994140625, -0.3514404296875, -0.33319091796875, -0.31494140625, -0.29669189453125, -0.2784423828125, -0.26019287109375, -0.241943359375, -0.22369384765625, -0.2054443359375, -0.18719482421875, -0.1689453125, -0.15069580078125, -0.1324462890625, -0.11419677734375, -0.095947265625, -0.07769775390625, -0.0594482421875, -0.04119873046875, -0.02294921875, -0.00469970703125, 0.0135498046875, 0.03179931640625, 0.050048828125, 0.06829833984375, 0.0865478515625, 0.10479736328125, 0.123046875, 0.14129638671875, 0.1595458984375, 0.17779541015625, 0.196044921875, 0.21429443359375, 0.2325439453125, 0.25079345703125, 0.26904296875, 0.28729248046875, 0.3055419921875, 0.32379150390625, 0.342041015625, 0.36029052734375, 0.3785400390625, 0.39678955078125, 0.4150390625, 0.43328857421875, 0.4515380859375, 0.46978759765625, 0.488037109375, 0.50628662109375, 0.5245361328125, 0.54278564453125, 0.56103515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 0.0, 9.0, 6.0, 10.0, 10.0, 9.0, 15.0, 12.0, 21.0, 22.0, 21.0, 25.0, 37.0, 33.0, 35.0, 31.0, 42.0, 34.0, 43.0, 41.0, 45.0, 34.0, 34.0, 58.0, 34.0, 34.0, 35.0, 22.0, 37.0, 30.0, 33.0, 21.0, 14.0, 13.0, 21.0, 15.0, 13.0, 10.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.52099609375, -0.504150390625, -0.4873046875, -0.470458984375, -0.45361328125, -0.436767578125, -0.419921875, -0.403076171875, -0.38623046875, -0.369384765625, -0.3525390625, -0.335693359375, -0.31884765625, -0.302001953125, -0.28515625, -0.268310546875, -0.25146484375, -0.234619140625, -0.2177734375, -0.200927734375, -0.18408203125, -0.167236328125, -0.150390625, -0.133544921875, -0.11669921875, -0.099853515625, -0.0830078125, -0.066162109375, -0.04931640625, -0.032470703125, -0.015625, 0.001220703125, 0.01806640625, 0.034912109375, 0.0517578125, 0.068603515625, 0.08544921875, 0.102294921875, 0.119140625, 0.135986328125, 0.15283203125, 0.169677734375, 0.1865234375, 0.203369140625, 0.22021484375, 0.237060546875, 0.25390625, 0.270751953125, 0.28759765625, 0.304443359375, 0.3212890625, 0.338134765625, 0.35498046875, 0.371826171875, 0.388671875, 0.405517578125, 0.42236328125, 0.439208984375, 0.4560546875, 0.472900390625, 0.48974609375, 0.506591796875, 0.5234375, 0.540283203125, 0.55712890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 17.0, 41.0, 117.0, 290.0, 1041.0, 19763.0, 4152367.0, 19013.0, 1106.0, 295.0, 116.0, 52.0, 27.0, 10.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.21209716796875, -4.0531005859375, -3.89410400390625, -3.735107421875, -3.57611083984375, -3.4171142578125, -3.25811767578125, -3.09912109375, -2.94012451171875, -2.7811279296875, -2.62213134765625, -2.463134765625, -2.30413818359375, -2.1451416015625, -1.98614501953125, -1.8271484375, -1.66815185546875, -1.5091552734375, -1.35015869140625, -1.191162109375, -1.03216552734375, -0.8731689453125, -0.71417236328125, -0.55517578125, -0.39617919921875, -0.2371826171875, -0.07818603515625, 0.080810546875, 0.23980712890625, 0.3988037109375, 0.55780029296875, 0.716796875, 0.87579345703125, 1.0347900390625, 1.19378662109375, 1.352783203125, 1.51177978515625, 1.6707763671875, 1.82977294921875, 1.98876953125, 2.14776611328125, 2.3067626953125, 2.46575927734375, 2.624755859375, 2.78375244140625, 2.9427490234375, 3.10174560546875, 3.2607421875, 3.41973876953125, 3.5787353515625, 3.73773193359375, 3.896728515625, 4.05572509765625, 4.2147216796875, 4.37371826171875, 4.53271484375, 4.69171142578125, 4.8507080078125, 5.00970458984375, 5.168701171875, 5.32769775390625, 5.4866943359375, 5.64569091796875, 5.8046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 5.0, 6.0, 3.0, 7.0, 14.0, 41.0, 88.0, 178.0, 383.0, 880.0, 1175.0, 710.0, 292.0, 142.0, 57.0, 44.0, 22.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.748046875, -1.678985595703125, -1.60992431640625, -1.540863037109375, -1.4718017578125, -1.402740478515625, -1.33367919921875, -1.264617919921875, -1.195556640625, -1.126495361328125, -1.05743408203125, -0.988372802734375, -0.9193115234375, -0.850250244140625, -0.78118896484375, -0.712127685546875, -0.64306640625, -0.574005126953125, -0.50494384765625, -0.435882568359375, -0.3668212890625, -0.297760009765625, -0.22869873046875, -0.159637451171875, -0.090576171875, -0.021514892578125, 0.04754638671875, 0.116607666015625, 0.1856689453125, 0.254730224609375, 0.32379150390625, 0.392852783203125, 0.4619140625, 0.530975341796875, 0.60003662109375, 0.669097900390625, 0.7381591796875, 0.807220458984375, 0.87628173828125, 0.945343017578125, 1.014404296875, 1.083465576171875, 1.15252685546875, 1.221588134765625, 1.2906494140625, 1.359710693359375, 1.42877197265625, 1.497833251953125, 1.56689453125, 1.635955810546875, 1.70501708984375, 1.774078369140625, 1.8431396484375, 1.912200927734375, 1.98126220703125, 2.050323486328125, 2.119384765625, 2.188446044921875, 2.25750732421875, 2.326568603515625, 2.3956298828125, 2.464691162109375, 2.53375244140625, 2.602813720703125, 2.671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 19.0, 45.0, 172.0, 361.0, 255.0, 85.0, 32.0, 20.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.079544067382812, -11.24988079071045, -10.420218467712402, -9.590555191040039, -8.760892868041992, -7.931229591369629, -7.101566314697266, -6.2719035148620605, -5.4422407150268555, -4.61257791519165, -3.782914876937866, -2.953251838684082, -2.123589038848877, -1.2939262390136719, -0.4642629623413086, 0.3653998374938965, 1.1950626373291016, 2.0247254371643066, 2.854388475418091, 3.684051513671875, 4.51371431350708, 5.343377113342285, 6.173040390014648, 7.0027031898498535, 7.832365989685059, 8.662029266357422, 9.491691589355469, 10.321354866027832, 11.151018142700195, 11.980680465698242, 12.810343742370605, 13.640007019042969, 14.469669342041016, 15.299332618713379, 16.128995895385742, 16.95865821838379, 17.788320541381836, 18.617984771728516, 19.447647094726562, 20.27730941772461, 21.106971740722656, 21.936634063720703, 22.766298294067383, 23.59596061706543, 24.425622940063477, 25.255287170410156, 26.084949493408203, 26.91461181640625, 27.74427604675293, 28.573938369750977, 29.403602600097656, 30.233264923095703, 31.06292724609375, 31.892589569091797, 32.722251892089844, 33.551918029785156, 34.3815803527832, 35.21124267578125, 36.0409049987793, 36.870567321777344, 37.700233459472656, 38.5298957824707, 39.35955810546875, 40.1892204284668, 41.018882751464844]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 10.0, 12.0, 11.0, 17.0, 23.0, 35.0, 37.0, 35.0, 39.0, 43.0, 65.0, 43.0, 46.0, 40.0, 47.0, 44.0, 50.0, 55.0, 38.0, 36.0, 30.0, 35.0, 31.0, 31.0, 29.0, 18.0, 18.0, 15.0, 8.0, 7.0, 13.0, 7.0, 4.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.137204170227051, -6.908017635345459, -6.678831100463867, -6.449645042419434, -6.220458507537842, -5.99127197265625, -5.762085437774658, -5.532898902893066, -5.303712368011475, -5.074525833129883, -4.845339298248291, -4.616152763366699, -4.386966705322266, -4.157780170440674, -3.928593635559082, -3.6994071006774902, -3.4702208042144775, -3.2410342693328857, -3.011847972869873, -2.7826614379882812, -2.5534749031066895, -2.3242883682250977, -2.095102071762085, -1.8659155368804932, -1.636729121208191, -1.4075427055358887, -1.1783561706542969, -0.9491697549819946, -0.7199832797050476, -0.4907968044281006, -0.26161038875579834, -0.03242385387420654, 0.1967625617980957, 0.4259490370750427, 0.6551355123519897, 0.884321928024292, 1.1135084629058838, 1.342694878578186, 1.5718812942504883, 1.80106782913208, 2.030254364013672, 2.2594408988952637, 2.4886271953582764, 2.717813730239868, 2.94700026512146, 3.1761865615844727, 3.4053730964660645, 3.6345596313476562, 3.863745927810669, 4.092932224273682, 4.322118759155273, 4.551305294036865, 4.780491828918457, 5.009678363800049, 5.238864898681641, 5.468050956726074, 5.697237491607666, 5.926424026489258, 6.15561056137085, 6.384797096252441, 6.613983154296875, 6.843169689178467, 7.072356224060059, 7.30154275894165, 7.530729293823242]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 9.0, 9.0, 7.0, 19.0, 34.0, 39.0, 44.0, 78.0, 128.0, 184.0, 286.0, 431.0, 670.0, 1104.0, 1641.0, 2820.0, 4775.0, 8109.0, 14518.0, 27257.0, 53189.0, 107500.0, 212368.0, 271908.0, 167528.0, 82562.0, 41531.0, 21577.0, 11780.0, 6430.0, 3757.0, 2294.0, 1444.0, 882.0, 521.0, 367.0, 258.0, 177.0, 111.0, 55.0, 51.0, 34.0, 30.0, 13.0, 16.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5922393798828125, -0.569732666015625, -0.5472259521484375, -0.52471923828125, -0.5022125244140625, -0.479705810546875, -0.4571990966796875, -0.4346923828125, -0.4121856689453125, -0.389678955078125, -0.3671722412109375, -0.34466552734375, -0.3221588134765625, -0.299652099609375, -0.2771453857421875, -0.254638671875, -0.2321319580078125, -0.209625244140625, -0.1871185302734375, -0.16461181640625, -0.1421051025390625, -0.119598388671875, -0.0970916748046875, -0.0745849609375, -0.0520782470703125, -0.029571533203125, -0.0070648193359375, 0.01544189453125, 0.0379486083984375, 0.060455322265625, 0.0829620361328125, 0.10546875, 0.1279754638671875, 0.150482177734375, 0.1729888916015625, 0.19549560546875, 0.2180023193359375, 0.240509033203125, 0.2630157470703125, 0.2855224609375, 0.3080291748046875, 0.330535888671875, 0.3530426025390625, 0.37554931640625, 0.3980560302734375, 0.420562744140625, 0.4430694580078125, 0.465576171875, 0.4880828857421875, 0.510589599609375, 0.5330963134765625, 0.55560302734375, 0.5781097412109375, 0.600616455078125, 0.6231231689453125, 0.6456298828125, 0.6681365966796875, 0.690643310546875, 0.7131500244140625, 0.73565673828125, 0.7581634521484375, 0.780670166015625, 0.8031768798828125, 0.82568359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 10.0, 5.0, 5.0, 4.0, 15.0, 14.0, 14.0, 15.0, 20.0, 23.0, 29.0, 32.0, 35.0, 32.0, 34.0, 56.0, 37.0, 41.0, 41.0, 44.0, 54.0, 51.0, 49.0, 31.0, 48.0, 37.0, 23.0, 26.0, 28.0, 24.0, 15.0, 16.0, 19.0, 13.0, 13.0, 5.0, 6.0, 7.0, 7.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.572265625, -0.5529861450195312, -0.5337066650390625, -0.5144271850585938, -0.495147705078125, -0.47586822509765625, -0.4565887451171875, -0.43730926513671875, -0.41802978515625, -0.39875030517578125, -0.3794708251953125, -0.36019134521484375, -0.340911865234375, -0.32163238525390625, -0.3023529052734375, -0.28307342529296875, -0.2637939453125, -0.24451446533203125, -0.2252349853515625, -0.20595550537109375, -0.186676025390625, -0.16739654541015625, -0.1481170654296875, -0.12883758544921875, -0.10955810546875, -0.09027862548828125, -0.0709991455078125, -0.05171966552734375, -0.032440185546875, -0.01316070556640625, 0.0061187744140625, 0.02539825439453125, 0.044677734375, 0.06395721435546875, 0.0832366943359375, 0.10251617431640625, 0.121795654296875, 0.14107513427734375, 0.1603546142578125, 0.17963409423828125, 0.19891357421875, 0.21819305419921875, 0.2374725341796875, 0.25675201416015625, 0.276031494140625, 0.29531097412109375, 0.3145904541015625, 0.33386993408203125, 0.3531494140625, 0.37242889404296875, 0.3917083740234375, 0.41098785400390625, 0.430267333984375, 0.44954681396484375, 0.4688262939453125, 0.48810577392578125, 0.50738525390625, 0.5266647338867188, 0.5459442138671875, 0.5652236938476562, 0.584503173828125, 0.6037826538085938, 0.6230621337890625, 0.6423416137695312, 0.66162109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 17.0, 16.0, 28.0, 32.0, 64.0, 98.0, 149.0, 243.0, 416.0, 883.0, 2438.0, 15990.0, 772546.0, 242044.0, 9895.0, 1924.0, 791.0, 396.0, 221.0, 123.0, 81.0, 38.0, 32.0, 23.0, 21.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.39453125, -4.275421142578125, -4.15631103515625, -4.037200927734375, -3.9180908203125, -3.798980712890625, -3.67987060546875, -3.560760498046875, -3.441650390625, -3.322540283203125, -3.20343017578125, -3.084320068359375, -2.9652099609375, -2.846099853515625, -2.72698974609375, -2.607879638671875, -2.48876953125, -2.369659423828125, -2.25054931640625, -2.131439208984375, -2.0123291015625, -1.893218994140625, -1.77410888671875, -1.654998779296875, -1.535888671875, -1.416778564453125, -1.29766845703125, -1.178558349609375, -1.0594482421875, -0.940338134765625, -0.82122802734375, -0.702117919921875, -0.5830078125, -0.463897705078125, -0.34478759765625, -0.225677490234375, -0.1065673828125, 0.012542724609375, 0.13165283203125, 0.250762939453125, 0.369873046875, 0.488983154296875, 0.60809326171875, 0.727203369140625, 0.8463134765625, 0.965423583984375, 1.08453369140625, 1.203643798828125, 1.32275390625, 1.441864013671875, 1.56097412109375, 1.680084228515625, 1.7991943359375, 1.918304443359375, 2.03741455078125, 2.156524658203125, 2.275634765625, 2.394744873046875, 2.51385498046875, 2.632965087890625, 2.7520751953125, 2.871185302734375, 2.99029541015625, 3.109405517578125, 3.228515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 7.0, 4.0, 2.0, 7.0, 9.0, 12.0, 8.0, 15.0, 18.0, 22.0, 19.0, 29.0, 29.0, 26.0, 44.0, 44.0, 42.0, 52.0, 57.0, 60.0, 57.0, 51.0, 54.0, 43.0, 53.0, 30.0, 32.0, 27.0, 29.0, 19.0, 16.0, 11.0, 19.0, 5.0, 7.0, 5.0, 8.0, 3.0, 1.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.322509765625, -2.24658203125, -2.170654296875, -2.0947265625, -2.018798828125, -1.94287109375, -1.866943359375, -1.791015625, -1.715087890625, -1.63916015625, -1.563232421875, -1.4873046875, -1.411376953125, -1.33544921875, -1.259521484375, -1.18359375, -1.107666015625, -1.03173828125, -0.955810546875, -0.8798828125, -0.803955078125, -0.72802734375, -0.652099609375, -0.576171875, -0.500244140625, -0.42431640625, -0.348388671875, -0.2724609375, -0.196533203125, -0.12060546875, -0.044677734375, 0.03125, 0.107177734375, 0.18310546875, 0.259033203125, 0.3349609375, 0.410888671875, 0.48681640625, 0.562744140625, 0.638671875, 0.714599609375, 0.79052734375, 0.866455078125, 0.9423828125, 1.018310546875, 1.09423828125, 1.170166015625, 1.24609375, 1.322021484375, 1.39794921875, 1.473876953125, 1.5498046875, 1.625732421875, 1.70166015625, 1.777587890625, 1.853515625, 1.929443359375, 2.00537109375, 2.081298828125, 2.1572265625, 2.233154296875, 2.30908203125, 2.385009765625, 2.4609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 1.0, 14.0, 9.0, 8.0, 5.0, 14.0, 27.0, 34.0, 52.0, 80.0, 117.0, 206.0, 437.0, 897.0, 2509.0, 9615.0, 55684.0, 760473.0, 188027.0, 22418.0, 4888.0, 1597.0, 635.0, 314.0, 189.0, 95.0, 60.0, 36.0, 29.0, 19.0, 9.0, 8.0, 6.0, 9.0, 2.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6648788452148438, -0.6451873779296875, -0.6254959106445312, -0.605804443359375, -0.5861129760742188, -0.5664215087890625, -0.5467300415039062, -0.52703857421875, -0.5073471069335938, -0.4876556396484375, -0.46796417236328125, -0.448272705078125, -0.42858123779296875, -0.4088897705078125, -0.38919830322265625, -0.3695068359375, -0.34981536865234375, -0.3301239013671875, -0.31043243408203125, -0.290740966796875, -0.27104949951171875, -0.2513580322265625, -0.23166656494140625, -0.21197509765625, -0.19228363037109375, -0.1725921630859375, -0.15290069580078125, -0.133209228515625, -0.11351776123046875, -0.0938262939453125, -0.07413482666015625, -0.054443359375, -0.03475189208984375, -0.0150604248046875, 0.00463104248046875, 0.024322509765625, 0.04401397705078125, 0.0637054443359375, 0.08339691162109375, 0.10308837890625, 0.12277984619140625, 0.1424713134765625, 0.16216278076171875, 0.181854248046875, 0.20154571533203125, 0.2212371826171875, 0.24092864990234375, 0.2606201171875, 0.28031158447265625, 0.3000030517578125, 0.31969451904296875, 0.339385986328125, 0.35907745361328125, 0.3787689208984375, 0.39846038818359375, 0.41815185546875, 0.43784332275390625, 0.4575347900390625, 0.47722625732421875, 0.496917724609375, 0.5166091918945312, 0.5363006591796875, 0.5559921264648438, 0.57568359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 13.0, 19.0, 22.0, 45.0, 83.0, 120.0, 190.0, 184.0, 98.0, 83.0, 38.0, 24.0, 22.0, 13.0, 10.0, 12.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003020763397216797, -0.0002916567027568817, -0.00028123706579208374, -0.00027081742882728577, -0.0002603977918624878, -0.0002499781548976898, -0.00023955851793289185, -0.00022913888096809387, -0.0002187192440032959, -0.00020829960703849792, -0.00019787997007369995, -0.00018746033310890198, -0.000177040696144104, -0.00016662105917930603, -0.00015620142221450806, -0.00014578178524971008, -0.0001353621482849121, -0.00012494251132011414, -0.00011452287435531616, -0.00010410323739051819, -9.368360042572021e-05, -8.326396346092224e-05, -7.284432649612427e-05, -6.24246895313263e-05, -5.200505256652832e-05, -4.158541560173035e-05, -3.116577863693237e-05, -2.07461416721344e-05, -1.0326504707336426e-05, 9.313225746154785e-08, 1.0512769222259521e-05, 2.0932406187057495e-05, 3.135204315185547e-05, 4.177168011665344e-05, 5.2191317081451416e-05, 6.261095404624939e-05, 7.303059101104736e-05, 8.345022797584534e-05, 9.386986494064331e-05, 0.00010428950190544128, 0.00011470913887023926, 0.00012512877583503723, 0.0001355484127998352, 0.00014596804976463318, 0.00015638768672943115, 0.00016680732369422913, 0.0001772269606590271, 0.00018764659762382507, 0.00019806623458862305, 0.00020848587155342102, 0.000218905508518219, 0.00022932514548301697, 0.00023974478244781494, 0.0002501644194126129, 0.0002605840563774109, 0.00027100369334220886, 0.00028142333030700684, 0.0002918429672718048, 0.0003022626042366028, 0.00031268224120140076, 0.00032310187816619873, 0.0003335215151309967, 0.0003439411520957947, 0.00035436078906059265, 0.0003647804260253906]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 1.0, 5.0, 8.0, 17.0, 23.0, 38.0, 46.0, 76.0, 107.0, 220.0, 445.0, 968.0, 3615.0, 22006.0, 671845.0, 325755.0, 18197.0, 3147.0, 1018.0, 442.0, 213.0, 115.0, 87.0, 44.0, 29.0, 17.0, 14.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.927734375, -0.9026336669921875, -0.877532958984375, -0.8524322509765625, -0.82733154296875, -0.8022308349609375, -0.777130126953125, -0.7520294189453125, -0.7269287109375, -0.7018280029296875, -0.676727294921875, -0.6516265869140625, -0.62652587890625, -0.6014251708984375, -0.576324462890625, -0.5512237548828125, -0.526123046875, -0.5010223388671875, -0.475921630859375, -0.4508209228515625, -0.42572021484375, -0.4006195068359375, -0.375518798828125, -0.3504180908203125, -0.3253173828125, -0.3002166748046875, -0.275115966796875, -0.2500152587890625, -0.22491455078125, -0.1998138427734375, -0.174713134765625, -0.1496124267578125, -0.12451171875, -0.0994110107421875, -0.074310302734375, -0.0492095947265625, -0.02410888671875, 0.0009918212890625, 0.026092529296875, 0.0511932373046875, 0.0762939453125, 0.1013946533203125, 0.126495361328125, 0.1515960693359375, 0.17669677734375, 0.2017974853515625, 0.226898193359375, 0.2519989013671875, 0.277099609375, 0.3022003173828125, 0.327301025390625, 0.3524017333984375, 0.37750244140625, 0.4026031494140625, 0.427703857421875, 0.4528045654296875, 0.4779052734375, 0.5030059814453125, 0.528106689453125, 0.5532073974609375, 0.57830810546875, 0.6034088134765625, 0.628509521484375, 0.6536102294921875, 0.6787109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 7.0, 10.0, 15.0, 14.0, 21.0, 42.0, 35.0, 61.0, 84.0, 105.0, 103.0, 121.0, 93.0, 86.0, 54.0, 39.0, 30.0, 16.0, 12.0, 12.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6493377685546875, -0.631195068359375, -0.6130523681640625, -0.59490966796875, -0.5767669677734375, -0.558624267578125, -0.5404815673828125, -0.5223388671875, -0.5041961669921875, -0.486053466796875, -0.4679107666015625, -0.44976806640625, -0.4316253662109375, -0.413482666015625, -0.3953399658203125, -0.377197265625, -0.3590545654296875, -0.340911865234375, -0.3227691650390625, -0.30462646484375, -0.2864837646484375, -0.268341064453125, -0.2501983642578125, -0.2320556640625, -0.2139129638671875, -0.195770263671875, -0.1776275634765625, -0.15948486328125, -0.1413421630859375, -0.123199462890625, -0.1050567626953125, -0.0869140625, -0.0687713623046875, -0.050628662109375, -0.0324859619140625, -0.01434326171875, 0.0037994384765625, 0.021942138671875, 0.0400848388671875, 0.0582275390625, 0.0763702392578125, 0.094512939453125, 0.1126556396484375, 0.13079833984375, 0.1489410400390625, 0.167083740234375, 0.1852264404296875, 0.203369140625, 0.2215118408203125, 0.239654541015625, 0.2577972412109375, 0.27593994140625, 0.2940826416015625, 0.312225341796875, 0.3303680419921875, 0.3485107421875, 0.3666534423828125, 0.384796142578125, 0.4029388427734375, 0.42108154296875, 0.4392242431640625, 0.457366943359375, 0.4755096435546875, 0.49365234375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 14.0, 62.0, 433.0, 398.0, 74.0, 16.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.4105110168457, -45.120765686035156, -43.83102035522461, -42.54127502441406, -41.251529693603516, -39.96178436279297, -38.67203903198242, -37.382293701171875, -36.09254455566406, -34.802799224853516, -33.51305389404297, -32.22330856323242, -30.933563232421875, -29.643817901611328, -28.35407066345215, -27.0643253326416, -25.774581909179688, -24.48483657836914, -23.195091247558594, -21.905345916748047, -20.6156005859375, -19.325855255126953, -18.036108016967773, -16.746362686157227, -15.45661735534668, -14.166872024536133, -12.877126693725586, -11.587380409240723, -10.297635078430176, -9.007889747619629, -7.718143939971924, -6.428398132324219, -5.1386566162109375, -3.8489110469818115, -2.5591654777526855, -1.2694199085235596, 0.020325660705566406, 1.3100709915161133, 2.5998167991638184, 3.8895626068115234, 5.17930793762207, 6.469053268432617, 7.758799076080322, 9.048544883728027, 10.338290214538574, 11.628035545349121, 12.917781829833984, 14.207527160644531, 15.497272491455078, 16.787017822265625, 18.076763153076172, 19.36650848388672, 20.656253814697266, 21.945999145507812, 23.235746383666992, 24.52549171447754, 25.815237045288086, 27.104982376098633, 28.39472770690918, 29.684473037719727, 30.974220275878906, 32.26396560668945, 33.5537109375, 34.84345626831055, 36.133201599121094]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 10.0, 10.0, 17.0, 18.0, 22.0, 18.0, 25.0, 44.0, 30.0, 20.0, 38.0, 53.0, 168.0, 168.0, 54.0, 44.0, 34.0, 24.0, 27.0, 18.0, 33.0, 17.0, 13.0, 11.0, 12.0, 15.0, 9.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53750991821289, -11.177508354187012, -10.81750774383545, -10.45750617980957, -10.097505569458008, -9.737504005432129, -9.37750244140625, -9.017501831054688, -8.657500267028809, -8.29749870300293, -7.937498092651367, -7.577496528625488, -7.217495441436768, -6.857494354248047, -6.497493267059326, -6.1374921798706055, -5.777491092681885, -5.417490005493164, -5.057488918304443, -4.697487831115723, -4.337486267089844, -3.977485179901123, -3.6174840927124023, -3.2574827671051025, -2.897481679916382, -2.537480592727661, -2.1774792671203613, -1.8174781799316406, -1.4574769735336304, -1.0974757671356201, -0.7374746799468994, -0.3774733543395996, -0.017472267150878906, 0.34252890944480896, 0.7025300860404968, 1.0625312328338623, 1.4225324392318726, 1.7825336456298828, 2.1425347328186035, 2.5025360584259033, 2.862537145614624, 3.2225382328033447, 3.5825395584106445, 3.9425406455993652, 4.302541732788086, 4.662543296813965, 5.022543907165527, 5.382545471191406, 5.742546558380127, 6.102547645568848, 6.462548732757568, 6.822549819946289, 7.182551383972168, 7.542552471160889, 7.902553558349609, 8.262555122375488, 8.62255573272705, 8.98255729675293, 9.342557907104492, 9.702559471130371, 10.062560081481934, 10.422561645507812, 10.782562255859375, 11.142563819885254, 11.502565383911133]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 12.0, 14.0, 29.0, 46.0, 101.0, 148.0, 320.0, 637.0, 1469.0, 3992.0, 13599.0, 77161.0, 894439.0, 2717211.0, 432710.0, 38969.0, 8289.0, 2832.0, 1146.0, 552.0, 260.0, 146.0, 79.0, 58.0, 31.0, 16.0, 11.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.904296875, -0.85986328125, -0.8154296875, -0.77099609375, -0.7265625, -0.68212890625, -0.6376953125, -0.59326171875, -0.548828125, -0.50439453125, -0.4599609375, -0.41552734375, -0.37109375, -0.32666015625, -0.2822265625, -0.23779296875, -0.193359375, -0.14892578125, -0.1044921875, -0.06005859375, -0.015625, 0.02880859375, 0.0732421875, 0.11767578125, 0.162109375, 0.20654296875, 0.2509765625, 0.29541015625, 0.33984375, 0.38427734375, 0.4287109375, 0.47314453125, 0.517578125, 0.56201171875, 0.6064453125, 0.65087890625, 0.6953125, 0.73974609375, 0.7841796875, 0.82861328125, 0.873046875, 0.91748046875, 0.9619140625, 1.00634765625, 1.05078125, 1.09521484375, 1.1396484375, 1.18408203125, 1.228515625, 1.27294921875, 1.3173828125, 1.36181640625, 1.40625, 1.45068359375, 1.4951171875, 1.53955078125, 1.583984375, 1.62841796875, 1.6728515625, 1.71728515625, 1.76171875, 1.80615234375, 1.8505859375, 1.89501953125, 1.939453125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 8.0, 12.0, 11.0, 22.0, 20.0, 32.0, 35.0, 41.0, 57.0, 55.0, 57.0, 53.0, 61.0, 62.0, 50.0, 76.0, 52.0, 44.0, 46.0, 47.0, 30.0, 21.0, 18.0, 21.0, 17.0, 13.0, 6.0, 6.0, 11.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.495880126953125, -0.47027587890625, -0.444671630859375, -0.4190673828125, -0.393463134765625, -0.36785888671875, -0.342254638671875, -0.316650390625, -0.291046142578125, -0.26544189453125, -0.239837646484375, -0.2142333984375, -0.188629150390625, -0.16302490234375, -0.137420654296875, -0.11181640625, -0.086212158203125, -0.06060791015625, -0.035003662109375, -0.0093994140625, 0.016204833984375, 0.04180908203125, 0.067413330078125, 0.093017578125, 0.118621826171875, 0.14422607421875, 0.169830322265625, 0.1954345703125, 0.221038818359375, 0.24664306640625, 0.272247314453125, 0.2978515625, 0.323455810546875, 0.34906005859375, 0.374664306640625, 0.4002685546875, 0.425872802734375, 0.45147705078125, 0.477081298828125, 0.502685546875, 0.528289794921875, 0.55389404296875, 0.579498291015625, 0.6051025390625, 0.630706787109375, 0.65631103515625, 0.681915283203125, 0.70751953125, 0.733123779296875, 0.75872802734375, 0.784332275390625, 0.8099365234375, 0.835540771484375, 0.86114501953125, 0.886749267578125, 0.912353515625, 0.937957763671875, 0.96356201171875, 0.989166259765625, 1.0147705078125, 1.040374755859375, 1.06597900390625, 1.091583251953125, 1.1171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 2.0, 2.0, 15.0, 45.0, 66.0, 127.0, 352.0, 868.0, 4737.0, 4020751.0, 163389.0, 2654.0, 691.0, 290.0, 143.0, 58.0, 34.0, 18.0, 12.0, 10.0, 4.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.07421875, -6.80047607421875, -6.5267333984375, -6.25299072265625, -5.979248046875, -5.70550537109375, -5.4317626953125, -5.15802001953125, -4.88427734375, -4.61053466796875, -4.3367919921875, -4.06304931640625, -3.789306640625, -3.51556396484375, -3.2418212890625, -2.96807861328125, -2.6943359375, -2.42059326171875, -2.1468505859375, -1.87310791015625, -1.599365234375, -1.32562255859375, -1.0518798828125, -0.77813720703125, -0.50439453125, -0.23065185546875, 0.0430908203125, 0.31683349609375, 0.590576171875, 0.86431884765625, 1.1380615234375, 1.41180419921875, 1.685546875, 1.95928955078125, 2.2330322265625, 2.50677490234375, 2.780517578125, 3.05426025390625, 3.3280029296875, 3.60174560546875, 3.87548828125, 4.14923095703125, 4.4229736328125, 4.69671630859375, 4.970458984375, 5.24420166015625, 5.5179443359375, 5.79168701171875, 6.0654296875, 6.33917236328125, 6.6129150390625, 6.88665771484375, 7.160400390625, 7.43414306640625, 7.7078857421875, 7.98162841796875, 8.25537109375, 8.52911376953125, 8.8028564453125, 9.07659912109375, 9.350341796875, 9.62408447265625, 9.8978271484375, 10.17156982421875, 10.4453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 21.0, 22.0, 49.0, 102.0, 199.0, 490.0, 1291.0, 1087.0, 430.0, 179.0, 99.0, 48.0, 25.0, 19.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.90557861328125, -1.7681884765625, -1.63079833984375, -1.493408203125, -1.35601806640625, -1.2186279296875, -1.08123779296875, -0.94384765625, -0.80645751953125, -0.6690673828125, -0.53167724609375, -0.394287109375, -0.25689697265625, -0.1195068359375, 0.01788330078125, 0.1552734375, 0.29266357421875, 0.4300537109375, 0.56744384765625, 0.704833984375, 0.84222412109375, 0.9796142578125, 1.11700439453125, 1.25439453125, 1.39178466796875, 1.5291748046875, 1.66656494140625, 1.803955078125, 1.94134521484375, 2.0787353515625, 2.21612548828125, 2.353515625, 2.49090576171875, 2.6282958984375, 2.76568603515625, 2.903076171875, 3.04046630859375, 3.1778564453125, 3.31524658203125, 3.45263671875, 3.59002685546875, 3.7274169921875, 3.86480712890625, 4.002197265625, 4.13958740234375, 4.2769775390625, 4.41436767578125, 4.5517578125, 4.68914794921875, 4.8265380859375, 4.96392822265625, 5.101318359375, 5.23870849609375, 5.3760986328125, 5.51348876953125, 5.65087890625, 5.78826904296875, 5.9256591796875, 6.06304931640625, 6.200439453125, 6.33782958984375, 6.4752197265625, 6.61260986328125, 6.75]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 6.0, 10.0, 10.0, 22.0, 54.0, 119.0, 240.0, 236.0, 150.0, 66.0, 34.0, 15.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.86121940612793, -14.803691864013672, -13.746164321899414, -12.68863582611084, -11.631108283996582, -10.573580741882324, -9.51605224609375, -8.458524703979492, -7.400997161865234, -6.343469619750977, -5.2859416007995605, -4.2284135818481445, -3.1708860397338867, -2.113358497619629, -1.055830478668213, 0.001697540283203125, 1.059225082397461, 2.116752862930298, 3.1742806434631348, 4.231808662414551, 5.289336204528809, 6.346863746643066, 7.404391765594482, 8.461919784545898, 9.519447326660156, 10.576974868774414, 11.634502410888672, 12.692030906677246, 13.749558448791504, 14.807085990905762, 15.864614486694336, 16.922142028808594, 17.97966766357422, 19.037195205688477, 20.094722747802734, 21.152250289916992, 22.20977783203125, 23.26730728149414, 24.3248348236084, 25.382362365722656, 26.439889907836914, 27.497417449951172, 28.55494499206543, 29.612472534179688, 30.670001983642578, 31.727527618408203, 32.785057067871094, 33.84258270263672, 34.90011215209961, 35.9576416015625, 37.015167236328125, 38.072696685791016, 39.13022232055664, 40.18775177001953, 41.245277404785156, 42.30280685424805, 43.36033630371094, 44.41786575317383, 45.47539138793945, 46.532920837402344, 47.59044647216797, 48.64797592163086, 49.705501556396484, 50.763031005859375, 51.820556640625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 8.0, 12.0, 9.0, 11.0, 18.0, 24.0, 25.0, 39.0, 27.0, 26.0, 28.0, 38.0, 38.0, 44.0, 55.0, 43.0, 59.0, 59.0, 68.0, 39.0, 54.0, 44.0, 32.0, 25.0, 31.0, 26.0, 22.0, 15.0, 12.0, 9.0, 7.0, 8.0, 6.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.595611572265625, -12.182685852050781, -11.769760131835938, -11.356834411621094, -10.94390869140625, -10.530982971191406, -10.118057250976562, -9.705131530761719, -9.292205810546875, -8.879280090332031, -8.466354370117188, -8.053428649902344, -7.6405029296875, -7.227577209472656, -6.814651966094971, -6.401726245880127, -5.988801002502441, -5.575875282287598, -5.162949562072754, -4.75002384185791, -4.337098121643066, -3.9241726398468018, -3.511247158050537, -3.0983214378356934, -2.6853957176208496, -2.272469997406006, -1.8595443964004517, -1.4466187953948975, -1.0336930751800537, -0.62076735496521, -0.2078418731689453, 0.20508384704589844, 0.6180095672607422, 1.030935287475586, 1.4438608884811401, 1.8567864894866943, 2.269712209701538, 2.682637929916382, 3.0955634117126465, 3.5084891319274902, 3.921414852142334, 4.334340572357178, 4.7472662925720215, 5.160191535949707, 5.573117256164551, 5.9860429763793945, 6.398968696594238, 6.811894416809082, 7.224820137023926, 7.6377458572387695, 8.050671577453613, 8.463597297668457, 8.8765230178833, 9.289448738098145, 9.702373504638672, 10.115299224853516, 10.52822494506836, 10.941150665283203, 11.354076385498047, 11.76700210571289, 12.179927825927734, 12.592853546142578, 13.005779266357422, 13.418704986572266, 13.83163070678711]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 5.0, 6.0, 15.0, 23.0, 27.0, 38.0, 64.0, 87.0, 155.0, 235.0, 459.0, 945.0, 1814.0, 4016.0, 9942.0, 29436.0, 120252.0, 633944.0, 185110.0, 39750.0, 12679.0, 4992.0, 2167.0, 1037.0, 572.0, 300.0, 187.0, 96.0, 60.0, 38.0, 33.0, 23.0, 15.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5228118896484375, -1.471405029296875, -1.4199981689453125, -1.36859130859375, -1.3171844482421875, -1.265777587890625, -1.2143707275390625, -1.1629638671875, -1.1115570068359375, -1.060150146484375, -1.0087432861328125, -0.95733642578125, -0.9059295654296875, -0.854522705078125, -0.8031158447265625, -0.751708984375, -0.7003021240234375, -0.648895263671875, -0.5974884033203125, -0.54608154296875, -0.4946746826171875, -0.443267822265625, -0.3918609619140625, -0.3404541015625, -0.2890472412109375, -0.237640380859375, -0.1862335205078125, -0.13482666015625, -0.0834197998046875, -0.032012939453125, 0.0193939208984375, 0.07080078125, 0.1222076416015625, 0.173614501953125, 0.2250213623046875, 0.27642822265625, 0.3278350830078125, 0.379241943359375, 0.4306488037109375, 0.4820556640625, 0.5334625244140625, 0.584869384765625, 0.6362762451171875, 0.68768310546875, 0.7390899658203125, 0.790496826171875, 0.8419036865234375, 0.893310546875, 0.9447174072265625, 0.996124267578125, 1.0475311279296875, 1.09893798828125, 1.1503448486328125, 1.201751708984375, 1.2531585693359375, 1.3045654296875, 1.3559722900390625, 1.407379150390625, 1.4587860107421875, 1.51019287109375, 1.5615997314453125, 1.613006591796875, 1.6644134521484375, 1.7158203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 19.0, 21.0, 17.0, 21.0, 18.0, 37.0, 27.0, 43.0, 53.0, 55.0, 70.0, 59.0, 69.0, 60.0, 60.0, 34.0, 50.0, 46.0, 49.0, 27.0, 23.0, 26.0, 19.0, 18.0, 12.0, 9.0, 8.0, 7.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.86669921875, -0.8351211547851562, -0.8035430908203125, -0.7719650268554688, -0.740386962890625, -0.7088088989257812, -0.6772308349609375, -0.6456527709960938, -0.61407470703125, -0.5824966430664062, -0.5509185791015625, -0.5193405151367188, -0.487762451171875, -0.45618438720703125, -0.4246063232421875, -0.39302825927734375, -0.3614501953125, -0.32987213134765625, -0.2982940673828125, -0.26671600341796875, -0.235137939453125, -0.20355987548828125, -0.1719818115234375, -0.14040374755859375, -0.10882568359375, -0.07724761962890625, -0.0456695556640625, -0.01409149169921875, 0.017486572265625, 0.04906463623046875, 0.0806427001953125, 0.11222076416015625, 0.143798828125, 0.17537689208984375, 0.2069549560546875, 0.23853302001953125, 0.270111083984375, 0.30168914794921875, 0.3332672119140625, 0.36484527587890625, 0.39642333984375, 0.42800140380859375, 0.4595794677734375, 0.49115753173828125, 0.522735595703125, 0.5543136596679688, 0.5858917236328125, 0.6174697875976562, 0.6490478515625, 0.6806259155273438, 0.7122039794921875, 0.7437820434570312, 0.775360107421875, 0.8069381713867188, 0.8385162353515625, 0.8700942993164062, 0.90167236328125, 0.9332504272460938, 0.9648284912109375, 0.9964065551757812, 1.027984619140625, 1.0595626831054688, 1.0911407470703125, 1.1227188110351562, 1.154296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 8.0, 7.0, 18.0, 27.0, 40.0, 55.0, 83.0, 134.0, 255.0, 495.0, 1294.0, 5068.0, 61670.0, 949746.0, 24940.0, 3000.0, 870.0, 351.0, 173.0, 93.0, 55.0, 38.0, 22.0, 20.0, 17.0, 12.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.45001220703125, -3.3433837890625, -3.23675537109375, -3.130126953125, -3.02349853515625, -2.9168701171875, -2.81024169921875, -2.70361328125, -2.59698486328125, -2.4903564453125, -2.38372802734375, -2.277099609375, -2.17047119140625, -2.0638427734375, -1.95721435546875, -1.8505859375, -1.74395751953125, -1.6373291015625, -1.53070068359375, -1.424072265625, -1.31744384765625, -1.2108154296875, -1.10418701171875, -0.99755859375, -0.89093017578125, -0.7843017578125, -0.67767333984375, -0.571044921875, -0.46441650390625, -0.3577880859375, -0.25115966796875, -0.14453125, -0.03790283203125, 0.0687255859375, 0.17535400390625, 0.281982421875, 0.38861083984375, 0.4952392578125, 0.60186767578125, 0.70849609375, 0.81512451171875, 0.9217529296875, 1.02838134765625, 1.135009765625, 1.24163818359375, 1.3482666015625, 1.45489501953125, 1.5615234375, 1.66815185546875, 1.7747802734375, 1.88140869140625, 1.988037109375, 2.09466552734375, 2.2012939453125, 2.30792236328125, 2.41455078125, 2.52117919921875, 2.6278076171875, 2.73443603515625, 2.841064453125, 2.94769287109375, 3.0543212890625, 3.16094970703125, 3.267578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 8.0, 6.0, 12.0, 5.0, 10.0, 15.0, 12.0, 12.0, 16.0, 24.0, 30.0, 33.0, 33.0, 32.0, 51.0, 46.0, 65.0, 63.0, 71.0, 76.0, 61.0, 50.0, 45.0, 36.0, 29.0, 24.0, 24.0, 14.0, 12.0, 15.0, 17.0, 8.0, 11.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.213348388671875, -3.10052490234375, -2.987701416015625, -2.8748779296875, -2.762054443359375, -2.64923095703125, -2.536407470703125, -2.423583984375, -2.310760498046875, -2.19793701171875, -2.085113525390625, -1.9722900390625, -1.859466552734375, -1.74664306640625, -1.633819580078125, -1.52099609375, -1.408172607421875, -1.29534912109375, -1.182525634765625, -1.0697021484375, -0.956878662109375, -0.84405517578125, -0.731231689453125, -0.618408203125, -0.505584716796875, -0.39276123046875, -0.279937744140625, -0.1671142578125, -0.054290771484375, 0.05853271484375, 0.171356201171875, 0.2841796875, 0.397003173828125, 0.50982666015625, 0.622650146484375, 0.7354736328125, 0.848297119140625, 0.96112060546875, 1.073944091796875, 1.186767578125, 1.299591064453125, 1.41241455078125, 1.525238037109375, 1.6380615234375, 1.750885009765625, 1.86370849609375, 1.976531982421875, 2.08935546875, 2.202178955078125, 2.31500244140625, 2.427825927734375, 2.5406494140625, 2.653472900390625, 2.76629638671875, 2.879119873046875, 2.991943359375, 3.104766845703125, 3.21759033203125, 3.330413818359375, 3.4432373046875, 3.556060791015625, 3.66888427734375, 3.781707763671875, 3.89453125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 13.0, 14.0, 21.0, 24.0, 37.0, 49.0, 96.0, 274.0, 692.0, 3021.0, 46940.0, 983604.0, 11363.0, 1563.0, 389.0, 189.0, 91.0, 61.0, 19.0, 19.0, 12.0, 11.0, 12.0, 3.0, 6.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.125, -1.085235595703125, -1.04547119140625, -1.005706787109375, -0.9659423828125, -0.926177978515625, -0.88641357421875, -0.846649169921875, -0.806884765625, -0.767120361328125, -0.72735595703125, -0.687591552734375, -0.6478271484375, -0.608062744140625, -0.56829833984375, -0.528533935546875, -0.48876953125, -0.449005126953125, -0.40924072265625, -0.369476318359375, -0.3297119140625, -0.289947509765625, -0.25018310546875, -0.210418701171875, -0.170654296875, -0.130889892578125, -0.09112548828125, -0.051361083984375, -0.0115966796875, 0.028167724609375, 0.06793212890625, 0.107696533203125, 0.1474609375, 0.187225341796875, 0.22698974609375, 0.266754150390625, 0.3065185546875, 0.346282958984375, 0.38604736328125, 0.425811767578125, 0.465576171875, 0.505340576171875, 0.54510498046875, 0.584869384765625, 0.6246337890625, 0.664398193359375, 0.70416259765625, 0.743927001953125, 0.78369140625, 0.823455810546875, 0.86322021484375, 0.902984619140625, 0.9427490234375, 0.982513427734375, 1.02227783203125, 1.062042236328125, 1.101806640625, 1.141571044921875, 1.18133544921875, 1.221099853515625, 1.2608642578125, 1.300628662109375, 1.34039306640625, 1.380157470703125, 1.419921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 14.0, 27.0, 24.0, 39.0, 74.0, 132.0, 185.0, 166.0, 105.0, 69.0, 41.0, 15.0, 21.0, 16.0, 14.0, 13.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000247955322265625, -0.00024062395095825195, -0.0002332925796508789, -0.00022596120834350586, -0.0002186298370361328, -0.00021129846572875977, -0.00020396709442138672, -0.00019663572311401367, -0.00018930435180664062, -0.00018197298049926758, -0.00017464160919189453, -0.00016731023788452148, -0.00015997886657714844, -0.0001526474952697754, -0.00014531612396240234, -0.0001379847526550293, -0.00013065338134765625, -0.0001233220100402832, -0.00011599063873291016, -0.00010865926742553711, -0.00010132789611816406, -9.399652481079102e-05, -8.666515350341797e-05, -7.933378219604492e-05, -7.200241088867188e-05, -6.467103958129883e-05, -5.733966827392578e-05, -5.0008296966552734e-05, -4.267692565917969e-05, -3.534555435180664e-05, -2.8014183044433594e-05, -2.0682811737060547e-05, -1.33514404296875e-05, -6.020069122314453e-06, 1.3113021850585938e-06, 8.64267349243164e-06, 1.5974044799804688e-05, 2.3305416107177734e-05, 3.063678741455078e-05, 3.796815872192383e-05, 4.5299530029296875e-05, 5.263090133666992e-05, 5.996227264404297e-05, 6.729364395141602e-05, 7.462501525878906e-05, 8.195638656616211e-05, 8.928775787353516e-05, 9.66191291809082e-05, 0.00010395050048828125, 0.0001112818717956543, 0.00011861324310302734, 0.0001259446144104004, 0.00013327598571777344, 0.00014060735702514648, 0.00014793872833251953, 0.00015527009963989258, 0.00016260147094726562, 0.00016993284225463867, 0.00017726421356201172, 0.00018459558486938477, 0.0001919269561767578, 0.00019925832748413086, 0.0002065896987915039, 0.00021392107009887695, 0.00022125244140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 9.0, 15.0, 34.0, 54.0, 81.0, 159.0, 427.0, 1240.0, 5265.0, 59267.0, 952863.0, 24311.0, 3284.0, 919.0, 297.0, 144.0, 64.0, 36.0, 25.0, 14.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6846847534179688, -0.6613616943359375, -0.6380386352539062, -0.614715576171875, -0.5913925170898438, -0.5680694580078125, -0.5447463989257812, -0.52142333984375, -0.49810028076171875, -0.4747772216796875, -0.45145416259765625, -0.428131103515625, -0.40480804443359375, -0.3814849853515625, -0.35816192626953125, -0.3348388671875, -0.31151580810546875, -0.2881927490234375, -0.26486968994140625, -0.241546630859375, -0.21822357177734375, -0.1949005126953125, -0.17157745361328125, -0.14825439453125, -0.12493133544921875, -0.1016082763671875, -0.07828521728515625, -0.054962158203125, -0.03163909912109375, -0.0083160400390625, 0.01500701904296875, 0.038330078125, 0.06165313720703125, 0.0849761962890625, 0.10829925537109375, 0.131622314453125, 0.15494537353515625, 0.1782684326171875, 0.20159149169921875, 0.22491455078125, 0.24823760986328125, 0.2715606689453125, 0.29488372802734375, 0.318206787109375, 0.34152984619140625, 0.3648529052734375, 0.38817596435546875, 0.4114990234375, 0.43482208251953125, 0.4581451416015625, 0.48146820068359375, 0.504791259765625, 0.5281143188476562, 0.5514373779296875, 0.5747604370117188, 0.59808349609375, 0.6214065551757812, 0.6447296142578125, 0.6680526733398438, 0.691375732421875, 0.7146987915039062, 0.7380218505859375, 0.7613449096679688, 0.78466796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 10.0, 7.0, 13.0, 16.0, 17.0, 35.0, 47.0, 67.0, 88.0, 110.0, 125.0, 131.0, 75.0, 74.0, 44.0, 27.0, 25.0, 19.0, 12.0, 9.0, 14.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.6201171875, -0.603668212890625, -0.58721923828125, -0.570770263671875, -0.5543212890625, -0.537872314453125, -0.52142333984375, -0.504974365234375, -0.488525390625, -0.472076416015625, -0.45562744140625, -0.439178466796875, -0.4227294921875, -0.406280517578125, -0.38983154296875, -0.373382568359375, -0.35693359375, -0.340484619140625, -0.32403564453125, -0.307586669921875, -0.2911376953125, -0.274688720703125, -0.25823974609375, -0.241790771484375, -0.225341796875, -0.208892822265625, -0.19244384765625, -0.175994873046875, -0.1595458984375, -0.143096923828125, -0.12664794921875, -0.110198974609375, -0.09375, -0.077301025390625, -0.06085205078125, -0.044403076171875, -0.0279541015625, -0.011505126953125, 0.00494384765625, 0.021392822265625, 0.037841796875, 0.054290771484375, 0.07073974609375, 0.087188720703125, 0.1036376953125, 0.120086669921875, 0.13653564453125, 0.152984619140625, 0.16943359375, 0.185882568359375, 0.20233154296875, 0.218780517578125, 0.2352294921875, 0.251678466796875, 0.26812744140625, 0.284576416015625, 0.301025390625, 0.317474365234375, 0.33392333984375, 0.350372314453125, 0.3668212890625, 0.383270263671875, 0.39971923828125, 0.416168212890625, 0.4326171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 12.0, 58.0, 683.0, 209.0, 31.0, 13.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.34331130981445, -45.75852584838867, -44.173736572265625, -42.588951110839844, -41.00416564941406, -39.41938018798828, -37.834590911865234, -36.24980545043945, -34.665016174316406, -33.080230712890625, -31.49544334411621, -29.910655975341797, -28.325870513916016, -26.7410831451416, -25.156295776367188, -23.571510314941406, -21.986724853515625, -20.40193748474121, -18.81715202331543, -17.232364654541016, -15.647578239440918, -14.06279182434082, -12.478004455566406, -10.893218040466309, -9.308431625366211, -7.723645210266113, -6.138858318328857, -4.554071426391602, -2.969285011291504, -1.3844985961914062, 0.2002887725830078, 1.7850751876831055, 3.369861602783203, 4.954648017883301, 6.539434909820557, 8.124221801757812, 9.70900821685791, 11.293794631958008, 12.878582000732422, 14.46336841583252, 16.048154830932617, 17.63294219970703, 19.217727661132812, 20.802515029907227, 22.38730239868164, 23.972087860107422, 25.556875228881836, 27.14166259765625, 28.72644805908203, 30.311235427856445, 31.896020889282227, 33.48080825805664, 35.06559371948242, 36.65038299560547, 38.23516845703125, 39.81995391845703, 41.40473937988281, 42.989524841308594, 44.57431411743164, 46.15909957885742, 47.7438850402832, 49.32867431640625, 50.91345977783203, 52.49824523925781, 54.08303451538086]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 17.0, 20.0, 23.0, 38.0, 57.0, 65.0, 378.0, 166.0, 66.0, 43.0, 37.0, 27.0, 15.0, 12.0, 10.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.040874481201172, -9.316638946533203, -8.59240436553955, -7.868168830871582, -7.143933296203613, -6.419698238372803, -5.695463180541992, -4.971227645874023, -4.246992588043213, -3.5227572917938232, -2.7985219955444336, -2.074286937713623, -1.3500516414642334, -0.6258163452148438, 0.0984187126159668, 0.8226542472839355, 1.546889305114746, 2.2711246013641357, 2.9953598976135254, 3.719594955444336, 4.443830490112305, 5.168065547943115, 5.892300605773926, 6.6165361404418945, 7.340771198272705, 8.065006256103516, 8.789241790771484, 9.513477325439453, 10.237711906433105, 10.961947441101074, 11.686182022094727, 12.410417556762695, 13.134653091430664, 13.858888626098633, 14.583123207092285, 15.307358741760254, 16.031593322753906, 16.755828857421875, 17.480064392089844, 18.204299926757812, 18.92853546142578, 19.65277099609375, 20.37700653076172, 21.101242065429688, 21.825475692749023, 22.549711227416992, 23.27394676208496, 23.99818229675293, 24.722415924072266, 25.446651458740234, 26.170886993408203, 26.895122528076172, 27.619356155395508, 28.343591690063477, 29.067827224731445, 29.792062759399414, 30.516298294067383, 31.24053382873535, 31.96476936340332, 32.689002990722656, 33.413238525390625, 34.137474060058594, 34.86170959472656, 35.58594512939453, 36.3101806640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 9.0, 9.0, 14.0, 21.0, 32.0, 30.0, 44.0, 54.0, 47.0, 100.0, 342.0, 99.0, 40.0, 43.0, 37.0, 19.0, 18.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8437728881835938, -0.7983856201171875, -0.7529983520507812, -0.707611083984375, -0.6622238159179688, -0.6168365478515625, -0.5714492797851562, -0.52606201171875, -0.48067474365234375, -0.4352874755859375, -0.38990020751953125, -0.344512939453125, -0.29912567138671875, -0.2537384033203125, -0.20835113525390625, -0.1629638671875, -0.11757659912109375, -0.0721893310546875, -0.02680206298828125, 0.018585205078125, 0.06397247314453125, 0.1093597412109375, 0.15474700927734375, 0.20013427734375, 0.24552154541015625, 0.2909088134765625, 0.33629608154296875, 0.381683349609375, 0.42707061767578125, 0.4724578857421875, 0.5178451538085938, 0.563232421875, 0.6086196899414062, 0.6540069580078125, 0.6993942260742188, 0.744781494140625, 0.7901687622070312, 0.8355560302734375, 0.8809432983398438, 0.92633056640625, 0.9717178344726562, 1.0171051025390625, 1.0624923706054688, 1.107879638671875, 1.1532669067382812, 1.1986541748046875, 1.2440414428710938, 1.2894287109375, 1.3348159790039062, 1.3802032470703125, 1.4255905151367188, 1.470977783203125, 1.5163650512695312, 1.5617523193359375, 1.6071395874023438, 1.65252685546875, 1.6979141235351562, 1.7433013916015625, 1.7886886596679688, 1.834075927734375, 1.8794631958007812, 1.9248504638671875, 1.9702377319335938, 2.015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 7.0, 7.0, 0.0, 5.0, 16.0, 10.0, 27.0, 28.0, 65.0, 159.0, 823.0, 46812.0, 8339089.0, 1119.0, 205.0, 84.0, 50.0, 28.0, 11.0, 8.0, 8.0, 3.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.296606063842773, -26.54012680053711, -25.783649444580078, -25.027170181274414, -24.270692825317383, -23.51421356201172, -22.757736206054688, -22.001256942749023, -21.24477767944336, -20.488298416137695, -19.731821060180664, -18.975341796875, -18.21886444091797, -17.462385177612305, -16.70590591430664, -15.94942855834961, -15.192951202392578, -14.43647289276123, -13.679994583129883, -12.923515319824219, -12.167037963867188, -11.410558700561523, -10.654080390930176, -9.897602081298828, -9.14112377166748, -8.384645462036133, -7.628167152404785, -6.871688365936279, -6.115210056304932, -5.358731746673584, -4.602252960205078, -3.8457746505737305, -3.08929443359375, -2.3328161239624023, -1.5763375759124756, -0.8198590278625488, -0.06338071823120117, 0.6930975914001465, 1.4495763778686523, 2.2060546875, 2.9625329971313477, 3.7190113067626953, 4.475489616394043, 5.231968402862549, 5.9884467124938965, 6.744925022125244, 7.50140380859375, 8.257882118225098, 9.014360427856445, 9.770838737487793, 10.52731704711914, 11.283796310424805, 12.040273666381836, 12.7967529296875, 13.553231239318848, 14.309709548950195, 15.066187858581543, 15.82266616821289, 16.579145431518555, 17.335622787475586, 18.09210205078125, 18.84857940673828, 19.605058670043945, 20.36153793334961, 21.11801528930664]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 6.0, 6.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.687347412109375, -26.179248809814453, -25.671152114868164, -25.163053512573242, -24.65495491027832, -24.14685821533203, -23.63875961303711, -23.130661010742188, -22.622562408447266, -22.114463806152344, -21.606367111206055, -21.098268508911133, -20.59016990661621, -20.082073211669922, -19.573974609375, -19.065876007080078, -18.55777931213379, -18.049680709838867, -17.541584014892578, -17.033485412597656, -16.525386810302734, -16.017288208007812, -15.509191513061523, -15.001092910766602, -14.492995262145996, -13.98489761352539, -13.476799011230469, -12.968701362609863, -12.460603713989258, -11.952505111694336, -11.44440746307373, -10.936309814453125, -10.428211212158203, -9.920113563537598, -9.412014961242676, -8.90391731262207, -8.395818710327148, -7.887721061706543, -7.3796234130859375, -6.871525287628174, -6.363426685333252, -5.855328559875488, -5.347230911254883, -4.839132785797119, -4.3310346603393555, -3.822936534881592, -3.3148386478424072, -2.8067407608032227, -2.298642635345459, -1.7905446290969849, -1.2824466228485107, -0.7743486166000366, -0.2662506103515625, 0.24184751510620117, 0.7499454021453857, 1.2580432891845703, 1.766141414642334, 2.2742395401000977, 2.7823374271392822, 3.290435314178467, 3.7985334396362305, 4.306631565093994, 4.814729690551758, 5.322827339172363, 5.830925464630127]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 12.0, 9.0, 22.0, 27.0, 30.0, 46.0, 79.0, 91.0, 166.0, 255.0, 445.0, 891.0, 1928.0, 4929.0, 15850.0, 62754.0, 236602.0, 146543.0, 35313.0, 10472.0, 4020.0, 1760.0, 887.0, 430.0, 266.0, 156.0, 83.0, 64.0, 46.0, 28.0, 20.0, 11.0, 8.0, 6.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.3984375, -9.15606689453125, -8.9136962890625, -8.67132568359375, -8.428955078125, -8.18658447265625, -7.9442138671875, -7.70184326171875, -7.45947265625, -7.21710205078125, -6.9747314453125, -6.73236083984375, -6.489990234375, -6.24761962890625, -6.0052490234375, -5.76287841796875, -5.5205078125, -5.27813720703125, -5.0357666015625, -4.79339599609375, -4.551025390625, -4.30865478515625, -4.0662841796875, -3.82391357421875, -3.58154296875, -3.33917236328125, -3.0968017578125, -2.85443115234375, -2.612060546875, -2.36968994140625, -2.1273193359375, -1.88494873046875, -1.642578125, -1.40020751953125, -1.1578369140625, -0.91546630859375, -0.673095703125, -0.43072509765625, -0.1883544921875, 0.05401611328125, 0.29638671875, 0.53875732421875, 0.7811279296875, 1.02349853515625, 1.265869140625, 1.50823974609375, 1.7506103515625, 1.99298095703125, 2.2353515625, 2.47772216796875, 2.7200927734375, 2.96246337890625, 3.204833984375, 3.44720458984375, 3.6895751953125, 3.93194580078125, 4.17431640625, 4.41668701171875, 4.6590576171875, 4.90142822265625, 5.143798828125, 5.38616943359375, 5.6285400390625, 5.87091064453125, 6.11328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 9.0, 5.0, 11.0, 29.0, 26.0, 49.0, 72.0, 97.0, 93.0, 139.0, 121.0, 109.0, 61.0, 44.0, 34.0, 27.0, 15.0, 15.0, 12.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.480316162109375, -1.42156982421875, -1.362823486328125, -1.3040771484375, -1.245330810546875, -1.18658447265625, -1.127838134765625, -1.069091796875, -1.010345458984375, -0.95159912109375, -0.892852783203125, -0.8341064453125, -0.775360107421875, -0.71661376953125, -0.657867431640625, -0.59912109375, -0.540374755859375, -0.48162841796875, -0.422882080078125, -0.3641357421875, -0.305389404296875, -0.24664306640625, -0.187896728515625, -0.129150390625, -0.070404052734375, -0.01165771484375, 0.047088623046875, 0.1058349609375, 0.164581298828125, 0.22332763671875, 0.282073974609375, 0.3408203125, 0.399566650390625, 0.45831298828125, 0.517059326171875, 0.5758056640625, 0.634552001953125, 0.69329833984375, 0.752044677734375, 0.810791015625, 0.869537353515625, 0.92828369140625, 0.987030029296875, 1.0457763671875, 1.104522705078125, 1.16326904296875, 1.222015380859375, 1.28076171875, 1.339508056640625, 1.39825439453125, 1.457000732421875, 1.5157470703125, 1.574493408203125, 1.63323974609375, 1.691986083984375, 1.750732421875, 1.809478759765625, 1.86822509765625, 1.926971435546875, 1.9857177734375, 2.044464111328125, 2.10321044921875, 2.161956787109375, 2.220703125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 7.0, 7.0, 10.0, 11.0, 15.0, 26.0, 65.0, 115.0, 104.0, 55.0, 28.0, 12.0, 11.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.74677848815918, -11.425983428955078, -11.105188369750977, -10.784393310546875, -10.463598251342773, -10.142803192138672, -9.82200813293457, -9.501213073730469, -9.180418014526367, -8.859622955322266, -8.538827896118164, -8.218032836914062, -7.897237777709961, -7.576442718505859, -7.255647659301758, -6.934852600097656, -6.614058017730713, -6.293262958526611, -5.97246789932251, -5.651672840118408, -5.330877780914307, -5.010082721710205, -4.689288139343262, -4.36849308013916, -4.047698020935059, -3.726902961730957, -3.4061079025268555, -3.085312843322754, -2.7645177841186523, -2.443722724914551, -2.1229279041290283, -1.8021328449249268, -1.481337547302246, -1.1605424880981445, -0.8397474884986877, -0.518952488899231, -0.1981574296951294, 0.12263762950897217, 0.4434325695037842, 0.7642276287078857, 1.0850226879119873, 1.4058177471160889, 1.7266128063201904, 2.047407627105713, 2.3682026863098145, 2.688997745513916, 3.0097928047180176, 3.330587863922119, 3.6513829231262207, 3.9721779823303223, 4.292973041534424, 4.613768100738525, 4.934563159942627, 5.2553582191467285, 5.576152801513672, 5.896947860717773, 6.217742919921875, 6.538537979125977, 6.859333038330078, 7.18012809753418, 7.500923156738281, 7.821718215942383, 8.142513275146484, 8.463308334350586, 8.784103393554688]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 4.0, 3.0, 11.0, 6.0, 6.0, 9.0, 14.0, 28.0, 63.0, 85.0, 102.0, 69.0, 34.0, 17.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.045466423034668, -6.832422256469727, -6.619378089904785, -6.406333923339844, -6.193289279937744, -5.980245113372803, -5.767200946807861, -5.55415678024292, -5.3411126136779785, -5.128068447113037, -4.915024280548096, -4.701979637145996, -4.488935470581055, -4.275891304016113, -4.062847137451172, -3.8498029708862305, -3.63675856590271, -3.4237143993377686, -3.210669994354248, -2.9976258277893066, -2.7845816612243652, -2.571537494659424, -2.3584930896759033, -2.145448923110962, -1.932404637336731, -1.7193603515625, -1.5063161849975586, -1.2932718992233276, -1.0802276134490967, -0.8671834468841553, -0.6541391611099243, -0.4410949945449829, -0.22805070877075195, -0.015006467700004578, 0.1980377733707428, 0.41108202934265137, 0.6241262555122375, 0.8371704816818237, 1.0502147674560547, 1.263258934020996, 1.476303219795227, 1.689347505569458, 1.9023916721343994, 2.11543607711792, 2.3284802436828613, 2.5415244102478027, 2.754568576812744, 2.9676127433776855, 3.180657148361206, 3.3937013149261475, 3.606745719909668, 3.8197898864746094, 4.032834053039551, 4.245878219604492, 4.458922386169434, 4.671966552734375, 4.885011196136475, 5.098055362701416, 5.311099529266357, 5.524144172668457, 5.737188339233398, 5.95023250579834, 6.163276672363281, 6.376320838928223, 6.589365005493164]}, "eval/loss": 4.16178035736084, "eval/wer": 2.431594605315351, "eval/runtime": 950.4746, "eval/samples_per_second": 2.78, "eval/steps_per_second": 0.233, "train/train_runtime": 6757.0177, "train/train_samples_per_second": 4.223, "train/train_steps_per_second": 0.176, "train/total_flos": 0.0, "train/train_loss": 4.268135019066556} \ No newline at end of file