diff --git "a/wandb/run-20220228_231357-3lq2qpez/files/wandb-summary.json" "b/wandb/run-20220228_231357-3lq2qpez/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220228_231357-3lq2qpez/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.3745, "train/learning_rate": 8.94e-06, "train/epoch": 0.88, "train/global_step": 450, "_runtime": 4157, "_timestamp": 1646094194, "_step": 449, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 67.0, 372.0, 436.0, 119.0, 11.0, 2.0, 2.0], "bins": [-291.3792419433594, -286.455322265625, -281.53143310546875, -276.6075134277344, -271.6836242675781, -266.75970458984375, -261.8358154296875, -256.9118957519531, -251.98800659179688, -247.06410217285156, -242.14019775390625, -237.21629333496094, -232.29238891601562, -227.3684844970703, -222.444580078125, -217.52066040039062, -212.5967559814453, -207.6728515625, -202.7489471435547, -197.82504272460938, -192.90113830566406, -187.97723388671875, -183.05332946777344, -178.12942504882812, -173.20550537109375, -168.28160095214844, -163.35769653320312, -158.4337921142578, -153.5098876953125, -148.5859832763672, -143.66207885742188, -138.7381591796875, -133.81427001953125, -128.89036560058594, -123.96646118164062, -119.04255676269531, -114.11865234375, -109.19474792480469, -104.27083587646484, -99.34693145751953, -94.42301940917969, -89.49911499023438, -84.57521057128906, -79.65130615234375, -74.72740173339844, -69.80349731445312, -64.87958526611328, -59.95568084716797, -55.031776428222656, -50.107872009277344, -45.18396759033203, -40.26005935668945, -35.33615493774414, -30.412250518798828, -25.488344192504883, -20.564437866210938, -15.640535354614258, -10.716629981994629, -5.792724609375, -0.8688192367553711, 4.055086135864258, 8.97899055480957, 13.902896881103516, 18.82680320739746, 23.750707626342773]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 9.0, 9.0, 8.0, 16.0, 16.0, 19.0, 17.0, 31.0, 35.0, 39.0, 36.0, 48.0, 49.0, 62.0, 53.0, 56.0, 51.0, 43.0, 54.0, 49.0, 40.0, 52.0, 32.0, 21.0, 33.0, 20.0, 25.0, 16.0, 10.0, 13.0, 14.0, 9.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.70005798339844, -50.74428176879883, -48.78850555419922, -46.832733154296875, -44.876956939697266, -42.921180725097656, -40.96540451049805, -39.00962829589844, -37.053855895996094, -35.098079681396484, -33.142303466796875, -31.1865291595459, -29.230754852294922, -27.274978637695312, -25.319202423095703, -23.363426208496094, -21.407649993896484, -19.451873779296875, -17.4960994720459, -15.540323257446289, -13.584547996520996, -11.628772735595703, -9.672996520996094, -7.717221260070801, -5.761445999145508, -3.8056704998016357, -1.8498950004577637, 0.1058807373046875, 2.0616559982299805, 4.017431259155273, 5.973207473754883, 7.928982734680176, 9.884757995605469, 11.840533256530762, 13.796308517456055, 15.752084732055664, 17.70785903930664, 19.66363525390625, 21.61941146850586, 23.57518768310547, 25.530961990356445, 27.486738204956055, 29.44251251220703, 31.39828872680664, 33.35406494140625, 35.309837341308594, 37.26561737060547, 39.22138977050781, 41.17716598510742, 43.13294219970703, 45.08871841430664, 47.04449462890625, 49.000267028808594, 50.9560432434082, 52.91181945800781, 54.86759567260742, 56.82337188720703, 58.77914810180664, 60.73492431640625, 62.690696716308594, 64.64647674560547, 66.60224914550781, 68.55802917480469, 70.51380157470703, 72.46957397460938]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 10.0, 9.0, 11.0, 8.0, 14.0, 15.0, 20.0, 18.0, 26.0, 23.0, 30.0, 42.0, 51.0, 32.0, 45.0, 46.0, 38.0, 41.0, 60.0, 37.0, 44.0, 39.0, 48.0, 42.0, 37.0, 38.0, 30.0, 28.0, 20.0, 16.0, 19.0, 6.0, 10.0, 11.0, 9.0, 8.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.59765625, -4.4586181640625, -4.319580078125, -4.1805419921875, -4.04150390625, -3.9024658203125, -3.763427734375, -3.6243896484375, -3.4853515625, -3.3463134765625, -3.207275390625, -3.0682373046875, -2.92919921875, -2.7901611328125, -2.651123046875, -2.5120849609375, -2.373046875, -2.2340087890625, -2.094970703125, -1.9559326171875, -1.81689453125, -1.6778564453125, -1.538818359375, -1.3997802734375, -1.2607421875, -1.1217041015625, -0.982666015625, -0.8436279296875, -0.70458984375, -0.5655517578125, -0.426513671875, -0.2874755859375, -0.1484375, -0.0093994140625, 0.129638671875, 0.2686767578125, 0.40771484375, 0.5467529296875, 0.685791015625, 0.8248291015625, 0.9638671875, 1.1029052734375, 1.241943359375, 1.3809814453125, 1.52001953125, 1.6590576171875, 1.798095703125, 1.9371337890625, 2.076171875, 2.2152099609375, 2.354248046875, 2.4932861328125, 2.63232421875, 2.7713623046875, 2.910400390625, 3.0494384765625, 3.1884765625, 3.3275146484375, 3.466552734375, 3.6055908203125, 3.74462890625, 3.8836669921875, 4.022705078125, 4.1617431640625, 4.30078125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 6.0, 10.0, 9.0, 17.0, 26.0, 22.0, 44.0, 57.0, 67.0, 91.0, 100.0, 176.0, 217.0, 305.0, 429.0, 678.0, 1121.0, 1769.0, 3104.0, 6576.0, 17562.0, 82002.0, 804336.0, 2535316.0, 642511.0, 68776.0, 15351.0, 5924.0, 2884.0, 1643.0, 977.0, 622.0, 446.0, 304.0, 180.0, 140.0, 129.0, 80.0, 72.0, 47.0, 41.0, 28.0, 21.0, 26.0, 12.0, 7.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.5, -10.1551513671875, -9.810302734375, -9.4654541015625, -9.12060546875, -8.7757568359375, -8.430908203125, -8.0860595703125, -7.7412109375, -7.3963623046875, -7.051513671875, -6.7066650390625, -6.36181640625, -6.0169677734375, -5.672119140625, -5.3272705078125, -4.982421875, -4.6375732421875, -4.292724609375, -3.9478759765625, -3.60302734375, -3.2581787109375, -2.913330078125, -2.5684814453125, -2.2236328125, -1.8787841796875, -1.533935546875, -1.1890869140625, -0.84423828125, -0.4993896484375, -0.154541015625, 0.1903076171875, 0.53515625, 0.8800048828125, 1.224853515625, 1.5697021484375, 1.91455078125, 2.2593994140625, 2.604248046875, 2.9490966796875, 3.2939453125, 3.6387939453125, 3.983642578125, 4.3284912109375, 4.67333984375, 5.0181884765625, 5.363037109375, 5.7078857421875, 6.052734375, 6.3975830078125, 6.742431640625, 7.0872802734375, 7.43212890625, 7.7769775390625, 8.121826171875, 8.4666748046875, 8.8115234375, 9.1563720703125, 9.501220703125, 9.8460693359375, 10.19091796875, 10.5357666015625, 10.880615234375, 11.2254638671875, 11.5703125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 14.0, 19.0, 24.0, 34.0, 34.0, 74.0, 94.0, 135.0, 196.0, 324.0, 432.0, 666.0, 591.0, 438.0, 313.0, 201.0, 165.0, 82.0, 63.0, 42.0, 33.0, 23.0, 14.0, 14.0, 10.0, 8.0, 4.0, 5.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.27197265625, -15.7626953125, -15.25341796875, -14.744140625, -14.23486328125, -13.7255859375, -13.21630859375, -12.70703125, -12.19775390625, -11.6884765625, -11.17919921875, -10.669921875, -10.16064453125, -9.6513671875, -9.14208984375, -8.6328125, -8.12353515625, -7.6142578125, -7.10498046875, -6.595703125, -6.08642578125, -5.5771484375, -5.06787109375, -4.55859375, -4.04931640625, -3.5400390625, -3.03076171875, -2.521484375, -2.01220703125, -1.5029296875, -0.99365234375, -0.484375, 0.02490234375, 0.5341796875, 1.04345703125, 1.552734375, 2.06201171875, 2.5712890625, 3.08056640625, 3.58984375, 4.09912109375, 4.6083984375, 5.11767578125, 5.626953125, 6.13623046875, 6.6455078125, 7.15478515625, 7.6640625, 8.17333984375, 8.6826171875, 9.19189453125, 9.701171875, 10.21044921875, 10.7197265625, 11.22900390625, 11.73828125, 12.24755859375, 12.7568359375, 13.26611328125, 13.775390625, 14.28466796875, 14.7939453125, 15.30322265625, 15.8125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 11.0, 10.0, 19.0, 15.0, 33.0, 39.0, 60.0, 84.0, 139.0, 226.0, 333.0, 599.0, 1173.0, 3477.0, 90689.0, 4040832.0, 50847.0, 2964.0, 1145.0, 602.0, 333.0, 190.0, 147.0, 99.0, 61.0, 38.0, 37.0, 17.0, 10.0, 13.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.25, -52.52490234375, -50.7998046875, -49.07470703125, -47.349609375, -45.62451171875, -43.8994140625, -42.17431640625, -40.44921875, -38.72412109375, -36.9990234375, -35.27392578125, -33.548828125, -31.82373046875, -30.0986328125, -28.37353515625, -26.6484375, -24.92333984375, -23.1982421875, -21.47314453125, -19.748046875, -18.02294921875, -16.2978515625, -14.57275390625, -12.84765625, -11.12255859375, -9.3974609375, -7.67236328125, -5.947265625, -4.22216796875, -2.4970703125, -0.77197265625, 0.953125, 2.67822265625, 4.4033203125, 6.12841796875, 7.853515625, 9.57861328125, 11.3037109375, 13.02880859375, 14.75390625, 16.47900390625, 18.2041015625, 19.92919921875, 21.654296875, 23.37939453125, 25.1044921875, 26.82958984375, 28.5546875, 30.27978515625, 32.0048828125, 33.72998046875, 35.455078125, 37.18017578125, 38.9052734375, 40.63037109375, 42.35546875, 44.08056640625, 45.8056640625, 47.53076171875, 49.255859375, 50.98095703125, 52.7060546875, 54.43115234375, 56.15625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 49.0, 286.0, 456.0, 176.0, 29.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.35960388183594, -204.20941162109375, -200.05921936035156, -195.90902709960938, -191.7588348388672, -187.608642578125, -183.4584503173828, -179.30825805664062, -175.15806579589844, -171.00787353515625, -166.85768127441406, -162.70748901367188, -158.5572967529297, -154.4071044921875, -150.2569122314453, -146.10671997070312, -141.95654296875, -137.8063507080078, -133.65615844726562, -129.50596618652344, -125.35577392578125, -121.20558166503906, -117.05538940429688, -112.90519714355469, -108.7550048828125, -104.60481262207031, -100.45462036132812, -96.30442810058594, -92.15423583984375, -88.00404357910156, -83.85385131835938, -79.70365905761719, -75.55348205566406, -71.40328979492188, -67.25309753417969, -63.1029052734375, -58.95271301269531, -54.802520751953125, -50.6523323059082, -46.502140045166016, -42.35194396972656, -38.201751708984375, -34.05155944824219, -29.901369094848633, -25.751176834106445, -21.600984573364258, -17.450794219970703, -13.300601959228516, -9.150409698486328, -5.000217914581299, -0.8500261306762695, 3.3001651763916016, 7.450357437133789, 11.600549697875977, 15.750740051269531, 19.90093231201172, 24.051124572753906, 28.201316833496094, 32.35150909423828, 36.50170135498047, 40.651893615722656, 44.802085876464844, 48.952274322509766, 53.10246658325195, 57.25265884399414]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 2.0, 15.0, 10.0, 21.0, 9.0, 29.0, 36.0, 28.0, 36.0, 35.0, 33.0, 46.0, 47.0, 45.0, 65.0, 64.0, 53.0, 47.0, 47.0, 41.0, 42.0, 34.0, 31.0, 24.0, 19.0, 29.0, 19.0, 19.0, 22.0, 18.0, 6.0, 9.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.763336181640625, -59.1818733215332, -57.60041427612305, -56.018951416015625, -54.4374885559082, -52.85602569580078, -51.274566650390625, -49.6931037902832, -48.11164093017578, -46.53017807006836, -44.9487190246582, -43.36725616455078, -41.78579330444336, -40.20433044433594, -38.62287139892578, -37.04140853881836, -35.45994567871094, -33.878482818603516, -32.29702377319336, -30.715560913085938, -29.134098052978516, -27.552637100219727, -25.971176147460938, -24.389713287353516, -22.80825424194336, -21.22679328918457, -19.64533042907715, -18.06386947631836, -16.482406616210938, -14.900945663452148, -13.319483757019043, -11.738021850585938, -10.156558990478516, -8.57509708404541, -6.993635177612305, -5.412173748016357, -3.830711841583252, -2.2492499351501465, -0.6677885055541992, 0.9136734008789062, 2.4951353073120117, 4.076597213745117, 5.658059120178223, 7.23952054977417, 8.820981979370117, 10.402444839477539, 11.983905792236328, 13.565367698669434, 15.146829605102539, 16.728290557861328, 18.30975341796875, 19.89121437072754, 21.47267723083496, 23.05413818359375, 24.635601043701172, 26.21706199645996, 27.79852294921875, 29.37998390197754, 30.96144676208496, 32.54290771484375, 34.12437057495117, 35.705833435058594, 37.28729248046875, 38.86875534057617, 40.450218200683594]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 5.0, 6.0, 6.0, 7.0, 18.0, 9.0, 17.0, 11.0, 13.0, 29.0, 23.0, 13.0, 28.0, 34.0, 27.0, 32.0, 33.0, 37.0, 33.0, 26.0, 37.0, 39.0, 34.0, 46.0, 38.0, 39.0, 36.0, 46.0, 41.0, 24.0, 27.0, 24.0, 18.0, 20.0, 20.0, 22.0, 7.0, 12.0, 12.0, 7.0, 11.0, 11.0, 6.0, 5.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.33203125, -4.20794677734375, -4.0838623046875, -3.95977783203125, -3.835693359375, -3.71160888671875, -3.5875244140625, -3.46343994140625, -3.33935546875, -3.21527099609375, -3.0911865234375, -2.96710205078125, -2.843017578125, -2.71893310546875, -2.5948486328125, -2.47076416015625, -2.3466796875, -2.22259521484375, -2.0985107421875, -1.97442626953125, -1.850341796875, -1.72625732421875, -1.6021728515625, -1.47808837890625, -1.35400390625, -1.22991943359375, -1.1058349609375, -0.98175048828125, -0.857666015625, -0.73358154296875, -0.6094970703125, -0.48541259765625, -0.361328125, -0.23724365234375, -0.1131591796875, 0.01092529296875, 0.135009765625, 0.25909423828125, 0.3831787109375, 0.50726318359375, 0.63134765625, 0.75543212890625, 0.8795166015625, 1.00360107421875, 1.127685546875, 1.25177001953125, 1.3758544921875, 1.49993896484375, 1.6240234375, 1.74810791015625, 1.8721923828125, 1.99627685546875, 2.120361328125, 2.24444580078125, 2.3685302734375, 2.49261474609375, 2.61669921875, 2.74078369140625, 2.8648681640625, 2.98895263671875, 3.113037109375, 3.23712158203125, 3.3612060546875, 3.48529052734375, 3.609375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 15.0, 23.0, 35.0, 47.0, 67.0, 102.0, 168.0, 259.0, 350.0, 529.0, 778.0, 1128.0, 1731.0, 2411.0, 3496.0, 5204.0, 7509.0, 10903.0, 16256.0, 24261.0, 37338.0, 60027.0, 100050.0, 197008.0, 263016.0, 118299.0, 69551.0, 42614.0, 27724.0, 18304.0, 12454.0, 8394.0, 5934.0, 3922.0, 2770.0, 1865.0, 1293.0, 870.0, 565.0, 451.0, 274.0, 178.0, 123.0, 86.0, 62.0, 36.0, 18.0, 20.0, 12.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.87060546875, -0.8435287475585938, -0.8164520263671875, -0.7893753051757812, -0.762298583984375, -0.7352218627929688, -0.7081451416015625, -0.6810684204101562, -0.65399169921875, -0.6269149780273438, -0.5998382568359375, -0.5727615356445312, -0.545684814453125, -0.5186080932617188, -0.4915313720703125, -0.46445465087890625, -0.4373779296875, -0.41030120849609375, -0.3832244873046875, -0.35614776611328125, -0.329071044921875, -0.30199432373046875, -0.2749176025390625, -0.24784088134765625, -0.22076416015625, -0.19368743896484375, -0.1666107177734375, -0.13953399658203125, -0.112457275390625, -0.08538055419921875, -0.0583038330078125, -0.03122711181640625, -0.004150390625, 0.02292633056640625, 0.0500030517578125, 0.07707977294921875, 0.104156494140625, 0.13123321533203125, 0.1583099365234375, 0.18538665771484375, 0.21246337890625, 0.23954010009765625, 0.2666168212890625, 0.29369354248046875, 0.320770263671875, 0.34784698486328125, 0.3749237060546875, 0.40200042724609375, 0.4290771484375, 0.45615386962890625, 0.4832305908203125, 0.5103073120117188, 0.537384033203125, 0.5644607543945312, 0.5915374755859375, 0.6186141967773438, 0.64569091796875, 0.6727676391601562, 0.6998443603515625, 0.7269210815429688, 0.753997802734375, 0.7810745239257812, 0.8081512451171875, 0.8352279663085938, 0.8623046875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 3.0, 6.0, 10.0, 12.0, 8.0, 13.0, 14.0, 17.0, 17.0, 18.0, 32.0, 23.0, 21.0, 26.0, 38.0, 40.0, 27.0, 36.0, 40.0, 39.0, 42.0, 1065.0, 32.0, 31.0, 40.0, 30.0, 30.0, 37.0, 26.0, 32.0, 29.0, 20.0, 32.0, 16.0, 19.0, 4.0, 17.0, 16.0, 10.0, 15.0, 7.0, 15.0, 2.0, 7.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3515625, -2.274383544921875, -2.19720458984375, -2.120025634765625, -2.0428466796875, -1.965667724609375, -1.88848876953125, -1.811309814453125, -1.734130859375, -1.656951904296875, -1.57977294921875, -1.502593994140625, -1.4254150390625, -1.348236083984375, -1.27105712890625, -1.193878173828125, -1.11669921875, -1.039520263671875, -0.96234130859375, -0.885162353515625, -0.8079833984375, -0.730804443359375, -0.65362548828125, -0.576446533203125, -0.499267578125, -0.422088623046875, -0.34490966796875, -0.267730712890625, -0.1905517578125, -0.113372802734375, -0.03619384765625, 0.040985107421875, 0.1181640625, 0.195343017578125, 0.27252197265625, 0.349700927734375, 0.4268798828125, 0.504058837890625, 0.58123779296875, 0.658416748046875, 0.735595703125, 0.812774658203125, 0.88995361328125, 0.967132568359375, 1.0443115234375, 1.121490478515625, 1.19866943359375, 1.275848388671875, 1.35302734375, 1.430206298828125, 1.50738525390625, 1.584564208984375, 1.6617431640625, 1.738922119140625, 1.81610107421875, 1.893280029296875, 1.970458984375, 2.047637939453125, 2.12481689453125, 2.201995849609375, 2.2791748046875, 2.356353759765625, 2.43353271484375, 2.510711669921875, 2.587890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 15.0, 21.0, 34.0, 45.0, 57.0, 96.0, 129.0, 205.0, 290.0, 418.0, 604.0, 839.0, 1286.0, 1892.0, 2800.0, 4035.0, 6060.0, 8778.0, 13040.0, 18893.0, 28363.0, 43023.0, 67525.0, 112821.0, 1294654.0, 205615.0, 101835.0, 62492.0, 39703.0, 26511.0, 17594.0, 11952.0, 8228.0, 5635.0, 3833.0, 2508.0, 1702.0, 1174.0, 771.0, 543.0, 359.0, 259.0, 148.0, 117.0, 70.0, 56.0, 36.0, 21.0, 15.0, 13.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7468338012695312, -0.7226715087890625, -0.6985092163085938, -0.674346923828125, -0.6501846313476562, -0.6260223388671875, -0.6018600463867188, -0.57769775390625, -0.5535354614257812, -0.5293731689453125, -0.5052108764648438, -0.481048583984375, -0.45688629150390625, -0.4327239990234375, -0.40856170654296875, -0.3843994140625, -0.36023712158203125, -0.3360748291015625, -0.31191253662109375, -0.287750244140625, -0.26358795166015625, -0.2394256591796875, -0.21526336669921875, -0.19110107421875, -0.16693878173828125, -0.1427764892578125, -0.11861419677734375, -0.094451904296875, -0.07028961181640625, -0.0461273193359375, -0.02196502685546875, 0.002197265625, 0.02635955810546875, 0.0505218505859375, 0.07468414306640625, 0.098846435546875, 0.12300872802734375, 0.1471710205078125, 0.17133331298828125, 0.19549560546875, 0.21965789794921875, 0.2438201904296875, 0.26798248291015625, 0.292144775390625, 0.31630706787109375, 0.3404693603515625, 0.36463165283203125, 0.3887939453125, 0.41295623779296875, 0.4371185302734375, 0.46128082275390625, 0.485443115234375, 0.5096054077148438, 0.5337677001953125, 0.5579299926757812, 0.58209228515625, 0.6062545776367188, 0.6304168701171875, 0.6545791625976562, 0.678741455078125, 0.7029037475585938, 0.7270660400390625, 0.7512283325195312, 0.775390625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 10.0, 7.0, 8.0, 13.0, 15.0, 24.0, 37.0, 34.0, 39.0, 71.0, 100.0, 102.0, 117.0, 99.0, 68.0, 55.0, 39.0, 26.0, 28.0, 16.0, 14.0, 9.0, 8.0, 13.0, 7.0, 8.0, 6.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0006685256958007812, -0.0006477087736129761, -0.0006268918514251709, -0.0006060749292373657, -0.0005852580070495605, -0.0005644410848617554, -0.0005436241626739502, -0.000522807240486145, -0.0005019903182983398, -0.00048117339611053467, -0.0004603564739227295, -0.0004395395517349243, -0.00041872262954711914, -0.00039790570735931396, -0.0003770887851715088, -0.0003562718629837036, -0.00033545494079589844, -0.00031463801860809326, -0.0002938210964202881, -0.0002730041742324829, -0.00025218725204467773, -0.00023137032985687256, -0.00021055340766906738, -0.0001897364854812622, -0.00016891956329345703, -0.00014810264110565186, -0.00012728571891784668, -0.0001064687967300415, -8.565187454223633e-05, -6.483495235443115e-05, -4.4018030166625977e-05, -2.32011079788208e-05, -2.384185791015625e-06, 1.843273639678955e-05, 3.9249658584594727e-05, 6.00665807723999e-05, 8.088350296020508e-05, 0.00010170042514801025, 0.00012251734733581543, 0.0001433342695236206, 0.00016415119171142578, 0.00018496811389923096, 0.00020578503608703613, 0.0002266019582748413, 0.0002474188804626465, 0.00026823580265045166, 0.00028905272483825684, 0.000309869647026062, 0.0003306865692138672, 0.00035150349140167236, 0.00037232041358947754, 0.0003931373357772827, 0.0004139542579650879, 0.00043477118015289307, 0.00045558810234069824, 0.0004764050245285034, 0.0004972219467163086, 0.0005180388689041138, 0.0005388557910919189, 0.0005596727132797241, 0.0005804896354675293, 0.0006013065576553345, 0.0006221234798431396, 0.0006429404020309448, 0.00066375732421875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 12.0, 14.0, 17.0, 19.0, 12.0, 22.0, 30.0, 50.0, 46.0, 63.0, 77.0, 136.0, 196.0, 310.0, 414.0, 811.0, 712401.0, 331714.0, 762.0, 435.0, 292.0, 170.0, 132.0, 104.0, 65.0, 47.0, 46.0, 37.0, 26.0, 14.0, 10.0, 9.0, 5.0, 9.0, 6.0, 7.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.011383056640625, -0.011027097702026367, -0.010671138763427734, -0.010315179824829102, -0.009959220886230469, -0.009603261947631836, -0.009247303009033203, -0.00889134407043457, -0.008535385131835938, -0.008179426193237305, -0.007823467254638672, -0.007467508316040039, -0.007111549377441406, -0.0067555904388427734, -0.006399631500244141, -0.006043672561645508, -0.005687713623046875, -0.005331754684448242, -0.004975795745849609, -0.0046198368072509766, -0.004263877868652344, -0.003907918930053711, -0.003551959991455078, -0.0031960010528564453, -0.0028400421142578125, -0.0024840831756591797, -0.002128124237060547, -0.001772165298461914, -0.0014162063598632812, -0.0010602474212646484, -0.0007042884826660156, -0.0003483295440673828, 7.62939453125e-06, 0.0003635883331298828, 0.0007195472717285156, 0.0010755062103271484, 0.0014314651489257812, 0.001787424087524414, 0.002143383026123047, 0.0024993419647216797, 0.0028553009033203125, 0.0032112598419189453, 0.003567218780517578, 0.003923177719116211, 0.004279136657714844, 0.0046350955963134766, 0.004991054534912109, 0.005347013473510742, 0.005702972412109375, 0.006058931350708008, 0.006414890289306641, 0.0067708492279052734, 0.007126808166503906, 0.007482767105102539, 0.007838726043701172, 0.008194684982299805, 0.008550643920898438, 0.00890660285949707, 0.009262561798095703, 0.009618520736694336, 0.009974479675292969, 0.010330438613891602, 0.010686397552490234, 0.011042356491088867, 0.0113983154296875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 10.0, 962.0, 45.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001487051136791706, -0.0014111509080976248, -0.0013352505629882216, -0.0012593503342941403, -0.0011834499891847372, -0.001107549760490656, -0.0010316495317965746, -0.0009557492448948324, -0.0008798489579930902, -0.0008039486710913479, -0.0007280483841896057, -0.0006521481554955244, -0.0005762478685937822, -0.00050034758169204, -0.0004244473238941282, -0.00034854706609621644, -0.0002726467791944742, -0.00019674650684464723, -0.00012084623449482024, -4.4945962144993246e-05, 3.0954310204833746e-05, 0.00010685459710657597, 0.00018275485490448773, 0.0002586551127023995, 0.0003345553996041417, 0.00041045568650588393, 0.0004863559443037957, 0.0005622562021017075, 0.0006381564890034497, 0.0007140567759051919, 0.0007899570045992732, 0.0008658572915010154, 0.000941757345572114, 0.0010176575742661953, 0.0010935579193755984, 0.0011694581480696797, 0.0012453584931790829, 0.0013212587218731642, 0.0013971589505672455, 0.0014730591792613268, 0.00154895952437073, 0.0016248597530648112, 0.0017007600981742144, 0.0017766603268682957, 0.001852560555562377, 0.0019284609006717801, 0.0020043612457811832, 0.0020802614744752645, 0.002156161703169346, 0.002232061931863427, 0.0023079621605575085, 0.0023838626220822334, 0.0024597628507763147, 0.002535663079470396, 0.0026115633081644773, 0.0026874635368585587, 0.0027633639983832836, 0.002839264227077365, 0.0029151644557714462, 0.002991064917296171, 0.0030669651459902525, 0.003142865374684334, 0.003218765603378415, 0.0032946658320724964, 0.0033705660607665777]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 11.0, 10.0, 12.0, 12.0, 11.0, 23.0, 21.0, 27.0, 25.0, 40.0, 42.0, 38.0, 32.0, 36.0, 54.0, 53.0, 40.0, 48.0, 49.0, 48.0, 48.0, 41.0, 37.0, 37.0, 45.0, 35.0, 25.0, 19.0, 20.0, 11.0, 10.0, 15.0, 5.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003020167350769043, -0.00029215216636657715, -0.00028228759765625, -0.00027242302894592285, -0.0002625584602355957, -0.00025269389152526855, -0.0002428293228149414, -0.00023296475410461426, -0.0002231001853942871, -0.00021323561668395996, -0.0002033710479736328, -0.00019350647926330566, -0.00018364191055297852, -0.00017377734184265137, -0.00016391277313232422, -0.00015404820442199707, -0.00014418363571166992, -0.00013431906700134277, -0.00012445449829101562, -0.00011458992958068848, -0.00010472536087036133, -9.486079216003418e-05, -8.499622344970703e-05, -7.513165473937988e-05, -6.526708602905273e-05, -5.5402517318725586e-05, -4.553794860839844e-05, -3.567337989807129e-05, -2.580881118774414e-05, -1.5944242477416992e-05, -6.079673767089844e-06, 3.7848949432373047e-06, 1.3649463653564453e-05, 2.35140323638916e-05, 3.337860107421875e-05, 4.32431697845459e-05, 5.310773849487305e-05, 6.29723072052002e-05, 7.283687591552734e-05, 8.270144462585449e-05, 9.256601333618164e-05, 0.00010243058204650879, 0.00011229515075683594, 0.00012215971946716309, 0.00013202428817749023, 0.00014188885688781738, 0.00015175342559814453, 0.00016161799430847168, 0.00017148256301879883, 0.00018134713172912598, 0.00019121170043945312, 0.00020107626914978027, 0.00021094083786010742, 0.00022080540657043457, 0.00023066997528076172, 0.00024053454399108887, 0.000250399112701416, 0.00026026368141174316, 0.0002701282501220703, 0.00027999281883239746, 0.0002898573875427246, 0.00029972195625305176, 0.0003095865249633789, 0.00031945109367370605, 0.0003293156623840332]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 5.0, 6.0, 6.0, 7.0, 18.0, 9.0, 17.0, 11.0, 13.0, 29.0, 23.0, 13.0, 28.0, 34.0, 27.0, 32.0, 33.0, 37.0, 33.0, 26.0, 37.0, 39.0, 34.0, 46.0, 38.0, 39.0, 36.0, 46.0, 41.0, 24.0, 27.0, 24.0, 18.0, 20.0, 20.0, 22.0, 7.0, 12.0, 12.0, 7.0, 11.0, 11.0, 6.0, 5.0, 4.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.33203125, -4.20794677734375, -4.0838623046875, -3.95977783203125, -3.835693359375, -3.71160888671875, -3.5875244140625, -3.46343994140625, -3.33935546875, -3.21527099609375, -3.0911865234375, -2.96710205078125, -2.843017578125, -2.71893310546875, -2.5948486328125, -2.47076416015625, -2.3466796875, -2.22259521484375, -2.0985107421875, -1.97442626953125, -1.850341796875, -1.72625732421875, -1.6021728515625, -1.47808837890625, -1.35400390625, -1.22991943359375, -1.1058349609375, -0.98175048828125, -0.857666015625, -0.73358154296875, -0.6094970703125, -0.48541259765625, -0.361328125, -0.23724365234375, -0.1131591796875, 0.01092529296875, 0.135009765625, 0.25909423828125, 0.3831787109375, 0.50726318359375, 0.63134765625, 0.75543212890625, 0.8795166015625, 1.00360107421875, 1.127685546875, 1.25177001953125, 1.3758544921875, 1.49993896484375, 1.6240234375, 1.74810791015625, 1.8721923828125, 1.99627685546875, 2.120361328125, 2.24444580078125, 2.3685302734375, 2.49261474609375, 2.61669921875, 2.74078369140625, 2.8648681640625, 2.98895263671875, 3.113037109375, 3.23712158203125, 3.3612060546875, 3.48529052734375, 3.609375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 6.0, 7.0, 7.0, 15.0, 21.0, 25.0, 30.0, 49.0, 63.0, 89.0, 117.0, 152.0, 232.0, 296.0, 419.0, 584.0, 735.0, 1179.0, 1614.0, 2305.0, 3446.0, 6264.0, 12782.0, 55394.0, 867719.0, 63600.0, 13503.0, 6068.0, 3702.0, 2388.0, 1605.0, 1158.0, 867.0, 561.0, 429.0, 285.0, 231.0, 168.0, 114.0, 89.0, 71.0, 44.0, 35.0, 29.0, 22.0, 10.0, 8.0, 10.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-29.4375, -28.532470703125, -27.62744140625, -26.722412109375, -25.8173828125, -24.912353515625, -24.00732421875, -23.102294921875, -22.197265625, -21.292236328125, -20.38720703125, -19.482177734375, -18.5771484375, -17.672119140625, -16.76708984375, -15.862060546875, -14.95703125, -14.052001953125, -13.14697265625, -12.241943359375, -11.3369140625, -10.431884765625, -9.52685546875, -8.621826171875, -7.716796875, -6.811767578125, -5.90673828125, -5.001708984375, -4.0966796875, -3.191650390625, -2.28662109375, -1.381591796875, -0.4765625, 0.428466796875, 1.33349609375, 2.238525390625, 3.1435546875, 4.048583984375, 4.95361328125, 5.858642578125, 6.763671875, 7.668701171875, 8.57373046875, 9.478759765625, 10.3837890625, 11.288818359375, 12.19384765625, 13.098876953125, 14.00390625, 14.908935546875, 15.81396484375, 16.718994140625, 17.6240234375, 18.529052734375, 19.43408203125, 20.339111328125, 21.244140625, 22.149169921875, 23.05419921875, 23.959228515625, 24.8642578125, 25.769287109375, 26.67431640625, 27.579345703125, 28.484375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 3.0, 5.0, 8.0, 10.0, 12.0, 14.0, 18.0, 24.0, 23.0, 24.0, 28.0, 21.0, 43.0, 39.0, 37.0, 37.0, 57.0, 92.0, 446.0, 1524.0, 129.0, 68.0, 56.0, 47.0, 45.0, 38.0, 39.0, 33.0, 24.0, 18.0, 11.0, 20.0, 17.0, 8.0, 11.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.3944091796875, -11.952880859375, -11.5113525390625, -11.06982421875, -10.6282958984375, -10.186767578125, -9.7452392578125, -9.3037109375, -8.8621826171875, -8.420654296875, -7.9791259765625, -7.53759765625, -7.0960693359375, -6.654541015625, -6.2130126953125, -5.771484375, -5.3299560546875, -4.888427734375, -4.4468994140625, -4.00537109375, -3.5638427734375, -3.122314453125, -2.6807861328125, -2.2392578125, -1.7977294921875, -1.356201171875, -0.9146728515625, -0.47314453125, -0.0316162109375, 0.409912109375, 0.8514404296875, 1.29296875, 1.7344970703125, 2.176025390625, 2.6175537109375, 3.05908203125, 3.5006103515625, 3.942138671875, 4.3836669921875, 4.8251953125, 5.2667236328125, 5.708251953125, 6.1497802734375, 6.59130859375, 7.0328369140625, 7.474365234375, 7.9158935546875, 8.357421875, 8.7989501953125, 9.240478515625, 9.6820068359375, 10.12353515625, 10.5650634765625, 11.006591796875, 11.4481201171875, 11.8896484375, 12.3311767578125, 12.772705078125, 13.2142333984375, 13.65576171875, 14.0972900390625, 14.538818359375, 14.9803466796875, 15.421875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 7.0, 10.0, 15.0, 17.0, 22.0, 21.0, 22.0, 30.0, 41.0, 48.0, 56.0, 92.0, 196.0, 687.0, 12754.0, 3127987.0, 2720.0, 444.0, 150.0, 72.0, 51.0, 47.0, 25.0, 25.0, 24.0, 25.0, 25.0, 24.0, 9.0, 7.0, 12.0, 9.0, 4.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.25, -70.20654296875, -68.1630859375, -66.11962890625, -64.076171875, -62.03271484375, -59.9892578125, -57.94580078125, -55.90234375, -53.85888671875, -51.8154296875, -49.77197265625, -47.728515625, -45.68505859375, -43.6416015625, -41.59814453125, -39.5546875, -37.51123046875, -35.4677734375, -33.42431640625, -31.380859375, -29.33740234375, -27.2939453125, -25.25048828125, -23.20703125, -21.16357421875, -19.1201171875, -17.07666015625, -15.033203125, -12.98974609375, -10.9462890625, -8.90283203125, -6.859375, -4.81591796875, -2.7724609375, -0.72900390625, 1.314453125, 3.35791015625, 5.4013671875, 7.44482421875, 9.48828125, 11.53173828125, 13.5751953125, 15.61865234375, 17.662109375, 19.70556640625, 21.7490234375, 23.79248046875, 25.8359375, 27.87939453125, 29.9228515625, 31.96630859375, 34.009765625, 36.05322265625, 38.0966796875, 40.14013671875, 42.18359375, 44.22705078125, 46.2705078125, 48.31396484375, 50.357421875, 52.40087890625, 54.4443359375, 56.48779296875, 58.53125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 15.0, 114.0, 600.0, 264.0, 17.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.5019302368164, -87.7023696899414, -85.90280151367188, -84.10324096679688, -82.30367279052734, -80.50411224365234, -78.70454406738281, -76.90498352050781, -75.10542297363281, -73.30586242675781, -71.50629425048828, -69.70673370361328, -67.90716552734375, -66.10760498046875, -64.30804443359375, -62.50847625732422, -60.70891189575195, -58.90934753417969, -57.10978317260742, -55.310218811035156, -53.510658264160156, -51.71109390258789, -49.911529541015625, -48.11196517944336, -46.312400817871094, -44.51283645629883, -42.71327209472656, -40.91371154785156, -39.1141471862793, -37.31458282470703, -35.515018463134766, -33.7154541015625, -31.9158935546875, -30.116329193115234, -28.3167667388916, -26.517202377319336, -24.717639923095703, -22.918075561523438, -21.118511199951172, -19.318946838378906, -17.519384384155273, -15.719820976257324, -13.920257568359375, -12.12069320678711, -10.32112979888916, -8.521566390991211, -6.722002029418945, -4.922438621520996, -3.122875213623047, -1.3233115673065186, 0.47625207901000977, 2.275815963745117, 4.075379371643066, 5.874942779541016, 7.674507141113281, 9.47407054901123, 11.27363395690918, 13.073197364807129, 14.872760772705078, 16.672325134277344, 18.47188949584961, 20.271451950073242, 22.071016311645508, 23.87057876586914, 25.670143127441406]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 9.0, 10.0, 13.0, 14.0, 16.0, 22.0, 25.0, 20.0, 39.0, 33.0, 27.0, 42.0, 34.0, 36.0, 38.0, 33.0, 48.0, 48.0, 43.0, 47.0, 35.0, 45.0, 37.0, 36.0, 31.0, 22.0, 31.0, 28.0, 33.0, 16.0, 12.0, 16.0, 9.0, 12.0, 2.0, 9.0, 7.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.31623458862305, -41.987945556640625, -40.6596565246582, -39.33136749267578, -38.003074645996094, -36.67478561401367, -35.34649658203125, -34.01820755004883, -32.689918518066406, -31.361629486083984, -30.033340454101562, -28.705049514770508, -27.376760482788086, -26.048471450805664, -24.72018051147461, -23.391891479492188, -22.063602447509766, -20.735313415527344, -19.407024383544922, -18.078733444213867, -16.750444412231445, -15.422155380249023, -14.093865394592285, -12.765575408935547, -11.437286376953125, -10.108997344970703, -8.780707359313965, -7.452417850494385, -6.124128341674805, -4.795838832855225, -3.4675493240356445, -2.1392593383789062, -0.81097412109375, 0.5173153877258301, 1.8456048965454102, 3.1738944053649902, 4.50218391418457, 5.83047342300415, 7.1587629318237305, 8.487052917480469, 9.81534194946289, 11.143630981445312, 12.47192096710205, 13.800210952758789, 15.128499984741211, 16.456789016723633, 17.785079956054688, 19.11336898803711, 20.44165802001953, 21.769947052001953, 23.098236083984375, 24.42652702331543, 25.75481605529785, 27.083105087280273, 28.411396026611328, 29.73968505859375, 31.067974090576172, 32.396263122558594, 33.724552154541016, 35.05284118652344, 36.381134033203125, 37.70942306518555, 39.03771209716797, 40.36600112915039, 41.69429016113281]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 11.0, 8.0, 5.0, 12.0, 9.0, 13.0, 10.0, 19.0, 15.0, 17.0, 17.0, 27.0, 31.0, 25.0, 29.0, 34.0, 37.0, 31.0, 25.0, 36.0, 41.0, 34.0, 44.0, 33.0, 36.0, 35.0, 43.0, 36.0, 43.0, 33.0, 27.0, 24.0, 23.0, 15.0, 30.0, 8.0, 12.0, 14.0, 13.0, 10.0, 6.0, 12.0, 6.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.34375, -4.2125244140625, -4.081298828125, -3.9500732421875, -3.81884765625, -3.6876220703125, -3.556396484375, -3.4251708984375, -3.2939453125, -3.1627197265625, -3.031494140625, -2.9002685546875, -2.76904296875, -2.6378173828125, -2.506591796875, -2.3753662109375, -2.244140625, -2.1129150390625, -1.981689453125, -1.8504638671875, -1.71923828125, -1.5880126953125, -1.456787109375, -1.3255615234375, -1.1943359375, -1.0631103515625, -0.931884765625, -0.8006591796875, -0.66943359375, -0.5382080078125, -0.406982421875, -0.2757568359375, -0.14453125, -0.0133056640625, 0.117919921875, 0.2491455078125, 0.38037109375, 0.5115966796875, 0.642822265625, 0.7740478515625, 0.9052734375, 1.0364990234375, 1.167724609375, 1.2989501953125, 1.43017578125, 1.5614013671875, 1.692626953125, 1.8238525390625, 1.955078125, 2.0863037109375, 2.217529296875, 2.3487548828125, 2.47998046875, 2.6112060546875, 2.742431640625, 2.8736572265625, 3.0048828125, 3.1361083984375, 3.267333984375, 3.3985595703125, 3.52978515625, 3.6610107421875, 3.792236328125, 3.9234619140625, 4.0546875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 10.0, 7.0, 11.0, 11.0, 9.0, 22.0, 23.0, 29.0, 50.0, 69.0, 113.0, 163.0, 240.0, 464.0, 783.0, 1536.0, 3067.0, 6628.0, 15363.0, 50444.0, 1186286.0, 2810703.0, 82934.0, 20417.0, 7838.0, 3324.0, 1672.0, 848.0, 445.0, 265.0, 164.0, 101.0, 76.0, 44.0, 33.0, 32.0, 11.0, 5.0, 14.0, 8.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.0, -27.1005859375, -26.201171875, -25.3017578125, -24.40234375, -23.5029296875, -22.603515625, -21.7041015625, -20.8046875, -19.9052734375, -19.005859375, -18.1064453125, -17.20703125, -16.3076171875, -15.408203125, -14.5087890625, -13.609375, -12.7099609375, -11.810546875, -10.9111328125, -10.01171875, -9.1123046875, -8.212890625, -7.3134765625, -6.4140625, -5.5146484375, -4.615234375, -3.7158203125, -2.81640625, -1.9169921875, -1.017578125, -0.1181640625, 0.78125, 1.6806640625, 2.580078125, 3.4794921875, 4.37890625, 5.2783203125, 6.177734375, 7.0771484375, 7.9765625, 8.8759765625, 9.775390625, 10.6748046875, 11.57421875, 12.4736328125, 13.373046875, 14.2724609375, 15.171875, 16.0712890625, 16.970703125, 17.8701171875, 18.76953125, 19.6689453125, 20.568359375, 21.4677734375, 22.3671875, 23.2666015625, 24.166015625, 25.0654296875, 25.96484375, 26.8642578125, 27.763671875, 28.6630859375, 29.5625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 11.0, 15.0, 30.0, 62.0, 124.0, 241.0, 627.0, 1282.0, 979.0, 394.0, 168.0, 73.0, 39.0, 18.0, 16.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.6875, -65.1640625, -63.640625, -62.1171875, -60.59375, -59.0703125, -57.546875, -56.0234375, -54.5, -52.9765625, -51.453125, -49.9296875, -48.40625, -46.8828125, -45.359375, -43.8359375, -42.3125, -40.7890625, -39.265625, -37.7421875, -36.21875, -34.6953125, -33.171875, -31.6484375, -30.125, -28.6015625, -27.078125, -25.5546875, -24.03125, -22.5078125, -20.984375, -19.4609375, -17.9375, -16.4140625, -14.890625, -13.3671875, -11.84375, -10.3203125, -8.796875, -7.2734375, -5.75, -4.2265625, -2.703125, -1.1796875, 0.34375, 1.8671875, 3.390625, 4.9140625, 6.4375, 7.9609375, 9.484375, 11.0078125, 12.53125, 14.0546875, 15.578125, 17.1015625, 18.625, 20.1484375, 21.671875, 23.1953125, 24.71875, 26.2421875, 27.765625, 29.2890625, 30.8125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 18.0, 24.0, 31.0, 77.0, 178.0, 396.0, 2609.0, 4188185.0, 1995.0, 406.0, 183.0, 82.0, 46.0, 30.0, 13.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.5, -83.78125, -77.0625, -70.34375, -63.625, -56.90625, -50.1875, -43.46875, -36.75, -30.03125, -23.3125, -16.59375, -9.875, -3.15625, 3.5625, 10.28125, 17.0, 23.71875, 30.4375, 37.15625, 43.875, 50.59375, 57.3125, 64.03125, 70.75, 77.46875, 84.1875, 90.90625, 97.625, 104.34375, 111.0625, 117.78125, 124.5, 131.21875, 137.9375, 144.65625, 151.375, 158.09375, 164.8125, 171.53125, 178.25, 184.96875, 191.6875, 198.40625, 205.125, 211.84375, 218.5625, 225.28125, 232.0, 238.71875, 245.4375, 252.15625, 258.875, 265.59375, 272.3125, 279.03125, 285.75, 292.46875, 299.1875, 305.90625, 312.625, 319.34375, 326.0625, 332.78125, 339.5]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 18.0, 83.0, 258.0, 353.0, 222.0, 64.0, 9.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.7776870727539, -80.0458984375, -76.31410217285156, -72.58230590820312, -68.85051727294922, -65.11872863769531, -61.386932373046875, -57.6551399230957, -53.92334747314453, -50.19155502319336, -46.45976257324219, -42.727970123291016, -38.996177673339844, -35.26438522338867, -31.5325927734375, -27.800800323486328, -24.069007873535156, -20.337215423583984, -16.605422973632812, -12.87363052368164, -9.141838073730469, -5.410045623779297, -1.678253173828125, 2.053539276123047, 5.785331726074219, 9.51712417602539, 13.248916625976562, 16.980709075927734, 20.712501525878906, 24.444293975830078, 28.17608642578125, 31.907878875732422, 35.639678955078125, 39.3714714050293, 43.10326385498047, 46.83505630493164, 50.56684875488281, 54.298641204833984, 58.030433654785156, 61.76222610473633, 65.4940185546875, 69.22581481933594, 72.95760345458984, 76.68939208984375, 80.42118835449219, 84.15298461914062, 87.88477325439453, 91.61656188964844, 95.34835815429688, 99.08015441894531, 102.81194305419922, 106.54373168945312, 110.27552795410156, 114.00732421875, 117.7391128540039, 121.47090148925781, 125.20269775390625, 128.9344940185547, 132.66629028320312, 136.3980712890625, 140.12986755371094, 143.86166381835938, 147.59344482421875, 151.3252410888672, 155.05703735351562]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 5.0, 8.0, 9.0, 13.0, 21.0, 14.0, 19.0, 10.0, 21.0, 32.0, 22.0, 32.0, 27.0, 37.0, 49.0, 42.0, 44.0, 39.0, 49.0, 43.0, 44.0, 41.0, 37.0, 35.0, 46.0, 34.0, 39.0, 26.0, 22.0, 29.0, 18.0, 16.0, 16.0, 18.0, 11.0, 5.0, 4.0, 7.0, 3.0, 1.0, 2.0, 5.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-64.79257202148438, -62.469390869140625, -60.14620590209961, -57.82302474975586, -55.499839782714844, -53.176658630371094, -50.853477478027344, -48.53029251098633, -46.20710754394531, -43.88392639160156, -41.56074142456055, -39.2375602722168, -36.91437530517578, -34.59119415283203, -32.26801300048828, -29.944828033447266, -27.621646881103516, -25.298463821411133, -22.97528076171875, -20.652099609375, -18.328914642333984, -16.005733489990234, -13.682550430297852, -11.359367370605469, -9.036184310913086, -6.713001251220703, -4.3898186683654785, -2.066636085510254, 0.2565469741821289, 2.5797300338745117, 4.902912139892578, 7.226095199584961, 9.549278259277344, 11.872461318969727, 14.19564437866211, 16.51882553100586, 18.842010498046875, 21.165191650390625, 23.488374710083008, 25.81155776977539, 28.134740829467773, 30.457923889160156, 32.781105041503906, 35.10429000854492, 37.42747116088867, 39.75065612792969, 42.07383728027344, 44.39701843261719, 46.7202033996582, 49.04338455200195, 51.36656951904297, 53.68975067138672, 56.012935638427734, 58.336116790771484, 60.6593017578125, 62.98248291015625, 65.3056640625, 67.62884521484375, 69.9520263671875, 72.27521514892578, 74.59839630126953, 76.92157745361328, 79.24475860595703, 81.56794738769531, 83.89112854003906]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 8.0, 11.0, 9.0, 13.0, 15.0, 13.0, 19.0, 17.0, 25.0, 23.0, 25.0, 31.0, 29.0, 27.0, 31.0, 42.0, 42.0, 30.0, 25.0, 42.0, 51.0, 34.0, 37.0, 38.0, 23.0, 37.0, 38.0, 22.0, 26.0, 27.0, 18.0, 30.0, 18.0, 19.0, 12.0, 15.0, 12.0, 15.0, 6.0, 7.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0], "bins": [-4.51953125, -4.38641357421875, -4.2532958984375, -4.12017822265625, -3.987060546875, -3.85394287109375, -3.7208251953125, -3.58770751953125, -3.45458984375, -3.32147216796875, -3.1883544921875, -3.05523681640625, -2.922119140625, -2.78900146484375, -2.6558837890625, -2.52276611328125, -2.3896484375, -2.25653076171875, -2.1234130859375, -1.99029541015625, -1.857177734375, -1.72406005859375, -1.5909423828125, -1.45782470703125, -1.32470703125, -1.19158935546875, -1.0584716796875, -0.92535400390625, -0.792236328125, -0.65911865234375, -0.5260009765625, -0.39288330078125, -0.259765625, -0.12664794921875, 0.0064697265625, 0.13958740234375, 0.272705078125, 0.40582275390625, 0.5389404296875, 0.67205810546875, 0.80517578125, 0.93829345703125, 1.0714111328125, 1.20452880859375, 1.337646484375, 1.47076416015625, 1.6038818359375, 1.73699951171875, 1.8701171875, 2.00323486328125, 2.1363525390625, 2.26947021484375, 2.402587890625, 2.53570556640625, 2.6688232421875, 2.80194091796875, 2.93505859375, 3.06817626953125, 3.2012939453125, 3.33441162109375, 3.467529296875, 3.60064697265625, 3.7337646484375, 3.86688232421875, 4.0]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 6.0, 6.0, 10.0, 15.0, 21.0, 28.0, 53.0, 79.0, 129.0, 162.0, 232.0, 335.0, 453.0, 776.0, 1066.0, 1533.0, 2242.0, 3311.0, 4809.0, 7121.0, 10776.0, 16217.0, 24767.0, 38640.0, 61949.0, 103143.0, 206441.0, 255696.0, 116484.0, 68466.0, 42576.0, 27239.0, 17764.0, 11615.0, 7933.0, 5177.0, 3546.0, 2439.0, 1681.0, 1123.0, 785.0, 534.0, 379.0, 273.0, 182.0, 112.0, 70.0, 55.0, 45.0, 21.0, 15.0, 18.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.90380859375, -0.8737869262695312, -0.8437652587890625, -0.8137435913085938, -0.783721923828125, -0.7537002563476562, -0.7236785888671875, -0.6936569213867188, -0.66363525390625, -0.6336135864257812, -0.6035919189453125, -0.5735702514648438, -0.543548583984375, -0.5135269165039062, -0.4835052490234375, -0.45348358154296875, -0.4234619140625, -0.39344024658203125, -0.3634185791015625, -0.33339691162109375, -0.303375244140625, -0.27335357666015625, -0.2433319091796875, -0.21331024169921875, -0.18328857421875, -0.15326690673828125, -0.1232452392578125, -0.09322357177734375, -0.063201904296875, -0.03318023681640625, -0.0031585693359375, 0.02686309814453125, 0.056884765625, 0.08690643310546875, 0.1169281005859375, 0.14694976806640625, 0.176971435546875, 0.20699310302734375, 0.2370147705078125, 0.26703643798828125, 0.29705810546875, 0.32707977294921875, 0.3571014404296875, 0.38712310791015625, 0.417144775390625, 0.44716644287109375, 0.4771881103515625, 0.5072097778320312, 0.5372314453125, 0.5672531127929688, 0.5972747802734375, 0.6272964477539062, 0.657318115234375, 0.6873397827148438, 0.7173614501953125, 0.7473831176757812, 0.77740478515625, 0.8074264526367188, 0.8374481201171875, 0.8674697875976562, 0.897491455078125, 0.9275131225585938, 0.9575347900390625, 0.9875564575195312, 1.017578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 1.0, 6.0, 5.0, 8.0, 12.0, 13.0, 14.0, 16.0, 23.0, 25.0, 26.0, 31.0, 19.0, 39.0, 39.0, 36.0, 22.0, 49.0, 51.0, 45.0, 1061.0, 47.0, 40.0, 32.0, 37.0, 39.0, 44.0, 32.0, 33.0, 33.0, 30.0, 15.0, 23.0, 13.0, 6.0, 11.0, 11.0, 11.0, 13.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.171875, -3.074310302734375, -2.97674560546875, -2.879180908203125, -2.7816162109375, -2.684051513671875, -2.58648681640625, -2.488922119140625, -2.391357421875, -2.293792724609375, -2.19622802734375, -2.098663330078125, -2.0010986328125, -1.903533935546875, -1.80596923828125, -1.708404541015625, -1.61083984375, -1.513275146484375, -1.41571044921875, -1.318145751953125, -1.2205810546875, -1.123016357421875, -1.02545166015625, -0.927886962890625, -0.830322265625, -0.732757568359375, -0.63519287109375, -0.537628173828125, -0.4400634765625, -0.342498779296875, -0.24493408203125, -0.147369384765625, -0.0498046875, 0.047760009765625, 0.14532470703125, 0.242889404296875, 0.3404541015625, 0.438018798828125, 0.53558349609375, 0.633148193359375, 0.730712890625, 0.828277587890625, 0.92584228515625, 1.023406982421875, 1.1209716796875, 1.218536376953125, 1.31610107421875, 1.413665771484375, 1.51123046875, 1.608795166015625, 1.70635986328125, 1.803924560546875, 1.9014892578125, 1.999053955078125, 2.09661865234375, 2.194183349609375, 2.291748046875, 2.389312744140625, 2.48687744140625, 2.584442138671875, 2.6820068359375, 2.779571533203125, 2.87713623046875, 2.974700927734375, 3.072265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 10.0, 12.0, 19.0, 31.0, 33.0, 56.0, 82.0, 121.0, 168.0, 264.0, 390.0, 555.0, 841.0, 1298.0, 1950.0, 2863.0, 4276.0, 6854.0, 10389.0, 15984.0, 24789.0, 39128.0, 62290.0, 105847.0, 232791.0, 1298271.0, 110006.0, 64402.0, 40197.0, 25501.0, 16357.0, 10666.0, 7035.0, 4624.0, 3053.0, 1958.0, 1267.0, 861.0, 611.0, 413.0, 261.0, 200.0, 122.0, 96.0, 63.0, 43.0, 24.0, 20.0, 15.0, 11.0, 5.0, 5.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-0.94677734375, -0.9172210693359375, -0.887664794921875, -0.8581085205078125, -0.82855224609375, -0.7989959716796875, -0.769439697265625, -0.7398834228515625, -0.7103271484375, -0.6807708740234375, -0.651214599609375, -0.6216583251953125, -0.59210205078125, -0.5625457763671875, -0.532989501953125, -0.5034332275390625, -0.473876953125, -0.4443206787109375, -0.414764404296875, -0.3852081298828125, -0.35565185546875, -0.3260955810546875, -0.296539306640625, -0.2669830322265625, -0.2374267578125, -0.2078704833984375, -0.178314208984375, -0.1487579345703125, -0.11920166015625, -0.0896453857421875, -0.060089111328125, -0.0305328369140625, -0.0009765625, 0.0285797119140625, 0.058135986328125, 0.0876922607421875, 0.11724853515625, 0.1468048095703125, 0.176361083984375, 0.2059173583984375, 0.2354736328125, 0.2650299072265625, 0.294586181640625, 0.3241424560546875, 0.35369873046875, 0.3832550048828125, 0.412811279296875, 0.4423675537109375, 0.471923828125, 0.5014801025390625, 0.531036376953125, 0.5605926513671875, 0.59014892578125, 0.6197052001953125, 0.649261474609375, 0.6788177490234375, 0.7083740234375, 0.7379302978515625, 0.767486572265625, 0.7970428466796875, 0.82659912109375, 0.8561553955078125, 0.885711669921875, 0.9152679443359375, 0.94482421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 4.0, 3.0, 5.0, 13.0, 7.0, 10.0, 23.0, 21.0, 31.0, 48.0, 66.0, 87.0, 105.0, 110.0, 107.0, 101.0, 61.0, 53.0, 30.0, 21.0, 21.0, 8.0, 9.0, 11.0, 8.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0], "bins": [-0.0007848739624023438, -0.0007627904415130615, -0.0007407069206237793, -0.0007186233997344971, -0.0006965398788452148, -0.0006744563579559326, -0.0006523728370666504, -0.0006302893161773682, -0.0006082057952880859, -0.0005861222743988037, -0.0005640387535095215, -0.0005419552326202393, -0.000519871711730957, -0.0004977881908416748, -0.0004757046699523926, -0.00045362114906311035, -0.0004315376281738281, -0.0004094541072845459, -0.00038737058639526367, -0.00036528706550598145, -0.0003432035446166992, -0.000321120023727417, -0.00029903650283813477, -0.00027695298194885254, -0.0002548694610595703, -0.00023278594017028809, -0.00021070241928100586, -0.00018861889839172363, -0.0001665353775024414, -0.00014445185661315918, -0.00012236833572387695, -0.00010028481483459473, -7.82012939453125e-05, -5.6117773056030273e-05, -3.403425216674805e-05, -1.195073127746582e-05, 1.0132789611816406e-05, 3.221631050109863e-05, 5.429983139038086e-05, 7.638335227966309e-05, 9.846687316894531e-05, 0.00012055039405822754, 0.00014263391494750977, 0.000164717435836792, 0.00018680095672607422, 0.00020888447761535645, 0.00023096799850463867, 0.0002530515193939209, 0.0002751350402832031, 0.00029721856117248535, 0.0003193020820617676, 0.0003413856029510498, 0.00036346912384033203, 0.00038555264472961426, 0.0004076361656188965, 0.0004297196865081787, 0.00045180320739746094, 0.00047388672828674316, 0.0004959702491760254, 0.0005180537700653076, 0.0005401372909545898, 0.0005622208118438721, 0.0005843043327331543, 0.0006063878536224365, 0.0006284713745117188]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 3.0, 11.0, 11.0, 14.0, 16.0, 32.0, 35.0, 51.0, 103.0, 187.0, 334.0, 1194.0, 1043827.0, 1779.0, 418.0, 188.0, 121.0, 61.0, 33.0, 34.0, 23.0, 16.0, 14.0, 8.0, 7.0, 3.0, 7.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0153045654296875, -0.014749765396118164, -0.014194965362548828, -0.013640165328979492, -0.013085365295410156, -0.01253056526184082, -0.011975765228271484, -0.011420965194702148, -0.010866165161132812, -0.010311365127563477, -0.00975656509399414, -0.009201765060424805, -0.008646965026855469, -0.008092164993286133, -0.007537364959716797, -0.006982564926147461, -0.006427764892578125, -0.005872964859008789, -0.005318164825439453, -0.004763364791870117, -0.004208564758300781, -0.0036537647247314453, -0.0030989646911621094, -0.0025441646575927734, -0.0019893646240234375, -0.0014345645904541016, -0.0008797645568847656, -0.0003249645233154297, 0.00022983551025390625, 0.0007846355438232422, 0.0013394355773925781, 0.001894235610961914, 0.00244903564453125, 0.003003835678100586, 0.003558635711669922, 0.004113435745239258, 0.004668235778808594, 0.00522303581237793, 0.005777835845947266, 0.0063326358795166016, 0.0068874359130859375, 0.0074422359466552734, 0.00799703598022461, 0.008551836013793945, 0.009106636047363281, 0.009661436080932617, 0.010216236114501953, 0.010771036148071289, 0.011325836181640625, 0.011880636215209961, 0.012435436248779297, 0.012990236282348633, 0.013545036315917969, 0.014099836349487305, 0.01465463638305664, 0.015209436416625977, 0.015764236450195312, 0.01631903648376465, 0.016873836517333984, 0.01742863655090332, 0.017983436584472656, 0.018538236618041992, 0.019093036651611328, 0.019647836685180664, 0.02020263671875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 96.0, 481.0, 375.0, 53.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.001678246771916747, -0.0016487597022205591, -0.0016192725161090493, -0.0015897854464128613, -0.0015602983767166734, -0.0015308113070204854, -0.0015013241209089756, -0.0014718370512127876, -0.0014423499815165997, -0.0014128629118204117, -0.0013833757257089019, -0.001353888656012714, -0.001324401586316526, -0.001294914516620338, -0.0012654273305088282, -0.0012359402608126402, -0.0012064531911164522, -0.0011769661214202642, -0.0011474789353087544, -0.0011179918656125665, -0.0010885047959163785, -0.0010590177262201905, -0.0010295305401086807, -0.0010000434704124928, -0.0009705563425086439, -0.000941069214604795, -0.000911582144908607, -0.0008820950170047581, -0.0008526079473085701, -0.0008231208194047213, -0.0007936337497085333, -0.0007641466218046844, -0.0007346596103161573, -0.0007051724824123085, -0.0006756854127161205, -0.0006461982848122716, -0.0006167112151160836, -0.0005872240872122347, -0.0005577370175160468, -0.0005282498896121979, -0.0004987628199160099, -0.0004692757211159915, -0.00043978862231597304, -0.0004103015235159546, -0.0003808144247159362, -0.0003513272968120873, -0.0003218402271158993, -0.00029235309921205044, -0.00026286597130820155, -0.00023337887250818312, -0.0002038917737081647, -0.00017440467490814626, -0.00014491757610812783, -0.00011543046275619417, -8.594336395617574e-05, -5.6456265156157315e-05, -2.6969180908054113e-05, 2.51791971095372e-06, 3.200502032996155e-05, 6.149212276795879e-05, 9.097922156797722e-05, 0.00012046632764395326, 0.0001499534264439717, 0.00017944052524399012, 0.00020892762404400855]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 2.0, 6.0, 6.0, 8.0, 13.0, 11.0, 11.0, 16.0, 13.0, 21.0, 19.0, 27.0, 30.0, 38.0, 39.0, 21.0, 50.0, 42.0, 31.0, 38.0, 48.0, 49.0, 34.0, 41.0, 39.0, 33.0, 38.0, 41.0, 22.0, 34.0, 24.0, 15.0, 30.0, 25.0, 19.0, 14.0, 12.0, 11.0, 9.0, 8.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002929568290710449, -0.00028406083583831787, -0.0002751648426055908, -0.00026626884937286377, -0.0002573728561401367, -0.00024847686290740967, -0.00023958086967468262, -0.00023068487644195557, -0.00022178888320922852, -0.00021289288997650146, -0.00020399689674377441, -0.00019510090351104736, -0.0001862049102783203, -0.00017730891704559326, -0.0001684129238128662, -0.00015951693058013916, -0.0001506209373474121, -0.00014172494411468506, -0.000132828950881958, -0.00012393295764923096, -0.0001150369644165039, -0.00010614097118377686, -9.72449779510498e-05, -8.834898471832275e-05, -7.94529914855957e-05, -7.055699825286865e-05, -6.16610050201416e-05, -5.276501178741455e-05, -4.38690185546875e-05, -3.497302532196045e-05, -2.60770320892334e-05, -1.7181038856506348e-05, -8.285045623779297e-06, 6.109476089477539e-07, 9.506940841674805e-06, 1.8402934074401855e-05, 2.7298927307128906e-05, 3.619492053985596e-05, 4.509091377258301e-05, 5.398690700531006e-05, 6.288290023803711e-05, 7.177889347076416e-05, 8.067488670349121e-05, 8.957087993621826e-05, 9.846687316894531e-05, 0.00010736286640167236, 0.00011625885963439941, 0.00012515485286712646, 0.00013405084609985352, 0.00014294683933258057, 0.00015184283256530762, 0.00016073882579803467, 0.00016963481903076172, 0.00017853081226348877, 0.00018742680549621582, 0.00019632279872894287, 0.00020521879196166992, 0.00021411478519439697, 0.00022301077842712402, 0.00023190677165985107, 0.00024080276489257812, 0.0002496987581253052, 0.0002585947513580322, 0.0002674907445907593, 0.00027638673782348633]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 8.0, 11.0, 9.0, 13.0, 15.0, 13.0, 19.0, 17.0, 25.0, 23.0, 25.0, 31.0, 29.0, 27.0, 31.0, 42.0, 42.0, 30.0, 25.0, 42.0, 51.0, 34.0, 37.0, 38.0, 23.0, 37.0, 38.0, 22.0, 26.0, 27.0, 18.0, 30.0, 18.0, 19.0, 12.0, 15.0, 12.0, 15.0, 6.0, 7.0, 5.0, 5.0, 5.0, 4.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0], "bins": [-4.51953125, -4.38641357421875, -4.2532958984375, -4.12017822265625, -3.987060546875, -3.85394287109375, -3.7208251953125, -3.58770751953125, -3.45458984375, -3.32147216796875, -3.1883544921875, -3.05523681640625, -2.922119140625, -2.78900146484375, -2.6558837890625, -2.52276611328125, -2.3896484375, -2.25653076171875, -2.1234130859375, -1.99029541015625, -1.857177734375, -1.72406005859375, -1.5909423828125, -1.45782470703125, -1.32470703125, -1.19158935546875, -1.0584716796875, -0.92535400390625, -0.792236328125, -0.65911865234375, -0.5260009765625, -0.39288330078125, -0.259765625, -0.12664794921875, 0.0064697265625, 0.13958740234375, 0.272705078125, 0.40582275390625, 0.5389404296875, 0.67205810546875, 0.80517578125, 0.93829345703125, 1.0714111328125, 1.20452880859375, 1.337646484375, 1.47076416015625, 1.6038818359375, 1.73699951171875, 1.8701171875, 2.00323486328125, 2.1363525390625, 2.26947021484375, 2.402587890625, 2.53570556640625, 2.6688232421875, 2.80194091796875, 2.93505859375, 3.06817626953125, 3.2012939453125, 3.33441162109375, 3.467529296875, 3.60064697265625, 3.7337646484375, 3.86688232421875, 4.0]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 9.0, 6.0, 8.0, 14.0, 13.0, 19.0, 29.0, 42.0, 54.0, 54.0, 66.0, 112.0, 127.0, 196.0, 246.0, 351.0, 571.0, 837.0, 1496.0, 2775.0, 5878.0, 13930.0, 37931.0, 116816.0, 399621.0, 320241.0, 93030.0, 30970.0, 11770.0, 5076.0, 2426.0, 1256.0, 784.0, 501.0, 338.0, 264.0, 141.0, 134.0, 107.0, 63.0, 63.0, 44.0, 33.0, 29.0, 24.0, 20.0, 12.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-4.125, -3.9996337890625, -3.874267578125, -3.7489013671875, -3.62353515625, -3.4981689453125, -3.372802734375, -3.2474365234375, -3.1220703125, -2.9967041015625, -2.871337890625, -2.7459716796875, -2.62060546875, -2.4952392578125, -2.369873046875, -2.2445068359375, -2.119140625, -1.9937744140625, -1.868408203125, -1.7430419921875, -1.61767578125, -1.4923095703125, -1.366943359375, -1.2415771484375, -1.1162109375, -0.9908447265625, -0.865478515625, -0.7401123046875, -0.61474609375, -0.4893798828125, -0.364013671875, -0.2386474609375, -0.11328125, 0.0120849609375, 0.137451171875, 0.2628173828125, 0.38818359375, 0.5135498046875, 0.638916015625, 0.7642822265625, 0.8896484375, 1.0150146484375, 1.140380859375, 1.2657470703125, 1.39111328125, 1.5164794921875, 1.641845703125, 1.7672119140625, 1.892578125, 2.0179443359375, 2.143310546875, 2.2686767578125, 2.39404296875, 2.5194091796875, 2.644775390625, 2.7701416015625, 2.8955078125, 3.0208740234375, 3.146240234375, 3.2716064453125, 3.39697265625, 3.5223388671875, 3.647705078125, 3.7730712890625, 3.8984375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 5.0, 4.0, 11.0, 10.0, 23.0, 11.0, 16.0, 23.0, 23.0, 31.0, 36.0, 38.0, 44.0, 43.0, 35.0, 44.0, 67.0, 284.0, 1765.0, 98.0, 57.0, 35.0, 39.0, 49.0, 32.0, 41.0, 23.0, 28.0, 23.0, 15.0, 17.0, 15.0, 11.0, 11.0, 8.0, 5.0, 5.0, 7.0, 4.0, 1.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.421875, -16.864013671875, -16.30615234375, -15.748291015625, -15.1904296875, -14.632568359375, -14.07470703125, -13.516845703125, -12.958984375, -12.401123046875, -11.84326171875, -11.285400390625, -10.7275390625, -10.169677734375, -9.61181640625, -9.053955078125, -8.49609375, -7.938232421875, -7.38037109375, -6.822509765625, -6.2646484375, -5.706787109375, -5.14892578125, -4.591064453125, -4.033203125, -3.475341796875, -2.91748046875, -2.359619140625, -1.8017578125, -1.243896484375, -0.68603515625, -0.128173828125, 0.4296875, 0.987548828125, 1.54541015625, 2.103271484375, 2.6611328125, 3.218994140625, 3.77685546875, 4.334716796875, 4.892578125, 5.450439453125, 6.00830078125, 6.566162109375, 7.1240234375, 7.681884765625, 8.23974609375, 8.797607421875, 9.35546875, 9.913330078125, 10.47119140625, 11.029052734375, 11.5869140625, 12.144775390625, 12.70263671875, 13.260498046875, 13.818359375, 14.376220703125, 14.93408203125, 15.491943359375, 16.0498046875, 16.607666015625, 17.16552734375, 17.723388671875, 18.28125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 6.0, 10.0, 8.0, 14.0, 12.0, 18.0, 18.0, 22.0, 27.0, 38.0, 43.0, 60.0, 74.0, 131.0, 230.0, 582.0, 3464.0, 3113955.0, 25145.0, 966.0, 298.0, 150.0, 92.0, 66.0, 43.0, 46.0, 36.0, 24.0, 16.0, 21.0, 18.0, 15.0, 11.0, 12.0, 4.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.34375, -41.0478515625, -39.751953125, -38.4560546875, -37.16015625, -35.8642578125, -34.568359375, -33.2724609375, -31.9765625, -30.6806640625, -29.384765625, -28.0888671875, -26.79296875, -25.4970703125, -24.201171875, -22.9052734375, -21.609375, -20.3134765625, -19.017578125, -17.7216796875, -16.42578125, -15.1298828125, -13.833984375, -12.5380859375, -11.2421875, -9.9462890625, -8.650390625, -7.3544921875, -6.05859375, -4.7626953125, -3.466796875, -2.1708984375, -0.875, 0.4208984375, 1.716796875, 3.0126953125, 4.30859375, 5.6044921875, 6.900390625, 8.1962890625, 9.4921875, 10.7880859375, 12.083984375, 13.3798828125, 14.67578125, 15.9716796875, 17.267578125, 18.5634765625, 19.859375, 21.1552734375, 22.451171875, 23.7470703125, 25.04296875, 26.3388671875, 27.634765625, 28.9306640625, 30.2265625, 31.5224609375, 32.818359375, 34.1142578125, 35.41015625, 36.7060546875, 38.001953125, 39.2978515625, 40.59375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [4.0, 330.0, 671.0, 13.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.629512786865234, -3.53395676612854, -0.4384007453918457, 2.6571550369262695, 5.752711296081543, 8.848267555236816, 11.943822860717773, 15.039379119873047, 18.13493537902832, 21.230491638183594, 24.326047897338867, 27.42160415649414, 30.51715850830078, 33.61271667480469, 36.70827102661133, 39.80382537841797, 42.899383544921875, 45.994937896728516, 49.09049606323242, 52.18605041503906, 55.28160858154297, 58.37716293334961, 61.47271728515625, 64.56827545166016, 67.66383361816406, 70.75939178466797, 73.85494232177734, 76.95050048828125, 80.04605865478516, 83.14161682128906, 86.23716735839844, 89.33272552490234, 92.42827606201172, 95.52383422851562, 98.619384765625, 101.7149429321289, 104.81050109863281, 107.90605926513672, 111.0016098022461, 114.09716796875, 117.1927261352539, 120.28828430175781, 123.38383483886719, 126.4793930053711, 129.574951171875, 132.67050170898438, 135.7660675048828, 138.8616180419922, 141.95716857910156, 145.05271911621094, 148.14828491210938, 151.24383544921875, 154.33938598632812, 157.43495178222656, 160.53050231933594, 163.62606811523438, 166.72161865234375, 169.81716918945312, 172.91273498535156, 176.00828552246094, 179.1038360595703, 182.19940185546875, 185.29495239257812, 188.3905029296875, 191.48606872558594]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 12.0, 8.0, 12.0, 14.0, 21.0, 24.0, 26.0, 31.0, 23.0, 32.0, 27.0, 26.0, 33.0, 36.0, 30.0, 38.0, 44.0, 35.0, 55.0, 38.0, 32.0, 46.0, 35.0, 42.0, 40.0, 28.0, 23.0, 29.0, 24.0, 15.0, 11.0, 20.0, 19.0, 14.0, 9.0, 4.0, 8.0, 4.0, 7.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-59.70993423461914, -58.04661178588867, -56.3832893371582, -54.719966888427734, -53.05664825439453, -51.39332580566406, -49.730003356933594, -48.066680908203125, -46.403358459472656, -44.74003601074219, -43.07671356201172, -41.41339111328125, -39.75006866455078, -38.08674621582031, -36.42342758178711, -34.76010513305664, -33.09678268432617, -31.433460235595703, -29.770137786865234, -28.1068172454834, -26.44349479675293, -24.78017234802246, -23.116851806640625, -21.453529357910156, -19.790206909179688, -18.12688446044922, -16.46356201171875, -14.800241470336914, -13.136919021606445, -11.473596572875977, -9.810275077819824, -8.146953582763672, -6.4836273193359375, -4.820305347442627, -3.1569833755493164, -1.4936614036560059, 0.1696605682373047, 1.8329830169677734, 3.496304512023926, 5.159626007080078, 6.822948455810547, 8.486270904541016, 10.149592399597168, 11.81291389465332, 13.476236343383789, 15.139558792114258, 16.802879333496094, 18.466201782226562, 20.12952423095703, 21.7928466796875, 23.45616912841797, 25.119489669799805, 26.782812118530273, 28.446134567260742, 30.109455108642578, 31.772777557373047, 33.436100006103516, 35.099422454833984, 36.76274490356445, 38.42606735229492, 40.089385986328125, 41.752708435058594, 43.41603088378906, 45.07935333251953, 46.74267578125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 4.0, 7.0, 15.0, 6.0, 17.0, 10.0, 17.0, 25.0, 22.0, 22.0, 19.0, 32.0, 29.0, 31.0, 26.0, 39.0, 35.0, 37.0, 34.0, 36.0, 52.0, 33.0, 33.0, 35.0, 33.0, 40.0, 31.0, 24.0, 28.0, 24.0, 30.0, 24.0, 18.0, 17.0, 16.0, 21.0, 10.0, 8.0, 8.0, 12.0, 4.0, 3.0, 7.0, 7.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-4.55859375, -4.42181396484375, -4.2850341796875, -4.14825439453125, -4.011474609375, -3.87469482421875, -3.7379150390625, -3.60113525390625, -3.46435546875, -3.32757568359375, -3.1907958984375, -3.05401611328125, -2.917236328125, -2.78045654296875, -2.6436767578125, -2.50689697265625, -2.3701171875, -2.23333740234375, -2.0965576171875, -1.95977783203125, -1.822998046875, -1.68621826171875, -1.5494384765625, -1.41265869140625, -1.27587890625, -1.13909912109375, -1.0023193359375, -0.86553955078125, -0.728759765625, -0.59197998046875, -0.4552001953125, -0.31842041015625, -0.181640625, -0.04486083984375, 0.0919189453125, 0.22869873046875, 0.365478515625, 0.50225830078125, 0.6390380859375, 0.77581787109375, 0.91259765625, 1.04937744140625, 1.1861572265625, 1.32293701171875, 1.459716796875, 1.59649658203125, 1.7332763671875, 1.87005615234375, 2.0068359375, 2.14361572265625, 2.2803955078125, 2.41717529296875, 2.553955078125, 2.69073486328125, 2.8275146484375, 2.96429443359375, 3.10107421875, 3.23785400390625, 3.3746337890625, 3.51141357421875, 3.648193359375, 3.78497314453125, 3.9217529296875, 4.05853271484375, 4.1953125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 2.0, 7.0, 6.0, 7.0, 16.0, 16.0, 20.0, 39.0, 48.0, 39.0, 52.0, 97.0, 157.0, 232.0, 531.0, 1713.0, 15035.0, 458376.0, 3318286.0, 383915.0, 12839.0, 1610.0, 461.0, 256.0, 146.0, 103.0, 69.0, 39.0, 33.0, 24.0, 19.0, 16.0, 16.0, 10.0, 12.0, 10.0, 5.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.171875, -17.6123046875, -17.052734375, -16.4931640625, -15.93359375, -15.3740234375, -14.814453125, -14.2548828125, -13.6953125, -13.1357421875, -12.576171875, -12.0166015625, -11.45703125, -10.8974609375, -10.337890625, -9.7783203125, -9.21875, -8.6591796875, -8.099609375, -7.5400390625, -6.98046875, -6.4208984375, -5.861328125, -5.3017578125, -4.7421875, -4.1826171875, -3.623046875, -3.0634765625, -2.50390625, -1.9443359375, -1.384765625, -0.8251953125, -0.265625, 0.2939453125, 0.853515625, 1.4130859375, 1.97265625, 2.5322265625, 3.091796875, 3.6513671875, 4.2109375, 4.7705078125, 5.330078125, 5.8896484375, 6.44921875, 7.0087890625, 7.568359375, 8.1279296875, 8.6875, 9.2470703125, 9.806640625, 10.3662109375, 10.92578125, 11.4853515625, 12.044921875, 12.6044921875, 13.1640625, 13.7236328125, 14.283203125, 14.8427734375, 15.40234375, 15.9619140625, 16.521484375, 17.0810546875, 17.640625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 15.0, 17.0, 32.0, 38.0, 48.0, 88.0, 129.0, 188.0, 241.0, 387.0, 539.0, 607.0, 535.0, 352.0, 286.0, 188.0, 130.0, 65.0, 51.0, 38.0, 18.0, 17.0, 21.0, 12.0, 6.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.21875, -22.58154296875, -21.9443359375, -21.30712890625, -20.669921875, -20.03271484375, -19.3955078125, -18.75830078125, -18.12109375, -17.48388671875, -16.8466796875, -16.20947265625, -15.572265625, -14.93505859375, -14.2978515625, -13.66064453125, -13.0234375, -12.38623046875, -11.7490234375, -11.11181640625, -10.474609375, -9.83740234375, -9.2001953125, -8.56298828125, -7.92578125, -7.28857421875, -6.6513671875, -6.01416015625, -5.376953125, -4.73974609375, -4.1025390625, -3.46533203125, -2.828125, -2.19091796875, -1.5537109375, -0.91650390625, -0.279296875, 0.35791015625, 0.9951171875, 1.63232421875, 2.26953125, 2.90673828125, 3.5439453125, 4.18115234375, 4.818359375, 5.45556640625, 6.0927734375, 6.72998046875, 7.3671875, 8.00439453125, 8.6416015625, 9.27880859375, 9.916015625, 10.55322265625, 11.1904296875, 11.82763671875, 12.46484375, 13.10205078125, 13.7392578125, 14.37646484375, 15.013671875, 15.65087890625, 16.2880859375, 16.92529296875, 17.5625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 9.0, 7.0, 13.0, 25.0, 35.0, 37.0, 57.0, 85.0, 118.0, 162.0, 279.0, 584.0, 2937.0, 940186.0, 3243238.0, 4921.0, 694.0, 318.0, 187.0, 115.0, 83.0, 47.0, 50.0, 27.0, 14.0, 16.0, 7.0, 6.0, 10.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.21875, -61.04541015625, -58.8720703125, -56.69873046875, -54.525390625, -52.35205078125, -50.1787109375, -48.00537109375, -45.83203125, -43.65869140625, -41.4853515625, -39.31201171875, -37.138671875, -34.96533203125, -32.7919921875, -30.61865234375, -28.4453125, -26.27197265625, -24.0986328125, -21.92529296875, -19.751953125, -17.57861328125, -15.4052734375, -13.23193359375, -11.05859375, -8.88525390625, -6.7119140625, -4.53857421875, -2.365234375, -0.19189453125, 1.9814453125, 4.15478515625, 6.328125, 8.50146484375, 10.6748046875, 12.84814453125, 15.021484375, 17.19482421875, 19.3681640625, 21.54150390625, 23.71484375, 25.88818359375, 28.0615234375, 30.23486328125, 32.408203125, 34.58154296875, 36.7548828125, 38.92822265625, 41.1015625, 43.27490234375, 45.4482421875, 47.62158203125, 49.794921875, 51.96826171875, 54.1416015625, 56.31494140625, 58.48828125, 60.66162109375, 62.8349609375, 65.00830078125, 67.181640625, 69.35498046875, 71.5283203125, 73.70166015625, 75.875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 22.0, 46.0, 104.0, 196.0, 259.0, 212.0, 105.0, 52.0, 13.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.79904556274414, -21.876253128051758, -18.953460693359375, -16.030670166015625, -13.107877731323242, -10.18508529663086, -7.262294769287109, -4.339502334594727, -1.4167098999023438, 1.5060820579528809, 4.4288740158081055, 7.351665496826172, 10.274457931518555, 13.197250366210938, 16.120040893554688, 19.04283332824707, 21.965625762939453, 24.888418197631836, 27.81121063232422, 30.73400115966797, 33.65679168701172, 36.579586029052734, 39.502376556396484, 42.4251708984375, 45.34796142578125, 48.270751953125, 51.193546295166016, 54.116336822509766, 57.03913116455078, 59.96192169189453, 62.88471221923828, 65.80750274658203, 68.73030090332031, 71.65309143066406, 74.57588195800781, 77.49867248535156, 80.42147064208984, 83.3442611694336, 86.26705169677734, 89.1898422241211, 92.11264038085938, 95.03543090820312, 97.95822143554688, 100.88101196289062, 103.8038101196289, 106.72660064697266, 109.6493911743164, 112.57218170166016, 115.4949722290039, 118.41776275634766, 121.3405532836914, 124.26335144042969, 127.18614196777344, 130.1089324951172, 133.03172302246094, 135.9545135498047, 138.87730407714844, 141.8000946044922, 144.72288513183594, 147.6456756591797, 150.56846618652344, 153.49127197265625, 156.4140625, 159.33685302734375, 162.2596435546875]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 10.0, 5.0, 9.0, 11.0, 11.0, 12.0, 20.0, 19.0, 18.0, 30.0, 23.0, 29.0, 32.0, 31.0, 42.0, 39.0, 40.0, 37.0, 43.0, 49.0, 39.0, 55.0, 44.0, 33.0, 44.0, 27.0, 34.0, 24.0, 23.0, 28.0, 20.0, 14.0, 21.0, 14.0, 8.0, 11.0, 14.0, 9.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-52.273338317871094, -50.668548583984375, -49.063758850097656, -47.45896911621094, -45.85417938232422, -44.2493896484375, -42.64460372924805, -41.03981399536133, -39.43502426147461, -37.83023452758789, -36.22544479370117, -34.62065505981445, -33.015869140625, -31.41107749938965, -29.806289672851562, -28.201499938964844, -26.596710205078125, -24.991920471191406, -23.387130737304688, -21.7823429107666, -20.177553176879883, -18.572763442993164, -16.967975616455078, -15.36318588256836, -13.75839614868164, -12.153606414794922, -10.54881763458252, -8.944028854370117, -7.339239120483398, -5.73444938659668, -4.129660606384277, -2.524871826171875, -0.9200859069824219, 0.6847033500671387, 2.289492607116699, 3.8942818641662598, 5.49907112121582, 7.103860855102539, 8.708649635314941, 10.313438415527344, 11.918228149414062, 13.523017883300781, 15.127806663513184, 16.732595443725586, 18.337385177612305, 19.942174911499023, 21.54696273803711, 23.151752471923828, 24.756542205810547, 26.361331939697266, 27.966121673583984, 29.57090950012207, 31.17569923400879, 32.780487060546875, 34.385276794433594, 35.99006652832031, 37.59485626220703, 39.19964599609375, 40.80443572998047, 42.40922546386719, 44.014015197753906, 45.618804931640625, 47.22359085083008, 48.8283805847168, 50.433170318603516]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 11.0, 4.0, 9.0, 11.0, 10.0, 12.0, 19.0, 22.0, 14.0, 20.0, 28.0, 25.0, 32.0, 30.0, 25.0, 39.0, 25.0, 34.0, 49.0, 34.0, 47.0, 32.0, 44.0, 39.0, 43.0, 40.0, 40.0, 29.0, 23.0, 24.0, 18.0, 25.0, 26.0, 18.0, 16.0, 9.0, 14.0, 11.0, 11.0, 9.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.82421875, -4.67730712890625, -4.5303955078125, -4.38348388671875, -4.236572265625, -4.08966064453125, -3.9427490234375, -3.79583740234375, -3.64892578125, -3.50201416015625, -3.3551025390625, -3.20819091796875, -3.061279296875, -2.91436767578125, -2.7674560546875, -2.62054443359375, -2.4736328125, -2.32672119140625, -2.1798095703125, -2.03289794921875, -1.885986328125, -1.73907470703125, -1.5921630859375, -1.44525146484375, -1.29833984375, -1.15142822265625, -1.0045166015625, -0.85760498046875, -0.710693359375, -0.56378173828125, -0.4168701171875, -0.26995849609375, -0.123046875, 0.02386474609375, 0.1707763671875, 0.31768798828125, 0.464599609375, 0.61151123046875, 0.7584228515625, 0.90533447265625, 1.05224609375, 1.19915771484375, 1.3460693359375, 1.49298095703125, 1.639892578125, 1.78680419921875, 1.9337158203125, 2.08062744140625, 2.2275390625, 2.37445068359375, 2.5213623046875, 2.66827392578125, 2.815185546875, 2.96209716796875, 3.1090087890625, 3.25592041015625, 3.40283203125, 3.54974365234375, 3.6966552734375, 3.84356689453125, 3.990478515625, 4.13739013671875, 4.2843017578125, 4.43121337890625, 4.578125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 17.0, 21.0, 20.0, 37.0, 59.0, 88.0, 135.0, 212.0, 282.0, 382.0, 624.0, 793.0, 1174.0, 1761.0, 2551.0, 3530.0, 5276.0, 7779.0, 11223.0, 16579.0, 25028.0, 38665.0, 60813.0, 105012.0, 244997.0, 241482.0, 103737.0, 60476.0, 38355.0, 24893.0, 16857.0, 11175.0, 7524.0, 5242.0, 3705.0, 2480.0, 1743.0, 1179.0, 832.0, 557.0, 405.0, 259.0, 188.0, 123.0, 84.0, 73.0, 39.0, 33.0, 16.0, 12.0, 12.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.0224609375, -0.989471435546875, -0.95648193359375, -0.923492431640625, -0.8905029296875, -0.857513427734375, -0.82452392578125, -0.791534423828125, -0.758544921875, -0.725555419921875, -0.69256591796875, -0.659576416015625, -0.6265869140625, -0.593597412109375, -0.56060791015625, -0.527618408203125, -0.49462890625, -0.461639404296875, -0.42864990234375, -0.395660400390625, -0.3626708984375, -0.329681396484375, -0.29669189453125, -0.263702392578125, -0.230712890625, -0.197723388671875, -0.16473388671875, -0.131744384765625, -0.0987548828125, -0.065765380859375, -0.03277587890625, 0.000213623046875, 0.033203125, 0.066192626953125, 0.09918212890625, 0.132171630859375, 0.1651611328125, 0.198150634765625, 0.23114013671875, 0.264129638671875, 0.297119140625, 0.330108642578125, 0.36309814453125, 0.396087646484375, 0.4290771484375, 0.462066650390625, 0.49505615234375, 0.528045654296875, 0.56103515625, 0.594024658203125, 0.62701416015625, 0.660003662109375, 0.6929931640625, 0.725982666015625, 0.75897216796875, 0.791961669921875, 0.824951171875, 0.857940673828125, 0.89093017578125, 0.923919677734375, 0.9569091796875, 0.989898681640625, 1.02288818359375, 1.055877685546875, 1.0888671875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 9.0, 15.0, 14.0, 18.0, 28.0, 17.0, 21.0, 27.0, 31.0, 42.0, 29.0, 33.0, 27.0, 39.0, 38.0, 45.0, 37.0, 1061.0, 43.0, 37.0, 38.0, 40.0, 34.0, 39.0, 33.0, 24.0, 24.0, 26.0, 18.0, 24.0, 14.0, 14.0, 15.0, 11.0, 9.0, 7.0, 7.0, 9.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.95703125, -2.858673095703125, -2.76031494140625, -2.661956787109375, -2.5635986328125, -2.465240478515625, -2.36688232421875, -2.268524169921875, -2.170166015625, -2.071807861328125, -1.97344970703125, -1.875091552734375, -1.7767333984375, -1.678375244140625, -1.58001708984375, -1.481658935546875, -1.38330078125, -1.284942626953125, -1.18658447265625, -1.088226318359375, -0.9898681640625, -0.891510009765625, -0.79315185546875, -0.694793701171875, -0.596435546875, -0.498077392578125, -0.39971923828125, -0.301361083984375, -0.2030029296875, -0.104644775390625, -0.00628662109375, 0.092071533203125, 0.1904296875, 0.288787841796875, 0.38714599609375, 0.485504150390625, 0.5838623046875, 0.682220458984375, 0.78057861328125, 0.878936767578125, 0.977294921875, 1.075653076171875, 1.17401123046875, 1.272369384765625, 1.3707275390625, 1.469085693359375, 1.56744384765625, 1.665802001953125, 1.76416015625, 1.862518310546875, 1.96087646484375, 2.059234619140625, 2.1575927734375, 2.255950927734375, 2.35430908203125, 2.452667236328125, 2.551025390625, 2.649383544921875, 2.74774169921875, 2.846099853515625, 2.9444580078125, 3.042816162109375, 3.14117431640625, 3.239532470703125, 3.337890625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 10.0, 12.0, 21.0, 31.0, 56.0, 76.0, 131.0, 184.0, 277.0, 407.0, 668.0, 952.0, 1464.0, 2195.0, 3398.0, 5116.0, 7895.0, 11921.0, 18364.0, 28516.0, 44186.0, 71363.0, 124419.0, 1327616.0, 190987.0, 95534.0, 57748.0, 36102.0, 23452.0, 15267.0, 10051.0, 6531.0, 4313.0, 2782.0, 1770.0, 1165.0, 721.0, 461.0, 323.0, 216.0, 155.0, 99.0, 66.0, 42.0, 24.0, 18.0, 10.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9873046875, -0.95623779296875, -0.9251708984375, -0.89410400390625, -0.863037109375, -0.83197021484375, -0.8009033203125, -0.76983642578125, -0.73876953125, -0.70770263671875, -0.6766357421875, -0.64556884765625, -0.614501953125, -0.58343505859375, -0.5523681640625, -0.52130126953125, -0.490234375, -0.45916748046875, -0.4281005859375, -0.39703369140625, -0.365966796875, -0.33489990234375, -0.3038330078125, -0.27276611328125, -0.24169921875, -0.21063232421875, -0.1795654296875, -0.14849853515625, -0.117431640625, -0.08636474609375, -0.0552978515625, -0.02423095703125, 0.0068359375, 0.03790283203125, 0.0689697265625, 0.10003662109375, 0.131103515625, 0.16217041015625, 0.1932373046875, 0.22430419921875, 0.25537109375, 0.28643798828125, 0.3175048828125, 0.34857177734375, 0.379638671875, 0.41070556640625, 0.4417724609375, 0.47283935546875, 0.50390625, 0.53497314453125, 0.5660400390625, 0.59710693359375, 0.628173828125, 0.65924072265625, 0.6903076171875, 0.72137451171875, 0.75244140625, 0.78350830078125, 0.8145751953125, 0.84564208984375, 0.876708984375, 0.90777587890625, 0.9388427734375, 0.96990966796875, 1.0009765625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 0.0, 11.0, 3.0, 8.0, 10.0, 8.0, 14.0, 16.0, 21.0, 19.0, 19.0, 40.0, 54.0, 61.0, 103.0, 128.0, 116.0, 75.0, 65.0, 37.0, 37.0, 32.0, 20.0, 19.0, 15.0, 14.0, 11.0, 10.0, 5.0, 9.0, 4.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0009493827819824219, -0.00092296302318573, -0.0008965432643890381, -0.0008701235055923462, -0.0008437037467956543, -0.0008172839879989624, -0.0007908642292022705, -0.0007644444704055786, -0.0007380247116088867, -0.0007116049528121948, -0.0006851851940155029, -0.000658765435218811, -0.0006323456764221191, -0.0006059259176254272, -0.0005795061588287354, -0.0005530864000320435, -0.0005266666412353516, -0.0005002468824386597, -0.0004738271236419678, -0.0004474073648452759, -0.000420987606048584, -0.0003945678472518921, -0.0003681480884552002, -0.0003417283296585083, -0.0003153085708618164, -0.0002888888120651245, -0.0002624690532684326, -0.00023604929447174072, -0.00020962953567504883, -0.00018320977687835693, -0.00015679001808166504, -0.00013037025928497314, -0.00010395050048828125, -7.753074169158936e-05, -5.111098289489746e-05, -2.4691224098205566e-05, 1.7285346984863281e-06, 2.8148293495178223e-05, 5.456805229187012e-05, 8.098781108856201e-05, 0.0001074075698852539, 0.0001338273286819458, 0.0001602470874786377, 0.0001866668462753296, 0.00021308660507202148, 0.00023950636386871338, 0.0002659261226654053, 0.00029234588146209717, 0.00031876564025878906, 0.00034518539905548096, 0.00037160515785217285, 0.00039802491664886475, 0.00042444467544555664, 0.00045086443424224854, 0.00047728419303894043, 0.0005037039518356323, 0.0005301237106323242, 0.0005565434694290161, 0.000582963228225708, 0.0006093829870223999, 0.0006358027458190918, 0.0006622225046157837, 0.0006886422634124756, 0.0007150620222091675, 0.0007414817810058594]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 9.0, 13.0, 19.0, 28.0, 29.0, 30.0, 54.0, 68.0, 108.0, 198.0, 448.0, 54137.0, 992083.0, 605.0, 261.0, 125.0, 98.0, 48.0, 41.0, 39.0, 22.0, 12.0, 11.0, 20.0, 9.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017120361328125, -0.0164644718170166, -0.015808582305908203, -0.015152692794799805, -0.014496803283691406, -0.013840913772583008, -0.01318502426147461, -0.012529134750366211, -0.011873245239257812, -0.011217355728149414, -0.010561466217041016, -0.009905576705932617, -0.009249687194824219, -0.00859379768371582, -0.007937908172607422, -0.0072820186614990234, -0.006626129150390625, -0.0059702396392822266, -0.005314350128173828, -0.00465846061706543, -0.004002571105957031, -0.003346681594848633, -0.0026907920837402344, -0.002034902572631836, -0.0013790130615234375, -0.0007231235504150391, -6.723403930664062e-05, 0.0005886554718017578, 0.0012445449829101562, 0.0019004344940185547, 0.002556324005126953, 0.0032122135162353516, 0.00386810302734375, 0.0045239925384521484, 0.005179882049560547, 0.005835771560668945, 0.006491661071777344, 0.007147550582885742, 0.007803440093994141, 0.008459329605102539, 0.009115219116210938, 0.009771108627319336, 0.010426998138427734, 0.011082887649536133, 0.011738777160644531, 0.01239466667175293, 0.013050556182861328, 0.013706445693969727, 0.014362335205078125, 0.015018224716186523, 0.015674114227294922, 0.01633000373840332, 0.01698589324951172, 0.017641782760620117, 0.018297672271728516, 0.018953561782836914, 0.019609451293945312, 0.02026534080505371, 0.02092123031616211, 0.021577119827270508, 0.022233009338378906, 0.022888898849487305, 0.023544788360595703, 0.0242006778717041, 0.0248565673828125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 37.0, 322.0, 546.0, 98.0, 9.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014350657584145665, -0.0013943292433395982, -0.0013535927282646298, -0.0013128562131896615, -0.0012721196981146932, -0.0012313831830397248, -0.0011906466679647565, -0.0011499101528897882, -0.0011091736378148198, -0.0010684371227398515, -0.0010277006076648831, -0.0009869640925899148, -0.0009462275775149465, -0.0009054910624399781, -0.0008647545473650098, -0.0008240180322900414, -0.0007832814590074122, -0.0007425449439324439, -0.0007018084288574755, -0.0006610719137825072, -0.0006203353987075388, -0.0005795988836325705, -0.0005388623103499413, -0.0004981257952749729, -0.00045738930930383503, -0.0004166527942288667, -0.00037591627915389836, -0.00033517973497509956, -0.0002944432199001312, -0.0002537067048251629, -0.00021297018975019455, -0.0001722336746752262, -0.00013149715960025787, -9.076064452528954e-05, -5.002412217436358e-05, -9.287599823437631e-06, 3.144891525153071e-05, 7.218543032649904e-05, 0.00011292195995338261, 0.00015365847502835095, 0.0001943949901033193, 0.00023513150517828763, 0.00027586802025325596, 0.00031660456443205476, 0.0003573410795070231, 0.00039807759458199143, 0.00043881410965695977, 0.0004795506247319281, 0.0005202871398068964, 0.0005610236548818648, 0.0006017601699568331, 0.0006424966850318015, 0.0006832332001067698, 0.0007239697151817381, 0.0007647062884643674, 0.0008054428035393357, 0.0008461793186143041, 0.0008869158336892724, 0.0009276523487642407, 0.0009683888638392091, 0.0010091253789141774, 0.0010498618939891458, 0.001090598409064114, 0.0011313349241390824, 0.0011720714392140508]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 2.0, 11.0, 8.0, 11.0, 13.0, 23.0, 27.0, 27.0, 25.0, 21.0, 24.0, 31.0, 34.0, 37.0, 40.0, 35.0, 30.0, 46.0, 30.0, 36.0, 53.0, 42.0, 32.0, 33.0, 26.0, 30.0, 45.0, 25.0, 29.0, 25.0, 20.0, 18.0, 23.0, 12.0, 16.0, 7.0, 7.0, 10.0, 8.0, 9.0, 4.0, 4.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003237128257751465, -0.00031276140362024307, -0.00030180998146533966, -0.00029085855931043625, -0.00027990713715553284, -0.0002689557150006294, -0.000258004292845726, -0.0002470528706908226, -0.0002361014485359192, -0.00022515002638101578, -0.00021419860422611237, -0.00020324718207120895, -0.00019229575991630554, -0.00018134433776140213, -0.00017039291560649872, -0.0001594414934515953, -0.0001484900712966919, -0.00013753864914178848, -0.00012658722698688507, -0.00011563580483198166, -0.00010468438267707825, -9.373296052217484e-05, -8.278153836727142e-05, -7.183011621236801e-05, -6.08786940574646e-05, -4.992727190256119e-05, -3.8975849747657776e-05, -2.8024427592754364e-05, -1.7073005437850952e-05, -6.12158328294754e-06, 4.829838871955872e-06, 1.5781261026859283e-05, 2.6732683181762695e-05, 3.768410533666611e-05, 4.863552749156952e-05, 5.958694964647293e-05, 7.053837180137634e-05, 8.148979395627975e-05, 9.244121611118317e-05, 0.00010339263826608658, 0.00011434406042098999, 0.0001252954825758934, 0.00013624690473079681, 0.00014719832688570023, 0.00015814974904060364, 0.00016910117119550705, 0.00018005259335041046, 0.00019100401550531387, 0.00020195543766021729, 0.0002129068598151207, 0.0002238582819700241, 0.00023480970412492752, 0.00024576112627983093, 0.00025671254843473434, 0.00026766397058963776, 0.00027861539274454117, 0.0002895668148994446, 0.000300518237054348, 0.0003114696592092514, 0.0003224210813641548, 0.00033337250351905823, 0.00034432392567396164, 0.00035527534782886505, 0.00036622676998376846, 0.0003771781921386719]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 11.0, 4.0, 9.0, 11.0, 10.0, 12.0, 19.0, 22.0, 14.0, 20.0, 28.0, 25.0, 32.0, 30.0, 25.0, 39.0, 25.0, 34.0, 49.0, 34.0, 47.0, 32.0, 44.0, 39.0, 43.0, 40.0, 40.0, 29.0, 23.0, 24.0, 18.0, 25.0, 26.0, 18.0, 16.0, 9.0, 14.0, 11.0, 11.0, 9.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.82421875, -4.67730712890625, -4.5303955078125, -4.38348388671875, -4.236572265625, -4.08966064453125, -3.9427490234375, -3.79583740234375, -3.64892578125, -3.50201416015625, -3.3551025390625, -3.20819091796875, -3.061279296875, -2.91436767578125, -2.7674560546875, -2.62054443359375, -2.4736328125, -2.32672119140625, -2.1798095703125, -2.03289794921875, -1.885986328125, -1.73907470703125, -1.5921630859375, -1.44525146484375, -1.29833984375, -1.15142822265625, -1.0045166015625, -0.85760498046875, -0.710693359375, -0.56378173828125, -0.4168701171875, -0.26995849609375, -0.123046875, 0.02386474609375, 0.1707763671875, 0.31768798828125, 0.464599609375, 0.61151123046875, 0.7584228515625, 0.90533447265625, 1.05224609375, 1.19915771484375, 1.3460693359375, 1.49298095703125, 1.639892578125, 1.78680419921875, 1.9337158203125, 2.08062744140625, 2.2275390625, 2.37445068359375, 2.5213623046875, 2.66827392578125, 2.815185546875, 2.96209716796875, 3.1090087890625, 3.25592041015625, 3.40283203125, 3.54974365234375, 3.6966552734375, 3.84356689453125, 3.990478515625, 4.13739013671875, 4.2843017578125, 4.43121337890625, 4.578125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 8.0, 20.0, 21.0, 32.0, 37.0, 51.0, 66.0, 102.0, 145.0, 201.0, 310.0, 494.0, 700.0, 1127.0, 1915.0, 3563.0, 6827.0, 14312.0, 31666.0, 78164.0, 214233.0, 424035.0, 159738.0, 60668.0, 25274.0, 11461.0, 5741.0, 2971.0, 1635.0, 1010.0, 626.0, 418.0, 282.0, 217.0, 134.0, 93.0, 67.0, 49.0, 38.0, 29.0, 11.0, 17.0, 11.0, 9.0, 3.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.20703125, -3.107940673828125, -3.00885009765625, -2.909759521484375, -2.8106689453125, -2.711578369140625, -2.61248779296875, -2.513397216796875, -2.414306640625, -2.315216064453125, -2.21612548828125, -2.117034912109375, -2.0179443359375, -1.918853759765625, -1.81976318359375, -1.720672607421875, -1.62158203125, -1.522491455078125, -1.42340087890625, -1.324310302734375, -1.2252197265625, -1.126129150390625, -1.02703857421875, -0.927947998046875, -0.828857421875, -0.729766845703125, -0.63067626953125, -0.531585693359375, -0.4324951171875, -0.333404541015625, -0.23431396484375, -0.135223388671875, -0.0361328125, 0.062957763671875, 0.16204833984375, 0.261138916015625, 0.3602294921875, 0.459320068359375, 0.55841064453125, 0.657501220703125, 0.756591796875, 0.855682373046875, 0.95477294921875, 1.053863525390625, 1.1529541015625, 1.252044677734375, 1.35113525390625, 1.450225830078125, 1.54931640625, 1.648406982421875, 1.74749755859375, 1.846588134765625, 1.9456787109375, 2.044769287109375, 2.14385986328125, 2.242950439453125, 2.342041015625, 2.441131591796875, 2.54022216796875, 2.639312744140625, 2.7384033203125, 2.837493896484375, 2.93658447265625, 3.035675048828125, 3.134765625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 1.0, 4.0, 6.0, 11.0, 11.0, 14.0, 12.0, 18.0, 19.0, 31.0, 40.0, 24.0, 27.0, 34.0, 36.0, 32.0, 47.0, 45.0, 73.0, 348.0, 1686.0, 87.0, 50.0, 46.0, 35.0, 41.0, 35.0, 36.0, 29.0, 33.0, 21.0, 23.0, 20.0, 15.0, 11.0, 12.0, 7.0, 2.0, 5.0, 8.0, 5.0, 1.0, 5.0, 2.0, 1.0], "bins": [-23.1875, -22.594970703125, -22.00244140625, -21.409912109375, -20.8173828125, -20.224853515625, -19.63232421875, -19.039794921875, -18.447265625, -17.854736328125, -17.26220703125, -16.669677734375, -16.0771484375, -15.484619140625, -14.89208984375, -14.299560546875, -13.70703125, -13.114501953125, -12.52197265625, -11.929443359375, -11.3369140625, -10.744384765625, -10.15185546875, -9.559326171875, -8.966796875, -8.374267578125, -7.78173828125, -7.189208984375, -6.5966796875, -6.004150390625, -5.41162109375, -4.819091796875, -4.2265625, -3.634033203125, -3.04150390625, -2.448974609375, -1.8564453125, -1.263916015625, -0.67138671875, -0.078857421875, 0.513671875, 1.106201171875, 1.69873046875, 2.291259765625, 2.8837890625, 3.476318359375, 4.06884765625, 4.661376953125, 5.25390625, 5.846435546875, 6.43896484375, 7.031494140625, 7.6240234375, 8.216552734375, 8.80908203125, 9.401611328125, 9.994140625, 10.586669921875, 11.17919921875, 11.771728515625, 12.3642578125, 12.956787109375, 13.54931640625, 14.141845703125, 14.734375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 3.0, 7.0, 4.0, 3.0, 7.0, 10.0, 7.0, 16.0, 17.0, 22.0, 20.0, 33.0, 23.0, 32.0, 49.0, 71.0, 87.0, 162.0, 309.0, 668.0, 3182.0, 719836.0, 2415300.0, 4184.0, 681.0, 340.0, 176.0, 97.0, 60.0, 54.0, 41.0, 39.0, 43.0, 17.0, 25.0, 14.0, 11.0, 16.0, 9.0, 13.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.056884765625, -22.09814453125, -21.139404296875, -20.1806640625, -19.221923828125, -18.26318359375, -17.304443359375, -16.345703125, -15.386962890625, -14.42822265625, -13.469482421875, -12.5107421875, -11.552001953125, -10.59326171875, -9.634521484375, -8.67578125, -7.717041015625, -6.75830078125, -5.799560546875, -4.8408203125, -3.882080078125, -2.92333984375, -1.964599609375, -1.005859375, -0.047119140625, 0.91162109375, 1.870361328125, 2.8291015625, 3.787841796875, 4.74658203125, 5.705322265625, 6.6640625, 7.622802734375, 8.58154296875, 9.540283203125, 10.4990234375, 11.457763671875, 12.41650390625, 13.375244140625, 14.333984375, 15.292724609375, 16.25146484375, 17.210205078125, 18.1689453125, 19.127685546875, 20.08642578125, 21.045166015625, 22.00390625, 22.962646484375, 23.92138671875, 24.880126953125, 25.8388671875, 26.797607421875, 27.75634765625, 28.715087890625, 29.673828125, 30.632568359375, 31.59130859375, 32.550048828125, 33.5087890625, 34.467529296875, 35.42626953125, 36.385009765625, 37.34375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 23.0, 120.0, 352.0, 357.0, 130.0, 25.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.105545997619629, -8.664589881896973, -7.223633766174316, -5.782677173614502, -4.341721057891846, -2.9007649421691895, -1.459808349609375, -0.01885223388671875, 1.4221038818359375, 2.8630599975585938, 4.30401611328125, 5.7449727058410645, 7.185928821563721, 8.626884460449219, 10.067841529846191, 11.508797645568848, 12.949753761291504, 14.39070987701416, 15.831665992736816, 17.27262306213379, 18.713579177856445, 20.1545352935791, 21.595491409301758, 23.036447525024414, 24.47740364074707, 25.918359756469727, 27.359315872192383, 28.80027198791504, 30.241228103637695, 31.68218421936035, 33.12314224243164, 34.5640983581543, 36.00505447387695, 37.44601058959961, 38.886966705322266, 40.32792282104492, 41.76887893676758, 43.209835052490234, 44.65079116821289, 46.09174728393555, 47.5327033996582, 48.97365951538086, 50.414615631103516, 51.85557174682617, 53.29652786254883, 54.737483978271484, 56.17844009399414, 57.6193962097168, 59.06035614013672, 60.501312255859375, 61.94226837158203, 63.38322448730469, 64.82418060302734, 66.26513671875, 67.70609283447266, 69.14704895019531, 70.58800506591797, 72.02896118164062, 73.46991729736328, 74.91087341308594, 76.3518295288086, 77.79278564453125, 79.2337417602539, 80.67469787597656, 82.11565399169922]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 9.0, 11.0, 11.0, 24.0, 17.0, 17.0, 19.0, 24.0, 21.0, 32.0, 37.0, 36.0, 39.0, 28.0, 30.0, 51.0, 33.0, 49.0, 46.0, 38.0, 27.0, 32.0, 38.0, 49.0, 40.0, 30.0, 20.0, 25.0, 20.0, 18.0, 17.0, 19.0, 14.0, 10.0, 10.0, 9.0, 10.0, 12.0, 2.0, 5.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.206199645996094, -53.41696548461914, -51.62772750854492, -49.83849334716797, -48.049259185791016, -46.26002502441406, -44.470787048339844, -42.68155288696289, -40.89231872558594, -39.103084564208984, -37.313846588134766, -35.52461242675781, -33.73537826538086, -31.946142196655273, -30.156906127929688, -28.367671966552734, -26.57843589782715, -24.789199829101562, -22.99996566772461, -21.210729598999023, -19.42149543762207, -17.632259368896484, -15.843024253845215, -14.053789138793945, -12.264554023742676, -10.475318908691406, -8.686083793640137, -6.896848201751709, -5.1076130867004395, -3.3183774948120117, -1.5291423797607422, 0.26009273529052734, 2.049327850341797, 3.8385629653930664, 5.627798080444336, 7.417033672332764, 9.206268310546875, 10.995504379272461, 12.78473949432373, 14.573974609375, 16.363208770751953, 18.15244483947754, 19.941679000854492, 21.730915069580078, 23.52014923095703, 25.309385299682617, 27.098621368408203, 28.887855529785156, 30.677091598510742, 32.46632766723633, 34.25556182861328, 36.044795989990234, 37.83403396606445, 39.623268127441406, 41.41250228881836, 43.20173645019531, 44.99097442626953, 46.780208587646484, 48.5694465637207, 50.358680725097656, 52.14791488647461, 53.93714904785156, 55.72638702392578, 57.515621185302734, 59.30485534667969]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 9.0, 8.0, 9.0, 9.0, 12.0, 13.0, 20.0, 16.0, 18.0, 25.0, 25.0, 25.0, 35.0, 34.0, 25.0, 35.0, 40.0, 40.0, 50.0, 41.0, 34.0, 39.0, 49.0, 37.0, 44.0, 41.0, 31.0, 13.0, 22.0, 28.0, 24.0, 24.0, 22.0, 20.0, 16.0, 8.0, 6.0, 9.0, 11.0, 9.0, 3.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.16015625, -5.00445556640625, -4.8487548828125, -4.69305419921875, -4.537353515625, -4.38165283203125, -4.2259521484375, -4.07025146484375, -3.91455078125, -3.75885009765625, -3.6031494140625, -3.44744873046875, -3.291748046875, -3.13604736328125, -2.9803466796875, -2.82464599609375, -2.6689453125, -2.51324462890625, -2.3575439453125, -2.20184326171875, -2.046142578125, -1.89044189453125, -1.7347412109375, -1.57904052734375, -1.42333984375, -1.26763916015625, -1.1119384765625, -0.95623779296875, -0.800537109375, -0.64483642578125, -0.4891357421875, -0.33343505859375, -0.177734375, -0.02203369140625, 0.1336669921875, 0.28936767578125, 0.445068359375, 0.60076904296875, 0.7564697265625, 0.91217041015625, 1.06787109375, 1.22357177734375, 1.3792724609375, 1.53497314453125, 1.690673828125, 1.84637451171875, 2.0020751953125, 2.15777587890625, 2.3134765625, 2.46917724609375, 2.6248779296875, 2.78057861328125, 2.936279296875, 3.09197998046875, 3.2476806640625, 3.40338134765625, 3.55908203125, 3.71478271484375, 3.8704833984375, 4.02618408203125, 4.181884765625, 4.33758544921875, 4.4932861328125, 4.64898681640625, 4.8046875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 10.0, 8.0, 11.0, 11.0, 22.0, 14.0, 18.0, 24.0, 24.0, 35.0, 29.0, 19.0, 38.0, 44.0, 82.0, 201.0, 1198.0, 90768.0, 3987321.0, 112419.0, 1341.0, 215.0, 89.0, 39.0, 33.0, 31.0, 29.0, 32.0, 19.0, 13.0, 23.0, 22.0, 17.0, 9.0, 11.0, 5.0, 9.0, 10.0, 6.0, 7.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.5, -31.50048828125, -30.5009765625, -29.50146484375, -28.501953125, -27.50244140625, -26.5029296875, -25.50341796875, -24.50390625, -23.50439453125, -22.5048828125, -21.50537109375, -20.505859375, -19.50634765625, -18.5068359375, -17.50732421875, -16.5078125, -15.50830078125, -14.5087890625, -13.50927734375, -12.509765625, -11.51025390625, -10.5107421875, -9.51123046875, -8.51171875, -7.51220703125, -6.5126953125, -5.51318359375, -4.513671875, -3.51416015625, -2.5146484375, -1.51513671875, -0.515625, 0.48388671875, 1.4833984375, 2.48291015625, 3.482421875, 4.48193359375, 5.4814453125, 6.48095703125, 7.48046875, 8.47998046875, 9.4794921875, 10.47900390625, 11.478515625, 12.47802734375, 13.4775390625, 14.47705078125, 15.4765625, 16.47607421875, 17.4755859375, 18.47509765625, 19.474609375, 20.47412109375, 21.4736328125, 22.47314453125, 23.47265625, 24.47216796875, 25.4716796875, 26.47119140625, 27.470703125, 28.47021484375, 29.4697265625, 30.46923828125, 31.46875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 5.0, 15.0, 28.0, 35.0, 49.0, 93.0, 142.0, 267.0, 432.0, 650.0, 778.0, 608.0, 389.0, 237.0, 120.0, 84.0, 47.0, 33.0, 20.0, 13.0, 11.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.6513671875, -26.912109375, -26.1728515625, -25.43359375, -24.6943359375, -23.955078125, -23.2158203125, -22.4765625, -21.7373046875, -20.998046875, -20.2587890625, -19.51953125, -18.7802734375, -18.041015625, -17.3017578125, -16.5625, -15.8232421875, -15.083984375, -14.3447265625, -13.60546875, -12.8662109375, -12.126953125, -11.3876953125, -10.6484375, -9.9091796875, -9.169921875, -8.4306640625, -7.69140625, -6.9521484375, -6.212890625, -5.4736328125, -4.734375, -3.9951171875, -3.255859375, -2.5166015625, -1.77734375, -1.0380859375, -0.298828125, 0.4404296875, 1.1796875, 1.9189453125, 2.658203125, 3.3974609375, 4.13671875, 4.8759765625, 5.615234375, 6.3544921875, 7.09375, 7.8330078125, 8.572265625, 9.3115234375, 10.05078125, 10.7900390625, 11.529296875, 12.2685546875, 13.0078125, 13.7470703125, 14.486328125, 15.2255859375, 15.96484375, 16.7041015625, 17.443359375, 18.1826171875, 18.921875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 15.0, 6.0, 28.0, 38.0, 37.0, 64.0, 96.0, 147.0, 236.0, 478.0, 1353.0, 131855.0, 4052538.0, 5691.0, 786.0, 363.0, 206.0, 110.0, 86.0, 50.0, 29.0, 19.0, 17.0, 7.0, 8.0, 4.0, 3.0, 4.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.9375, -81.3359375, -78.734375, -76.1328125, -73.53125, -70.9296875, -68.328125, -65.7265625, -63.125, -60.5234375, -57.921875, -55.3203125, -52.71875, -50.1171875, -47.515625, -44.9140625, -42.3125, -39.7109375, -37.109375, -34.5078125, -31.90625, -29.3046875, -26.703125, -24.1015625, -21.5, -18.8984375, -16.296875, -13.6953125, -11.09375, -8.4921875, -5.890625, -3.2890625, -0.6875, 1.9140625, 4.515625, 7.1171875, 9.71875, 12.3203125, 14.921875, 17.5234375, 20.125, 22.7265625, 25.328125, 27.9296875, 30.53125, 33.1328125, 35.734375, 38.3359375, 40.9375, 43.5390625, 46.140625, 48.7421875, 51.34375, 53.9453125, 56.546875, 59.1484375, 61.75, 64.3515625, 66.953125, 69.5546875, 72.15625, 74.7578125, 77.359375, 79.9609375, 82.5625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 6.0, 20.0, 67.0, 107.0, 149.0, 166.0, 208.0, 142.0, 69.0, 43.0, 16.0, 8.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.26334381103516, -71.68768310546875, -69.11201477050781, -66.5363540649414, -63.960689544677734, -61.38502502441406, -58.809364318847656, -56.233699798583984, -53.65803527832031, -51.08237075805664, -48.506710052490234, -45.93104553222656, -43.35538101196289, -40.77971649169922, -38.20405578613281, -35.62839126586914, -33.052730560302734, -30.477067947387695, -27.901403427124023, -25.325740814208984, -22.750076293945312, -20.174413681030273, -17.598751068115234, -15.023086547851562, -12.447423934936523, -9.871760368347168, -7.296097278594971, -4.720434188842773, -2.144770622253418, 0.4308929443359375, 3.0065555572509766, 5.582220077514648, 8.157882690429688, 10.733546257019043, 13.309209823608398, 15.884872436523438, 18.46053695678711, 21.03619956970215, 23.611862182617188, 26.18752670288086, 28.7631893157959, 31.338851928710938, 33.91451644897461, 36.49018096923828, 39.06584167480469, 41.64150619506836, 44.21717071533203, 46.79283142089844, 49.36849594116211, 51.94416046142578, 54.51982116699219, 57.09548568725586, 59.67115020751953, 62.24681091308594, 64.82247924804688, 67.39813995361328, 69.97380065917969, 72.5494613647461, 75.12512969970703, 77.70079040527344, 80.27645111083984, 82.85211944580078, 85.42778015136719, 88.00344848632812, 90.57910919189453]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 2.0, 9.0, 11.0, 9.0, 13.0, 15.0, 17.0, 25.0, 18.0, 26.0, 23.0, 23.0, 37.0, 40.0, 36.0, 30.0, 37.0, 43.0, 38.0, 42.0, 47.0, 45.0, 53.0, 44.0, 43.0, 44.0, 23.0, 32.0, 28.0, 30.0, 19.0, 19.0, 11.0, 10.0, 6.0, 12.0, 10.0, 5.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.24416732788086, -49.63560104370117, -48.02703857421875, -46.41847229003906, -44.809906005859375, -43.20133972167969, -41.5927734375, -39.98421096801758, -38.37564468383789, -36.7670783996582, -35.15851593017578, -33.549949645996094, -31.941383361816406, -30.33281707763672, -28.724252700805664, -27.11568832397461, -25.507122039794922, -23.898555755615234, -22.28999137878418, -20.681427001953125, -19.072860717773438, -17.46429443359375, -15.855730056762695, -14.247164726257324, -12.638599395751953, -11.030034065246582, -9.421468734741211, -7.81290340423584, -6.204338073730469, -4.595772743225098, -2.9872074127197266, -1.3786420822143555, 0.22991943359375, 1.838484764099121, 3.447050094604492, 5.055615425109863, 6.664180755615234, 8.272746086120605, 9.881311416625977, 11.489876747131348, 13.098442077636719, 14.70700740814209, 16.31557273864746, 17.924137115478516, 19.532703399658203, 21.14126968383789, 22.749834060668945, 24.3583984375, 25.966964721679688, 27.575531005859375, 29.18409538269043, 30.792659759521484, 32.40122604370117, 34.00979232788086, 35.61835479736328, 37.22692108154297, 38.835487365722656, 40.444053649902344, 42.05261993408203, 43.66118240356445, 45.26974868774414, 46.87831497192383, 48.48687744140625, 50.09544372558594, 51.704010009765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 8.0, 5.0, 6.0, 12.0, 11.0, 14.0, 10.0, 14.0, 13.0, 21.0, 30.0, 28.0, 23.0, 30.0, 37.0, 39.0, 36.0, 44.0, 43.0, 39.0, 39.0, 37.0, 32.0, 44.0, 49.0, 32.0, 38.0, 30.0, 27.0, 34.0, 24.0, 14.0, 25.0, 24.0, 20.0, 14.0, 13.0, 9.0, 8.0, 6.0, 8.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.1279296875, -4.962890625, -4.7978515625, -4.6328125, -4.4677734375, -4.302734375, -4.1376953125, -3.97265625, -3.8076171875, -3.642578125, -3.4775390625, -3.3125, -3.1474609375, -2.982421875, -2.8173828125, -2.65234375, -2.4873046875, -2.322265625, -2.1572265625, -1.9921875, -1.8271484375, -1.662109375, -1.4970703125, -1.33203125, -1.1669921875, -1.001953125, -0.8369140625, -0.671875, -0.5068359375, -0.341796875, -0.1767578125, -0.01171875, 0.1533203125, 0.318359375, 0.4833984375, 0.6484375, 0.8134765625, 0.978515625, 1.1435546875, 1.30859375, 1.4736328125, 1.638671875, 1.8037109375, 1.96875, 2.1337890625, 2.298828125, 2.4638671875, 2.62890625, 2.7939453125, 2.958984375, 3.1240234375, 3.2890625, 3.4541015625, 3.619140625, 3.7841796875, 3.94921875, 4.1142578125, 4.279296875, 4.4443359375, 4.609375, 4.7744140625, 4.939453125, 5.1044921875, 5.26953125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 10.0, 13.0, 12.0, 29.0, 45.0, 70.0, 83.0, 144.0, 200.0, 335.0, 440.0, 673.0, 961.0, 1386.0, 1887.0, 2838.0, 4061.0, 5768.0, 8387.0, 12007.0, 17694.0, 26540.0, 41068.0, 65776.0, 111907.0, 237743.0, 219163.0, 106143.0, 62962.0, 39268.0, 25944.0, 17048.0, 11704.0, 7942.0, 5520.0, 3901.0, 2743.0, 1937.0, 1280.0, 955.0, 615.0, 444.0, 304.0, 208.0, 139.0, 88.0, 60.0, 53.0, 14.0, 17.0, 14.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0556640625, -1.0226287841796875, -0.989593505859375, -0.9565582275390625, -0.92352294921875, -0.8904876708984375, -0.857452392578125, -0.8244171142578125, -0.7913818359375, -0.7583465576171875, -0.725311279296875, -0.6922760009765625, -0.65924072265625, -0.6262054443359375, -0.593170166015625, -0.5601348876953125, -0.527099609375, -0.4940643310546875, -0.461029052734375, -0.4279937744140625, -0.39495849609375, -0.3619232177734375, -0.328887939453125, -0.2958526611328125, -0.2628173828125, -0.2297821044921875, -0.196746826171875, -0.1637115478515625, -0.13067626953125, -0.0976409912109375, -0.064605712890625, -0.0315704345703125, 0.00146484375, 0.0345001220703125, 0.067535400390625, 0.1005706787109375, 0.13360595703125, 0.1666412353515625, 0.199676513671875, 0.2327117919921875, 0.2657470703125, 0.2987823486328125, 0.331817626953125, 0.3648529052734375, 0.39788818359375, 0.4309234619140625, 0.463958740234375, 0.4969940185546875, 0.530029296875, 0.5630645751953125, 0.596099853515625, 0.6291351318359375, 0.66217041015625, 0.6952056884765625, 0.728240966796875, 0.7612762451171875, 0.7943115234375, 0.8273468017578125, 0.860382080078125, 0.8934173583984375, 0.92645263671875, 0.9594879150390625, 0.992523193359375, 1.0255584716796875, 1.05859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 8.0, 6.0, 5.0, 7.0, 13.0, 14.0, 11.0, 14.0, 17.0, 24.0, 21.0, 17.0, 31.0, 28.0, 23.0, 31.0, 43.0, 40.0, 35.0, 30.0, 32.0, 30.0, 1068.0, 35.0, 39.0, 33.0, 36.0, 27.0, 43.0, 28.0, 31.0, 18.0, 23.0, 15.0, 28.0, 21.0, 14.0, 17.0, 10.0, 13.0, 9.0, 8.0, 6.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.83203125, -2.73828125, -2.64453125, -2.55078125, -2.45703125, -2.36328125, -2.26953125, -2.17578125, -2.08203125, -1.98828125, -1.89453125, -1.80078125, -1.70703125, -1.61328125, -1.51953125, -1.42578125, -1.33203125, -1.23828125, -1.14453125, -1.05078125, -0.95703125, -0.86328125, -0.76953125, -0.67578125, -0.58203125, -0.48828125, -0.39453125, -0.30078125, -0.20703125, -0.11328125, -0.01953125, 0.07421875, 0.16796875, 0.26171875, 0.35546875, 0.44921875, 0.54296875, 0.63671875, 0.73046875, 0.82421875, 0.91796875, 1.01171875, 1.10546875, 1.19921875, 1.29296875, 1.38671875, 1.48046875, 1.57421875, 1.66796875, 1.76171875, 1.85546875, 1.94921875, 2.04296875, 2.13671875, 2.23046875, 2.32421875, 2.41796875, 2.51171875, 2.60546875, 2.69921875, 2.79296875, 2.88671875, 2.98046875, 3.07421875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 3.0, 11.0, 14.0, 12.0, 30.0, 39.0, 52.0, 85.0, 123.0, 146.0, 254.0, 347.0, 498.0, 730.0, 1041.0, 1543.0, 2163.0, 3225.0, 4601.0, 6619.0, 9748.0, 13649.0, 20240.0, 29296.0, 43941.0, 69309.0, 114366.0, 1289721.0, 194381.0, 101285.0, 62776.0, 40048.0, 26696.0, 18640.0, 12830.0, 8901.0, 6098.0, 4185.0, 2982.0, 1989.0, 1393.0, 922.0, 671.0, 461.0, 332.0, 232.0, 157.0, 106.0, 79.0, 54.0, 39.0, 30.0, 18.0, 12.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.9091796875, -0.8806686401367188, -0.8521575927734375, -0.8236465454101562, -0.795135498046875, -0.7666244506835938, -0.7381134033203125, -0.7096023559570312, -0.68109130859375, -0.6525802612304688, -0.6240692138671875, -0.5955581665039062, -0.567047119140625, -0.5385360717773438, -0.5100250244140625, -0.48151397705078125, -0.4530029296875, -0.42449188232421875, -0.3959808349609375, -0.36746978759765625, -0.338958740234375, -0.31044769287109375, -0.2819366455078125, -0.25342559814453125, -0.22491455078125, -0.19640350341796875, -0.1678924560546875, -0.13938140869140625, -0.110870361328125, -0.08235931396484375, -0.0538482666015625, -0.02533721923828125, 0.003173828125, 0.03168487548828125, 0.0601959228515625, 0.08870697021484375, 0.117218017578125, 0.14572906494140625, 0.1742401123046875, 0.20275115966796875, 0.23126220703125, 0.25977325439453125, 0.2882843017578125, 0.31679534912109375, 0.345306396484375, 0.37381744384765625, 0.4023284912109375, 0.43083953857421875, 0.4593505859375, 0.48786163330078125, 0.5163726806640625, 0.5448837280273438, 0.573394775390625, 0.6019058227539062, 0.6304168701171875, 0.6589279174804688, 0.68743896484375, 0.7159500122070312, 0.7444610595703125, 0.7729721069335938, 0.801483154296875, 0.8299942016601562, 0.8585052490234375, 0.8870162963867188, 0.91552734375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 12.0, 17.0, 20.0, 21.0, 33.0, 53.0, 95.0, 114.0, 132.0, 138.0, 93.0, 86.0, 51.0, 32.0, 23.0, 16.0, 4.0, 11.0, 5.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010089874267578125, -0.0009799078106880188, -0.0009508281946182251, -0.0009217485785484314, -0.0008926689624786377, -0.000863589346408844, -0.0008345097303390503, -0.0008054301142692566, -0.0007763504981994629, -0.0007472708821296692, -0.0007181912660598755, -0.0006891116499900818, -0.0006600320339202881, -0.0006309524178504944, -0.0006018728017807007, -0.000572793185710907, -0.0005437135696411133, -0.0005146339535713196, -0.0004855543375015259, -0.0004564747214317322, -0.0004273951053619385, -0.0003983154892921448, -0.0003692358732223511, -0.0003401562571525574, -0.00031107664108276367, -0.00028199702501296997, -0.00025291740894317627, -0.00022383779287338257, -0.00019475817680358887, -0.00016567856073379517, -0.00013659894466400146, -0.00010751932859420776, -7.843971252441406e-05, -4.936009645462036e-05, -2.028048038482666e-05, 8.799135684967041e-06, 3.787875175476074e-05, 6.695836782455444e-05, 9.603798389434814e-05, 0.00012511759996414185, 0.00015419721603393555, 0.00018327683210372925, 0.00021235644817352295, 0.00024143606424331665, 0.00027051568031311035, 0.00029959529638290405, 0.00032867491245269775, 0.00035775452852249146, 0.00038683414459228516, 0.00041591376066207886, 0.00044499337673187256, 0.00047407299280166626, 0.00050315260887146, 0.0005322322249412537, 0.0005613118410110474, 0.0005903914570808411, 0.0006194710731506348, 0.0006485506892204285, 0.0006776303052902222, 0.0007067099213600159, 0.0007357895374298096, 0.0007648691534996033, 0.000793948769569397, 0.0008230283856391907, 0.0008521080017089844]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 11.0, 7.0, 11.0, 34.0, 34.0, 69.0, 114.0, 245.0, 544.0, 398066.0, 648334.0, 531.0, 225.0, 135.0, 73.0, 32.0, 17.0, 22.0, 15.0, 8.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022216796875, -0.02145099639892578, -0.020685195922851562, -0.019919395446777344, -0.019153594970703125, -0.018387794494628906, -0.017621994018554688, -0.01685619354248047, -0.01609039306640625, -0.015324592590332031, -0.014558792114257812, -0.013792991638183594, -0.013027191162109375, -0.012261390686035156, -0.011495590209960938, -0.010729789733886719, -0.0099639892578125, -0.009198188781738281, -0.008432388305664062, -0.007666587829589844, -0.006900787353515625, -0.006134986877441406, -0.0053691864013671875, -0.004603385925292969, -0.00383758544921875, -0.0030717849731445312, -0.0023059844970703125, -0.0015401840209960938, -0.000774383544921875, -8.58306884765625e-06, 0.0007572174072265625, 0.0015230178833007812, 0.002288818359375, 0.0030546188354492188, 0.0038204193115234375, 0.004586219787597656, 0.005352020263671875, 0.006117820739746094, 0.0068836212158203125, 0.007649421691894531, 0.00841522216796875, 0.009181022644042969, 0.009946823120117188, 0.010712623596191406, 0.011478424072265625, 0.012244224548339844, 0.013010025024414062, 0.013775825500488281, 0.0145416259765625, 0.015307426452636719, 0.016073226928710938, 0.016839027404785156, 0.017604827880859375, 0.018370628356933594, 0.019136428833007812, 0.01990222930908203, 0.02066802978515625, 0.02143383026123047, 0.022199630737304688, 0.022965431213378906, 0.023731231689453125, 0.024497032165527344, 0.025262832641601562, 0.02602863311767578, 0.02679443359375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 611.0, 391.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004294907674193382, -0.004216710105538368, -0.004138512071222067, -0.004060314502567053, -0.003982116933912039, -0.0039039188995957375, -0.0038257213309407234, -0.0037475235294550657, -0.003669325727969408, -0.0035911279264837503, -0.0035129303578287363, -0.0034347325563430786, -0.003356534754857421, -0.0032783369533717632, -0.003200139384716749, -0.0031219415832310915, -0.0030437440145760775, -0.0029655462130904198, -0.0028873486444354057, -0.002809150842949748, -0.0027309530414640903, -0.0026527554728090763, -0.0025745576713234186, -0.002496359869837761, -0.002418162301182747, -0.002339964499697089, -0.002261766931042075, -0.0021835691295564175, -0.0021053713280707598, -0.002027173526585102, -0.001948975957930088, -0.0018707781564444304, -0.001792580122128129, -0.0017143824370577931, -0.0016361846355721354, -0.0015579869505017996, -0.0014797891490161419, -0.001401591463945806, -0.0013233937788754702, -0.0012451959773898125, -0.0011669982923194766, -0.0010888006072491407, -0.001010602805763483, -0.0009324051206931472, -0.0008542073774151504, -0.0007760096341371536, -0.0006978119490668178, -0.000619614205788821, -0.0005414164625108242, -0.0004632187192328274, -0.0003850210050586611, -0.0003068232908844948, -0.000228625547606498, -0.00015042780432850122, -7.22300901543349e-05, 5.967624019831419e-06, 8.41653672978282e-05, 0.00016236309602390975, 0.0002405608247499913, 0.0003187585389241576, 0.0003969562822021544, 0.0004751540254801512, 0.000553351710550487, 0.0006315494538284838, 0.0007097471971064806]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 8.0, 4.0, 7.0, 14.0, 8.0, 11.0, 8.0, 16.0, 22.0, 17.0, 25.0, 25.0, 24.0, 23.0, 38.0, 43.0, 33.0, 36.0, 35.0, 43.0, 33.0, 52.0, 46.0, 54.0, 36.0, 36.0, 32.0, 31.0, 30.0, 32.0, 21.0, 20.0, 21.0, 22.0, 18.0, 12.0, 9.0, 9.0, 11.0, 8.0, 5.0, 5.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000286102294921875, -0.0002766391262412071, -0.00026717595756053925, -0.00025771278887987137, -0.0002482496201992035, -0.00023878645151853561, -0.00022932328283786774, -0.00021986011415719986, -0.00021039694547653198, -0.0002009337767958641, -0.00019147060811519623, -0.00018200743943452835, -0.00017254427075386047, -0.0001630811020731926, -0.00015361793339252472, -0.00014415476471185684, -0.00013469159603118896, -0.0001252284273505211, -0.00011576525866985321, -0.00010630208998918533, -9.683892130851746e-05, -8.737575262784958e-05, -7.79125839471817e-05, -6.844941526651382e-05, -5.898624658584595e-05, -4.952307790517807e-05, -4.005990922451019e-05, -3.0596740543842316e-05, -2.113357186317444e-05, -1.1670403182506561e-05, -2.207234501838684e-06, 7.255934178829193e-06, 1.671910285949707e-05, 2.6182271540164948e-05, 3.5645440220832825e-05, 4.51086089015007e-05, 5.457177758216858e-05, 6.403494626283646e-05, 7.349811494350433e-05, 8.296128362417221e-05, 9.242445230484009e-05, 0.00010188762098550797, 0.00011135078966617584, 0.00012081395834684372, 0.0001302771270275116, 0.00013974029570817947, 0.00014920346438884735, 0.00015866663306951523, 0.0001681298017501831, 0.00017759297043085098, 0.00018705613911151886, 0.00019651930779218674, 0.00020598247647285461, 0.0002154456451535225, 0.00022490881383419037, 0.00023437198251485825, 0.00024383515119552612, 0.000253298319876194, 0.0002627614885568619, 0.00027222465723752975, 0.00028168782591819763, 0.0002911509945988655, 0.0003006141632795334, 0.00031007733196020126, 0.00031954050064086914]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 8.0, 5.0, 6.0, 12.0, 11.0, 14.0, 10.0, 14.0, 13.0, 21.0, 30.0, 28.0, 23.0, 30.0, 37.0, 39.0, 36.0, 44.0, 43.0, 39.0, 39.0, 37.0, 32.0, 44.0, 49.0, 32.0, 38.0, 30.0, 27.0, 34.0, 24.0, 14.0, 25.0, 24.0, 20.0, 14.0, 13.0, 9.0, 8.0, 6.0, 8.0, 6.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.1279296875, -4.962890625, -4.7978515625, -4.6328125, -4.4677734375, -4.302734375, -4.1376953125, -3.97265625, -3.8076171875, -3.642578125, -3.4775390625, -3.3125, -3.1474609375, -2.982421875, -2.8173828125, -2.65234375, -2.4873046875, -2.322265625, -2.1572265625, -1.9921875, -1.8271484375, -1.662109375, -1.4970703125, -1.33203125, -1.1669921875, -1.001953125, -0.8369140625, -0.671875, -0.5068359375, -0.341796875, -0.1767578125, -0.01171875, 0.1533203125, 0.318359375, 0.4833984375, 0.6484375, 0.8134765625, 0.978515625, 1.1435546875, 1.30859375, 1.4736328125, 1.638671875, 1.8037109375, 1.96875, 2.1337890625, 2.298828125, 2.4638671875, 2.62890625, 2.7939453125, 2.958984375, 3.1240234375, 3.2890625, 3.4541015625, 3.619140625, 3.7841796875, 3.94921875, 4.1142578125, 4.279296875, 4.4443359375, 4.609375, 4.7744140625, 4.939453125, 5.1044921875, 5.26953125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 8.0, 4.0, 10.0, 8.0, 20.0, 20.0, 44.0, 48.0, 66.0, 77.0, 122.0, 169.0, 250.0, 312.0, 485.0, 808.0, 1147.0, 1997.0, 3553.0, 6897.0, 15205.0, 39753.0, 141798.0, 491998.0, 242108.0, 60569.0, 20962.0, 8942.0, 4508.0, 2412.0, 1413.0, 898.0, 593.0, 397.0, 295.0, 218.0, 127.0, 86.0, 67.0, 53.0, 27.0, 20.0, 18.0, 15.0, 14.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.462890625, -3.346221923828125, -3.22955322265625, -3.112884521484375, -2.9962158203125, -2.879547119140625, -2.76287841796875, -2.646209716796875, -2.529541015625, -2.412872314453125, -2.29620361328125, -2.179534912109375, -2.0628662109375, -1.946197509765625, -1.82952880859375, -1.712860107421875, -1.59619140625, -1.479522705078125, -1.36285400390625, -1.246185302734375, -1.1295166015625, -1.012847900390625, -0.89617919921875, -0.779510498046875, -0.662841796875, -0.546173095703125, -0.42950439453125, -0.312835693359375, -0.1961669921875, -0.079498291015625, 0.03717041015625, 0.153839111328125, 0.2705078125, 0.387176513671875, 0.50384521484375, 0.620513916015625, 0.7371826171875, 0.853851318359375, 0.97052001953125, 1.087188720703125, 1.203857421875, 1.320526123046875, 1.43719482421875, 1.553863525390625, 1.6705322265625, 1.787200927734375, 1.90386962890625, 2.020538330078125, 2.13720703125, 2.253875732421875, 2.37054443359375, 2.487213134765625, 2.6038818359375, 2.720550537109375, 2.83721923828125, 2.953887939453125, 3.070556640625, 3.187225341796875, 3.30389404296875, 3.420562744140625, 3.5372314453125, 3.653900146484375, 3.77056884765625, 3.887237548828125, 4.00390625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 3.0, 10.0, 6.0, 12.0, 13.0, 11.0, 17.0, 16.0, 20.0, 23.0, 31.0, 32.0, 32.0, 33.0, 38.0, 37.0, 53.0, 59.0, 341.0, 1734.0, 76.0, 53.0, 40.0, 41.0, 46.0, 50.0, 35.0, 37.0, 21.0, 22.0, 23.0, 13.0, 17.0, 16.0, 12.0, 6.0, 4.0, 5.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.187744140625, -17.56298828125, -16.938232421875, -16.3134765625, -15.688720703125, -15.06396484375, -14.439208984375, -13.814453125, -13.189697265625, -12.56494140625, -11.940185546875, -11.3154296875, -10.690673828125, -10.06591796875, -9.441162109375, -8.81640625, -8.191650390625, -7.56689453125, -6.942138671875, -6.3173828125, -5.692626953125, -5.06787109375, -4.443115234375, -3.818359375, -3.193603515625, -2.56884765625, -1.944091796875, -1.3193359375, -0.694580078125, -0.06982421875, 0.554931640625, 1.1796875, 1.804443359375, 2.42919921875, 3.053955078125, 3.6787109375, 4.303466796875, 4.92822265625, 5.552978515625, 6.177734375, 6.802490234375, 7.42724609375, 8.052001953125, 8.6767578125, 9.301513671875, 9.92626953125, 10.551025390625, 11.17578125, 11.800537109375, 12.42529296875, 13.050048828125, 13.6748046875, 14.299560546875, 14.92431640625, 15.549072265625, 16.173828125, 16.798583984375, 17.42333984375, 18.048095703125, 18.6728515625, 19.297607421875, 19.92236328125, 20.547119140625, 21.171875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 16.0, 9.0, 22.0, 14.0, 18.0, 22.0, 30.0, 43.0, 39.0, 67.0, 101.0, 156.0, 233.0, 487.0, 1916.0, 86586.0, 3047550.0, 6622.0, 814.0, 319.0, 183.0, 108.0, 83.0, 47.0, 40.0, 34.0, 20.0, 24.0, 16.0, 12.0, 13.0, 17.0, 10.0, 6.0, 6.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.875, -33.8564453125, -32.837890625, -31.8193359375, -30.80078125, -29.7822265625, -28.763671875, -27.7451171875, -26.7265625, -25.7080078125, -24.689453125, -23.6708984375, -22.65234375, -21.6337890625, -20.615234375, -19.5966796875, -18.578125, -17.5595703125, -16.541015625, -15.5224609375, -14.50390625, -13.4853515625, -12.466796875, -11.4482421875, -10.4296875, -9.4111328125, -8.392578125, -7.3740234375, -6.35546875, -5.3369140625, -4.318359375, -3.2998046875, -2.28125, -1.2626953125, -0.244140625, 0.7744140625, 1.79296875, 2.8115234375, 3.830078125, 4.8486328125, 5.8671875, 6.8857421875, 7.904296875, 8.9228515625, 9.94140625, 10.9599609375, 11.978515625, 12.9970703125, 14.015625, 15.0341796875, 16.052734375, 17.0712890625, 18.08984375, 19.1083984375, 20.126953125, 21.1455078125, 22.1640625, 23.1826171875, 24.201171875, 25.2197265625, 26.23828125, 27.2568359375, 28.275390625, 29.2939453125, 30.3125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 6.0, 585.0, 423.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.739985466003418, -8.436986923217773, -4.1339874267578125, 0.16901111602783203, 4.472010612487793, 8.775010108947754, 13.078007698059082, 17.38100814819336, 21.684005737304688, 25.98700523376465, 30.29000473022461, 34.59300231933594, 38.89600372314453, 43.19900131225586, 47.50199890136719, 51.80500030517578, 56.10799789428711, 60.41099548339844, 64.71399688720703, 69.01699829101562, 73.31999206542969, 77.62299346923828, 81.92599487304688, 86.22898864746094, 90.53199005126953, 94.83499145507812, 99.13798522949219, 103.44098663330078, 107.74398803710938, 112.04698181152344, 116.34998321533203, 120.65298461914062, 124.95597839355469, 129.25897216796875, 133.56198120117188, 137.86497497558594, 142.16796875, 146.47097778320312, 150.7739715576172, 155.07696533203125, 159.37997436523438, 163.68296813964844, 167.98597717285156, 172.28897094726562, 176.5919647216797, 180.8949737548828, 185.19796752929688, 189.50096130371094, 193.803955078125, 198.10694885253906, 202.4099578857422, 206.71295166015625, 211.0159454345703, 215.31895446777344, 219.6219482421875, 223.92494201660156, 228.2279510498047, 232.53094482421875, 236.83395385742188, 241.13694763183594, 245.43994140625, 249.74295043945312, 254.0459442138672, 258.34893798828125, 262.6519470214844]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 2.0, 6.0, 2.0, 6.0, 7.0, 7.0, 8.0, 13.0, 11.0, 12.0, 9.0, 14.0, 20.0, 23.0, 28.0, 34.0, 24.0, 30.0, 35.0, 37.0, 25.0, 49.0, 39.0, 38.0, 36.0, 27.0, 49.0, 37.0, 32.0, 29.0, 32.0, 38.0, 30.0, 26.0, 27.0, 17.0, 16.0, 28.0, 15.0, 17.0, 13.0, 12.0, 14.0, 5.0, 4.0, 8.0, 2.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-55.407169342041016, -53.6591682434082, -51.91116714477539, -50.16316604614258, -48.41516876220703, -46.66716766357422, -44.919166564941406, -43.171165466308594, -41.42316436767578, -39.67516326904297, -37.927162170410156, -36.179161071777344, -34.43115997314453, -32.68315887451172, -30.935161590576172, -29.18716049194336, -27.439159393310547, -25.691158294677734, -23.943157196044922, -22.195158004760742, -20.44715690612793, -18.699155807495117, -16.951156616210938, -15.203155517578125, -13.455154418945312, -11.7071533203125, -9.959153175354004, -8.211153030395508, -6.463151931762695, -4.715150833129883, -2.9671506881713867, -1.2191505432128906, 0.5288543701171875, 2.276854991912842, 4.024855613708496, 5.77285623550415, 7.520856857299805, 9.268857955932617, 11.016858100891113, 12.76485824584961, 14.512859344482422, 16.260860443115234, 18.008861541748047, 19.756860733032227, 21.50486183166504, 23.25286293029785, 25.00086212158203, 26.748863220214844, 28.496864318847656, 30.24486541748047, 31.99286651611328, 33.740867614746094, 35.488868713378906, 37.23686981201172, 38.984867095947266, 40.73286819458008, 42.48086929321289, 44.2288703918457, 45.976871490478516, 47.72487258911133, 49.472869873046875, 51.22087097167969, 52.9688720703125, 54.71687316894531, 56.464874267578125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 4.0, 7.0, 11.0, 10.0, 15.0, 10.0, 12.0, 17.0, 21.0, 20.0, 27.0, 30.0, 31.0, 29.0, 38.0, 39.0, 39.0, 45.0, 43.0, 45.0, 38.0, 43.0, 38.0, 52.0, 30.0, 37.0, 30.0, 31.0, 25.0, 28.0, 22.0, 23.0, 27.0, 15.0, 13.0, 10.0, 8.0, 10.0, 5.0, 9.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.68359375, -5.51220703125, -5.3408203125, -5.16943359375, -4.998046875, -4.82666015625, -4.6552734375, -4.48388671875, -4.3125, -4.14111328125, -3.9697265625, -3.79833984375, -3.626953125, -3.45556640625, -3.2841796875, -3.11279296875, -2.94140625, -2.77001953125, -2.5986328125, -2.42724609375, -2.255859375, -2.08447265625, -1.9130859375, -1.74169921875, -1.5703125, -1.39892578125, -1.2275390625, -1.05615234375, -0.884765625, -0.71337890625, -0.5419921875, -0.37060546875, -0.19921875, -0.02783203125, 0.1435546875, 0.31494140625, 0.486328125, 0.65771484375, 0.8291015625, 1.00048828125, 1.171875, 1.34326171875, 1.5146484375, 1.68603515625, 1.857421875, 2.02880859375, 2.2001953125, 2.37158203125, 2.54296875, 2.71435546875, 2.8857421875, 3.05712890625, 3.228515625, 3.39990234375, 3.5712890625, 3.74267578125, 3.9140625, 4.08544921875, 4.2568359375, 4.42822265625, 4.599609375, 4.77099609375, 4.9423828125, 5.11376953125, 5.28515625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 3.0, 7.0, 7.0, 9.0, 23.0, 14.0, 16.0, 31.0, 45.0, 52.0, 97.0, 116.0, 235.0, 435.0, 1029.0, 3152.0, 14565.0, 105193.0, 919478.0, 2357795.0, 698181.0, 77285.0, 11898.0, 2665.0, 917.0, 360.0, 230.0, 137.0, 74.0, 55.0, 42.0, 31.0, 18.0, 19.0, 6.0, 10.0, 14.0, 10.0, 2.0, 4.0, 8.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.5699462890625, -10.233642578125, -9.8973388671875, -9.56103515625, -9.2247314453125, -8.888427734375, -8.5521240234375, -8.2158203125, -7.8795166015625, -7.543212890625, -7.2069091796875, -6.87060546875, -6.5343017578125, -6.197998046875, -5.8616943359375, -5.525390625, -5.1890869140625, -4.852783203125, -4.5164794921875, -4.18017578125, -3.8438720703125, -3.507568359375, -3.1712646484375, -2.8349609375, -2.4986572265625, -2.162353515625, -1.8260498046875, -1.48974609375, -1.1534423828125, -0.817138671875, -0.4808349609375, -0.14453125, 0.1917724609375, 0.528076171875, 0.8643798828125, 1.20068359375, 1.5369873046875, 1.873291015625, 2.2095947265625, 2.5458984375, 2.8822021484375, 3.218505859375, 3.5548095703125, 3.89111328125, 4.2274169921875, 4.563720703125, 4.9000244140625, 5.236328125, 5.5726318359375, 5.908935546875, 6.2452392578125, 6.58154296875, 6.9178466796875, 7.254150390625, 7.5904541015625, 7.9267578125, 8.2630615234375, 8.599365234375, 8.9356689453125, 9.27197265625, 9.6082763671875, 9.944580078125, 10.2808837890625, 10.6171875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 13.0, 22.0, 12.0, 32.0, 44.0, 60.0, 89.0, 97.0, 158.0, 185.0, 272.0, 363.0, 436.0, 476.0, 424.0, 375.0, 252.0, 213.0, 139.0, 104.0, 69.0, 67.0, 46.0, 22.0, 30.0, 16.0, 13.0, 10.0, 3.0, 7.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.953125, -15.4896240234375, -15.026123046875, -14.5626220703125, -14.09912109375, -13.6356201171875, -13.172119140625, -12.7086181640625, -12.2451171875, -11.7816162109375, -11.318115234375, -10.8546142578125, -10.39111328125, -9.9276123046875, -9.464111328125, -9.0006103515625, -8.537109375, -8.0736083984375, -7.610107421875, -7.1466064453125, -6.68310546875, -6.2196044921875, -5.756103515625, -5.2926025390625, -4.8291015625, -4.3656005859375, -3.902099609375, -3.4385986328125, -2.97509765625, -2.5115966796875, -2.048095703125, -1.5845947265625, -1.12109375, -0.6575927734375, -0.194091796875, 0.2694091796875, 0.73291015625, 1.1964111328125, 1.659912109375, 2.1234130859375, 2.5869140625, 3.0504150390625, 3.513916015625, 3.9774169921875, 4.44091796875, 4.9044189453125, 5.367919921875, 5.8314208984375, 6.294921875, 6.7584228515625, 7.221923828125, 7.6854248046875, 8.14892578125, 8.6124267578125, 9.075927734375, 9.5394287109375, 10.0029296875, 10.4664306640625, 10.929931640625, 11.3934326171875, 11.85693359375, 12.3204345703125, 12.783935546875, 13.2474365234375, 13.7109375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 11.0, 12.0, 18.0, 39.0, 51.0, 73.0, 85.0, 159.0, 206.0, 439.0, 1666.0, 193265.0, 3986703.0, 9989.0, 726.0, 264.0, 187.0, 106.0, 69.0, 53.0, 43.0, 29.0, 18.0, 16.0, 6.0, 7.0, 10.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.8125, -56.5732421875, -54.333984375, -52.0947265625, -49.85546875, -47.6162109375, -45.376953125, -43.1376953125, -40.8984375, -38.6591796875, -36.419921875, -34.1806640625, -31.94140625, -29.7021484375, -27.462890625, -25.2236328125, -22.984375, -20.7451171875, -18.505859375, -16.2666015625, -14.02734375, -11.7880859375, -9.548828125, -7.3095703125, -5.0703125, -2.8310546875, -0.591796875, 1.6474609375, 3.88671875, 6.1259765625, 8.365234375, 10.6044921875, 12.84375, 15.0830078125, 17.322265625, 19.5615234375, 21.80078125, 24.0400390625, 26.279296875, 28.5185546875, 30.7578125, 32.9970703125, 35.236328125, 37.4755859375, 39.71484375, 41.9541015625, 44.193359375, 46.4326171875, 48.671875, 50.9111328125, 53.150390625, 55.3896484375, 57.62890625, 59.8681640625, 62.107421875, 64.3466796875, 66.5859375, 68.8251953125, 71.064453125, 73.3037109375, 75.54296875, 77.7822265625, 80.021484375, 82.2607421875, 84.5]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 24.0, 257.0, 479.0, 236.0, 19.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-281.2601318359375, -274.1336669921875, -267.0072326660156, -259.8807678222656, -252.7543182373047, -245.62786865234375, -238.5014190673828, -231.37496948242188, -224.24850463867188, -217.12205505371094, -209.99560546875, -202.869140625, -195.74269104003906, -188.61624145507812, -181.4897918701172, -174.36334228515625, -167.2368927001953, -160.11044311523438, -152.98399353027344, -145.8575439453125, -138.7310791015625, -131.60462951660156, -124.47817993164062, -117.35173034667969, -110.22527313232422, -103.09882354736328, -95.97236633300781, -88.84591674804688, -81.71946716308594, -74.59300994873047, -67.46656036376953, -60.34010696411133, -53.213653564453125, -46.08720016479492, -38.96074676513672, -31.83429718017578, -24.707843780517578, -17.581390380859375, -10.454940795898438, -3.3284873962402344, 3.7979660034179688, 10.924418449401855, 18.050870895385742, 25.177322387695312, 32.303775787353516, 39.43022918701172, 46.556678771972656, 53.68313217163086, 60.80958557128906, 67.93603515625, 75.06249237060547, 82.1889419555664, 89.31539916992188, 96.44184875488281, 103.56829833984375, 110.69474792480469, 117.82120513916016, 124.9476547241211, 132.07411193847656, 139.2005615234375, 146.32701110839844, 153.45346069335938, 160.57992553710938, 167.7063751220703, 174.83282470703125]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 4.0, 15.0, 12.0, 10.0, 17.0, 20.0, 18.0, 29.0, 24.0, 30.0, 34.0, 36.0, 36.0, 48.0, 47.0, 51.0, 43.0, 54.0, 53.0, 33.0, 43.0, 42.0, 42.0, 41.0, 27.0, 28.0, 23.0, 19.0, 24.0, 18.0, 14.0, 12.0, 11.0, 9.0, 9.0, 9.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.21318054199219, -48.53741455078125, -46.86164474487305, -45.185874938964844, -43.510108947753906, -41.83434295654297, -40.158573150634766, -38.48280334472656, -36.807037353515625, -35.13127136230469, -33.455501556396484, -31.779733657836914, -30.103965759277344, -28.428197860717773, -26.752429962158203, -25.076662063598633, -23.400894165039062, -21.725126266479492, -20.049358367919922, -18.37359046936035, -16.69782257080078, -15.022054672241211, -13.34628677368164, -11.67051887512207, -9.9947509765625, -8.31898307800293, -6.643215179443359, -4.967447280883789, -3.2916793823242188, -1.6159114837646484, 0.059856414794921875, 1.7356243133544922, 3.4113922119140625, 5.087160110473633, 6.762928009033203, 8.438695907592773, 10.114463806152344, 11.790231704711914, 13.465999603271484, 15.141767501831055, 16.817535400390625, 18.493303298950195, 20.169071197509766, 21.844839096069336, 23.520606994628906, 25.196374893188477, 26.872142791748047, 28.547910690307617, 30.223678588867188, 31.899446487426758, 33.57521438598633, 35.25098419189453, 36.92675018310547, 38.602516174316406, 40.27828598022461, 41.95405578613281, 43.62982177734375, 45.30558776855469, 46.98135757446289, 48.657127380371094, 50.33289337158203, 52.00865936279297, 53.68442916870117, 55.360198974609375, 57.03596496582031]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 5.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 8.0, 12.0, 16.0, 20.0, 30.0, 26.0, 36.0, 31.0, 28.0, 32.0, 30.0, 42.0, 43.0, 45.0, 55.0, 38.0, 48.0, 45.0, 42.0, 39.0, 41.0, 35.0, 25.0, 26.0, 25.0, 21.0, 12.0, 20.0, 19.0, 17.0, 16.0, 8.0, 11.0, 7.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.1484375, -5.96844482421875, -5.7884521484375, -5.60845947265625, -5.428466796875, -5.24847412109375, -5.0684814453125, -4.88848876953125, -4.70849609375, -4.52850341796875, -4.3485107421875, -4.16851806640625, -3.988525390625, -3.80853271484375, -3.6285400390625, -3.44854736328125, -3.2685546875, -3.08856201171875, -2.9085693359375, -2.72857666015625, -2.548583984375, -2.36859130859375, -2.1885986328125, -2.00860595703125, -1.82861328125, -1.64862060546875, -1.4686279296875, -1.28863525390625, -1.108642578125, -0.92864990234375, -0.7486572265625, -0.56866455078125, -0.388671875, -0.20867919921875, -0.0286865234375, 0.15130615234375, 0.331298828125, 0.51129150390625, 0.6912841796875, 0.87127685546875, 1.05126953125, 1.23126220703125, 1.4112548828125, 1.59124755859375, 1.771240234375, 1.95123291015625, 2.1312255859375, 2.31121826171875, 2.4912109375, 2.67120361328125, 2.8511962890625, 3.03118896484375, 3.211181640625, 3.39117431640625, 3.5711669921875, 3.75115966796875, 3.93115234375, 4.11114501953125, 4.2911376953125, 4.47113037109375, 4.651123046875, 4.83111572265625, 5.0111083984375, 5.19110107421875, 5.37109375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 7.0, 4.0, 21.0, 26.0, 39.0, 51.0, 95.0, 99.0, 169.0, 236.0, 378.0, 500.0, 700.0, 1057.0, 1597.0, 2291.0, 3304.0, 4976.0, 7545.0, 11290.0, 17393.0, 26862.0, 42533.0, 70171.0, 127435.0, 322787.0, 176455.0, 86580.0, 51481.0, 31976.0, 20308.0, 13124.0, 8679.0, 5880.0, 3935.0, 2804.0, 1781.0, 1290.0, 879.0, 591.0, 398.0, 279.0, 200.0, 124.0, 66.0, 50.0, 48.0, 13.0, 17.0, 10.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0], "bins": [-1.2255859375, -1.189208984375, -1.15283203125, -1.116455078125, -1.080078125, -1.043701171875, -1.00732421875, -0.970947265625, -0.9345703125, -0.898193359375, -0.86181640625, -0.825439453125, -0.7890625, -0.752685546875, -0.71630859375, -0.679931640625, -0.6435546875, -0.607177734375, -0.57080078125, -0.534423828125, -0.498046875, -0.461669921875, -0.42529296875, -0.388916015625, -0.3525390625, -0.316162109375, -0.27978515625, -0.243408203125, -0.20703125, -0.170654296875, -0.13427734375, -0.097900390625, -0.0615234375, -0.025146484375, 0.01123046875, 0.047607421875, 0.083984375, 0.120361328125, 0.15673828125, 0.193115234375, 0.2294921875, 0.265869140625, 0.30224609375, 0.338623046875, 0.375, 0.411376953125, 0.44775390625, 0.484130859375, 0.5205078125, 0.556884765625, 0.59326171875, 0.629638671875, 0.666015625, 0.702392578125, 0.73876953125, 0.775146484375, 0.8115234375, 0.847900390625, 0.88427734375, 0.920654296875, 0.95703125, 0.993408203125, 1.02978515625, 1.066162109375, 1.1025390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 6.0, 6.0, 6.0, 13.0, 6.0, 16.0, 14.0, 17.0, 13.0, 24.0, 27.0, 23.0, 25.0, 36.0, 29.0, 46.0, 48.0, 34.0, 39.0, 50.0, 1060.0, 35.0, 33.0, 42.0, 41.0, 30.0, 50.0, 31.0, 27.0, 26.0, 30.0, 24.0, 22.0, 11.0, 11.0, 8.0, 8.0, 14.0, 9.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.45703125, -3.350982666015625, -3.24493408203125, -3.138885498046875, -3.0328369140625, -2.926788330078125, -2.82073974609375, -2.714691162109375, -2.608642578125, -2.502593994140625, -2.39654541015625, -2.290496826171875, -2.1844482421875, -2.078399658203125, -1.97235107421875, -1.866302490234375, -1.76025390625, -1.654205322265625, -1.54815673828125, -1.442108154296875, -1.3360595703125, -1.230010986328125, -1.12396240234375, -1.017913818359375, -0.911865234375, -0.805816650390625, -0.69976806640625, -0.593719482421875, -0.4876708984375, -0.381622314453125, -0.27557373046875, -0.169525146484375, -0.0634765625, 0.042572021484375, 0.14862060546875, 0.254669189453125, 0.3607177734375, 0.466766357421875, 0.57281494140625, 0.678863525390625, 0.784912109375, 0.890960693359375, 0.99700927734375, 1.103057861328125, 1.2091064453125, 1.315155029296875, 1.42120361328125, 1.527252197265625, 1.63330078125, 1.739349365234375, 1.84539794921875, 1.951446533203125, 2.0574951171875, 2.163543701171875, 2.26959228515625, 2.375640869140625, 2.481689453125, 2.587738037109375, 2.69378662109375, 2.799835205078125, 2.9058837890625, 3.011932373046875, 3.11798095703125, 3.224029541015625, 3.330078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 6.0, 6.0, 11.0, 14.0, 24.0, 33.0, 29.0, 54.0, 69.0, 95.0, 157.0, 195.0, 302.0, 416.0, 576.0, 865.0, 1192.0, 1690.0, 2383.0, 3531.0, 5101.0, 7523.0, 11009.0, 16314.0, 24738.0, 38635.0, 62226.0, 106532.0, 222940.0, 1293147.0, 112618.0, 65115.0, 40118.0, 25709.0, 16906.0, 11393.0, 7702.0, 5370.0, 3724.0, 2514.0, 1762.0, 1271.0, 899.0, 642.0, 418.0, 323.0, 246.0, 164.0, 122.0, 92.0, 60.0, 42.0, 41.0, 18.0, 22.0, 15.0, 9.0, 8.0, 1.0, 2.0, 5.0], "bins": [-1.03125, -0.9990692138671875, -0.966888427734375, -0.9347076416015625, -0.90252685546875, -0.8703460693359375, -0.838165283203125, -0.8059844970703125, -0.7738037109375, -0.7416229248046875, -0.709442138671875, -0.6772613525390625, -0.64508056640625, -0.6128997802734375, -0.580718994140625, -0.5485382080078125, -0.516357421875, -0.4841766357421875, -0.451995849609375, -0.4198150634765625, -0.38763427734375, -0.3554534912109375, -0.323272705078125, -0.2910919189453125, -0.2589111328125, -0.2267303466796875, -0.194549560546875, -0.1623687744140625, -0.13018798828125, -0.0980072021484375, -0.065826416015625, -0.0336456298828125, -0.00146484375, 0.0307159423828125, 0.062896728515625, 0.0950775146484375, 0.12725830078125, 0.1594390869140625, 0.191619873046875, 0.2238006591796875, 0.2559814453125, 0.2881622314453125, 0.320343017578125, 0.3525238037109375, 0.38470458984375, 0.4168853759765625, 0.449066162109375, 0.4812469482421875, 0.513427734375, 0.5456085205078125, 0.577789306640625, 0.6099700927734375, 0.64215087890625, 0.6743316650390625, 0.706512451171875, 0.7386932373046875, 0.7708740234375, 0.8030548095703125, 0.835235595703125, 0.8674163818359375, 0.89959716796875, 0.9317779541015625, 0.963958740234375, 0.9961395263671875, 1.0283203125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 3.0, 1.0, 9.0, 14.0, 5.0, 12.0, 8.0, 14.0, 23.0, 28.0, 38.0, 43.0, 55.0, 75.0, 82.0, 82.0, 93.0, 92.0, 70.0, 46.0, 39.0, 36.0, 23.0, 19.0, 21.0, 14.0, 5.0, 10.0, 7.0, 10.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00089263916015625, -0.0008683204650878906, -0.0008440017700195312, -0.0008196830749511719, -0.0007953643798828125, -0.0007710456848144531, -0.0007467269897460938, -0.0007224082946777344, -0.000698089599609375, -0.0006737709045410156, -0.0006494522094726562, -0.0006251335144042969, -0.0006008148193359375, -0.0005764961242675781, -0.0005521774291992188, -0.0005278587341308594, -0.0005035400390625, -0.0004792213439941406, -0.00045490264892578125, -0.0004305839538574219, -0.0004062652587890625, -0.0003819465637207031, -0.00035762786865234375, -0.0003333091735839844, -0.000308990478515625, -0.0002846717834472656, -0.00026035308837890625, -0.00023603439331054688, -0.0002117156982421875, -0.00018739700317382812, -0.00016307830810546875, -0.00013875961303710938, -0.00011444091796875, -9.012222290039062e-05, -6.580352783203125e-05, -4.1484832763671875e-05, -1.71661376953125e-05, 7.152557373046875e-06, 3.147125244140625e-05, 5.5789947509765625e-05, 8.0108642578125e-05, 0.00010442733764648438, 0.00012874603271484375, 0.00015306472778320312, 0.0001773834228515625, 0.00020170211791992188, 0.00022602081298828125, 0.0002503395080566406, 0.000274658203125, 0.0002989768981933594, 0.00032329559326171875, 0.0003476142883300781, 0.0003719329833984375, 0.0003962516784667969, 0.00042057037353515625, 0.0004448890686035156, 0.000469207763671875, 0.0004935264587402344, 0.0005178451538085938, 0.0005421638488769531, 0.0005664825439453125, 0.0005908012390136719, 0.0006151199340820312, 0.0006394386291503906, 0.00066375732421875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 8.0, 7.0, 15.0, 9.0, 21.0, 19.0, 23.0, 44.0, 55.0, 80.0, 140.0, 269.0, 682.0, 186894.0, 858753.0, 754.0, 326.0, 154.0, 86.0, 66.0, 28.0, 24.0, 21.0, 14.0, 15.0, 12.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157470703125, -0.015165090560913086, -0.014583110809326172, -0.014001131057739258, -0.013419151306152344, -0.01283717155456543, -0.012255191802978516, -0.011673212051391602, -0.011091232299804688, -0.010509252548217773, -0.00992727279663086, -0.009345293045043945, -0.008763313293457031, -0.008181333541870117, -0.007599353790283203, -0.007017374038696289, -0.006435394287109375, -0.005853414535522461, -0.005271434783935547, -0.004689455032348633, -0.004107475280761719, -0.0035254955291748047, -0.0029435157775878906, -0.0023615360260009766, -0.0017795562744140625, -0.0011975765228271484, -0.0006155967712402344, -3.361701965332031e-05, 0.0005483627319335938, 0.0011303424835205078, 0.0017123222351074219, 0.002294301986694336, 0.00287628173828125, 0.003458261489868164, 0.004040241241455078, 0.004622220993041992, 0.005204200744628906, 0.00578618049621582, 0.006368160247802734, 0.0069501399993896484, 0.0075321197509765625, 0.008114099502563477, 0.00869607925415039, 0.009278059005737305, 0.009860038757324219, 0.010442018508911133, 0.011023998260498047, 0.011605978012084961, 0.012187957763671875, 0.012769937515258789, 0.013351917266845703, 0.013933897018432617, 0.014515876770019531, 0.015097856521606445, 0.01567983627319336, 0.016261816024780273, 0.016843795776367188, 0.0174257755279541, 0.018007755279541016, 0.01858973503112793, 0.019171714782714844, 0.019753694534301758, 0.020335674285888672, 0.020917654037475586, 0.0214996337890625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 73.0, 302.0, 408.0, 176.0, 41.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00046411185758188367, -0.00043158448534086347, -0.0003990571422036737, -0.000366529799066484, -0.00033400242682546377, -0.00030147505458444357, -0.0002689477114472538, -0.00023642035375814885, -0.00020389299606904387, -0.0001713656383799389, -0.00013883828069083393, -0.00010631092300172895, -7.378356531262398e-05, -4.1256207623519003e-05, -8.728849934414029e-06, 2.3798507754690945e-05, 5.632586544379592e-05, 8.88532231329009e-05, 0.00012138058082200587, 0.00015390793851111084, 0.00018643529620021582, 0.0002189626538893208, 0.00025149001157842577, 0.0002840173547156155, 0.0003165447269566357, 0.0003490720991976559, 0.00038159944233484566, 0.0004141267854720354, 0.0004466541577130556, 0.0004791815299540758, 0.000511708902195096, 0.0005442362162284553, 0.0005767635302618146, 0.0006092909025028348, 0.000641818274743855, 0.0006743455887772143, 0.0007068729610182345, 0.0007394003332592547, 0.000771927647292614, 0.0008044550195336342, 0.0008369823917746544, 0.0008695097640156746, 0.0009020371362566948, 0.0009345644502900541, 0.0009670918225310743, 0.0009996191365644336, 0.0010321465088054538, 0.001064673881046474, 0.0010972012532874942, 0.0011297286255285144, 0.0011622559977695346, 0.0011947833700105548, 0.0012273106258362532, 0.0012598379980772734, 0.0012923653703182936, 0.0013248927425593138, 0.001357420114800334, 0.0013899474870413542, 0.0014224748592823744, 0.0014550022315233946, 0.0014875296037644148, 0.0015200568595901132, 0.0015525842318311334, 0.0015851116040721536, 0.0016176389763131738]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 2.0, 4.0, 4.0, 7.0, 6.0, 8.0, 8.0, 5.0, 16.0, 14.0, 18.0, 14.0, 15.0, 12.0, 21.0, 20.0, 22.0, 29.0, 25.0, 28.0, 28.0, 30.0, 46.0, 27.0, 31.0, 34.0, 31.0, 26.0, 35.0, 40.0, 35.0, 34.0, 28.0, 32.0, 29.0, 27.0, 33.0, 19.0, 25.0, 21.0, 12.0, 17.0, 8.0, 10.0, 9.0, 3.0, 16.0, 3.0, 10.0, 11.0, 4.0, 1.0, 3.0, 4.0, 5.0, 2.0, 1.0], "bins": [-0.00028777122497558594, -0.0002792598679661751, -0.0002707485109567642, -0.00026223715394735336, -0.0002537257969379425, -0.00024521443992853165, -0.0002367030829191208, -0.00022819172590970993, -0.00021968036890029907, -0.00021116901189088821, -0.00020265765488147736, -0.0001941462978720665, -0.00018563494086265564, -0.00017712358385324478, -0.00016861222684383392, -0.00016010086983442307, -0.0001515895128250122, -0.00014307815581560135, -0.0001345667988061905, -0.00012605544179677963, -0.00011754408478736877, -0.00010903272777795792, -0.00010052137076854706, -9.20100137591362e-05, -8.349865674972534e-05, -7.498729974031448e-05, -6.647594273090363e-05, -5.796458572149277e-05, -4.945322871208191e-05, -4.094187170267105e-05, -3.243051469326019e-05, -2.3919157683849335e-05, -1.5407800674438477e-05, -6.896443665027618e-06, 1.6149133443832397e-06, 1.0126270353794098e-05, 1.8637627363204956e-05, 2.7148984372615814e-05, 3.566034138202667e-05, 4.417169839143753e-05, 5.268305540084839e-05, 6.119441241025925e-05, 6.97057694196701e-05, 7.821712642908096e-05, 8.672848343849182e-05, 9.523984044790268e-05, 0.00010375119745731354, 0.0001122625544667244, 0.00012077391147613525, 0.0001292852684855461, 0.00013779662549495697, 0.00014630798250436783, 0.0001548193395137787, 0.00016333069652318954, 0.0001718420535326004, 0.00018035341054201126, 0.00018886476755142212, 0.00019737612456083298, 0.00020588748157024384, 0.0002143988385796547, 0.00022291019558906555, 0.0002314215525984764, 0.00023993290960788727, 0.0002484442666172981, 0.000256955623626709]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 5.0, 6.0, 3.0, 5.0, 5.0, 7.0, 11.0, 8.0, 12.0, 16.0, 20.0, 30.0, 26.0, 36.0, 31.0, 28.0, 32.0, 30.0, 42.0, 43.0, 45.0, 55.0, 38.0, 48.0, 45.0, 42.0, 39.0, 41.0, 35.0, 25.0, 26.0, 25.0, 21.0, 12.0, 20.0, 19.0, 17.0, 16.0, 8.0, 11.0, 7.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.1484375, -5.96844482421875, -5.7884521484375, -5.60845947265625, -5.428466796875, -5.24847412109375, -5.0684814453125, -4.88848876953125, -4.70849609375, -4.52850341796875, -4.3485107421875, -4.16851806640625, -3.988525390625, -3.80853271484375, -3.6285400390625, -3.44854736328125, -3.2685546875, -3.08856201171875, -2.9085693359375, -2.72857666015625, -2.548583984375, -2.36859130859375, -2.1885986328125, -2.00860595703125, -1.82861328125, -1.64862060546875, -1.4686279296875, -1.28863525390625, -1.108642578125, -0.92864990234375, -0.7486572265625, -0.56866455078125, -0.388671875, -0.20867919921875, -0.0286865234375, 0.15130615234375, 0.331298828125, 0.51129150390625, 0.6912841796875, 0.87127685546875, 1.05126953125, 1.23126220703125, 1.4112548828125, 1.59124755859375, 1.771240234375, 1.95123291015625, 2.1312255859375, 2.31121826171875, 2.4912109375, 2.67120361328125, 2.8511962890625, 3.03118896484375, 3.211181640625, 3.39117431640625, 3.5711669921875, 3.75115966796875, 3.93115234375, 4.11114501953125, 4.2911376953125, 4.47113037109375, 4.651123046875, 4.83111572265625, 5.0111083984375, 5.19110107421875, 5.37109375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 5.0, 5.0, 6.0, 4.0, 5.0, 7.0, 10.0, 12.0, 10.0, 23.0, 24.0, 60.0, 74.0, 142.0, 256.0, 558.0, 1210.0, 2726.0, 6101.0, 15316.0, 42416.0, 141511.0, 445900.0, 271774.0, 77509.0, 25760.0, 9545.0, 4022.0, 1829.0, 843.0, 401.0, 185.0, 103.0, 55.0, 35.0, 23.0, 24.0, 20.0, 12.0, 9.0, 9.0, 8.0, 7.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.75390625, -3.6427001953125, -3.531494140625, -3.4202880859375, -3.30908203125, -3.1978759765625, -3.086669921875, -2.9754638671875, -2.8642578125, -2.7530517578125, -2.641845703125, -2.5306396484375, -2.41943359375, -2.3082275390625, -2.197021484375, -2.0858154296875, -1.974609375, -1.8634033203125, -1.752197265625, -1.6409912109375, -1.52978515625, -1.4185791015625, -1.307373046875, -1.1961669921875, -1.0849609375, -0.9737548828125, -0.862548828125, -0.7513427734375, -0.64013671875, -0.5289306640625, -0.417724609375, -0.3065185546875, -0.1953125, -0.0841064453125, 0.027099609375, 0.1383056640625, 0.24951171875, 0.3607177734375, 0.471923828125, 0.5831298828125, 0.6943359375, 0.8055419921875, 0.916748046875, 1.0279541015625, 1.13916015625, 1.2503662109375, 1.361572265625, 1.4727783203125, 1.583984375, 1.6951904296875, 1.806396484375, 1.9176025390625, 2.02880859375, 2.1400146484375, 2.251220703125, 2.3624267578125, 2.4736328125, 2.5848388671875, 2.696044921875, 2.8072509765625, 2.91845703125, 3.0296630859375, 3.140869140625, 3.2520751953125, 3.36328125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 6.0, 15.0, 12.0, 18.0, 19.0, 24.0, 26.0, 38.0, 35.0, 39.0, 48.0, 44.0, 50.0, 75.0, 207.0, 1811.0, 121.0, 69.0, 46.0, 46.0, 32.0, 29.0, 28.0, 31.0, 39.0, 23.0, 15.0, 11.0, 15.0, 14.0, 11.0, 11.0, 6.0, 1.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.03125, -20.337646484375, -19.64404296875, -18.950439453125, -18.2568359375, -17.563232421875, -16.86962890625, -16.176025390625, -15.482421875, -14.788818359375, -14.09521484375, -13.401611328125, -12.7080078125, -12.014404296875, -11.32080078125, -10.627197265625, -9.93359375, -9.239990234375, -8.54638671875, -7.852783203125, -7.1591796875, -6.465576171875, -5.77197265625, -5.078369140625, -4.384765625, -3.691162109375, -2.99755859375, -2.303955078125, -1.6103515625, -0.916748046875, -0.22314453125, 0.470458984375, 1.1640625, 1.857666015625, 2.55126953125, 3.244873046875, 3.9384765625, 4.632080078125, 5.32568359375, 6.019287109375, 6.712890625, 7.406494140625, 8.10009765625, 8.793701171875, 9.4873046875, 10.180908203125, 10.87451171875, 11.568115234375, 12.26171875, 12.955322265625, 13.64892578125, 14.342529296875, 15.0361328125, 15.729736328125, 16.42333984375, 17.116943359375, 17.810546875, 18.504150390625, 19.19775390625, 19.891357421875, 20.5849609375, 21.278564453125, 21.97216796875, 22.665771484375, 23.359375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 6.0, 1.0, 9.0, 13.0, 9.0, 19.0, 13.0, 16.0, 20.0, 40.0, 43.0, 50.0, 56.0, 95.0, 146.0, 250.0, 501.0, 2021.0, 484069.0, 2654213.0, 2673.0, 586.0, 301.0, 149.0, 103.0, 73.0, 60.0, 32.0, 29.0, 20.0, 15.0, 23.0, 15.0, 4.0, 7.0, 8.0, 3.0, 4.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.75, -37.578125, -36.40625, -35.234375, -34.0625, -32.890625, -31.71875, -30.546875, -29.375, -28.203125, -27.03125, -25.859375, -24.6875, -23.515625, -22.34375, -21.171875, -20.0, -18.828125, -17.65625, -16.484375, -15.3125, -14.140625, -12.96875, -11.796875, -10.625, -9.453125, -8.28125, -7.109375, -5.9375, -4.765625, -3.59375, -2.421875, -1.25, -0.078125, 1.09375, 2.265625, 3.4375, 4.609375, 5.78125, 6.953125, 8.125, 9.296875, 10.46875, 11.640625, 12.8125, 13.984375, 15.15625, 16.328125, 17.5, 18.671875, 19.84375, 21.015625, 22.1875, 23.359375, 24.53125, 25.703125, 26.875, 28.046875, 29.21875, 30.390625, 31.5625, 32.734375, 33.90625, 35.078125, 36.25]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 6.0, 25.0, 108.0, 289.0, 332.0, 191.0, 49.0, 12.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.983089447021484, -7.739930629730225, -6.496771812438965, -5.253612995147705, -4.010454177856445, -2.7672953605651855, -1.5241365432739258, -0.2809772491455078, 0.9621810913085938, 2.2053399085998535, 3.4484987258911133, 4.691657543182373, 5.934816360473633, 7.177975177764893, 8.421133995056152, 9.66429328918457, 10.907451629638672, 12.150609970092773, 13.393769264221191, 14.63692855834961, 15.880086898803711, 17.123245239257812, 18.366405487060547, 19.60956382751465, 20.85272216796875, 22.09588050842285, 23.339038848876953, 24.582199096679688, 25.82535743713379, 27.06851577758789, 28.311676025390625, 29.554834365844727, 30.797988891601562, 32.0411491394043, 33.284305572509766, 34.5274658203125, 35.77062225341797, 37.0137825012207, 38.25694274902344, 39.500099182128906, 40.74325942993164, 41.986419677734375, 43.229576110839844, 44.47273635864258, 45.71589660644531, 46.95905303955078, 48.202213287353516, 49.44537353515625, 50.68852996826172, 51.93169021606445, 53.17484664916992, 54.418006896972656, 55.661163330078125, 56.90432357788086, 58.147483825683594, 59.39064025878906, 60.6338005065918, 61.87696075439453, 63.1201171875, 64.36327362060547, 65.60643768310547, 66.84959411621094, 68.0927505493164, 69.3359146118164, 70.57907104492188]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 11.0, 9.0, 12.0, 17.0, 16.0, 20.0, 22.0, 32.0, 26.0, 19.0, 30.0, 25.0, 39.0, 35.0, 31.0, 26.0, 37.0, 42.0, 44.0, 33.0, 33.0, 33.0, 36.0, 33.0, 37.0, 36.0, 35.0, 29.0, 25.0, 23.0, 18.0, 12.0, 16.0, 11.0, 15.0, 11.0, 11.0, 11.0, 6.0, 5.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.10654067993164, -46.3146858215332, -44.5228271484375, -42.73097229003906, -40.939117431640625, -39.14725875854492, -37.355403900146484, -35.56354522705078, -33.771690368652344, -31.979833602905273, -30.187976837158203, -28.396121978759766, -26.604265213012695, -24.812408447265625, -23.020553588867188, -21.228696823120117, -19.436840057373047, -17.644983291625977, -15.853127479553223, -14.061271667480469, -12.269414901733398, -10.477558135986328, -8.685702323913574, -6.89384651184082, -5.10198974609375, -3.310133457183838, -1.5182771682739258, 0.27357912063598633, 2.0654354095458984, 3.8572921752929688, 5.649147987365723, 7.441003799438477, 9.232864379882812, 11.024721145629883, 12.816576957702637, 14.60843276977539, 16.40028953552246, 18.19214630126953, 19.98400115966797, 21.77585792541504, 23.56771469116211, 25.35957145690918, 27.15142822265625, 28.943283081054688, 30.735139846801758, 32.52699661254883, 34.318851470947266, 36.11071014404297, 37.902565002441406, 39.694419860839844, 41.48627853393555, 43.278133392333984, 45.06999206542969, 46.861846923828125, 48.65370178222656, 50.445556640625, 52.2374153137207, 54.02927017211914, 55.821128845214844, 57.61298370361328, 59.40483856201172, 61.19669723510742, 62.98855209350586, 64.78041076660156, 66.572265625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 7.0, 4.0, 3.0, 9.0, 7.0, 4.0, 11.0, 9.0, 13.0, 20.0, 15.0, 34.0, 31.0, 38.0, 35.0, 27.0, 27.0, 26.0, 47.0, 46.0, 48.0, 43.0, 49.0, 38.0, 45.0, 47.0, 33.0, 36.0, 31.0, 31.0, 29.0, 22.0, 16.0, 16.0, 14.0, 20.0, 21.0, 11.0, 9.0, 9.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.27734375, -6.09698486328125, -5.9166259765625, -5.73626708984375, -5.555908203125, -5.37554931640625, -5.1951904296875, -5.01483154296875, -4.83447265625, -4.65411376953125, -4.4737548828125, -4.29339599609375, -4.113037109375, -3.93267822265625, -3.7523193359375, -3.57196044921875, -3.3916015625, -3.21124267578125, -3.0308837890625, -2.85052490234375, -2.670166015625, -2.48980712890625, -2.3094482421875, -2.12908935546875, -1.94873046875, -1.76837158203125, -1.5880126953125, -1.40765380859375, -1.227294921875, -1.04693603515625, -0.8665771484375, -0.68621826171875, -0.505859375, -0.32550048828125, -0.1451416015625, 0.03521728515625, 0.215576171875, 0.39593505859375, 0.5762939453125, 0.75665283203125, 0.93701171875, 1.11737060546875, 1.2977294921875, 1.47808837890625, 1.658447265625, 1.83880615234375, 2.0191650390625, 2.19952392578125, 2.3798828125, 2.56024169921875, 2.7406005859375, 2.92095947265625, 3.101318359375, 3.28167724609375, 3.4620361328125, 3.64239501953125, 3.82275390625, 4.00311279296875, 4.1834716796875, 4.36383056640625, 4.544189453125, 4.72454833984375, 4.9049072265625, 5.08526611328125, 5.265625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 9.0, 5.0, 8.0, 11.0, 17.0, 16.0, 24.0, 29.0, 39.0, 43.0, 63.0, 64.0, 125.0, 208.0, 643.0, 3068.0, 29792.0, 800652.0, 3068522.0, 274532.0, 13551.0, 1758.0, 461.0, 193.0, 109.0, 78.0, 51.0, 28.0, 18.0, 32.0, 21.0, 21.0, 10.0, 16.0, 11.0, 7.0, 4.0, 11.0, 6.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-19.125, -18.5838623046875, -18.042724609375, -17.5015869140625, -16.96044921875, -16.4193115234375, -15.878173828125, -15.3370361328125, -14.7958984375, -14.2547607421875, -13.713623046875, -13.1724853515625, -12.63134765625, -12.0902099609375, -11.549072265625, -11.0079345703125, -10.466796875, -9.9256591796875, -9.384521484375, -8.8433837890625, -8.30224609375, -7.7611083984375, -7.219970703125, -6.6788330078125, -6.1376953125, -5.5965576171875, -5.055419921875, -4.5142822265625, -3.97314453125, -3.4320068359375, -2.890869140625, -2.3497314453125, -1.80859375, -1.2674560546875, -0.726318359375, -0.1851806640625, 0.35595703125, 0.8970947265625, 1.438232421875, 1.9793701171875, 2.5205078125, 3.0616455078125, 3.602783203125, 4.1439208984375, 4.68505859375, 5.2261962890625, 5.767333984375, 6.3084716796875, 6.849609375, 7.3907470703125, 7.931884765625, 8.4730224609375, 9.01416015625, 9.5552978515625, 10.096435546875, 10.6375732421875, 11.1787109375, 11.7198486328125, 12.260986328125, 12.8021240234375, 13.34326171875, 13.8843994140625, 14.425537109375, 14.9666748046875, 15.5078125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 12.0, 11.0, 22.0, 21.0, 25.0, 37.0, 51.0, 61.0, 66.0, 77.0, 124.0, 156.0, 189.0, 254.0, 317.0, 380.0, 363.0, 370.0, 285.0, 273.0, 189.0, 179.0, 135.0, 105.0, 85.0, 54.0, 50.0, 37.0, 42.0, 19.0, 16.0, 14.0, 13.0, 8.0, 5.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 3.0], "bins": [-14.4375, -14.0628662109375, -13.688232421875, -13.3135986328125, -12.93896484375, -12.5643310546875, -12.189697265625, -11.8150634765625, -11.4404296875, -11.0657958984375, -10.691162109375, -10.3165283203125, -9.94189453125, -9.5672607421875, -9.192626953125, -8.8179931640625, -8.443359375, -8.0687255859375, -7.694091796875, -7.3194580078125, -6.94482421875, -6.5701904296875, -6.195556640625, -5.8209228515625, -5.4462890625, -5.0716552734375, -4.697021484375, -4.3223876953125, -3.94775390625, -3.5731201171875, -3.198486328125, -2.8238525390625, -2.44921875, -2.0745849609375, -1.699951171875, -1.3253173828125, -0.95068359375, -0.5760498046875, -0.201416015625, 0.1732177734375, 0.5478515625, 0.9224853515625, 1.297119140625, 1.6717529296875, 2.04638671875, 2.4210205078125, 2.795654296875, 3.1702880859375, 3.544921875, 3.9195556640625, 4.294189453125, 4.6688232421875, 5.04345703125, 5.4180908203125, 5.792724609375, 6.1673583984375, 6.5419921875, 6.9166259765625, 7.291259765625, 7.6658935546875, 8.04052734375, 8.4151611328125, 8.789794921875, 9.1644287109375, 9.5390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 10.0, 16.0, 15.0, 26.0, 23.0, 47.0, 61.0, 102.0, 114.0, 164.0, 260.0, 408.0, 1287.0, 54387.0, 4078573.0, 56241.0, 1308.0, 408.0, 227.0, 184.0, 116.0, 82.0, 57.0, 46.0, 28.0, 21.0, 16.0, 12.0, 8.0, 7.0, 8.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.375, -49.4365234375, -47.498046875, -45.5595703125, -43.62109375, -41.6826171875, -39.744140625, -37.8056640625, -35.8671875, -33.9287109375, -31.990234375, -30.0517578125, -28.11328125, -26.1748046875, -24.236328125, -22.2978515625, -20.359375, -18.4208984375, -16.482421875, -14.5439453125, -12.60546875, -10.6669921875, -8.728515625, -6.7900390625, -4.8515625, -2.9130859375, -0.974609375, 0.9638671875, 2.90234375, 4.8408203125, 6.779296875, 8.7177734375, 10.65625, 12.5947265625, 14.533203125, 16.4716796875, 18.41015625, 20.3486328125, 22.287109375, 24.2255859375, 26.1640625, 28.1025390625, 30.041015625, 31.9794921875, 33.91796875, 35.8564453125, 37.794921875, 39.7333984375, 41.671875, 43.6103515625, 45.548828125, 47.4873046875, 49.42578125, 51.3642578125, 53.302734375, 55.2412109375, 57.1796875, 59.1181640625, 61.056640625, 62.9951171875, 64.93359375, 66.8720703125, 68.810546875, 70.7490234375, 72.6875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 34.0, 175.0, 370.0, 306.0, 104.0, 19.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.06234741210938, -97.26841735839844, -91.4744873046875, -85.68055725097656, -79.88663482666016, -74.09270477294922, -68.29877471923828, -62.50484848022461, -56.71091842651367, -50.916988372802734, -45.12306213378906, -39.329132080078125, -33.53520202636719, -27.741275787353516, -21.947345733642578, -16.153419494628906, -10.359489440917969, -4.565560817718506, 1.228367805480957, 7.022296905517578, 12.816225051879883, 18.610153198242188, 24.404083251953125, 30.198009490966797, 35.991939544677734, 41.78586959838867, 47.579795837402344, 53.37372589111328, 59.16765594482422, 64.96157836914062, 70.75550842285156, 76.5494384765625, 82.34336853027344, 88.13729858398438, 93.93122863769531, 99.72515869140625, 105.51908111572266, 111.3130111694336, 117.10694122314453, 122.90086364746094, 128.69479370117188, 134.4887237548828, 140.28265380859375, 146.0765838623047, 151.87051391601562, 157.6644287109375, 163.4583740234375, 169.25228881835938, 175.04623413085938, 180.8401641845703, 186.63409423828125, 192.4280242919922, 198.22195434570312, 204.015869140625, 209.809814453125, 215.60372924804688, 221.3976593017578, 227.19158935546875, 232.9855194091797, 238.77944946289062, 244.57337951660156, 250.3673095703125, 256.1612243652344, 261.9551696777344, 267.74908447265625]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 4.0, 6.0, 6.0, 4.0, 7.0, 16.0, 8.0, 15.0, 22.0, 17.0, 21.0, 16.0, 23.0, 26.0, 33.0, 43.0, 32.0, 33.0, 45.0, 27.0, 39.0, 51.0, 39.0, 44.0, 41.0, 32.0, 37.0, 45.0, 27.0, 49.0, 27.0, 22.0, 24.0, 23.0, 19.0, 13.0, 6.0, 12.0, 8.0, 14.0, 3.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.953277587890625, -43.4921760559082, -42.031070709228516, -40.569969177246094, -39.108863830566406, -37.647762298583984, -36.18666076660156, -34.725555419921875, -33.26445388793945, -31.8033504486084, -30.342247009277344, -28.881145477294922, -27.420042037963867, -25.958938598632812, -24.497835159301758, -23.036731719970703, -21.57562828063965, -20.114524841308594, -18.65342140197754, -17.192317962646484, -15.731216430664062, -14.270112991333008, -12.809009552001953, -11.347907066345215, -9.88680362701416, -8.425700187683105, -6.964597702026367, -5.5034942626953125, -4.042391300201416, -2.5812883377075195, -1.1201848983764648, 0.34091758728027344, 1.8020210266113281, 3.2631239891052246, 4.724226951599121, 6.185330390930176, 7.646433353424072, 9.107536315917969, 10.568639755249023, 12.029742240905762, 13.490845680236816, 14.951949119567871, 16.41305160522461, 17.874155044555664, 19.33525848388672, 20.79636001586914, 22.257465362548828, 23.71856689453125, 25.179670333862305, 26.64077377319336, 28.101877212524414, 29.56298065185547, 31.02408218383789, 32.48518371582031, 33.9462890625, 35.40739059448242, 36.86849594116211, 38.32959747314453, 39.79070281982422, 41.25180435180664, 42.71290969848633, 44.17401123046875, 45.63511657714844, 47.09621810913086, 48.55731964111328]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 2.0, 6.0, 7.0, 9.0, 12.0, 11.0, 23.0, 16.0, 25.0, 24.0, 35.0, 27.0, 30.0, 35.0, 39.0, 28.0, 48.0, 38.0, 49.0, 53.0, 37.0, 42.0, 54.0, 50.0, 24.0, 28.0, 34.0, 32.0, 25.0, 17.0, 20.0, 17.0, 14.0, 18.0, 14.0, 11.0, 12.0, 9.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.578125, -6.39215087890625, -6.2061767578125, -6.02020263671875, -5.834228515625, -5.64825439453125, -5.4622802734375, -5.27630615234375, -5.09033203125, -4.90435791015625, -4.7183837890625, -4.53240966796875, -4.346435546875, -4.16046142578125, -3.9744873046875, -3.78851318359375, -3.6025390625, -3.41656494140625, -3.2305908203125, -3.04461669921875, -2.858642578125, -2.67266845703125, -2.4866943359375, -2.30072021484375, -2.11474609375, -1.92877197265625, -1.7427978515625, -1.55682373046875, -1.370849609375, -1.18487548828125, -0.9989013671875, -0.81292724609375, -0.626953125, -0.44097900390625, -0.2550048828125, -0.06903076171875, 0.116943359375, 0.30291748046875, 0.4888916015625, 0.67486572265625, 0.86083984375, 1.04681396484375, 1.2327880859375, 1.41876220703125, 1.604736328125, 1.79071044921875, 1.9766845703125, 2.16265869140625, 2.3486328125, 2.53460693359375, 2.7205810546875, 2.90655517578125, 3.092529296875, 3.27850341796875, 3.4644775390625, 3.65045166015625, 3.83642578125, 4.02239990234375, 4.2083740234375, 4.39434814453125, 4.580322265625, 4.76629638671875, 4.9522705078125, 5.13824462890625, 5.32421875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 7.0, 4.0, 11.0, 11.0, 27.0, 28.0, 43.0, 77.0, 86.0, 160.0, 222.0, 381.0, 562.0, 904.0, 1370.0, 2121.0, 3431.0, 5802.0, 9402.0, 15647.0, 25928.0, 44225.0, 79007.0, 175743.0, 366571.0, 147009.0, 70125.0, 39431.0, 23340.0, 14120.0, 8656.0, 5249.0, 3417.0, 1978.0, 1259.0, 812.0, 458.0, 325.0, 212.0, 127.0, 87.0, 65.0, 52.0, 17.0, 21.0, 7.0, 11.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.701171875, -1.6531219482421875, -1.605072021484375, -1.5570220947265625, -1.50897216796875, -1.4609222412109375, -1.412872314453125, -1.3648223876953125, -1.3167724609375, -1.2687225341796875, -1.220672607421875, -1.1726226806640625, -1.12457275390625, -1.0765228271484375, -1.028472900390625, -0.9804229736328125, -0.932373046875, -0.8843231201171875, -0.836273193359375, -0.7882232666015625, -0.74017333984375, -0.6921234130859375, -0.644073486328125, -0.5960235595703125, -0.5479736328125, -0.4999237060546875, -0.451873779296875, -0.4038238525390625, -0.35577392578125, -0.3077239990234375, -0.259674072265625, -0.2116241455078125, -0.16357421875, -0.1155242919921875, -0.067474365234375, -0.0194244384765625, 0.02862548828125, 0.0766754150390625, 0.124725341796875, 0.1727752685546875, 0.2208251953125, 0.2688751220703125, 0.316925048828125, 0.3649749755859375, 0.41302490234375, 0.4610748291015625, 0.509124755859375, 0.5571746826171875, 0.605224609375, 0.6532745361328125, 0.701324462890625, 0.7493743896484375, 0.79742431640625, 0.8454742431640625, 0.893524169921875, 0.9415740966796875, 0.9896240234375, 1.0376739501953125, 1.085723876953125, 1.1337738037109375, 1.18182373046875, 1.2298736572265625, 1.277923583984375, 1.3259735107421875, 1.3740234375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 6.0, 6.0, 7.0, 4.0, 9.0, 12.0, 15.0, 18.0, 19.0, 16.0, 19.0, 17.0, 28.0, 29.0, 38.0, 36.0, 28.0, 30.0, 36.0, 33.0, 42.0, 36.0, 1060.0, 49.0, 40.0, 30.0, 38.0, 38.0, 33.0, 28.0, 27.0, 17.0, 23.0, 23.0, 13.0, 14.0, 20.0, 16.0, 13.0, 14.0, 7.0, 5.0, 12.0, 3.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.40234375, -3.296875, -3.19140625, -3.0859375, -2.98046875, -2.875, -2.76953125, -2.6640625, -2.55859375, -2.453125, -2.34765625, -2.2421875, -2.13671875, -2.03125, -1.92578125, -1.8203125, -1.71484375, -1.609375, -1.50390625, -1.3984375, -1.29296875, -1.1875, -1.08203125, -0.9765625, -0.87109375, -0.765625, -0.66015625, -0.5546875, -0.44921875, -0.34375, -0.23828125, -0.1328125, -0.02734375, 0.078125, 0.18359375, 0.2890625, 0.39453125, 0.5, 0.60546875, 0.7109375, 0.81640625, 0.921875, 1.02734375, 1.1328125, 1.23828125, 1.34375, 1.44921875, 1.5546875, 1.66015625, 1.765625, 1.87109375, 1.9765625, 2.08203125, 2.1875, 2.29296875, 2.3984375, 2.50390625, 2.609375, 2.71484375, 2.8203125, 2.92578125, 3.03125, 3.13671875, 3.2421875, 3.34765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 10.0, 9.0, 17.0, 22.0, 31.0, 50.0, 59.0, 91.0, 136.0, 181.0, 260.0, 397.0, 525.0, 762.0, 1130.0, 1606.0, 2293.0, 3175.0, 4716.0, 6651.0, 9657.0, 13841.0, 19729.0, 28973.0, 43949.0, 67750.0, 113097.0, 1301814.0, 195528.0, 96369.0, 60129.0, 38669.0, 26019.0, 18257.0, 12554.0, 8715.0, 6046.0, 4267.0, 2904.0, 2079.0, 1397.0, 992.0, 659.0, 469.0, 351.0, 237.0, 168.0, 125.0, 86.0, 63.0, 35.0, 35.0, 15.0, 17.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0], "bins": [-1.0068359375, -0.9752349853515625, -0.943634033203125, -0.9120330810546875, -0.88043212890625, -0.8488311767578125, -0.817230224609375, -0.7856292724609375, -0.7540283203125, -0.7224273681640625, -0.690826416015625, -0.6592254638671875, -0.62762451171875, -0.5960235595703125, -0.564422607421875, -0.5328216552734375, -0.501220703125, -0.4696197509765625, -0.438018798828125, -0.4064178466796875, -0.37481689453125, -0.3432159423828125, -0.311614990234375, -0.2800140380859375, -0.2484130859375, -0.2168121337890625, -0.185211181640625, -0.1536102294921875, -0.12200927734375, -0.0904083251953125, -0.058807373046875, -0.0272064208984375, 0.00439453125, 0.0359954833984375, 0.067596435546875, 0.0991973876953125, 0.13079833984375, 0.1623992919921875, 0.194000244140625, 0.2256011962890625, 0.2572021484375, 0.2888031005859375, 0.320404052734375, 0.3520050048828125, 0.38360595703125, 0.4152069091796875, 0.446807861328125, 0.4784088134765625, 0.510009765625, 0.5416107177734375, 0.573211669921875, 0.6048126220703125, 0.63641357421875, 0.6680145263671875, 0.699615478515625, 0.7312164306640625, 0.7628173828125, 0.7944183349609375, 0.826019287109375, 0.8576202392578125, 0.88922119140625, 0.9208221435546875, 0.952423095703125, 0.9840240478515625, 1.015625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 10.0, 6.0, 10.0, 6.0, 18.0, 18.0, 12.0, 18.0, 26.0, 34.0, 35.0, 56.0, 78.0, 112.0, 124.0, 124.0, 84.0, 46.0, 35.0, 22.0, 34.0, 22.0, 13.0, 3.0, 14.0, 5.0, 6.0, 5.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0011682510375976562, -0.0011320710182189941, -0.001095890998840332, -0.00105971097946167, -0.0010235309600830078, -0.0009873509407043457, -0.0009511709213256836, -0.0009149909019470215, -0.0008788108825683594, -0.0008426308631896973, -0.0008064508438110352, -0.000770270824432373, -0.0007340908050537109, -0.0006979107856750488, -0.0006617307662963867, -0.0006255507469177246, -0.0005893707275390625, -0.0005531907081604004, -0.0005170106887817383, -0.00048083066940307617, -0.00044465065002441406, -0.00040847063064575195, -0.00037229061126708984, -0.00033611059188842773, -0.0002999305725097656, -0.0002637505531311035, -0.0002275705337524414, -0.0001913905143737793, -0.0001552104949951172, -0.00011903047561645508, -8.285045623779297e-05, -4.667043685913086e-05, -1.049041748046875e-05, 2.568960189819336e-05, 6.186962127685547e-05, 9.804964065551758e-05, 0.0001342296600341797, 0.0001704096794128418, 0.0002065896987915039, 0.00024276971817016602, 0.0002789497375488281, 0.00031512975692749023, 0.00035130977630615234, 0.00038748979568481445, 0.00042366981506347656, 0.00045984983444213867, 0.0004960298538208008, 0.0005322098731994629, 0.000568389892578125, 0.0006045699119567871, 0.0006407499313354492, 0.0006769299507141113, 0.0007131099700927734, 0.0007492899894714355, 0.0007854700088500977, 0.0008216500282287598, 0.0008578300476074219, 0.000894010066986084, 0.0009301900863647461, 0.0009663701057434082, 0.0010025501251220703, 0.0010387301445007324, 0.0010749101638793945, 0.0011110901832580566, 0.0011472702026367188]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 3.0, 7.0, 4.0, 3.0, 9.0, 12.0, 10.0, 8.0, 20.0, 23.0, 31.0, 48.0, 61.0, 114.0, 245.0, 691.0, 219420.0, 826424.0, 764.0, 258.0, 129.0, 65.0, 40.0, 33.0, 28.0, 20.0, 8.0, 23.0, 16.0, 7.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.027587890625, -0.02677750587463379, -0.025967121124267578, -0.025156736373901367, -0.024346351623535156, -0.023535966873168945, -0.022725582122802734, -0.021915197372436523, -0.021104812622070312, -0.0202944278717041, -0.01948404312133789, -0.01867365837097168, -0.01786327362060547, -0.017052888870239258, -0.016242504119873047, -0.015432119369506836, -0.014621734619140625, -0.013811349868774414, -0.013000965118408203, -0.012190580368041992, -0.011380195617675781, -0.01056981086730957, -0.00975942611694336, -0.008949041366577148, -0.008138656616210938, -0.0073282718658447266, -0.006517887115478516, -0.005707502365112305, -0.004897117614746094, -0.004086732864379883, -0.003276348114013672, -0.002465963363647461, -0.00165557861328125, -0.0008451938629150391, -3.4809112548828125e-05, 0.0007755756378173828, 0.0015859603881835938, 0.0023963451385498047, 0.0032067298889160156, 0.0040171146392822266, 0.0048274993896484375, 0.0056378841400146484, 0.006448268890380859, 0.00725865364074707, 0.008069038391113281, 0.008879423141479492, 0.009689807891845703, 0.010500192642211914, 0.011310577392578125, 0.012120962142944336, 0.012931346893310547, 0.013741731643676758, 0.014552116394042969, 0.01536250114440918, 0.01617288589477539, 0.0169832706451416, 0.017793655395507812, 0.018604040145874023, 0.019414424896240234, 0.020224809646606445, 0.021035194396972656, 0.021845579147338867, 0.022655963897705078, 0.02346634864807129, 0.0242767333984375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 54.0, 400.0, 488.0, 67.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038122409023344517, -0.00031835102709010243, -0.00025547799305059016, -0.00019260494445916265, -0.00012973189586773515, -6.685883272439241e-05, -3.9857986848801374e-06, 5.888723535463214e-05, 0.00012176029849797487, 0.00018463334708940238, 0.0002475063956808299, 0.00031037942972034216, 0.0003732524928636849, 0.0004361255560070276, 0.0004989985609427094, 0.0005618716240860522, 0.0006247446872293949, 0.0006876177503727376, 0.0007504908135160804, 0.0008133638184517622, 0.0008762368815951049, 0.0009391099447384477, 0.0010019829496741295, 0.0010648560710251331, 0.001127729075960815, 0.0011906020808964968, 0.0012534752022475004, 0.0013163482071831822, 0.001379221212118864, 0.0014420943334698677, 0.0015049673384055495, 0.0015678403433412313, 0.001630713464692235, 0.0016935864696279168, 0.0017564595909789205, 0.0018193325959146023, 0.001882205717265606, 0.0019450787222012877, 0.0020079517271369696, 0.002070824848487973, 0.002133697737008333, 0.002196570858359337, 0.002259443746879697, 0.0023223168682307005, 0.002385189989581704, 0.002448062878102064, 0.0025109359994530678, 0.0025738091208040714, 0.002636682242155075, 0.0026995553635060787, 0.0027624282520264387, 0.0028253013733774424, 0.002888174494728446, 0.002951047383248806, 0.0030139205045998096, 0.0030767936259508133, 0.003139666747301817, 0.0032025398686528206, 0.0032654127571731806, 0.0033282858785241842, 0.003391158999875188, 0.003454031888395548, 0.0035169050097465515, 0.003579778131097555, 0.003642651019617915]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 10.0, 6.0, 7.0, 6.0, 13.0, 8.0, 12.0, 19.0, 27.0, 26.0, 24.0, 27.0, 40.0, 35.0, 37.0, 48.0, 45.0, 33.0, 57.0, 43.0, 52.0, 30.0, 37.0, 42.0, 37.0, 45.0, 38.0, 29.0, 23.0, 36.0, 13.0, 18.0, 12.0, 10.0, 7.0, 17.0, 11.0, 8.0, 5.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00046062469482421875, -0.00044448673725128174, -0.0004283487796783447, -0.0004122108221054077, -0.0003960728645324707, -0.0003799349069595337, -0.0003637969493865967, -0.00034765899181365967, -0.00033152103424072266, -0.00031538307666778564, -0.00029924511909484863, -0.0002831071615219116, -0.0002669692039489746, -0.0002508312463760376, -0.00023469328880310059, -0.00021855533123016357, -0.00020241737365722656, -0.00018627941608428955, -0.00017014145851135254, -0.00015400350093841553, -0.00013786554336547852, -0.0001217275857925415, -0.00010558962821960449, -8.945167064666748e-05, -7.331371307373047e-05, -5.717575550079346e-05, -4.1037797927856445e-05, -2.4899840354919434e-05, -8.761882781982422e-06, 7.37607479095459e-06, 2.35140323638916e-05, 3.965198993682861e-05, 5.5789947509765625e-05, 7.192790508270264e-05, 8.806586265563965e-05, 0.00010420382022857666, 0.00012034177780151367, 0.00013647973537445068, 0.0001526176929473877, 0.0001687556505203247, 0.00018489360809326172, 0.00020103156566619873, 0.00021716952323913574, 0.00023330748081207275, 0.00024944543838500977, 0.0002655833959579468, 0.0002817213535308838, 0.0002978593111038208, 0.0003139972686767578, 0.0003301352262496948, 0.00034627318382263184, 0.00036241114139556885, 0.00037854909896850586, 0.00039468705654144287, 0.0004108250141143799, 0.0004269629716873169, 0.0004431009292602539, 0.0004592388868331909, 0.00047537684440612793, 0.0004915148019790649, 0.000507652759552002, 0.000523790717124939, 0.000539928674697876, 0.000556066632270813, 0.00057220458984375]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 2.0, 6.0, 7.0, 9.0, 12.0, 11.0, 23.0, 16.0, 25.0, 24.0, 35.0, 27.0, 30.0, 35.0, 39.0, 28.0, 48.0, 38.0, 49.0, 53.0, 37.0, 42.0, 54.0, 50.0, 24.0, 29.0, 33.0, 32.0, 25.0, 17.0, 20.0, 17.0, 14.0, 18.0, 14.0, 11.0, 12.0, 9.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.578125, -6.39215087890625, -6.2061767578125, -6.02020263671875, -5.834228515625, -5.64825439453125, -5.4622802734375, -5.27630615234375, -5.09033203125, -4.90435791015625, -4.7183837890625, -4.53240966796875, -4.346435546875, -4.16046142578125, -3.9744873046875, -3.78851318359375, -3.6025390625, -3.41656494140625, -3.2305908203125, -3.04461669921875, -2.858642578125, -2.67266845703125, -2.4866943359375, -2.30072021484375, -2.11474609375, -1.92877197265625, -1.7427978515625, -1.55682373046875, -1.370849609375, -1.18487548828125, -0.9989013671875, -0.81292724609375, -0.626953125, -0.44097900390625, -0.2550048828125, -0.06903076171875, 0.116943359375, 0.30291748046875, 0.4888916015625, 0.67486572265625, 0.86083984375, 1.04681396484375, 1.2327880859375, 1.41876220703125, 1.604736328125, 1.79071044921875, 1.9766845703125, 2.16265869140625, 2.3486328125, 2.53460693359375, 2.7205810546875, 2.90655517578125, 3.092529296875, 3.27850341796875, 3.4644775390625, 3.65045166015625, 3.83642578125, 4.02239990234375, 4.2083740234375, 4.39434814453125, 4.580322265625, 4.76629638671875, 4.9522705078125, 5.13824462890625, 5.32421875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 7.0, 7.0, 6.0, 16.0, 28.0, 39.0, 49.0, 79.0, 107.0, 188.0, 286.0, 376.0, 614.0, 968.0, 1524.0, 2404.0, 3872.0, 6454.0, 11737.0, 24423.0, 64625.0, 236488.0, 480732.0, 130540.0, 42211.0, 17970.0, 9000.0, 5124.0, 3193.0, 1942.0, 1236.0, 768.0, 560.0, 322.0, 206.0, 159.0, 96.0, 63.0, 40.0, 25.0, 26.0, 17.0, 17.0, 1.0, 5.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0], "bins": [-4.8671875, -4.729278564453125, -4.59136962890625, -4.453460693359375, -4.3155517578125, -4.177642822265625, -4.03973388671875, -3.901824951171875, -3.763916015625, -3.626007080078125, -3.48809814453125, -3.350189208984375, -3.2122802734375, -3.074371337890625, -2.93646240234375, -2.798553466796875, -2.66064453125, -2.522735595703125, -2.38482666015625, -2.246917724609375, -2.1090087890625, -1.971099853515625, -1.83319091796875, -1.695281982421875, -1.557373046875, -1.419464111328125, -1.28155517578125, -1.143646240234375, -1.0057373046875, -0.867828369140625, -0.72991943359375, -0.592010498046875, -0.4541015625, -0.316192626953125, -0.17828369140625, -0.040374755859375, 0.0975341796875, 0.235443115234375, 0.37335205078125, 0.511260986328125, 0.649169921875, 0.787078857421875, 0.92498779296875, 1.062896728515625, 1.2008056640625, 1.338714599609375, 1.47662353515625, 1.614532470703125, 1.75244140625, 1.890350341796875, 2.02825927734375, 2.166168212890625, 2.3040771484375, 2.441986083984375, 2.57989501953125, 2.717803955078125, 2.855712890625, 2.993621826171875, 3.13153076171875, 3.269439697265625, 3.4073486328125, 3.545257568359375, 3.68316650390625, 3.821075439453125, 3.958984375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 7.0, 4.0, 5.0, 8.0, 11.0, 7.0, 13.0, 6.0, 16.0, 18.0, 13.0, 23.0, 32.0, 21.0, 37.0, 42.0, 32.0, 38.0, 61.0, 70.0, 118.0, 1643.0, 306.0, 100.0, 48.0, 41.0, 50.0, 36.0, 34.0, 27.0, 39.0, 25.0, 29.0, 19.0, 14.0, 9.0, 10.0, 6.0, 10.0, 6.0, 6.0, 5.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.15625, -21.52001953125, -20.8837890625, -20.24755859375, -19.611328125, -18.97509765625, -18.3388671875, -17.70263671875, -17.06640625, -16.43017578125, -15.7939453125, -15.15771484375, -14.521484375, -13.88525390625, -13.2490234375, -12.61279296875, -11.9765625, -11.34033203125, -10.7041015625, -10.06787109375, -9.431640625, -8.79541015625, -8.1591796875, -7.52294921875, -6.88671875, -6.25048828125, -5.6142578125, -4.97802734375, -4.341796875, -3.70556640625, -3.0693359375, -2.43310546875, -1.796875, -1.16064453125, -0.5244140625, 0.11181640625, 0.748046875, 1.38427734375, 2.0205078125, 2.65673828125, 3.29296875, 3.92919921875, 4.5654296875, 5.20166015625, 5.837890625, 6.47412109375, 7.1103515625, 7.74658203125, 8.3828125, 9.01904296875, 9.6552734375, 10.29150390625, 10.927734375, 11.56396484375, 12.2001953125, 12.83642578125, 13.47265625, 14.10888671875, 14.7451171875, 15.38134765625, 16.017578125, 16.65380859375, 17.2900390625, 17.92626953125, 18.5625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 9.0, 1.0, 5.0, 16.0, 10.0, 16.0, 17.0, 23.0, 38.0, 52.0, 70.0, 92.0, 108.0, 220.0, 429.0, 932.0, 10618.0, 3084413.0, 45778.0, 1569.0, 462.0, 253.0, 156.0, 94.0, 89.0, 59.0, 39.0, 27.0, 27.0, 17.0, 13.0, 12.0, 9.0, 12.0, 11.0, 3.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-48.625, -47.26123046875, -45.8974609375, -44.53369140625, -43.169921875, -41.80615234375, -40.4423828125, -39.07861328125, -37.71484375, -36.35107421875, -34.9873046875, -33.62353515625, -32.259765625, -30.89599609375, -29.5322265625, -28.16845703125, -26.8046875, -25.44091796875, -24.0771484375, -22.71337890625, -21.349609375, -19.98583984375, -18.6220703125, -17.25830078125, -15.89453125, -14.53076171875, -13.1669921875, -11.80322265625, -10.439453125, -9.07568359375, -7.7119140625, -6.34814453125, -4.984375, -3.62060546875, -2.2568359375, -0.89306640625, 0.470703125, 1.83447265625, 3.1982421875, 4.56201171875, 5.92578125, 7.28955078125, 8.6533203125, 10.01708984375, 11.380859375, 12.74462890625, 14.1083984375, 15.47216796875, 16.8359375, 18.19970703125, 19.5634765625, 20.92724609375, 22.291015625, 23.65478515625, 25.0185546875, 26.38232421875, 27.74609375, 29.10986328125, 30.4736328125, 31.83740234375, 33.201171875, 34.56494140625, 35.9287109375, 37.29248046875, 38.65625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 27.0, 64.0, 114.0, 205.0, 232.0, 193.0, 92.0, 46.0, 17.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.94467544555664, -47.91040802001953, -46.87614059448242, -45.84187316894531, -44.80760955810547, -43.77334213256836, -42.73907470703125, -41.70480728149414, -40.67053985595703, -39.63627243041992, -38.60200500488281, -37.5677375793457, -36.533470153808594, -35.49920654296875, -34.46493911743164, -33.43067169189453, -32.39640426635742, -31.362136840820312, -30.327869415283203, -29.293603897094727, -28.259336471557617, -27.225069046020508, -26.19080352783203, -25.156536102294922, -24.122268676757812, -23.088001251220703, -22.053733825683594, -21.019468307495117, -19.985200881958008, -18.9509334564209, -17.916667938232422, -16.882400512695312, -15.848133087158203, -14.813865661621094, -13.7795991897583, -12.745332717895508, -11.711065292358398, -10.676797866821289, -9.642531394958496, -8.608264923095703, -7.573997497558594, -6.539730548858643, -5.505463600158691, -4.47119665145874, -3.436929702758789, -2.402662754058838, -1.3683958053588867, -0.33412885665893555, 0.7001380920410156, 1.7344050407409668, 2.768671989440918, 3.802938938140869, 4.83720588684082, 5.8714728355407715, 6.905739784240723, 7.940006732940674, 8.974273681640625, 10.008541107177734, 11.042807579040527, 12.07707405090332, 13.11134147644043, 14.145608901977539, 15.179875373840332, 16.214141845703125, 17.248409271240234]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 8.0, 10.0, 10.0, 9.0, 11.0, 9.0, 13.0, 25.0, 16.0, 19.0, 29.0, 24.0, 41.0, 39.0, 46.0, 32.0, 46.0, 46.0, 39.0, 48.0, 49.0, 35.0, 32.0, 34.0, 38.0, 51.0, 30.0, 27.0, 34.0, 28.0, 18.0, 17.0, 18.0, 12.0, 11.0, 10.0, 10.0, 6.0, 5.0, 9.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-62.74290466308594, -60.74461364746094, -58.7463264465332, -56.74803924560547, -54.74974822998047, -52.75145721435547, -50.753170013427734, -48.7548828125, -46.756591796875, -44.75830078125, -42.760013580322266, -40.76172637939453, -38.76343536376953, -36.76514434814453, -34.7668571472168, -32.76856994628906, -30.770278930664062, -28.771989822387695, -26.773700714111328, -24.77541160583496, -22.777122497558594, -20.778833389282227, -18.78054428100586, -16.782255172729492, -14.783966064453125, -12.785676956176758, -10.78738784790039, -8.789098739624023, -6.790809631347656, -4.792520523071289, -2.794231414794922, -0.7959423065185547, 1.2023468017578125, 3.2006359100341797, 5.198925018310547, 7.197214126586914, 9.195503234863281, 11.193792343139648, 13.192081451416016, 15.190370559692383, 17.18865966796875, 19.186948776245117, 21.185237884521484, 23.18352699279785, 25.18181610107422, 27.180105209350586, 29.178394317626953, 31.17668342590332, 33.17497253417969, 35.17326354980469, 37.17155075073242, 39.169837951660156, 41.168128967285156, 43.166419982910156, 45.16470718383789, 47.162994384765625, 49.161285400390625, 51.159576416015625, 53.15786361694336, 55.156150817871094, 57.154441833496094, 59.152732849121094, 61.15102005004883, 63.14930725097656, 65.14759826660156]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 5.0, 8.0, 6.0, 17.0, 7.0, 16.0, 17.0, 21.0, 22.0, 25.0, 27.0, 29.0, 36.0, 37.0, 28.0, 39.0, 43.0, 45.0, 40.0, 38.0, 48.0, 42.0, 45.0, 46.0, 30.0, 23.0, 39.0, 26.0, 24.0, 20.0, 23.0, 19.0, 12.0, 19.0, 14.0, 10.0, 14.0, 14.0, 6.0, 2.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-6.7109375, -6.5264892578125, -6.342041015625, -6.1575927734375, -5.97314453125, -5.7886962890625, -5.604248046875, -5.4197998046875, -5.2353515625, -5.0509033203125, -4.866455078125, -4.6820068359375, -4.49755859375, -4.3131103515625, -4.128662109375, -3.9442138671875, -3.759765625, -3.5753173828125, -3.390869140625, -3.2064208984375, -3.02197265625, -2.8375244140625, -2.653076171875, -2.4686279296875, -2.2841796875, -2.0997314453125, -1.915283203125, -1.7308349609375, -1.54638671875, -1.3619384765625, -1.177490234375, -0.9930419921875, -0.80859375, -0.6241455078125, -0.439697265625, -0.2552490234375, -0.07080078125, 0.1136474609375, 0.298095703125, 0.4825439453125, 0.6669921875, 0.8514404296875, 1.035888671875, 1.2203369140625, 1.40478515625, 1.5892333984375, 1.773681640625, 1.9581298828125, 2.142578125, 2.3270263671875, 2.511474609375, 2.6959228515625, 2.88037109375, 3.0648193359375, 3.249267578125, 3.4337158203125, 3.6181640625, 3.8026123046875, 3.987060546875, 4.1715087890625, 4.35595703125, 4.5404052734375, 4.724853515625, 4.9093017578125, 5.09375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 8.0, 6.0, 6.0, 13.0, 16.0, 33.0, 55.0, 57.0, 95.0, 177.0, 291.0, 567.0, 1191.0, 2727.0, 7197.0, 21600.0, 83273.0, 382966.0, 1266069.0, 1595364.0, 629264.0, 148797.0, 37020.0, 10702.0, 3711.0, 1555.0, 638.0, 344.0, 177.0, 110.0, 82.0, 61.0, 33.0, 26.0, 16.0, 14.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5078125, -7.2745361328125, -7.041259765625, -6.8079833984375, -6.57470703125, -6.3414306640625, -6.108154296875, -5.8748779296875, -5.6416015625, -5.4083251953125, -5.175048828125, -4.9417724609375, -4.70849609375, -4.4752197265625, -4.241943359375, -4.0086669921875, -3.775390625, -3.5421142578125, -3.308837890625, -3.0755615234375, -2.84228515625, -2.6090087890625, -2.375732421875, -2.1424560546875, -1.9091796875, -1.6759033203125, -1.442626953125, -1.2093505859375, -0.97607421875, -0.7427978515625, -0.509521484375, -0.2762451171875, -0.04296875, 0.1903076171875, 0.423583984375, 0.6568603515625, 0.89013671875, 1.1234130859375, 1.356689453125, 1.5899658203125, 1.8232421875, 2.0565185546875, 2.289794921875, 2.5230712890625, 2.75634765625, 2.9896240234375, 3.222900390625, 3.4561767578125, 3.689453125, 3.9227294921875, 4.156005859375, 4.3892822265625, 4.62255859375, 4.8558349609375, 5.089111328125, 5.3223876953125, 5.5556640625, 5.7889404296875, 6.022216796875, 6.2554931640625, 6.48876953125, 6.7220458984375, 6.955322265625, 7.1885986328125, 7.421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 3.0, 7.0, 11.0, 17.0, 23.0, 19.0, 32.0, 39.0, 58.0, 90.0, 135.0, 149.0, 210.0, 287.0, 353.0, 449.0, 448.0, 435.0, 334.0, 254.0, 180.0, 138.0, 98.0, 86.0, 66.0, 35.0, 31.0, 20.0, 21.0, 12.0, 9.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.15625, -16.6964111328125, -16.236572265625, -15.7767333984375, -15.31689453125, -14.8570556640625, -14.397216796875, -13.9373779296875, -13.4775390625, -13.0177001953125, -12.557861328125, -12.0980224609375, -11.63818359375, -11.1783447265625, -10.718505859375, -10.2586669921875, -9.798828125, -9.3389892578125, -8.879150390625, -8.4193115234375, -7.95947265625, -7.4996337890625, -7.039794921875, -6.5799560546875, -6.1201171875, -5.6602783203125, -5.200439453125, -4.7406005859375, -4.28076171875, -3.8209228515625, -3.361083984375, -2.9012451171875, -2.44140625, -1.9815673828125, -1.521728515625, -1.0618896484375, -0.60205078125, -0.1422119140625, 0.317626953125, 0.7774658203125, 1.2373046875, 1.6971435546875, 2.156982421875, 2.6168212890625, 3.07666015625, 3.5364990234375, 3.996337890625, 4.4561767578125, 4.916015625, 5.3758544921875, 5.835693359375, 6.2955322265625, 6.75537109375, 7.2152099609375, 7.675048828125, 8.1348876953125, 8.5947265625, 9.0545654296875, 9.514404296875, 9.9742431640625, 10.43408203125, 10.8939208984375, 11.353759765625, 11.8135986328125, 12.2734375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 9.0, 11.0, 18.0, 19.0, 20.0, 35.0, 41.0, 52.0, 69.0, 104.0, 158.0, 240.0, 436.0, 2098.0, 188140.0, 3982965.0, 17979.0, 890.0, 311.0, 192.0, 131.0, 88.0, 59.0, 48.0, 32.0, 34.0, 33.0, 14.0, 15.0, 9.0, 3.0, 4.0, 2.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.46875, -60.47314453125, -58.4775390625, -56.48193359375, -54.486328125, -52.49072265625, -50.4951171875, -48.49951171875, -46.50390625, -44.50830078125, -42.5126953125, -40.51708984375, -38.521484375, -36.52587890625, -34.5302734375, -32.53466796875, -30.5390625, -28.54345703125, -26.5478515625, -24.55224609375, -22.556640625, -20.56103515625, -18.5654296875, -16.56982421875, -14.57421875, -12.57861328125, -10.5830078125, -8.58740234375, -6.591796875, -4.59619140625, -2.6005859375, -0.60498046875, 1.390625, 3.38623046875, 5.3818359375, 7.37744140625, 9.373046875, 11.36865234375, 13.3642578125, 15.35986328125, 17.35546875, 19.35107421875, 21.3466796875, 23.34228515625, 25.337890625, 27.33349609375, 29.3291015625, 31.32470703125, 33.3203125, 35.31591796875, 37.3115234375, 39.30712890625, 41.302734375, 43.29833984375, 45.2939453125, 47.28955078125, 49.28515625, 51.28076171875, 53.2763671875, 55.27197265625, 57.267578125, 59.26318359375, 61.2587890625, 63.25439453125, 65.25]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 16.0, 35.0, 53.0, 89.0, 120.0, 135.0, 148.0, 147.0, 99.0, 83.0, 38.0, 21.0, 15.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.97037506103516, -99.62586975097656, -97.28136444091797, -94.93685913085938, -92.59235382080078, -90.24784851074219, -87.9033432006836, -85.558837890625, -83.2143325805664, -80.86982727050781, -78.52532196044922, -76.18081665039062, -73.83631134033203, -71.49180603027344, -69.14730072021484, -66.80279541015625, -64.45828247070312, -62.11377716064453, -59.76927185058594, -57.424766540527344, -55.08026123046875, -52.735755920410156, -50.39125061035156, -48.04674530029297, -45.702239990234375, -43.35773468017578, -41.01322937011719, -38.668724060058594, -36.32421875, -33.979713439941406, -31.63520622253418, -29.290700912475586, -26.94620132446289, -24.601696014404297, -22.257190704345703, -19.91268539428711, -17.568180084228516, -15.223673820495605, -12.879167556762695, -10.534662246704102, -8.190156936645508, -5.845651626586914, -3.501145839691162, -1.1566400527954102, 1.1878652572631836, 3.5323705673217773, 5.8768768310546875, 8.221382141113281, 10.565887451171875, 12.910392761230469, 15.254898071289062, 17.599403381347656, 19.94390869140625, 22.288414001464844, 24.63292121887207, 26.977426528930664, 29.321931838989258, 31.66643714904785, 34.01094436645508, 36.35544967651367, 38.699954986572266, 41.04446029663086, 43.38896560668945, 45.73347091674805, 48.07797622680664]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 4.0, 5.0, 7.0, 6.0, 11.0, 16.0, 13.0, 19.0, 16.0, 20.0, 37.0, 21.0, 31.0, 22.0, 37.0, 27.0, 34.0, 36.0, 39.0, 37.0, 36.0, 41.0, 41.0, 39.0, 33.0, 41.0, 35.0, 45.0, 34.0, 34.0, 21.0, 23.0, 15.0, 20.0, 13.0, 9.0, 12.0, 11.0, 16.0, 7.0, 9.0, 2.0, 6.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-42.62672424316406, -41.16558837890625, -39.70445251464844, -38.243316650390625, -36.78218078613281, -35.321048736572266, -33.85991287231445, -32.39877700805664, -30.937641143798828, -29.476505279541016, -28.015369415283203, -26.554235458374023, -25.09309959411621, -23.6319637298584, -22.17082977294922, -20.709693908691406, -19.248558044433594, -17.78742218017578, -16.32628631591797, -14.865152359008789, -13.404016494750977, -11.942880630493164, -10.481745719909668, -9.020610809326172, -7.559474945068359, -6.098339557647705, -4.637204170227051, -3.1760687828063965, -1.7149333953857422, -0.2537980079650879, 1.2073373794555664, 2.6684722900390625, 4.129608154296875, 5.590743541717529, 7.051878929138184, 8.51301383972168, 9.974149703979492, 11.435285568237305, 12.8964204788208, 14.357555389404297, 15.81869125366211, 17.279827117919922, 18.740962982177734, 20.202096939086914, 21.663232803344727, 23.12436866760254, 24.58550262451172, 26.04663848876953, 27.507774353027344, 28.968910217285156, 30.43004608154297, 31.89118003845215, 33.352317810058594, 34.81344985961914, 36.27458572387695, 37.735721588134766, 39.19685745239258, 40.65799331665039, 42.1191291809082, 43.580265045166016, 45.04139709472656, 46.502532958984375, 47.96366882324219, 49.4248046875, 50.88594055175781]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 1.0, 6.0, 4.0, 10.0, 6.0, 10.0, 8.0, 14.0, 18.0, 19.0, 18.0, 22.0, 23.0, 24.0, 38.0, 37.0, 46.0, 36.0, 37.0, 29.0, 40.0, 41.0, 59.0, 41.0, 36.0, 40.0, 33.0, 38.0, 33.0, 29.0, 20.0, 24.0, 27.0, 28.0, 18.0, 14.0, 11.0, 10.0, 15.0, 12.0, 7.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.17950439453125, -5.9918212890625, -5.80413818359375, -5.616455078125, -5.42877197265625, -5.2410888671875, -5.05340576171875, -4.86572265625, -4.67803955078125, -4.4903564453125, -4.30267333984375, -4.114990234375, -3.92730712890625, -3.7396240234375, -3.55194091796875, -3.3642578125, -3.17657470703125, -2.9888916015625, -2.80120849609375, -2.613525390625, -2.42584228515625, -2.2381591796875, -2.05047607421875, -1.86279296875, -1.67510986328125, -1.4874267578125, -1.29974365234375, -1.112060546875, -0.92437744140625, -0.7366943359375, -0.54901123046875, -0.361328125, -0.17364501953125, 0.0140380859375, 0.20172119140625, 0.389404296875, 0.57708740234375, 0.7647705078125, 0.95245361328125, 1.14013671875, 1.32781982421875, 1.5155029296875, 1.70318603515625, 1.890869140625, 2.07855224609375, 2.2662353515625, 2.45391845703125, 2.6416015625, 2.82928466796875, 3.0169677734375, 3.20465087890625, 3.392333984375, 3.58001708984375, 3.7677001953125, 3.95538330078125, 4.14306640625, 4.33074951171875, 4.5184326171875, 4.70611572265625, 4.893798828125, 5.08148193359375, 5.2691650390625, 5.45684814453125, 5.64453125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 11.0, 17.0, 22.0, 26.0, 33.0, 56.0, 61.0, 122.0, 162.0, 231.0, 322.0, 489.0, 694.0, 1049.0, 1542.0, 2332.0, 3518.0, 5183.0, 7958.0, 12422.0, 19026.0, 30295.0, 48461.0, 81845.0, 153246.0, 329392.0, 143627.0, 77607.0, 46441.0, 28955.0, 18363.0, 11890.0, 7763.0, 5136.0, 3358.0, 2223.0, 1542.0, 1016.0, 677.0, 447.0, 306.0, 214.0, 161.0, 95.0, 73.0, 44.0, 35.0, 25.0, 11.0, 13.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0], "bins": [-1.369140625, -1.328216552734375, -1.28729248046875, -1.246368408203125, -1.2054443359375, -1.164520263671875, -1.12359619140625, -1.082672119140625, -1.041748046875, -1.000823974609375, -0.95989990234375, -0.918975830078125, -0.8780517578125, -0.837127685546875, -0.79620361328125, -0.755279541015625, -0.71435546875, -0.673431396484375, -0.63250732421875, -0.591583251953125, -0.5506591796875, -0.509735107421875, -0.46881103515625, -0.427886962890625, -0.386962890625, -0.346038818359375, -0.30511474609375, -0.264190673828125, -0.2232666015625, -0.182342529296875, -0.14141845703125, -0.100494384765625, -0.0595703125, -0.018646240234375, 0.02227783203125, 0.063201904296875, 0.1041259765625, 0.145050048828125, 0.18597412109375, 0.226898193359375, 0.267822265625, 0.308746337890625, 0.34967041015625, 0.390594482421875, 0.4315185546875, 0.472442626953125, 0.51336669921875, 0.554290771484375, 0.59521484375, 0.636138916015625, 0.67706298828125, 0.717987060546875, 0.7589111328125, 0.799835205078125, 0.84075927734375, 0.881683349609375, 0.922607421875, 0.963531494140625, 1.00445556640625, 1.045379638671875, 1.0863037109375, 1.127227783203125, 1.16815185546875, 1.209075927734375, 1.25]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 7.0, 5.0, 5.0, 18.0, 13.0, 13.0, 19.0, 26.0, 23.0, 27.0, 26.0, 38.0, 43.0, 59.0, 38.0, 37.0, 48.0, 48.0, 1069.0, 33.0, 51.0, 36.0, 39.0, 31.0, 34.0, 36.0, 32.0, 27.0, 25.0, 25.0, 22.0, 7.0, 14.0, 11.0, 4.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.28436279296875, -4.1507568359375, -4.01715087890625, -3.883544921875, -3.74993896484375, -3.6163330078125, -3.48272705078125, -3.34912109375, -3.21551513671875, -3.0819091796875, -2.94830322265625, -2.814697265625, -2.68109130859375, -2.5474853515625, -2.41387939453125, -2.2802734375, -2.14666748046875, -2.0130615234375, -1.87945556640625, -1.745849609375, -1.61224365234375, -1.4786376953125, -1.34503173828125, -1.21142578125, -1.07781982421875, -0.9442138671875, -0.81060791015625, -0.677001953125, -0.54339599609375, -0.4097900390625, -0.27618408203125, -0.142578125, -0.00897216796875, 0.1246337890625, 0.25823974609375, 0.391845703125, 0.52545166015625, 0.6590576171875, 0.79266357421875, 0.92626953125, 1.05987548828125, 1.1934814453125, 1.32708740234375, 1.460693359375, 1.59429931640625, 1.7279052734375, 1.86151123046875, 1.9951171875, 2.12872314453125, 2.2623291015625, 2.39593505859375, 2.529541015625, 2.66314697265625, 2.7967529296875, 2.93035888671875, 3.06396484375, 3.19757080078125, 3.3311767578125, 3.46478271484375, 3.598388671875, 3.73199462890625, 3.8656005859375, 3.99920654296875, 4.1328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 8.0, 14.0, 23.0, 27.0, 49.0, 73.0, 103.0, 155.0, 207.0, 313.0, 485.0, 733.0, 1109.0, 1610.0, 2486.0, 3806.0, 5792.0, 9189.0, 14349.0, 22979.0, 36404.0, 61243.0, 107719.0, 239734.0, 1308554.0, 112941.0, 63518.0, 38281.0, 23534.0, 14630.0, 9439.0, 5935.0, 3921.0, 2553.0, 1722.0, 1086.0, 773.0, 492.0, 344.0, 254.0, 177.0, 110.0, 77.0, 54.0, 45.0, 23.0, 20.0, 10.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3212890625, -1.2800445556640625, -1.238800048828125, -1.1975555419921875, -1.15631103515625, -1.1150665283203125, -1.073822021484375, -1.0325775146484375, -0.9913330078125, -0.9500885009765625, -0.908843994140625, -0.8675994873046875, -0.82635498046875, -0.7851104736328125, -0.743865966796875, -0.7026214599609375, -0.661376953125, -0.6201324462890625, -0.578887939453125, -0.5376434326171875, -0.49639892578125, -0.4551544189453125, -0.413909912109375, -0.3726654052734375, -0.3314208984375, -0.2901763916015625, -0.248931884765625, -0.2076873779296875, -0.16644287109375, -0.1251983642578125, -0.083953857421875, -0.0427093505859375, -0.00146484375, 0.0397796630859375, 0.081024169921875, 0.1222686767578125, 0.16351318359375, 0.2047576904296875, 0.246002197265625, 0.2872467041015625, 0.3284912109375, 0.3697357177734375, 0.410980224609375, 0.4522247314453125, 0.49346923828125, 0.5347137451171875, 0.575958251953125, 0.6172027587890625, 0.658447265625, 0.6996917724609375, 0.740936279296875, 0.7821807861328125, 0.82342529296875, 0.8646697998046875, 0.905914306640625, 0.9471588134765625, 0.9884033203125, 1.0296478271484375, 1.070892333984375, 1.1121368408203125, 1.15338134765625, 1.1946258544921875, 1.235870361328125, 1.2771148681640625, 1.318359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 7.0, 14.0, 17.0, 19.0, 21.0, 34.0, 45.0, 70.0, 110.0, 146.0, 144.0, 115.0, 72.0, 64.0, 37.0, 25.0, 18.0, 11.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012788772583007812, -0.0012376904487609863, -0.0011965036392211914, -0.0011553168296813965, -0.0011141300201416016, -0.0010729432106018066, -0.0010317564010620117, -0.0009905695915222168, -0.0009493827819824219, -0.000908195972442627, -0.000867009162902832, -0.0008258223533630371, -0.0007846355438232422, -0.0007434487342834473, -0.0007022619247436523, -0.0006610751152038574, -0.0006198883056640625, -0.0005787014961242676, -0.0005375146865844727, -0.0004963278770446777, -0.0004551410675048828, -0.0004139542579650879, -0.00037276744842529297, -0.00033158063888549805, -0.0002903938293457031, -0.0002492070198059082, -0.00020802021026611328, -0.00016683340072631836, -0.00012564659118652344, -8.445978164672852e-05, -4.3272972106933594e-05, -2.086162567138672e-06, 3.910064697265625e-05, 8.028745651245117e-05, 0.0001214742660522461, 0.00016266107559204102, 0.00020384788513183594, 0.00024503469467163086, 0.0002862215042114258, 0.0003274083137512207, 0.0003685951232910156, 0.00040978193283081055, 0.00045096874237060547, 0.0004921555519104004, 0.0005333423614501953, 0.0005745291709899902, 0.0006157159805297852, 0.0006569027900695801, 0.000698089599609375, 0.0007392764091491699, 0.0007804632186889648, 0.0008216500282287598, 0.0008628368377685547, 0.0009040236473083496, 0.0009452104568481445, 0.0009863972663879395, 0.0010275840759277344, 0.0010687708854675293, 0.0011099576950073242, 0.0011511445045471191, 0.001192331314086914, 0.001233518123626709, 0.001274704933166504, 0.0013158917427062988, 0.0013570785522460938]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 8.0, 8.0, 11.0, 22.0, 26.0, 47.0, 93.0, 200.0, 545.0, 224804.0, 821733.0, 613.0, 180.0, 92.0, 40.0, 35.0, 21.0, 9.0, 12.0, 16.0, 10.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03106689453125, -0.030126571655273438, -0.029186248779296875, -0.028245925903320312, -0.02730560302734375, -0.026365280151367188, -0.025424957275390625, -0.024484634399414062, -0.0235443115234375, -0.022603988647460938, -0.021663665771484375, -0.020723342895507812, -0.01978302001953125, -0.018842697143554688, -0.017902374267578125, -0.016962051391601562, -0.016021728515625, -0.015081405639648438, -0.014141082763671875, -0.013200759887695312, -0.01226043701171875, -0.011320114135742188, -0.010379791259765625, -0.009439468383789062, -0.0084991455078125, -0.0075588226318359375, -0.006618499755859375, -0.0056781768798828125, -0.00473785400390625, -0.0037975311279296875, -0.002857208251953125, -0.0019168853759765625, -0.0009765625, -3.62396240234375e-05, 0.000904083251953125, 0.0018444061279296875, 0.00278472900390625, 0.0037250518798828125, 0.004665374755859375, 0.0056056976318359375, 0.0065460205078125, 0.0074863433837890625, 0.008426666259765625, 0.009366989135742188, 0.01030731201171875, 0.011247634887695312, 0.012187957763671875, 0.013128280639648438, 0.014068603515625, 0.015008926391601562, 0.015949249267578125, 0.016889572143554688, 0.01782989501953125, 0.018770217895507812, 0.019710540771484375, 0.020650863647460938, 0.0215911865234375, 0.022531509399414062, 0.023471832275390625, 0.024412155151367188, 0.02535247802734375, 0.026292800903320312, 0.027233123779296875, 0.028173446655273438, 0.02911376953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 10.0, 67.0, 254.0, 384.0, 231.0, 53.0, 12.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00228013820014894, -0.002239047782495618, -0.0021979573648422956, -0.0021568667143583298, -0.0021157762967050076, -0.0020746858790516853, -0.002033595461398363, -0.0019925048109143972, -0.001951414393261075, -0.0019103239756077528, -0.0018692334415391088, -0.0018281430238857865, -0.0017870524898171425, -0.0017459620721638203, -0.0017048715380951762, -0.001663781120441854, -0.00162269058637321, -0.0015816001687198877, -0.0015405096346512437, -0.0014994192169979215, -0.0014583286829292774, -0.0014172382652759552, -0.0013761477312073112, -0.001335057313553989, -0.0012939668959006667, -0.0012528764782473445, -0.0012117859441787004, -0.0011706955265253782, -0.0011296049924567342, -0.001088514574803412, -0.001047424040734768, -0.0010063336230814457, -0.0009652430890128016, -0.0009241526131518185, -0.0008830621372908354, -0.0008419716614298522, -0.0008008811855688691, -0.000759790709707886, -0.0007187002338469028, -0.0006776098161935806, -0.0006365192821249366, -0.0005954288062639534, -0.0005543383304029703, -0.0005132478545419872, -0.00047215737868100405, -0.0004310669028200209, -0.00038997645606286824, -0.0003488859802018851, -0.00030779550434090197, -0.00026670502847991884, -0.0002256145526189357, -0.0001845240913098678, -0.00014343361544888467, -0.00010234313958790153, -6.125267827883363e-05, -2.0162202417850494e-05, 2.092827344313264e-05, 6.201874930411577e-05, 0.00010310921788914129, 0.0001441996864741668, 0.00018529016233514994, 0.00022638063819613308, 0.000267471099505201, 0.0003085615753661841, 0.00034965205122716725]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 8.0, 13.0, 11.0, 15.0, 20.0, 22.0, 15.0, 30.0, 37.0, 28.0, 35.0, 41.0, 42.0, 42.0, 35.0, 51.0, 42.0, 43.0, 45.0, 54.0, 45.0, 36.0, 36.0, 30.0, 24.0, 34.0, 21.0, 23.0, 21.0, 22.0, 13.0, 11.0, 6.0, 8.0, 9.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003460049629211426, -0.00033319834619760513, -0.0003203917294740677, -0.00030758511275053024, -0.0002947784960269928, -0.00028197187930345535, -0.0002691652625799179, -0.00025635864585638046, -0.00024355202913284302, -0.00023074541240930557, -0.00021793879568576813, -0.00020513217896223068, -0.00019232556223869324, -0.0001795189455151558, -0.00016671232879161835, -0.0001539057120680809, -0.00014109909534454346, -0.000128292478621006, -0.00011548586189746857, -0.00010267924517393112, -8.987262845039368e-05, -7.706601172685623e-05, -6.425939500331879e-05, -5.145277827978134e-05, -3.8646161556243896e-05, -2.583954483270645e-05, -1.3032928109169006e-05, -2.2631138563156128e-07, 1.2580305337905884e-05, 2.538692206144333e-05, 3.8193538784980774e-05, 5.100015550851822e-05, 6.380677223205566e-05, 7.661338895559311e-05, 8.942000567913055e-05, 0.000102226622402668, 0.00011503323912620544, 0.0001278398558497429, 0.00014064647257328033, 0.00015345308929681778, 0.00016625970602035522, 0.00017906632274389267, 0.00019187293946743011, 0.00020467955619096756, 0.000217486172914505, 0.00023029278963804245, 0.0002430994063615799, 0.00025590602308511734, 0.0002687126398086548, 0.00028151925653219223, 0.0002943258732557297, 0.0003071324899792671, 0.00031993910670280457, 0.000332745723426342, 0.00034555234014987946, 0.0003583589568734169, 0.00037116557359695435, 0.0003839721903204918, 0.00039677880704402924, 0.0004095854237675667, 0.0004223920404911041, 0.00043519865721464157, 0.000448005273938179, 0.00046081189066171646, 0.0004736185073852539]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 1.0, 6.0, 4.0, 10.0, 6.0, 10.0, 8.0, 14.0, 18.0, 19.0, 18.0, 22.0, 23.0, 24.0, 38.0, 37.0, 46.0, 36.0, 37.0, 29.0, 40.0, 41.0, 59.0, 41.0, 36.0, 40.0, 33.0, 38.0, 33.0, 29.0, 20.0, 24.0, 27.0, 28.0, 18.0, 14.0, 11.0, 10.0, 15.0, 12.0, 7.0, 5.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.17950439453125, -5.9918212890625, -5.80413818359375, -5.616455078125, -5.42877197265625, -5.2410888671875, -5.05340576171875, -4.86572265625, -4.67803955078125, -4.4903564453125, -4.30267333984375, -4.114990234375, -3.92730712890625, -3.7396240234375, -3.55194091796875, -3.3642578125, -3.17657470703125, -2.9888916015625, -2.80120849609375, -2.613525390625, -2.42584228515625, -2.2381591796875, -2.05047607421875, -1.86279296875, -1.67510986328125, -1.4874267578125, -1.29974365234375, -1.112060546875, -0.92437744140625, -0.7366943359375, -0.54901123046875, -0.361328125, -0.17364501953125, 0.0140380859375, 0.20172119140625, 0.389404296875, 0.57708740234375, 0.7647705078125, 0.95245361328125, 1.14013671875, 1.32781982421875, 1.5155029296875, 1.70318603515625, 1.890869140625, 2.07855224609375, 2.2662353515625, 2.45391845703125, 2.6416015625, 2.82928466796875, 3.0169677734375, 3.20465087890625, 3.392333984375, 3.58001708984375, 3.7677001953125, 3.95538330078125, 4.14306640625, 4.33074951171875, 4.5184326171875, 4.70611572265625, 4.893798828125, 5.08148193359375, 5.2691650390625, 5.45684814453125, 5.64453125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 10.0, 5.0, 11.0, 8.0, 7.0, 22.0, 32.0, 29.0, 39.0, 56.0, 115.0, 153.0, 268.0, 494.0, 898.0, 1760.0, 3608.0, 7529.0, 17327.0, 43757.0, 122889.0, 375717.0, 310842.0, 98961.0, 36209.0, 14701.0, 6551.0, 3051.0, 1532.0, 819.0, 426.0, 250.0, 145.0, 108.0, 75.0, 30.0, 28.0, 23.0, 17.0, 13.0, 16.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-4.83984375, -4.701171875, -4.5625, -4.423828125, -4.28515625, -4.146484375, -4.0078125, -3.869140625, -3.73046875, -3.591796875, -3.453125, -3.314453125, -3.17578125, -3.037109375, -2.8984375, -2.759765625, -2.62109375, -2.482421875, -2.34375, -2.205078125, -2.06640625, -1.927734375, -1.7890625, -1.650390625, -1.51171875, -1.373046875, -1.234375, -1.095703125, -0.95703125, -0.818359375, -0.6796875, -0.541015625, -0.40234375, -0.263671875, -0.125, 0.013671875, 0.15234375, 0.291015625, 0.4296875, 0.568359375, 0.70703125, 0.845703125, 0.984375, 1.123046875, 1.26171875, 1.400390625, 1.5390625, 1.677734375, 1.81640625, 1.955078125, 2.09375, 2.232421875, 2.37109375, 2.509765625, 2.6484375, 2.787109375, 2.92578125, 3.064453125, 3.203125, 3.341796875, 3.48046875, 3.619140625, 3.7578125, 3.896484375, 4.03515625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 2.0, 8.0, 10.0, 18.0, 20.0, 18.0, 26.0, 29.0, 23.0, 29.0, 40.0, 32.0, 43.0, 41.0, 60.0, 95.0, 377.0, 1607.0, 118.0, 61.0, 52.0, 59.0, 36.0, 38.0, 36.0, 40.0, 26.0, 13.0, 15.0, 18.0, 10.0, 15.0, 9.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-26.4375, -25.662353515625, -24.88720703125, -24.112060546875, -23.3369140625, -22.561767578125, -21.78662109375, -21.011474609375, -20.236328125, -19.461181640625, -18.68603515625, -17.910888671875, -17.1357421875, -16.360595703125, -15.58544921875, -14.810302734375, -14.03515625, -13.260009765625, -12.48486328125, -11.709716796875, -10.9345703125, -10.159423828125, -9.38427734375, -8.609130859375, -7.833984375, -7.058837890625, -6.28369140625, -5.508544921875, -4.7333984375, -3.958251953125, -3.18310546875, -2.407958984375, -1.6328125, -0.857666015625, -0.08251953125, 0.692626953125, 1.4677734375, 2.242919921875, 3.01806640625, 3.793212890625, 4.568359375, 5.343505859375, 6.11865234375, 6.893798828125, 7.6689453125, 8.444091796875, 9.21923828125, 9.994384765625, 10.76953125, 11.544677734375, 12.31982421875, 13.094970703125, 13.8701171875, 14.645263671875, 15.42041015625, 16.195556640625, 16.970703125, 17.745849609375, 18.52099609375, 19.296142578125, 20.0712890625, 20.846435546875, 21.62158203125, 22.396728515625, 23.171875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 18.0, 12.0, 23.0, 22.0, 29.0, 33.0, 60.0, 85.0, 126.0, 155.0, 268.0, 375.0, 1126.0, 19583.0, 3113553.0, 8255.0, 832.0, 348.0, 230.0, 156.0, 99.0, 68.0, 49.0, 36.0, 44.0, 19.0, 27.0, 14.0, 11.0, 11.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.9375, -50.2841796875, -48.630859375, -46.9775390625, -45.32421875, -43.6708984375, -42.017578125, -40.3642578125, -38.7109375, -37.0576171875, -35.404296875, -33.7509765625, -32.09765625, -30.4443359375, -28.791015625, -27.1376953125, -25.484375, -23.8310546875, -22.177734375, -20.5244140625, -18.87109375, -17.2177734375, -15.564453125, -13.9111328125, -12.2578125, -10.6044921875, -8.951171875, -7.2978515625, -5.64453125, -3.9912109375, -2.337890625, -0.6845703125, 0.96875, 2.6220703125, 4.275390625, 5.9287109375, 7.58203125, 9.2353515625, 10.888671875, 12.5419921875, 14.1953125, 15.8486328125, 17.501953125, 19.1552734375, 20.80859375, 22.4619140625, 24.115234375, 25.7685546875, 27.421875, 29.0751953125, 30.728515625, 32.3818359375, 34.03515625, 35.6884765625, 37.341796875, 38.9951171875, 40.6484375, 42.3017578125, 43.955078125, 45.6083984375, 47.26171875, 48.9150390625, 50.568359375, 52.2216796875, 53.875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 30.0, 315.0, 576.0, 90.0, 7.0], "bins": [-203.14938354492188, -199.82945251464844, -196.50950622558594, -193.1895751953125, -189.86964416503906, -186.54971313476562, -183.22976684570312, -179.9098358154297, -176.58990478515625, -173.2699737548828, -169.9500274658203, -166.63009643554688, -163.31016540527344, -159.990234375, -156.6702880859375, -153.35035705566406, -150.03041076660156, -146.71047973632812, -143.39053344726562, -140.0706024169922, -136.75067138671875, -133.43072509765625, -130.1107940673828, -126.79086303710938, -123.4709243774414, -120.15098571777344, -116.8310546875, -113.51111602783203, -110.19117736816406, -106.87124633789062, -103.55130767822266, -100.23136901855469, -96.91143798828125, -93.59149932861328, -90.27156829833984, -86.95162963867188, -83.63169860839844, -80.31175994873047, -76.9918212890625, -73.67189025878906, -70.35194396972656, -67.0320053100586, -63.712074279785156, -60.39213562011719, -57.072200775146484, -53.75226593017578, -50.43232727050781, -47.11239242553711, -43.79246139526367, -40.47252655029297, -37.152587890625, -33.8326530456543, -30.512718200683594, -27.19278335571289, -23.872846603393555, -20.55290985107422, -17.232975006103516, -13.913039207458496, -10.593103408813477, -7.273167610168457, -3.9532318115234375, -0.6332969665527344, 2.6866397857666016, 6.0065765380859375, 9.32651138305664]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 12.0, 6.0, 9.0, 13.0, 15.0, 12.0, 12.0, 17.0, 29.0, 20.0, 38.0, 31.0, 33.0, 38.0, 32.0, 36.0, 43.0, 43.0, 44.0, 49.0, 38.0, 34.0, 31.0, 41.0, 38.0, 36.0, 28.0, 40.0, 27.0, 25.0, 20.0, 22.0, 18.0, 23.0, 13.0, 3.0, 7.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.76433181762695, -56.03938674926758, -54.31444549560547, -52.589500427246094, -50.86455535888672, -49.13961410522461, -47.414669036865234, -45.689727783203125, -43.96478271484375, -42.239837646484375, -40.514896392822266, -38.78995132446289, -37.06501007080078, -35.340065002441406, -33.61511993408203, -31.89017677307129, -30.165233612060547, -28.440290451049805, -26.715347290039062, -24.990402221679688, -23.265459060668945, -21.540515899658203, -19.815570831298828, -18.090627670288086, -16.365684509277344, -14.640741348266602, -12.915797233581543, -11.190853118896484, -9.465909957885742, -7.740966796875, -6.016022682189941, -4.291078567504883, -2.5661354064941406, -0.8411917686462402, 0.8837518692016602, 2.6086955070495605, 4.333639144897461, 6.058582305908203, 7.783526420593262, 9.50847053527832, 11.233413696289062, 12.958356857299805, 14.683300971984863, 16.408245086669922, 18.133188247680664, 19.858131408691406, 21.58307647705078, 23.308019638061523, 25.032962799072266, 26.757905960083008, 28.48284912109375, 30.207794189453125, 31.932737350463867, 33.65768051147461, 35.382625579833984, 37.107566833496094, 38.83251190185547, 40.557456970214844, 42.28239822387695, 44.00734329223633, 45.73228454589844, 47.45722961425781, 49.18217468261719, 50.90711975097656, 52.63206100463867]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 7.0, 8.0, 14.0, 11.0, 11.0, 18.0, 18.0, 13.0, 22.0, 28.0, 23.0, 46.0, 25.0, 47.0, 34.0, 39.0, 34.0, 41.0, 45.0, 50.0, 44.0, 43.0, 30.0, 42.0, 26.0, 30.0, 26.0, 36.0, 21.0, 26.0, 19.0, 23.0, 18.0, 13.0, 9.0, 16.0, 9.0, 5.0, 6.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.135986328125, -5.94384765625, -5.751708984375, -5.5595703125, -5.367431640625, -5.17529296875, -4.983154296875, -4.791015625, -4.598876953125, -4.40673828125, -4.214599609375, -4.0224609375, -3.830322265625, -3.63818359375, -3.446044921875, -3.25390625, -3.061767578125, -2.86962890625, -2.677490234375, -2.4853515625, -2.293212890625, -2.10107421875, -1.908935546875, -1.716796875, -1.524658203125, -1.33251953125, -1.140380859375, -0.9482421875, -0.756103515625, -0.56396484375, -0.371826171875, -0.1796875, 0.012451171875, 0.20458984375, 0.396728515625, 0.5888671875, 0.781005859375, 0.97314453125, 1.165283203125, 1.357421875, 1.549560546875, 1.74169921875, 1.933837890625, 2.1259765625, 2.318115234375, 2.51025390625, 2.702392578125, 2.89453125, 3.086669921875, 3.27880859375, 3.470947265625, 3.6630859375, 3.855224609375, 4.04736328125, 4.239501953125, 4.431640625, 4.623779296875, 4.81591796875, 5.008056640625, 5.2001953125, 5.392333984375, 5.58447265625, 5.776611328125, 5.96875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 4.0, 5.0, 10.0, 19.0, 8.0, 19.0, 9.0, 22.0, 16.0, 27.0, 27.0, 38.0, 44.0, 75.0, 109.0, 137.0, 252.0, 877.0, 17938.0, 3152450.0, 1015449.0, 5434.0, 572.0, 214.0, 118.0, 77.0, 66.0, 32.0, 41.0, 34.0, 20.0, 28.0, 8.0, 22.0, 15.0, 9.0, 13.0, 10.0, 9.0, 6.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.09375, -34.056884765625, -33.02001953125, -31.983154296875, -30.9462890625, -29.909423828125, -28.87255859375, -27.835693359375, -26.798828125, -25.761962890625, -24.72509765625, -23.688232421875, -22.6513671875, -21.614501953125, -20.57763671875, -19.540771484375, -18.50390625, -17.467041015625, -16.43017578125, -15.393310546875, -14.3564453125, -13.319580078125, -12.28271484375, -11.245849609375, -10.208984375, -9.172119140625, -8.13525390625, -7.098388671875, -6.0615234375, -5.024658203125, -3.98779296875, -2.950927734375, -1.9140625, -0.877197265625, 0.15966796875, 1.196533203125, 2.2333984375, 3.270263671875, 4.30712890625, 5.343994140625, 6.380859375, 7.417724609375, 8.45458984375, 9.491455078125, 10.5283203125, 11.565185546875, 12.60205078125, 13.638916015625, 14.67578125, 15.712646484375, 16.74951171875, 17.786376953125, 18.8232421875, 19.860107421875, 20.89697265625, 21.933837890625, 22.970703125, 24.007568359375, 25.04443359375, 26.081298828125, 27.1181640625, 28.155029296875, 29.19189453125, 30.228759765625, 31.265625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 5.0, 13.0, 7.0, 14.0, 13.0, 15.0, 25.0, 36.0, 66.0, 66.0, 84.0, 139.0, 165.0, 215.0, 249.0, 316.0, 418.0, 433.0, 391.0, 317.0, 259.0, 203.0, 136.0, 119.0, 100.0, 69.0, 45.0, 41.0, 37.0, 23.0, 18.0, 8.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.7265625, -12.3348388671875, -11.943115234375, -11.5513916015625, -11.15966796875, -10.7679443359375, -10.376220703125, -9.9844970703125, -9.5927734375, -9.2010498046875, -8.809326171875, -8.4176025390625, -8.02587890625, -7.6341552734375, -7.242431640625, -6.8507080078125, -6.458984375, -6.0672607421875, -5.675537109375, -5.2838134765625, -4.89208984375, -4.5003662109375, -4.108642578125, -3.7169189453125, -3.3251953125, -2.9334716796875, -2.541748046875, -2.1500244140625, -1.75830078125, -1.3665771484375, -0.974853515625, -0.5831298828125, -0.19140625, 0.2003173828125, 0.592041015625, 0.9837646484375, 1.37548828125, 1.7672119140625, 2.158935546875, 2.5506591796875, 2.9423828125, 3.3341064453125, 3.725830078125, 4.1175537109375, 4.50927734375, 4.9010009765625, 5.292724609375, 5.6844482421875, 6.076171875, 6.4678955078125, 6.859619140625, 7.2513427734375, 7.64306640625, 8.0347900390625, 8.426513671875, 8.8182373046875, 9.2099609375, 9.6016845703125, 9.993408203125, 10.3851318359375, 10.77685546875, 11.1685791015625, 11.560302734375, 11.9520263671875, 12.34375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 10.0, 14.0, 12.0, 23.0, 36.0, 46.0, 58.0, 74.0, 112.0, 136.0, 235.0, 340.0, 596.0, 2848.0, 677374.0, 3503479.0, 6888.0, 787.0, 398.0, 224.0, 161.0, 118.0, 79.0, 55.0, 47.0, 35.0, 23.0, 21.0, 20.0, 10.0, 1.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-77.75, -75.7109375, -73.671875, -71.6328125, -69.59375, -67.5546875, -65.515625, -63.4765625, -61.4375, -59.3984375, -57.359375, -55.3203125, -53.28125, -51.2421875, -49.203125, -47.1640625, -45.125, -43.0859375, -41.046875, -39.0078125, -36.96875, -34.9296875, -32.890625, -30.8515625, -28.8125, -26.7734375, -24.734375, -22.6953125, -20.65625, -18.6171875, -16.578125, -14.5390625, -12.5, -10.4609375, -8.421875, -6.3828125, -4.34375, -2.3046875, -0.265625, 1.7734375, 3.8125, 5.8515625, 7.890625, 9.9296875, 11.96875, 14.0078125, 16.046875, 18.0859375, 20.125, 22.1640625, 24.203125, 26.2421875, 28.28125, 30.3203125, 32.359375, 34.3984375, 36.4375, 38.4765625, 40.515625, 42.5546875, 44.59375, 46.6328125, 48.671875, 50.7109375, 52.75]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 20.0, 34.0, 54.0, 75.0, 153.0, 126.0, 140.0, 155.0, 100.0, 68.0, 38.0, 27.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-91.42068481445312, -89.20539855957031, -86.99010467529297, -84.77481842041016, -82.55953216552734, -80.34423828125, -78.12895202636719, -75.91366577148438, -73.69837951660156, -71.48309326171875, -69.2677993774414, -67.0525131225586, -64.83722686767578, -62.6219367980957, -60.406646728515625, -58.19136047363281, -55.97606658935547, -53.76077651977539, -51.54549026489258, -49.3302001953125, -47.11491394042969, -44.89962387084961, -42.68433380126953, -40.46904754638672, -38.25375747680664, -36.03846740722656, -33.82318115234375, -31.607891082763672, -29.392602920532227, -27.17731475830078, -24.962024688720703, -22.746736526489258, -20.531448364257812, -18.316160202026367, -16.100872039794922, -13.885581970214844, -11.670293807983398, -9.455005645751953, -7.239716529846191, -5.02442741394043, -2.8091392517089844, -0.5938506126403809, 1.6214380264282227, 3.836726665496826, 6.05201530456543, 8.267303466796875, 10.482592582702637, 12.697881698608398, 14.913169860839844, 17.12845802307129, 19.343746185302734, 21.559036254882812, 23.774324417114258, 25.989612579345703, 28.20490264892578, 30.420190811157227, 32.63547897338867, 34.85076904296875, 37.06605529785156, 39.28134536743164, 41.49663543701172, 43.71192169189453, 45.92721176147461, 48.14250183105469, 50.3577880859375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 5.0, 4.0, 4.0, 9.0, 4.0, 3.0, 15.0, 17.0, 12.0, 18.0, 16.0, 14.0, 41.0, 37.0, 38.0, 52.0, 43.0, 62.0, 45.0, 41.0, 55.0, 48.0, 42.0, 50.0, 33.0, 58.0, 32.0, 25.0, 36.0, 23.0, 29.0, 15.0, 17.0, 14.0, 15.0, 8.0, 12.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.319488525390625, -47.75261306762695, -46.18573760986328, -44.618858337402344, -43.05198287963867, -41.485107421875, -39.91823196411133, -38.351356506347656, -36.78447723388672, -35.21760177612305, -33.650726318359375, -32.08384704589844, -30.516971588134766, -28.950096130371094, -27.383220672607422, -25.81634521484375, -24.249469757080078, -22.682594299316406, -21.1157169342041, -19.54884147644043, -17.981964111328125, -16.415088653564453, -14.848213195800781, -13.281336784362793, -11.714460372924805, -10.147583961486816, -8.580707550048828, -7.013832092285156, -5.446955680847168, -3.8800792694091797, -2.313203811645508, -0.7463274002075195, 0.8205490112304688, 2.387425184249878, 3.954301357269287, 5.521177291870117, 7.0880537033081055, 8.654930114746094, 10.221805572509766, 11.788681983947754, 13.355558395385742, 14.92243480682373, 16.48931121826172, 18.05618667602539, 19.623062133789062, 21.189939498901367, 22.75681495666504, 24.323692321777344, 25.890567779541016, 27.457443237304688, 29.024320602416992, 30.591196060180664, 32.15807342529297, 33.72494888305664, 35.29182434082031, 36.858699798583984, 38.425575256347656, 39.99245071411133, 41.559326171875, 43.12620544433594, 44.69308090209961, 46.25995635986328, 47.82683181762695, 49.393707275390625, 50.96058654785156]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 14.0, 10.0, 13.0, 19.0, 17.0, 17.0, 22.0, 22.0, 31.0, 31.0, 40.0, 38.0, 38.0, 43.0, 38.0, 36.0, 47.0, 46.0, 39.0, 47.0, 34.0, 31.0, 35.0, 36.0, 26.0, 24.0, 24.0, 25.0, 17.0, 24.0, 12.0, 13.0, 19.0, 8.0, 12.0, 12.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.14251708984375, -5.9490966796875, -5.75567626953125, -5.562255859375, -5.36883544921875, -5.1754150390625, -4.98199462890625, -4.78857421875, -4.59515380859375, -4.4017333984375, -4.20831298828125, -4.014892578125, -3.82147216796875, -3.6280517578125, -3.43463134765625, -3.2412109375, -3.04779052734375, -2.8543701171875, -2.66094970703125, -2.467529296875, -2.27410888671875, -2.0806884765625, -1.88726806640625, -1.69384765625, -1.50042724609375, -1.3070068359375, -1.11358642578125, -0.920166015625, -0.72674560546875, -0.5333251953125, -0.33990478515625, -0.146484375, 0.04693603515625, 0.2403564453125, 0.43377685546875, 0.627197265625, 0.82061767578125, 1.0140380859375, 1.20745849609375, 1.40087890625, 1.59429931640625, 1.7877197265625, 1.98114013671875, 2.174560546875, 2.36798095703125, 2.5614013671875, 2.75482177734375, 2.9482421875, 3.14166259765625, 3.3350830078125, 3.52850341796875, 3.721923828125, 3.91534423828125, 4.1087646484375, 4.30218505859375, 4.49560546875, 4.68902587890625, 4.8824462890625, 5.07586669921875, 5.269287109375, 5.46270751953125, 5.6561279296875, 5.84954833984375, 6.04296875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 10.0, 8.0, 6.0, 18.0, 25.0, 23.0, 64.0, 68.0, 108.0, 155.0, 225.0, 323.0, 439.0, 629.0, 917.0, 1337.0, 1981.0, 2783.0, 4027.0, 5571.0, 7824.0, 11110.0, 16119.0, 23482.0, 35693.0, 55704.0, 92441.0, 188056.0, 280318.0, 118775.0, 67711.0, 42644.0, 27808.0, 18722.0, 12749.0, 9154.0, 6378.0, 4539.0, 3142.0, 2324.0, 1564.0, 1122.0, 783.0, 546.0, 364.0, 219.0, 185.0, 102.0, 73.0, 64.0, 45.0, 35.0, 13.0, 14.0, 10.0, 2.0, 3.0, 8.0, 2.0, 0.0, 4.0], "bins": [-1.16796875, -1.1305389404296875, -1.093109130859375, -1.0556793212890625, -1.01824951171875, -0.9808197021484375, -0.943389892578125, -0.9059600830078125, -0.8685302734375, -0.8311004638671875, -0.793670654296875, -0.7562408447265625, -0.71881103515625, -0.6813812255859375, -0.643951416015625, -0.6065216064453125, -0.569091796875, -0.5316619873046875, -0.494232177734375, -0.4568023681640625, -0.41937255859375, -0.3819427490234375, -0.344512939453125, -0.3070831298828125, -0.2696533203125, -0.2322235107421875, -0.194793701171875, -0.1573638916015625, -0.11993408203125, -0.0825042724609375, -0.045074462890625, -0.0076446533203125, 0.02978515625, 0.0672149658203125, 0.104644775390625, 0.1420745849609375, 0.17950439453125, 0.2169342041015625, 0.254364013671875, 0.2917938232421875, 0.3292236328125, 0.3666534423828125, 0.404083251953125, 0.4415130615234375, 0.47894287109375, 0.5163726806640625, 0.553802490234375, 0.5912322998046875, 0.628662109375, 0.6660919189453125, 0.703521728515625, 0.7409515380859375, 0.77838134765625, 0.8158111572265625, 0.853240966796875, 0.8906707763671875, 0.9281005859375, 0.9655303955078125, 1.002960205078125, 1.0403900146484375, 1.07781982421875, 1.1152496337890625, 1.152679443359375, 1.1901092529296875, 1.2275390625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 6.0, 13.0, 18.0, 19.0, 17.0, 17.0, 27.0, 33.0, 26.0, 33.0, 27.0, 33.0, 34.0, 38.0, 44.0, 37.0, 28.0, 1073.0, 32.0, 39.0, 54.0, 28.0, 31.0, 36.0, 31.0, 33.0, 31.0, 24.0, 13.0, 32.0, 12.0, 18.0, 12.0, 13.0, 8.0, 6.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.01171875, -3.890625, -3.76953125, -3.6484375, -3.52734375, -3.40625, -3.28515625, -3.1640625, -3.04296875, -2.921875, -2.80078125, -2.6796875, -2.55859375, -2.4375, -2.31640625, -2.1953125, -2.07421875, -1.953125, -1.83203125, -1.7109375, -1.58984375, -1.46875, -1.34765625, -1.2265625, -1.10546875, -0.984375, -0.86328125, -0.7421875, -0.62109375, -0.5, -0.37890625, -0.2578125, -0.13671875, -0.015625, 0.10546875, 0.2265625, 0.34765625, 0.46875, 0.58984375, 0.7109375, 0.83203125, 0.953125, 1.07421875, 1.1953125, 1.31640625, 1.4375, 1.55859375, 1.6796875, 1.80078125, 1.921875, 2.04296875, 2.1640625, 2.28515625, 2.40625, 2.52734375, 2.6484375, 2.76953125, 2.890625, 3.01171875, 3.1328125, 3.25390625, 3.375, 3.49609375, 3.6171875, 3.73828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 18.0, 15.0, 21.0, 43.0, 54.0, 69.0, 125.0, 151.0, 223.0, 332.0, 485.0, 719.0, 1038.0, 1533.0, 2277.0, 3461.0, 5201.0, 7954.0, 11859.0, 18149.0, 27274.0, 42148.0, 65914.0, 113911.0, 1295448.0, 215153.0, 105133.0, 61879.0, 39842.0, 25940.0, 17072.0, 11319.0, 7441.0, 4885.0, 3261.0, 2182.0, 1508.0, 992.0, 666.0, 441.0, 321.0, 206.0, 147.0, 92.0, 74.0, 47.0, 32.0, 30.0, 14.0, 12.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.19140625, -1.1540985107421875, -1.116790771484375, -1.0794830322265625, -1.04217529296875, -1.0048675537109375, -0.967559814453125, -0.9302520751953125, -0.8929443359375, -0.8556365966796875, -0.818328857421875, -0.7810211181640625, -0.74371337890625, -0.7064056396484375, -0.669097900390625, -0.6317901611328125, -0.594482421875, -0.5571746826171875, -0.519866943359375, -0.4825592041015625, -0.44525146484375, -0.4079437255859375, -0.370635986328125, -0.3333282470703125, -0.2960205078125, -0.2587127685546875, -0.221405029296875, -0.1840972900390625, -0.14678955078125, -0.1094818115234375, -0.072174072265625, -0.0348663330078125, 0.00244140625, 0.0397491455078125, 0.077056884765625, 0.1143646240234375, 0.15167236328125, 0.1889801025390625, 0.226287841796875, 0.2635955810546875, 0.3009033203125, 0.3382110595703125, 0.375518798828125, 0.4128265380859375, 0.45013427734375, 0.4874420166015625, 0.524749755859375, 0.5620574951171875, 0.599365234375, 0.6366729736328125, 0.673980712890625, 0.7112884521484375, 0.74859619140625, 0.7859039306640625, 0.823211669921875, 0.8605194091796875, 0.8978271484375, 0.9351348876953125, 0.972442626953125, 1.0097503662109375, 1.04705810546875, 1.0843658447265625, 1.121673583984375, 1.1589813232421875, 1.1962890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 6.0, 5.0, 8.0, 6.0, 11.0, 10.0, 15.0, 15.0, 15.0, 28.0, 31.0, 38.0, 39.0, 70.0, 66.0, 83.0, 87.0, 86.0, 58.0, 75.0, 40.0, 40.0, 28.0, 25.0, 21.0, 10.0, 15.0, 11.0, 8.0, 8.0, 9.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0008068084716796875, -0.0007828846573829651, -0.0007589608430862427, -0.0007350370287895203, -0.0007111132144927979, -0.0006871894001960754, -0.000663265585899353, -0.0006393417716026306, -0.0006154179573059082, -0.0005914941430091858, -0.0005675703287124634, -0.000543646514415741, -0.0005197227001190186, -0.0004957988858222961, -0.00047187507152557373, -0.0004479512572288513, -0.0004240274429321289, -0.0004001036286354065, -0.0003761798143386841, -0.00035225600004196167, -0.00032833218574523926, -0.00030440837144851685, -0.00028048455715179443, -0.000256560742855072, -0.0002326369285583496, -0.0002087131142616272, -0.00018478929996490479, -0.00016086548566818237, -0.00013694167137145996, -0.00011301785707473755, -8.909404277801514e-05, -6.517022848129272e-05, -4.124641418457031e-05, -1.73225998878479e-05, 6.601214408874512e-06, 3.0525028705596924e-05, 5.4448843002319336e-05, 7.837265729904175e-05, 0.00010229647159576416, 0.00012622028589248657, 0.00015014410018920898, 0.0001740679144859314, 0.0001979917287826538, 0.00022191554307937622, 0.00024583935737609863, 0.00026976317167282104, 0.00029368698596954346, 0.00031761080026626587, 0.0003415346145629883, 0.0003654584288597107, 0.0003893822431564331, 0.0004133060574531555, 0.00043722987174987793, 0.00046115368604660034, 0.00048507750034332275, 0.0005090013146400452, 0.0005329251289367676, 0.00055684894323349, 0.0005807727575302124, 0.0006046965718269348, 0.0006286203861236572, 0.0006525442004203796, 0.000676468014717102, 0.0007003918290138245, 0.0007243156433105469]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 8.0, 5.0, 15.0, 13.0, 25.0, 22.0, 47.0, 47.0, 72.0, 105.0, 169.0, 336.0, 865.0, 237817.0, 807009.0, 1041.0, 377.0, 188.0, 119.0, 71.0, 48.0, 38.0, 29.0, 25.0, 10.0, 7.0, 12.0, 11.0, 4.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0197601318359375, -0.01912379264831543, -0.01848745346069336, -0.01785111427307129, -0.01721477508544922, -0.01657843589782715, -0.015942096710205078, -0.015305757522583008, -0.014669418334960938, -0.014033079147338867, -0.013396739959716797, -0.012760400772094727, -0.012124061584472656, -0.011487722396850586, -0.010851383209228516, -0.010215044021606445, -0.009578704833984375, -0.008942365646362305, -0.008306026458740234, -0.007669687271118164, -0.007033348083496094, -0.0063970088958740234, -0.005760669708251953, -0.005124330520629883, -0.0044879913330078125, -0.003851652145385742, -0.003215312957763672, -0.0025789737701416016, -0.0019426345825195312, -0.001306295394897461, -0.0006699562072753906, -3.361701965332031e-05, 0.00060272216796875, 0.0012390613555908203, 0.0018754005432128906, 0.002511739730834961, 0.0031480789184570312, 0.0037844181060791016, 0.004420757293701172, 0.005057096481323242, 0.0056934356689453125, 0.006329774856567383, 0.006966114044189453, 0.0076024532318115234, 0.008238792419433594, 0.008875131607055664, 0.009511470794677734, 0.010147809982299805, 0.010784149169921875, 0.011420488357543945, 0.012056827545166016, 0.012693166732788086, 0.013329505920410156, 0.013965845108032227, 0.014602184295654297, 0.015238523483276367, 0.015874862670898438, 0.016511201858520508, 0.017147541046142578, 0.01778388023376465, 0.01842021942138672, 0.01905655860900879, 0.01969289779663086, 0.02032923698425293, 0.020965576171875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 26.0, 93.0, 257.0, 352.0, 198.0, 54.0, 16.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006999492179602385, -0.0006637161131948233, -0.0006274830084294081, -0.0005912499036639929, -0.0005550168571062386, -0.0005187837523408234, -0.0004825506475754082, -0.0004463175719138235, -0.0004100844671484083, -0.0003738513623829931, -0.00033761828672140837, -0.0003013851819559932, -0.000265152077190578, -0.00022891900152899325, -0.00019268589676357806, -0.00015645282110199332, -0.00012021971633657813, -8.398662612307817e-05, -4.775352863362059e-05, -1.1520431144163013e-05, 2.471265906933695e-05, 6.0945749282836914e-05, 9.71788540482521e-05, 0.00013341192970983684, 0.00016964503447525203, 0.000205878124688752, 0.00024211121490225196, 0.00027834431966766715, 0.00031457742443308234, 0.0003508105000946671, 0.00038704360486008227, 0.000423276680521667, 0.0004595097852870822, 0.0004957428900524974, 0.0005319759948179126, 0.0005682090995833278, 0.000604442146141082, 0.0006406752509064972, 0.0006769083556719124, 0.0007131414022296667, 0.0007493745069950819, 0.0007856076117604971, 0.0008218407165259123, 0.0008580738212913275, 0.0008943068678490818, 0.000930539972614497, 0.0009667730773799121, 0.0010030061239376664, 0.0010392393451184034, 0.0010754724498838186, 0.0011117055546492338, 0.001147938659414649, 0.0011841717641800642, 0.0012204048689454794, 0.0012566379737108946, 0.001292870962060988, 0.0013291040668264031, 0.0013653371715918183, 0.0014015702763572335, 0.0014378033811226487, 0.001474036485888064, 0.0015102694742381573, 0.0015465025790035725, 0.0015827356837689877, 0.0016189687885344028]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 6.0, 9.0, 7.0, 12.0, 10.0, 12.0, 12.0, 13.0, 19.0, 17.0, 17.0, 23.0, 18.0, 21.0, 26.0, 27.0, 22.0, 26.0, 37.0, 35.0, 37.0, 36.0, 33.0, 35.0, 41.0, 42.0, 43.0, 34.0, 31.0, 37.0, 26.0, 23.0, 32.0, 22.0, 24.0, 14.0, 16.0, 14.0, 15.0, 13.0, 13.0, 17.0, 10.0, 9.0, 5.0, 7.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003209710121154785, -0.00031079910695552826, -0.000300627201795578, -0.00029045529663562775, -0.0002802833914756775, -0.00027011148631572723, -0.000259939581155777, -0.0002497676759958267, -0.00023959577083587646, -0.0002294238656759262, -0.00021925196051597595, -0.0002090800553560257, -0.00019890815019607544, -0.00018873624503612518, -0.00017856433987617493, -0.00016839243471622467, -0.00015822052955627441, -0.00014804862439632416, -0.0001378767192363739, -0.00012770481407642365, -0.00011753290891647339, -0.00010736100375652313, -9.718909859657288e-05, -8.701719343662262e-05, -7.684528827667236e-05, -6.667338311672211e-05, -5.650147795677185e-05, -4.6329572796821594e-05, -3.615766763687134e-05, -2.598576247692108e-05, -1.5813857316970825e-05, -5.641952157020569e-06, 4.5299530029296875e-06, 1.4701858162879944e-05, 2.48737633228302e-05, 3.5045668482780457e-05, 4.521757364273071e-05, 5.538947880268097e-05, 6.556138396263123e-05, 7.573328912258148e-05, 8.590519428253174e-05, 9.6077099442482e-05, 0.00010624900460243225, 0.00011642090976238251, 0.00012659281492233276, 0.00013676472008228302, 0.00014693662524223328, 0.00015710853040218353, 0.0001672804355621338, 0.00017745234072208405, 0.0001876242458820343, 0.00019779615104198456, 0.00020796805620193481, 0.00021813996136188507, 0.00022831186652183533, 0.00023848377168178558, 0.00024865567684173584, 0.0002588275820016861, 0.00026899948716163635, 0.0002791713923215866, 0.00028934329748153687, 0.0002995152026414871, 0.0003096871078014374, 0.00031985901296138763, 0.0003300309181213379]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 14.0, 10.0, 13.0, 19.0, 17.0, 17.0, 22.0, 22.0, 31.0, 31.0, 40.0, 38.0, 38.0, 43.0, 38.0, 36.0, 47.0, 46.0, 39.0, 47.0, 34.0, 31.0, 35.0, 36.0, 26.0, 24.0, 24.0, 25.0, 17.0, 24.0, 12.0, 13.0, 19.0, 8.0, 12.0, 12.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.14251708984375, -5.9490966796875, -5.75567626953125, -5.562255859375, -5.36883544921875, -5.1754150390625, -4.98199462890625, -4.78857421875, -4.59515380859375, -4.4017333984375, -4.20831298828125, -4.014892578125, -3.82147216796875, -3.6280517578125, -3.43463134765625, -3.2412109375, -3.04779052734375, -2.8543701171875, -2.66094970703125, -2.467529296875, -2.27410888671875, -2.0806884765625, -1.88726806640625, -1.69384765625, -1.50042724609375, -1.3070068359375, -1.11358642578125, -0.920166015625, -0.72674560546875, -0.5333251953125, -0.33990478515625, -0.146484375, 0.04693603515625, 0.2403564453125, 0.43377685546875, 0.627197265625, 0.82061767578125, 1.0140380859375, 1.20745849609375, 1.40087890625, 1.59429931640625, 1.7877197265625, 1.98114013671875, 2.174560546875, 2.36798095703125, 2.5614013671875, 2.75482177734375, 2.9482421875, 3.14166259765625, 3.3350830078125, 3.52850341796875, 3.721923828125, 3.91534423828125, 4.1087646484375, 4.30218505859375, 4.49560546875, 4.68902587890625, 4.8824462890625, 5.07586669921875, 5.269287109375, 5.46270751953125, 5.6561279296875, 5.84954833984375, 6.04296875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 10.0, 18.0, 34.0, 35.0, 72.0, 92.0, 144.0, 201.0, 343.0, 525.0, 879.0, 1449.0, 2531.0, 4372.0, 7800.0, 14337.0, 28021.0, 61316.0, 161511.0, 400125.0, 214655.0, 78010.0, 33604.0, 16956.0, 9058.0, 5122.0, 2892.0, 1672.0, 1051.0, 668.0, 396.0, 224.0, 144.0, 92.0, 58.0, 40.0, 28.0, 24.0, 15.0, 8.0, 6.0, 1.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8828125, -3.763824462890625, -3.64483642578125, -3.525848388671875, -3.4068603515625, -3.287872314453125, -3.16888427734375, -3.049896240234375, -2.930908203125, -2.811920166015625, -2.69293212890625, -2.573944091796875, -2.4549560546875, -2.335968017578125, -2.21697998046875, -2.097991943359375, -1.97900390625, -1.860015869140625, -1.74102783203125, -1.622039794921875, -1.5030517578125, -1.384063720703125, -1.26507568359375, -1.146087646484375, -1.027099609375, -0.908111572265625, -0.78912353515625, -0.670135498046875, -0.5511474609375, -0.432159423828125, -0.31317138671875, -0.194183349609375, -0.0751953125, 0.043792724609375, 0.16278076171875, 0.281768798828125, 0.4007568359375, 0.519744873046875, 0.63873291015625, 0.757720947265625, 0.876708984375, 0.995697021484375, 1.11468505859375, 1.233673095703125, 1.3526611328125, 1.471649169921875, 1.59063720703125, 1.709625244140625, 1.82861328125, 1.947601318359375, 2.06658935546875, 2.185577392578125, 2.3045654296875, 2.423553466796875, 2.54254150390625, 2.661529541015625, 2.780517578125, 2.899505615234375, 3.01849365234375, 3.137481689453125, 3.2564697265625, 3.375457763671875, 3.49444580078125, 3.613433837890625, 3.732421875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 10.0, 10.0, 8.0, 14.0, 16.0, 15.0, 28.0, 27.0, 31.0, 40.0, 40.0, 45.0, 45.0, 59.0, 76.0, 120.0, 1647.0, 255.0, 77.0, 57.0, 58.0, 49.0, 41.0, 33.0, 38.0, 24.0, 20.0, 30.0, 19.0, 13.0, 14.0, 17.0, 14.0, 12.0, 5.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.890625, -25.145751953125, -24.40087890625, -23.656005859375, -22.9111328125, -22.166259765625, -21.42138671875, -20.676513671875, -19.931640625, -19.186767578125, -18.44189453125, -17.697021484375, -16.9521484375, -16.207275390625, -15.46240234375, -14.717529296875, -13.97265625, -13.227783203125, -12.48291015625, -11.738037109375, -10.9931640625, -10.248291015625, -9.50341796875, -8.758544921875, -8.013671875, -7.268798828125, -6.52392578125, -5.779052734375, -5.0341796875, -4.289306640625, -3.54443359375, -2.799560546875, -2.0546875, -1.309814453125, -0.56494140625, 0.179931640625, 0.9248046875, 1.669677734375, 2.41455078125, 3.159423828125, 3.904296875, 4.649169921875, 5.39404296875, 6.138916015625, 6.8837890625, 7.628662109375, 8.37353515625, 9.118408203125, 9.86328125, 10.608154296875, 11.35302734375, 12.097900390625, 12.8427734375, 13.587646484375, 14.33251953125, 15.077392578125, 15.822265625, 16.567138671875, 17.31201171875, 18.056884765625, 18.8017578125, 19.546630859375, 20.29150390625, 21.036376953125, 21.78125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 3.0, 4.0, 12.0, 14.0, 19.0, 34.0, 70.0, 66.0, 98.0, 187.0, 339.0, 771.0, 19606.0, 3120394.0, 2951.0, 502.0, 256.0, 138.0, 84.0, 51.0, 27.0, 26.0, 18.0, 12.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.625, -91.6962890625, -88.767578125, -85.8388671875, -82.91015625, -79.9814453125, -77.052734375, -74.1240234375, -71.1953125, -68.2666015625, -65.337890625, -62.4091796875, -59.48046875, -56.5517578125, -53.623046875, -50.6943359375, -47.765625, -44.8369140625, -41.908203125, -38.9794921875, -36.05078125, -33.1220703125, -30.193359375, -27.2646484375, -24.3359375, -21.4072265625, -18.478515625, -15.5498046875, -12.62109375, -9.6923828125, -6.763671875, -3.8349609375, -0.90625, 2.0224609375, 4.951171875, 7.8798828125, 10.80859375, 13.7373046875, 16.666015625, 19.5947265625, 22.5234375, 25.4521484375, 28.380859375, 31.3095703125, 34.23828125, 37.1669921875, 40.095703125, 43.0244140625, 45.953125, 48.8818359375, 51.810546875, 54.7392578125, 57.66796875, 60.5966796875, 63.525390625, 66.4541015625, 69.3828125, 72.3115234375, 75.240234375, 78.1689453125, 81.09765625, 84.0263671875, 86.955078125, 89.8837890625, 92.8125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 57.0, 262.0, 490.0, 175.0, 19.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.70610809326172, -36.486854553222656, -33.26760482788086, -30.048351287841797, -26.829099655151367, -23.609848022460938, -20.390594482421875, -17.171342849731445, -13.952091217041016, -10.732839584350586, -7.51358699798584, -4.294334411621094, -1.075082778930664, 2.1441688537597656, 5.363422393798828, 8.582674026489258, 11.801925659179688, 15.021177291870117, 18.240428924560547, 21.45968246459961, 24.67893409729004, 27.89818572998047, 31.11743927001953, 34.336692810058594, 37.55594253540039, 40.77519607543945, 43.99444580078125, 47.21369934082031, 50.432952880859375, 53.65220260620117, 56.871456146240234, 60.09070587158203, 63.30995178222656, 66.52920532226562, 69.74845886230469, 72.96771240234375, 76.18695831298828, 79.40621185302734, 82.6254653930664, 85.84471893310547, 89.06396484375, 92.28321838378906, 95.50247192382812, 98.72172546386719, 101.94097137451172, 105.16022491455078, 108.37947845458984, 111.5987319946289, 114.81798553466797, 118.03723907470703, 121.2564926147461, 124.47573852539062, 127.69499206542969, 130.91424560546875, 134.1334991455078, 137.35275268554688, 140.57200622558594, 143.791259765625, 147.01051330566406, 150.22976684570312, 153.4490203857422, 156.66827392578125, 159.88751220703125, 163.1067657470703, 166.32601928710938]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 7.0, 7.0, 9.0, 12.0, 10.0, 13.0, 15.0, 20.0, 30.0, 31.0, 27.0, 24.0, 31.0, 25.0, 34.0, 39.0, 28.0, 36.0, 48.0, 41.0, 44.0, 43.0, 40.0, 40.0, 47.0, 32.0, 30.0, 27.0, 31.0, 38.0, 20.0, 23.0, 15.0, 12.0, 17.0, 9.0, 9.0, 6.0, 4.0, 10.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-68.74517822265625, -66.63235473632812, -64.51952362060547, -62.40669631958008, -60.29386901855469, -58.18104553222656, -56.06821823120117, -53.95539093017578, -51.84256362915039, -49.729736328125, -47.61690902709961, -45.50408172607422, -43.391258239746094, -41.27842712402344, -39.16560363769531, -37.05277633666992, -34.93994903564453, -32.82712173461914, -30.71429443359375, -28.601469039916992, -26.4886417388916, -24.37581443786621, -22.262989044189453, -20.150161743164062, -18.037334442138672, -15.924507141113281, -13.811680793762207, -11.698854446411133, -9.586027145385742, -7.473199844360352, -5.360373497009277, -3.247547149658203, -1.1347122192382812, 0.9781146049499512, 3.0909414291381836, 5.203768253326416, 7.316595077514648, 9.429422378540039, 11.542248725891113, 13.655075073242188, 15.767902374267578, 17.88072967529297, 19.99355697631836, 22.106382369995117, 24.219209671020508, 26.3320369720459, 28.444862365722656, 30.557689666748047, 32.67051696777344, 34.78334426879883, 36.89617156982422, 39.00899887084961, 41.121826171875, 43.234649658203125, 45.347476959228516, 47.460304260253906, 49.5731315612793, 51.68595886230469, 53.79878616333008, 55.91161346435547, 58.024436950683594, 60.13726806640625, 62.250091552734375, 64.3629150390625, 66.47574615478516]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 8.0, 7.0, 7.0, 7.0, 10.0, 19.0, 21.0, 16.0, 16.0, 14.0, 24.0, 20.0, 25.0, 35.0, 39.0, 45.0, 41.0, 50.0, 34.0, 46.0, 39.0, 40.0, 51.0, 34.0, 34.0, 23.0, 35.0, 31.0, 30.0, 33.0, 20.0, 21.0, 11.0, 20.0, 25.0, 12.0, 12.0, 13.0, 10.0, 3.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.203125, -6.9998779296875, -6.796630859375, -6.5933837890625, -6.39013671875, -6.1868896484375, -5.983642578125, -5.7803955078125, -5.5771484375, -5.3739013671875, -5.170654296875, -4.9674072265625, -4.76416015625, -4.5609130859375, -4.357666015625, -4.1544189453125, -3.951171875, -3.7479248046875, -3.544677734375, -3.3414306640625, -3.13818359375, -2.9349365234375, -2.731689453125, -2.5284423828125, -2.3251953125, -2.1219482421875, -1.918701171875, -1.7154541015625, -1.51220703125, -1.3089599609375, -1.105712890625, -0.9024658203125, -0.69921875, -0.4959716796875, -0.292724609375, -0.0894775390625, 0.11376953125, 0.3170166015625, 0.520263671875, 0.7235107421875, 0.9267578125, 1.1300048828125, 1.333251953125, 1.5364990234375, 1.73974609375, 1.9429931640625, 2.146240234375, 2.3494873046875, 2.552734375, 2.7559814453125, 2.959228515625, 3.1624755859375, 3.36572265625, 3.5689697265625, 3.772216796875, 3.9754638671875, 4.1787109375, 4.3819580078125, 4.585205078125, 4.7884521484375, 4.99169921875, 5.1949462890625, 5.398193359375, 5.6014404296875, 5.8046875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 10.0, 16.0, 23.0, 28.0, 39.0, 52.0, 60.0, 98.0, 116.0, 199.0, 420.0, 619.0, 1295.0, 3329.0, 10271.0, 41079.0, 243792.0, 1101097.0, 1824583.0, 775957.0, 150311.0, 28492.0, 7415.0, 2512.0, 1034.0, 501.0, 304.0, 186.0, 125.0, 87.0, 62.0, 45.0, 31.0, 30.0, 15.0, 11.0, 8.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-10.171875, -9.89215087890625, -9.6124267578125, -9.33270263671875, -9.052978515625, -8.77325439453125, -8.4935302734375, -8.21380615234375, -7.93408203125, -7.65435791015625, -7.3746337890625, -7.09490966796875, -6.815185546875, -6.53546142578125, -6.2557373046875, -5.97601318359375, -5.6962890625, -5.41656494140625, -5.1368408203125, -4.85711669921875, -4.577392578125, -4.29766845703125, -4.0179443359375, -3.73822021484375, -3.45849609375, -3.17877197265625, -2.8990478515625, -2.61932373046875, -2.339599609375, -2.05987548828125, -1.7801513671875, -1.50042724609375, -1.220703125, -0.94097900390625, -0.6612548828125, -0.38153076171875, -0.101806640625, 0.17791748046875, 0.4576416015625, 0.73736572265625, 1.01708984375, 1.29681396484375, 1.5765380859375, 1.85626220703125, 2.135986328125, 2.41571044921875, 2.6954345703125, 2.97515869140625, 3.2548828125, 3.53460693359375, 3.8143310546875, 4.09405517578125, 4.373779296875, 4.65350341796875, 4.9332275390625, 5.21295166015625, 5.49267578125, 5.77239990234375, 6.0521240234375, 6.33184814453125, 6.611572265625, 6.89129638671875, 7.1710205078125, 7.45074462890625, 7.73046875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 10.0, 10.0, 16.0, 31.0, 42.0, 59.0, 72.0, 109.0, 152.0, 241.0, 271.0, 397.0, 442.0, 471.0, 419.0, 377.0, 266.0, 196.0, 157.0, 99.0, 56.0, 54.0, 38.0, 19.0, 18.0, 17.0, 7.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.5784912109375, -12.102294921875, -11.6260986328125, -11.14990234375, -10.6737060546875, -10.197509765625, -9.7213134765625, -9.2451171875, -8.7689208984375, -8.292724609375, -7.8165283203125, -7.34033203125, -6.8641357421875, -6.387939453125, -5.9117431640625, -5.435546875, -4.9593505859375, -4.483154296875, -4.0069580078125, -3.53076171875, -3.0545654296875, -2.578369140625, -2.1021728515625, -1.6259765625, -1.1497802734375, -0.673583984375, -0.1973876953125, 0.27880859375, 0.7550048828125, 1.231201171875, 1.7073974609375, 2.18359375, 2.6597900390625, 3.135986328125, 3.6121826171875, 4.08837890625, 4.5645751953125, 5.040771484375, 5.5169677734375, 5.9931640625, 6.4693603515625, 6.945556640625, 7.4217529296875, 7.89794921875, 8.3741455078125, 8.850341796875, 9.3265380859375, 9.802734375, 10.2789306640625, 10.755126953125, 11.2313232421875, 11.70751953125, 12.1837158203125, 12.659912109375, 13.1361083984375, 13.6123046875, 14.0885009765625, 14.564697265625, 15.0408935546875, 15.51708984375, 15.9932861328125, 16.469482421875, 16.9456787109375, 17.421875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 4.0, 7.0, 14.0, 13.0, 10.0, 22.0, 22.0, 35.0, 52.0, 62.0, 69.0, 83.0, 105.0, 176.0, 277.0, 424.0, 1088.0, 11463.0, 3095361.0, 1077140.0, 5678.0, 871.0, 440.0, 229.0, 145.0, 114.0, 63.0, 58.0, 45.0, 43.0, 32.0, 28.0, 10.0, 24.0, 17.0, 9.0, 13.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-50.59375, -48.95654296875, -47.3193359375, -45.68212890625, -44.044921875, -42.40771484375, -40.7705078125, -39.13330078125, -37.49609375, -35.85888671875, -34.2216796875, -32.58447265625, -30.947265625, -29.31005859375, -27.6728515625, -26.03564453125, -24.3984375, -22.76123046875, -21.1240234375, -19.48681640625, -17.849609375, -16.21240234375, -14.5751953125, -12.93798828125, -11.30078125, -9.66357421875, -8.0263671875, -6.38916015625, -4.751953125, -3.11474609375, -1.4775390625, 0.15966796875, 1.796875, 3.43408203125, 5.0712890625, 6.70849609375, 8.345703125, 9.98291015625, 11.6201171875, 13.25732421875, 14.89453125, 16.53173828125, 18.1689453125, 19.80615234375, 21.443359375, 23.08056640625, 24.7177734375, 26.35498046875, 27.9921875, 29.62939453125, 31.2666015625, 32.90380859375, 34.541015625, 36.17822265625, 37.8154296875, 39.45263671875, 41.08984375, 42.72705078125, 44.3642578125, 46.00146484375, 47.638671875, 49.27587890625, 50.9130859375, 52.55029296875, 54.1875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 20.0, 25.0, 85.0, 155.0, 213.0, 206.0, 156.0, 89.0, 42.0, 9.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.6499252319336, -69.373046875, -66.0961685180664, -62.81929016113281, -59.54241180419922, -56.265533447265625, -52.98865509033203, -49.71177673339844, -46.434898376464844, -43.15802001953125, -39.881141662597656, -36.60426330566406, -33.32738494873047, -30.050506591796875, -26.77362823486328, -23.496749877929688, -20.219871520996094, -16.9429931640625, -13.666114807128906, -10.389236450195312, -7.112358093261719, -3.835479736328125, -0.5586013793945312, 2.7182769775390625, 5.995155334472656, 9.27203369140625, 12.548912048339844, 15.825790405273438, 19.10266876220703, 22.379547119140625, 25.65642547607422, 28.933303833007812, 32.210174560546875, 35.48705291748047, 38.76393127441406, 42.040809631347656, 45.31768798828125, 48.594566345214844, 51.87144470214844, 55.14832305908203, 58.425201416015625, 61.70207977294922, 64.97895812988281, 68.2558364868164, 71.53271484375, 74.8095932006836, 78.08647155761719, 81.36334991455078, 84.64022827148438, 87.91710662841797, 91.19398498535156, 94.47086334228516, 97.74774169921875, 101.02462005615234, 104.30149841308594, 107.57837677001953, 110.85525512695312, 114.13213348388672, 117.40901184082031, 120.6858901977539, 123.9627685546875, 127.2396469116211, 130.5165252685547, 133.79339599609375, 137.07028198242188]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 8.0, 3.0, 8.0, 14.0, 4.0, 9.0, 11.0, 29.0, 21.0, 24.0, 28.0, 27.0, 33.0, 35.0, 35.0, 37.0, 50.0, 51.0, 41.0, 52.0, 38.0, 49.0, 39.0, 38.0, 37.0, 32.0, 27.0, 39.0, 22.0, 24.0, 17.0, 28.0, 14.0, 18.0, 15.0, 14.0, 8.0, 10.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.84675598144531, -40.31849670410156, -38.79023742675781, -37.26197814941406, -35.73371887207031, -34.20545959472656, -32.67720031738281, -31.14893913269043, -29.62067985534668, -28.09242057800293, -26.56416130065918, -25.035900115966797, -23.507640838623047, -21.979381561279297, -20.451122283935547, -18.922863006591797, -17.394603729248047, -15.866344451904297, -14.338085174560547, -12.80982494354248, -11.28156566619873, -9.75330638885498, -8.225046157836914, -6.696786880493164, -5.168527603149414, -3.640268087387085, -2.112008571624756, -0.5837488174438477, 0.9445104598999023, 2.4727697372436523, 4.001029968261719, 5.529289245605469, 7.057548522949219, 8.585807800292969, 10.114067077636719, 11.642327308654785, 13.170586585998535, 14.698845863342285, 16.22710609436035, 17.7553653717041, 19.28362464904785, 20.8118839263916, 22.34014320373535, 23.868404388427734, 25.396663665771484, 26.924922943115234, 28.453182220458984, 29.981441497802734, 31.509700775146484, 33.037960052490234, 34.566219329833984, 36.094478607177734, 37.622737884521484, 39.150997161865234, 40.67926025390625, 42.20751953125, 43.73577880859375, 45.2640380859375, 46.79229736328125, 48.320556640625, 49.84881591796875, 51.3770751953125, 52.90533447265625, 54.43359375, 55.96185302734375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 7.0, 12.0, 12.0, 12.0, 21.0, 21.0, 17.0, 18.0, 31.0, 29.0, 24.0, 26.0, 43.0, 33.0, 38.0, 55.0, 42.0, 45.0, 44.0, 41.0, 31.0, 56.0, 42.0, 26.0, 26.0, 21.0, 30.0, 25.0, 24.0, 22.0, 22.0, 25.0, 8.0, 7.0, 17.0, 12.0, 6.0, 7.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.46875, -7.25604248046875, -7.0433349609375, -6.83062744140625, -6.617919921875, -6.40521240234375, -6.1925048828125, -5.97979736328125, -5.76708984375, -5.55438232421875, -5.3416748046875, -5.12896728515625, -4.916259765625, -4.70355224609375, -4.4908447265625, -4.27813720703125, -4.0654296875, -3.85272216796875, -3.6400146484375, -3.42730712890625, -3.214599609375, -3.00189208984375, -2.7891845703125, -2.57647705078125, -2.36376953125, -2.15106201171875, -1.9383544921875, -1.72564697265625, -1.512939453125, -1.30023193359375, -1.0875244140625, -0.87481689453125, -0.662109375, -0.44940185546875, -0.2366943359375, -0.02398681640625, 0.188720703125, 0.40142822265625, 0.6141357421875, 0.82684326171875, 1.03955078125, 1.25225830078125, 1.4649658203125, 1.67767333984375, 1.890380859375, 2.10308837890625, 2.3157958984375, 2.52850341796875, 2.7412109375, 2.95391845703125, 3.1666259765625, 3.37933349609375, 3.592041015625, 3.80474853515625, 4.0174560546875, 4.23016357421875, 4.44287109375, 4.65557861328125, 4.8682861328125, 5.08099365234375, 5.293701171875, 5.50640869140625, 5.7191162109375, 5.93182373046875, 6.14453125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 13.0, 18.0, 24.0, 38.0, 70.0, 78.0, 117.0, 200.0, 327.0, 554.0, 915.0, 1730.0, 2715.0, 4715.0, 7341.0, 11955.0, 19495.0, 31888.0, 56480.0, 111154.0, 293796.0, 266265.0, 105377.0, 54179.0, 30866.0, 18472.0, 11511.0, 7115.0, 4342.0, 2774.0, 1662.0, 977.0, 592.0, 301.0, 163.0, 109.0, 74.0, 60.0, 30.0, 19.0, 16.0, 14.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.8720703125, -1.8185272216796875, -1.764984130859375, -1.7114410400390625, -1.65789794921875, -1.6043548583984375, -1.550811767578125, -1.4972686767578125, -1.4437255859375, -1.3901824951171875, -1.336639404296875, -1.2830963134765625, -1.22955322265625, -1.1760101318359375, -1.122467041015625, -1.0689239501953125, -1.015380859375, -0.9618377685546875, -0.908294677734375, -0.8547515869140625, -0.80120849609375, -0.7476654052734375, -0.694122314453125, -0.6405792236328125, -0.5870361328125, -0.5334930419921875, -0.479949951171875, -0.4264068603515625, -0.37286376953125, -0.3193206787109375, -0.265777587890625, -0.2122344970703125, -0.15869140625, -0.1051483154296875, -0.051605224609375, 0.0019378662109375, 0.05548095703125, 0.1090240478515625, 0.162567138671875, 0.2161102294921875, 0.2696533203125, 0.3231964111328125, 0.376739501953125, 0.4302825927734375, 0.48382568359375, 0.5373687744140625, 0.590911865234375, 0.6444549560546875, 0.697998046875, 0.7515411376953125, 0.805084228515625, 0.8586273193359375, 0.91217041015625, 0.9657135009765625, 1.019256591796875, 1.0727996826171875, 1.1263427734375, 1.1798858642578125, 1.233428955078125, 1.2869720458984375, 1.34051513671875, 1.3940582275390625, 1.447601318359375, 1.5011444091796875, 1.5546875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 7.0, 4.0, 7.0, 9.0, 15.0, 11.0, 17.0, 15.0, 23.0, 19.0, 19.0, 28.0, 27.0, 23.0, 29.0, 22.0, 34.0, 29.0, 26.0, 35.0, 22.0, 36.0, 1065.0, 42.0, 40.0, 34.0, 36.0, 36.0, 30.0, 27.0, 25.0, 24.0, 20.0, 33.0, 27.0, 12.0, 13.0, 18.0, 13.0, 12.0, 9.0, 10.0, 10.0, 6.0, 4.0, 7.0, 2.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.666015625, -3.548614501953125, -3.43121337890625, -3.313812255859375, -3.1964111328125, -3.079010009765625, -2.96160888671875, -2.844207763671875, -2.726806640625, -2.609405517578125, -2.49200439453125, -2.374603271484375, -2.2572021484375, -2.139801025390625, -2.02239990234375, -1.904998779296875, -1.78759765625, -1.670196533203125, -1.55279541015625, -1.435394287109375, -1.3179931640625, -1.200592041015625, -1.08319091796875, -0.965789794921875, -0.848388671875, -0.730987548828125, -0.61358642578125, -0.496185302734375, -0.3787841796875, -0.261383056640625, -0.14398193359375, -0.026580810546875, 0.0908203125, 0.208221435546875, 0.32562255859375, 0.443023681640625, 0.5604248046875, 0.677825927734375, 0.79522705078125, 0.912628173828125, 1.030029296875, 1.147430419921875, 1.26483154296875, 1.382232666015625, 1.4996337890625, 1.617034912109375, 1.73443603515625, 1.851837158203125, 1.96923828125, 2.086639404296875, 2.20404052734375, 2.321441650390625, 2.4388427734375, 2.556243896484375, 2.67364501953125, 2.791046142578125, 2.908447265625, 3.025848388671875, 3.14324951171875, 3.260650634765625, 3.3780517578125, 3.495452880859375, 3.61285400390625, 3.730255126953125, 3.84765625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 9.0, 13.0, 13.0, 30.0, 32.0, 62.0, 62.0, 110.0, 149.0, 205.0, 287.0, 416.0, 581.0, 783.0, 1160.0, 1616.0, 2361.0, 3288.0, 4797.0, 6769.0, 9651.0, 13961.0, 20000.0, 28517.0, 41604.0, 62355.0, 98887.0, 196718.0, 1283643.0, 107318.0, 67105.0, 44181.0, 30437.0, 21083.0, 14815.0, 10244.0, 7232.0, 5078.0, 3555.0, 2451.0, 1714.0, 1166.0, 834.0, 578.0, 385.0, 271.0, 190.0, 126.0, 92.0, 62.0, 52.0, 32.0, 25.0, 13.0, 8.0, 11.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.1494140625, -1.11358642578125, -1.0777587890625, -1.04193115234375, -1.006103515625, -0.97027587890625, -0.9344482421875, -0.89862060546875, -0.86279296875, -0.82696533203125, -0.7911376953125, -0.75531005859375, -0.719482421875, -0.68365478515625, -0.6478271484375, -0.61199951171875, -0.576171875, -0.54034423828125, -0.5045166015625, -0.46868896484375, -0.432861328125, -0.39703369140625, -0.3612060546875, -0.32537841796875, -0.28955078125, -0.25372314453125, -0.2178955078125, -0.18206787109375, -0.146240234375, -0.11041259765625, -0.0745849609375, -0.03875732421875, -0.0029296875, 0.03289794921875, 0.0687255859375, 0.10455322265625, 0.140380859375, 0.17620849609375, 0.2120361328125, 0.24786376953125, 0.28369140625, 0.31951904296875, 0.3553466796875, 0.39117431640625, 0.427001953125, 0.46282958984375, 0.4986572265625, 0.53448486328125, 0.5703125, 0.60614013671875, 0.6419677734375, 0.67779541015625, 0.713623046875, 0.74945068359375, 0.7852783203125, 0.82110595703125, 0.85693359375, 0.89276123046875, 0.9285888671875, 0.96441650390625, 1.000244140625, 1.03607177734375, 1.0718994140625, 1.10772705078125, 1.1435546875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 0.0, 3.0, 1.0, 4.0, 9.0, 4.0, 5.0, 5.0, 11.0, 11.0, 12.0, 11.0, 30.0, 31.0, 42.0, 76.0, 78.0, 113.0, 142.0, 125.0, 81.0, 60.0, 42.0, 27.0, 22.0, 17.0, 9.0, 7.0, 7.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010986328125, -0.0010675638914108276, -0.0010364949703216553, -0.001005426049232483, -0.0009743571281433105, -0.0009432882070541382, -0.0009122192859649658, -0.0008811503648757935, -0.0008500814437866211, -0.0008190125226974487, -0.0007879436016082764, -0.000756874680519104, -0.0007258057594299316, -0.0006947368383407593, -0.0006636679172515869, -0.0006325989961624146, -0.0006015300750732422, -0.0005704611539840698, -0.0005393922328948975, -0.0005083233118057251, -0.00047725439071655273, -0.00044618546962738037, -0.000415116548538208, -0.00038404762744903564, -0.0003529787063598633, -0.0003219097852706909, -0.00029084086418151855, -0.0002597719430923462, -0.00022870302200317383, -0.00019763410091400146, -0.0001665651798248291, -0.00013549625873565674, -0.00010442733764648438, -7.335841655731201e-05, -4.228949546813965e-05, -1.1220574378967285e-05, 1.9848346710205078e-05, 5.091726779937744e-05, 8.19861888885498e-05, 0.00011305510997772217, 0.00014412403106689453, 0.0001751929521560669, 0.00020626187324523926, 0.00023733079433441162, 0.000268399715423584, 0.00029946863651275635, 0.0003305375576019287, 0.0003616064786911011, 0.00039267539978027344, 0.0004237443208694458, 0.00045481324195861816, 0.00048588216304779053, 0.0005169510841369629, 0.0005480200052261353, 0.0005790889263153076, 0.00061015784740448, 0.0006412267684936523, 0.0006722956895828247, 0.0007033646106719971, 0.0007344335317611694, 0.0007655024528503418, 0.0007965713739395142, 0.0008276402950286865, 0.0008587092161178589, 0.0008897781372070312]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 8.0, 8.0, 11.0, 15.0, 31.0, 41.0, 59.0, 87.0, 154.0, 436.0, 3415.0, 1041058.0, 2385.0, 423.0, 135.0, 78.0, 46.0, 55.0, 23.0, 15.0, 17.0, 10.0, 11.0, 8.0, 8.0, 5.0, 3.0, 0.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0207672119140625, -0.02003765106201172, -0.019308090209960938, -0.018578529357910156, -0.017848968505859375, -0.017119407653808594, -0.016389846801757812, -0.01566028594970703, -0.01493072509765625, -0.014201164245605469, -0.013471603393554688, -0.012742042541503906, -0.012012481689453125, -0.011282920837402344, -0.010553359985351562, -0.009823799133300781, -0.00909423828125, -0.008364677429199219, -0.0076351165771484375, -0.006905555725097656, -0.006175994873046875, -0.005446434020996094, -0.0047168731689453125, -0.003987312316894531, -0.00325775146484375, -0.0025281906127929688, -0.0017986297607421875, -0.0010690689086914062, -0.000339508056640625, 0.00039005279541015625, 0.0011196136474609375, 0.0018491744995117188, 0.0025787353515625, 0.0033082962036132812, 0.0040378570556640625, 0.004767417907714844, 0.005496978759765625, 0.006226539611816406, 0.0069561004638671875, 0.007685661315917969, 0.00841522216796875, 0.009144783020019531, 0.009874343872070312, 0.010603904724121094, 0.011333465576171875, 0.012063026428222656, 0.012792587280273438, 0.013522148132324219, 0.014251708984375, 0.014981269836425781, 0.015710830688476562, 0.016440391540527344, 0.017169952392578125, 0.017899513244628906, 0.018629074096679688, 0.01935863494873047, 0.02008819580078125, 0.02081775665283203, 0.021547317504882812, 0.022276878356933594, 0.023006439208984375, 0.023736000061035156, 0.024465560913085938, 0.02519512176513672, 0.0259246826171875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 11.0, 27.0, 40.0, 78.0, 90.0, 127.0, 142.0, 146.0, 135.0, 73.0, 50.0, 33.0, 18.0, 14.0, 8.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043618600466288626, -0.00042153120739385486, -0.00040687641012482345, -0.00039222161285579205, -0.0003775667864829302, -0.00036291201831772923, -0.00034825719194486737, -0.00033360239467583597, -0.00031894759740680456, -0.00030429280013777316, -0.00028963800286874175, -0.00027498320559971035, -0.00026032840833067894, -0.0002456735819578171, -0.00023101878468878567, -0.00021636398741975427, -0.00020170919015072286, -0.00018705439288169146, -0.00017239959561266005, -0.00015774478379171342, -0.000143089986522682, -0.0001284351892536506, -0.00011378038470866159, -9.912558016367257e-05, -8.447078289464116e-05, -6.981598562560976e-05, -5.5161181080620736e-05, -4.050638017361052e-05, -2.585157926660031e-05, -1.1196781997568905e-05, 3.4580225474201143e-06, 1.8112827092409134e-05, 3.276759525761008e-05, 4.7422396164620295e-05, 6.207719707163051e-05, 7.673200161661953e-05, 9.138679888565093e-05, 0.00010604159615468234, 0.00012069640069967136, 0.00013535120524466038, 0.00015000600251369178, 0.0001646607997827232, 0.0001793155970517546, 0.00019397040887270123, 0.00020862520614173263, 0.00022328000341076404, 0.00023793481523171067, 0.0002525896125007421, 0.0002672444097697735, 0.0002818992070388049, 0.0002965540043078363, 0.0003112088015768677, 0.0003258635988458991, 0.00034051842521876097, 0.00035517322248779237, 0.0003698280197568238, 0.0003844828170258552, 0.0003991376142948866, 0.000413792411563918, 0.0004284472088329494, 0.00044310203520581126, 0.0004577568033710122, 0.0004724116297438741, 0.0004870664270129055, 0.0005017212242819369]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 10.0, 10.0, 7.0, 15.0, 16.0, 22.0, 24.0, 24.0, 22.0, 31.0, 28.0, 26.0, 37.0, 38.0, 43.0, 33.0, 36.0, 39.0, 47.0, 31.0, 43.0, 38.0, 33.0, 33.0, 38.0, 32.0, 38.0, 32.0, 18.0, 15.0, 22.0, 19.0, 10.0, 17.0, 11.0, 8.0, 10.0, 5.0, 9.0, 6.0, 2.0, 3.0, 6.0, 0.0, 4.0, 4.0, 0.0, 1.0], "bins": [-0.0003591775894165039, -0.00034872163087129593, -0.00033826567232608795, -0.00032780971378088, -0.000317353755235672, -0.000306897796690464, -0.00029644183814525604, -0.00028598587960004807, -0.0002755299210548401, -0.0002650739625096321, -0.00025461800396442413, -0.00024416204541921616, -0.00023370608687400818, -0.0002232501283288002, -0.00021279416978359222, -0.00020233821123838425, -0.00019188225269317627, -0.0001814262941479683, -0.00017097033560276031, -0.00016051437705755234, -0.00015005841851234436, -0.00013960245996713638, -0.0001291465014219284, -0.00011869054287672043, -0.00010823458433151245, -9.777862578630447e-05, -8.73226672410965e-05, -7.686670869588852e-05, -6.641075015068054e-05, -5.5954791605472565e-05, -4.549883306026459e-05, -3.504287451505661e-05, -2.4586915969848633e-05, -1.4130957424640656e-05, -3.6749988794326782e-06, 6.780959665775299e-06, 1.7236918210983276e-05, 2.7692876756191254e-05, 3.814883530139923e-05, 4.860479384660721e-05, 5.9060752391815186e-05, 6.951671093702316e-05, 7.997266948223114e-05, 9.042862802743912e-05, 0.0001008845865726471, 0.00011134054511785507, 0.00012179650366306305, 0.00013225246220827103, 0.000142708420753479, 0.00015316437929868698, 0.00016362033784389496, 0.00017407629638910294, 0.0001845322549343109, 0.0001949882134795189, 0.00020544417202472687, 0.00021590013056993484, 0.00022635608911514282, 0.0002368120476603508, 0.0002472680062055588, 0.00025772396475076675, 0.00026817992329597473, 0.0002786358818411827, 0.0002890918403863907, 0.00029954779893159866, 0.00031000375747680664]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 7.0, 12.0, 12.0, 12.0, 21.0, 21.0, 17.0, 18.0, 31.0, 29.0, 24.0, 26.0, 43.0, 33.0, 39.0, 54.0, 42.0, 45.0, 44.0, 41.0, 31.0, 56.0, 42.0, 26.0, 26.0, 21.0, 30.0, 25.0, 24.0, 22.0, 22.0, 25.0, 8.0, 7.0, 17.0, 12.0, 6.0, 7.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.46875, -7.25604248046875, -7.0433349609375, -6.83062744140625, -6.617919921875, -6.40521240234375, -6.1925048828125, -5.97979736328125, -5.76708984375, -5.55438232421875, -5.3416748046875, -5.12896728515625, -4.916259765625, -4.70355224609375, -4.4908447265625, -4.27813720703125, -4.0654296875, -3.85272216796875, -3.6400146484375, -3.42730712890625, -3.214599609375, -3.00189208984375, -2.7891845703125, -2.57647705078125, -2.36376953125, -2.15106201171875, -1.9383544921875, -1.72564697265625, -1.512939453125, -1.30023193359375, -1.0875244140625, -0.87481689453125, -0.662109375, -0.44940185546875, -0.2366943359375, -0.02398681640625, 0.188720703125, 0.40142822265625, 0.6141357421875, 0.82684326171875, 1.03955078125, 1.25225830078125, 1.4649658203125, 1.67767333984375, 1.890380859375, 2.10308837890625, 2.3157958984375, 2.52850341796875, 2.7412109375, 2.95391845703125, 3.1666259765625, 3.37933349609375, 3.592041015625, 3.80474853515625, 4.0174560546875, 4.23016357421875, 4.44287109375, 4.65557861328125, 4.8682861328125, 5.08099365234375, 5.293701171875, 5.50640869140625, 5.7191162109375, 5.93182373046875, 6.14453125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 11.0, 15.0, 22.0, 28.0, 44.0, 61.0, 90.0, 139.0, 225.0, 339.0, 577.0, 1089.0, 2294.0, 4945.0, 11798.0, 31848.0, 95626.0, 317483.0, 394345.0, 121231.0, 40299.0, 14463.0, 5927.0, 2599.0, 1301.0, 655.0, 403.0, 242.0, 138.0, 91.0, 73.0, 51.0, 28.0, 23.0, 18.0, 9.0, 7.0, 2.0, 7.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.17352294921875, -5.0072021484375, -4.84088134765625, -4.674560546875, -4.50823974609375, -4.3419189453125, -4.17559814453125, -4.00927734375, -3.84295654296875, -3.6766357421875, -3.51031494140625, -3.343994140625, -3.17767333984375, -3.0113525390625, -2.84503173828125, -2.6787109375, -2.51239013671875, -2.3460693359375, -2.17974853515625, -2.013427734375, -1.84710693359375, -1.6807861328125, -1.51446533203125, -1.34814453125, -1.18182373046875, -1.0155029296875, -0.84918212890625, -0.682861328125, -0.51654052734375, -0.3502197265625, -0.18389892578125, -0.017578125, 0.14874267578125, 0.3150634765625, 0.48138427734375, 0.647705078125, 0.81402587890625, 0.9803466796875, 1.14666748046875, 1.31298828125, 1.47930908203125, 1.6456298828125, 1.81195068359375, 1.978271484375, 2.14459228515625, 2.3109130859375, 2.47723388671875, 2.6435546875, 2.80987548828125, 2.9761962890625, 3.14251708984375, 3.308837890625, 3.47515869140625, 3.6414794921875, 3.80780029296875, 3.97412109375, 4.14044189453125, 4.3067626953125, 4.47308349609375, 4.639404296875, 4.80572509765625, 4.9720458984375, 5.13836669921875, 5.3046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 5.0, 16.0, 11.0, 14.0, 24.0, 25.0, 29.0, 20.0, 40.0, 54.0, 43.0, 58.0, 94.0, 183.0, 1759.0, 198.0, 81.0, 65.0, 50.0, 53.0, 44.0, 33.0, 30.0, 22.0, 24.0, 14.0, 13.0, 13.0, 6.0, 3.0, 6.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-39.0, -37.960693359375, -36.92138671875, -35.882080078125, -34.8427734375, -33.803466796875, -32.76416015625, -31.724853515625, -30.685546875, -29.646240234375, -28.60693359375, -27.567626953125, -26.5283203125, -25.489013671875, -24.44970703125, -23.410400390625, -22.37109375, -21.331787109375, -20.29248046875, -19.253173828125, -18.2138671875, -17.174560546875, -16.13525390625, -15.095947265625, -14.056640625, -13.017333984375, -11.97802734375, -10.938720703125, -9.8994140625, -8.860107421875, -7.82080078125, -6.781494140625, -5.7421875, -4.702880859375, -3.66357421875, -2.624267578125, -1.5849609375, -0.545654296875, 0.49365234375, 1.532958984375, 2.572265625, 3.611572265625, 4.65087890625, 5.690185546875, 6.7294921875, 7.768798828125, 8.80810546875, 9.847412109375, 10.88671875, 11.926025390625, 12.96533203125, 14.004638671875, 15.0439453125, 16.083251953125, 17.12255859375, 18.161865234375, 19.201171875, 20.240478515625, 21.27978515625, 22.319091796875, 23.3583984375, 24.397705078125, 25.43701171875, 26.476318359375, 27.515625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 9.0, 3.0, 9.0, 9.0, 27.0, 18.0, 32.0, 33.0, 55.0, 59.0, 112.0, 166.0, 199.0, 356.0, 711.0, 7456.0, 3127895.0, 6806.0, 698.0, 344.0, 201.0, 158.0, 107.0, 50.0, 47.0, 50.0, 23.0, 20.0, 17.0, 10.0, 9.0, 2.0, 5.0, 3.0, 7.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.125, -63.7197265625, -61.314453125, -58.9091796875, -56.50390625, -54.0986328125, -51.693359375, -49.2880859375, -46.8828125, -44.4775390625, -42.072265625, -39.6669921875, -37.26171875, -34.8564453125, -32.451171875, -30.0458984375, -27.640625, -25.2353515625, -22.830078125, -20.4248046875, -18.01953125, -15.6142578125, -13.208984375, -10.8037109375, -8.3984375, -5.9931640625, -3.587890625, -1.1826171875, 1.22265625, 3.6279296875, 6.033203125, 8.4384765625, 10.84375, 13.2490234375, 15.654296875, 18.0595703125, 20.46484375, 22.8701171875, 25.275390625, 27.6806640625, 30.0859375, 32.4912109375, 34.896484375, 37.3017578125, 39.70703125, 42.1123046875, 44.517578125, 46.9228515625, 49.328125, 51.7333984375, 54.138671875, 56.5439453125, 58.94921875, 61.3544921875, 63.759765625, 66.1650390625, 68.5703125, 70.9755859375, 73.380859375, 75.7861328125, 78.19140625, 80.5966796875, 83.001953125, 85.4072265625, 87.8125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 9.0, 25.0, 82.0, 187.0, 332.0, 259.0, 95.0, 24.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.437366485595703, -14.722323417663574, -13.007280349731445, -11.292236328125, -9.577193260192871, -7.862150192260742, -6.147106170654297, -4.432063102722168, -2.717020034790039, -1.001976728439331, 0.713066577911377, 2.428110122680664, 4.143153190612793, 5.858196258544922, 7.573240280151367, 9.288283348083496, 11.003326416015625, 12.718369483947754, 14.433412551879883, 16.148456573486328, 17.86349868774414, 19.578542709350586, 21.29358673095703, 23.008628845214844, 24.72367286682129, 26.438716888427734, 28.153759002685547, 29.868803024291992, 31.583847045898438, 33.29888916015625, 35.01393127441406, 36.72897720336914, 38.44401550292969, 40.1590576171875, 41.87410354614258, 43.58914566040039, 45.3041877746582, 47.01923370361328, 48.734275817871094, 50.449317932128906, 52.16436004638672, 53.87940216064453, 55.59444808959961, 57.30949020385742, 59.024532318115234, 60.73957824707031, 62.454620361328125, 64.16966247558594, 65.88470458984375, 67.59974670410156, 69.31478881835938, 71.02983093261719, 72.74488067626953, 74.45992279052734, 76.17496490478516, 77.89000701904297, 79.60505676269531, 81.32009887695312, 83.03514099121094, 84.75018310546875, 86.4652328491211, 88.1802749633789, 89.89531707763672, 91.61035919189453, 93.32540130615234]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 6.0, 5.0, 8.0, 14.0, 7.0, 17.0, 16.0, 17.0, 28.0, 25.0, 26.0, 35.0, 29.0, 40.0, 34.0, 34.0, 38.0, 39.0, 45.0, 40.0, 33.0, 43.0, 40.0, 41.0, 37.0, 23.0, 28.0, 36.0, 29.0, 16.0, 32.0, 22.0, 17.0, 10.0, 16.0, 15.0, 7.0, 10.0, 7.0, 7.0, 9.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-62.862335205078125, -60.94387435913086, -59.02541732788086, -57.106956481933594, -55.188499450683594, -53.27003860473633, -51.35157775878906, -49.43312072753906, -47.51466369628906, -45.5962028503418, -43.6777458190918, -41.75928497314453, -39.84082794189453, -37.922367095947266, -36.00390625, -34.08544921875, -32.166988372802734, -30.2485294342041, -28.33007049560547, -26.411609649658203, -24.493152618408203, -22.574691772460938, -20.656232833862305, -18.737773895263672, -16.81931495666504, -14.900856018066406, -12.982397079467773, -11.063937187194824, -9.145478248596191, -7.227019309997559, -5.308559417724609, -3.3901004791259766, -1.4716453552246094, 0.44681382179260254, 2.3652729988098145, 4.2837324142456055, 6.202191352844238, 8.120650291442871, 10.03911018371582, 11.957569122314453, 13.876028060913086, 15.794486999511719, 17.71294593811035, 19.631404876708984, 21.54986572265625, 23.46832275390625, 25.386783599853516, 27.30524253845215, 29.22370147705078, 31.142160415649414, 33.06061935424805, 34.97908020019531, 36.89753723144531, 38.81599807739258, 40.734458923339844, 42.652915954589844, 44.571372985839844, 46.48983383178711, 48.40829086303711, 50.326751708984375, 52.245208740234375, 54.16366958618164, 56.082130432128906, 58.000587463378906, 59.91904830932617]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 6.0, 14.0, 16.0, 21.0, 17.0, 16.0, 25.0, 23.0, 26.0, 32.0, 20.0, 32.0, 28.0, 32.0, 41.0, 49.0, 47.0, 47.0, 41.0, 36.0, 42.0, 42.0, 40.0, 28.0, 25.0, 28.0, 21.0, 26.0, 27.0, 27.0, 17.0, 22.0, 12.0, 12.0, 6.0, 17.0, 8.0, 5.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.08599853515625, -6.8712158203125, -6.65643310546875, -6.441650390625, -6.22686767578125, -6.0120849609375, -5.79730224609375, -5.58251953125, -5.36773681640625, -5.1529541015625, -4.93817138671875, -4.723388671875, -4.50860595703125, -4.2938232421875, -4.07904052734375, -3.8642578125, -3.64947509765625, -3.4346923828125, -3.21990966796875, -3.005126953125, -2.79034423828125, -2.5755615234375, -2.36077880859375, -2.14599609375, -1.93121337890625, -1.7164306640625, -1.50164794921875, -1.286865234375, -1.07208251953125, -0.8572998046875, -0.64251708984375, -0.427734375, -0.21295166015625, 0.0018310546875, 0.21661376953125, 0.431396484375, 0.64617919921875, 0.8609619140625, 1.07574462890625, 1.29052734375, 1.50531005859375, 1.7200927734375, 1.93487548828125, 2.149658203125, 2.36444091796875, 2.5792236328125, 2.79400634765625, 3.0087890625, 3.22357177734375, 3.4383544921875, 3.65313720703125, 3.867919921875, 4.08270263671875, 4.2974853515625, 4.51226806640625, 4.72705078125, 4.94183349609375, 5.1566162109375, 5.37139892578125, 5.586181640625, 5.80096435546875, 6.0157470703125, 6.23052978515625, 6.4453125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 4.0, 6.0, 12.0, 15.0, 20.0, 20.0, 22.0, 37.0, 42.0, 55.0, 56.0, 93.0, 163.0, 330.0, 795.0, 6789.0, 784809.0, 3352495.0, 45608.0, 1779.0, 423.0, 220.0, 122.0, 80.0, 56.0, 42.0, 32.0, 26.0, 27.0, 15.0, 16.0, 11.0, 15.0, 8.0, 11.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.942138671875, -31.00927734375, -30.076416015625, -29.1435546875, -28.210693359375, -27.27783203125, -26.344970703125, -25.412109375, -24.479248046875, -23.54638671875, -22.613525390625, -21.6806640625, -20.747802734375, -19.81494140625, -18.882080078125, -17.94921875, -17.016357421875, -16.08349609375, -15.150634765625, -14.2177734375, -13.284912109375, -12.35205078125, -11.419189453125, -10.486328125, -9.553466796875, -8.62060546875, -7.687744140625, -6.7548828125, -5.822021484375, -4.88916015625, -3.956298828125, -3.0234375, -2.090576171875, -1.15771484375, -0.224853515625, 0.7080078125, 1.640869140625, 2.57373046875, 3.506591796875, 4.439453125, 5.372314453125, 6.30517578125, 7.238037109375, 8.1708984375, 9.103759765625, 10.03662109375, 10.969482421875, 11.90234375, 12.835205078125, 13.76806640625, 14.700927734375, 15.6337890625, 16.566650390625, 17.49951171875, 18.432373046875, 19.365234375, 20.298095703125, 21.23095703125, 22.163818359375, 23.0966796875, 24.029541015625, 24.96240234375, 25.895263671875, 26.828125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 9.0, 6.0, 6.0, 15.0, 12.0, 22.0, 20.0, 35.0, 47.0, 54.0, 91.0, 121.0, 183.0, 220.0, 259.0, 354.0, 480.0, 460.0, 388.0, 314.0, 261.0, 175.0, 151.0, 103.0, 80.0, 60.0, 46.0, 20.0, 19.0, 12.0, 17.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.2109375, -14.78955078125, -14.3681640625, -13.94677734375, -13.525390625, -13.10400390625, -12.6826171875, -12.26123046875, -11.83984375, -11.41845703125, -10.9970703125, -10.57568359375, -10.154296875, -9.73291015625, -9.3115234375, -8.89013671875, -8.46875, -8.04736328125, -7.6259765625, -7.20458984375, -6.783203125, -6.36181640625, -5.9404296875, -5.51904296875, -5.09765625, -4.67626953125, -4.2548828125, -3.83349609375, -3.412109375, -2.99072265625, -2.5693359375, -2.14794921875, -1.7265625, -1.30517578125, -0.8837890625, -0.46240234375, -0.041015625, 0.38037109375, 0.8017578125, 1.22314453125, 1.64453125, 2.06591796875, 2.4873046875, 2.90869140625, 3.330078125, 3.75146484375, 4.1728515625, 4.59423828125, 5.015625, 5.43701171875, 5.8583984375, 6.27978515625, 6.701171875, 7.12255859375, 7.5439453125, 7.96533203125, 8.38671875, 8.80810546875, 9.2294921875, 9.65087890625, 10.072265625, 10.49365234375, 10.9150390625, 11.33642578125, 11.7578125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 9.0, 6.0, 3.0, 6.0, 6.0, 15.0, 23.0, 39.0, 42.0, 33.0, 59.0, 69.0, 97.0, 135.0, 255.0, 429.0, 1031.0, 11328.0, 4016192.0, 161382.0, 1687.0, 508.0, 277.0, 166.0, 108.0, 92.0, 68.0, 60.0, 42.0, 19.0, 20.0, 18.0, 12.0, 13.0, 9.0, 5.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-64.0625, -62.0419921875, -60.021484375, -58.0009765625, -55.98046875, -53.9599609375, -51.939453125, -49.9189453125, -47.8984375, -45.8779296875, -43.857421875, -41.8369140625, -39.81640625, -37.7958984375, -35.775390625, -33.7548828125, -31.734375, -29.7138671875, -27.693359375, -25.6728515625, -23.65234375, -21.6318359375, -19.611328125, -17.5908203125, -15.5703125, -13.5498046875, -11.529296875, -9.5087890625, -7.48828125, -5.4677734375, -3.447265625, -1.4267578125, 0.59375, 2.6142578125, 4.634765625, 6.6552734375, 8.67578125, 10.6962890625, 12.716796875, 14.7373046875, 16.7578125, 18.7783203125, 20.798828125, 22.8193359375, 24.83984375, 26.8603515625, 28.880859375, 30.9013671875, 32.921875, 34.9423828125, 36.962890625, 38.9833984375, 41.00390625, 43.0244140625, 45.044921875, 47.0654296875, 49.0859375, 51.1064453125, 53.126953125, 55.1474609375, 57.16796875, 59.1884765625, 61.208984375, 63.2294921875, 65.25]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 21.0, 52.0, 110.0, 195.0, 232.0, 183.0, 130.0, 58.0, 16.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.04988861083984, -81.83489990234375, -78.61991882324219, -75.4049301147461, -72.18994140625, -68.9749526977539, -65.75996398925781, -62.54498291015625, -59.329994201660156, -56.11500549316406, -52.900020599365234, -49.685035705566406, -46.47004699707031, -43.25505828857422, -40.04007339477539, -36.82508850097656, -33.61009979248047, -30.395112991333008, -27.180126190185547, -23.965139389038086, -20.750152587890625, -17.535165786743164, -14.320178985595703, -11.105192184448242, -7.890205383300781, -4.67521858215332, -1.4602317810058594, 1.7547550201416016, 4.9697418212890625, 8.184728622436523, 11.399715423583984, 14.614702224731445, 17.829689025878906, 21.044675827026367, 24.259662628173828, 27.47464942932129, 30.68963623046875, 33.904624938964844, 37.11960983276367, 40.3345947265625, 43.549583435058594, 46.76457214355469, 49.979557037353516, 53.194541931152344, 56.40953063964844, 59.62451934814453, 62.83950424194336, 66.05448913574219, 69.26947784423828, 72.48446655273438, 75.69944763183594, 78.91443634033203, 82.12942504882812, 85.34441375732422, 88.55940246582031, 91.77438354492188, 94.98937225341797, 98.20436096191406, 101.41934204101562, 104.63433074951172, 107.84931945800781, 111.0643081665039, 114.279296875, 117.49427795410156, 120.70926666259766]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 5.0, 9.0, 7.0, 7.0, 11.0, 7.0, 13.0, 15.0, 13.0, 16.0, 21.0, 24.0, 28.0, 24.0, 35.0, 25.0, 41.0, 30.0, 35.0, 29.0, 48.0, 46.0, 44.0, 33.0, 40.0, 35.0, 28.0, 31.0, 26.0, 31.0, 33.0, 25.0, 27.0, 26.0, 17.0, 15.0, 12.0, 7.0, 17.0, 11.0, 13.0, 9.0, 7.0, 8.0, 0.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.09910583496094, -36.88505172729492, -35.67100143432617, -34.456947326660156, -33.24289321899414, -32.028839111328125, -30.814788818359375, -29.60073471069336, -28.386682510375977, -27.172630310058594, -25.958576202392578, -24.744524002075195, -23.530471801757812, -22.316417694091797, -21.102365493774414, -19.88831329345703, -18.674259185791016, -17.460206985473633, -16.246152877807617, -15.032100677490234, -13.818047523498535, -12.603994369506836, -11.389942169189453, -10.175889015197754, -8.961835861206055, -7.7477827072143555, -6.5337300300598145, -5.319677352905273, -4.105624198913574, -2.891571044921875, -1.677518367767334, -0.46346569061279297, 0.7505874633789062, 1.9646403789520264, 3.1786932945251465, 4.3927459716796875, 5.606799125671387, 6.820852279663086, 8.034904479980469, 9.248957633972168, 10.463010787963867, 11.677063941955566, 12.891117095947266, 14.105169296264648, 15.319222450256348, 16.533275604248047, 17.74732780456543, 18.961380004882812, 20.175434112548828, 21.38948631286621, 22.603540420532227, 23.81759262084961, 25.031646728515625, 26.245698928833008, 27.45975112915039, 28.673805236816406, 29.88785743713379, 31.101909637451172, 32.31596374511719, 33.5300178527832, 34.74406814575195, 35.95812225341797, 37.172176361083984, 38.386226654052734, 39.60028076171875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 6.0, 8.0, 13.0, 15.0, 12.0, 14.0, 16.0, 23.0, 24.0, 13.0, 29.0, 25.0, 31.0, 24.0, 29.0, 34.0, 28.0, 35.0, 27.0, 37.0, 32.0, 41.0, 42.0, 32.0, 32.0, 34.0, 28.0, 35.0, 29.0, 24.0, 13.0, 24.0, 27.0, 25.0, 19.0, 16.0, 16.0, 13.0, 10.0, 10.0, 8.0, 4.0, 12.0, 5.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.428466796875, -5.24755859375, -5.066650390625, -4.8857421875, -4.704833984375, -4.52392578125, -4.343017578125, -4.162109375, -3.981201171875, -3.80029296875, -3.619384765625, -3.4384765625, -3.257568359375, -3.07666015625, -2.895751953125, -2.71484375, -2.533935546875, -2.35302734375, -2.172119140625, -1.9912109375, -1.810302734375, -1.62939453125, -1.448486328125, -1.267578125, -1.086669921875, -0.90576171875, -0.724853515625, -0.5439453125, -0.363037109375, -0.18212890625, -0.001220703125, 0.1796875, 0.360595703125, 0.54150390625, 0.722412109375, 0.9033203125, 1.084228515625, 1.26513671875, 1.446044921875, 1.626953125, 1.807861328125, 1.98876953125, 2.169677734375, 2.3505859375, 2.531494140625, 2.71240234375, 2.893310546875, 3.07421875, 3.255126953125, 3.43603515625, 3.616943359375, 3.7978515625, 3.978759765625, 4.15966796875, 4.340576171875, 4.521484375, 4.702392578125, 4.88330078125, 5.064208984375, 5.2451171875, 5.426025390625, 5.60693359375, 5.787841796875, 5.96875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 21.0, 34.0, 46.0, 62.0, 95.0, 118.0, 183.0, 232.0, 326.0, 506.0, 654.0, 976.0, 1407.0, 1926.0, 2679.0, 3799.0, 5353.0, 7656.0, 10813.0, 15287.0, 21149.0, 30476.0, 43707.0, 66430.0, 108145.0, 250456.0, 188300.0, 94181.0, 59173.0, 39575.0, 27721.0, 19707.0, 13657.0, 9822.0, 6957.0, 4965.0, 3533.0, 2467.0, 1718.0, 1235.0, 871.0, 625.0, 451.0, 357.0, 226.0, 168.0, 100.0, 64.0, 51.0, 34.0, 18.0, 17.0, 10.0, 10.0, 5.0, 3.0, 3.0], "bins": [-1.18359375, -1.1475830078125, -1.111572265625, -1.0755615234375, -1.03955078125, -1.0035400390625, -0.967529296875, -0.9315185546875, -0.8955078125, -0.8594970703125, -0.823486328125, -0.7874755859375, -0.75146484375, -0.7154541015625, -0.679443359375, -0.6434326171875, -0.607421875, -0.5714111328125, -0.535400390625, -0.4993896484375, -0.46337890625, -0.4273681640625, -0.391357421875, -0.3553466796875, -0.3193359375, -0.2833251953125, -0.247314453125, -0.2113037109375, -0.17529296875, -0.1392822265625, -0.103271484375, -0.0672607421875, -0.03125, 0.0047607421875, 0.040771484375, 0.0767822265625, 0.11279296875, 0.1488037109375, 0.184814453125, 0.2208251953125, 0.2568359375, 0.2928466796875, 0.328857421875, 0.3648681640625, 0.40087890625, 0.4368896484375, 0.472900390625, 0.5089111328125, 0.544921875, 0.5809326171875, 0.616943359375, 0.6529541015625, 0.68896484375, 0.7249755859375, 0.760986328125, 0.7969970703125, 0.8330078125, 0.8690185546875, 0.905029296875, 0.9410400390625, 0.97705078125, 1.0130615234375, 1.049072265625, 1.0850830078125, 1.12109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 11.0, 11.0, 10.0, 4.0, 12.0, 14.0, 14.0, 19.0, 25.0, 14.0, 30.0, 23.0, 30.0, 22.0, 34.0, 40.0, 33.0, 41.0, 40.0, 43.0, 1079.0, 30.0, 33.0, 31.0, 39.0, 37.0, 46.0, 31.0, 31.0, 26.0, 21.0, 33.0, 19.0, 15.0, 15.0, 10.0, 11.0, 10.0, 2.0, 10.0, 8.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-4.39453125, -4.265350341796875, -4.13616943359375, -4.006988525390625, -3.8778076171875, -3.748626708984375, -3.61944580078125, -3.490264892578125, -3.361083984375, -3.231903076171875, -3.10272216796875, -2.973541259765625, -2.8443603515625, -2.715179443359375, -2.58599853515625, -2.456817626953125, -2.32763671875, -2.198455810546875, -2.06927490234375, -1.940093994140625, -1.8109130859375, -1.681732177734375, -1.55255126953125, -1.423370361328125, -1.294189453125, -1.165008544921875, -1.03582763671875, -0.906646728515625, -0.7774658203125, -0.648284912109375, -0.51910400390625, -0.389923095703125, -0.2607421875, -0.131561279296875, -0.00238037109375, 0.126800537109375, 0.2559814453125, 0.385162353515625, 0.51434326171875, 0.643524169921875, 0.772705078125, 0.901885986328125, 1.03106689453125, 1.160247802734375, 1.2894287109375, 1.418609619140625, 1.54779052734375, 1.676971435546875, 1.80615234375, 1.935333251953125, 2.06451416015625, 2.193695068359375, 2.3228759765625, 2.452056884765625, 2.58123779296875, 2.710418701171875, 2.839599609375, 2.968780517578125, 3.09796142578125, 3.227142333984375, 3.3563232421875, 3.485504150390625, 3.61468505859375, 3.743865966796875, 3.873046875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 17.0, 29.0, 31.0, 64.0, 75.0, 127.0, 157.0, 265.0, 342.0, 521.0, 752.0, 1033.0, 1516.0, 2316.0, 3436.0, 5034.0, 7396.0, 11304.0, 17040.0, 25794.0, 39880.0, 64023.0, 107647.0, 1273076.0, 250525.0, 106595.0, 63075.0, 39316.0, 25386.0, 16600.0, 10966.0, 7433.0, 4941.0, 3325.0, 2274.0, 1540.0, 1051.0, 663.0, 507.0, 312.0, 211.0, 165.0, 102.0, 90.0, 43.0, 43.0, 27.0, 15.0, 17.0, 6.0, 9.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.3056640625, -1.2648468017578125, -1.224029541015625, -1.1832122802734375, -1.14239501953125, -1.1015777587890625, -1.060760498046875, -1.0199432373046875, -0.9791259765625, -0.9383087158203125, -0.897491455078125, -0.8566741943359375, -0.81585693359375, -0.7750396728515625, -0.734222412109375, -0.6934051513671875, -0.652587890625, -0.6117706298828125, -0.570953369140625, -0.5301361083984375, -0.48931884765625, -0.4485015869140625, -0.407684326171875, -0.3668670654296875, -0.3260498046875, -0.2852325439453125, -0.244415283203125, -0.2035980224609375, -0.16278076171875, -0.1219635009765625, -0.081146240234375, -0.0403289794921875, 0.00048828125, 0.0413055419921875, 0.082122802734375, 0.1229400634765625, 0.16375732421875, 0.2045745849609375, 0.245391845703125, 0.2862091064453125, 0.3270263671875, 0.3678436279296875, 0.408660888671875, 0.4494781494140625, 0.49029541015625, 0.5311126708984375, 0.571929931640625, 0.6127471923828125, 0.653564453125, 0.6943817138671875, 0.735198974609375, 0.7760162353515625, 0.81683349609375, 0.8576507568359375, 0.898468017578125, 0.9392852783203125, 0.9801025390625, 1.0209197998046875, 1.061737060546875, 1.1025543212890625, 1.14337158203125, 1.1841888427734375, 1.225006103515625, 1.2658233642578125, 1.306640625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 6.0, 5.0, 4.0, 5.0, 11.0, 16.0, 28.0, 30.0, 63.0, 69.0, 143.0, 143.0, 170.0, 105.0, 80.0, 43.0, 26.0, 12.0, 9.0, 3.0, 3.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001308441162109375, -0.0012683123350143433, -0.0012281835079193115, -0.0011880546808242798, -0.001147925853729248, -0.0011077970266342163, -0.0010676681995391846, -0.0010275393724441528, -0.000987410545349121, -0.0009472817182540894, -0.0009071528911590576, -0.0008670240640640259, -0.0008268952369689941, -0.0007867664098739624, -0.0007466375827789307, -0.0007065087556838989, -0.0006663799285888672, -0.0006262511014938354, -0.0005861222743988037, -0.000545993447303772, -0.0005058646202087402, -0.0004657357931137085, -0.00042560696601867676, -0.000385478138923645, -0.0003453493118286133, -0.00030522048473358154, -0.0002650916576385498, -0.00022496283054351807, -0.00018483400344848633, -0.0001447051763534546, -0.00010457634925842285, -6.444752216339111e-05, -2.4318695068359375e-05, 1.5810132026672363e-05, 5.59389591217041e-05, 9.606778621673584e-05, 0.00013619661331176758, 0.00017632544040679932, 0.00021645426750183105, 0.0002565830945968628, 0.00029671192169189453, 0.00033684074878692627, 0.000376969575881958, 0.00041709840297698975, 0.0004572272300720215, 0.0004973560571670532, 0.000537484884262085, 0.0005776137113571167, 0.0006177425384521484, 0.0006578713655471802, 0.0006980001926422119, 0.0007381290197372437, 0.0007782578468322754, 0.0008183866739273071, 0.0008585155010223389, 0.0008986443281173706, 0.0009387731552124023, 0.000978901982307434, 0.0010190308094024658, 0.0010591596364974976, 0.0010992884635925293, 0.001139417290687561, 0.0011795461177825928, 0.0012196749448776245, 0.0012598037719726562]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 9.0, 2.0, 3.0, 9.0, 6.0, 3.0, 18.0, 26.0, 52.0, 74.0, 163.0, 411.0, 7660.0, 1038494.0, 1082.0, 258.0, 109.0, 49.0, 33.0, 18.0, 21.0, 9.0, 8.0, 7.0, 9.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0288848876953125, -0.02796173095703125, -0.02703857421875, -0.02611541748046875, -0.0251922607421875, -0.02426910400390625, -0.023345947265625, -0.02242279052734375, -0.0214996337890625, -0.02057647705078125, -0.0196533203125, -0.01873016357421875, -0.0178070068359375, -0.01688385009765625, -0.015960693359375, -0.01503753662109375, -0.0141143798828125, -0.01319122314453125, -0.01226806640625, -0.01134490966796875, -0.0104217529296875, -0.00949859619140625, -0.008575439453125, -0.00765228271484375, -0.0067291259765625, -0.00580596923828125, -0.0048828125, -0.00395965576171875, -0.0030364990234375, -0.00211334228515625, -0.001190185546875, -0.00026702880859375, 0.0006561279296875, 0.00157928466796875, 0.00250244140625, 0.00342559814453125, 0.0043487548828125, 0.00527191162109375, 0.006195068359375, 0.00711822509765625, 0.0080413818359375, 0.00896453857421875, 0.0098876953125, 0.01081085205078125, 0.0117340087890625, 0.01265716552734375, 0.013580322265625, 0.01450347900390625, 0.0154266357421875, 0.01634979248046875, 0.01727294921875, 0.01819610595703125, 0.0191192626953125, 0.02004241943359375, 0.020965576171875, 0.02188873291015625, 0.0228118896484375, 0.02373504638671875, 0.024658203125, 0.02558135986328125, 0.0265045166015625, 0.02742767333984375, 0.028350830078125, 0.02927398681640625, 0.0301971435546875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 49.0, 329.0, 500.0, 122.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033341809175908566, -0.003273783717304468, -0.003213386284187436, -0.0031529890839010477, -0.0030925916507840157, -0.0030321944504976273, -0.002971797017380595, -0.002911399817094207, -0.0028510023839771748, -0.0027906051836907864, -0.0027302077505737543, -0.002669810550287366, -0.002609413117170334, -0.0025490159168839455, -0.0024886184837669134, -0.002428221283480525, -0.0023678240831941366, -0.0023074268829077482, -0.002247029449790716, -0.0021866322495043278, -0.0021262348163872957, -0.0020658376161009073, -0.0020054401829838753, -0.0019450429826974869, -0.0018846456659957767, -0.0018242483492940664, -0.0017638510325923562, -0.001703453715890646, -0.0016430565156042576, -0.0015826590824872255, -0.0015222618822008371, -0.001461864565499127, -0.0014014672487974167, -0.0013410699320957065, -0.0012806726153939962, -0.001220275298692286, -0.0011598779819905758, -0.0010994807817041874, -0.0010390834650024772, -0.000978686148300767, -0.0009182888898067176, -0.0008578915731050074, -0.0007974943146109581, -0.0007370969979092479, -0.0006766996812075377, -0.0006163023645058274, -0.0005559050478041172, -0.0004955077893100679, -0.00043511047260835767, -0.00037471315590664744, -0.0003143158683087677, -0.0002539185807108879, -0.00019352126400917768, -0.00013312394730746746, -7.272665970958769e-05, -1.2329372111707926e-05, 4.80679445900023e-05, 0.0001084652467397973, 0.0001688625488895923, 0.00022925985103938729, 0.0002896571531891823, 0.0003500544698908925, 0.0004104517574887723, 0.00047084904508665204, 0.0005312463617883623]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 8.0, 10.0, 11.0, 10.0, 11.0, 13.0, 16.0, 28.0, 18.0, 22.0, 32.0, 33.0, 34.0, 30.0, 36.0, 39.0, 40.0, 46.0, 46.0, 41.0, 48.0, 40.0, 43.0, 41.0, 33.0, 31.0, 27.0, 21.0, 30.0, 32.0, 25.0, 24.0, 18.0, 10.0, 7.0, 4.0, 9.0, 6.0, 5.0, 6.0, 6.0, 0.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0004298090934753418, -0.00041638221591711044, -0.0004029553383588791, -0.00038952846080064774, -0.0003761015832424164, -0.00036267470568418503, -0.0003492478281259537, -0.0003358209505677223, -0.00032239407300949097, -0.0003089671954512596, -0.00029554031789302826, -0.0002821134403347969, -0.00026868656277656555, -0.0002552596852183342, -0.00024183280766010284, -0.0002284059301018715, -0.00021497905254364014, -0.00020155217498540878, -0.00018812529742717743, -0.00017469841986894608, -0.00016127154231071472, -0.00014784466475248337, -0.00013441778719425201, -0.00012099090963602066, -0.0001075640320777893, -9.413715451955795e-05, -8.07102769613266e-05, -6.728339940309525e-05, -5.385652184486389e-05, -4.042964428663254e-05, -2.7002766728401184e-05, -1.357588917016983e-05, -1.4901161193847656e-07, 1.3277865946292877e-05, 2.670474350452423e-05, 4.0131621062755585e-05, 5.355849862098694e-05, 6.698537617921829e-05, 8.041225373744965e-05, 9.3839131295681e-05, 0.00010726600885391235, 0.00012069288641214371, 0.00013411976397037506, 0.00014754664152860641, 0.00016097351908683777, 0.00017440039664506912, 0.00018782727420330048, 0.00020125415176153183, 0.00021468102931976318, 0.00022810790687799454, 0.0002415347844362259, 0.00025496166199445724, 0.0002683885395526886, 0.00028181541711091995, 0.0002952422946691513, 0.00030866917222738266, 0.000322096049785614, 0.00033552292734384537, 0.0003489498049020767, 0.0003623766824603081, 0.00037580356001853943, 0.0003892304375767708, 0.00040265731513500214, 0.0004160841926932335, 0.00042951107025146484]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 6.0, 8.0, 13.0, 15.0, 12.0, 14.0, 16.0, 23.0, 24.0, 13.0, 29.0, 25.0, 31.0, 24.0, 29.0, 34.0, 28.0, 35.0, 27.0, 37.0, 32.0, 41.0, 42.0, 32.0, 32.0, 34.0, 28.0, 35.0, 29.0, 24.0, 13.0, 24.0, 27.0, 25.0, 19.0, 16.0, 16.0, 13.0, 10.0, 10.0, 8.0, 4.0, 12.0, 5.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.428466796875, -5.24755859375, -5.066650390625, -4.8857421875, -4.704833984375, -4.52392578125, -4.343017578125, -4.162109375, -3.981201171875, -3.80029296875, -3.619384765625, -3.4384765625, -3.257568359375, -3.07666015625, -2.895751953125, -2.71484375, -2.533935546875, -2.35302734375, -2.172119140625, -1.9912109375, -1.810302734375, -1.62939453125, -1.448486328125, -1.267578125, -1.086669921875, -0.90576171875, -0.724853515625, -0.5439453125, -0.363037109375, -0.18212890625, -0.001220703125, 0.1796875, 0.360595703125, 0.54150390625, 0.722412109375, 0.9033203125, 1.084228515625, 1.26513671875, 1.446044921875, 1.626953125, 1.807861328125, 1.98876953125, 2.169677734375, 2.3505859375, 2.531494140625, 2.71240234375, 2.893310546875, 3.07421875, 3.255126953125, 3.43603515625, 3.616943359375, 3.7978515625, 3.978759765625, 4.15966796875, 4.340576171875, 4.521484375, 4.702392578125, 4.88330078125, 5.064208984375, 5.2451171875, 5.426025390625, 5.60693359375, 5.787841796875, 5.96875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 5.0, 5.0, 8.0, 5.0, 7.0, 9.0, 11.0, 12.0, 23.0, 37.0, 37.0, 47.0, 57.0, 85.0, 122.0, 140.0, 186.0, 248.0, 355.0, 594.0, 913.0, 1562.0, 2867.0, 5864.0, 13384.0, 32941.0, 100533.0, 405995.0, 342043.0, 86386.0, 29755.0, 12022.0, 5392.0, 2625.0, 1436.0, 876.0, 593.0, 366.0, 253.0, 177.0, 134.0, 96.0, 82.0, 65.0, 47.0, 41.0, 28.0, 22.0, 9.0, 11.0, 12.0, 9.0, 6.0, 8.0, 2.0, 3.0, 8.0, 1.0, 2.0, 2.0], "bins": [-6.3984375, -6.1981201171875, -5.997802734375, -5.7974853515625, -5.59716796875, -5.3968505859375, -5.196533203125, -4.9962158203125, -4.7958984375, -4.5955810546875, -4.395263671875, -4.1949462890625, -3.99462890625, -3.7943115234375, -3.593994140625, -3.3936767578125, -3.193359375, -2.9930419921875, -2.792724609375, -2.5924072265625, -2.39208984375, -2.1917724609375, -1.991455078125, -1.7911376953125, -1.5908203125, -1.3905029296875, -1.190185546875, -0.9898681640625, -0.78955078125, -0.5892333984375, -0.388916015625, -0.1885986328125, 0.01171875, 0.2120361328125, 0.412353515625, 0.6126708984375, 0.81298828125, 1.0133056640625, 1.213623046875, 1.4139404296875, 1.6142578125, 1.8145751953125, 2.014892578125, 2.2152099609375, 2.41552734375, 2.6158447265625, 2.816162109375, 3.0164794921875, 3.216796875, 3.4171142578125, 3.617431640625, 3.8177490234375, 4.01806640625, 4.2183837890625, 4.418701171875, 4.6190185546875, 4.8193359375, 5.0196533203125, 5.219970703125, 5.4202880859375, 5.62060546875, 5.8209228515625, 6.021240234375, 6.2215576171875, 6.421875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 4.0, 8.0, 7.0, 8.0, 10.0, 16.0, 14.0, 13.0, 23.0, 22.0, 27.0, 26.0, 26.0, 43.0, 40.0, 47.0, 48.0, 70.0, 118.0, 356.0, 1469.0, 166.0, 75.0, 54.0, 37.0, 42.0, 27.0, 50.0, 30.0, 31.0, 22.0, 19.0, 18.0, 13.0, 8.0, 6.0, 10.0, 6.0, 10.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.5, -19.8193359375, -19.138671875, -18.4580078125, -17.77734375, -17.0966796875, -16.416015625, -15.7353515625, -15.0546875, -14.3740234375, -13.693359375, -13.0126953125, -12.33203125, -11.6513671875, -10.970703125, -10.2900390625, -9.609375, -8.9287109375, -8.248046875, -7.5673828125, -6.88671875, -6.2060546875, -5.525390625, -4.8447265625, -4.1640625, -3.4833984375, -2.802734375, -2.1220703125, -1.44140625, -0.7607421875, -0.080078125, 0.6005859375, 1.28125, 1.9619140625, 2.642578125, 3.3232421875, 4.00390625, 4.6845703125, 5.365234375, 6.0458984375, 6.7265625, 7.4072265625, 8.087890625, 8.7685546875, 9.44921875, 10.1298828125, 10.810546875, 11.4912109375, 12.171875, 12.8525390625, 13.533203125, 14.2138671875, 14.89453125, 15.5751953125, 16.255859375, 16.9365234375, 17.6171875, 18.2978515625, 18.978515625, 19.6591796875, 20.33984375, 21.0205078125, 21.701171875, 22.3818359375, 23.0625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 5.0, 5.0, 13.0, 7.0, 17.0, 14.0, 29.0, 35.0, 41.0, 73.0, 84.0, 98.0, 151.0, 249.0, 363.0, 777.0, 5763.0, 3012862.0, 121824.0, 1711.0, 530.0, 294.0, 207.0, 128.0, 91.0, 75.0, 65.0, 42.0, 24.0, 33.0, 14.0, 18.0, 12.0, 11.0, 9.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.5625, -56.66015625, -54.7578125, -52.85546875, -50.953125, -49.05078125, -47.1484375, -45.24609375, -43.34375, -41.44140625, -39.5390625, -37.63671875, -35.734375, -33.83203125, -31.9296875, -30.02734375, -28.125, -26.22265625, -24.3203125, -22.41796875, -20.515625, -18.61328125, -16.7109375, -14.80859375, -12.90625, -11.00390625, -9.1015625, -7.19921875, -5.296875, -3.39453125, -1.4921875, 0.41015625, 2.3125, 4.21484375, 6.1171875, 8.01953125, 9.921875, 11.82421875, 13.7265625, 15.62890625, 17.53125, 19.43359375, 21.3359375, 23.23828125, 25.140625, 27.04296875, 28.9453125, 30.84765625, 32.75, 34.65234375, 36.5546875, 38.45703125, 40.359375, 42.26171875, 44.1640625, 46.06640625, 47.96875, 49.87109375, 51.7734375, 53.67578125, 55.578125, 57.48046875, 59.3828125, 61.28515625, 63.1875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 11.0, 365.0, 620.0, 19.0, 4.0, 0.0, 1.0, 1.0], "bins": [-373.006103515625, -366.5893249511719, -360.17254638671875, -353.75579833984375, -347.3390197753906, -340.9222412109375, -334.5054626464844, -328.08868408203125, -321.67193603515625, -315.2551574707031, -308.83837890625, -302.421630859375, -296.0048522949219, -289.58807373046875, -283.1712951660156, -276.7545166015625, -270.3377685546875, -263.9209899902344, -257.50421142578125, -251.0874481201172, -244.67068481445312, -238.25390625, -231.83712768554688, -225.4203643798828, -219.00357055664062, -212.5867919921875, -206.17002868652344, -199.7532501220703, -193.33648681640625, -186.91970825195312, -180.5029296875, -174.08616638183594, -167.66941833496094, -161.2526397705078, -154.83587646484375, -148.41909790039062, -142.00233459472656, -135.58555603027344, -129.16879272460938, -122.75201416015625, -116.33523559570312, -109.91846466064453, -103.50169372558594, -97.08491516113281, -90.66815185546875, -84.25137329101562, -77.83460235595703, -71.41783142089844, -65.00106811523438, -58.58429718017578, -52.16752624511719, -45.75075149536133, -39.333980560302734, -32.91720962524414, -26.50043487548828, -20.083663940429688, -13.666889190673828, -7.250117301940918, -0.8333454132080078, 5.583427429199219, 12.000198364257812, 18.416969299316406, 24.833744049072266, 31.25051498413086, 37.66728591918945]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 9.0, 10.0, 10.0, 9.0, 13.0, 25.0, 25.0, 34.0, 37.0, 36.0, 42.0, 45.0, 41.0, 46.0, 36.0, 52.0, 50.0, 45.0, 39.0, 54.0, 36.0, 33.0, 38.0, 34.0, 23.0, 32.0, 27.0, 26.0, 10.0, 17.0, 7.0, 14.0, 5.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.75575256347656, -65.56576538085938, -63.375770568847656, -61.1857795715332, -58.99578857421875, -56.8057975769043, -54.615806579589844, -52.42581558227539, -50.23582458496094, -48.045833587646484, -45.85584259033203, -43.66585159301758, -41.475860595703125, -39.28586959838867, -37.09587860107422, -34.905887603759766, -32.71589660644531, -30.52590560913086, -28.335914611816406, -26.145923614501953, -23.9559326171875, -21.765941619873047, -19.575950622558594, -17.38595962524414, -15.195968627929688, -13.005977630615234, -10.815986633300781, -8.625995635986328, -6.436004638671875, -4.246013641357422, -2.0560226440429688, 0.13396835327148438, 2.3239593505859375, 4.513950347900391, 6.703941345214844, 8.893932342529297, 11.08392333984375, 13.273914337158203, 15.463905334472656, 17.65389633178711, 19.843887329101562, 22.033878326416016, 24.22386932373047, 26.413860321044922, 28.603851318359375, 30.793842315673828, 32.98383331298828, 35.173824310302734, 37.36381530761719, 39.55380630493164, 41.743797302246094, 43.93378829956055, 46.123779296875, 48.31377029418945, 50.503761291503906, 52.69375228881836, 54.88374328613281, 57.073734283447266, 59.26372528076172, 61.45371627807617, 63.643707275390625, 65.83369445800781, 68.02368927001953, 70.21368408203125, 72.40367126464844]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 7.0, 6.0, 8.0, 10.0, 11.0, 14.0, 9.0, 17.0, 20.0, 22.0, 29.0, 24.0, 26.0, 25.0, 35.0, 26.0, 34.0, 26.0, 29.0, 43.0, 37.0, 35.0, 36.0, 38.0, 28.0, 36.0, 32.0, 29.0, 30.0, 34.0, 24.0, 32.0, 17.0, 22.0, 18.0, 25.0, 17.0, 18.0, 18.0, 7.0, 12.0, 8.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.55078125, -6.3516845703125, -6.152587890625, -5.9534912109375, -5.75439453125, -5.5552978515625, -5.356201171875, -5.1571044921875, -4.9580078125, -4.7589111328125, -4.559814453125, -4.3607177734375, -4.16162109375, -3.9625244140625, -3.763427734375, -3.5643310546875, -3.365234375, -3.1661376953125, -2.967041015625, -2.7679443359375, -2.56884765625, -2.3697509765625, -2.170654296875, -1.9715576171875, -1.7724609375, -1.5733642578125, -1.374267578125, -1.1751708984375, -0.97607421875, -0.7769775390625, -0.577880859375, -0.3787841796875, -0.1796875, 0.0194091796875, 0.218505859375, 0.4176025390625, 0.61669921875, 0.8157958984375, 1.014892578125, 1.2139892578125, 1.4130859375, 1.6121826171875, 1.811279296875, 2.0103759765625, 2.20947265625, 2.4085693359375, 2.607666015625, 2.8067626953125, 3.005859375, 3.2049560546875, 3.404052734375, 3.6031494140625, 3.80224609375, 4.0013427734375, 4.200439453125, 4.3995361328125, 4.5986328125, 4.7977294921875, 4.996826171875, 5.1959228515625, 5.39501953125, 5.5941162109375, 5.793212890625, 5.9923095703125, 6.19140625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 6.0, 4.0, 6.0, 8.0, 8.0, 11.0, 11.0, 17.0, 16.0, 13.0, 26.0, 30.0, 25.0, 18.0, 35.0, 39.0, 71.0, 135.0, 357.0, 1088.0, 7316.0, 248672.0, 3415392.0, 507754.0, 10847.0, 1482.0, 412.0, 142.0, 37.0, 35.0, 26.0, 25.0, 35.0, 21.0, 23.0, 22.0, 21.0, 15.0, 22.0, 12.0, 11.0, 9.0, 3.0, 2.0, 6.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.078125, -23.339111328125, -22.60009765625, -21.861083984375, -21.1220703125, -20.383056640625, -19.64404296875, -18.905029296875, -18.166015625, -17.427001953125, -16.68798828125, -15.948974609375, -15.2099609375, -14.470947265625, -13.73193359375, -12.992919921875, -12.25390625, -11.514892578125, -10.77587890625, -10.036865234375, -9.2978515625, -8.558837890625, -7.81982421875, -7.080810546875, -6.341796875, -5.602783203125, -4.86376953125, -4.124755859375, -3.3857421875, -2.646728515625, -1.90771484375, -1.168701171875, -0.4296875, 0.309326171875, 1.04833984375, 1.787353515625, 2.5263671875, 3.265380859375, 4.00439453125, 4.743408203125, 5.482421875, 6.221435546875, 6.96044921875, 7.699462890625, 8.4384765625, 9.177490234375, 9.91650390625, 10.655517578125, 11.39453125, 12.133544921875, 12.87255859375, 13.611572265625, 14.3505859375, 15.089599609375, 15.82861328125, 16.567626953125, 17.306640625, 18.045654296875, 18.78466796875, 19.523681640625, 20.2626953125, 21.001708984375, 21.74072265625, 22.479736328125, 23.21875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 12.0, 11.0, 17.0, 21.0, 26.0, 32.0, 52.0, 58.0, 105.0, 152.0, 158.0, 207.0, 318.0, 401.0, 437.0, 462.0, 409.0, 346.0, 231.0, 166.0, 137.0, 95.0, 59.0, 48.0, 25.0, 25.0, 18.0, 11.0, 11.0, 13.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.0645751953125, -14.621337890625, -14.1781005859375, -13.73486328125, -13.2916259765625, -12.848388671875, -12.4051513671875, -11.9619140625, -11.5186767578125, -11.075439453125, -10.6322021484375, -10.18896484375, -9.7457275390625, -9.302490234375, -8.8592529296875, -8.416015625, -7.9727783203125, -7.529541015625, -7.0863037109375, -6.64306640625, -6.1998291015625, -5.756591796875, -5.3133544921875, -4.8701171875, -4.4268798828125, -3.983642578125, -3.5404052734375, -3.09716796875, -2.6539306640625, -2.210693359375, -1.7674560546875, -1.32421875, -0.8809814453125, -0.437744140625, 0.0054931640625, 0.44873046875, 0.8919677734375, 1.335205078125, 1.7784423828125, 2.2216796875, 2.6649169921875, 3.108154296875, 3.5513916015625, 3.99462890625, 4.4378662109375, 4.881103515625, 5.3243408203125, 5.767578125, 6.2108154296875, 6.654052734375, 7.0972900390625, 7.54052734375, 7.9837646484375, 8.427001953125, 8.8702392578125, 9.3134765625, 9.7567138671875, 10.199951171875, 10.6431884765625, 11.08642578125, 11.5296630859375, 11.972900390625, 12.4161376953125, 12.859375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 7.0, 10.0, 18.0, 21.0, 35.0, 29.0, 45.0, 45.0, 85.0, 116.0, 135.0, 199.0, 277.0, 424.0, 899.0, 13137.0, 4079649.0, 96263.0, 1226.0, 480.0, 296.0, 205.0, 180.0, 118.0, 103.0, 58.0, 45.0, 40.0, 36.0, 28.0, 19.0, 12.0, 7.0, 2.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.25, -49.1708984375, -47.091796875, -45.0126953125, -42.93359375, -40.8544921875, -38.775390625, -36.6962890625, -34.6171875, -32.5380859375, -30.458984375, -28.3798828125, -26.30078125, -24.2216796875, -22.142578125, -20.0634765625, -17.984375, -15.9052734375, -13.826171875, -11.7470703125, -9.66796875, -7.5888671875, -5.509765625, -3.4306640625, -1.3515625, 0.7275390625, 2.806640625, 4.8857421875, 6.96484375, 9.0439453125, 11.123046875, 13.2021484375, 15.28125, 17.3603515625, 19.439453125, 21.5185546875, 23.59765625, 25.6767578125, 27.755859375, 29.8349609375, 31.9140625, 33.9931640625, 36.072265625, 38.1513671875, 40.23046875, 42.3095703125, 44.388671875, 46.4677734375, 48.546875, 50.6259765625, 52.705078125, 54.7841796875, 56.86328125, 58.9423828125, 61.021484375, 63.1005859375, 65.1796875, 67.2587890625, 69.337890625, 71.4169921875, 73.49609375, 75.5751953125, 77.654296875, 79.7333984375, 81.8125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 12.0, 53.0, 189.0, 290.0, 317.0, 113.0, 35.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.15267944335938, -185.36924743652344, -180.58583068847656, -175.80239868164062, -171.01898193359375, -166.2355499267578, -161.45213317871094, -156.668701171875, -151.88528442382812, -147.1018524169922, -142.3184356689453, -137.53500366210938, -132.7515869140625, -127.96815490722656, -123.18473052978516, -118.40130615234375, -113.61787414550781, -108.8344497680664, -104.051025390625, -99.2676010131836, -94.48417663574219, -89.70074462890625, -84.91732025146484, -80.13389587402344, -75.35047149658203, -70.56704711914062, -65.78362274169922, -61.00019454956055, -56.21677017211914, -51.433345794677734, -46.64991760253906, -41.866493225097656, -37.08308410644531, -32.299659729003906, -27.516233444213867, -22.732807159423828, -17.949382781982422, -13.165958404541016, -8.382532119750977, -3.5991058349609375, 1.1843185424804688, 5.967743873596191, 10.751169204711914, 15.534594535827637, 20.31801986694336, 25.101444244384766, 29.884870529174805, 34.668296813964844, 39.45172119140625, 44.235145568847656, 49.01856994628906, 53.801998138427734, 58.58542251586914, 63.36884689331055, 68.15227508544922, 72.93569946289062, 77.71912384033203, 82.50254821777344, 87.28597259521484, 92.06939697265625, 96.85282897949219, 101.63624572753906, 106.419677734375, 111.2031021118164, 115.98652648925781]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 10.0, 8.0, 5.0, 13.0, 11.0, 9.0, 13.0, 15.0, 16.0, 24.0, 23.0, 35.0, 45.0, 36.0, 25.0, 39.0, 38.0, 39.0, 40.0, 33.0, 46.0, 40.0, 33.0, 53.0, 45.0, 27.0, 34.0, 27.0, 19.0, 29.0, 21.0, 27.0, 15.0, 16.0, 13.0, 14.0, 10.0, 11.0, 5.0, 11.0, 7.0, 5.0, 2.0, 1.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0], "bins": [-45.53866195678711, -44.20953369140625, -42.880401611328125, -41.551273345947266, -40.22214126586914, -38.89301300048828, -37.563880920410156, -36.2347526550293, -34.90562438964844, -33.57649612426758, -32.24736404418945, -30.91823387145996, -29.58910369873047, -28.25997543334961, -26.930845260620117, -25.601715087890625, -24.2725830078125, -22.943452835083008, -21.614322662353516, -20.285192489624023, -18.95606231689453, -17.626934051513672, -16.29780387878418, -14.968673706054688, -13.639543533325195, -12.310413360595703, -10.981283187866211, -9.652153968811035, -8.323023796081543, -6.993893623352051, -5.664763927459717, -4.335634231567383, -3.0065078735351562, -1.6773779392242432, -0.3482480049133301, 0.980881929397583, 2.310011863708496, 3.6391420364379883, 4.968271732330322, 6.297401428222656, 7.626531600952148, 8.95566177368164, 10.284791946411133, 11.613921165466309, 12.9430513381958, 14.272181510925293, 15.601310729980469, 16.93044090270996, 18.259571075439453, 19.588701248168945, 20.917831420898438, 22.24696159362793, 23.576091766357422, 24.90522003173828, 26.234350204467773, 27.563480377197266, 28.892610549926758, 30.22174072265625, 31.550870895385742, 32.880001068115234, 34.209129333496094, 35.53826141357422, 36.86738967895508, 38.19651794433594, 39.52565002441406]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 9.0, 7.0, 6.0, 9.0, 11.0, 5.0, 20.0, 20.0, 13.0, 25.0, 28.0, 30.0, 26.0, 36.0, 27.0, 40.0, 27.0, 23.0, 40.0, 33.0, 33.0, 32.0, 41.0, 30.0, 34.0, 33.0, 33.0, 42.0, 28.0, 35.0, 29.0, 20.0, 24.0, 20.0, 22.0, 10.0, 17.0, 10.0, 15.0, 11.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.72265625, -5.52728271484375, -5.3319091796875, -5.13653564453125, -4.941162109375, -4.74578857421875, -4.5504150390625, -4.35504150390625, -4.15966796875, -3.96429443359375, -3.7689208984375, -3.57354736328125, -3.378173828125, -3.18280029296875, -2.9874267578125, -2.79205322265625, -2.5966796875, -2.40130615234375, -2.2059326171875, -2.01055908203125, -1.815185546875, -1.61981201171875, -1.4244384765625, -1.22906494140625, -1.03369140625, -0.83831787109375, -0.6429443359375, -0.44757080078125, -0.252197265625, -0.05682373046875, 0.1385498046875, 0.33392333984375, 0.529296875, 0.72467041015625, 0.9200439453125, 1.11541748046875, 1.310791015625, 1.50616455078125, 1.7015380859375, 1.89691162109375, 2.09228515625, 2.28765869140625, 2.4830322265625, 2.67840576171875, 2.873779296875, 3.06915283203125, 3.2645263671875, 3.45989990234375, 3.6552734375, 3.85064697265625, 4.0460205078125, 4.24139404296875, 4.436767578125, 4.63214111328125, 4.8275146484375, 5.02288818359375, 5.21826171875, 5.41363525390625, 5.6090087890625, 5.80438232421875, 5.999755859375, 6.19512939453125, 6.3905029296875, 6.58587646484375, 6.78125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 0.0, 8.0, 9.0, 15.0, 30.0, 39.0, 51.0, 115.0, 138.0, 238.0, 336.0, 501.0, 761.0, 1202.0, 1839.0, 2662.0, 4205.0, 6419.0, 10066.0, 16113.0, 25992.0, 43345.0, 76482.0, 145019.0, 319919.0, 175077.0, 88532.0, 50073.0, 29221.0, 18231.0, 11351.0, 7072.0, 4673.0, 3067.0, 1939.0, 1286.0, 897.0, 552.0, 381.0, 260.0, 149.0, 104.0, 69.0, 37.0, 26.0, 16.0, 8.0, 15.0, 7.0, 8.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.7978515625, -1.7459259033203125, -1.694000244140625, -1.6420745849609375, -1.59014892578125, -1.5382232666015625, -1.486297607421875, -1.4343719482421875, -1.3824462890625, -1.3305206298828125, -1.278594970703125, -1.2266693115234375, -1.17474365234375, -1.1228179931640625, -1.070892333984375, -1.0189666748046875, -0.967041015625, -0.9151153564453125, -0.863189697265625, -0.8112640380859375, -0.75933837890625, -0.7074127197265625, -0.655487060546875, -0.6035614013671875, -0.5516357421875, -0.4997100830078125, -0.447784423828125, -0.3958587646484375, -0.34393310546875, -0.2920074462890625, -0.240081787109375, -0.1881561279296875, -0.13623046875, -0.0843048095703125, -0.032379150390625, 0.0195465087890625, 0.07147216796875, 0.1233978271484375, 0.175323486328125, 0.2272491455078125, 0.2791748046875, 0.3311004638671875, 0.383026123046875, 0.4349517822265625, 0.48687744140625, 0.5388031005859375, 0.590728759765625, 0.6426544189453125, 0.694580078125, 0.7465057373046875, 0.798431396484375, 0.8503570556640625, 0.90228271484375, 0.9542083740234375, 1.006134033203125, 1.0580596923828125, 1.1099853515625, 1.1619110107421875, 1.213836669921875, 1.2657623291015625, 1.31768798828125, 1.3696136474609375, 1.421539306640625, 1.4734649658203125, 1.525390625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 7.0, 12.0, 6.0, 14.0, 16.0, 18.0, 18.0, 26.0, 28.0, 31.0, 28.0, 28.0, 17.0, 38.0, 25.0, 36.0, 46.0, 38.0, 45.0, 1065.0, 30.0, 48.0, 36.0, 43.0, 25.0, 33.0, 28.0, 23.0, 32.0, 17.0, 15.0, 23.0, 22.0, 14.0, 20.0, 16.0, 17.0, 6.0, 6.0, 3.0, 7.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.921875, -3.78741455078125, -3.6529541015625, -3.51849365234375, -3.384033203125, -3.24957275390625, -3.1151123046875, -2.98065185546875, -2.84619140625, -2.71173095703125, -2.5772705078125, -2.44281005859375, -2.308349609375, -2.17388916015625, -2.0394287109375, -1.90496826171875, -1.7705078125, -1.63604736328125, -1.5015869140625, -1.36712646484375, -1.232666015625, -1.09820556640625, -0.9637451171875, -0.82928466796875, -0.69482421875, -0.56036376953125, -0.4259033203125, -0.29144287109375, -0.156982421875, -0.02252197265625, 0.1119384765625, 0.24639892578125, 0.380859375, 0.51531982421875, 0.6497802734375, 0.78424072265625, 0.918701171875, 1.05316162109375, 1.1876220703125, 1.32208251953125, 1.45654296875, 1.59100341796875, 1.7254638671875, 1.85992431640625, 1.994384765625, 2.12884521484375, 2.2633056640625, 2.39776611328125, 2.5322265625, 2.66668701171875, 2.8011474609375, 2.93560791015625, 3.070068359375, 3.20452880859375, 3.3389892578125, 3.47344970703125, 3.60791015625, 3.74237060546875, 3.8768310546875, 4.01129150390625, 4.145751953125, 4.28021240234375, 4.4146728515625, 4.54913330078125, 4.68359375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 9.0, 17.0, 19.0, 34.0, 60.0, 74.0, 124.0, 185.0, 241.0, 420.0, 618.0, 966.0, 1404.0, 2173.0, 3391.0, 5216.0, 7969.0, 12017.0, 18364.0, 27362.0, 42075.0, 65501.0, 114391.0, 1320550.0, 206747.0, 98306.0, 58500.0, 37506.0, 25028.0, 16637.0, 10964.0, 7164.0, 4553.0, 3018.0, 1924.0, 1264.0, 803.0, 517.0, 357.0, 229.0, 152.0, 108.0, 59.0, 44.0, 20.0, 23.0, 8.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.392578125, -1.3488922119140625, -1.305206298828125, -1.2615203857421875, -1.21783447265625, -1.1741485595703125, -1.130462646484375, -1.0867767333984375, -1.0430908203125, -0.9994049072265625, -0.955718994140625, -0.9120330810546875, -0.86834716796875, -0.8246612548828125, -0.780975341796875, -0.7372894287109375, -0.693603515625, -0.6499176025390625, -0.606231689453125, -0.5625457763671875, -0.51885986328125, -0.4751739501953125, -0.431488037109375, -0.3878021240234375, -0.3441162109375, -0.3004302978515625, -0.256744384765625, -0.2130584716796875, -0.16937255859375, -0.1256866455078125, -0.082000732421875, -0.0383148193359375, 0.00537109375, 0.0490570068359375, 0.092742919921875, 0.1364288330078125, 0.18011474609375, 0.2238006591796875, 0.267486572265625, 0.3111724853515625, 0.3548583984375, 0.3985443115234375, 0.442230224609375, 0.4859161376953125, 0.52960205078125, 0.5732879638671875, 0.616973876953125, 0.6606597900390625, 0.704345703125, 0.7480316162109375, 0.791717529296875, 0.8354034423828125, 0.87908935546875, 0.9227752685546875, 0.966461181640625, 1.0101470947265625, 1.0538330078125, 1.0975189208984375, 1.141204833984375, 1.1848907470703125, 1.22857666015625, 1.2722625732421875, 1.315948486328125, 1.3596343994140625, 1.4033203125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 4.0, 8.0, 12.0, 10.0, 18.0, 21.0, 31.0, 42.0, 56.0, 79.0, 92.0, 120.0, 102.0, 99.0, 76.0, 62.0, 35.0, 28.0, 23.0, 20.0, 10.0, 6.0, 12.0, 5.0, 3.0, 11.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011968612670898438, -0.0011571794748306274, -0.0011174976825714111, -0.0010778158903121948, -0.0010381340980529785, -0.0009984523057937622, -0.0009587705135345459, -0.0009190887212753296, -0.0008794069290161133, -0.000839725136756897, -0.0008000433444976807, -0.0007603615522384644, -0.000720679759979248, -0.0006809979677200317, -0.0006413161754608154, -0.0006016343832015991, -0.0005619525909423828, -0.0005222707986831665, -0.0004825890064239502, -0.0004429072141647339, -0.0004032254219055176, -0.00036354362964630127, -0.00032386183738708496, -0.00028418004512786865, -0.00024449825286865234, -0.00020481646060943604, -0.00016513466835021973, -0.00012545287609100342, -8.577108383178711e-05, -4.60892915725708e-05, -6.407499313354492e-06, 3.3274292945861816e-05, 7.295608520507812e-05, 0.00011263787746429443, 0.00015231966972351074, 0.00019200146198272705, 0.00023168325424194336, 0.00027136504650115967, 0.000311046838760376, 0.0003507286310195923, 0.0003904104232788086, 0.0004300922155380249, 0.0004697740077972412, 0.0005094558000564575, 0.0005491375923156738, 0.0005888193845748901, 0.0006285011768341064, 0.0006681829690933228, 0.0007078647613525391, 0.0007475465536117554, 0.0007872283458709717, 0.000826910138130188, 0.0008665919303894043, 0.0009062737226486206, 0.0009459555149078369, 0.0009856373071670532, 0.0010253190994262695, 0.0010650008916854858, 0.0011046826839447021, 0.0011443644762039185, 0.0011840462684631348, 0.001223728060722351, 0.0012634098529815674, 0.0013030916452407837, 0.0013427734375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 11.0, 16.0, 14.0, 32.0, 45.0, 92.0, 165.0, 551.0, 940377.0, 106375.0, 456.0, 146.0, 102.0, 45.0, 26.0, 26.0, 15.0, 10.0, 7.0, 5.0, 5.0, 1.0, 7.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038848876953125, -0.0377039909362793, -0.036559104919433594, -0.03541421890258789, -0.03426933288574219, -0.033124446868896484, -0.03197956085205078, -0.030834674835205078, -0.029689788818359375, -0.028544902801513672, -0.02740001678466797, -0.026255130767822266, -0.025110244750976562, -0.02396535873413086, -0.022820472717285156, -0.021675586700439453, -0.02053070068359375, -0.019385814666748047, -0.018240928649902344, -0.01709604263305664, -0.015951156616210938, -0.014806270599365234, -0.013661384582519531, -0.012516498565673828, -0.011371612548828125, -0.010226726531982422, -0.009081840515136719, -0.007936954498291016, -0.0067920684814453125, -0.005647182464599609, -0.004502296447753906, -0.003357410430908203, -0.0022125244140625, -0.0010676383972167969, 7.724761962890625e-05, 0.0012221336364746094, 0.0023670196533203125, 0.0035119056701660156, 0.004656791687011719, 0.005801677703857422, 0.006946563720703125, 0.008091449737548828, 0.009236335754394531, 0.010381221771240234, 0.011526107788085938, 0.01267099380493164, 0.013815879821777344, 0.014960765838623047, 0.01610565185546875, 0.017250537872314453, 0.018395423889160156, 0.01954030990600586, 0.020685195922851562, 0.021830081939697266, 0.02297496795654297, 0.024119853973388672, 0.025264739990234375, 0.026409626007080078, 0.02755451202392578, 0.028699398040771484, 0.029844284057617188, 0.03098917007446289, 0.032134056091308594, 0.0332789421081543, 0.034423828125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 161.0, 751.0, 95.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0047737243585288525, -0.004675162490457296, -0.00457660062238574, -0.004478038754314184, -0.004379476886242628, -0.004280915018171072, -0.004182353615760803, -0.004083791747689247, -0.003985229879617691, -0.003886668011546135, -0.003788106143474579, -0.0036895442754030228, -0.0035909826401621103, -0.0034924207720905542, -0.003393858904018998, -0.003295297035947442, -0.0031967349350452423, -0.0030981730669736862, -0.00299961119890213, -0.002901049330830574, -0.0028024876955896616, -0.0027039258275181055, -0.0026053639594465494, -0.0025068020913749933, -0.002408240456134081, -0.002309678588062525, -0.0022111167199909687, -0.0021125548519194126, -0.0020139932166785, -0.001915431348606944, -0.001816869480535388, -0.001718307612463832, -0.0016197458608075976, -0.0015211839927360415, -0.0014226222410798073, -0.0013240603730082512, -0.001225498504936695, -0.001126936636865139, -0.0010283748852089047, -0.0009298130171373487, -0.0008312512072734535, -0.0007326893974095583, -0.0006341275293380022, -0.000535565719474107, -0.0004370038805063814, -0.00033844204153865576, -0.00023988023167476058, -0.0001413183636032045, -4.275655373930931e-05, 5.580527795245871e-05, 0.00015436710964422673, 0.00025292893406003714, 0.00035149077302776277, 0.0004500526119954884, 0.0005486144218593836, 0.0006471762899309397, 0.0007457380997948349, 0.00084429990965873, 0.0009428617777302861, 0.0010414235293865204, 0.0011399853974580765, 0.0012385472655296326, 0.0013371091336011887, 0.0014356710016727448, 0.001534232753328979]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 8.0, 8.0, 15.0, 19.0, 17.0, 38.0, 25.0, 23.0, 27.0, 40.0, 35.0, 30.0, 49.0, 55.0, 48.0, 50.0, 53.0, 39.0, 38.0, 30.0, 36.0, 38.0, 35.0, 35.0, 37.0, 20.0, 26.0, 18.0, 18.0, 16.0, 11.0, 11.0, 5.0, 4.0, 5.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004996061325073242, -0.0004834374412894249, -0.0004672687500715256, -0.00045110005885362625, -0.00043493136763572693, -0.0004187626764178276, -0.0004025939851999283, -0.00038642529398202896, -0.00037025660276412964, -0.0003540879115462303, -0.000337919220328331, -0.00032175052911043167, -0.00030558183789253235, -0.000289413146674633, -0.0002732444554567337, -0.0002570757642388344, -0.00024090707302093506, -0.00022473838180303574, -0.00020856969058513641, -0.0001924009993672371, -0.00017623230814933777, -0.00016006361693143845, -0.00014389492571353912, -0.0001277262344956398, -0.00011155754327774048, -9.538885205984116e-05, -7.922016084194183e-05, -6.305146962404251e-05, -4.688277840614319e-05, -3.0714087188243866e-05, -1.4545395970344543e-05, 1.623295247554779e-06, 1.77919864654541e-05, 3.3960677683353424e-05, 5.0129368901252747e-05, 6.629806011915207e-05, 8.246675133705139e-05, 9.863544255495071e-05, 0.00011480413377285004, 0.00013097282499074936, 0.00014714151620864868, 0.000163310207426548, 0.00017947889864444733, 0.00019564758986234665, 0.00021181628108024597, 0.0002279849722981453, 0.0002441536635160446, 0.00026032235473394394, 0.00027649104595184326, 0.0002926597371697426, 0.0003088284283876419, 0.00032499711960554123, 0.00034116581082344055, 0.0003573345020413399, 0.0003735031932592392, 0.0003896718844771385, 0.00040584057569503784, 0.00042200926691293716, 0.0004381779581308365, 0.0004543466493487358, 0.00047051534056663513, 0.00048668403178453445, 0.0005028527230024338, 0.0005190214142203331, 0.0005351901054382324]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 9.0, 7.0, 6.0, 9.0, 11.0, 5.0, 20.0, 20.0, 13.0, 25.0, 28.0, 30.0, 26.0, 36.0, 27.0, 40.0, 27.0, 23.0, 40.0, 33.0, 33.0, 32.0, 41.0, 30.0, 34.0, 33.0, 33.0, 42.0, 28.0, 35.0, 29.0, 20.0, 24.0, 20.0, 22.0, 10.0, 17.0, 10.0, 15.0, 11.0, 9.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.72265625, -5.52728271484375, -5.3319091796875, -5.13653564453125, -4.941162109375, -4.74578857421875, -4.5504150390625, -4.35504150390625, -4.15966796875, -3.96429443359375, -3.7689208984375, -3.57354736328125, -3.378173828125, -3.18280029296875, -2.9874267578125, -2.79205322265625, -2.5966796875, -2.40130615234375, -2.2059326171875, -2.01055908203125, -1.815185546875, -1.61981201171875, -1.4244384765625, -1.22906494140625, -1.03369140625, -0.83831787109375, -0.6429443359375, -0.44757080078125, -0.252197265625, -0.05682373046875, 0.1385498046875, 0.33392333984375, 0.529296875, 0.72467041015625, 0.9200439453125, 1.11541748046875, 1.310791015625, 1.50616455078125, 1.7015380859375, 1.89691162109375, 2.09228515625, 2.28765869140625, 2.4830322265625, 2.67840576171875, 2.873779296875, 3.06915283203125, 3.2645263671875, 3.45989990234375, 3.6552734375, 3.85064697265625, 4.0460205078125, 4.24139404296875, 4.436767578125, 4.63214111328125, 4.8275146484375, 5.02288818359375, 5.21826171875, 5.41363525390625, 5.6090087890625, 5.80438232421875, 5.999755859375, 6.19512939453125, 6.3905029296875, 6.58587646484375, 6.78125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 9.0, 8.0, 18.0, 27.0, 28.0, 42.0, 30.0, 52.0, 64.0, 97.0, 141.0, 168.0, 234.0, 329.0, 508.0, 785.0, 1144.0, 1850.0, 2970.0, 4709.0, 8205.0, 15665.0, 31506.0, 72368.0, 184139.0, 372830.0, 200035.0, 77955.0, 34011.0, 16312.0, 8617.0, 4997.0, 2917.0, 1883.0, 1228.0, 807.0, 542.0, 359.0, 257.0, 175.0, 136.0, 92.0, 70.0, 59.0, 39.0, 37.0, 25.0, 24.0, 13.0, 8.0, 15.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.03515625, -3.9072265625, -3.779296875, -3.6513671875, -3.5234375, -3.3955078125, -3.267578125, -3.1396484375, -3.01171875, -2.8837890625, -2.755859375, -2.6279296875, -2.5, -2.3720703125, -2.244140625, -2.1162109375, -1.98828125, -1.8603515625, -1.732421875, -1.6044921875, -1.4765625, -1.3486328125, -1.220703125, -1.0927734375, -0.96484375, -0.8369140625, -0.708984375, -0.5810546875, -0.453125, -0.3251953125, -0.197265625, -0.0693359375, 0.05859375, 0.1865234375, 0.314453125, 0.4423828125, 0.5703125, 0.6982421875, 0.826171875, 0.9541015625, 1.08203125, 1.2099609375, 1.337890625, 1.4658203125, 1.59375, 1.7216796875, 1.849609375, 1.9775390625, 2.10546875, 2.2333984375, 2.361328125, 2.4892578125, 2.6171875, 2.7451171875, 2.873046875, 3.0009765625, 3.12890625, 3.2568359375, 3.384765625, 3.5126953125, 3.640625, 3.7685546875, 3.896484375, 4.0244140625, 4.15234375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 5.0, 6.0, 8.0, 7.0, 7.0, 18.0, 17.0, 21.0, 31.0, 25.0, 33.0, 45.0, 51.0, 64.0, 49.0, 65.0, 115.0, 1654.0, 315.0, 85.0, 68.0, 58.0, 41.0, 43.0, 30.0, 26.0, 39.0, 38.0, 19.0, 16.0, 15.0, 3.0, 9.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.4375, -33.593505859375, -32.74951171875, -31.905517578125, -31.0615234375, -30.217529296875, -29.37353515625, -28.529541015625, -27.685546875, -26.841552734375, -25.99755859375, -25.153564453125, -24.3095703125, -23.465576171875, -22.62158203125, -21.777587890625, -20.93359375, -20.089599609375, -19.24560546875, -18.401611328125, -17.5576171875, -16.713623046875, -15.86962890625, -15.025634765625, -14.181640625, -13.337646484375, -12.49365234375, -11.649658203125, -10.8056640625, -9.961669921875, -9.11767578125, -8.273681640625, -7.4296875, -6.585693359375, -5.74169921875, -4.897705078125, -4.0537109375, -3.209716796875, -2.36572265625, -1.521728515625, -0.677734375, 0.166259765625, 1.01025390625, 1.854248046875, 2.6982421875, 3.542236328125, 4.38623046875, 5.230224609375, 6.07421875, 6.918212890625, 7.76220703125, 8.606201171875, 9.4501953125, 10.294189453125, 11.13818359375, 11.982177734375, 12.826171875, 13.670166015625, 14.51416015625, 15.358154296875, 16.2021484375, 17.046142578125, 17.89013671875, 18.734130859375, 19.578125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 12.0, 24.0, 50.0, 67.0, 157.0, 308.0, 670.0, 14970.0, 3127447.0, 1139.0, 398.0, 198.0, 107.0, 58.0, 36.0, 25.0, 13.0, 11.0, 10.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.5, -132.951171875, -128.40234375, -123.853515625, -119.3046875, -114.755859375, -110.20703125, -105.658203125, -101.109375, -96.560546875, -92.01171875, -87.462890625, -82.9140625, -78.365234375, -73.81640625, -69.267578125, -64.71875, -60.169921875, -55.62109375, -51.072265625, -46.5234375, -41.974609375, -37.42578125, -32.876953125, -28.328125, -23.779296875, -19.23046875, -14.681640625, -10.1328125, -5.583984375, -1.03515625, 3.513671875, 8.0625, 12.611328125, 17.16015625, 21.708984375, 26.2578125, 30.806640625, 35.35546875, 39.904296875, 44.453125, 49.001953125, 53.55078125, 58.099609375, 62.6484375, 67.197265625, 71.74609375, 76.294921875, 80.84375, 85.392578125, 89.94140625, 94.490234375, 99.0390625, 103.587890625, 108.13671875, 112.685546875, 117.234375, 121.783203125, 126.33203125, 130.880859375, 135.4296875, 139.978515625, 144.52734375, 149.076171875, 153.625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 83.0, 932.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.15531921386719, -40.69756317138672, -28.239810943603516, -15.782058715820312, -3.3243026733398438, 9.133453369140625, 21.591201782226562, 34.04895782470703, 46.5067138671875, 58.96446990966797, 71.42222595214844, 83.87997436523438, 96.33773040771484, 108.79548645019531, 121.25323486328125, 133.71099853515625, 146.1687469482422, 158.62649536132812, 171.08425903320312, 183.54200744628906, 195.999755859375, 208.45751953125, 220.91526794433594, 233.37301635742188, 245.83078002929688, 258.2885437011719, 270.74627685546875, 283.20404052734375, 295.66180419921875, 308.11956787109375, 320.5773010253906, 333.0350646972656, 345.4927978515625, 357.9505615234375, 370.4082946777344, 382.8660583496094, 395.3238220214844, 407.78155517578125, 420.23931884765625, 432.69708251953125, 445.15484619140625, 457.61260986328125, 470.0703430175781, 482.5281066894531, 494.9858703613281, 507.443603515625, 519.9013671875, 532.359130859375, 544.81689453125, 557.274658203125, 569.732421875, 582.190185546875, 594.6478881835938, 607.1056518554688, 619.5634155273438, 632.0211791992188, 644.4788818359375, 656.9366455078125, 669.3944091796875, 681.8521728515625, 694.3098754882812, 706.7676391601562, 719.2254028320312, 731.6831665039062, 744.1409301757812]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 6.0, 4.0, 9.0, 2.0, 11.0, 8.0, 13.0, 4.0, 14.0, 14.0, 21.0, 31.0, 27.0, 21.0, 36.0, 26.0, 36.0, 40.0, 39.0, 34.0, 38.0, 47.0, 45.0, 35.0, 44.0, 32.0, 44.0, 39.0, 31.0, 27.0, 26.0, 22.0, 20.0, 25.0, 23.0, 20.0, 14.0, 8.0, 13.0, 13.0, 7.0, 5.0, 10.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0], "bins": [-68.06098937988281, -66.08135223388672, -64.10171508789062, -62.1220817565918, -60.1424446105957, -58.16280746459961, -56.18317413330078, -54.20353698730469, -52.223899841308594, -50.2442626953125, -48.264625549316406, -46.28499221801758, -44.305355072021484, -42.32571792602539, -40.34608459472656, -38.36644744873047, -36.386810302734375, -34.40717315673828, -32.42753601074219, -30.44790267944336, -28.468265533447266, -26.488628387451172, -24.50899314880371, -22.52935791015625, -20.549720764160156, -18.570083618164062, -16.5904483795166, -14.610812187194824, -12.631175994873047, -10.65153980255127, -8.671903610229492, -6.692267417907715, -4.7126312255859375, -2.73299503326416, -0.7533588409423828, 1.2262773513793945, 3.205913543701172, 5.185549736022949, 7.165185928344727, 9.144822120666504, 11.124458312988281, 13.104094505310059, 15.083730697631836, 17.063365936279297, 19.04300308227539, 21.022640228271484, 23.002275466918945, 24.981910705566406, 26.9615478515625, 28.941184997558594, 30.920820236206055, 32.900455474853516, 34.88009262084961, 36.8597297668457, 38.83936309814453, 40.819000244140625, 42.79863739013672, 44.77827453613281, 46.757911682128906, 48.737545013427734, 50.71718215942383, 52.69681930541992, 54.67645263671875, 56.656089782714844, 58.63572692871094]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 10.0, 6.0, 9.0, 8.0, 7.0, 11.0, 20.0, 17.0, 19.0, 21.0, 29.0, 29.0, 39.0, 31.0, 28.0, 44.0, 40.0, 33.0, 38.0, 46.0, 41.0, 31.0, 36.0, 41.0, 33.0, 47.0, 30.0, 36.0, 25.0, 25.0, 30.0, 14.0, 17.0, 23.0, 17.0, 12.0, 12.0, 14.0, 7.0, 5.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7265625, -6.49652099609375, -6.2664794921875, -6.03643798828125, -5.806396484375, -5.57635498046875, -5.3463134765625, -5.11627197265625, -4.88623046875, -4.65618896484375, -4.4261474609375, -4.19610595703125, -3.966064453125, -3.73602294921875, -3.5059814453125, -3.27593994140625, -3.0458984375, -2.81585693359375, -2.5858154296875, -2.35577392578125, -2.125732421875, -1.89569091796875, -1.6656494140625, -1.43560791015625, -1.20556640625, -0.97552490234375, -0.7454833984375, -0.51544189453125, -0.285400390625, -0.05535888671875, 0.1746826171875, 0.40472412109375, 0.634765625, 0.86480712890625, 1.0948486328125, 1.32489013671875, 1.554931640625, 1.78497314453125, 2.0150146484375, 2.24505615234375, 2.47509765625, 2.70513916015625, 2.9351806640625, 3.16522216796875, 3.395263671875, 3.62530517578125, 3.8553466796875, 4.08538818359375, 4.3154296875, 4.54547119140625, 4.7755126953125, 5.00555419921875, 5.235595703125, 5.46563720703125, 5.6956787109375, 5.92572021484375, 6.15576171875, 6.38580322265625, 6.6158447265625, 6.84588623046875, 7.075927734375, 7.30596923828125, 7.5360107421875, 7.76605224609375, 7.99609375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 6.0, 7.0, 12.0, 8.0, 12.0, 19.0, 24.0, 21.0, 38.0, 45.0, 59.0, 87.0, 122.0, 287.0, 631.0, 2212.0, 16573.0, 467000.0, 3090810.0, 592580.0, 19821.0, 2493.0, 629.0, 257.0, 143.0, 86.0, 56.0, 48.0, 28.0, 22.0, 26.0, 14.0, 25.0, 15.0, 15.0, 6.0, 6.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.984375, -17.37548828125, -16.7666015625, -16.15771484375, -15.548828125, -14.93994140625, -14.3310546875, -13.72216796875, -13.11328125, -12.50439453125, -11.8955078125, -11.28662109375, -10.677734375, -10.06884765625, -9.4599609375, -8.85107421875, -8.2421875, -7.63330078125, -7.0244140625, -6.41552734375, -5.806640625, -5.19775390625, -4.5888671875, -3.97998046875, -3.37109375, -2.76220703125, -2.1533203125, -1.54443359375, -0.935546875, -0.32666015625, 0.2822265625, 0.89111328125, 1.5, 2.10888671875, 2.7177734375, 3.32666015625, 3.935546875, 4.54443359375, 5.1533203125, 5.76220703125, 6.37109375, 6.97998046875, 7.5888671875, 8.19775390625, 8.806640625, 9.41552734375, 10.0244140625, 10.63330078125, 11.2421875, 11.85107421875, 12.4599609375, 13.06884765625, 13.677734375, 14.28662109375, 14.8955078125, 15.50439453125, 16.11328125, 16.72216796875, 17.3310546875, 17.93994140625, 18.548828125, 19.15771484375, 19.7666015625, 20.37548828125, 20.984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 16.0, 10.0, 14.0, 30.0, 37.0, 46.0, 60.0, 94.0, 142.0, 177.0, 245.0, 358.0, 457.0, 557.0, 448.0, 400.0, 270.0, 211.0, 147.0, 118.0, 68.0, 51.0, 31.0, 26.0, 17.0, 7.0, 9.0, 8.0, 12.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.34375, -13.860595703125, -13.37744140625, -12.894287109375, -12.4111328125, -11.927978515625, -11.44482421875, -10.961669921875, -10.478515625, -9.995361328125, -9.51220703125, -9.029052734375, -8.5458984375, -8.062744140625, -7.57958984375, -7.096435546875, -6.61328125, -6.130126953125, -5.64697265625, -5.163818359375, -4.6806640625, -4.197509765625, -3.71435546875, -3.231201171875, -2.748046875, -2.264892578125, -1.78173828125, -1.298583984375, -0.8154296875, -0.332275390625, 0.15087890625, 0.634033203125, 1.1171875, 1.600341796875, 2.08349609375, 2.566650390625, 3.0498046875, 3.532958984375, 4.01611328125, 4.499267578125, 4.982421875, 5.465576171875, 5.94873046875, 6.431884765625, 6.9150390625, 7.398193359375, 7.88134765625, 8.364501953125, 8.84765625, 9.330810546875, 9.81396484375, 10.297119140625, 10.7802734375, 11.263427734375, 11.74658203125, 12.229736328125, 12.712890625, 13.196044921875, 13.67919921875, 14.162353515625, 14.6455078125, 15.128662109375, 15.61181640625, 16.094970703125, 16.578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 10.0, 5.0, 17.0, 12.0, 19.0, 30.0, 37.0, 41.0, 31.0, 48.0, 77.0, 94.0, 128.0, 161.0, 243.0, 369.0, 684.0, 2783.0, 1188613.0, 2994263.0, 4373.0, 736.0, 389.0, 272.0, 183.0, 132.0, 111.0, 89.0, 62.0, 52.0, 46.0, 32.0, 40.0, 27.0, 15.0, 16.0, 9.0, 5.0, 5.0, 2.0, 0.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.375, -56.43359375, -54.4921875, -52.55078125, -50.609375, -48.66796875, -46.7265625, -44.78515625, -42.84375, -40.90234375, -38.9609375, -37.01953125, -35.078125, -33.13671875, -31.1953125, -29.25390625, -27.3125, -25.37109375, -23.4296875, -21.48828125, -19.546875, -17.60546875, -15.6640625, -13.72265625, -11.78125, -9.83984375, -7.8984375, -5.95703125, -4.015625, -2.07421875, -0.1328125, 1.80859375, 3.75, 5.69140625, 7.6328125, 9.57421875, 11.515625, 13.45703125, 15.3984375, 17.33984375, 19.28125, 21.22265625, 23.1640625, 25.10546875, 27.046875, 28.98828125, 30.9296875, 32.87109375, 34.8125, 36.75390625, 38.6953125, 40.63671875, 42.578125, 44.51953125, 46.4609375, 48.40234375, 50.34375, 52.28515625, 54.2265625, 56.16796875, 58.109375, 60.05078125, 61.9921875, 63.93359375, 65.875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 9.0, 73.0, 203.0, 356.0, 242.0, 103.0, 21.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-255.10964965820312, -250.26254272460938, -245.4154510498047, -240.56834411621094, -235.7212371826172, -230.87413024902344, -226.02703857421875, -221.179931640625, -216.33282470703125, -211.4857177734375, -206.6386260986328, -201.79151916503906, -196.9444122314453, -192.09730529785156, -187.25021362304688, -182.40310668945312, -177.55599975585938, -172.70889282226562, -167.86180114746094, -163.0146942138672, -158.16758728027344, -153.3204803466797, -148.473388671875, -143.62628173828125, -138.77919006347656, -133.9320831298828, -129.08499145507812, -124.23788452148438, -119.39077758789062, -114.5436782836914, -109.69657897949219, -104.84947204589844, -100.00234985351562, -95.1552505493164, -90.30814361572266, -85.46104431152344, -80.61393737792969, -75.76683807373047, -70.91973876953125, -66.0726318359375, -61.22553253173828, -56.3784294128418, -51.53132629394531, -46.684226989746094, -41.837120056152344, -36.990020751953125, -32.14291763305664, -27.295814514160156, -22.448711395263672, -17.601608276367188, -12.75450611114502, -7.907403945922852, -3.060300827026367, 1.7868022918701172, 6.633903503417969, 11.481006622314453, 16.328109741210938, 21.175212860107422, 26.022315979003906, 30.869417190551758, 35.716522216796875, 40.563621520996094, 45.41072463989258, 50.25782775878906, 55.10493087768555]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 11.0, 13.0, 3.0, 6.0, 12.0, 14.0, 17.0, 20.0, 25.0, 30.0, 20.0, 23.0, 32.0, 31.0, 52.0, 34.0, 41.0, 39.0, 28.0, 40.0, 33.0, 40.0, 45.0, 51.0, 33.0, 31.0, 29.0, 30.0, 34.0, 15.0, 21.0, 24.0, 24.0, 18.0, 16.0, 14.0, 6.0, 13.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.07752990722656, -37.707191467285156, -36.336856842041016, -34.96651840209961, -33.59618377685547, -32.22584533691406, -30.855510711669922, -29.485172271728516, -28.114837646484375, -26.7445011138916, -25.374164581298828, -24.003828048706055, -22.63349151611328, -21.263154983520508, -19.892818450927734, -18.522480010986328, -17.152143478393555, -15.781806945800781, -14.411470413208008, -13.041133880615234, -11.670797348022461, -10.300460815429688, -8.930123329162598, -7.559786796569824, -6.189450263977051, -4.819113731384277, -3.448776960372925, -2.0784401893615723, -0.7081036567687988, 0.6622328758239746, 2.0325698852539062, 3.4029064178466797, 4.773242950439453, 6.143579483032227, 7.513916015625, 8.884252548217773, 10.254589080810547, 11.62492561340332, 12.99526309967041, 14.365599632263184, 15.735936164855957, 17.106273651123047, 18.47661018371582, 19.846946716308594, 21.217283248901367, 22.58761978149414, 23.957956314086914, 25.328292846679688, 26.69862937927246, 28.068965911865234, 29.439302444458008, 30.80963897705078, 32.17997741699219, 33.55031204223633, 34.920650482177734, 36.290985107421875, 37.66132354736328, 39.03166198730469, 40.40199661254883, 41.772335052490234, 43.142669677734375, 44.51300811767578, 45.88334274291992, 47.25368118286133, 48.62401580810547]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 8.0, 10.0, 10.0, 5.0, 17.0, 11.0, 27.0, 17.0, 20.0, 20.0, 20.0, 23.0, 35.0, 34.0, 34.0, 40.0, 40.0, 49.0, 46.0, 43.0, 38.0, 29.0, 45.0, 46.0, 38.0, 33.0, 31.0, 34.0, 26.0, 21.0, 33.0, 17.0, 18.0, 15.0, 15.0, 9.0, 6.0, 8.0, 10.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.67578125, -6.4493408203125, -6.222900390625, -5.9964599609375, -5.77001953125, -5.5435791015625, -5.317138671875, -5.0906982421875, -4.8642578125, -4.6378173828125, -4.411376953125, -4.1849365234375, -3.95849609375, -3.7320556640625, -3.505615234375, -3.2791748046875, -3.052734375, -2.8262939453125, -2.599853515625, -2.3734130859375, -2.14697265625, -1.9205322265625, -1.694091796875, -1.4676513671875, -1.2412109375, -1.0147705078125, -0.788330078125, -0.5618896484375, -0.33544921875, -0.1090087890625, 0.117431640625, 0.3438720703125, 0.5703125, 0.7967529296875, 1.023193359375, 1.2496337890625, 1.47607421875, 1.7025146484375, 1.928955078125, 2.1553955078125, 2.3818359375, 2.6082763671875, 2.834716796875, 3.0611572265625, 3.28759765625, 3.5140380859375, 3.740478515625, 3.9669189453125, 4.193359375, 4.4197998046875, 4.646240234375, 4.8726806640625, 5.09912109375, 5.3255615234375, 5.552001953125, 5.7784423828125, 6.0048828125, 6.2313232421875, 6.457763671875, 6.6842041015625, 6.91064453125, 7.1370849609375, 7.363525390625, 7.5899658203125, 7.81640625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 11.0, 10.0, 16.0, 19.0, 28.0, 35.0, 68.0, 100.0, 123.0, 163.0, 278.0, 389.0, 605.0, 839.0, 1200.0, 1817.0, 2682.0, 3899.0, 5622.0, 8425.0, 12382.0, 18411.0, 27533.0, 43018.0, 70731.0, 131482.0, 317189.0, 171069.0, 84513.0, 50210.0, 31828.0, 20500.0, 13649.0, 9294.0, 6298.0, 4266.0, 3093.0, 2113.0, 1392.0, 1006.0, 723.0, 513.0, 317.0, 245.0, 170.0, 89.0, 68.0, 49.0, 34.0, 14.0, 9.0, 11.0, 3.0, 7.0, 4.0, 2.0, 1.0], "bins": [-1.576171875, -1.5293426513671875, -1.482513427734375, -1.4356842041015625, -1.38885498046875, -1.3420257568359375, -1.295196533203125, -1.2483673095703125, -1.2015380859375, -1.1547088623046875, -1.107879638671875, -1.0610504150390625, -1.01422119140625, -0.9673919677734375, -0.920562744140625, -0.8737335205078125, -0.826904296875, -0.7800750732421875, -0.733245849609375, -0.6864166259765625, -0.63958740234375, -0.5927581787109375, -0.545928955078125, -0.4990997314453125, -0.4522705078125, -0.4054412841796875, -0.358612060546875, -0.3117828369140625, -0.26495361328125, -0.2181243896484375, -0.171295166015625, -0.1244659423828125, -0.07763671875, -0.0308074951171875, 0.016021728515625, 0.0628509521484375, 0.10968017578125, 0.1565093994140625, 0.203338623046875, 0.2501678466796875, 0.2969970703125, 0.3438262939453125, 0.390655517578125, 0.4374847412109375, 0.48431396484375, 0.5311431884765625, 0.577972412109375, 0.6248016357421875, 0.671630859375, 0.7184600830078125, 0.765289306640625, 0.8121185302734375, 0.85894775390625, 0.9057769775390625, 0.952606201171875, 0.9994354248046875, 1.0462646484375, 1.0930938720703125, 1.139923095703125, 1.1867523193359375, 1.23358154296875, 1.2804107666015625, 1.327239990234375, 1.3740692138671875, 1.4208984375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 11.0, 3.0, 10.0, 23.0, 10.0, 17.0, 22.0, 36.0, 31.0, 25.0, 37.0, 35.0, 46.0, 41.0, 40.0, 51.0, 48.0, 1071.0, 40.0, 34.0, 38.0, 41.0, 41.0, 33.0, 28.0, 23.0, 33.0, 26.0, 22.0, 16.0, 16.0, 16.0, 11.0, 16.0, 8.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.25396728515625, -4.0977783203125, -3.94158935546875, -3.785400390625, -3.62921142578125, -3.4730224609375, -3.31683349609375, -3.16064453125, -3.00445556640625, -2.8482666015625, -2.69207763671875, -2.535888671875, -2.37969970703125, -2.2235107421875, -2.06732177734375, -1.9111328125, -1.75494384765625, -1.5987548828125, -1.44256591796875, -1.286376953125, -1.13018798828125, -0.9739990234375, -0.81781005859375, -0.66162109375, -0.50543212890625, -0.3492431640625, -0.19305419921875, -0.036865234375, 0.11932373046875, 0.2755126953125, 0.43170166015625, 0.587890625, 0.74407958984375, 0.9002685546875, 1.05645751953125, 1.212646484375, 1.36883544921875, 1.5250244140625, 1.68121337890625, 1.83740234375, 1.99359130859375, 2.1497802734375, 2.30596923828125, 2.462158203125, 2.61834716796875, 2.7745361328125, 2.93072509765625, 3.0869140625, 3.24310302734375, 3.3992919921875, 3.55548095703125, 3.711669921875, 3.86785888671875, 4.0240478515625, 4.18023681640625, 4.33642578125, 4.49261474609375, 4.6488037109375, 4.80499267578125, 4.961181640625, 5.11737060546875, 5.2735595703125, 5.42974853515625, 5.5859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 5.0, 17.0, 13.0, 26.0, 39.0, 47.0, 73.0, 109.0, 134.0, 238.0, 340.0, 596.0, 808.0, 1319.0, 2051.0, 3252.0, 5186.0, 8341.0, 13567.0, 21835.0, 36084.0, 60822.0, 107834.0, 274596.0, 1293668.0, 109596.0, 61251.0, 36496.0, 22296.0, 13685.0, 8415.0, 5199.0, 3244.0, 2019.0, 1324.0, 866.0, 561.0, 388.0, 258.0, 176.0, 131.0, 65.0, 45.0, 41.0, 27.0, 19.0, 10.0, 3.0, 9.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.65625, -1.6045074462890625, -1.552764892578125, -1.5010223388671875, -1.44927978515625, -1.3975372314453125, -1.345794677734375, -1.2940521240234375, -1.2423095703125, -1.1905670166015625, -1.138824462890625, -1.0870819091796875, -1.03533935546875, -0.9835968017578125, -0.931854248046875, -0.8801116943359375, -0.828369140625, -0.7766265869140625, -0.724884033203125, -0.6731414794921875, -0.62139892578125, -0.5696563720703125, -0.517913818359375, -0.4661712646484375, -0.4144287109375, -0.3626861572265625, -0.310943603515625, -0.2592010498046875, -0.20745849609375, -0.1557159423828125, -0.103973388671875, -0.0522308349609375, -0.00048828125, 0.0512542724609375, 0.102996826171875, 0.1547393798828125, 0.20648193359375, 0.2582244873046875, 0.309967041015625, 0.3617095947265625, 0.4134521484375, 0.4651947021484375, 0.516937255859375, 0.5686798095703125, 0.62042236328125, 0.6721649169921875, 0.723907470703125, 0.7756500244140625, 0.827392578125, 0.8791351318359375, 0.930877685546875, 0.9826202392578125, 1.03436279296875, 1.0861053466796875, 1.137847900390625, 1.1895904541015625, 1.2413330078125, 1.2930755615234375, 1.344818115234375, 1.3965606689453125, 1.44830322265625, 1.5000457763671875, 1.551788330078125, 1.6035308837890625, 1.6552734375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 16.0, 12.0, 21.0, 16.0, 21.0, 26.0, 27.0, 37.0, 38.0, 63.0, 85.0, 118.0, 124.0, 80.0, 59.0, 42.0, 42.0, 34.0, 29.0, 27.0, 9.0, 18.0, 16.0, 5.0, 5.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00116729736328125, -0.001133054494857788, -0.0010988116264343262, -0.0010645687580108643, -0.0010303258895874023, -0.0009960830211639404, -0.0009618401527404785, -0.0009275972843170166, -0.0008933544158935547, -0.0008591115474700928, -0.0008248686790466309, -0.0007906258106231689, -0.000756382942199707, -0.0007221400737762451, -0.0006878972053527832, -0.0006536543369293213, -0.0006194114685058594, -0.0005851686000823975, -0.0005509257316589355, -0.0005166828632354736, -0.0004824399948120117, -0.0004481971263885498, -0.0004139542579650879, -0.000379711389541626, -0.00034546852111816406, -0.00031122565269470215, -0.00027698278427124023, -0.00024273991584777832, -0.0002084970474243164, -0.0001742541790008545, -0.00014001131057739258, -0.00010576844215393066, -7.152557373046875e-05, -3.7282705307006836e-05, -3.039836883544922e-06, 3.120303153991699e-05, 6.54458999633789e-05, 9.968876838684082e-05, 0.00013393163681030273, 0.00016817450523376465, 0.00020241737365722656, 0.00023666024208068848, 0.0002709031105041504, 0.0003051459789276123, 0.0003393888473510742, 0.00037363171577453613, 0.00040787458419799805, 0.00044211745262145996, 0.0004763603210449219, 0.0005106031894683838, 0.0005448460578918457, 0.0005790889263153076, 0.0006133317947387695, 0.0006475746631622314, 0.0006818175315856934, 0.0007160604000091553, 0.0007503032684326172, 0.0007845461368560791, 0.000818789005279541, 0.0008530318737030029, 0.0008872747421264648, 0.0009215176105499268, 0.0009557604789733887, 0.0009900033473968506, 0.0010242462158203125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 12.0, 12.0, 16.0, 30.0, 29.0, 33.0, 73.0, 93.0, 191.0, 558.0, 30507.0, 1015345.0, 1029.0, 235.0, 121.0, 62.0, 57.0, 38.0, 24.0, 21.0, 19.0, 13.0, 9.0, 5.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271453857421875, -0.026245832443237305, -0.02534627914428711, -0.024446725845336914, -0.02354717254638672, -0.022647619247436523, -0.021748065948486328, -0.020848512649536133, -0.019948959350585938, -0.019049406051635742, -0.018149852752685547, -0.01725029945373535, -0.016350746154785156, -0.015451192855834961, -0.014551639556884766, -0.01365208625793457, -0.012752532958984375, -0.01185297966003418, -0.010953426361083984, -0.010053873062133789, -0.009154319763183594, -0.008254766464233398, -0.007355213165283203, -0.006455659866333008, -0.0055561065673828125, -0.004656553268432617, -0.003756999969482422, -0.0028574466705322266, -0.0019578933715820312, -0.001058340072631836, -0.00015878677368164062, 0.0007407665252685547, 0.00164031982421875, 0.0025398731231689453, 0.0034394264221191406, 0.004338979721069336, 0.005238533020019531, 0.0061380863189697266, 0.007037639617919922, 0.007937192916870117, 0.008836746215820312, 0.009736299514770508, 0.010635852813720703, 0.011535406112670898, 0.012434959411621094, 0.013334512710571289, 0.014234066009521484, 0.01513361930847168, 0.016033172607421875, 0.01693272590637207, 0.017832279205322266, 0.01873183250427246, 0.019631385803222656, 0.02053093910217285, 0.021430492401123047, 0.022330045700073242, 0.023229598999023438, 0.024129152297973633, 0.025028705596923828, 0.025928258895874023, 0.02682781219482422, 0.027727365493774414, 0.02862691879272461, 0.029526472091674805, 0.030426025390625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 14.0, 66.0, 207.0, 372.0, 228.0, 95.0, 27.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013643455458804965, -0.0013225041329860687, -0.0012806628365069628, -0.001238821423612535, -0.001196980127133429, -0.0011551387142390013, -0.0011132974177598953, -0.0010714560048654675, -0.0010296147083863616, -0.0009877732954919338, -0.0009459319990128279, -0.000904090644326061, -0.0008622492896392941, -0.0008204079349525273, -0.0007785665802657604, -0.0007367251673713326, -0.0006948838126845658, -0.0006530424579977989, -0.0006112011033110321, -0.0005693597486242652, -0.0005275183939374983, -0.00048567703925073147, -0.00044383565546013415, -0.0004019943007733673, -0.0003601529460866004, -0.00031831159139983356, -0.0002764702367130667, -0.0002346288674743846, -0.00019278751278761774, -0.00015094615810085088, -0.00010910478886216879, -6.726343417540193e-05, -2.5422079488635063e-05, 1.6419278836110607e-05, 5.826063716085628e-05, 0.00010010199912358075, 0.00014194335381034762, 0.00018378470849711448, 0.00022562607773579657, 0.00026746743242256343, 0.0003093087871093303, 0.00035115014179609716, 0.000392991496482864, 0.00043483288027346134, 0.0004766742349602282, 0.0005185155896469951, 0.0005603569443337619, 0.0006021982990205288, 0.0006440396537072957, 0.0006858810083940625, 0.0007277223630808294, 0.0007695637177675962, 0.0008114050724543631, 0.00085324642714113, 0.0008950878400355577, 0.0009369291365146637, 0.0009787705494090915, 0.0010206119623035192, 0.0010624532587826252, 0.001104294671677053, 0.001146135968156159, 0.0011879773810505867, 0.0012298186775296926, 0.0012716600904241204, 0.0013135013869032264]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 9.0, 7.0, 18.0, 10.0, 19.0, 15.0, 19.0, 24.0, 24.0, 28.0, 24.0, 23.0, 30.0, 32.0, 33.0, 35.0, 39.0, 37.0, 40.0, 41.0, 47.0, 43.0, 42.0, 41.0, 42.0, 26.0, 36.0, 34.0, 27.0, 35.0, 20.0, 17.0, 11.0, 15.0, 11.0, 9.0, 9.0, 4.0, 8.0, 2.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.00046330690383911133, -0.0004499778151512146, -0.00043664872646331787, -0.00042331963777542114, -0.0004099905490875244, -0.0003966614603996277, -0.00038333237171173096, -0.00037000328302383423, -0.0003566741943359375, -0.00034334510564804077, -0.00033001601696014404, -0.0003166869282722473, -0.0003033578395843506, -0.00029002875089645386, -0.00027669966220855713, -0.0002633705735206604, -0.00025004148483276367, -0.00023671239614486694, -0.00022338330745697021, -0.00021005421876907349, -0.00019672513008117676, -0.00018339604139328003, -0.0001700669527053833, -0.00015673786401748657, -0.00014340877532958984, -0.00013007968664169312, -0.00011675059795379639, -0.00010342150926589966, -9.009242057800293e-05, -7.67633318901062e-05, -6.343424320220947e-05, -5.0105154514312744e-05, -3.6776065826416016e-05, -2.3446977138519287e-05, -1.0117888450622559e-05, 3.21120023727417e-06, 1.65402889251709e-05, 2.9869377613067627e-05, 4.3198466300964355e-05, 5.6527554988861084e-05, 6.985664367675781e-05, 8.318573236465454e-05, 9.651482105255127e-05, 0.000109843909740448, 0.00012317299842834473, 0.00013650208711624146, 0.00014983117580413818, 0.0001631602644920349, 0.00017648935317993164, 0.00018981844186782837, 0.0002031475305557251, 0.00021647661924362183, 0.00022980570793151855, 0.00024313479661941528, 0.000256463885307312, 0.00026979297399520874, 0.00028312206268310547, 0.0002964511513710022, 0.0003097802400588989, 0.00032310932874679565, 0.0003364384174346924, 0.0003497675061225891, 0.00036309659481048584, 0.00037642568349838257, 0.0003897547721862793]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 8.0, 10.0, 10.0, 5.0, 17.0, 11.0, 27.0, 17.0, 20.0, 20.0, 20.0, 23.0, 35.0, 34.0, 34.0, 40.0, 40.0, 49.0, 46.0, 43.0, 38.0, 29.0, 45.0, 46.0, 38.0, 33.0, 31.0, 34.0, 26.0, 21.0, 33.0, 17.0, 18.0, 15.0, 15.0, 9.0, 6.0, 8.0, 10.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.67578125, -6.4493408203125, -6.222900390625, -5.9964599609375, -5.77001953125, -5.5435791015625, -5.317138671875, -5.0906982421875, -4.8642578125, -4.6378173828125, -4.411376953125, -4.1849365234375, -3.95849609375, -3.7320556640625, -3.505615234375, -3.2791748046875, -3.052734375, -2.8262939453125, -2.599853515625, -2.3734130859375, -2.14697265625, -1.9205322265625, -1.694091796875, -1.4676513671875, -1.2412109375, -1.0147705078125, -0.788330078125, -0.5618896484375, -0.33544921875, -0.1090087890625, 0.117431640625, 0.3438720703125, 0.5703125, 0.7967529296875, 1.023193359375, 1.2496337890625, 1.47607421875, 1.7025146484375, 1.928955078125, 2.1553955078125, 2.3818359375, 2.6082763671875, 2.834716796875, 3.0611572265625, 3.28759765625, 3.5140380859375, 3.740478515625, 3.9669189453125, 4.193359375, 4.4197998046875, 4.646240234375, 4.8726806640625, 5.09912109375, 5.3255615234375, 5.552001953125, 5.7784423828125, 6.0048828125, 6.2313232421875, 6.457763671875, 6.6842041015625, 6.91064453125, 7.1370849609375, 7.363525390625, 7.5899658203125, 7.81640625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 8.0, 9.0, 14.0, 14.0, 12.0, 27.0, 18.0, 50.0, 52.0, 72.0, 100.0, 151.0, 259.0, 438.0, 849.0, 1714.0, 4223.0, 11102.0, 37113.0, 176496.0, 593394.0, 168443.0, 35609.0, 10631.0, 4010.0, 1670.0, 813.0, 440.0, 260.0, 159.0, 121.0, 82.0, 59.0, 31.0, 27.0, 23.0, 17.0, 8.0, 11.0, 10.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.48046875, -6.26068115234375, -6.0408935546875, -5.82110595703125, -5.601318359375, -5.38153076171875, -5.1617431640625, -4.94195556640625, -4.72216796875, -4.50238037109375, -4.2825927734375, -4.06280517578125, -3.843017578125, -3.62322998046875, -3.4034423828125, -3.18365478515625, -2.9638671875, -2.74407958984375, -2.5242919921875, -2.30450439453125, -2.084716796875, -1.86492919921875, -1.6451416015625, -1.42535400390625, -1.20556640625, -0.98577880859375, -0.7659912109375, -0.54620361328125, -0.326416015625, -0.10662841796875, 0.1131591796875, 0.33294677734375, 0.552734375, 0.77252197265625, 0.9923095703125, 1.21209716796875, 1.431884765625, 1.65167236328125, 1.8714599609375, 2.09124755859375, 2.31103515625, 2.53082275390625, 2.7506103515625, 2.97039794921875, 3.190185546875, 3.40997314453125, 3.6297607421875, 3.84954833984375, 4.0693359375, 4.28912353515625, 4.5089111328125, 4.72869873046875, 4.948486328125, 5.16827392578125, 5.3880615234375, 5.60784912109375, 5.82763671875, 6.04742431640625, 6.2672119140625, 6.48699951171875, 6.706787109375, 6.92657470703125, 7.1463623046875, 7.36614990234375, 7.5859375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 12.0, 10.0, 11.0, 13.0, 14.0, 14.0, 18.0, 30.0, 23.0, 39.0, 36.0, 35.0, 37.0, 43.0, 43.0, 62.0, 143.0, 1705.0, 262.0, 86.0, 42.0, 36.0, 40.0, 36.0, 31.0, 34.0, 28.0, 24.0, 17.0, 19.0, 16.0, 18.0, 13.0, 12.0, 7.0, 8.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.890625, -22.166748046875, -21.44287109375, -20.718994140625, -19.9951171875, -19.271240234375, -18.54736328125, -17.823486328125, -17.099609375, -16.375732421875, -15.65185546875, -14.927978515625, -14.2041015625, -13.480224609375, -12.75634765625, -12.032470703125, -11.30859375, -10.584716796875, -9.86083984375, -9.136962890625, -8.4130859375, -7.689208984375, -6.96533203125, -6.241455078125, -5.517578125, -4.793701171875, -4.06982421875, -3.345947265625, -2.6220703125, -1.898193359375, -1.17431640625, -0.450439453125, 0.2734375, 0.997314453125, 1.72119140625, 2.445068359375, 3.1689453125, 3.892822265625, 4.61669921875, 5.340576171875, 6.064453125, 6.788330078125, 7.51220703125, 8.236083984375, 8.9599609375, 9.683837890625, 10.40771484375, 11.131591796875, 11.85546875, 12.579345703125, 13.30322265625, 14.027099609375, 14.7509765625, 15.474853515625, 16.19873046875, 16.922607421875, 17.646484375, 18.370361328125, 19.09423828125, 19.818115234375, 20.5419921875, 21.265869140625, 21.98974609375, 22.713623046875, 23.4375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 13.0, 22.0, 29.0, 34.0, 41.0, 64.0, 96.0, 153.0, 231.0, 338.0, 638.0, 4799.0, 3122755.0, 14422.0, 920.0, 387.0, 240.0, 159.0, 90.0, 70.0, 47.0, 33.0, 28.0, 16.0, 22.0, 10.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-86.875, -84.62548828125, -82.3759765625, -80.12646484375, -77.876953125, -75.62744140625, -73.3779296875, -71.12841796875, -68.87890625, -66.62939453125, -64.3798828125, -62.13037109375, -59.880859375, -57.63134765625, -55.3818359375, -53.13232421875, -50.8828125, -48.63330078125, -46.3837890625, -44.13427734375, -41.884765625, -39.63525390625, -37.3857421875, -35.13623046875, -32.88671875, -30.63720703125, -28.3876953125, -26.13818359375, -23.888671875, -21.63916015625, -19.3896484375, -17.14013671875, -14.890625, -12.64111328125, -10.3916015625, -8.14208984375, -5.892578125, -3.64306640625, -1.3935546875, 0.85595703125, 3.10546875, 5.35498046875, 7.6044921875, 9.85400390625, 12.103515625, 14.35302734375, 16.6025390625, 18.85205078125, 21.1015625, 23.35107421875, 25.6005859375, 27.85009765625, 30.099609375, 32.34912109375, 34.5986328125, 36.84814453125, 39.09765625, 41.34716796875, 43.5966796875, 45.84619140625, 48.095703125, 50.34521484375, 52.5947265625, 54.84423828125, 57.09375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 25.0, 174.0, 479.0, 275.0, 53.0, 10.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.34886169433594, -98.15353393554688, -95.95820617675781, -93.76287841796875, -91.56755065917969, -89.37222290039062, -87.17689514160156, -84.9815673828125, -82.78623962402344, -80.59091186523438, -78.39558410644531, -76.20025634765625, -74.00492858886719, -71.80960083007812, -69.61427307128906, -67.4189453125, -65.22361755371094, -63.028289794921875, -60.83296203613281, -58.63763427734375, -56.44230651855469, -54.246978759765625, -52.05165100097656, -49.8563232421875, -47.660987854003906, -45.465660095214844, -43.27033233642578, -41.07500457763672, -38.879676818847656, -36.684349060058594, -34.48902130126953, -32.29369354248047, -30.098369598388672, -27.90304183959961, -25.707714080810547, -23.512386322021484, -21.317058563232422, -19.12173080444336, -16.926401138305664, -14.731073379516602, -12.535745620727539, -10.340417861938477, -8.145090103149414, -5.949761390686035, -3.7544336318969727, -1.5591058731079102, 0.6362228393554688, 2.8315505981445312, 5.026878356933594, 7.222206115722656, 9.417533874511719, 11.612862586975098, 13.80819034576416, 16.003517150878906, 18.1988468170166, 20.394174575805664, 22.589502334594727, 24.78483009338379, 26.98015785217285, 29.175487518310547, 31.37081527709961, 33.56614303588867, 35.761470794677734, 37.9567985534668, 40.15212631225586]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 2.0, 6.0, 7.0, 7.0, 4.0, 10.0, 16.0, 21.0, 27.0, 22.0, 17.0, 32.0, 25.0, 45.0, 39.0, 31.0, 50.0, 39.0, 37.0, 41.0, 64.0, 37.0, 42.0, 43.0, 38.0, 20.0, 38.0, 34.0, 20.0, 36.0, 19.0, 23.0, 24.0, 9.0, 14.0, 10.0, 12.0, 11.0, 3.0, 6.0, 2.0, 2.0, 4.0, 7.0, 0.0, 2.0, 1.0, 1.0], "bins": [-67.33386993408203, -65.44202423095703, -63.550174713134766, -61.658329010009766, -59.766483306884766, -57.8746337890625, -55.9827880859375, -54.0909423828125, -52.199092864990234, -50.307247161865234, -48.41539764404297, -46.52355194091797, -44.63170623779297, -42.7398567199707, -40.8480110168457, -38.95616149902344, -37.06431579589844, -35.17247009277344, -33.28062057495117, -31.388774871826172, -29.49692726135254, -27.605079650878906, -25.713233947753906, -23.821386337280273, -21.929542541503906, -20.037694931030273, -18.145849227905273, -16.25400161743164, -14.362154006958008, -12.470307350158691, -10.578460693359375, -8.686613082885742, -6.794765472412109, -4.902918338775635, -3.0110714435577393, -1.1192245483398438, 0.7726225852966309, 2.6644697189331055, 4.556316375732422, 6.448163986206055, 8.340010643005371, 10.231857299804688, 12.12370491027832, 14.015551567077637, 15.907398223876953, 17.799245834350586, 19.69109344482422, 21.58293914794922, 23.47478675842285, 25.366634368896484, 27.258480072021484, 29.150327682495117, 31.04217529296875, 32.93402099609375, 34.82586669921875, 36.717716217041016, 38.609561920166016, 40.501407623291016, 42.39325714111328, 44.28510284423828, 46.17694854736328, 48.06879806518555, 49.96064376831055, 51.85249328613281, 53.74433898925781]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 7.0, 7.0, 13.0, 15.0, 11.0, 23.0, 20.0, 18.0, 18.0, 33.0, 26.0, 21.0, 29.0, 45.0, 40.0, 52.0, 45.0, 41.0, 41.0, 35.0, 49.0, 40.0, 39.0, 38.0, 36.0, 28.0, 24.0, 34.0, 25.0, 34.0, 16.0, 15.0, 17.0, 16.0, 5.0, 8.0, 10.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8203125, -6.58056640625, -6.3408203125, -6.10107421875, -5.861328125, -5.62158203125, -5.3818359375, -5.14208984375, -4.90234375, -4.66259765625, -4.4228515625, -4.18310546875, -3.943359375, -3.70361328125, -3.4638671875, -3.22412109375, -2.984375, -2.74462890625, -2.5048828125, -2.26513671875, -2.025390625, -1.78564453125, -1.5458984375, -1.30615234375, -1.06640625, -0.82666015625, -0.5869140625, -0.34716796875, -0.107421875, 0.13232421875, 0.3720703125, 0.61181640625, 0.8515625, 1.09130859375, 1.3310546875, 1.57080078125, 1.810546875, 2.05029296875, 2.2900390625, 2.52978515625, 2.76953125, 3.00927734375, 3.2490234375, 3.48876953125, 3.728515625, 3.96826171875, 4.2080078125, 4.44775390625, 4.6875, 4.92724609375, 5.1669921875, 5.40673828125, 5.646484375, 5.88623046875, 6.1259765625, 6.36572265625, 6.60546875, 6.84521484375, 7.0849609375, 7.32470703125, 7.564453125, 7.80419921875, 8.0439453125, 8.28369140625, 8.5234375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 6.0, 4.0, 3.0, 6.0, 8.0, 10.0, 13.0, 19.0, 22.0, 30.0, 25.0, 26.0, 42.0, 52.0, 62.0, 75.0, 85.0, 139.0, 242.0, 411.0, 1003.0, 3935.0, 47673.0, 1287115.0, 2644278.0, 196806.0, 9052.0, 1576.0, 543.0, 280.0, 169.0, 129.0, 87.0, 68.0, 53.0, 46.0, 40.0, 48.0, 26.0, 27.0, 13.0, 14.0, 13.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.453125, -16.85546875, -16.2578125, -15.66015625, -15.0625, -14.46484375, -13.8671875, -13.26953125, -12.671875, -12.07421875, -11.4765625, -10.87890625, -10.28125, -9.68359375, -9.0859375, -8.48828125, -7.890625, -7.29296875, -6.6953125, -6.09765625, -5.5, -4.90234375, -4.3046875, -3.70703125, -3.109375, -2.51171875, -1.9140625, -1.31640625, -0.71875, -0.12109375, 0.4765625, 1.07421875, 1.671875, 2.26953125, 2.8671875, 3.46484375, 4.0625, 4.66015625, 5.2578125, 5.85546875, 6.453125, 7.05078125, 7.6484375, 8.24609375, 8.84375, 9.44140625, 10.0390625, 10.63671875, 11.234375, 11.83203125, 12.4296875, 13.02734375, 13.625, 14.22265625, 14.8203125, 15.41796875, 16.015625, 16.61328125, 17.2109375, 17.80859375, 18.40625, 19.00390625, 19.6015625, 20.19921875, 20.796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 7.0, 10.0, 6.0, 14.0, 14.0, 12.0, 30.0, 39.0, 48.0, 38.0, 78.0, 128.0, 134.0, 165.0, 222.0, 318.0, 347.0, 430.0, 426.0, 388.0, 321.0, 248.0, 164.0, 108.0, 96.0, 71.0, 47.0, 45.0, 26.0, 30.0, 20.0, 11.0, 10.0, 8.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.7421875, -14.3431396484375, -13.944091796875, -13.5450439453125, -13.14599609375, -12.7469482421875, -12.347900390625, -11.9488525390625, -11.5498046875, -11.1507568359375, -10.751708984375, -10.3526611328125, -9.95361328125, -9.5545654296875, -9.155517578125, -8.7564697265625, -8.357421875, -7.9583740234375, -7.559326171875, -7.1602783203125, -6.76123046875, -6.3621826171875, -5.963134765625, -5.5640869140625, -5.1650390625, -4.7659912109375, -4.366943359375, -3.9678955078125, -3.56884765625, -3.1697998046875, -2.770751953125, -2.3717041015625, -1.97265625, -1.5736083984375, -1.174560546875, -0.7755126953125, -0.37646484375, 0.0225830078125, 0.421630859375, 0.8206787109375, 1.2197265625, 1.6187744140625, 2.017822265625, 2.4168701171875, 2.81591796875, 3.2149658203125, 3.614013671875, 4.0130615234375, 4.412109375, 4.8111572265625, 5.210205078125, 5.6092529296875, 6.00830078125, 6.4073486328125, 6.806396484375, 7.2054443359375, 7.6044921875, 8.0035400390625, 8.402587890625, 8.8016357421875, 9.20068359375, 9.5997314453125, 9.998779296875, 10.3978271484375, 10.796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 8.0, 9.0, 18.0, 8.0, 30.0, 29.0, 27.0, 29.0, 62.0, 64.0, 95.0, 99.0, 146.0, 164.0, 217.0, 323.0, 478.0, 1307.0, 85448.0, 4086138.0, 16981.0, 925.0, 391.0, 269.0, 211.0, 178.0, 131.0, 112.0, 82.0, 56.0, 48.0, 47.0, 42.0, 34.0, 15.0, 15.0, 16.0, 7.0, 10.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.5, -53.47265625, -51.4453125, -49.41796875, -47.390625, -45.36328125, -43.3359375, -41.30859375, -39.28125, -37.25390625, -35.2265625, -33.19921875, -31.171875, -29.14453125, -27.1171875, -25.08984375, -23.0625, -21.03515625, -19.0078125, -16.98046875, -14.953125, -12.92578125, -10.8984375, -8.87109375, -6.84375, -4.81640625, -2.7890625, -0.76171875, 1.265625, 3.29296875, 5.3203125, 7.34765625, 9.375, 11.40234375, 13.4296875, 15.45703125, 17.484375, 19.51171875, 21.5390625, 23.56640625, 25.59375, 27.62109375, 29.6484375, 31.67578125, 33.703125, 35.73046875, 37.7578125, 39.78515625, 41.8125, 43.83984375, 45.8671875, 47.89453125, 49.921875, 51.94921875, 53.9765625, 56.00390625, 58.03125, 60.05859375, 62.0859375, 64.11328125, 66.140625, 68.16796875, 70.1953125, 72.22265625, 74.25]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 32.0, 98.0, 211.0, 256.0, 226.0, 127.0, 41.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.27456665039062, -145.77438354492188, -142.27420043945312, -138.77401733398438, -135.2738494873047, -131.77366638183594, -128.2734832763672, -124.77330017089844, -121.27312469482422, -117.77294158935547, -114.27276611328125, -110.7725830078125, -107.27239990234375, -103.77222442626953, -100.27204132080078, -96.77186584472656, -93.27168273925781, -89.77149963378906, -86.27132415771484, -82.7711410522461, -79.27095794677734, -75.77078247070312, -72.27059936523438, -68.77041625976562, -65.27023315429688, -61.77005386352539, -58.26987075805664, -54.769691467285156, -51.26951217651367, -47.76933288574219, -44.26914978027344, -40.76897048950195, -37.26879119873047, -33.768611907958984, -30.268430709838867, -26.76824951171875, -23.268070220947266, -19.76788902282715, -16.26770782470703, -12.767528533935547, -9.26734733581543, -5.767167091369629, -2.26698637008667, 1.233194351196289, 4.73337459564209, 8.23355484008789, 11.733736038208008, 15.233915328979492, 18.73409652709961, 22.234277725219727, 25.73445701599121, 29.234638214111328, 32.73481750488281, 36.23500061035156, 39.73517990112305, 43.23535919189453, 46.73554229736328, 50.235721588134766, 53.735904693603516, 57.236083984375, 60.736263275146484, 64.23644256591797, 67.73662567138672, 71.23680114746094, 74.73698425292969]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 5.0, 14.0, 6.0, 8.0, 11.0, 20.0, 17.0, 15.0, 18.0, 18.0, 17.0, 23.0, 28.0, 31.0, 31.0, 32.0, 47.0, 35.0, 54.0, 45.0, 31.0, 38.0, 38.0, 37.0, 47.0, 37.0, 30.0, 23.0, 37.0, 22.0, 16.0, 22.0, 30.0, 20.0, 19.0, 17.0, 6.0, 15.0, 8.0, 5.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-45.651275634765625, -44.360755920410156, -43.07023620605469, -41.77971267700195, -40.489192962646484, -39.198673248291016, -37.90815353393555, -36.61763381958008, -35.327110290527344, -34.036590576171875, -32.746070861816406, -31.455549240112305, -30.165027618408203, -28.874507904052734, -27.583988189697266, -26.293468475341797, -25.002948760986328, -23.71242904663086, -22.421907424926758, -21.13138771057129, -19.840866088867188, -18.55034637451172, -17.25982666015625, -15.969305992126465, -14.67878532409668, -13.388264656066895, -12.09774398803711, -10.80722427368164, -9.516703605651855, -8.22618293762207, -6.935662746429443, -5.645142555236816, -4.354621887207031, -3.064101457595825, -1.7735810279846191, -0.4830605983734131, 0.807459831237793, 2.097980499267578, 3.388500690460205, 4.679020881652832, 5.969541549682617, 7.260062217712402, 8.550582885742188, 9.841102600097656, 11.131623268127441, 12.422143936157227, 13.712663650512695, 15.00318431854248, 16.293704986572266, 17.584224700927734, 18.874746322631836, 20.165266036987305, 21.455787658691406, 22.746307373046875, 24.036827087402344, 25.327346801757812, 26.617868423461914, 27.908388137817383, 29.198909759521484, 30.489429473876953, 31.779949188232422, 33.070472717285156, 34.360992431640625, 35.651512145996094, 36.94203186035156]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 8.0, 11.0, 10.0, 13.0, 11.0, 17.0, 22.0, 19.0, 25.0, 21.0, 18.0, 40.0, 36.0, 22.0, 36.0, 48.0, 47.0, 41.0, 39.0, 41.0, 47.0, 34.0, 30.0, 39.0, 41.0, 46.0, 18.0, 26.0, 31.0, 23.0, 22.0, 14.0, 20.0, 15.0, 13.0, 15.0, 7.0, 5.0, 5.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9453125, -6.72039794921875, -6.4954833984375, -6.27056884765625, -6.045654296875, -5.82073974609375, -5.5958251953125, -5.37091064453125, -5.14599609375, -4.92108154296875, -4.6961669921875, -4.47125244140625, -4.246337890625, -4.02142333984375, -3.7965087890625, -3.57159423828125, -3.3466796875, -3.12176513671875, -2.8968505859375, -2.67193603515625, -2.447021484375, -2.22210693359375, -1.9971923828125, -1.77227783203125, -1.54736328125, -1.32244873046875, -1.0975341796875, -0.87261962890625, -0.647705078125, -0.42279052734375, -0.1978759765625, 0.02703857421875, 0.251953125, 0.47686767578125, 0.7017822265625, 0.92669677734375, 1.151611328125, 1.37652587890625, 1.6014404296875, 1.82635498046875, 2.05126953125, 2.27618408203125, 2.5010986328125, 2.72601318359375, 2.950927734375, 3.17584228515625, 3.4007568359375, 3.62567138671875, 3.8505859375, 4.07550048828125, 4.3004150390625, 4.52532958984375, 4.750244140625, 4.97515869140625, 5.2000732421875, 5.42498779296875, 5.64990234375, 5.87481689453125, 6.0997314453125, 6.32464599609375, 6.549560546875, 6.77447509765625, 6.9993896484375, 7.22430419921875, 7.44921875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 5.0, 13.0, 11.0, 18.0, 29.0, 27.0, 46.0, 79.0, 121.0, 163.0, 236.0, 333.0, 523.0, 731.0, 1075.0, 1595.0, 2321.0, 3395.0, 5075.0, 7690.0, 11131.0, 16984.0, 26146.0, 40991.0, 67672.0, 121716.0, 296391.0, 195664.0, 93957.0, 55010.0, 33934.0, 21787.0, 14243.0, 9526.0, 6365.0, 4307.0, 2955.0, 1971.0, 1393.0, 925.0, 658.0, 434.0, 290.0, 208.0, 128.0, 101.0, 63.0, 44.0, 23.0, 27.0, 12.0, 4.0, 6.0, 5.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0], "bins": [-1.4462890625, -1.399322509765625, -1.35235595703125, -1.305389404296875, -1.2584228515625, -1.211456298828125, -1.16448974609375, -1.117523193359375, -1.070556640625, -1.023590087890625, -0.97662353515625, -0.929656982421875, -0.8826904296875, -0.835723876953125, -0.78875732421875, -0.741790771484375, -0.69482421875, -0.647857666015625, -0.60089111328125, -0.553924560546875, -0.5069580078125, -0.459991455078125, -0.41302490234375, -0.366058349609375, -0.319091796875, -0.272125244140625, -0.22515869140625, -0.178192138671875, -0.1312255859375, -0.084259033203125, -0.03729248046875, 0.009674072265625, 0.056640625, 0.103607177734375, 0.15057373046875, 0.197540283203125, 0.2445068359375, 0.291473388671875, 0.33843994140625, 0.385406494140625, 0.432373046875, 0.479339599609375, 0.52630615234375, 0.573272705078125, 0.6202392578125, 0.667205810546875, 0.71417236328125, 0.761138916015625, 0.80810546875, 0.855072021484375, 0.90203857421875, 0.949005126953125, 0.9959716796875, 1.042938232421875, 1.08990478515625, 1.136871337890625, 1.183837890625, 1.230804443359375, 1.27777099609375, 1.324737548828125, 1.3717041015625, 1.418670654296875, 1.46563720703125, 1.512603759765625, 1.5595703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 5.0, 11.0, 12.0, 14.0, 14.0, 17.0, 26.0, 26.0, 33.0, 30.0, 29.0, 43.0, 50.0, 41.0, 40.0, 44.0, 48.0, 1060.0, 43.0, 39.0, 37.0, 46.0, 37.0, 41.0, 29.0, 26.0, 32.0, 17.0, 27.0, 18.0, 15.0, 10.0, 7.0, 10.0, 13.0, 11.0, 7.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.62890625, -4.47943115234375, -4.3299560546875, -4.18048095703125, -4.031005859375, -3.88153076171875, -3.7320556640625, -3.58258056640625, -3.43310546875, -3.28363037109375, -3.1341552734375, -2.98468017578125, -2.835205078125, -2.68572998046875, -2.5362548828125, -2.38677978515625, -2.2373046875, -2.08782958984375, -1.9383544921875, -1.78887939453125, -1.639404296875, -1.48992919921875, -1.3404541015625, -1.19097900390625, -1.04150390625, -0.89202880859375, -0.7425537109375, -0.59307861328125, -0.443603515625, -0.29412841796875, -0.1446533203125, 0.00482177734375, 0.154296875, 0.30377197265625, 0.4532470703125, 0.60272216796875, 0.752197265625, 0.90167236328125, 1.0511474609375, 1.20062255859375, 1.35009765625, 1.49957275390625, 1.6490478515625, 1.79852294921875, 1.947998046875, 2.09747314453125, 2.2469482421875, 2.39642333984375, 2.5458984375, 2.69537353515625, 2.8448486328125, 2.99432373046875, 3.143798828125, 3.29327392578125, 3.4427490234375, 3.59222412109375, 3.74169921875, 3.89117431640625, 4.0406494140625, 4.19012451171875, 4.339599609375, 4.48907470703125, 4.6385498046875, 4.78802490234375, 4.9375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 7.0, 9.0, 19.0, 20.0, 30.0, 44.0, 78.0, 102.0, 142.0, 204.0, 377.0, 543.0, 751.0, 1154.0, 1751.0, 2693.0, 4200.0, 6628.0, 10142.0, 15906.0, 25080.0, 40379.0, 67413.0, 119950.0, 1320675.0, 215272.0, 103770.0, 59768.0, 36307.0, 22561.0, 14652.0, 9309.0, 6083.0, 3849.0, 2504.0, 1606.0, 1038.0, 692.0, 451.0, 323.0, 218.0, 137.0, 97.0, 62.0, 46.0, 22.0, 28.0, 10.0, 9.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.4638671875, -1.4179534912109375, -1.372039794921875, -1.3261260986328125, -1.28021240234375, -1.2342987060546875, -1.188385009765625, -1.1424713134765625, -1.0965576171875, -1.0506439208984375, -1.004730224609375, -0.9588165283203125, -0.91290283203125, -0.8669891357421875, -0.821075439453125, -0.7751617431640625, -0.729248046875, -0.6833343505859375, -0.637420654296875, -0.5915069580078125, -0.54559326171875, -0.4996795654296875, -0.453765869140625, -0.4078521728515625, -0.3619384765625, -0.3160247802734375, -0.270111083984375, -0.2241973876953125, -0.17828369140625, -0.1323699951171875, -0.086456298828125, -0.0405426025390625, 0.00537109375, 0.0512847900390625, 0.097198486328125, 0.1431121826171875, 0.18902587890625, 0.2349395751953125, 0.280853271484375, 0.3267669677734375, 0.3726806640625, 0.4185943603515625, 0.464508056640625, 0.5104217529296875, 0.55633544921875, 0.6022491455078125, 0.648162841796875, 0.6940765380859375, 0.739990234375, 0.7859039306640625, 0.831817626953125, 0.8777313232421875, 0.92364501953125, 0.9695587158203125, 1.015472412109375, 1.0613861083984375, 1.1072998046875, 1.1532135009765625, 1.199127197265625, 1.2450408935546875, 1.29095458984375, 1.3368682861328125, 1.382781982421875, 1.4286956787109375, 1.474609375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 3.0, 6.0, 10.0, 6.0, 12.0, 17.0, 17.0, 27.0, 25.0, 40.0, 48.0, 49.0, 55.0, 73.0, 56.0, 73.0, 64.0, 79.0, 67.0, 59.0, 44.0, 37.0, 21.0, 15.0, 15.0, 16.0, 12.0, 13.0, 8.0, 3.0, 6.0, 3.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007476806640625, -0.0007241517305374146, -0.0007006227970123291, -0.0006770938634872437, -0.0006535649299621582, -0.0006300359964370728, -0.0006065070629119873, -0.0005829781293869019, -0.0005594491958618164, -0.000535920262336731, -0.0005123913288116455, -0.0004888623952865601, -0.0004653334617614746, -0.00044180452823638916, -0.0004182755947113037, -0.00039474666118621826, -0.0003712177276611328, -0.00034768879413604736, -0.0003241598606109619, -0.00030063092708587646, -0.000277101993560791, -0.00025357306003570557, -0.00023004412651062012, -0.00020651519298553467, -0.00018298625946044922, -0.00015945732593536377, -0.00013592839241027832, -0.00011239945888519287, -8.887052536010742e-05, -6.534159183502197e-05, -4.1812658309936523e-05, -1.8283724784851074e-05, 5.245208740234375e-06, 2.8774142265319824e-05, 5.2303075790405273e-05, 7.583200931549072e-05, 9.936094284057617e-05, 0.00012288987636566162, 0.00014641880989074707, 0.00016994774341583252, 0.00019347667694091797, 0.00021700561046600342, 0.00024053454399108887, 0.0002640634775161743, 0.00028759241104125977, 0.0003111213445663452, 0.00033465027809143066, 0.0003581792116165161, 0.00038170814514160156, 0.000405237078666687, 0.00042876601219177246, 0.0004522949457168579, 0.00047582387924194336, 0.0004993528127670288, 0.0005228817462921143, 0.0005464106798171997, 0.0005699396133422852, 0.0005934685468673706, 0.0006169974803924561, 0.0006405264139175415, 0.000664055347442627, 0.0006875842809677124, 0.0007111132144927979, 0.0007346421480178833, 0.0007581710815429688]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 2.0, 0.0, 3.0, 11.0, 8.0, 12.0, 13.0, 16.0, 34.0, 34.0, 52.0, 72.0, 130.0, 256.0, 1016.0, 1018267.0, 27582.0, 481.0, 186.0, 106.0, 70.0, 40.0, 47.0, 21.0, 23.0, 14.0, 17.0, 9.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0236663818359375, -0.02294445037841797, -0.022222518920898438, -0.021500587463378906, -0.020778656005859375, -0.020056724548339844, -0.019334793090820312, -0.01861286163330078, -0.01789093017578125, -0.01716899871826172, -0.016447067260742188, -0.015725135803222656, -0.015003204345703125, -0.014281272888183594, -0.013559341430664062, -0.012837409973144531, -0.012115478515625, -0.011393547058105469, -0.010671615600585938, -0.009949684143066406, -0.009227752685546875, -0.008505821228027344, -0.0077838897705078125, -0.007061958312988281, -0.00634002685546875, -0.005618095397949219, -0.0048961639404296875, -0.004174232482910156, -0.003452301025390625, -0.0027303695678710938, -0.0020084381103515625, -0.0012865066528320312, -0.0005645751953125, 0.00015735626220703125, 0.0008792877197265625, 0.0016012191772460938, 0.002323150634765625, 0.0030450820922851562, 0.0037670135498046875, 0.004488945007324219, 0.00521087646484375, 0.005932807922363281, 0.0066547393798828125, 0.007376670837402344, 0.008098602294921875, 0.008820533752441406, 0.009542465209960938, 0.010264396667480469, 0.010986328125, 0.011708259582519531, 0.012430191040039062, 0.013152122497558594, 0.013874053955078125, 0.014595985412597656, 0.015317916870117188, 0.01603984832763672, 0.01676177978515625, 0.01748371124267578, 0.018205642700195312, 0.018927574157714844, 0.019649505615234375, 0.020371437072753906, 0.021093368530273438, 0.02181529998779297, 0.0225372314453125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 9.0, 71.0, 236.0, 345.0, 241.0, 73.0, 22.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016425125068053603, -0.0016039530746638775, -0.0015653936425223947, -0.0015268342103809118, -0.001488274778239429, -0.0014497153460979462, -0.0014111559139564633, -0.0013725964818149805, -0.0013340370496734977, -0.0012954776175320148, -0.001256918185390532, -0.0012183587532490492, -0.0011797993211075664, -0.0011412398889660835, -0.0011026804568246007, -0.0010641210246831179, -0.001025561592541635, -0.0009870021604001522, -0.0009484427282586694, -0.0009098832961171865, -0.0008713238639757037, -0.0008327644318342209, -0.0007942049996927381, -0.0007556455675512552, -0.0007170861354097724, -0.0006785267032682896, -0.0006399672711268067, -0.0006014078389853239, -0.0005628484068438411, -0.0005242889747023582, -0.0004857295425608754, -0.0004471701104193926, -0.0004086107946932316, -0.00037005136255174875, -0.0003314919304102659, -0.0002929324982687831, -0.00025437306612730026, -0.00021581363398581743, -0.0001772542018443346, -0.00013869476970285177, -0.00010013533756136894, -6.157590541988611e-05, -2.3016473278403282e-05, 1.5542958863079548e-05, 5.410239100456238e-05, 9.266182314604521e-05, 0.00013122125528752804, 0.00016978068742901087, 0.0002083401195704937, 0.00024689955171197653, 0.00028545898385345936, 0.0003240184159949422, 0.000362577848136425, 0.00040113728027790785, 0.0004396967124193907, 0.0004782561445608735, 0.0005168155767023563, 0.0005553750088438392, 0.000593934440985322, 0.0006324938731268048, 0.0006710533052682877, 0.0007096127374097705, 0.0007481721695512533, 0.0007867316016927361, 0.000825291033834219]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 8.0, 12.0, 7.0, 9.0, 10.0, 11.0, 8.0, 15.0, 22.0, 25.0, 25.0, 26.0, 27.0, 35.0, 36.0, 28.0, 38.0, 48.0, 38.0, 25.0, 39.0, 40.0, 40.0, 39.0, 37.0, 39.0, 36.0, 30.0, 26.0, 26.0, 20.0, 30.0, 27.0, 14.0, 18.0, 14.0, 16.0, 6.0, 19.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0], "bins": [-0.00035125017166137695, -0.00034097395837306976, -0.0003306977450847626, -0.0003204215317964554, -0.0003101453185081482, -0.000299869105219841, -0.0002895928919315338, -0.0002793166786432266, -0.00026904046535491943, -0.00025876425206661224, -0.00024848803877830505, -0.00023821182548999786, -0.00022793561220169067, -0.00021765939891338348, -0.0002073831856250763, -0.0001971069723367691, -0.00018683075904846191, -0.00017655454576015472, -0.00016627833247184753, -0.00015600211918354034, -0.00014572590589523315, -0.00013544969260692596, -0.00012517347931861877, -0.00011489726603031158, -0.0001046210527420044, -9.43448394536972e-05, -8.406862616539001e-05, -7.379241287708282e-05, -6.351619958877563e-05, -5.3239986300468445e-05, -4.2963773012161255e-05, -3.2687559723854065e-05, -2.2411346435546875e-05, -1.2135133147239685e-05, -1.8589198589324951e-06, 8.417293429374695e-06, 1.8693506717681885e-05, 2.8969720005989075e-05, 3.9245933294296265e-05, 4.9522146582603455e-05, 5.9798359870910645e-05, 7.007457315921783e-05, 8.035078644752502e-05, 9.062699973583221e-05, 0.0001009032130241394, 0.0001111794263124466, 0.00012145563960075378, 0.00013173185288906097, 0.00014200806617736816, 0.00015228427946567535, 0.00016256049275398254, 0.00017283670604228973, 0.00018311291933059692, 0.00019338913261890411, 0.0002036653459072113, 0.0002139415591955185, 0.00022421777248382568, 0.00023449398577213287, 0.00024477019906044006, 0.00025504641234874725, 0.00026532262563705444, 0.00027559883892536163, 0.0002858750522136688, 0.000296151265501976, 0.0003064274787902832]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 8.0, 11.0, 10.0, 13.0, 10.0, 18.0, 22.0, 19.0, 25.0, 21.0, 18.0, 40.0, 36.0, 22.0, 36.0, 48.0, 47.0, 41.0, 39.0, 41.0, 47.0, 34.0, 30.0, 39.0, 41.0, 46.0, 18.0, 26.0, 31.0, 23.0, 22.0, 14.0, 20.0, 15.0, 13.0, 15.0, 7.0, 5.0, 5.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9453125, -6.72039794921875, -6.4954833984375, -6.27056884765625, -6.045654296875, -5.82073974609375, -5.5958251953125, -5.37091064453125, -5.14599609375, -4.92108154296875, -4.6961669921875, -4.47125244140625, -4.246337890625, -4.02142333984375, -3.7965087890625, -3.57159423828125, -3.3466796875, -3.12176513671875, -2.8968505859375, -2.67193603515625, -2.447021484375, -2.22210693359375, -1.9971923828125, -1.77227783203125, -1.54736328125, -1.32244873046875, -1.0975341796875, -0.87261962890625, -0.647705078125, -0.42279052734375, -0.1978759765625, 0.02703857421875, 0.251953125, 0.47686767578125, 0.7017822265625, 0.92669677734375, 1.151611328125, 1.37652587890625, 1.6014404296875, 1.82635498046875, 2.05126953125, 2.27618408203125, 2.5010986328125, 2.72601318359375, 2.950927734375, 3.17584228515625, 3.4007568359375, 3.62567138671875, 3.8505859375, 4.07550048828125, 4.3004150390625, 4.52532958984375, 4.750244140625, 4.97515869140625, 5.2000732421875, 5.42498779296875, 5.64990234375, 5.87481689453125, 6.0997314453125, 6.32464599609375, 6.549560546875, 6.77447509765625, 6.9993896484375, 7.22430419921875, 7.44921875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 4.0, 4.0, 16.0, 12.0, 19.0, 23.0, 47.0, 60.0, 90.0, 184.0, 316.0, 501.0, 852.0, 1612.0, 2858.0, 5285.0, 10239.0, 21333.0, 47664.0, 120490.0, 330511.0, 307863.0, 112452.0, 44911.0, 19952.0, 9734.0, 5125.0, 2735.0, 1525.0, 894.0, 472.0, 315.0, 171.0, 117.0, 50.0, 29.0, 15.0, 13.0, 15.0, 5.0, 8.0, 11.0, 6.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3046875, -4.15606689453125, -4.0074462890625, -3.85882568359375, -3.710205078125, -3.56158447265625, -3.4129638671875, -3.26434326171875, -3.11572265625, -2.96710205078125, -2.8184814453125, -2.66986083984375, -2.521240234375, -2.37261962890625, -2.2239990234375, -2.07537841796875, -1.9267578125, -1.77813720703125, -1.6295166015625, -1.48089599609375, -1.332275390625, -1.18365478515625, -1.0350341796875, -0.88641357421875, -0.73779296875, -0.58917236328125, -0.4405517578125, -0.29193115234375, -0.143310546875, 0.00531005859375, 0.1539306640625, 0.30255126953125, 0.451171875, 0.59979248046875, 0.7484130859375, 0.89703369140625, 1.045654296875, 1.19427490234375, 1.3428955078125, 1.49151611328125, 1.64013671875, 1.78875732421875, 1.9373779296875, 2.08599853515625, 2.234619140625, 2.38323974609375, 2.5318603515625, 2.68048095703125, 2.8291015625, 2.97772216796875, 3.1263427734375, 3.27496337890625, 3.423583984375, 3.57220458984375, 3.7208251953125, 3.86944580078125, 4.01806640625, 4.16668701171875, 4.3153076171875, 4.46392822265625, 4.612548828125, 4.76116943359375, 4.9097900390625, 5.05841064453125, 5.20703125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 6.0, 11.0, 15.0, 17.0, 8.0, 14.0, 12.0, 29.0, 21.0, 34.0, 30.0, 32.0, 49.0, 46.0, 49.0, 50.0, 84.0, 321.0, 1654.0, 125.0, 63.0, 36.0, 45.0, 60.0, 31.0, 34.0, 31.0, 30.0, 22.0, 16.0, 13.0, 13.0, 7.0, 9.0, 7.0, 11.0, 3.0, 2.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.839111328125, -26.00634765625, -25.173583984375, -24.3408203125, -23.508056640625, -22.67529296875, -21.842529296875, -21.009765625, -20.177001953125, -19.34423828125, -18.511474609375, -17.6787109375, -16.845947265625, -16.01318359375, -15.180419921875, -14.34765625, -13.514892578125, -12.68212890625, -11.849365234375, -11.0166015625, -10.183837890625, -9.35107421875, -8.518310546875, -7.685546875, -6.852783203125, -6.02001953125, -5.187255859375, -4.3544921875, -3.521728515625, -2.68896484375, -1.856201171875, -1.0234375, -0.190673828125, 0.64208984375, 1.474853515625, 2.3076171875, 3.140380859375, 3.97314453125, 4.805908203125, 5.638671875, 6.471435546875, 7.30419921875, 8.136962890625, 8.9697265625, 9.802490234375, 10.63525390625, 11.468017578125, 12.30078125, 13.133544921875, 13.96630859375, 14.799072265625, 15.6318359375, 16.464599609375, 17.29736328125, 18.130126953125, 18.962890625, 19.795654296875, 20.62841796875, 21.461181640625, 22.2939453125, 23.126708984375, 23.95947265625, 24.792236328125, 25.625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 5.0, 5.0, 12.0, 9.0, 16.0, 16.0, 18.0, 14.0, 31.0, 49.0, 51.0, 61.0, 83.0, 115.0, 158.0, 238.0, 286.0, 637.0, 3092.0, 2866871.0, 270381.0, 1902.0, 522.0, 283.0, 197.0, 177.0, 111.0, 87.0, 59.0, 47.0, 40.0, 25.0, 20.0, 15.0, 20.0, 15.0, 13.0, 4.0, 4.0, 2.0, 1.0, 8.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.625, -58.662109375, -56.69921875, -54.736328125, -52.7734375, -50.810546875, -48.84765625, -46.884765625, -44.921875, -42.958984375, -40.99609375, -39.033203125, -37.0703125, -35.107421875, -33.14453125, -31.181640625, -29.21875, -27.255859375, -25.29296875, -23.330078125, -21.3671875, -19.404296875, -17.44140625, -15.478515625, -13.515625, -11.552734375, -9.58984375, -7.626953125, -5.6640625, -3.701171875, -1.73828125, 0.224609375, 2.1875, 4.150390625, 6.11328125, 8.076171875, 10.0390625, 12.001953125, 13.96484375, 15.927734375, 17.890625, 19.853515625, 21.81640625, 23.779296875, 25.7421875, 27.705078125, 29.66796875, 31.630859375, 33.59375, 35.556640625, 37.51953125, 39.482421875, 41.4453125, 43.408203125, 45.37109375, 47.333984375, 49.296875, 51.259765625, 53.22265625, 55.185546875, 57.1484375, 59.111328125, 61.07421875, 63.037109375, 65.0]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 29.0, 75.0, 136.0, 209.0, 229.0, 177.0, 86.0, 42.0, 17.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.923913955688477, -19.83822250366211, -18.752531051635742, -17.666839599609375, -16.581148147583008, -15.49545669555664, -14.40976619720459, -13.324074745178223, -12.238383293151855, -11.152691841125488, -10.067000389099121, -8.98130989074707, -7.895617961883545, -6.809926509857178, -5.724235534667969, -4.638544082641602, -3.5528526306152344, -2.467161178588867, -1.381469964981079, -0.295778751373291, 0.7899127006530762, 1.8756041526794434, 2.9612951278686523, 4.0469865798950195, 5.132678031921387, 6.218369483947754, 7.304060935974121, 8.389751434326172, 9.475442886352539, 10.561134338378906, 11.646825790405273, 12.73251724243164, 13.818206787109375, 14.903898239135742, 15.98958969116211, 17.075281143188477, 18.160972595214844, 19.24666404724121, 20.332355499267578, 21.418045043945312, 22.503738403320312, 23.58942985534668, 24.675121307373047, 25.760812759399414, 26.84650421142578, 27.93219566345215, 29.017887115478516, 30.10357666015625, 31.189268112182617, 32.274959564208984, 33.36064910888672, 34.44634246826172, 35.53203201293945, 36.61772537231445, 37.70341491699219, 38.78910827636719, 39.87479782104492, 40.960487365722656, 42.046180725097656, 43.13187026977539, 44.21756362915039, 45.303253173828125, 46.388946533203125, 47.47463607788086, 48.56032943725586]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 11.0, 5.0, 8.0, 15.0, 17.0, 22.0, 25.0, 23.0, 21.0, 23.0, 39.0, 24.0, 42.0, 45.0, 28.0, 37.0, 38.0, 45.0, 44.0, 45.0, 37.0, 39.0, 45.0, 26.0, 39.0, 45.0, 39.0, 22.0, 27.0, 23.0, 16.0, 18.0, 14.0, 14.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.4604606628418, -55.57683181762695, -53.693199157714844, -51.8095703125, -49.925941467285156, -48.04231262207031, -46.15868377685547, -44.27505111694336, -42.391422271728516, -40.50779342651367, -38.62416076660156, -36.74053192138672, -34.856903076171875, -32.97327423095703, -31.089643478393555, -29.206012725830078, -27.322383880615234, -25.43875503540039, -23.555124282836914, -21.671493530273438, -19.787864685058594, -17.90423583984375, -16.020605087280273, -14.136975288391113, -12.253345489501953, -10.369715690612793, -8.486085891723633, -6.602456092834473, -4.7188262939453125, -2.8351964950561523, -0.9515666961669922, 0.932063102722168, 2.8156890869140625, 4.699318885803223, 6.582948684692383, 8.466578483581543, 10.350208282470703, 12.233838081359863, 14.117467880249023, 16.0010986328125, 17.884727478027344, 19.768356323242188, 21.651987075805664, 23.53561782836914, 25.419246673583984, 27.302875518798828, 29.186506271362305, 31.07013702392578, 32.953765869140625, 34.83739471435547, 36.72102355957031, 38.60465621948242, 40.488285064697266, 42.37191390991211, 44.25554656982422, 46.13917541503906, 48.022804260253906, 49.90643310546875, 51.790061950683594, 53.6736946105957, 55.55732345581055, 57.44095230102539, 59.3245849609375, 61.208213806152344, 63.09184265136719]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 7.0, 7.0, 12.0, 10.0, 11.0, 12.0, 6.0, 17.0, 24.0, 20.0, 17.0, 27.0, 21.0, 31.0, 26.0, 40.0, 46.0, 46.0, 43.0, 45.0, 35.0, 41.0, 34.0, 49.0, 41.0, 32.0, 42.0, 28.0, 27.0, 24.0, 28.0, 24.0, 23.0, 15.0, 20.0, 15.0, 17.0, 9.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.41796875, -7.1837158203125, -6.949462890625, -6.7152099609375, -6.48095703125, -6.2467041015625, -6.012451171875, -5.7781982421875, -5.5439453125, -5.3096923828125, -5.075439453125, -4.8411865234375, -4.60693359375, -4.3726806640625, -4.138427734375, -3.9041748046875, -3.669921875, -3.4356689453125, -3.201416015625, -2.9671630859375, -2.73291015625, -2.4986572265625, -2.264404296875, -2.0301513671875, -1.7958984375, -1.5616455078125, -1.327392578125, -1.0931396484375, -0.85888671875, -0.6246337890625, -0.390380859375, -0.1561279296875, 0.078125, 0.3123779296875, 0.546630859375, 0.7808837890625, 1.01513671875, 1.2493896484375, 1.483642578125, 1.7178955078125, 1.9521484375, 2.1864013671875, 2.420654296875, 2.6549072265625, 2.88916015625, 3.1234130859375, 3.357666015625, 3.5919189453125, 3.826171875, 4.0604248046875, 4.294677734375, 4.5289306640625, 4.76318359375, 4.9974365234375, 5.231689453125, 5.4659423828125, 5.7001953125, 5.9344482421875, 6.168701171875, 6.4029541015625, 6.63720703125, 6.8714599609375, 7.105712890625, 7.3399658203125, 7.57421875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 1.0, 1.0, 7.0, 3.0, 10.0, 5.0, 13.0, 10.0, 11.0, 14.0, 19.0, 16.0, 23.0, 22.0, 34.0, 37.0, 69.0, 99.0, 168.0, 327.0, 1035.0, 4550.0, 100236.0, 3208958.0, 861805.0, 13676.0, 1885.0, 553.0, 249.0, 114.0, 64.0, 49.0, 35.0, 32.0, 27.0, 21.0, 16.0, 19.0, 13.0, 16.0, 9.0, 6.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.421875, -24.620849609375, -23.81982421875, -23.018798828125, -22.2177734375, -21.416748046875, -20.61572265625, -19.814697265625, -19.013671875, -18.212646484375, -17.41162109375, -16.610595703125, -15.8095703125, -15.008544921875, -14.20751953125, -13.406494140625, -12.60546875, -11.804443359375, -11.00341796875, -10.202392578125, -9.4013671875, -8.600341796875, -7.79931640625, -6.998291015625, -6.197265625, -5.396240234375, -4.59521484375, -3.794189453125, -2.9931640625, -2.192138671875, -1.39111328125, -0.590087890625, 0.2109375, 1.011962890625, 1.81298828125, 2.614013671875, 3.4150390625, 4.216064453125, 5.01708984375, 5.818115234375, 6.619140625, 7.420166015625, 8.22119140625, 9.022216796875, 9.8232421875, 10.624267578125, 11.42529296875, 12.226318359375, 13.02734375, 13.828369140625, 14.62939453125, 15.430419921875, 16.2314453125, 17.032470703125, 17.83349609375, 18.634521484375, 19.435546875, 20.236572265625, 21.03759765625, 21.838623046875, 22.6396484375, 23.440673828125, 24.24169921875, 25.042724609375, 25.84375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 15.0, 4.0, 20.0, 34.0, 39.0, 56.0, 96.0, 133.0, 196.0, 266.0, 367.0, 476.0, 547.0, 535.0, 365.0, 252.0, 195.0, 124.0, 109.0, 74.0, 51.0, 35.0, 26.0, 13.0, 15.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0859375, -14.5924072265625, -14.098876953125, -13.6053466796875, -13.11181640625, -12.6182861328125, -12.124755859375, -11.6312255859375, -11.1376953125, -10.6441650390625, -10.150634765625, -9.6571044921875, -9.16357421875, -8.6700439453125, -8.176513671875, -7.6829833984375, -7.189453125, -6.6959228515625, -6.202392578125, -5.7088623046875, -5.21533203125, -4.7218017578125, -4.228271484375, -3.7347412109375, -3.2412109375, -2.7476806640625, -2.254150390625, -1.7606201171875, -1.26708984375, -0.7735595703125, -0.280029296875, 0.2135009765625, 0.70703125, 1.2005615234375, 1.694091796875, 2.1876220703125, 2.68115234375, 3.1746826171875, 3.668212890625, 4.1617431640625, 4.6552734375, 5.1488037109375, 5.642333984375, 6.1358642578125, 6.62939453125, 7.1229248046875, 7.616455078125, 8.1099853515625, 8.603515625, 9.0970458984375, 9.590576171875, 10.0841064453125, 10.57763671875, 11.0711669921875, 11.564697265625, 12.0582275390625, 12.5517578125, 13.0452880859375, 13.538818359375, 14.0323486328125, 14.52587890625, 15.0194091796875, 15.512939453125, 16.0064697265625, 16.5]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 11.0, 13.0, 23.0, 25.0, 34.0, 47.0, 51.0, 87.0, 72.0, 119.0, 167.0, 188.0, 265.0, 431.0, 896.0, 9081.0, 4059769.0, 119608.0, 1560.0, 526.0, 330.0, 226.0, 180.0, 142.0, 97.0, 76.0, 57.0, 52.0, 33.0, 36.0, 16.0, 11.0, 15.0, 5.0, 10.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.75, -69.486328125, -67.22265625, -64.958984375, -62.6953125, -60.431640625, -58.16796875, -55.904296875, -53.640625, -51.376953125, -49.11328125, -46.849609375, -44.5859375, -42.322265625, -40.05859375, -37.794921875, -35.53125, -33.267578125, -31.00390625, -28.740234375, -26.4765625, -24.212890625, -21.94921875, -19.685546875, -17.421875, -15.158203125, -12.89453125, -10.630859375, -8.3671875, -6.103515625, -3.83984375, -1.576171875, 0.6875, 2.951171875, 5.21484375, 7.478515625, 9.7421875, 12.005859375, 14.26953125, 16.533203125, 18.796875, 21.060546875, 23.32421875, 25.587890625, 27.8515625, 30.115234375, 32.37890625, 34.642578125, 36.90625, 39.169921875, 41.43359375, 43.697265625, 45.9609375, 48.224609375, 50.48828125, 52.751953125, 55.015625, 57.279296875, 59.54296875, 61.806640625, 64.0703125, 66.333984375, 68.59765625, 70.861328125, 73.125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 15.0, 39.0, 110.0, 129.0, 173.0, 175.0, 165.0, 92.0, 62.0, 29.0, 10.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.24960708618164, -60.019920349121094, -57.79023361206055, -55.560546875, -53.33086013793945, -51.101173400878906, -48.871490478515625, -46.64179992675781, -44.41211700439453, -42.182430267333984, -39.95274353027344, -37.72305679321289, -35.493370056152344, -33.2636833190918, -31.033998489379883, -28.804311752319336, -26.574623107910156, -24.34493637084961, -22.115249633789062, -19.885562896728516, -17.65587615966797, -15.426190376281738, -13.196504592895508, -10.966817855834961, -8.737131118774414, -6.507444381713867, -4.2777581214904785, -2.04807186126709, 0.18161487579345703, 2.411301612854004, 4.640987396240234, 6.870674133300781, 9.100364685058594, 11.33005142211914, 13.559738159179688, 15.789423942565918, 18.01911163330078, 20.248798370361328, 22.478483200073242, 24.70816993713379, 26.937856674194336, 29.167543411254883, 31.39723014831543, 33.626914978027344, 35.85660171508789, 38.08628845214844, 40.315975189208984, 42.54566192626953, 44.77534866333008, 47.005035400390625, 49.23472213745117, 51.46440887451172, 53.694095611572266, 55.92378234863281, 58.153465270996094, 60.383155822753906, 62.61283874511719, 64.84252166748047, 67.07221221923828, 69.30189514160156, 71.53158569335938, 73.76126861572266, 75.99095916748047, 78.22064208984375, 80.45033264160156]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 6.0, 10.0, 13.0, 12.0, 14.0, 17.0, 19.0, 18.0, 27.0, 25.0, 19.0, 30.0, 43.0, 35.0, 47.0, 46.0, 41.0, 53.0, 32.0, 29.0, 39.0, 41.0, 31.0, 46.0, 38.0, 40.0, 32.0, 23.0, 22.0, 21.0, 17.0, 13.0, 13.0, 15.0, 8.0, 9.0, 10.0, 8.0, 2.0, 7.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-46.8111572265625, -45.45692443847656, -44.10269546508789, -42.74846267700195, -41.39423370361328, -40.040000915527344, -38.685768127441406, -37.33153533935547, -35.9773063659668, -34.62307357788086, -33.26884460449219, -31.91461181640625, -30.560380935668945, -29.20615005493164, -27.851917266845703, -26.4976863861084, -25.143455505371094, -23.78922462463379, -22.434993743896484, -21.080760955810547, -19.726530075073242, -18.372299194335938, -17.01806640625, -15.663835525512695, -14.30960464477539, -12.955373764038086, -11.601141929626465, -10.246910095214844, -8.892679214477539, -7.538447856903076, -6.184216499328613, -4.829984664916992, -3.4757537841796875, -2.1215224266052246, -0.7672910690307617, 0.5869402885437012, 1.941171646118164, 3.295403003692627, 4.64963436126709, 6.003866195678711, 7.358097076416016, 8.71232795715332, 10.066559791564941, 11.420791625976562, 12.775022506713867, 14.129253387451172, 15.483485221862793, 16.837717056274414, 18.19194793701172, 19.546178817749023, 20.900409698486328, 22.254642486572266, 23.60887336730957, 24.963104248046875, 26.317337036132812, 27.671567916870117, 29.025798797607422, 30.380029678344727, 31.73426055908203, 33.08849334716797, 34.442726135253906, 35.79695510864258, 37.151187896728516, 38.50541687011719, 39.859649658203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 6.0, 3.0, 15.0, 9.0, 11.0, 10.0, 13.0, 14.0, 21.0, 27.0, 29.0, 29.0, 43.0, 24.0, 28.0, 27.0, 31.0, 37.0, 39.0, 50.0, 44.0, 45.0, 35.0, 42.0, 45.0, 35.0, 29.0, 35.0, 40.0, 29.0, 19.0, 19.0, 17.0, 16.0, 16.0, 11.0, 17.0, 9.0, 7.0, 3.0, 5.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.15625, -6.927001953125, -6.69775390625, -6.468505859375, -6.2392578125, -6.010009765625, -5.78076171875, -5.551513671875, -5.322265625, -5.093017578125, -4.86376953125, -4.634521484375, -4.4052734375, -4.176025390625, -3.94677734375, -3.717529296875, -3.48828125, -3.259033203125, -3.02978515625, -2.800537109375, -2.5712890625, -2.342041015625, -2.11279296875, -1.883544921875, -1.654296875, -1.425048828125, -1.19580078125, -0.966552734375, -0.7373046875, -0.508056640625, -0.27880859375, -0.049560546875, 0.1796875, 0.408935546875, 0.63818359375, 0.867431640625, 1.0966796875, 1.325927734375, 1.55517578125, 1.784423828125, 2.013671875, 2.242919921875, 2.47216796875, 2.701416015625, 2.9306640625, 3.159912109375, 3.38916015625, 3.618408203125, 3.84765625, 4.076904296875, 4.30615234375, 4.535400390625, 4.7646484375, 4.993896484375, 5.22314453125, 5.452392578125, 5.681640625, 5.910888671875, 6.14013671875, 6.369384765625, 6.5986328125, 6.827880859375, 7.05712890625, 7.286376953125, 7.515625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 11.0, 7.0, 16.0, 30.0, 33.0, 66.0, 99.0, 127.0, 212.0, 269.0, 427.0, 604.0, 866.0, 1326.0, 1978.0, 2992.0, 4431.0, 6433.0, 9966.0, 15582.0, 24651.0, 39581.0, 67182.0, 122265.0, 322828.0, 193441.0, 91345.0, 52202.0, 31727.0, 19916.0, 12953.0, 8171.0, 5440.0, 3687.0, 2439.0, 1697.0, 1140.0, 770.0, 541.0, 350.0, 249.0, 166.0, 125.0, 75.0, 50.0, 40.0, 25.0, 13.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.6318359375, -1.5820465087890625, -1.532257080078125, -1.4824676513671875, -1.43267822265625, -1.3828887939453125, -1.333099365234375, -1.2833099365234375, -1.2335205078125, -1.1837310791015625, -1.133941650390625, -1.0841522216796875, -1.03436279296875, -0.9845733642578125, -0.934783935546875, -0.8849945068359375, -0.835205078125, -0.7854156494140625, -0.735626220703125, -0.6858367919921875, -0.63604736328125, -0.5862579345703125, -0.536468505859375, -0.4866790771484375, -0.4368896484375, -0.3871002197265625, -0.337310791015625, -0.2875213623046875, -0.23773193359375, -0.1879425048828125, -0.138153076171875, -0.0883636474609375, -0.03857421875, 0.0112152099609375, 0.061004638671875, 0.1107940673828125, 0.16058349609375, 0.2103729248046875, 0.260162353515625, 0.3099517822265625, 0.3597412109375, 0.4095306396484375, 0.459320068359375, 0.5091094970703125, 0.55889892578125, 0.6086883544921875, 0.658477783203125, 0.7082672119140625, 0.758056640625, 0.8078460693359375, 0.857635498046875, 0.9074249267578125, 0.95721435546875, 1.0070037841796875, 1.056793212890625, 1.1065826416015625, 1.1563720703125, 1.2061614990234375, 1.255950927734375, 1.3057403564453125, 1.35552978515625, 1.4053192138671875, 1.455108642578125, 1.5048980712890625, 1.5546875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 6.0, 4.0, 5.0, 9.0, 10.0, 8.0, 10.0, 16.0, 17.0, 15.0, 18.0, 24.0, 29.0, 33.0, 24.0, 27.0, 30.0, 39.0, 32.0, 36.0, 36.0, 42.0, 1063.0, 42.0, 44.0, 43.0, 40.0, 39.0, 25.0, 32.0, 29.0, 34.0, 33.0, 18.0, 16.0, 13.0, 24.0, 12.0, 6.0, 12.0, 6.0, 6.0, 8.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-4.48046875, -4.33837890625, -4.1962890625, -4.05419921875, -3.912109375, -3.77001953125, -3.6279296875, -3.48583984375, -3.34375, -3.20166015625, -3.0595703125, -2.91748046875, -2.775390625, -2.63330078125, -2.4912109375, -2.34912109375, -2.20703125, -2.06494140625, -1.9228515625, -1.78076171875, -1.638671875, -1.49658203125, -1.3544921875, -1.21240234375, -1.0703125, -0.92822265625, -0.7861328125, -0.64404296875, -0.501953125, -0.35986328125, -0.2177734375, -0.07568359375, 0.06640625, 0.20849609375, 0.3505859375, 0.49267578125, 0.634765625, 0.77685546875, 0.9189453125, 1.06103515625, 1.203125, 1.34521484375, 1.4873046875, 1.62939453125, 1.771484375, 1.91357421875, 2.0556640625, 2.19775390625, 2.33984375, 2.48193359375, 2.6240234375, 2.76611328125, 2.908203125, 3.05029296875, 3.1923828125, 3.33447265625, 3.4765625, 3.61865234375, 3.7607421875, 3.90283203125, 4.044921875, 4.18701171875, 4.3291015625, 4.47119140625, 4.61328125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 6.0, 12.0, 3.0, 16.0, 20.0, 26.0, 34.0, 51.0, 73.0, 86.0, 143.0, 218.0, 271.0, 382.0, 554.0, 815.0, 1191.0, 1771.0, 2528.0, 3699.0, 5606.0, 8169.0, 12254.0, 18058.0, 27325.0, 41674.0, 64779.0, 110444.0, 1294753.0, 218386.0, 103145.0, 61323.0, 39450.0, 26151.0, 17335.0, 11630.0, 7864.0, 5290.0, 3642.0, 2457.0, 1641.0, 1195.0, 809.0, 594.0, 383.0, 294.0, 182.0, 121.0, 98.0, 58.0, 42.0, 23.0, 26.0, 18.0, 10.0, 2.0, 12.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.375, -1.3319549560546875, -1.288909912109375, -1.2458648681640625, -1.20281982421875, -1.1597747802734375, -1.116729736328125, -1.0736846923828125, -1.0306396484375, -0.9875946044921875, -0.944549560546875, -0.9015045166015625, -0.85845947265625, -0.8154144287109375, -0.772369384765625, -0.7293243408203125, -0.686279296875, -0.6432342529296875, -0.600189208984375, -0.5571441650390625, -0.51409912109375, -0.4710540771484375, -0.428009033203125, -0.3849639892578125, -0.3419189453125, -0.2988739013671875, -0.255828857421875, -0.2127838134765625, -0.16973876953125, -0.1266937255859375, -0.083648681640625, -0.0406036376953125, 0.00244140625, 0.0454864501953125, 0.088531494140625, 0.1315765380859375, 0.17462158203125, 0.2176666259765625, 0.260711669921875, 0.3037567138671875, 0.3468017578125, 0.3898468017578125, 0.432891845703125, 0.4759368896484375, 0.51898193359375, 0.5620269775390625, 0.605072021484375, 0.6481170654296875, 0.691162109375, 0.7342071533203125, 0.777252197265625, 0.8202972412109375, 0.86334228515625, 0.9063873291015625, 0.949432373046875, 0.9924774169921875, 1.0355224609375, 1.0785675048828125, 1.121612548828125, 1.1646575927734375, 1.20770263671875, 1.2507476806640625, 1.293792724609375, 1.3368377685546875, 1.3798828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 14.0, 1.0, 10.0, 18.0, 14.0, 13.0, 20.0, 27.0, 26.0, 26.0, 41.0, 45.0, 33.0, 69.0, 65.0, 79.0, 80.0, 66.0, 52.0, 43.0, 37.0, 30.0, 28.0, 26.0, 15.0, 26.0, 15.0, 11.0, 16.0, 5.0, 8.0, 3.0, 9.0, 2.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0008997917175292969, -0.0008745715022087097, -0.0008493512868881226, -0.0008241310715675354, -0.0007989108562469482, -0.0007736906409263611, -0.0007484704256057739, -0.0007232502102851868, -0.0006980299949645996, -0.0006728097796440125, -0.0006475895643234253, -0.0006223693490028381, -0.000597149133682251, -0.0005719289183616638, -0.0005467087030410767, -0.0005214884877204895, -0.0004962682723999023, -0.0004710480570793152, -0.00044582784175872803, -0.00042060762643814087, -0.0003953874111175537, -0.00037016719579696655, -0.0003449469804763794, -0.00031972676515579224, -0.0002945065498352051, -0.0002692863345146179, -0.00024406611919403076, -0.0002188459038734436, -0.00019362568855285645, -0.0001684054732322693, -0.00014318525791168213, -0.00011796504259109497, -9.274482727050781e-05, -6.752461194992065e-05, -4.2304396629333496e-05, -1.7084181308746338e-05, 8.13603401184082e-06, 3.335624933242798e-05, 5.857646465301514e-05, 8.37966799736023e-05, 0.00010901689529418945, 0.0001342371106147766, 0.00015945732593536377, 0.00018467754125595093, 0.00020989775657653809, 0.00023511797189712524, 0.0002603381872177124, 0.00028555840253829956, 0.0003107786178588867, 0.0003359988331794739, 0.00036121904850006104, 0.0003864392638206482, 0.00041165947914123535, 0.0004368796944618225, 0.00046209990978240967, 0.0004873201251029968, 0.000512540340423584, 0.0005377605557441711, 0.0005629807710647583, 0.0005882009863853455, 0.0006134212017059326, 0.0006386414170265198, 0.0006638616323471069, 0.0006890818476676941, 0.0007143020629882812]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 4.0, 5.0, 9.0, 5.0, 10.0, 10.0, 19.0, 18.0, 27.0, 34.0, 44.0, 48.0, 77.0, 116.0, 192.0, 464.0, 2816.0, 1030827.0, 12486.0, 648.0, 230.0, 133.0, 80.0, 67.0, 44.0, 29.0, 20.0, 23.0, 16.0, 12.0, 7.0, 10.0, 8.0, 4.0, 3.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0182342529296875, -0.017574310302734375, -0.01691436767578125, -0.016254425048828125, -0.015594482421875, -0.014934539794921875, -0.01427459716796875, -0.013614654541015625, -0.0129547119140625, -0.012294769287109375, -0.01163482666015625, -0.010974884033203125, -0.01031494140625, -0.009654998779296875, -0.00899505615234375, -0.008335113525390625, -0.0076751708984375, -0.007015228271484375, -0.00635528564453125, -0.005695343017578125, -0.005035400390625, -0.004375457763671875, -0.00371551513671875, -0.003055572509765625, -0.0023956298828125, -0.001735687255859375, -0.00107574462890625, -0.000415802001953125, 0.000244140625, 0.000904083251953125, 0.00156402587890625, 0.002223968505859375, 0.0028839111328125, 0.003543853759765625, 0.00420379638671875, 0.004863739013671875, 0.005523681640625, 0.006183624267578125, 0.00684356689453125, 0.007503509521484375, 0.0081634521484375, 0.008823394775390625, 0.00948333740234375, 0.010143280029296875, 0.01080322265625, 0.011463165283203125, 0.01212310791015625, 0.012783050537109375, 0.0134429931640625, 0.014102935791015625, 0.01476287841796875, 0.015422821044921875, 0.016082763671875, 0.016742706298828125, 0.01740264892578125, 0.018062591552734375, 0.0187225341796875, 0.019382476806640625, 0.02004241943359375, 0.020702362060546875, 0.0213623046875, 0.022022247314453125, 0.02268218994140625, 0.023342132568359375, 0.0240020751953125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 7.0, 10.0, 23.0, 50.0, 90.0, 180.0, 200.0, 175.0, 133.0, 89.0, 29.0, 15.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024527430650778115, -0.0002203903568442911, -0.00019550640718080103, -0.00017062245751731098, -0.00014573850785382092, -0.00012085455819033086, -9.59706085268408e-05, -7.108665886335075e-05, -4.620270919986069e-05, -2.1318759536370635e-05, 3.565190127119422e-06, 2.844913979060948e-05, 5.3333089454099536e-05, 7.821703911758959e-05, 0.00010310098878107965, 0.0001279849384445697, 0.00015286888810805976, 0.00017775283777154982, 0.00020263678743503988, 0.00022752073709852993, 0.00025240468676202, 0.00027728863642551005, 0.0003021725860890001, 0.00032705653575249016, 0.0003519404854159802, 0.0003768244350794703, 0.00040170838474296033, 0.0004265923344064504, 0.00045147628406994045, 0.0004763602337334305, 0.000501244212500751, 0.0005261281039565802, 0.0005510121118277311, 0.0005758960614912212, 0.0006007800111547112, 0.0006256639608182013, 0.0006505479104816914, 0.0006754318601451814, 0.0007003158098086715, 0.0007251997594721615, 0.0007500837091356516, 0.0007749676587991416, 0.0007998516084626317, 0.0008247355581261218, 0.0008496195077896118, 0.0008745034574531019, 0.0008993874071165919, 0.000924271356780082, 0.000949155306443572, 0.0009740392561070621, 0.0009989232057705522, 0.0010238070972263813, 0.0010486911050975323, 0.0010735751129686832, 0.0010984590044245124, 0.0011233428958803415, 0.0011482269037514925, 0.0011731109116226435, 0.0011979948030784726, 0.0012228786945343018, 0.0012477627024054527, 0.0012726467102766037, 0.0012975306017324328, 0.001322414493188262, 0.001347298501059413]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 5.0, 11.0, 5.0, 10.0, 11.0, 15.0, 18.0, 20.0, 31.0, 33.0, 40.0, 28.0, 35.0, 45.0, 30.0, 54.0, 34.0, 49.0, 31.0, 39.0, 40.0, 47.0, 43.0, 41.0, 38.0, 39.0, 33.0, 22.0, 21.0, 11.0, 28.0, 19.0, 16.0, 8.0, 10.0, 9.0, 5.0, 12.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004807710647583008, -0.00046658050268888474, -0.0004523899406194687, -0.00043819937855005264, -0.0004240088164806366, -0.00040981825441122055, -0.0003956276923418045, -0.00038143713027238846, -0.0003672465682029724, -0.00035305600613355637, -0.0003388654440641403, -0.0003246748819947243, -0.00031048431992530823, -0.0002962937578558922, -0.00028210319578647614, -0.0002679126337170601, -0.00025372207164764404, -0.000239531509578228, -0.00022534094750881195, -0.0002111503854393959, -0.00019695982336997986, -0.0001827692613005638, -0.00016857869923114777, -0.00015438813716173172, -0.00014019757509231567, -0.00012600701302289963, -0.00011181645095348358, -9.762588888406754e-05, -8.343532681465149e-05, -6.924476474523544e-05, -5.50542026758194e-05, -4.086364060640335e-05, -2.6673078536987305e-05, -1.2482516467571259e-05, 1.7080456018447876e-06, 1.5898607671260834e-05, 3.008916974067688e-05, 4.4279731810092926e-05, 5.847029387950897e-05, 7.266085594892502e-05, 8.685141801834106e-05, 0.00010104198008775711, 0.00011523254215717316, 0.0001294231042265892, 0.00014361366629600525, 0.0001578042283654213, 0.00017199479043483734, 0.0001861853525042534, 0.00020037591457366943, 0.00021456647664308548, 0.00022875703871250153, 0.00024294760078191757, 0.0002571381628513336, 0.00027132872492074966, 0.0002855192869901657, 0.00029970984905958176, 0.0003139004111289978, 0.00032809097319841385, 0.0003422815352678299, 0.00035647209733724594, 0.000370662659406662, 0.00038485322147607803, 0.0003990437835454941, 0.0004132343456149101, 0.00042742490768432617]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 6.0, 3.0, 15.0, 9.0, 11.0, 10.0, 13.0, 14.0, 21.0, 27.0, 29.0, 29.0, 43.0, 24.0, 28.0, 27.0, 31.0, 37.0, 39.0, 50.0, 44.0, 45.0, 35.0, 42.0, 45.0, 35.0, 29.0, 35.0, 40.0, 29.0, 19.0, 19.0, 17.0, 16.0, 16.0, 11.0, 17.0, 9.0, 7.0, 3.0, 5.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.15625, -6.927001953125, -6.69775390625, -6.468505859375, -6.2392578125, -6.010009765625, -5.78076171875, -5.551513671875, -5.322265625, -5.093017578125, -4.86376953125, -4.634521484375, -4.4052734375, -4.176025390625, -3.94677734375, -3.717529296875, -3.48828125, -3.259033203125, -3.02978515625, -2.800537109375, -2.5712890625, -2.342041015625, -2.11279296875, -1.883544921875, -1.654296875, -1.425048828125, -1.19580078125, -0.966552734375, -0.7373046875, -0.508056640625, -0.27880859375, -0.049560546875, 0.1796875, 0.408935546875, 0.63818359375, 0.867431640625, 1.0966796875, 1.325927734375, 1.55517578125, 1.784423828125, 2.013671875, 2.242919921875, 2.47216796875, 2.701416015625, 2.9306640625, 3.159912109375, 3.38916015625, 3.618408203125, 3.84765625, 4.076904296875, 4.30615234375, 4.535400390625, 4.7646484375, 4.993896484375, 5.22314453125, 5.452392578125, 5.681640625, 5.910888671875, 6.14013671875, 6.369384765625, 6.5986328125, 6.827880859375, 7.05712890625, 7.286376953125, 7.515625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 4.0, 7.0, 11.0, 11.0, 11.0, 24.0, 30.0, 28.0, 34.0, 54.0, 68.0, 101.0, 132.0, 190.0, 280.0, 444.0, 924.0, 1900.0, 4904.0, 13576.0, 39009.0, 118472.0, 427218.0, 305843.0, 87958.0, 29590.0, 10325.0, 3779.0, 1571.0, 749.0, 362.0, 259.0, 184.0, 119.0, 103.0, 78.0, 46.0, 32.0, 23.0, 26.0, 18.0, 16.0, 11.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.24609375, -7.01873779296875, -6.7913818359375, -6.56402587890625, -6.336669921875, -6.10931396484375, -5.8819580078125, -5.65460205078125, -5.42724609375, -5.19989013671875, -4.9725341796875, -4.74517822265625, -4.517822265625, -4.29046630859375, -4.0631103515625, -3.83575439453125, -3.6083984375, -3.38104248046875, -3.1536865234375, -2.92633056640625, -2.698974609375, -2.47161865234375, -2.2442626953125, -2.01690673828125, -1.78955078125, -1.56219482421875, -1.3348388671875, -1.10748291015625, -0.880126953125, -0.65277099609375, -0.4254150390625, -0.19805908203125, 0.029296875, 0.25665283203125, 0.4840087890625, 0.71136474609375, 0.938720703125, 1.16607666015625, 1.3934326171875, 1.62078857421875, 1.84814453125, 2.07550048828125, 2.3028564453125, 2.53021240234375, 2.757568359375, 2.98492431640625, 3.2122802734375, 3.43963623046875, 3.6669921875, 3.89434814453125, 4.1217041015625, 4.34906005859375, 4.576416015625, 4.80377197265625, 5.0311279296875, 5.25848388671875, 5.48583984375, 5.71319580078125, 5.9405517578125, 6.16790771484375, 6.395263671875, 6.62261962890625, 6.8499755859375, 7.07733154296875, 7.3046875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 9.0, 14.0, 8.0, 10.0, 13.0, 9.0, 25.0, 18.0, 19.0, 34.0, 40.0, 44.0, 45.0, 60.0, 46.0, 84.0, 274.0, 1694.0, 153.0, 80.0, 55.0, 49.0, 44.0, 40.0, 30.0, 30.0, 29.0, 20.0, 12.0, 16.0, 11.0, 13.0, 7.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-31.359375, -30.518310546875, -29.67724609375, -28.836181640625, -27.9951171875, -27.154052734375, -26.31298828125, -25.471923828125, -24.630859375, -23.789794921875, -22.94873046875, -22.107666015625, -21.2666015625, -20.425537109375, -19.58447265625, -18.743408203125, -17.90234375, -17.061279296875, -16.22021484375, -15.379150390625, -14.5380859375, -13.697021484375, -12.85595703125, -12.014892578125, -11.173828125, -10.332763671875, -9.49169921875, -8.650634765625, -7.8095703125, -6.968505859375, -6.12744140625, -5.286376953125, -4.4453125, -3.604248046875, -2.76318359375, -1.922119140625, -1.0810546875, -0.239990234375, 0.60107421875, 1.442138671875, 2.283203125, 3.124267578125, 3.96533203125, 4.806396484375, 5.6474609375, 6.488525390625, 7.32958984375, 8.170654296875, 9.01171875, 9.852783203125, 10.69384765625, 11.534912109375, 12.3759765625, 13.217041015625, 14.05810546875, 14.899169921875, 15.740234375, 16.581298828125, 17.42236328125, 18.263427734375, 19.1044921875, 19.945556640625, 20.78662109375, 21.627685546875, 22.46875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 9.0, 4.0, 14.0, 8.0, 16.0, 20.0, 20.0, 33.0, 48.0, 66.0, 72.0, 99.0, 154.0, 230.0, 333.0, 729.0, 3717.0, 2959292.0, 177585.0, 1666.0, 556.0, 301.0, 210.0, 135.0, 100.0, 48.0, 51.0, 34.0, 31.0, 28.0, 21.0, 24.0, 9.0, 6.0, 5.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-62.875, -60.900390625, -58.92578125, -56.951171875, -54.9765625, -53.001953125, -51.02734375, -49.052734375, -47.078125, -45.103515625, -43.12890625, -41.154296875, -39.1796875, -37.205078125, -35.23046875, -33.255859375, -31.28125, -29.306640625, -27.33203125, -25.357421875, -23.3828125, -21.408203125, -19.43359375, -17.458984375, -15.484375, -13.509765625, -11.53515625, -9.560546875, -7.5859375, -5.611328125, -3.63671875, -1.662109375, 0.3125, 2.287109375, 4.26171875, 6.236328125, 8.2109375, 10.185546875, 12.16015625, 14.134765625, 16.109375, 18.083984375, 20.05859375, 22.033203125, 24.0078125, 25.982421875, 27.95703125, 29.931640625, 31.90625, 33.880859375, 35.85546875, 37.830078125, 39.8046875, 41.779296875, 43.75390625, 45.728515625, 47.703125, 49.677734375, 51.65234375, 53.626953125, 55.6015625, 57.576171875, 59.55078125, 61.525390625, 63.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 274.0, 672.0, 60.0], "bins": [-281.54827880859375, -277.02667236328125, -272.5050354003906, -267.9834289550781, -263.4617919921875, -258.940185546875, -254.41856384277344, -249.89694213867188, -245.37533569335938, -240.8537139892578, -236.33209228515625, -231.81048583984375, -227.2888641357422, -222.76724243164062, -218.24562072753906, -213.7239990234375, -209.202392578125, -204.68077087402344, -200.15914916992188, -195.63754272460938, -191.1159210205078, -186.59429931640625, -182.0726776123047, -177.55105590820312, -173.02943420410156, -168.5078125, -163.98619079589844, -159.46458435058594, -154.94296264648438, -150.4213409423828, -145.89971923828125, -141.37811279296875, -136.85647583007812, -132.33485412597656, -127.81324005126953, -123.29161834716797, -118.77000427246094, -114.24838256835938, -109.72676086425781, -105.20514678955078, -100.68353271484375, -96.16191101074219, -91.64029693603516, -87.1186752319336, -82.59706115722656, -78.075439453125, -73.55381774902344, -69.0322036743164, -64.51058959960938, -59.98897171020508, -55.46735382080078, -50.94573211669922, -46.42411804199219, -41.902496337890625, -37.38087844848633, -32.85926055908203, -28.337642669677734, -23.816024780273438, -19.29440689086914, -14.772787094116211, -10.251169204711914, -5.729551315307617, -1.2079315185546875, 3.3136863708496094, 7.8353047370910645]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 14.0, 8.0, 6.0, 11.0, 11.0, 16.0, 17.0, 18.0, 26.0, 21.0, 35.0, 33.0, 35.0, 42.0, 35.0, 35.0, 34.0, 42.0, 52.0, 42.0, 52.0, 36.0, 45.0, 37.0, 34.0, 41.0, 31.0, 27.0, 34.0, 27.0, 14.0, 14.0, 20.0, 12.0, 10.0, 8.0, 7.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.65973663330078, -60.69182205200195, -58.72391128540039, -56.75599670410156, -54.788082122802734, -52.82017135620117, -50.852256774902344, -48.88434600830078, -46.91643142700195, -44.948516845703125, -42.98060607910156, -41.012691497802734, -39.044776916503906, -37.076866149902344, -35.108951568603516, -33.14103698730469, -31.173124313354492, -29.205211639404297, -27.23729705810547, -25.269384384155273, -23.301471710205078, -21.33355712890625, -19.365644454956055, -17.39773178100586, -15.429818153381348, -13.461904525756836, -11.49399185180664, -9.526078224182129, -7.558165073394775, -5.590251922607422, -3.62233829498291, -1.6544256210327148, 0.3134880065917969, 2.2814011573791504, 4.249314308166504, 6.217227935791016, 8.185140609741211, 10.153054237365723, 12.120967864990234, 14.08888053894043, 16.056793212890625, 18.02470588684082, 19.99262046813965, 21.960533142089844, 23.92844581604004, 25.896358489990234, 27.864273071289062, 29.832185745239258, 31.800100326538086, 33.76801300048828, 35.73592758178711, 37.70384216308594, 39.6717529296875, 41.63966751098633, 43.607582092285156, 45.57549285888672, 47.54340744018555, 49.511322021484375, 51.47923278808594, 53.447147369384766, 55.415061950683594, 57.382972717285156, 59.350887298583984, 61.31880187988281, 63.286712646484375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 5.0, 7.0, 9.0, 7.0, 14.0, 9.0, 9.0, 15.0, 20.0, 17.0, 27.0, 25.0, 29.0, 37.0, 28.0, 40.0, 26.0, 28.0, 52.0, 42.0, 40.0, 37.0, 43.0, 29.0, 48.0, 39.0, 43.0, 35.0, 29.0, 28.0, 32.0, 24.0, 19.0, 20.0, 17.0, 8.0, 8.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.47265625, -7.23291015625, -6.9931640625, -6.75341796875, -6.513671875, -6.27392578125, -6.0341796875, -5.79443359375, -5.5546875, -5.31494140625, -5.0751953125, -4.83544921875, -4.595703125, -4.35595703125, -4.1162109375, -3.87646484375, -3.63671875, -3.39697265625, -3.1572265625, -2.91748046875, -2.677734375, -2.43798828125, -2.1982421875, -1.95849609375, -1.71875, -1.47900390625, -1.2392578125, -0.99951171875, -0.759765625, -0.52001953125, -0.2802734375, -0.04052734375, 0.19921875, 0.43896484375, 0.6787109375, 0.91845703125, 1.158203125, 1.39794921875, 1.6376953125, 1.87744140625, 2.1171875, 2.35693359375, 2.5966796875, 2.83642578125, 3.076171875, 3.31591796875, 3.5556640625, 3.79541015625, 4.03515625, 4.27490234375, 4.5146484375, 4.75439453125, 4.994140625, 5.23388671875, 5.4736328125, 5.71337890625, 5.953125, 6.19287109375, 6.4326171875, 6.67236328125, 6.912109375, 7.15185546875, 7.3916015625, 7.63134765625, 7.87109375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 9.0, 6.0, 17.0, 10.0, 9.0, 22.0, 29.0, 27.0, 38.0, 58.0, 65.0, 82.0, 124.0, 210.0, 348.0, 914.0, 4721.0, 112897.0, 3310192.0, 748133.0, 13407.0, 1608.0, 512.0, 247.0, 154.0, 94.0, 61.0, 69.0, 34.0, 35.0, 34.0, 18.0, 18.0, 14.0, 8.0, 13.0, 8.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.4375, -25.603759765625, -24.77001953125, -23.936279296875, -23.1025390625, -22.268798828125, -21.43505859375, -20.601318359375, -19.767578125, -18.933837890625, -18.10009765625, -17.266357421875, -16.4326171875, -15.598876953125, -14.76513671875, -13.931396484375, -13.09765625, -12.263916015625, -11.43017578125, -10.596435546875, -9.7626953125, -8.928955078125, -8.09521484375, -7.261474609375, -6.427734375, -5.593994140625, -4.76025390625, -3.926513671875, -3.0927734375, -2.259033203125, -1.42529296875, -0.591552734375, 0.2421875, 1.075927734375, 1.90966796875, 2.743408203125, 3.5771484375, 4.410888671875, 5.24462890625, 6.078369140625, 6.912109375, 7.745849609375, 8.57958984375, 9.413330078125, 10.2470703125, 11.080810546875, 11.91455078125, 12.748291015625, 13.58203125, 14.415771484375, 15.24951171875, 16.083251953125, 16.9169921875, 17.750732421875, 18.58447265625, 19.418212890625, 20.251953125, 21.085693359375, 21.91943359375, 22.753173828125, 23.5869140625, 24.420654296875, 25.25439453125, 26.088134765625, 26.921875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 6.0, 10.0, 15.0, 24.0, 18.0, 25.0, 39.0, 55.0, 66.0, 76.0, 114.0, 151.0, 215.0, 279.0, 349.0, 433.0, 468.0, 408.0, 332.0, 244.0, 184.0, 142.0, 89.0, 74.0, 69.0, 52.0, 47.0, 21.0, 22.0, 16.0, 8.0, 6.0, 7.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.8671875, -15.453857421875, -15.04052734375, -14.627197265625, -14.2138671875, -13.800537109375, -13.38720703125, -12.973876953125, -12.560546875, -12.147216796875, -11.73388671875, -11.320556640625, -10.9072265625, -10.493896484375, -10.08056640625, -9.667236328125, -9.25390625, -8.840576171875, -8.42724609375, -8.013916015625, -7.6005859375, -7.187255859375, -6.77392578125, -6.360595703125, -5.947265625, -5.533935546875, -5.12060546875, -4.707275390625, -4.2939453125, -3.880615234375, -3.46728515625, -3.053955078125, -2.640625, -2.227294921875, -1.81396484375, -1.400634765625, -0.9873046875, -0.573974609375, -0.16064453125, 0.252685546875, 0.666015625, 1.079345703125, 1.49267578125, 1.906005859375, 2.3193359375, 2.732666015625, 3.14599609375, 3.559326171875, 3.97265625, 4.385986328125, 4.79931640625, 5.212646484375, 5.6259765625, 6.039306640625, 6.45263671875, 6.865966796875, 7.279296875, 7.692626953125, 8.10595703125, 8.519287109375, 8.9326171875, 9.345947265625, 9.75927734375, 10.172607421875, 10.5859375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 7.0, 9.0, 12.0, 11.0, 17.0, 25.0, 39.0, 37.0, 51.0, 70.0, 77.0, 90.0, 126.0, 147.0, 173.0, 237.0, 301.0, 543.0, 2456.0, 531587.0, 3649465.0, 6449.0, 752.0, 376.0, 262.0, 205.0, 147.0, 128.0, 87.0, 85.0, 66.0, 63.0, 55.0, 34.0, 25.0, 19.0, 11.0, 11.0, 8.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.1875, -64.958984375, -62.73046875, -60.501953125, -58.2734375, -56.044921875, -53.81640625, -51.587890625, -49.359375, -47.130859375, -44.90234375, -42.673828125, -40.4453125, -38.216796875, -35.98828125, -33.759765625, -31.53125, -29.302734375, -27.07421875, -24.845703125, -22.6171875, -20.388671875, -18.16015625, -15.931640625, -13.703125, -11.474609375, -9.24609375, -7.017578125, -4.7890625, -2.560546875, -0.33203125, 1.896484375, 4.125, 6.353515625, 8.58203125, 10.810546875, 13.0390625, 15.267578125, 17.49609375, 19.724609375, 21.953125, 24.181640625, 26.41015625, 28.638671875, 30.8671875, 33.095703125, 35.32421875, 37.552734375, 39.78125, 42.009765625, 44.23828125, 46.466796875, 48.6953125, 50.923828125, 53.15234375, 55.380859375, 57.609375, 59.837890625, 62.06640625, 64.294921875, 66.5234375, 68.751953125, 70.98046875, 73.208984375, 75.4375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 21.0, 143.0, 342.0, 364.0, 126.0, 14.0, 2.0, 3.0, 2.0], "bins": [-314.69049072265625, -309.2684631347656, -303.8464660644531, -298.4244384765625, -293.0024108886719, -287.5804138183594, -282.15838623046875, -276.7363586425781, -271.3143615722656, -265.892333984375, -260.4703369140625, -255.04830932617188, -249.6262969970703, -244.20428466796875, -238.78225708007812, -233.36024475097656, -227.93821716308594, -222.51620483398438, -217.09417724609375, -211.6721649169922, -206.25015258789062, -200.828125, -195.40611267089844, -189.98410034179688, -184.56207275390625, -179.1400604248047, -173.71803283691406, -168.2960205078125, -162.87400817871094, -157.45199584960938, -152.02996826171875, -146.6079559326172, -141.18594360351562, -135.76393127441406, -130.34190368652344, -124.91989135742188, -119.49787902832031, -114.07585906982422, -108.65383911132812, -103.23182678222656, -97.80979919433594, -92.38777923583984, -86.96576690673828, -81.54374694824219, -76.12173461914062, -70.69971466064453, -65.27769470214844, -59.85567855834961, -54.43366622924805, -49.01165008544922, -43.589630126953125, -38.1676139831543, -32.74559783935547, -27.32358169555664, -21.901561737060547, -16.47954559326172, -11.05752944946289, -5.635512351989746, -0.21349525451660156, 5.208522796630859, 10.630538940429688, 16.052555084228516, 21.47457504272461, 26.896591186523438, 32.318607330322266]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 6.0, 4.0, 8.0, 12.0, 8.0, 18.0, 8.0, 11.0, 23.0, 26.0, 21.0, 28.0, 19.0, 15.0, 18.0, 29.0, 29.0, 31.0, 27.0, 40.0, 38.0, 29.0, 44.0, 27.0, 32.0, 32.0, 40.0, 24.0, 34.0, 21.0, 33.0, 25.0, 25.0, 20.0, 29.0, 22.0, 31.0, 13.0, 18.0, 12.0, 13.0, 8.0, 8.0, 7.0, 5.0, 3.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-35.452880859375, -34.26809310913086, -33.083309173583984, -31.898521423339844, -30.713735580444336, -29.528949737548828, -28.344161987304688, -27.15937614440918, -25.974590301513672, -24.789804458618164, -23.605018615722656, -22.420230865478516, -21.235445022583008, -20.0506591796875, -18.86587142944336, -17.68108558654785, -16.496299743652344, -15.311513900756836, -14.126727104187012, -12.941940307617188, -11.75715446472168, -10.572368621826172, -9.387581825256348, -8.202795028686523, -7.018009185791016, -5.83322286605835, -4.648436546325684, -3.4636502265930176, -2.2788639068603516, -1.0940775871276855, 0.09070873260498047, 1.2754955291748047, 2.4602813720703125, 3.6450676918029785, 4.8298540115356445, 6.0146403312683105, 7.199426651000977, 8.384212493896484, 9.568999290466309, 10.753786087036133, 11.93857192993164, 13.123357772827148, 14.308144569396973, 15.492931365966797, 16.677717208862305, 17.862503051757812, 19.047290802001953, 20.23207664489746, 21.41686248779297, 22.601648330688477, 23.786434173583984, 24.971221923828125, 26.156007766723633, 27.34079360961914, 28.52558135986328, 29.71036720275879, 30.895153045654297, 32.07994079589844, 33.26472473144531, 34.44951248168945, 35.634300231933594, 36.81908416748047, 38.00387191772461, 39.18865966796875, 40.373443603515625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 7.0, 8.0, 12.0, 10.0, 11.0, 22.0, 15.0, 22.0, 30.0, 30.0, 22.0, 25.0, 19.0, 41.0, 41.0, 31.0, 45.0, 54.0, 36.0, 26.0, 41.0, 49.0, 32.0, 37.0, 39.0, 34.0, 25.0, 20.0, 32.0, 35.0, 19.0, 23.0, 18.0, 20.0, 10.0, 6.0, 10.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.64453125, -7.4073486328125, -7.170166015625, -6.9329833984375, -6.69580078125, -6.4586181640625, -6.221435546875, -5.9842529296875, -5.7470703125, -5.5098876953125, -5.272705078125, -5.0355224609375, -4.79833984375, -4.5611572265625, -4.323974609375, -4.0867919921875, -3.849609375, -3.6124267578125, -3.375244140625, -3.1380615234375, -2.90087890625, -2.6636962890625, -2.426513671875, -2.1893310546875, -1.9521484375, -1.7149658203125, -1.477783203125, -1.2406005859375, -1.00341796875, -0.7662353515625, -0.529052734375, -0.2918701171875, -0.0546875, 0.1824951171875, 0.419677734375, 0.6568603515625, 0.89404296875, 1.1312255859375, 1.368408203125, 1.6055908203125, 1.8427734375, 2.0799560546875, 2.317138671875, 2.5543212890625, 2.79150390625, 3.0286865234375, 3.265869140625, 3.5030517578125, 3.740234375, 3.9774169921875, 4.214599609375, 4.4517822265625, 4.68896484375, 4.9261474609375, 5.163330078125, 5.4005126953125, 5.6376953125, 5.8748779296875, 6.112060546875, 6.3492431640625, 6.58642578125, 6.8236083984375, 7.060791015625, 7.2979736328125, 7.53515625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 11.0, 14.0, 24.0, 32.0, 57.0, 64.0, 111.0, 149.0, 229.0, 318.0, 475.0, 693.0, 1020.0, 1468.0, 2097.0, 3138.0, 4667.0, 6866.0, 10354.0, 15394.0, 23338.0, 36235.0, 57357.0, 98439.0, 216195.0, 272665.0, 114483.0, 64894.0, 40103.0, 25878.0, 16787.0, 11439.0, 7521.0, 5117.0, 3456.0, 2312.0, 1633.0, 1087.0, 777.0, 506.0, 368.0, 228.0, 180.0, 124.0, 87.0, 58.0, 29.0, 29.0, 14.0, 12.0, 11.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.578125, -1.52899169921875, -1.4798583984375, -1.43072509765625, -1.381591796875, -1.33245849609375, -1.2833251953125, -1.23419189453125, -1.18505859375, -1.13592529296875, -1.0867919921875, -1.03765869140625, -0.988525390625, -0.93939208984375, -0.8902587890625, -0.84112548828125, -0.7919921875, -0.74285888671875, -0.6937255859375, -0.64459228515625, -0.595458984375, -0.54632568359375, -0.4971923828125, -0.44805908203125, -0.39892578125, -0.34979248046875, -0.3006591796875, -0.25152587890625, -0.202392578125, -0.15325927734375, -0.1041259765625, -0.05499267578125, -0.005859375, 0.04327392578125, 0.0924072265625, 0.14154052734375, 0.190673828125, 0.23980712890625, 0.2889404296875, 0.33807373046875, 0.38720703125, 0.43634033203125, 0.4854736328125, 0.53460693359375, 0.583740234375, 0.63287353515625, 0.6820068359375, 0.73114013671875, 0.7802734375, 0.82940673828125, 0.8785400390625, 0.92767333984375, 0.976806640625, 1.02593994140625, 1.0750732421875, 1.12420654296875, 1.17333984375, 1.22247314453125, 1.2716064453125, 1.32073974609375, 1.369873046875, 1.41900634765625, 1.4681396484375, 1.51727294921875, 1.56640625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 13.0, 9.0, 10.0, 10.0, 12.0, 21.0, 8.0, 22.0, 27.0, 27.0, 27.0, 31.0, 39.0, 26.0, 35.0, 38.0, 45.0, 40.0, 45.0, 1065.0, 37.0, 43.0, 34.0, 42.0, 41.0, 25.0, 33.0, 26.0, 24.0, 26.0, 22.0, 24.0, 20.0, 11.0, 15.0, 10.0, 6.0, 11.0, 6.0, 10.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.94921875, -4.79888916015625, -4.6485595703125, -4.49822998046875, -4.347900390625, -4.19757080078125, -4.0472412109375, -3.89691162109375, -3.74658203125, -3.59625244140625, -3.4459228515625, -3.29559326171875, -3.145263671875, -2.99493408203125, -2.8446044921875, -2.69427490234375, -2.5439453125, -2.39361572265625, -2.2432861328125, -2.09295654296875, -1.942626953125, -1.79229736328125, -1.6419677734375, -1.49163818359375, -1.34130859375, -1.19097900390625, -1.0406494140625, -0.89031982421875, -0.739990234375, -0.58966064453125, -0.4393310546875, -0.28900146484375, -0.138671875, 0.01165771484375, 0.1619873046875, 0.31231689453125, 0.462646484375, 0.61297607421875, 0.7633056640625, 0.91363525390625, 1.06396484375, 1.21429443359375, 1.3646240234375, 1.51495361328125, 1.665283203125, 1.81561279296875, 1.9659423828125, 2.11627197265625, 2.2666015625, 2.41693115234375, 2.5672607421875, 2.71759033203125, 2.867919921875, 3.01824951171875, 3.1685791015625, 3.31890869140625, 3.46923828125, 3.61956787109375, 3.7698974609375, 3.92022705078125, 4.070556640625, 4.22088623046875, 4.3712158203125, 4.52154541015625, 4.671875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 15.0, 9.0, 14.0, 32.0, 29.0, 62.0, 99.0, 117.0, 196.0, 292.0, 419.0, 590.0, 866.0, 1311.0, 2067.0, 3034.0, 4636.0, 7005.0, 10601.0, 15898.0, 24231.0, 36903.0, 58296.0, 98511.0, 199558.0, 1320524.0, 118983.0, 68040.0, 42510.0, 27936.0, 18302.0, 12115.0, 7992.0, 5398.0, 3536.0, 2364.0, 1554.0, 1028.0, 658.0, 488.0, 307.0, 201.0, 139.0, 95.0, 58.0, 36.0, 30.0, 20.0, 9.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.4853515625, -1.4391632080078125, -1.392974853515625, -1.3467864990234375, -1.30059814453125, -1.2544097900390625, -1.208221435546875, -1.1620330810546875, -1.1158447265625, -1.0696563720703125, -1.023468017578125, -0.9772796630859375, -0.93109130859375, -0.8849029541015625, -0.838714599609375, -0.7925262451171875, -0.746337890625, -0.7001495361328125, -0.653961181640625, -0.6077728271484375, -0.56158447265625, -0.5153961181640625, -0.469207763671875, -0.4230194091796875, -0.3768310546875, -0.3306427001953125, -0.284454345703125, -0.2382659912109375, -0.19207763671875, -0.1458892822265625, -0.099700927734375, -0.0535125732421875, -0.00732421875, 0.0388641357421875, 0.085052490234375, 0.1312408447265625, 0.17742919921875, 0.2236175537109375, 0.269805908203125, 0.3159942626953125, 0.3621826171875, 0.4083709716796875, 0.454559326171875, 0.5007476806640625, 0.54693603515625, 0.5931243896484375, 0.639312744140625, 0.6855010986328125, 0.731689453125, 0.7778778076171875, 0.824066162109375, 0.8702545166015625, 0.91644287109375, 0.9626312255859375, 1.008819580078125, 1.0550079345703125, 1.1011962890625, 1.1473846435546875, 1.193572998046875, 1.2397613525390625, 1.28594970703125, 1.3321380615234375, 1.378326416015625, 1.4245147705078125, 1.470703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 9.0, 7.0, 17.0, 17.0, 16.0, 22.0, 39.0, 69.0, 102.0, 132.0, 153.0, 125.0, 88.0, 47.0, 28.0, 25.0, 17.0, 13.0, 7.0, 7.0, 8.0, 3.0, 8.0, 3.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0013208389282226562, -0.0012786388397216797, -0.0012364387512207031, -0.0011942386627197266, -0.00115203857421875, -0.0011098384857177734, -0.0010676383972167969, -0.0010254383087158203, -0.0009832382202148438, -0.0009410381317138672, -0.0008988380432128906, -0.0008566379547119141, -0.0008144378662109375, -0.0007722377777099609, -0.0007300376892089844, -0.0006878376007080078, -0.0006456375122070312, -0.0006034374237060547, -0.0005612373352050781, -0.0005190372467041016, -0.000476837158203125, -0.00043463706970214844, -0.0003924369812011719, -0.0003502368927001953, -0.00030803680419921875, -0.0002658367156982422, -0.00022363662719726562, -0.00018143653869628906, -0.0001392364501953125, -9.703636169433594e-05, -5.4836273193359375e-05, -1.2636184692382812e-05, 2.956390380859375e-05, 7.176399230957031e-05, 0.00011396408081054688, 0.00015616416931152344, 0.0001983642578125, 0.00024056434631347656, 0.0002827644348144531, 0.0003249645233154297, 0.00036716461181640625, 0.0004093647003173828, 0.0004515647888183594, 0.0004937648773193359, 0.0005359649658203125, 0.0005781650543212891, 0.0006203651428222656, 0.0006625652313232422, 0.0007047653198242188, 0.0007469654083251953, 0.0007891654968261719, 0.0008313655853271484, 0.000873565673828125, 0.0009157657623291016, 0.0009579658508300781, 0.0010001659393310547, 0.0010423660278320312, 0.0010845661163330078, 0.0011267662048339844, 0.001168966293334961, 0.0012111663818359375, 0.001253366470336914, 0.0012955665588378906, 0.0013377666473388672, 0.0013799667358398438]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 1.0, 7.0, 5.0, 7.0, 6.0, 14.0, 11.0, 13.0, 22.0, 37.0, 63.0, 119.0, 224.0, 686.0, 562549.0, 483569.0, 657.0, 254.0, 112.0, 52.0, 25.0, 26.0, 16.0, 20.0, 12.0, 6.0, 6.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03338623046875, -0.03237438201904297, -0.03136253356933594, -0.030350685119628906, -0.029338836669921875, -0.028326988220214844, -0.027315139770507812, -0.02630329132080078, -0.02529144287109375, -0.02427959442138672, -0.023267745971679688, -0.022255897521972656, -0.021244049072265625, -0.020232200622558594, -0.019220352172851562, -0.01820850372314453, -0.0171966552734375, -0.01618480682373047, -0.015172958374023438, -0.014161109924316406, -0.013149261474609375, -0.012137413024902344, -0.011125564575195312, -0.010113716125488281, -0.00910186767578125, -0.008090019226074219, -0.0070781707763671875, -0.006066322326660156, -0.005054473876953125, -0.004042625427246094, -0.0030307769775390625, -0.0020189285278320312, -0.001007080078125, 4.76837158203125e-06, 0.0010166168212890625, 0.0020284652709960938, 0.003040313720703125, 0.004052162170410156, 0.0050640106201171875, 0.006075859069824219, 0.00708770751953125, 0.008099555969238281, 0.009111404418945312, 0.010123252868652344, 0.011135101318359375, 0.012146949768066406, 0.013158798217773438, 0.014170646667480469, 0.0151824951171875, 0.01619434356689453, 0.017206192016601562, 0.018218040466308594, 0.019229888916015625, 0.020241737365722656, 0.021253585815429688, 0.02226543426513672, 0.02327728271484375, 0.02428913116455078, 0.025300979614257812, 0.026312828063964844, 0.027324676513671875, 0.028336524963378906, 0.029348373413085938, 0.03036022186279297, 0.0313720703125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 14.0, 63.0, 101.0, 185.0, 231.0, 168.0, 136.0, 59.0, 32.0, 11.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014141122810542583, -0.0013850296381860971, -0.0013559471117332578, -0.0013268644688650966, -0.0012977818259969354, -0.001268699299544096, -0.0012396166566759348, -0.0012105340138077736, -0.0011814514873549342, -0.001152368844486773, -0.0011232863180339336, -0.0010942036751657724, -0.0010651210322976112, -0.0010360385058447719, -0.0010069558629766107, -0.0009778733365237713, -0.0009487906936556101, -0.0009197081089951098, -0.0008906254661269486, -0.0008615428814664483, -0.000832460296805948, -0.0008033777121454477, -0.0007742950692772865, -0.0007452124846167862, -0.000716129841748625, -0.0006870472570881248, -0.0006579646142199636, -0.0006288820295594633, -0.000599799444898963, -0.0005707168020308018, -0.0005416342173703015, -0.0005125516327098012, -0.00048346901894547045, -0.0004543864051811397, -0.0004253038205206394, -0.0003962212067563087, -0.0003671386220958084, -0.00033805600833147764, -0.00030897342367097735, -0.0002798908099066466, -0.00025080819614231586, -0.00022172559692990035, -0.00019264299771748483, -0.0001635603839531541, -0.0001344777992926538, -0.00010539518552832305, -7.631258631590754e-05, -4.722998710349202e-05, -1.8147402442991734e-05, 1.0935198588413186e-05, 4.0017799619818106e-05, 6.910040247021243e-05, 9.818300168262795e-05, 0.00012726560817100108, 0.0001563482073834166, 0.0001854308065958321, 0.00021451340580824763, 0.00024359600502066314, 0.0002726786187849939, 0.0003017612034454942, 0.0003308438172098249, 0.00035992643097415566, 0.00038900901563465595, 0.00041809160029515624, 0.000447174214059487]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 8.0, 9.0, 4.0, 10.0, 8.0, 17.0, 16.0, 15.0, 20.0, 26.0, 26.0, 38.0, 32.0, 41.0, 33.0, 36.0, 39.0, 40.0, 45.0, 54.0, 39.0, 47.0, 41.0, 43.0, 38.0, 29.0, 37.0, 41.0, 28.0, 23.0, 19.0, 14.0, 17.0, 16.0, 12.0, 11.0, 6.0, 9.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0006125569343566895, -0.000595402903854847, -0.0005782488733530045, -0.000561094842851162, -0.0005439408123493195, -0.000526786781847477, -0.0005096327513456345, -0.000492478720843792, -0.00047532469034194946, -0.00045817065984010696, -0.00044101662933826447, -0.00042386259883642197, -0.00040670856833457947, -0.00038955453783273697, -0.00037240050733089447, -0.00035524647682905197, -0.00033809244632720947, -0.000320938415825367, -0.0003037843853235245, -0.000286630354821682, -0.0002694763243198395, -0.000252322293817997, -0.00023516826331615448, -0.00021801423281431198, -0.00020086020231246948, -0.00018370617181062698, -0.00016655214130878448, -0.00014939811080694199, -0.0001322440803050995, -0.00011509004980325699, -9.793601930141449e-05, -8.078198879957199e-05, -6.362795829772949e-05, -4.6473927795886993e-05, -2.9319897294044495e-05, -1.2165866792201996e-05, 4.988163709640503e-06, 2.2142194211483002e-05, 3.92962247133255e-05, 5.6450255215168e-05, 7.36042857170105e-05, 9.0758316218853e-05, 0.0001079123467206955, 0.000125066377222538, 0.0001422204077243805, 0.000159374438226223, 0.0001765284687280655, 0.000193682499229908, 0.0002108365297317505, 0.000227990560233593, 0.0002451445907354355, 0.000262298621237278, 0.0002794526517391205, 0.000296606682240963, 0.0003137607127428055, 0.000330914743244648, 0.0003480687737464905, 0.000365222804248333, 0.0003823768347501755, 0.000399530865252018, 0.0004166848957538605, 0.00043383892625570297, 0.00045099295675754547, 0.00046814698725938797, 0.00048530101776123047]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 7.0, 8.0, 12.0, 10.0, 11.0, 22.0, 15.0, 22.0, 30.0, 30.0, 22.0, 25.0, 19.0, 41.0, 41.0, 31.0, 45.0, 54.0, 37.0, 25.0, 41.0, 49.0, 32.0, 37.0, 39.0, 34.0, 25.0, 20.0, 32.0, 35.0, 19.0, 23.0, 18.0, 20.0, 10.0, 6.0, 10.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.64453125, -7.4073486328125, -7.170166015625, -6.9329833984375, -6.69580078125, -6.4586181640625, -6.221435546875, -5.9842529296875, -5.7470703125, -5.5098876953125, -5.272705078125, -5.0355224609375, -4.79833984375, -4.5611572265625, -4.323974609375, -4.0867919921875, -3.849609375, -3.6124267578125, -3.375244140625, -3.1380615234375, -2.90087890625, -2.6636962890625, -2.426513671875, -2.1893310546875, -1.9521484375, -1.7149658203125, -1.477783203125, -1.2406005859375, -1.00341796875, -0.7662353515625, -0.529052734375, -0.2918701171875, -0.0546875, 0.1824951171875, 0.419677734375, 0.6568603515625, 0.89404296875, 1.1312255859375, 1.368408203125, 1.6055908203125, 1.8427734375, 2.0799560546875, 2.317138671875, 2.5543212890625, 2.79150390625, 3.0286865234375, 3.265869140625, 3.5030517578125, 3.740234375, 3.9774169921875, 4.214599609375, 4.4517822265625, 4.68896484375, 4.9261474609375, 5.163330078125, 5.4005126953125, 5.6376953125, 5.8748779296875, 6.112060546875, 6.3492431640625, 6.58642578125, 6.8236083984375, 7.060791015625, 7.2979736328125, 7.53515625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 8.0, 4.0, 7.0, 9.0, 12.0, 16.0, 20.0, 19.0, 36.0, 35.0, 56.0, 67.0, 87.0, 113.0, 184.0, 273.0, 456.0, 849.0, 2102.0, 7103.0, 38540.0, 339539.0, 587911.0, 56531.0, 9514.0, 2542.0, 995.0, 493.0, 314.0, 182.0, 133.0, 105.0, 72.0, 51.0, 43.0, 37.0, 25.0, 13.0, 15.0, 13.0, 10.0, 9.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.1328125, -13.6925048828125, -13.252197265625, -12.8118896484375, -12.37158203125, -11.9312744140625, -11.490966796875, -11.0506591796875, -10.6103515625, -10.1700439453125, -9.729736328125, -9.2894287109375, -8.84912109375, -8.4088134765625, -7.968505859375, -7.5281982421875, -7.087890625, -6.6475830078125, -6.207275390625, -5.7669677734375, -5.32666015625, -4.8863525390625, -4.446044921875, -4.0057373046875, -3.5654296875, -3.1251220703125, -2.684814453125, -2.2445068359375, -1.80419921875, -1.3638916015625, -0.923583984375, -0.4832763671875, -0.04296875, 0.3973388671875, 0.837646484375, 1.2779541015625, 1.71826171875, 2.1585693359375, 2.598876953125, 3.0391845703125, 3.4794921875, 3.9197998046875, 4.360107421875, 4.8004150390625, 5.24072265625, 5.6810302734375, 6.121337890625, 6.5616455078125, 7.001953125, 7.4422607421875, 7.882568359375, 8.3228759765625, 8.76318359375, 9.2034912109375, 9.643798828125, 10.0841064453125, 10.5244140625, 10.9647216796875, 11.405029296875, 11.8453369140625, 12.28564453125, 12.7259521484375, 13.166259765625, 13.6065673828125, 14.046875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 5.0, 6.0, 8.0, 7.0, 11.0, 15.0, 6.0, 24.0, 23.0, 29.0, 23.0, 31.0, 43.0, 45.0, 54.0, 66.0, 77.0, 198.0, 1829.0, 128.0, 74.0, 48.0, 41.0, 40.0, 26.0, 39.0, 29.0, 31.0, 17.0, 16.0, 13.0, 13.0, 11.0, 6.0, 3.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.71875, -27.771240234375, -26.82373046875, -25.876220703125, -24.9287109375, -23.981201171875, -23.03369140625, -22.086181640625, -21.138671875, -20.191162109375, -19.24365234375, -18.296142578125, -17.3486328125, -16.401123046875, -15.45361328125, -14.506103515625, -13.55859375, -12.611083984375, -11.66357421875, -10.716064453125, -9.7685546875, -8.821044921875, -7.87353515625, -6.926025390625, -5.978515625, -5.031005859375, -4.08349609375, -3.135986328125, -2.1884765625, -1.240966796875, -0.29345703125, 0.654052734375, 1.6015625, 2.549072265625, 3.49658203125, 4.444091796875, 5.3916015625, 6.339111328125, 7.28662109375, 8.234130859375, 9.181640625, 10.129150390625, 11.07666015625, 12.024169921875, 12.9716796875, 13.919189453125, 14.86669921875, 15.814208984375, 16.76171875, 17.709228515625, 18.65673828125, 19.604248046875, 20.5517578125, 21.499267578125, 22.44677734375, 23.394287109375, 24.341796875, 25.289306640625, 26.23681640625, 27.184326171875, 28.1318359375, 29.079345703125, 30.02685546875, 30.974365234375, 31.921875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 7.0, 7.0, 8.0, 9.0, 16.0, 20.0, 17.0, 28.0, 39.0, 37.0, 49.0, 57.0, 94.0, 161.0, 280.0, 732.0, 12400.0, 3124187.0, 6125.0, 604.0, 280.0, 137.0, 106.0, 62.0, 43.0, 40.0, 25.0, 28.0, 21.0, 14.0, 18.0, 12.0, 10.0, 7.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-95.25, -92.4833984375, -89.716796875, -86.9501953125, -84.18359375, -81.4169921875, -78.650390625, -75.8837890625, -73.1171875, -70.3505859375, -67.583984375, -64.8173828125, -62.05078125, -59.2841796875, -56.517578125, -53.7509765625, -50.984375, -48.2177734375, -45.451171875, -42.6845703125, -39.91796875, -37.1513671875, -34.384765625, -31.6181640625, -28.8515625, -26.0849609375, -23.318359375, -20.5517578125, -17.78515625, -15.0185546875, -12.251953125, -9.4853515625, -6.71875, -3.9521484375, -1.185546875, 1.5810546875, 4.34765625, 7.1142578125, 9.880859375, 12.6474609375, 15.4140625, 18.1806640625, 20.947265625, 23.7138671875, 26.48046875, 29.2470703125, 32.013671875, 34.7802734375, 37.546875, 40.3134765625, 43.080078125, 45.8466796875, 48.61328125, 51.3798828125, 54.146484375, 56.9130859375, 59.6796875, 62.4462890625, 65.212890625, 67.9794921875, 70.74609375, 73.5126953125, 76.279296875, 79.0458984375, 81.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 31.0, 42.0, 84.0, 125.0, 157.0, 176.0, 130.0, 111.0, 80.0, 35.0, 15.0, 10.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.942230224609375, -20.005300521850586, -19.068370819091797, -18.131441116333008, -17.19451141357422, -16.257583618164062, -15.320652961730957, -14.383724212646484, -13.446794509887695, -12.509864807128906, -11.572935104370117, -10.636005401611328, -9.699076652526855, -8.762146949768066, -7.825217247009277, -6.8882880210876465, -5.951357841491699, -5.01442813873291, -4.077498912811279, -3.1405692100524902, -2.2036397457122803, -1.2667102813720703, -0.32978057861328125, 0.6071486473083496, 1.5440783500671387, 2.4810078144073486, 3.4179372787475586, 4.354866981506348, 5.291796684265137, 6.228725910186768, 7.165655612945557, 8.102584838867188, 9.039514541625977, 9.976444244384766, 10.913373947143555, 11.850303649902344, 12.787232398986816, 13.724162101745605, 14.661091804504395, 15.598020553588867, 16.534950256347656, 17.471879959106445, 18.408809661865234, 19.345739364624023, 20.282669067382812, 21.21959686279297, 22.15652847290039, 23.093456268310547, 24.03038787841797, 24.967317581176758, 25.904247283935547, 26.841176986694336, 27.778106689453125, 28.71503448486328, 29.651966094970703, 30.58889389038086, 31.52582359313965, 32.46275329589844, 33.399681091308594, 34.336612701416016, 35.27354049682617, 36.210472106933594, 37.14739990234375, 38.08433151245117, 39.02125930786133]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 4.0, 7.0, 13.0, 15.0, 20.0, 10.0, 16.0, 28.0, 23.0, 29.0, 25.0, 24.0, 31.0, 34.0, 30.0, 40.0, 36.0, 34.0, 31.0, 40.0, 39.0, 48.0, 39.0, 25.0, 26.0, 28.0, 32.0, 36.0, 22.0, 21.0, 19.0, 21.0, 20.0, 9.0, 18.0, 13.0, 8.0, 9.0, 11.0, 9.0, 5.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 7.0, 1.0, 0.0, 2.0], "bins": [-61.671630859375, -59.755794525146484, -57.8399543762207, -55.92411804199219, -54.008277893066406, -52.09244155883789, -50.176605224609375, -48.260765075683594, -46.34492492675781, -44.4290885925293, -42.513248443603516, -40.597412109375, -38.68157196044922, -36.7657356262207, -34.84989929199219, -32.934059143066406, -31.01822280883789, -29.102384567260742, -27.186546325683594, -25.270709991455078, -23.354869842529297, -21.43903350830078, -19.523195266723633, -17.607357025146484, -15.691518783569336, -13.775680541992188, -11.859842300415039, -9.944005012512207, -8.028166770935059, -6.11232852935791, -4.196491241455078, -2.2806529998779297, -0.36481475830078125, 1.551023244857788, 3.4668612480163574, 5.382699012756348, 7.298537254333496, 9.214375495910645, 11.130212783813477, 13.046051025390625, 14.961889266967773, 16.877727508544922, 18.79356575012207, 20.70940399169922, 22.625240325927734, 24.541080474853516, 26.45691680908203, 28.37275505065918, 30.288593292236328, 32.204429626464844, 34.120269775390625, 36.03610610961914, 37.95194625854492, 39.86778259277344, 41.78362274169922, 43.699459075927734, 45.61529541015625, 47.531131744384766, 49.44697189331055, 51.36280822753906, 53.278648376464844, 55.19448471069336, 57.110321044921875, 59.026161193847656, 60.94200134277344]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 2.0, 9.0, 5.0, 2.0, 9.0, 21.0, 11.0, 16.0, 31.0, 19.0, 22.0, 25.0, 19.0, 30.0, 29.0, 46.0, 43.0, 41.0, 37.0, 50.0, 37.0, 42.0, 37.0, 46.0, 38.0, 40.0, 35.0, 36.0, 34.0, 28.0, 20.0, 31.0, 20.0, 16.0, 13.0, 11.0, 11.0, 10.0, 9.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.4443359375, -8.177734375, -7.9111328125, -7.64453125, -7.3779296875, -7.111328125, -6.8447265625, -6.578125, -6.3115234375, -6.044921875, -5.7783203125, -5.51171875, -5.2451171875, -4.978515625, -4.7119140625, -4.4453125, -4.1787109375, -3.912109375, -3.6455078125, -3.37890625, -3.1123046875, -2.845703125, -2.5791015625, -2.3125, -2.0458984375, -1.779296875, -1.5126953125, -1.24609375, -0.9794921875, -0.712890625, -0.4462890625, -0.1796875, 0.0869140625, 0.353515625, 0.6201171875, 0.88671875, 1.1533203125, 1.419921875, 1.6865234375, 1.953125, 2.2197265625, 2.486328125, 2.7529296875, 3.01953125, 3.2861328125, 3.552734375, 3.8193359375, 4.0859375, 4.3525390625, 4.619140625, 4.8857421875, 5.15234375, 5.4189453125, 5.685546875, 5.9521484375, 6.21875, 6.4853515625, 6.751953125, 7.0185546875, 7.28515625, 7.5517578125, 7.818359375, 8.0849609375, 8.3515625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 9.0, 12.0, 14.0, 16.0, 17.0, 24.0, 40.0, 61.0, 77.0, 140.0, 199.0, 354.0, 715.0, 1530.0, 4259.0, 14933.0, 77902.0, 500820.0, 1695932.0, 1460632.0, 362698.0, 56004.0, 11520.0, 3472.0, 1351.0, 602.0, 337.0, 212.0, 135.0, 76.0, 38.0, 36.0, 17.0, 32.0, 13.0, 13.0, 8.0, 10.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.4876708984375, -11.115966796875, -10.7442626953125, -10.37255859375, -10.0008544921875, -9.629150390625, -9.2574462890625, -8.8857421875, -8.5140380859375, -8.142333984375, -7.7706298828125, -7.39892578125, -7.0272216796875, -6.655517578125, -6.2838134765625, -5.912109375, -5.5404052734375, -5.168701171875, -4.7969970703125, -4.42529296875, -4.0535888671875, -3.681884765625, -3.3101806640625, -2.9384765625, -2.5667724609375, -2.195068359375, -1.8233642578125, -1.45166015625, -1.0799560546875, -0.708251953125, -0.3365478515625, 0.03515625, 0.4068603515625, 0.778564453125, 1.1502685546875, 1.52197265625, 1.8936767578125, 2.265380859375, 2.6370849609375, 3.0087890625, 3.3804931640625, 3.752197265625, 4.1239013671875, 4.49560546875, 4.8673095703125, 5.239013671875, 5.6107177734375, 5.982421875, 6.3541259765625, 6.725830078125, 7.0975341796875, 7.46923828125, 7.8409423828125, 8.212646484375, 8.5843505859375, 8.9560546875, 9.3277587890625, 9.699462890625, 10.0711669921875, 10.44287109375, 10.8145751953125, 11.186279296875, 11.5579833984375, 11.9296875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 12.0, 9.0, 9.0, 22.0, 19.0, 41.0, 46.0, 89.0, 122.0, 162.0, 224.0, 297.0, 371.0, 463.0, 499.0, 435.0, 364.0, 270.0, 185.0, 136.0, 91.0, 60.0, 49.0, 38.0, 24.0, 14.0, 7.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.21875, -10.664794921875, -10.11083984375, -9.556884765625, -9.0029296875, -8.448974609375, -7.89501953125, -7.341064453125, -6.787109375, -6.233154296875, -5.67919921875, -5.125244140625, -4.5712890625, -4.017333984375, -3.46337890625, -2.909423828125, -2.35546875, -1.801513671875, -1.24755859375, -0.693603515625, -0.1396484375, 0.414306640625, 0.96826171875, 1.522216796875, 2.076171875, 2.630126953125, 3.18408203125, 3.738037109375, 4.2919921875, 4.845947265625, 5.39990234375, 5.953857421875, 6.5078125, 7.061767578125, 7.61572265625, 8.169677734375, 8.7236328125, 9.277587890625, 9.83154296875, 10.385498046875, 10.939453125, 11.493408203125, 12.04736328125, 12.601318359375, 13.1552734375, 13.709228515625, 14.26318359375, 14.817138671875, 15.37109375, 15.925048828125, 16.47900390625, 17.032958984375, 17.5869140625, 18.140869140625, 18.69482421875, 19.248779296875, 19.802734375, 20.356689453125, 20.91064453125, 21.464599609375, 22.0185546875, 22.572509765625, 23.12646484375, 23.680419921875, 24.234375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 9.0, 8.0, 10.0, 13.0, 26.0, 30.0, 41.0, 52.0, 69.0, 113.0, 122.0, 161.0, 217.0, 271.0, 418.0, 719.0, 2745.0, 314186.0, 3861408.0, 10650.0, 1187.0, 502.0, 310.0, 230.0, 190.0, 135.0, 125.0, 101.0, 62.0, 49.0, 40.0, 28.0, 18.0, 11.0, 8.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-83.625, -81.43701171875, -79.2490234375, -77.06103515625, -74.873046875, -72.68505859375, -70.4970703125, -68.30908203125, -66.12109375, -63.93310546875, -61.7451171875, -59.55712890625, -57.369140625, -55.18115234375, -52.9931640625, -50.80517578125, -48.6171875, -46.42919921875, -44.2412109375, -42.05322265625, -39.865234375, -37.67724609375, -35.4892578125, -33.30126953125, -31.11328125, -28.92529296875, -26.7373046875, -24.54931640625, -22.361328125, -20.17333984375, -17.9853515625, -15.79736328125, -13.609375, -11.42138671875, -9.2333984375, -7.04541015625, -4.857421875, -2.66943359375, -0.4814453125, 1.70654296875, 3.89453125, 6.08251953125, 8.2705078125, 10.45849609375, 12.646484375, 14.83447265625, 17.0224609375, 19.21044921875, 21.3984375, 23.58642578125, 25.7744140625, 27.96240234375, 30.150390625, 32.33837890625, 34.5263671875, 36.71435546875, 38.90234375, 41.09033203125, 43.2783203125, 45.46630859375, 47.654296875, 49.84228515625, 52.0302734375, 54.21826171875, 56.40625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 115.0, 536.0, 309.0, 39.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-370.7165222167969, -362.6109313964844, -354.5053405761719, -346.39971923828125, -338.29412841796875, -330.18853759765625, -322.08294677734375, -313.97735595703125, -305.87176513671875, -297.76617431640625, -289.66058349609375, -281.5549621582031, -273.4493713378906, -265.3437805175781, -257.2381896972656, -249.13259887695312, -241.0269775390625, -232.92138671875, -224.81578063964844, -216.71018981933594, -208.60458374023438, -200.49899291992188, -192.39340209960938, -184.28781127929688, -176.1822052001953, -168.0766143798828, -159.97100830078125, -151.86541748046875, -143.75982666015625, -135.6542205810547, -127.54862976074219, -119.44303131103516, -111.33743286132812, -103.2318344116211, -95.12623596191406, -87.02064514160156, -78.91504669189453, -70.8094482421875, -62.703853607177734, -54.59825897216797, -46.49266052246094, -38.387062072753906, -30.28146743774414, -22.175870895385742, -14.070274353027344, -5.9646759033203125, 2.140918731689453, 10.246513366699219, 18.35211181640625, 26.45770835876465, 34.56330490112305, 42.66889953613281, 50.774497985839844, 58.880096435546875, 66.98568725585938, 75.0912857055664, 83.19688415527344, 91.30248260498047, 99.4080810546875, 107.513671875, 115.61927032470703, 123.72486877441406, 131.83045959472656, 139.93606567382812, 148.04165649414062]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 12.0, 15.0, 14.0, 18.0, 20.0, 31.0, 30.0, 36.0, 29.0, 38.0, 34.0, 63.0, 50.0, 33.0, 37.0, 38.0, 39.0, 36.0, 37.0, 38.0, 38.0, 40.0, 33.0, 27.0, 27.0, 29.0, 23.0, 17.0, 13.0, 12.0, 13.0, 11.0, 8.0, 11.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.81171417236328, -46.17976760864258, -44.547821044921875, -42.91587448120117, -41.28392791748047, -39.6519775390625, -38.0200309753418, -36.388084411621094, -34.75613784790039, -33.12419128417969, -31.492244720458984, -29.86029624938965, -28.228349685668945, -26.596403121948242, -24.964454650878906, -23.332508087158203, -21.7005615234375, -20.068614959716797, -18.436668395996094, -16.804719924926758, -15.172773361206055, -13.540826797485352, -11.908879280090332, -10.276931762695312, -8.64498519897461, -7.013038158416748, -5.381091117858887, -3.7491440773010254, -2.117197036743164, -0.48525047302246094, 1.1466970443725586, 2.778644561767578, 4.410591125488281, 6.042538166046143, 7.674485206604004, 9.306432723999023, 10.938379287719727, 12.57032585144043, 14.20227336883545, 15.834220886230469, 17.466167449951172, 19.098114013671875, 20.730060577392578, 22.362009048461914, 23.993955612182617, 25.62590217590332, 27.257850646972656, 28.88979721069336, 30.521743774414062, 32.153690338134766, 33.78563690185547, 35.41758346557617, 37.049530029296875, 38.681480407714844, 40.31342697143555, 41.94537353515625, 43.57732009887695, 45.209266662597656, 46.84121322631836, 48.47315979003906, 50.10511016845703, 51.73705291748047, 53.36900329589844, 55.00094985961914, 56.632896423339844]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 7.0, 11.0, 13.0, 14.0, 10.0, 16.0, 25.0, 18.0, 25.0, 26.0, 34.0, 22.0, 27.0, 38.0, 35.0, 39.0, 39.0, 52.0, 40.0, 41.0, 55.0, 34.0, 37.0, 34.0, 34.0, 36.0, 41.0, 22.0, 26.0, 19.0, 21.0, 19.0, 13.0, 20.0, 14.0, 10.0, 10.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.81640625, -7.55474853515625, -7.2930908203125, -7.03143310546875, -6.769775390625, -6.50811767578125, -6.2464599609375, -5.98480224609375, -5.72314453125, -5.46148681640625, -5.1998291015625, -4.93817138671875, -4.676513671875, -4.41485595703125, -4.1531982421875, -3.89154052734375, -3.6298828125, -3.36822509765625, -3.1065673828125, -2.84490966796875, -2.583251953125, -2.32159423828125, -2.0599365234375, -1.79827880859375, -1.53662109375, -1.27496337890625, -1.0133056640625, -0.75164794921875, -0.489990234375, -0.22833251953125, 0.0333251953125, 0.29498291015625, 0.556640625, 0.81829833984375, 1.0799560546875, 1.34161376953125, 1.603271484375, 1.86492919921875, 2.1265869140625, 2.38824462890625, 2.64990234375, 2.91156005859375, 3.1732177734375, 3.43487548828125, 3.696533203125, 3.95819091796875, 4.2198486328125, 4.48150634765625, 4.7431640625, 5.00482177734375, 5.2664794921875, 5.52813720703125, 5.789794921875, 6.05145263671875, 6.3131103515625, 6.57476806640625, 6.83642578125, 7.09808349609375, 7.3597412109375, 7.62139892578125, 7.883056640625, 8.14471435546875, 8.4063720703125, 8.66802978515625, 8.9296875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 14.0, 11.0, 11.0, 16.0, 35.0, 48.0, 78.0, 104.0, 144.0, 243.0, 323.0, 477.0, 689.0, 1063.0, 1709.0, 2487.0, 3764.0, 5636.0, 8569.0, 13117.0, 20556.0, 31956.0, 51735.0, 86638.0, 174758.0, 320036.0, 130647.0, 71847.0, 43488.0, 27575.0, 17417.0, 11287.0, 7345.0, 4984.0, 3255.0, 2150.0, 1430.0, 964.0, 602.0, 432.0, 323.0, 179.0, 112.0, 120.0, 59.0, 47.0, 27.0, 17.0, 8.0, 10.0, 9.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7041015625, -1.6497039794921875, -1.595306396484375, -1.5409088134765625, -1.48651123046875, -1.4321136474609375, -1.377716064453125, -1.3233184814453125, -1.2689208984375, -1.2145233154296875, -1.160125732421875, -1.1057281494140625, -1.05133056640625, -0.9969329833984375, -0.942535400390625, -0.8881378173828125, -0.833740234375, -0.7793426513671875, -0.724945068359375, -0.6705474853515625, -0.61614990234375, -0.5617523193359375, -0.507354736328125, -0.4529571533203125, -0.3985595703125, -0.3441619873046875, -0.289764404296875, -0.2353668212890625, -0.18096923828125, -0.1265716552734375, -0.072174072265625, -0.0177764892578125, 0.03662109375, 0.0910186767578125, 0.145416259765625, 0.1998138427734375, 0.25421142578125, 0.3086090087890625, 0.363006591796875, 0.4174041748046875, 0.4718017578125, 0.5261993408203125, 0.580596923828125, 0.6349945068359375, 0.68939208984375, 0.7437896728515625, 0.798187255859375, 0.8525848388671875, 0.906982421875, 0.9613800048828125, 1.015777587890625, 1.0701751708984375, 1.12457275390625, 1.1789703369140625, 1.233367919921875, 1.2877655029296875, 1.3421630859375, 1.3965606689453125, 1.450958251953125, 1.5053558349609375, 1.55975341796875, 1.6141510009765625, 1.668548583984375, 1.7229461669921875, 1.77734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 9.0, 6.0, 9.0, 10.0, 9.0, 13.0, 11.0, 17.0, 35.0, 16.0, 16.0, 33.0, 26.0, 26.0, 42.0, 34.0, 27.0, 28.0, 29.0, 40.0, 28.0, 1058.0, 33.0, 37.0, 42.0, 26.0, 30.0, 34.0, 29.0, 28.0, 28.0, 27.0, 22.0, 22.0, 17.0, 18.0, 22.0, 15.0, 18.0, 10.0, 6.0, 3.0, 6.0, 5.0, 10.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.90234375, -4.7557373046875, -4.609130859375, -4.4625244140625, -4.31591796875, -4.1693115234375, -4.022705078125, -3.8760986328125, -3.7294921875, -3.5828857421875, -3.436279296875, -3.2896728515625, -3.14306640625, -2.9964599609375, -2.849853515625, -2.7032470703125, -2.556640625, -2.4100341796875, -2.263427734375, -2.1168212890625, -1.97021484375, -1.8236083984375, -1.677001953125, -1.5303955078125, -1.3837890625, -1.2371826171875, -1.090576171875, -0.9439697265625, -0.79736328125, -0.6507568359375, -0.504150390625, -0.3575439453125, -0.2109375, -0.0643310546875, 0.082275390625, 0.2288818359375, 0.37548828125, 0.5220947265625, 0.668701171875, 0.8153076171875, 0.9619140625, 1.1085205078125, 1.255126953125, 1.4017333984375, 1.54833984375, 1.6949462890625, 1.841552734375, 1.9881591796875, 2.134765625, 2.2813720703125, 2.427978515625, 2.5745849609375, 2.72119140625, 2.8677978515625, 3.014404296875, 3.1610107421875, 3.3076171875, 3.4542236328125, 3.600830078125, 3.7474365234375, 3.89404296875, 4.0406494140625, 4.187255859375, 4.3338623046875, 4.48046875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 14.0, 21.0, 19.0, 41.0, 49.0, 72.0, 112.0, 164.0, 227.0, 307.0, 478.0, 698.0, 1009.0, 1366.0, 2034.0, 3011.0, 4502.0, 6245.0, 9296.0, 13604.0, 19744.0, 28719.0, 42943.0, 65463.0, 104589.0, 216184.0, 1265628.0, 106976.0, 66906.0, 43522.0, 29485.0, 20161.0, 13626.0, 9503.0, 6371.0, 4374.0, 3066.0, 2049.0, 1462.0, 976.0, 639.0, 417.0, 340.0, 213.0, 170.0, 110.0, 64.0, 56.0, 43.0, 11.0, 25.0, 13.0, 11.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.4658203125, -1.4200439453125, -1.374267578125, -1.3284912109375, -1.28271484375, -1.2369384765625, -1.191162109375, -1.1453857421875, -1.099609375, -1.0538330078125, -1.008056640625, -0.9622802734375, -0.91650390625, -0.8707275390625, -0.824951171875, -0.7791748046875, -0.7333984375, -0.6876220703125, -0.641845703125, -0.5960693359375, -0.55029296875, -0.5045166015625, -0.458740234375, -0.4129638671875, -0.3671875, -0.3214111328125, -0.275634765625, -0.2298583984375, -0.18408203125, -0.1383056640625, -0.092529296875, -0.0467529296875, -0.0009765625, 0.0447998046875, 0.090576171875, 0.1363525390625, 0.18212890625, 0.2279052734375, 0.273681640625, 0.3194580078125, 0.365234375, 0.4110107421875, 0.456787109375, 0.5025634765625, 0.54833984375, 0.5941162109375, 0.639892578125, 0.6856689453125, 0.7314453125, 0.7772216796875, 0.822998046875, 0.8687744140625, 0.91455078125, 0.9603271484375, 1.006103515625, 1.0518798828125, 1.09765625, 1.1434326171875, 1.189208984375, 1.2349853515625, 1.28076171875, 1.3265380859375, 1.372314453125, 1.4180908203125, 1.4638671875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 4.0, 6.0, 10.0, 12.0, 20.0, 13.0, 23.0, 21.0, 35.0, 47.0, 88.0, 109.0, 115.0, 108.0, 87.0, 76.0, 40.0, 37.0, 29.0, 18.0, 14.0, 17.0, 4.0, 8.0, 9.0, 8.0, 4.0, 9.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0014410018920898438, -0.0013994872570037842, -0.0013579726219177246, -0.001316457986831665, -0.0012749433517456055, -0.001233428716659546, -0.0011919140815734863, -0.0011503994464874268, -0.0011088848114013672, -0.0010673701763153076, -0.001025855541229248, -0.0009843409061431885, -0.0009428262710571289, -0.0009013116359710693, -0.0008597970008850098, -0.0008182823657989502, -0.0007767677307128906, -0.0007352530956268311, -0.0006937384605407715, -0.0006522238254547119, -0.0006107091903686523, -0.0005691945552825928, -0.0005276799201965332, -0.00048616528511047363, -0.00044465065002441406, -0.0004031360149383545, -0.0003616213798522949, -0.00032010674476623535, -0.0002785921096801758, -0.0002370774745941162, -0.00019556283950805664, -0.00015404820442199707, -0.0001125335693359375, -7.101893424987793e-05, -2.950429916381836e-05, 1.2010335922241211e-05, 5.352497100830078e-05, 9.503960609436035e-05, 0.00013655424118041992, 0.0001780688762664795, 0.00021958351135253906, 0.00026109814643859863, 0.0003026127815246582, 0.0003441274166107178, 0.00038564205169677734, 0.0004271566867828369, 0.0004686713218688965, 0.0005101859569549561, 0.0005517005920410156, 0.0005932152271270752, 0.0006347298622131348, 0.0006762444972991943, 0.0007177591323852539, 0.0007592737674713135, 0.000800788402557373, 0.0008423030376434326, 0.0008838176727294922, 0.0009253323078155518, 0.0009668469429016113, 0.001008361577987671, 0.0010498762130737305, 0.00109139084815979, 0.0011329054832458496, 0.0011744201183319092, 0.0012159347534179688]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 6.0, 11.0, 6.0, 14.0, 7.0, 11.0, 29.0, 37.0, 44.0, 96.0, 162.0, 353.0, 1368.0, 1042752.0, 2803.0, 393.0, 169.0, 80.0, 57.0, 34.0, 17.0, 27.0, 13.0, 8.0, 6.0, 10.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030975341796875, -0.0298919677734375, -0.02880859375, -0.0277252197265625, -0.026641845703125, -0.0255584716796875, -0.02447509765625, -0.0233917236328125, -0.022308349609375, -0.0212249755859375, -0.0201416015625, -0.0190582275390625, -0.017974853515625, -0.0168914794921875, -0.01580810546875, -0.0147247314453125, -0.013641357421875, -0.0125579833984375, -0.011474609375, -0.0103912353515625, -0.009307861328125, -0.0082244873046875, -0.00714111328125, -0.0060577392578125, -0.004974365234375, -0.0038909912109375, -0.0028076171875, -0.0017242431640625, -0.000640869140625, 0.0004425048828125, 0.00152587890625, 0.0026092529296875, 0.003692626953125, 0.0047760009765625, 0.005859375, 0.0069427490234375, 0.008026123046875, 0.0091094970703125, 0.01019287109375, 0.0112762451171875, 0.012359619140625, 0.0134429931640625, 0.0145263671875, 0.0156097412109375, 0.016693115234375, 0.0177764892578125, 0.01885986328125, 0.0199432373046875, 0.021026611328125, 0.0221099853515625, 0.023193359375, 0.0242767333984375, 0.025360107421875, 0.0264434814453125, 0.02752685546875, 0.0286102294921875, 0.029693603515625, 0.0307769775390625, 0.0318603515625, 0.0329437255859375, 0.034027099609375, 0.0351104736328125, 0.03619384765625, 0.0372772216796875, 0.038360595703125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 9.0, 140.0, 506.0, 306.0, 46.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.003849547356367111, -0.0037805025931447744, -0.0037114580627530813, -0.0036424132995307446, -0.0035733687691390514, -0.0035043240059167147, -0.003435279242694378, -0.003366234712302685, -0.003297189949080348, -0.0032281451858580112, -0.003159100655466318, -0.0030900558922439814, -0.0030210113618522882, -0.0029519665986299515, -0.0028829220682382584, -0.0028138773050159216, -0.002744832541793585, -0.002675787778571248, -0.002606743248179555, -0.002537698484957218, -0.002468653954565525, -0.0023996091913431883, -0.0023305644281208515, -0.0022615198977291584, -0.0021924753673374653, -0.0021234306041151285, -0.0020543860737234354, -0.0019853413105010986, -0.0019162966636940837, -0.0018472520168870687, -0.0017782073700800538, -0.0017091627232730389, -0.0016401177272200584, -0.0015710730804130435, -0.0015020284336060286, -0.0014329836703836918, -0.0013639390235766768, -0.001294894376769662, -0.001225849729962647, -0.001156805083155632, -0.001087760436348617, -0.0010187157895416021, -0.0009496710845269263, -0.0008806264377199113, -0.0008115817327052355, -0.0007425370858982205, -0.0006734924390912056, -0.0006044477922841907, -0.0005354030872695148, -0.0004663584113586694, -0.000397313735447824, -0.00032826908864080906, -0.00025922441272996366, -0.00019017973681911826, -0.00012113509001210332, -5.209041410125792e-05, 1.695426180958748e-05, 8.599893044447526e-05, 0.00015504359907936305, 0.00022408826043829322, 0.0002931329363491386, 0.000362177612259984, 0.00043122225906699896, 0.0005002669058740139, 0.0005693116108886898]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 7.0, 6.0, 7.0, 4.0, 16.0, 12.0, 18.0, 24.0, 24.0, 19.0, 19.0, 37.0, 27.0, 24.0, 38.0, 37.0, 33.0, 41.0, 35.0, 51.0, 50.0, 45.0, 50.0, 50.0, 41.0, 44.0, 31.0, 31.0, 25.0, 27.0, 21.0, 17.0, 18.0, 16.0, 6.0, 12.0, 11.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005316734313964844, -0.0005137557163834572, -0.00049583800137043, -0.0004779202863574028, -0.0004600025713443756, -0.0004420848563313484, -0.00042416714131832123, -0.00040624942630529404, -0.00038833171129226685, -0.00037041399627923965, -0.00035249628126621246, -0.00033457856625318527, -0.0003166608512401581, -0.0002987431362271309, -0.0002808254212141037, -0.0002629077062010765, -0.0002449899911880493, -0.00022707227617502213, -0.00020915456116199493, -0.00019123684614896774, -0.00017331913113594055, -0.00015540141612291336, -0.00013748370110988617, -0.00011956598609685898, -0.00010164827108383179, -8.37305560708046e-05, -6.58128410577774e-05, -4.7895126044750214e-05, -2.9977411031723022e-05, -1.2059696018695831e-05, 5.85801899433136e-06, 2.377573400735855e-05, 4.169344902038574e-05, 5.961116403341293e-05, 7.752887904644012e-05, 9.544659405946732e-05, 0.00011336430907249451, 0.0001312820240855217, 0.0001491997390985489, 0.00016711745411157608, 0.00018503516912460327, 0.00020295288413763046, 0.00022087059915065765, 0.00023878831416368484, 0.00025670602917671204, 0.00027462374418973923, 0.0002925414592027664, 0.0003104591742157936, 0.0003283768892288208, 0.000346294604241848, 0.0003642123192548752, 0.0003821300342679024, 0.00040004774928092957, 0.00041796546429395676, 0.00043588317930698395, 0.00045380089432001114, 0.00047171860933303833, 0.0004896363243460655, 0.0005075540393590927, 0.0005254717543721199, 0.0005433894693851471, 0.0005613071843981743, 0.0005792248994112015, 0.0005971426144242287, 0.0006150603294372559]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 5.0, 7.0, 11.0, 13.0, 14.0, 10.0, 16.0, 25.0, 18.0, 25.0, 26.0, 34.0, 22.0, 28.0, 37.0, 35.0, 39.0, 39.0, 52.0, 40.0, 41.0, 55.0, 34.0, 37.0, 34.0, 34.0, 36.0, 41.0, 22.0, 26.0, 19.0, 21.0, 19.0, 13.0, 20.0, 14.0, 10.0, 10.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.81640625, -7.55474853515625, -7.2930908203125, -7.03143310546875, -6.769775390625, -6.50811767578125, -6.2464599609375, -5.98480224609375, -5.72314453125, -5.46148681640625, -5.1998291015625, -4.93817138671875, -4.676513671875, -4.41485595703125, -4.1531982421875, -3.89154052734375, -3.6298828125, -3.36822509765625, -3.1065673828125, -2.84490966796875, -2.583251953125, -2.32159423828125, -2.0599365234375, -1.79827880859375, -1.53662109375, -1.27496337890625, -1.0133056640625, -0.75164794921875, -0.489990234375, -0.22833251953125, 0.0333251953125, 0.29498291015625, 0.556640625, 0.81829833984375, 1.0799560546875, 1.34161376953125, 1.603271484375, 1.86492919921875, 2.1265869140625, 2.38824462890625, 2.64990234375, 2.91156005859375, 3.1732177734375, 3.43487548828125, 3.696533203125, 3.95819091796875, 4.2198486328125, 4.48150634765625, 4.7431640625, 5.00482177734375, 5.2664794921875, 5.52813720703125, 5.789794921875, 6.05145263671875, 6.3131103515625, 6.57476806640625, 6.83642578125, 7.09808349609375, 7.3597412109375, 7.62139892578125, 7.883056640625, 8.14471435546875, 8.4063720703125, 8.66802978515625, 8.9296875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 9.0, 14.0, 12.0, 21.0, 21.0, 37.0, 56.0, 68.0, 123.0, 191.0, 317.0, 541.0, 1118.0, 2444.0, 5022.0, 11207.0, 25858.0, 66164.0, 188723.0, 411025.0, 211290.0, 72866.0, 28483.0, 12219.0, 5328.0, 2605.0, 1242.0, 592.0, 359.0, 177.0, 116.0, 100.0, 57.0, 37.0, 30.0, 23.0, 23.0, 6.0, 7.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.79296875, -6.57061767578125, -6.3482666015625, -6.12591552734375, -5.903564453125, -5.68121337890625, -5.4588623046875, -5.23651123046875, -5.01416015625, -4.79180908203125, -4.5694580078125, -4.34710693359375, -4.124755859375, -3.90240478515625, -3.6800537109375, -3.45770263671875, -3.2353515625, -3.01300048828125, -2.7906494140625, -2.56829833984375, -2.345947265625, -2.12359619140625, -1.9012451171875, -1.67889404296875, -1.45654296875, -1.23419189453125, -1.0118408203125, -0.78948974609375, -0.567138671875, -0.34478759765625, -0.1224365234375, 0.09991455078125, 0.322265625, 0.54461669921875, 0.7669677734375, 0.98931884765625, 1.211669921875, 1.43402099609375, 1.6563720703125, 1.87872314453125, 2.10107421875, 2.32342529296875, 2.5457763671875, 2.76812744140625, 2.990478515625, 3.21282958984375, 3.4351806640625, 3.65753173828125, 3.8798828125, 4.10223388671875, 4.3245849609375, 4.54693603515625, 4.769287109375, 4.99163818359375, 5.2139892578125, 5.43634033203125, 5.65869140625, 5.88104248046875, 6.1033935546875, 6.32574462890625, 6.548095703125, 6.77044677734375, 6.9927978515625, 7.21514892578125, 7.4375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 9.0, 9.0, 6.0, 10.0, 11.0, 20.0, 16.0, 16.0, 36.0, 19.0, 37.0, 34.0, 36.0, 44.0, 35.0, 57.0, 80.0, 196.0, 1554.0, 285.0, 104.0, 53.0, 45.0, 38.0, 39.0, 24.0, 37.0, 21.0, 33.0, 19.0, 16.0, 18.0, 15.0, 7.0, 10.0, 11.0, 5.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-26.890625, -26.093017578125, -25.29541015625, -24.497802734375, -23.7001953125, -22.902587890625, -22.10498046875, -21.307373046875, -20.509765625, -19.712158203125, -18.91455078125, -18.116943359375, -17.3193359375, -16.521728515625, -15.72412109375, -14.926513671875, -14.12890625, -13.331298828125, -12.53369140625, -11.736083984375, -10.9384765625, -10.140869140625, -9.34326171875, -8.545654296875, -7.748046875, -6.950439453125, -6.15283203125, -5.355224609375, -4.5576171875, -3.760009765625, -2.96240234375, -2.164794921875, -1.3671875, -0.569580078125, 0.22802734375, 1.025634765625, 1.8232421875, 2.620849609375, 3.41845703125, 4.216064453125, 5.013671875, 5.811279296875, 6.60888671875, 7.406494140625, 8.2041015625, 9.001708984375, 9.79931640625, 10.596923828125, 11.39453125, 12.192138671875, 12.98974609375, 13.787353515625, 14.5849609375, 15.382568359375, 16.18017578125, 16.977783203125, 17.775390625, 18.572998046875, 19.37060546875, 20.168212890625, 20.9658203125, 21.763427734375, 22.56103515625, 23.358642578125, 24.15625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 3.0, 11.0, 9.0, 16.0, 18.0, 13.0, 17.0, 28.0, 42.0, 54.0, 62.0, 82.0, 104.0, 119.0, 188.0, 268.0, 425.0, 942.0, 9294.0, 2610885.0, 516304.0, 4578.0, 814.0, 437.0, 222.0, 180.0, 123.0, 92.0, 96.0, 46.0, 49.0, 42.0, 18.0, 17.0, 21.0, 14.0, 13.0, 13.0, 5.0, 6.0, 2.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-43.21875, -41.86376953125, -40.5087890625, -39.15380859375, -37.798828125, -36.44384765625, -35.0888671875, -33.73388671875, -32.37890625, -31.02392578125, -29.6689453125, -28.31396484375, -26.958984375, -25.60400390625, -24.2490234375, -22.89404296875, -21.5390625, -20.18408203125, -18.8291015625, -17.47412109375, -16.119140625, -14.76416015625, -13.4091796875, -12.05419921875, -10.69921875, -9.34423828125, -7.9892578125, -6.63427734375, -5.279296875, -3.92431640625, -2.5693359375, -1.21435546875, 0.140625, 1.49560546875, 2.8505859375, 4.20556640625, 5.560546875, 6.91552734375, 8.2705078125, 9.62548828125, 10.98046875, 12.33544921875, 13.6904296875, 15.04541015625, 16.400390625, 17.75537109375, 19.1103515625, 20.46533203125, 21.8203125, 23.17529296875, 24.5302734375, 25.88525390625, 27.240234375, 28.59521484375, 29.9501953125, 31.30517578125, 32.66015625, 34.01513671875, 35.3701171875, 36.72509765625, 38.080078125, 39.43505859375, 40.7900390625, 42.14501953125, 43.5]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 52.0, 893.0, 72.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-412.79730224609375, -405.079833984375, -397.3623962402344, -389.6449279785156, -381.927490234375, -374.21002197265625, -366.4925537109375, -358.7751159667969, -351.0576477050781, -343.3401794433594, -335.62274169921875, -327.9052734375, -320.18780517578125, -312.4703674316406, -304.7528991699219, -297.03546142578125, -289.3179931640625, -281.60052490234375, -273.8830871582031, -266.1656188964844, -258.44818115234375, -250.730712890625, -243.01324462890625, -235.29579162597656, -227.57833862304688, -219.8608856201172, -212.1434326171875, -204.42596435546875, -196.70851135253906, -188.99105834960938, -181.27359008789062, -173.55613708496094, -165.8386993408203, -158.12124633789062, -150.40377807617188, -142.6863250732422, -134.9688720703125, -127.25141906738281, -119.5339584350586, -111.81649780273438, -104.09904479980469, -96.381591796875, -88.66413116455078, -80.94667053222656, -73.22921752929688, -65.51176452636719, -57.79430389404297, -50.076847076416016, -42.35939025878906, -34.64193344116211, -26.924476623535156, -19.207019805908203, -11.48956298828125, -3.772106170654297, 3.9453506469726562, 11.66280746459961, 19.380264282226562, 27.097721099853516, 34.81517791748047, 42.53263473510742, 50.250091552734375, 57.96754837036133, 65.68500518798828, 73.4024658203125, 81.11991882324219]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 6.0, 9.0, 6.0, 10.0, 10.0, 7.0, 14.0, 28.0, 13.0, 21.0, 25.0, 23.0, 42.0, 37.0, 37.0, 29.0, 36.0, 30.0, 36.0, 40.0, 45.0, 38.0, 35.0, 37.0, 34.0, 32.0, 36.0, 33.0, 30.0, 30.0, 27.0, 28.0, 28.0, 15.0, 16.0, 18.0, 9.0, 11.0, 3.0, 5.0, 5.0, 6.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-57.751251220703125, -55.80572509765625, -53.860198974609375, -51.9146728515625, -49.969146728515625, -48.02362060546875, -46.07809066772461, -44.132564544677734, -42.18703842163086, -40.241512298583984, -38.29598617553711, -36.350460052490234, -34.404930114746094, -32.45940399169922, -30.513877868652344, -28.56835174560547, -26.622825622558594, -24.67729949951172, -22.731773376464844, -20.786245346069336, -18.84071922302246, -16.895193099975586, -14.949666023254395, -13.004138946533203, -11.058612823486328, -9.113086700439453, -7.167559623718262, -5.2220330238342285, -3.2765064239501953, -1.3309803009033203, 0.6145467758178711, 2.5600738525390625, 4.5055999755859375, 6.451126575469971, 8.396653175354004, 10.342180252075195, 12.28770637512207, 14.233232498168945, 16.178760528564453, 18.124286651611328, 20.069812774658203, 22.015338897705078, 23.960865020751953, 25.90639305114746, 27.851919174194336, 29.79744529724121, 31.74297332763672, 33.688499450683594, 35.63402557373047, 37.579551696777344, 39.52507781982422, 41.470603942871094, 43.41613006591797, 45.361656188964844, 47.307186126708984, 49.25271224975586, 51.198238372802734, 53.14376449584961, 55.089290618896484, 57.03481674194336, 58.9803466796875, 60.925872802734375, 62.87139892578125, 64.81692504882812, 66.762451171875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 10.0, 8.0, 12.0, 18.0, 19.0, 19.0, 18.0, 15.0, 23.0, 33.0, 18.0, 24.0, 36.0, 31.0, 36.0, 37.0, 38.0, 56.0, 43.0, 38.0, 54.0, 42.0, 37.0, 45.0, 29.0, 28.0, 27.0, 29.0, 29.0, 21.0, 18.0, 20.0, 16.0, 11.0, 17.0, 11.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -7.995849609375, -7.72607421875, -7.456298828125, -7.1865234375, -6.916748046875, -6.64697265625, -6.377197265625, -6.107421875, -5.837646484375, -5.56787109375, -5.298095703125, -5.0283203125, -4.758544921875, -4.48876953125, -4.218994140625, -3.94921875, -3.679443359375, -3.40966796875, -3.139892578125, -2.8701171875, -2.600341796875, -2.33056640625, -2.060791015625, -1.791015625, -1.521240234375, -1.25146484375, -0.981689453125, -0.7119140625, -0.442138671875, -0.17236328125, 0.097412109375, 0.3671875, 0.636962890625, 0.90673828125, 1.176513671875, 1.4462890625, 1.716064453125, 1.98583984375, 2.255615234375, 2.525390625, 2.795166015625, 3.06494140625, 3.334716796875, 3.6044921875, 3.874267578125, 4.14404296875, 4.413818359375, 4.68359375, 4.953369140625, 5.22314453125, 5.492919921875, 5.7626953125, 6.032470703125, 6.30224609375, 6.572021484375, 6.841796875, 7.111572265625, 7.38134765625, 7.651123046875, 7.9208984375, 8.190673828125, 8.46044921875, 8.730224609375, 9.0]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 8.0, 15.0, 10.0, 18.0, 10.0, 14.0, 26.0, 28.0, 36.0, 38.0, 57.0, 67.0, 90.0, 154.0, 283.0, 950.0, 5715.0, 150391.0, 3380840.0, 639013.0, 13996.0, 1493.0, 387.0, 174.0, 89.0, 83.0, 56.0, 46.0, 38.0, 33.0, 27.0, 16.0, 8.0, 12.0, 14.0, 11.0, 8.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.65625, -26.75439453125, -25.8525390625, -24.95068359375, -24.048828125, -23.14697265625, -22.2451171875, -21.34326171875, -20.44140625, -19.53955078125, -18.6376953125, -17.73583984375, -16.833984375, -15.93212890625, -15.0302734375, -14.12841796875, -13.2265625, -12.32470703125, -11.4228515625, -10.52099609375, -9.619140625, -8.71728515625, -7.8154296875, -6.91357421875, -6.01171875, -5.10986328125, -4.2080078125, -3.30615234375, -2.404296875, -1.50244140625, -0.6005859375, 0.30126953125, 1.203125, 2.10498046875, 3.0068359375, 3.90869140625, 4.810546875, 5.71240234375, 6.6142578125, 7.51611328125, 8.41796875, 9.31982421875, 10.2216796875, 11.12353515625, 12.025390625, 12.92724609375, 13.8291015625, 14.73095703125, 15.6328125, 16.53466796875, 17.4365234375, 18.33837890625, 19.240234375, 20.14208984375, 21.0439453125, 21.94580078125, 22.84765625, 23.74951171875, 24.6513671875, 25.55322265625, 26.455078125, 27.35693359375, 28.2587890625, 29.16064453125, 30.0625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 11.0, 11.0, 20.0, 19.0, 20.0, 31.0, 41.0, 43.0, 59.0, 91.0, 119.0, 156.0, 205.0, 281.0, 351.0, 412.0, 426.0, 417.0, 367.0, 245.0, 182.0, 136.0, 104.0, 79.0, 65.0, 41.0, 36.0, 20.0, 24.0, 15.0, 13.0, 9.0, 4.0, 4.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.1640625, -12.72998046875, -12.2958984375, -11.86181640625, -11.427734375, -10.99365234375, -10.5595703125, -10.12548828125, -9.69140625, -9.25732421875, -8.8232421875, -8.38916015625, -7.955078125, -7.52099609375, -7.0869140625, -6.65283203125, -6.21875, -5.78466796875, -5.3505859375, -4.91650390625, -4.482421875, -4.04833984375, -3.6142578125, -3.18017578125, -2.74609375, -2.31201171875, -1.8779296875, -1.44384765625, -1.009765625, -0.57568359375, -0.1416015625, 0.29248046875, 0.7265625, 1.16064453125, 1.5947265625, 2.02880859375, 2.462890625, 2.89697265625, 3.3310546875, 3.76513671875, 4.19921875, 4.63330078125, 5.0673828125, 5.50146484375, 5.935546875, 6.36962890625, 6.8037109375, 7.23779296875, 7.671875, 8.10595703125, 8.5400390625, 8.97412109375, 9.408203125, 9.84228515625, 10.2763671875, 10.71044921875, 11.14453125, 11.57861328125, 12.0126953125, 12.44677734375, 12.880859375, 13.31494140625, 13.7490234375, 14.18310546875, 14.6171875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 7.0, 3.0, 5.0, 21.0, 21.0, 27.0, 34.0, 49.0, 54.0, 68.0, 105.0, 144.0, 181.0, 258.0, 415.0, 899.0, 7491.0, 3144434.0, 1033528.0, 4454.0, 811.0, 320.0, 242.0, 167.0, 112.0, 107.0, 60.0, 61.0, 47.0, 36.0, 30.0, 19.0, 15.0, 13.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.34375, -56.00244140625, -53.6611328125, -51.31982421875, -48.978515625, -46.63720703125, -44.2958984375, -41.95458984375, -39.61328125, -37.27197265625, -34.9306640625, -32.58935546875, -30.248046875, -27.90673828125, -25.5654296875, -23.22412109375, -20.8828125, -18.54150390625, -16.2001953125, -13.85888671875, -11.517578125, -9.17626953125, -6.8349609375, -4.49365234375, -2.15234375, 0.18896484375, 2.5302734375, 4.87158203125, 7.212890625, 9.55419921875, 11.8955078125, 14.23681640625, 16.578125, 18.91943359375, 21.2607421875, 23.60205078125, 25.943359375, 28.28466796875, 30.6259765625, 32.96728515625, 35.30859375, 37.64990234375, 39.9912109375, 42.33251953125, 44.673828125, 47.01513671875, 49.3564453125, 51.69775390625, 54.0390625, 56.38037109375, 58.7216796875, 61.06298828125, 63.404296875, 65.74560546875, 68.0869140625, 70.42822265625, 72.76953125, 75.11083984375, 77.4521484375, 79.79345703125, 82.134765625, 84.47607421875, 86.8173828125, 89.15869140625, 91.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 27.0, 124.0, 333.0, 315.0, 167.0, 32.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.72439575195312, -99.51272583007812, -94.30105590820312, -89.08939361572266, -83.87772369384766, -78.66605377197266, -73.45439147949219, -68.24272155761719, -63.03105163574219, -57.81938171386719, -52.60771560668945, -47.39604949951172, -42.18437957763672, -36.97270965576172, -31.761043548583984, -26.54937744140625, -21.33770751953125, -16.126039505004883, -10.914371490478516, -5.702703475952148, -0.49103546142578125, 4.720632553100586, 9.932300567626953, 15.143966674804688, 20.355636596679688, 25.567304611206055, 30.778972625732422, 35.990638732910156, 41.202308654785156, 46.413978576660156, 51.62564468383789, 56.837310791015625, 62.04896545410156, 67.26063537597656, 72.47230529785156, 77.68396759033203, 82.89563751220703, 88.10730743408203, 93.3189697265625, 98.5306396484375, 103.7423095703125, 108.9539794921875, 114.1656494140625, 119.37731170654297, 124.58898162841797, 129.80064392089844, 135.01231384277344, 140.22398376464844, 145.43565368652344, 150.64732360839844, 155.85899353027344, 161.07066345214844, 166.28231811523438, 171.49398803710938, 176.70565795898438, 181.91732788085938, 187.12899780273438, 192.34066772460938, 197.55233764648438, 202.76400756835938, 207.97567749023438, 213.1873321533203, 218.3990020751953, 223.6106719970703, 228.8223419189453]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 9.0, 5.0, 18.0, 18.0, 24.0, 27.0, 26.0, 30.0, 36.0, 25.0, 36.0, 42.0, 35.0, 45.0, 51.0, 52.0, 41.0, 39.0, 48.0, 42.0, 31.0, 34.0, 31.0, 35.0, 26.0, 20.0, 23.0, 28.0, 19.0, 16.0, 11.0, 11.0, 8.0, 7.0, 7.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-52.05033874511719, -50.452239990234375, -48.85414123535156, -47.25604248046875, -45.65794372558594, -44.059844970703125, -42.46174621582031, -40.8636474609375, -39.26554870605469, -37.667449951171875, -36.06935119628906, -34.47125244140625, -32.87315368652344, -31.275054931640625, -29.67695426940918, -28.078855514526367, -26.480754852294922, -24.88265609741211, -23.284557342529297, -21.686458587646484, -20.088359832763672, -18.49026107788086, -16.892160415649414, -15.294061660766602, -13.695962905883789, -12.097864151000977, -10.499765396118164, -8.901665687561035, -7.303566932678223, -5.70546817779541, -4.107368469238281, -2.5092697143554688, -0.9111709594726562, 0.6869280338287354, 2.285027027130127, 3.8831262588500977, 5.48122501373291, 7.079323768615723, 8.677423477172852, 10.275522232055664, 11.873620986938477, 13.471719741821289, 15.069818496704102, 16.667919158935547, 18.26601791381836, 19.864116668701172, 21.462215423583984, 23.060314178466797, 24.65841293334961, 26.256511688232422, 27.854610443115234, 29.452709197998047, 31.05080795288086, 32.64890670776367, 34.24700927734375, 35.84510803222656, 37.443206787109375, 39.04130554199219, 40.639404296875, 42.23750305175781, 43.835601806640625, 45.43370056152344, 47.03179931640625, 48.62989807128906, 50.227996826171875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 8.0, 15.0, 10.0, 12.0, 9.0, 20.0, 17.0, 14.0, 16.0, 26.0, 16.0, 17.0, 28.0, 29.0, 24.0, 27.0, 38.0, 36.0, 40.0, 53.0, 38.0, 46.0, 35.0, 40.0, 29.0, 22.0, 38.0, 30.0, 31.0, 25.0, 27.0, 16.0, 24.0, 23.0, 19.0, 23.0, 13.0, 11.0, 8.0, 10.0, 8.0, 6.0, 4.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.828125, -7.5748291015625, -7.321533203125, -7.0682373046875, -6.81494140625, -6.5616455078125, -6.308349609375, -6.0550537109375, -5.8017578125, -5.5484619140625, -5.295166015625, -5.0418701171875, -4.78857421875, -4.5352783203125, -4.281982421875, -4.0286865234375, -3.775390625, -3.5220947265625, -3.268798828125, -3.0155029296875, -2.76220703125, -2.5089111328125, -2.255615234375, -2.0023193359375, -1.7490234375, -1.4957275390625, -1.242431640625, -0.9891357421875, -0.73583984375, -0.4825439453125, -0.229248046875, 0.0240478515625, 0.27734375, 0.5306396484375, 0.783935546875, 1.0372314453125, 1.29052734375, 1.5438232421875, 1.797119140625, 2.0504150390625, 2.3037109375, 2.5570068359375, 2.810302734375, 3.0635986328125, 3.31689453125, 3.5701904296875, 3.823486328125, 4.0767822265625, 4.330078125, 4.5833740234375, 4.836669921875, 5.0899658203125, 5.34326171875, 5.5965576171875, 5.849853515625, 6.1031494140625, 6.3564453125, 6.6097412109375, 6.863037109375, 7.1163330078125, 7.36962890625, 7.6229248046875, 7.876220703125, 8.1295166015625, 8.3828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 7.0, 10.0, 9.0, 31.0, 49.0, 73.0, 82.0, 104.0, 176.0, 255.0, 468.0, 710.0, 990.0, 1466.0, 2229.0, 3243.0, 4936.0, 7405.0, 11344.0, 16759.0, 25848.0, 40084.0, 63535.0, 112606.0, 294360.0, 209117.0, 94214.0, 55651.0, 35104.0, 22852.0, 14951.0, 9823.0, 6570.0, 4587.0, 3024.0, 2013.0, 1305.0, 860.0, 564.0, 427.0, 263.0, 171.0, 122.0, 58.0, 40.0, 15.0, 19.0, 17.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7939453125, -1.735809326171875, -1.67767333984375, -1.619537353515625, -1.5614013671875, -1.503265380859375, -1.44512939453125, -1.386993408203125, -1.328857421875, -1.270721435546875, -1.21258544921875, -1.154449462890625, -1.0963134765625, -1.038177490234375, -0.98004150390625, -0.921905517578125, -0.86376953125, -0.805633544921875, -0.74749755859375, -0.689361572265625, -0.6312255859375, -0.573089599609375, -0.51495361328125, -0.456817626953125, -0.398681640625, -0.340545654296875, -0.28240966796875, -0.224273681640625, -0.1661376953125, -0.108001708984375, -0.04986572265625, 0.008270263671875, 0.06640625, 0.124542236328125, 0.18267822265625, 0.240814208984375, 0.2989501953125, 0.357086181640625, 0.41522216796875, 0.473358154296875, 0.531494140625, 0.589630126953125, 0.64776611328125, 0.705902099609375, 0.7640380859375, 0.822174072265625, 0.88031005859375, 0.938446044921875, 0.99658203125, 1.054718017578125, 1.11285400390625, 1.170989990234375, 1.2291259765625, 1.287261962890625, 1.34539794921875, 1.403533935546875, 1.461669921875, 1.519805908203125, 1.57794189453125, 1.636077880859375, 1.6942138671875, 1.752349853515625, 1.81048583984375, 1.868621826171875, 1.9267578125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 4.0, 5.0, 5.0, 10.0, 6.0, 8.0, 15.0, 16.0, 18.0, 11.0, 14.0, 26.0, 19.0, 30.0, 15.0, 30.0, 37.0, 33.0, 32.0, 26.0, 39.0, 32.0, 37.0, 25.0, 1062.0, 38.0, 32.0, 27.0, 36.0, 32.0, 42.0, 30.0, 21.0, 19.0, 22.0, 22.0, 19.0, 16.0, 20.0, 11.0, 12.0, 14.0, 9.0, 9.0, 6.0, 9.0, 4.0, 7.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.0, -4.84613037109375, -4.6922607421875, -4.53839111328125, -4.384521484375, -4.23065185546875, -4.0767822265625, -3.92291259765625, -3.76904296875, -3.61517333984375, -3.4613037109375, -3.30743408203125, -3.153564453125, -2.99969482421875, -2.8458251953125, -2.69195556640625, -2.5380859375, -2.38421630859375, -2.2303466796875, -2.07647705078125, -1.922607421875, -1.76873779296875, -1.6148681640625, -1.46099853515625, -1.30712890625, -1.15325927734375, -0.9993896484375, -0.84552001953125, -0.691650390625, -0.53778076171875, -0.3839111328125, -0.23004150390625, -0.076171875, 0.07769775390625, 0.2315673828125, 0.38543701171875, 0.539306640625, 0.69317626953125, 0.8470458984375, 1.00091552734375, 1.15478515625, 1.30865478515625, 1.4625244140625, 1.61639404296875, 1.770263671875, 1.92413330078125, 2.0780029296875, 2.23187255859375, 2.3857421875, 2.53961181640625, 2.6934814453125, 2.84735107421875, 3.001220703125, 3.15509033203125, 3.3089599609375, 3.46282958984375, 3.61669921875, 3.77056884765625, 3.9244384765625, 4.07830810546875, 4.232177734375, 4.38604736328125, 4.5399169921875, 4.69378662109375, 4.84765625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 4.0, 13.0, 16.0, 25.0, 36.0, 54.0, 75.0, 107.0, 141.0, 227.0, 285.0, 418.0, 597.0, 835.0, 1195.0, 1660.0, 2429.0, 3383.0, 4860.0, 6730.0, 9605.0, 13383.0, 19134.0, 27223.0, 39941.0, 60463.0, 95345.0, 175909.0, 1292789.0, 115843.0, 71327.0, 46521.0, 31492.0, 22067.0, 15373.0, 11006.0, 7732.0, 5577.0, 3969.0, 2798.0, 1985.0, 1384.0, 939.0, 663.0, 463.0, 333.0, 240.0, 160.0, 131.0, 77.0, 62.0, 40.0, 28.0, 19.0, 11.0, 10.0, 4.0, 3.0, 2.0, 2.0], "bins": [-1.5, -1.453399658203125, -1.40679931640625, -1.360198974609375, -1.3135986328125, -1.266998291015625, -1.22039794921875, -1.173797607421875, -1.127197265625, -1.080596923828125, -1.03399658203125, -0.987396240234375, -0.9407958984375, -0.894195556640625, -0.84759521484375, -0.800994873046875, -0.75439453125, -0.707794189453125, -0.66119384765625, -0.614593505859375, -0.5679931640625, -0.521392822265625, -0.47479248046875, -0.428192138671875, -0.381591796875, -0.334991455078125, -0.28839111328125, -0.241790771484375, -0.1951904296875, -0.148590087890625, -0.10198974609375, -0.055389404296875, -0.0087890625, 0.037811279296875, 0.08441162109375, 0.131011962890625, 0.1776123046875, 0.224212646484375, 0.27081298828125, 0.317413330078125, 0.364013671875, 0.410614013671875, 0.45721435546875, 0.503814697265625, 0.5504150390625, 0.597015380859375, 0.64361572265625, 0.690216064453125, 0.73681640625, 0.783416748046875, 0.83001708984375, 0.876617431640625, 0.9232177734375, 0.969818115234375, 1.01641845703125, 1.063018798828125, 1.109619140625, 1.156219482421875, 1.20281982421875, 1.249420166015625, 1.2960205078125, 1.342620849609375, 1.38922119140625, 1.435821533203125, 1.482421875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 3.0, 7.0, 11.0, 14.0, 8.0, 16.0, 17.0, 18.0, 25.0, 38.0, 61.0, 57.0, 81.0, 132.0, 130.0, 100.0, 71.0, 48.0, 31.0, 30.0, 17.0, 16.0, 9.0, 10.0, 5.0, 4.0, 7.0, 6.0, 7.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014715194702148438, -0.0014256089925765991, -0.0013796985149383545, -0.0013337880373001099, -0.0012878775596618652, -0.0012419670820236206, -0.001196056604385376, -0.0011501461267471313, -0.0011042356491088867, -0.001058325171470642, -0.0010124146938323975, -0.0009665042161941528, -0.0009205937385559082, -0.0008746832609176636, -0.0008287727832794189, -0.0007828623056411743, -0.0007369518280029297, -0.0006910413503646851, -0.0006451308727264404, -0.0005992203950881958, -0.0005533099174499512, -0.0005073994398117065, -0.0004614889621734619, -0.0004155784845352173, -0.00036966800689697266, -0.00032375752925872803, -0.0002778470516204834, -0.00023193657398223877, -0.00018602609634399414, -0.0001401156187057495, -9.420514106750488e-05, -4.8294663429260254e-05, -2.384185791015625e-06, 4.3526291847229004e-05, 8.943676948547363e-05, 0.00013534724712371826, 0.0001812577247619629, 0.00022716820240020752, 0.00027307868003845215, 0.0003189891576766968, 0.0003648996353149414, 0.00041081011295318604, 0.00045672059059143066, 0.0005026310682296753, 0.0005485415458679199, 0.0005944520235061646, 0.0006403625011444092, 0.0006862729787826538, 0.0007321834564208984, 0.0007780939340591431, 0.0008240044116973877, 0.0008699148893356323, 0.000915825366973877, 0.0009617358446121216, 0.0010076463222503662, 0.0010535567998886108, 0.0010994672775268555, 0.0011453777551651, 0.0011912882328033447, 0.0012371987104415894, 0.001283109188079834, 0.0013290196657180786, 0.0013749301433563232, 0.0014208406209945679, 0.0014667510986328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 12.0, 4.0, 8.0, 10.0, 7.0, 16.0, 12.0, 26.0, 26.0, 48.0, 97.0, 120.0, 213.0, 393.0, 1925.0, 1038038.0, 6215.0, 614.0, 256.0, 161.0, 82.0, 61.0, 52.0, 36.0, 30.0, 18.0, 23.0, 12.0, 6.0, 8.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02838134765625, -0.027390003204345703, -0.026398658752441406, -0.02540731430053711, -0.024415969848632812, -0.023424625396728516, -0.02243328094482422, -0.021441936492919922, -0.020450592041015625, -0.019459247589111328, -0.01846790313720703, -0.017476558685302734, -0.016485214233398438, -0.01549386978149414, -0.014502525329589844, -0.013511180877685547, -0.01251983642578125, -0.011528491973876953, -0.010537147521972656, -0.00954580307006836, -0.008554458618164062, -0.007563114166259766, -0.006571769714355469, -0.005580425262451172, -0.004589080810546875, -0.003597736358642578, -0.0026063919067382812, -0.0016150474548339844, -0.0006237030029296875, 0.0003676414489746094, 0.0013589859008789062, 0.002350330352783203, 0.0033416748046875, 0.004333019256591797, 0.005324363708496094, 0.006315708160400391, 0.0073070526123046875, 0.008298397064208984, 0.009289741516113281, 0.010281085968017578, 0.011272430419921875, 0.012263774871826172, 0.013255119323730469, 0.014246463775634766, 0.015237808227539062, 0.01622915267944336, 0.017220497131347656, 0.018211841583251953, 0.01920318603515625, 0.020194530487060547, 0.021185874938964844, 0.02217721939086914, 0.023168563842773438, 0.024159908294677734, 0.02515125274658203, 0.026142597198486328, 0.027133941650390625, 0.028125286102294922, 0.02911663055419922, 0.030107975006103516, 0.031099319458007812, 0.03209066390991211, 0.033082008361816406, 0.0340733528137207, 0.035064697265625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 15.0, 63.0, 154.0, 313.0, 303.0, 101.0, 47.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001353587256744504, -0.0013065943494439125, -0.001259601442143321, -0.0012126084184274077, -0.0011656155111268163, -0.0011186226038262248, -0.0010716295801103115, -0.00102463667280972, -0.0009776437655091286, -0.0009306508582085371, -0.0008836578927002847, -0.0008366649271920323, -0.0007896720198914409, -0.0007426791125908494, -0.000695686147082597, -0.0006486931815743446, -0.0006017002742737532, -0.0005547073669731617, -0.0005077144014649093, -0.0004607214650604874, -0.00041372852865606546, -0.00036673559225164354, -0.0003197426558472216, -0.0002727497194427997, -0.00022575678303837776, -0.00017876384663395584, -0.0001317709102295339, -8.477797382511199e-05, -3.778503742069006e-05, 9.207898983731866e-06, 5.620083538815379e-05, 0.00010319377179257572, 0.00015018670819699764, 0.00019717964460141957, 0.0002441725810058415, 0.0002911655174102634, 0.00033815845381468534, 0.00038515139021910727, 0.0004321443266235292, 0.0004791372630279511, 0.000526130199432373, 0.0005731231067329645, 0.0006201160722412169, 0.0006671090377494693, 0.0007141019450500607, 0.0007610948523506522, 0.0008080878178589046, 0.000855080783367157, 0.0009020736906677485, 0.0009490665979683399, 0.0009960595052689314, 0.0010430525289848447, 0.0010900454362854362, 0.0011370383435860276, 0.001184031367301941, 0.0012310242746025324, 0.0012780171819031239, 0.0013250100892037153, 0.0013720029965043068, 0.00141899602022022, 0.0014659889275208116, 0.001512981834821403, 0.0015599748585373163, 0.0016069677658379078, 0.0016539606731384993]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 6.0, 3.0, 7.0, 6.0, 10.0, 9.0, 14.0, 11.0, 19.0, 16.0, 27.0, 27.0, 37.0, 36.0, 33.0, 49.0, 38.0, 38.0, 47.0, 36.0, 43.0, 37.0, 29.0, 38.0, 36.0, 32.0, 30.0, 35.0, 24.0, 34.0, 31.0, 27.0, 22.0, 23.0, 9.0, 21.0, 15.0, 12.0, 9.0, 2.0, 3.0, 9.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0006631612777709961, -0.0006446009501814842, -0.0006260406225919724, -0.0006074802950024605, -0.0005889199674129486, -0.0005703596398234367, -0.0005517993122339249, -0.000533238984644413, -0.0005146786570549011, -0.0004961183294653893, -0.0004775580018758774, -0.0004589976742863655, -0.00044043734669685364, -0.00042187701910734177, -0.0004033166915178299, -0.000384756363928318, -0.00036619603633880615, -0.0003476357087492943, -0.0003290753811597824, -0.00031051505357027054, -0.00029195472598075867, -0.0002733943983912468, -0.0002548340708017349, -0.00023627374321222305, -0.00021771341562271118, -0.0001991530880331993, -0.00018059276044368744, -0.00016203243285417557, -0.0001434721052646637, -0.00012491177767515182, -0.00010635145008563995, -8.779112249612808e-05, -6.923079490661621e-05, -5.067046731710434e-05, -3.211013972759247e-05, -1.3549812138080597e-05, 5.010515451431274e-06, 2.3570843040943146e-05, 4.213117063045502e-05, 6.069149821996689e-05, 7.925182580947876e-05, 9.781215339899063e-05, 0.0001163724809885025, 0.00013493280857801437, 0.00015349313616752625, 0.00017205346375703812, 0.00019061379134655, 0.00020917411893606186, 0.00022773444652557373, 0.0002462947741150856, 0.0002648551017045975, 0.00028341542929410934, 0.0003019757568836212, 0.0003205360844731331, 0.00033909641206264496, 0.00035765673965215683, 0.0003762170672416687, 0.00039477739483118057, 0.00041333772242069244, 0.0004318980500102043, 0.0004504583775997162, 0.00046901870518922806, 0.00048757903277873993, 0.0005061393603682518, 0.0005246996879577637]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 2.0, 2.0, 6.0, 8.0, 15.0, 10.0, 12.0, 9.0, 20.0, 17.0, 14.0, 16.0, 26.0, 16.0, 17.0, 28.0, 29.0, 24.0, 27.0, 38.0, 36.0, 40.0, 53.0, 38.0, 46.0, 35.0, 40.0, 29.0, 22.0, 38.0, 30.0, 31.0, 25.0, 27.0, 16.0, 24.0, 23.0, 19.0, 23.0, 13.0, 11.0, 8.0, 10.0, 8.0, 6.0, 4.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.828125, -7.5748291015625, -7.321533203125, -7.0682373046875, -6.81494140625, -6.5616455078125, -6.308349609375, -6.0550537109375, -5.8017578125, -5.5484619140625, -5.295166015625, -5.0418701171875, -4.78857421875, -4.5352783203125, -4.281982421875, -4.0286865234375, -3.775390625, -3.5220947265625, -3.268798828125, -3.0155029296875, -2.76220703125, -2.5089111328125, -2.255615234375, -2.0023193359375, -1.7490234375, -1.4957275390625, -1.242431640625, -0.9891357421875, -0.73583984375, -0.4825439453125, -0.229248046875, 0.0240478515625, 0.27734375, 0.5306396484375, 0.783935546875, 1.0372314453125, 1.29052734375, 1.5438232421875, 1.797119140625, 2.0504150390625, 2.3037109375, 2.5570068359375, 2.810302734375, 3.0635986328125, 3.31689453125, 3.5701904296875, 3.823486328125, 4.0767822265625, 4.330078125, 4.5833740234375, 4.836669921875, 5.0899658203125, 5.34326171875, 5.5965576171875, 5.849853515625, 6.1031494140625, 6.3564453125, 6.6097412109375, 6.863037109375, 7.1163330078125, 7.36962890625, 7.6229248046875, 7.876220703125, 8.1295166015625, 8.3828125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 6.0, 19.0, 10.0, 12.0, 14.0, 22.0, 28.0, 22.0, 37.0, 52.0, 53.0, 79.0, 126.0, 152.0, 238.0, 351.0, 668.0, 1781.0, 7556.0, 40229.0, 361609.0, 562373.0, 58324.0, 10252.0, 2386.0, 830.0, 375.0, 242.0, 187.0, 105.0, 85.0, 58.0, 68.0, 42.0, 32.0, 32.0, 23.0, 14.0, 10.0, 9.0, 12.0, 6.0, 5.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4921875, -14.9940185546875, -14.495849609375, -13.9976806640625, -13.49951171875, -13.0013427734375, -12.503173828125, -12.0050048828125, -11.5068359375, -11.0086669921875, -10.510498046875, -10.0123291015625, -9.51416015625, -9.0159912109375, -8.517822265625, -8.0196533203125, -7.521484375, -7.0233154296875, -6.525146484375, -6.0269775390625, -5.52880859375, -5.0306396484375, -4.532470703125, -4.0343017578125, -3.5361328125, -3.0379638671875, -2.539794921875, -2.0416259765625, -1.54345703125, -1.0452880859375, -0.547119140625, -0.0489501953125, 0.44921875, 0.9473876953125, 1.445556640625, 1.9437255859375, 2.44189453125, 2.9400634765625, 3.438232421875, 3.9364013671875, 4.4345703125, 4.9327392578125, 5.430908203125, 5.9290771484375, 6.42724609375, 6.9254150390625, 7.423583984375, 7.9217529296875, 8.419921875, 8.9180908203125, 9.416259765625, 9.9144287109375, 10.41259765625, 10.9107666015625, 11.408935546875, 11.9071044921875, 12.4052734375, 12.9034423828125, 13.401611328125, 13.8997802734375, 14.39794921875, 14.8961181640625, 15.394287109375, 15.8924560546875, 16.390625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 6.0, 7.0, 13.0, 8.0, 11.0, 9.0, 8.0, 19.0, 25.0, 32.0, 34.0, 31.0, 32.0, 46.0, 49.0, 48.0, 81.0, 174.0, 1518.0, 316.0, 123.0, 64.0, 51.0, 43.0, 37.0, 37.0, 35.0, 30.0, 24.0, 23.0, 27.0, 15.0, 13.0, 11.0, 10.0, 10.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-31.140625, -30.245849609375, -29.35107421875, -28.456298828125, -27.5615234375, -26.666748046875, -25.77197265625, -24.877197265625, -23.982421875, -23.087646484375, -22.19287109375, -21.298095703125, -20.4033203125, -19.508544921875, -18.61376953125, -17.718994140625, -16.82421875, -15.929443359375, -15.03466796875, -14.139892578125, -13.2451171875, -12.350341796875, -11.45556640625, -10.560791015625, -9.666015625, -8.771240234375, -7.87646484375, -6.981689453125, -6.0869140625, -5.192138671875, -4.29736328125, -3.402587890625, -2.5078125, -1.613037109375, -0.71826171875, 0.176513671875, 1.0712890625, 1.966064453125, 2.86083984375, 3.755615234375, 4.650390625, 5.545166015625, 6.43994140625, 7.334716796875, 8.2294921875, 9.124267578125, 10.01904296875, 10.913818359375, 11.80859375, 12.703369140625, 13.59814453125, 14.492919921875, 15.3876953125, 16.282470703125, 17.17724609375, 18.072021484375, 18.966796875, 19.861572265625, 20.75634765625, 21.651123046875, 22.5458984375, 23.440673828125, 24.33544921875, 25.230224609375, 26.125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 18.0, 17.0, 9.0, 16.0, 32.0, 39.0, 49.0, 46.0, 56.0, 106.0, 143.0, 234.0, 517.0, 1709.0, 83640.0, 3050978.0, 6315.0, 818.0, 346.0, 166.0, 124.0, 58.0, 66.0, 44.0, 43.0, 21.0, 9.0, 17.0, 12.0, 14.0, 10.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.84375, -57.56396484375, -55.2841796875, -53.00439453125, -50.724609375, -48.44482421875, -46.1650390625, -43.88525390625, -41.60546875, -39.32568359375, -37.0458984375, -34.76611328125, -32.486328125, -30.20654296875, -27.9267578125, -25.64697265625, -23.3671875, -21.08740234375, -18.8076171875, -16.52783203125, -14.248046875, -11.96826171875, -9.6884765625, -7.40869140625, -5.12890625, -2.84912109375, -0.5693359375, 1.71044921875, 3.990234375, 6.27001953125, 8.5498046875, 10.82958984375, 13.109375, 15.38916015625, 17.6689453125, 19.94873046875, 22.228515625, 24.50830078125, 26.7880859375, 29.06787109375, 31.34765625, 33.62744140625, 35.9072265625, 38.18701171875, 40.466796875, 42.74658203125, 45.0263671875, 47.30615234375, 49.5859375, 51.86572265625, 54.1455078125, 56.42529296875, 58.705078125, 60.98486328125, 63.2646484375, 65.54443359375, 67.82421875, 70.10400390625, 72.3837890625, 74.66357421875, 76.943359375, 79.22314453125, 81.5029296875, 83.78271484375, 86.0625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 20.0, 76.0, 251.0, 369.0, 221.0, 56.0, 13.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.3418197631836, -121.87569427490234, -119.4095687866211, -116.94344329833984, -114.4773178100586, -112.01119232177734, -109.5450668334961, -107.07894897460938, -104.61282348632812, -102.14669799804688, -99.68057250976562, -97.21444702148438, -94.74832153320312, -92.28219604492188, -89.81607055664062, -87.34994506835938, -84.88381958007812, -82.41769409179688, -79.95156860351562, -77.48544311523438, -75.01931762695312, -72.55319213867188, -70.08706665039062, -67.62094116210938, -65.15481567382812, -62.688690185546875, -60.222564697265625, -57.756439208984375, -55.290313720703125, -52.824188232421875, -50.35806655883789, -47.89194107055664, -45.42582321166992, -42.95969772338867, -40.49357223510742, -38.02744674682617, -35.56132507324219, -33.09519958496094, -30.629074096679688, -28.162948608398438, -25.696823120117188, -23.230697631835938, -20.764572143554688, -18.29844856262207, -15.83232307434082, -13.36619758605957, -10.900073051452637, -8.433948516845703, -5.967823028564453, -3.5016980171203613, -1.0355730056762695, 1.4305520057678223, 3.896677017211914, 6.362802505493164, 8.828927040100098, 11.295051574707031, 13.761177062988281, 16.22730255126953, 18.69342803955078, 21.1595516204834, 23.62567710876465, 26.0918025970459, 28.557926177978516, 31.024051666259766, 33.490177154541016]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 9.0, 14.0, 5.0, 15.0, 22.0, 13.0, 5.0, 25.0, 26.0, 27.0, 28.0, 29.0, 31.0, 36.0, 42.0, 31.0, 29.0, 45.0, 50.0, 41.0, 47.0, 30.0, 43.0, 51.0, 27.0, 33.0, 19.0, 24.0, 49.0, 25.0, 19.0, 17.0, 12.0, 15.0, 12.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.91841125488281, -65.606689453125, -63.294960021972656, -60.98323440551758, -58.6715087890625, -56.35978698730469, -54.04806137084961, -51.73633575439453, -49.42461013793945, -47.112884521484375, -44.8011589050293, -42.48943328857422, -40.177711486816406, -37.86598205566406, -35.55426025390625, -33.24253463745117, -30.930809020996094, -28.619083404541016, -26.307357788085938, -23.995634078979492, -21.683908462524414, -19.372182846069336, -17.06045913696289, -14.748733520507812, -12.437007904052734, -10.125282287597656, -7.8135576248168945, -5.501832485198975, -3.1901073455810547, -0.8783817291259766, 1.4333429336547852, 3.745067596435547, 6.056793212890625, 8.368518829345703, 10.680243492126465, 12.991968154907227, 15.303693771362305, 17.615419387817383, 19.927143096923828, 22.238868713378906, 24.550594329833984, 26.862319946289062, 29.17404556274414, 31.485769271850586, 33.79749298095703, 36.109222412109375, 38.42094421386719, 40.732669830322266, 43.044395446777344, 45.35612106323242, 47.6678466796875, 49.97957229614258, 52.291297912597656, 54.60301971435547, 56.91474533081055, 59.226470947265625, 61.5381965637207, 63.84992218017578, 66.1616439819336, 68.47337341308594, 70.78509521484375, 73.0968246459961, 75.4085464477539, 77.72027587890625, 80.03199768066406]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 9.0, 9.0, 10.0, 10.0, 11.0, 19.0, 13.0, 18.0, 23.0, 17.0, 21.0, 16.0, 20.0, 28.0, 21.0, 30.0, 37.0, 21.0, 38.0, 43.0, 41.0, 41.0, 32.0, 42.0, 45.0, 34.0, 41.0, 41.0, 22.0, 31.0, 26.0, 22.0, 18.0, 17.0, 23.0, 20.0, 18.0, 13.0, 12.0, 9.0, 3.0, 8.0, 6.0, 7.0, 7.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.421875, -8.156982421875, -7.89208984375, -7.627197265625, -7.3623046875, -7.097412109375, -6.83251953125, -6.567626953125, -6.302734375, -6.037841796875, -5.77294921875, -5.508056640625, -5.2431640625, -4.978271484375, -4.71337890625, -4.448486328125, -4.18359375, -3.918701171875, -3.65380859375, -3.388916015625, -3.1240234375, -2.859130859375, -2.59423828125, -2.329345703125, -2.064453125, -1.799560546875, -1.53466796875, -1.269775390625, -1.0048828125, -0.739990234375, -0.47509765625, -0.210205078125, 0.0546875, 0.319580078125, 0.58447265625, 0.849365234375, 1.1142578125, 1.379150390625, 1.64404296875, 1.908935546875, 2.173828125, 2.438720703125, 2.70361328125, 2.968505859375, 3.2333984375, 3.498291015625, 3.76318359375, 4.028076171875, 4.29296875, 4.557861328125, 4.82275390625, 5.087646484375, 5.3525390625, 5.617431640625, 5.88232421875, 6.147216796875, 6.412109375, 6.677001953125, 6.94189453125, 7.206787109375, 7.4716796875, 7.736572265625, 8.00146484375, 8.266357421875, 8.53125]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 9.0, 11.0, 12.0, 7.0, 14.0, 23.0, 12.0, 19.0, 21.0, 26.0, 30.0, 41.0, 49.0, 97.0, 147.0, 286.0, 581.0, 1430.0, 5199.0, 35245.0, 711466.0, 2959246.0, 449535.0, 24362.0, 3940.0, 1211.0, 520.0, 235.0, 133.0, 74.0, 69.0, 36.0, 28.0, 25.0, 27.0, 18.0, 14.0, 11.0, 11.0, 14.0, 9.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-22.78125, -22.07861328125, -21.3759765625, -20.67333984375, -19.970703125, -19.26806640625, -18.5654296875, -17.86279296875, -17.16015625, -16.45751953125, -15.7548828125, -15.05224609375, -14.349609375, -13.64697265625, -12.9443359375, -12.24169921875, -11.5390625, -10.83642578125, -10.1337890625, -9.43115234375, -8.728515625, -8.02587890625, -7.3232421875, -6.62060546875, -5.91796875, -5.21533203125, -4.5126953125, -3.81005859375, -3.107421875, -2.40478515625, -1.7021484375, -0.99951171875, -0.296875, 0.40576171875, 1.1083984375, 1.81103515625, 2.513671875, 3.21630859375, 3.9189453125, 4.62158203125, 5.32421875, 6.02685546875, 6.7294921875, 7.43212890625, 8.134765625, 8.83740234375, 9.5400390625, 10.24267578125, 10.9453125, 11.64794921875, 12.3505859375, 13.05322265625, 13.755859375, 14.45849609375, 15.1611328125, 15.86376953125, 16.56640625, 17.26904296875, 17.9716796875, 18.67431640625, 19.376953125, 20.07958984375, 20.7822265625, 21.48486328125, 22.1875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 12.0, 11.0, 9.0, 15.0, 15.0, 19.0, 31.0, 30.0, 59.0, 68.0, 76.0, 102.0, 130.0, 184.0, 250.0, 314.0, 356.0, 445.0, 403.0, 392.0, 295.0, 203.0, 164.0, 129.0, 88.0, 59.0, 49.0, 44.0, 25.0, 20.0, 17.0, 15.0, 10.0, 4.0, 12.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-14.6796875, -14.232177734375, -13.78466796875, -13.337158203125, -12.8896484375, -12.442138671875, -11.99462890625, -11.547119140625, -11.099609375, -10.652099609375, -10.20458984375, -9.757080078125, -9.3095703125, -8.862060546875, -8.41455078125, -7.967041015625, -7.51953125, -7.072021484375, -6.62451171875, -6.177001953125, -5.7294921875, -5.281982421875, -4.83447265625, -4.386962890625, -3.939453125, -3.491943359375, -3.04443359375, -2.596923828125, -2.1494140625, -1.701904296875, -1.25439453125, -0.806884765625, -0.359375, 0.088134765625, 0.53564453125, 0.983154296875, 1.4306640625, 1.878173828125, 2.32568359375, 2.773193359375, 3.220703125, 3.668212890625, 4.11572265625, 4.563232421875, 5.0107421875, 5.458251953125, 5.90576171875, 6.353271484375, 6.80078125, 7.248291015625, 7.69580078125, 8.143310546875, 8.5908203125, 9.038330078125, 9.48583984375, 9.933349609375, 10.380859375, 10.828369140625, 11.27587890625, 11.723388671875, 12.1708984375, 12.618408203125, 13.06591796875, 13.513427734375, 13.9609375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 4.0, 7.0, 1.0, 9.0, 4.0, 15.0, 22.0, 19.0, 42.0, 49.0, 44.0, 73.0, 80.0, 82.0, 148.0, 199.0, 282.0, 550.0, 1788.0, 14408.0, 1586521.0, 2567281.0, 18768.0, 2042.0, 617.0, 344.0, 212.0, 165.0, 116.0, 84.0, 74.0, 53.0, 37.0, 37.0, 22.0, 23.0, 13.0, 19.0, 7.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-66.3125, -64.47265625, -62.6328125, -60.79296875, -58.953125, -57.11328125, -55.2734375, -53.43359375, -51.59375, -49.75390625, -47.9140625, -46.07421875, -44.234375, -42.39453125, -40.5546875, -38.71484375, -36.875, -35.03515625, -33.1953125, -31.35546875, -29.515625, -27.67578125, -25.8359375, -23.99609375, -22.15625, -20.31640625, -18.4765625, -16.63671875, -14.796875, -12.95703125, -11.1171875, -9.27734375, -7.4375, -5.59765625, -3.7578125, -1.91796875, -0.078125, 1.76171875, 3.6015625, 5.44140625, 7.28125, 9.12109375, 10.9609375, 12.80078125, 14.640625, 16.48046875, 18.3203125, 20.16015625, 22.0, 23.83984375, 25.6796875, 27.51953125, 29.359375, 31.19921875, 33.0390625, 34.87890625, 36.71875, 38.55859375, 40.3984375, 42.23828125, 44.078125, 45.91796875, 47.7578125, 49.59765625, 51.4375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 79.0, 510.0, 380.0, 41.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-502.33819580078125, -492.4671936035156, -482.59619140625, -472.7251892089844, -462.85418701171875, -452.9831848144531, -443.1121826171875, -433.2411804199219, -423.37017822265625, -413.4991760253906, -403.628173828125, -393.7571716308594, -383.88616943359375, -374.0151672363281, -364.1441650390625, -354.2731628417969, -344.40216064453125, -334.5311584472656, -324.66015625, -314.7891540527344, -304.91815185546875, -295.0471496582031, -285.1761474609375, -275.3051452636719, -265.43414306640625, -255.56314086914062, -245.692138671875, -235.82113647460938, -225.95013427734375, -216.07913208007812, -206.2081298828125, -196.33712768554688, -186.46612548828125, -176.59512329101562, -166.72412109375, -156.85311889648438, -146.98211669921875, -137.11111450195312, -127.2401123046875, -117.36911010742188, -107.49810791015625, -97.62710571289062, -87.756103515625, -77.88510131835938, -68.01409912109375, -58.143096923828125, -48.2720947265625, -38.401092529296875, -28.53009033203125, -18.659088134765625, -8.7880859375, 1.082916259765625, 10.95391845703125, 20.824920654296875, 30.6959228515625, 40.566925048828125, 50.43792724609375, 60.308929443359375, 70.179931640625, 80.05093383789062, 89.92193603515625, 99.79293823242188, 109.6639404296875, 119.53494262695312, 129.40594482421875]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 5.0, 5.0, 3.0, 7.0, 6.0, 9.0, 10.0, 11.0, 15.0, 12.0, 12.0, 16.0, 24.0, 19.0, 24.0, 33.0, 26.0, 28.0, 34.0, 43.0, 38.0, 45.0, 48.0, 49.0, 49.0, 38.0, 30.0, 40.0, 38.0, 30.0, 36.0, 32.0, 31.0, 21.0, 21.0, 16.0, 16.0, 17.0, 17.0, 8.0, 12.0, 3.0, 8.0, 5.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.00148010253906, -53.39352798461914, -51.78557586669922, -50.1776237487793, -48.569671630859375, -46.96172332763672, -45.3537712097168, -43.745819091796875, -42.13786697387695, -40.52991485595703, -38.92196273803711, -37.31401062011719, -35.70606231689453, -34.098106384277344, -32.49015808105469, -30.882205963134766, -29.274253845214844, -27.666301727294922, -26.058349609375, -24.45039939880371, -22.84244728088379, -21.234495162963867, -19.626544952392578, -18.018592834472656, -16.410640716552734, -14.802688598632812, -13.194737434387207, -11.586786270141602, -9.97883415222168, -8.370882034301758, -6.762930870056152, -5.154979705810547, -3.5470237731933594, -1.9390721321105957, -0.33112049102783203, 1.2768311500549316, 2.8847827911376953, 4.492734909057617, 6.100686073303223, 7.708637237548828, 9.31658935546875, 10.924541473388672, 12.532492637634277, 14.140443801879883, 15.748395919799805, 17.356348037719727, 18.964298248291016, 20.572250366210938, 22.18020248413086, 23.78815460205078, 25.396106719970703, 27.004056930541992, 28.612009048461914, 30.219961166381836, 31.827911376953125, 33.43586349487305, 35.04381561279297, 36.65176773071289, 38.25971984863281, 39.867671966552734, 41.475624084472656, 43.08357238769531, 44.691524505615234, 46.299476623535156, 47.90742874145508]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 10.0, 11.0, 8.0, 13.0, 19.0, 17.0, 22.0, 15.0, 21.0, 38.0, 32.0, 37.0, 34.0, 35.0, 37.0, 38.0, 32.0, 58.0, 34.0, 47.0, 43.0, 42.0, 42.0, 33.0, 36.0, 29.0, 27.0, 23.0, 34.0, 15.0, 24.0, 14.0, 13.0, 4.0, 10.0, 9.0, 4.0, 4.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.080810546875, -8.77880859375, -8.476806640625, -8.1748046875, -7.872802734375, -7.57080078125, -7.268798828125, -6.966796875, -6.664794921875, -6.36279296875, -6.060791015625, -5.7587890625, -5.456787109375, -5.15478515625, -4.852783203125, -4.55078125, -4.248779296875, -3.94677734375, -3.644775390625, -3.3427734375, -3.040771484375, -2.73876953125, -2.436767578125, -2.134765625, -1.832763671875, -1.53076171875, -1.228759765625, -0.9267578125, -0.624755859375, -0.32275390625, -0.020751953125, 0.28125, 0.583251953125, 0.88525390625, 1.187255859375, 1.4892578125, 1.791259765625, 2.09326171875, 2.395263671875, 2.697265625, 2.999267578125, 3.30126953125, 3.603271484375, 3.9052734375, 4.207275390625, 4.50927734375, 4.811279296875, 5.11328125, 5.415283203125, 5.71728515625, 6.019287109375, 6.3212890625, 6.623291015625, 6.92529296875, 7.227294921875, 7.529296875, 7.831298828125, 8.13330078125, 8.435302734375, 8.7373046875, 9.039306640625, 9.34130859375, 9.643310546875, 9.9453125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 14.0, 17.0, 26.0, 39.0, 76.0, 118.0, 184.0, 249.0, 361.0, 549.0, 762.0, 1108.0, 1629.0, 2544.0, 3667.0, 5627.0, 8476.0, 13009.0, 20646.0, 33054.0, 55793.0, 101802.0, 256406.0, 282416.0, 106631.0, 57767.0, 34685.0, 21112.0, 13513.0, 8688.0, 5848.0, 3728.0, 2586.0, 1736.0, 1181.0, 842.0, 547.0, 368.0, 262.0, 153.0, 118.0, 68.0, 58.0, 34.0, 21.0, 12.0, 12.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.06787109375, -1.9990234375, -1.93017578125, -1.861328125, -1.79248046875, -1.7236328125, -1.65478515625, -1.5859375, -1.51708984375, -1.4482421875, -1.37939453125, -1.310546875, -1.24169921875, -1.1728515625, -1.10400390625, -1.03515625, -0.96630859375, -0.8974609375, -0.82861328125, -0.759765625, -0.69091796875, -0.6220703125, -0.55322265625, -0.484375, -0.41552734375, -0.3466796875, -0.27783203125, -0.208984375, -0.14013671875, -0.0712890625, -0.00244140625, 0.06640625, 0.13525390625, 0.2041015625, 0.27294921875, 0.341796875, 0.41064453125, 0.4794921875, 0.54833984375, 0.6171875, 0.68603515625, 0.7548828125, 0.82373046875, 0.892578125, 0.96142578125, 1.0302734375, 1.09912109375, 1.16796875, 1.23681640625, 1.3056640625, 1.37451171875, 1.443359375, 1.51220703125, 1.5810546875, 1.64990234375, 1.71875, 1.78759765625, 1.8564453125, 1.92529296875, 1.994140625, 2.06298828125, 2.1318359375, 2.20068359375, 2.26953125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 6.0, 10.0, 18.0, 16.0, 20.0, 14.0, 18.0, 24.0, 17.0, 25.0, 33.0, 28.0, 38.0, 37.0, 42.0, 39.0, 60.0, 1071.0, 48.0, 39.0, 39.0, 41.0, 40.0, 31.0, 32.0, 31.0, 26.0, 24.0, 32.0, 21.0, 20.0, 12.0, 21.0, 4.0, 8.0, 9.0, 11.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.7047119140625, -5.507080078125, -5.3094482421875, -5.11181640625, -4.9141845703125, -4.716552734375, -4.5189208984375, -4.3212890625, -4.1236572265625, -3.926025390625, -3.7283935546875, -3.53076171875, -3.3331298828125, -3.135498046875, -2.9378662109375, -2.740234375, -2.5426025390625, -2.344970703125, -2.1473388671875, -1.94970703125, -1.7520751953125, -1.554443359375, -1.3568115234375, -1.1591796875, -0.9615478515625, -0.763916015625, -0.5662841796875, -0.36865234375, -0.1710205078125, 0.026611328125, 0.2242431640625, 0.421875, 0.6195068359375, 0.817138671875, 1.0147705078125, 1.21240234375, 1.4100341796875, 1.607666015625, 1.8052978515625, 2.0029296875, 2.2005615234375, 2.398193359375, 2.5958251953125, 2.79345703125, 2.9910888671875, 3.188720703125, 3.3863525390625, 3.583984375, 3.7816162109375, 3.979248046875, 4.1768798828125, 4.37451171875, 4.5721435546875, 4.769775390625, 4.9674072265625, 5.1650390625, 5.3626708984375, 5.560302734375, 5.7579345703125, 5.95556640625, 6.1531982421875, 6.350830078125, 6.5484619140625, 6.74609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 9.0, 18.0, 24.0, 27.0, 49.0, 68.0, 110.0, 194.0, 268.0, 430.0, 675.0, 1051.0, 1677.0, 2539.0, 3939.0, 6544.0, 10029.0, 15477.0, 23908.0, 37736.0, 61134.0, 107843.0, 1313805.0, 244885.0, 103843.0, 59124.0, 36466.0, 23312.0, 15030.0, 9625.0, 6103.0, 4044.0, 2520.0, 1613.0, 1015.0, 661.0, 458.0, 285.0, 209.0, 129.0, 92.0, 56.0, 34.0, 24.0, 18.0, 9.0, 6.0, 8.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.009765625, -1.9468994140625, -1.884033203125, -1.8211669921875, -1.75830078125, -1.6954345703125, -1.632568359375, -1.5697021484375, -1.5068359375, -1.4439697265625, -1.381103515625, -1.3182373046875, -1.25537109375, -1.1925048828125, -1.129638671875, -1.0667724609375, -1.00390625, -0.9410400390625, -0.878173828125, -0.8153076171875, -0.75244140625, -0.6895751953125, -0.626708984375, -0.5638427734375, -0.5009765625, -0.4381103515625, -0.375244140625, -0.3123779296875, -0.24951171875, -0.1866455078125, -0.123779296875, -0.0609130859375, 0.001953125, 0.0648193359375, 0.127685546875, 0.1905517578125, 0.25341796875, 0.3162841796875, 0.379150390625, 0.4420166015625, 0.5048828125, 0.5677490234375, 0.630615234375, 0.6934814453125, 0.75634765625, 0.8192138671875, 0.882080078125, 0.9449462890625, 1.0078125, 1.0706787109375, 1.133544921875, 1.1964111328125, 1.25927734375, 1.3221435546875, 1.385009765625, 1.4478759765625, 1.5107421875, 1.5736083984375, 1.636474609375, 1.6993408203125, 1.76220703125, 1.8250732421875, 1.887939453125, 1.9508056640625, 2.013671875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 3.0, 7.0, 6.0, 2.0, 5.0, 9.0, 7.0, 14.0, 13.0, 16.0, 18.0, 29.0, 28.0, 35.0, 44.0, 47.0, 66.0, 59.0, 64.0, 67.0, 65.0, 65.0, 63.0, 47.0, 32.0, 38.0, 27.0, 24.0, 24.0, 13.0, 8.0, 8.0, 5.0, 11.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006737709045410156, -0.0006507411599159241, -0.0006277114152908325, -0.000604681670665741, -0.0005816519260406494, -0.0005586221814155579, -0.0005355924367904663, -0.0005125626921653748, -0.0004895329475402832, -0.00046650320291519165, -0.0004434734582901001, -0.00042044371366500854, -0.000397413969039917, -0.00037438422441482544, -0.0003513544797897339, -0.00032832473516464233, -0.0003052949905395508, -0.00028226524591445923, -0.0002592355012893677, -0.00023620575666427612, -0.00021317601203918457, -0.00019014626741409302, -0.00016711652278900146, -0.0001440867781639099, -0.00012105703353881836, -9.80272889137268e-05, -7.499754428863525e-05, -5.19677996635437e-05, -2.893805503845215e-05, -5.908310413360596e-06, 1.7121434211730957e-05, 4.015117883682251e-05, 6.318092346191406e-05, 8.621066808700562e-05, 0.00010924041271209717, 0.00013227015733718872, 0.00015529990196228027, 0.00017832964658737183, 0.00020135939121246338, 0.00022438913583755493, 0.0002474188804626465, 0.00027044862508773804, 0.0002934783697128296, 0.00031650811433792114, 0.0003395378589630127, 0.00036256760358810425, 0.0003855973482131958, 0.00040862709283828735, 0.0004316568374633789, 0.00045468658208847046, 0.000477716326713562, 0.0005007460713386536, 0.0005237758159637451, 0.0005468055605888367, 0.0005698353052139282, 0.0005928650498390198, 0.0006158947944641113, 0.0006389245390892029, 0.0006619542837142944, 0.000684984028339386, 0.0007080137729644775, 0.0007310435175895691, 0.0007540732622146606, 0.0007771030068397522, 0.0008001327514648438]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 7.0, 3.0, 9.0, 6.0, 9.0, 13.0, 18.0, 15.0, 19.0, 26.0, 28.0, 28.0, 44.0, 56.0, 106.0, 149.0, 203.0, 333.0, 703.0, 5990.0, 939587.0, 98269.0, 1612.0, 462.0, 272.0, 165.0, 91.0, 72.0, 50.0, 48.0, 34.0, 21.0, 25.0, 18.0, 10.0, 8.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016448974609375, -0.01596200466156006, -0.015475034713745117, -0.014988064765930176, -0.014501094818115234, -0.014014124870300293, -0.013527154922485352, -0.01304018497467041, -0.012553215026855469, -0.012066245079040527, -0.011579275131225586, -0.011092305183410645, -0.010605335235595703, -0.010118365287780762, -0.00963139533996582, -0.009144425392150879, -0.008657455444335938, -0.008170485496520996, -0.007683515548706055, -0.007196545600891113, -0.006709575653076172, -0.0062226057052612305, -0.005735635757446289, -0.005248665809631348, -0.004761695861816406, -0.004274725914001465, -0.0037877559661865234, -0.003300786018371582, -0.0028138160705566406, -0.0023268461227416992, -0.0018398761749267578, -0.0013529062271118164, -0.000865936279296875, -0.0003789663314819336, 0.00010800361633300781, 0.0005949735641479492, 0.0010819435119628906, 0.001568913459777832, 0.0020558834075927734, 0.002542853355407715, 0.0030298233032226562, 0.0035167932510375977, 0.004003763198852539, 0.0044907331466674805, 0.004977703094482422, 0.005464673042297363, 0.005951642990112305, 0.006438612937927246, 0.0069255828857421875, 0.007412552833557129, 0.00789952278137207, 0.008386492729187012, 0.008873462677001953, 0.009360432624816895, 0.009847402572631836, 0.010334372520446777, 0.010821342468261719, 0.01130831241607666, 0.011795282363891602, 0.012282252311706543, 0.012769222259521484, 0.013256192207336426, 0.013743162155151367, 0.014230132102966309, 0.01471710205078125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 21.0, 305.0, 594.0, 93.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004507641773670912, -0.0043927766382694244, -0.00427791103720665, -0.004163045901805162, -0.004048180300742388, -0.0039333151653409, -0.0038184497971087694, -0.0037035844288766384, -0.003588719293475151, -0.00347385392524302, -0.003358988557010889, -0.0032441234216094017, -0.0031292580533772707, -0.0030143926851451397, -0.0028995273169130087, -0.0027846619486808777, -0.0026697965804487467, -0.0025549312122166157, -0.0024400658439844847, -0.0023252004757523537, -0.0022103353403508663, -0.0020954699721187353, -0.0019806046038866043, -0.0018657392356544733, -0.0017508739838376641, -0.0016360086156055331, -0.001521143363788724, -0.001406277995556593, -0.001291412627324462, -0.0011765473755076528, -0.0010616820072755218, -0.0009468166972510517, -0.0008319511543959379, -0.0007170858443714678, -0.0006022205343469977, -0.00048735516611486673, -0.00037248985609039664, -0.00025762454606592655, -0.00014275917783379555, -2.7893867809325457e-05, 8.697144221514463e-05, 0.00020183676679152995, 0.00031670209136791527, 0.0004315674304962158, 0.0005464327405206859, 0.000661298050545156, 0.000776163418777287, 0.0008910287288017571, 0.0010058940388262272, 0.0011207594070583582, 0.0012356246588751674, 0.0013504900271072984, 0.0014653552789241076, 0.0015802206471562386, 0.0016950860153883696, 0.0018099513836205006, 0.0019248166354373097, 0.002039681887254119, 0.00215454725548625, 0.002269412623718381, 0.002384277991950512, 0.0024991431273519993, 0.002614008728414774, 0.0027288738638162613, 0.0028437392320483923]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 5.0, 8.0, 5.0, 15.0, 15.0, 15.0, 21.0, 13.0, 23.0, 25.0, 20.0, 24.0, 25.0, 36.0, 34.0, 35.0, 34.0, 32.0, 38.0, 51.0, 49.0, 46.0, 29.0, 44.0, 47.0, 37.0, 37.0, 29.0, 36.0, 24.0, 17.0, 20.0, 18.0, 14.0, 10.0, 10.0, 8.0, 10.0, 3.0, 6.0, 12.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0003712773323059082, -0.0003598826006054878, -0.00034848786890506744, -0.00033709313720464706, -0.0003256984055042267, -0.0003143036738038063, -0.0003029089421033859, -0.00029151421040296555, -0.00028011947870254517, -0.0002687247470021248, -0.0002573300153017044, -0.000245935283601284, -0.00023454055190086365, -0.00022314582020044327, -0.0002117510885000229, -0.0002003563567996025, -0.00018896162509918213, -0.00017756689339876175, -0.00016617216169834137, -0.000154777429997921, -0.0001433826982975006, -0.00013198796659708023, -0.00012059323489665985, -0.00010919850319623947, -9.780377149581909e-05, -8.640903979539871e-05, -7.501430809497833e-05, -6.361957639455795e-05, -5.222484469413757e-05, -4.0830112993717194e-05, -2.9435381293296814e-05, -1.8040649592876434e-05, -6.645917892456055e-06, 4.748813807964325e-06, 1.6143545508384705e-05, 2.7538277208805084e-05, 3.8933008909225464e-05, 5.0327740609645844e-05, 6.172247231006622e-05, 7.31172040104866e-05, 8.451193571090698e-05, 9.590666741132736e-05, 0.00010730139911174774, 0.00011869613081216812, 0.0001300908625125885, 0.00014148559421300888, 0.00015288032591342926, 0.00016427505761384964, 0.00017566978931427002, 0.0001870645210146904, 0.00019845925271511078, 0.00020985398441553116, 0.00022124871611595154, 0.00023264344781637192, 0.0002440381795167923, 0.0002554329112172127, 0.00026682764291763306, 0.00027822237461805344, 0.0002896171063184738, 0.0003010118380188942, 0.0003124065697193146, 0.00032380130141973495, 0.00033519603312015533, 0.0003465907648205757, 0.0003579854965209961]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 10.0, 11.0, 8.0, 13.0, 19.0, 17.0, 22.0, 15.0, 21.0, 38.0, 32.0, 37.0, 34.0, 35.0, 37.0, 38.0, 32.0, 58.0, 34.0, 47.0, 43.0, 42.0, 42.0, 33.0, 36.0, 29.0, 27.0, 23.0, 34.0, 15.0, 24.0, 14.0, 13.0, 4.0, 10.0, 9.0, 4.0, 4.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.080810546875, -8.77880859375, -8.476806640625, -8.1748046875, -7.872802734375, -7.57080078125, -7.268798828125, -6.966796875, -6.664794921875, -6.36279296875, -6.060791015625, -5.7587890625, -5.456787109375, -5.15478515625, -4.852783203125, -4.55078125, -4.248779296875, -3.94677734375, -3.644775390625, -3.3427734375, -3.040771484375, -2.73876953125, -2.436767578125, -2.134765625, -1.832763671875, -1.53076171875, -1.228759765625, -0.9267578125, -0.624755859375, -0.32275390625, -0.020751953125, 0.28125, 0.583251953125, 0.88525390625, 1.187255859375, 1.4892578125, 1.791259765625, 2.09326171875, 2.395263671875, 2.697265625, 2.999267578125, 3.30126953125, 3.603271484375, 3.9052734375, 4.207275390625, 4.50927734375, 4.811279296875, 5.11328125, 5.415283203125, 5.71728515625, 6.019287109375, 6.3212890625, 6.623291015625, 6.92529296875, 7.227294921875, 7.529296875, 7.831298828125, 8.13330078125, 8.435302734375, 8.7373046875, 9.039306640625, 9.34130859375, 9.643310546875, 9.9453125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 9.0, 4.0, 13.0, 21.0, 24.0, 24.0, 29.0, 53.0, 61.0, 82.0, 94.0, 121.0, 199.0, 251.0, 337.0, 477.0, 709.0, 1394.0, 4516.0, 22452.0, 337271.0, 640236.0, 30165.0, 5680.0, 1634.0, 776.0, 500.0, 353.0, 256.0, 200.0, 148.0, 125.0, 80.0, 69.0, 40.0, 26.0, 21.0, 21.0, 15.0, 13.0, 9.0, 13.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -22.970703125, -22.20703125, -21.443359375, -20.6796875, -19.916015625, -19.15234375, -18.388671875, -17.625, -16.861328125, -16.09765625, -15.333984375, -14.5703125, -13.806640625, -13.04296875, -12.279296875, -11.515625, -10.751953125, -9.98828125, -9.224609375, -8.4609375, -7.697265625, -6.93359375, -6.169921875, -5.40625, -4.642578125, -3.87890625, -3.115234375, -2.3515625, -1.587890625, -0.82421875, -0.060546875, 0.703125, 1.466796875, 2.23046875, 2.994140625, 3.7578125, 4.521484375, 5.28515625, 6.048828125, 6.8125, 7.576171875, 8.33984375, 9.103515625, 9.8671875, 10.630859375, 11.39453125, 12.158203125, 12.921875, 13.685546875, 14.44921875, 15.212890625, 15.9765625, 16.740234375, 17.50390625, 18.267578125, 19.03125, 19.794921875, 20.55859375, 21.322265625, 22.0859375, 22.849609375, 23.61328125, 24.376953125, 25.140625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 6.0, 16.0, 14.0, 17.0, 16.0, 21.0, 18.0, 26.0, 36.0, 26.0, 31.0, 40.0, 50.0, 51.0, 61.0, 110.0, 1512.0, 438.0, 93.0, 64.0, 51.0, 40.0, 43.0, 33.0, 32.0, 34.0, 23.0, 17.0, 24.0, 11.0, 11.0, 15.0, 7.0, 12.0, 8.0, 2.0, 8.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.65625, -26.79150390625, -25.9267578125, -25.06201171875, -24.197265625, -23.33251953125, -22.4677734375, -21.60302734375, -20.73828125, -19.87353515625, -19.0087890625, -18.14404296875, -17.279296875, -16.41455078125, -15.5498046875, -14.68505859375, -13.8203125, -12.95556640625, -12.0908203125, -11.22607421875, -10.361328125, -9.49658203125, -8.6318359375, -7.76708984375, -6.90234375, -6.03759765625, -5.1728515625, -4.30810546875, -3.443359375, -2.57861328125, -1.7138671875, -0.84912109375, 0.015625, 0.88037109375, 1.7451171875, 2.60986328125, 3.474609375, 4.33935546875, 5.2041015625, 6.06884765625, 6.93359375, 7.79833984375, 8.6630859375, 9.52783203125, 10.392578125, 11.25732421875, 12.1220703125, 12.98681640625, 13.8515625, 14.71630859375, 15.5810546875, 16.44580078125, 17.310546875, 18.17529296875, 19.0400390625, 19.90478515625, 20.76953125, 21.63427734375, 22.4990234375, 23.36376953125, 24.228515625, 25.09326171875, 25.9580078125, 26.82275390625, 27.6875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 11.0, 11.0, 10.0, 19.0, 17.0, 8.0, 25.0, 22.0, 37.0, 41.0, 55.0, 49.0, 97.0, 144.0, 248.0, 545.0, 3484.0, 2938148.0, 199716.0, 1832.0, 406.0, 232.0, 143.0, 86.0, 42.0, 43.0, 45.0, 26.0, 22.0, 22.0, 22.0, 17.0, 12.0, 17.0, 9.0, 4.0, 7.0, 5.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-77.9375, -75.4931640625, -73.048828125, -70.6044921875, -68.16015625, -65.7158203125, -63.271484375, -60.8271484375, -58.3828125, -55.9384765625, -53.494140625, -51.0498046875, -48.60546875, -46.1611328125, -43.716796875, -41.2724609375, -38.828125, -36.3837890625, -33.939453125, -31.4951171875, -29.05078125, -26.6064453125, -24.162109375, -21.7177734375, -19.2734375, -16.8291015625, -14.384765625, -11.9404296875, -9.49609375, -7.0517578125, -4.607421875, -2.1630859375, 0.28125, 2.7255859375, 5.169921875, 7.6142578125, 10.05859375, 12.5029296875, 14.947265625, 17.3916015625, 19.8359375, 22.2802734375, 24.724609375, 27.1689453125, 29.61328125, 32.0576171875, 34.501953125, 36.9462890625, 39.390625, 41.8349609375, 44.279296875, 46.7236328125, 49.16796875, 51.6123046875, 54.056640625, 56.5009765625, 58.9453125, 61.3896484375, 63.833984375, 66.2783203125, 68.72265625, 71.1669921875, 73.611328125, 76.0556640625, 78.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 18.0, 151.0, 500.0, 308.0, 38.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.86561584472656, -157.7531280517578, -154.64065551757812, -151.52816772460938, -148.41567993164062, -145.30320739746094, -142.1907196044922, -139.07823181152344, -135.96575927734375, -132.853271484375, -129.7407989501953, -126.62831115722656, -123.51583099365234, -120.4033432006836, -117.29086303710938, -114.17837524414062, -111.06588745117188, -107.95340728759766, -104.8409194946289, -101.72843933105469, -98.61595916748047, -95.50347137451172, -92.3909912109375, -89.27850341796875, -86.16603088378906, -83.05355072021484, -79.9410629272461, -76.82858276367188, -73.71610260009766, -70.6036148071289, -67.49113464355469, -64.37864685058594, -61.266170501708984, -58.1536865234375, -55.04120635986328, -51.9287223815918, -48.81623840332031, -45.703758239746094, -42.59127426147461, -39.478790283203125, -36.366310119628906, -33.25382614135742, -30.14134407043457, -27.02886199951172, -23.916378021240234, -20.803895950317383, -17.69141387939453, -14.578929901123047, -11.466445922851562, -8.353962898254395, -5.241480350494385, -2.128997802734375, 0.983485221862793, 4.095968246459961, 7.2084503173828125, 10.320934295654297, 13.433416366577148, 16.5458984375, 19.658382415771484, 22.770864486694336, 25.883346557617188, 28.995830535888672, 32.108314514160156, 35.220794677734375, 38.33327865600586]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 9.0, 7.0, 4.0, 10.0, 4.0, 10.0, 10.0, 15.0, 16.0, 11.0, 26.0, 26.0, 28.0, 19.0, 38.0, 30.0, 25.0, 32.0, 31.0, 32.0, 35.0, 38.0, 34.0, 39.0, 46.0, 48.0, 40.0, 28.0, 30.0, 35.0, 24.0, 30.0, 32.0, 14.0, 15.0, 19.0, 18.0, 19.0, 14.0, 12.0, 7.0, 6.0, 8.0, 4.0, 2.0, 4.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.436851501464844, -57.34617614746094, -55.25550079345703, -53.16482925415039, -51.074153900146484, -48.98347854614258, -46.89280700683594, -44.80213165283203, -42.711456298828125, -40.62078094482422, -38.53010559082031, -36.43943405151367, -34.348758697509766, -32.25808334350586, -30.167409896850586, -28.076736450195312, -25.986061096191406, -23.8953857421875, -21.804712295532227, -19.714038848876953, -17.623363494873047, -15.532689094543457, -13.442014694213867, -11.351340293884277, -9.260665893554688, -7.169991493225098, -5.079317092895508, -2.988642692565918, -0.8979682922363281, 1.1927061080932617, 3.2833805084228516, 5.374054908752441, 7.4647369384765625, 9.555411338806152, 11.646085739135742, 13.736760139465332, 15.827434539794922, 17.918109893798828, 20.0087833404541, 22.099456787109375, 24.19013214111328, 26.280807495117188, 28.37148094177246, 30.462154388427734, 32.55282974243164, 34.64350509643555, 36.73417663574219, 38.824851989746094, 40.91552734375, 43.006202697753906, 45.09687805175781, 47.18754959106445, 49.27822494506836, 51.368900299072266, 53.459571838378906, 55.55024719238281, 57.64092254638672, 59.731597900390625, 61.82227325439453, 63.91294479370117, 66.00361633300781, 68.09429168701172, 70.18496704101562, 72.27564239501953, 74.36631774902344]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 3.0, 9.0, 5.0, 8.0, 14.0, 17.0, 16.0, 22.0, 24.0, 25.0, 31.0, 30.0, 32.0, 35.0, 33.0, 40.0, 45.0, 49.0, 42.0, 58.0, 49.0, 48.0, 42.0, 38.0, 31.0, 37.0, 30.0, 29.0, 22.0, 25.0, 18.0, 23.0, 13.0, 10.0, 12.0, 7.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.3758544921875, -10.040771484375, -9.7056884765625, -9.37060546875, -9.0355224609375, -8.700439453125, -8.3653564453125, -8.0302734375, -7.6951904296875, -7.360107421875, -7.0250244140625, -6.68994140625, -6.3548583984375, -6.019775390625, -5.6846923828125, -5.349609375, -5.0145263671875, -4.679443359375, -4.3443603515625, -4.00927734375, -3.6741943359375, -3.339111328125, -3.0040283203125, -2.6689453125, -2.3338623046875, -1.998779296875, -1.6636962890625, -1.32861328125, -0.9935302734375, -0.658447265625, -0.3233642578125, 0.01171875, 0.3468017578125, 0.681884765625, 1.0169677734375, 1.35205078125, 1.6871337890625, 2.022216796875, 2.3572998046875, 2.6923828125, 3.0274658203125, 3.362548828125, 3.6976318359375, 4.03271484375, 4.3677978515625, 4.702880859375, 5.0379638671875, 5.373046875, 5.7081298828125, 6.043212890625, 6.3782958984375, 6.71337890625, 7.0484619140625, 7.383544921875, 7.7186279296875, 8.0537109375, 8.3887939453125, 8.723876953125, 9.0589599609375, 9.39404296875, 9.7291259765625, 10.064208984375, 10.3992919921875, 10.734375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 10.0, 8.0, 9.0, 12.0, 18.0, 26.0, 37.0, 37.0, 36.0, 63.0, 67.0, 95.0, 122.0, 142.0, 261.0, 324.0, 695.0, 1530.0, 4719.0, 21711.0, 224339.0, 2137408.0, 1645398.0, 134855.0, 15310.0, 3878.0, 1287.0, 658.0, 356.0, 215.0, 154.0, 122.0, 84.0, 59.0, 48.0, 40.0, 31.0, 33.0, 21.0, 8.0, 15.0, 10.0, 12.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.40625, -21.764404296875, -21.12255859375, -20.480712890625, -19.8388671875, -19.197021484375, -18.55517578125, -17.913330078125, -17.271484375, -16.629638671875, -15.98779296875, -15.345947265625, -14.7041015625, -14.062255859375, -13.42041015625, -12.778564453125, -12.13671875, -11.494873046875, -10.85302734375, -10.211181640625, -9.5693359375, -8.927490234375, -8.28564453125, -7.643798828125, -7.001953125, -6.360107421875, -5.71826171875, -5.076416015625, -4.4345703125, -3.792724609375, -3.15087890625, -2.509033203125, -1.8671875, -1.225341796875, -0.58349609375, 0.058349609375, 0.7001953125, 1.342041015625, 1.98388671875, 2.625732421875, 3.267578125, 3.909423828125, 4.55126953125, 5.193115234375, 5.8349609375, 6.476806640625, 7.11865234375, 7.760498046875, 8.40234375, 9.044189453125, 9.68603515625, 10.327880859375, 10.9697265625, 11.611572265625, 12.25341796875, 12.895263671875, 13.537109375, 14.178955078125, 14.82080078125, 15.462646484375, 16.1044921875, 16.746337890625, 17.38818359375, 18.030029296875, 18.671875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 8.0, 9.0, 11.0, 22.0, 32.0, 48.0, 51.0, 66.0, 97.0, 164.0, 197.0, 331.0, 354.0, 468.0, 499.0, 442.0, 312.0, 280.0, 198.0, 113.0, 92.0, 67.0, 50.0, 38.0, 32.0, 24.0, 6.0, 5.0, 6.0, 5.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.627685546875, -13.13037109375, -12.633056640625, -12.1357421875, -11.638427734375, -11.14111328125, -10.643798828125, -10.146484375, -9.649169921875, -9.15185546875, -8.654541015625, -8.1572265625, -7.659912109375, -7.16259765625, -6.665283203125, -6.16796875, -5.670654296875, -5.17333984375, -4.676025390625, -4.1787109375, -3.681396484375, -3.18408203125, -2.686767578125, -2.189453125, -1.692138671875, -1.19482421875, -0.697509765625, -0.2001953125, 0.297119140625, 0.79443359375, 1.291748046875, 1.7890625, 2.286376953125, 2.78369140625, 3.281005859375, 3.7783203125, 4.275634765625, 4.77294921875, 5.270263671875, 5.767578125, 6.264892578125, 6.76220703125, 7.259521484375, 7.7568359375, 8.254150390625, 8.75146484375, 9.248779296875, 9.74609375, 10.243408203125, 10.74072265625, 11.238037109375, 11.7353515625, 12.232666015625, 12.72998046875, 13.227294921875, 13.724609375, 14.221923828125, 14.71923828125, 15.216552734375, 15.7138671875, 16.211181640625, 16.70849609375, 17.205810546875, 17.703125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 12.0, 8.0, 18.0, 22.0, 28.0, 30.0, 39.0, 47.0, 59.0, 79.0, 105.0, 124.0, 153.0, 250.0, 433.0, 856.0, 2578.0, 12453.0, 190152.0, 3758979.0, 209288.0, 13315.0, 2867.0, 904.0, 470.0, 233.0, 164.0, 139.0, 93.0, 81.0, 64.0, 48.0, 36.0, 26.0, 21.0, 28.0, 14.0, 14.0, 6.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-44.53125, -43.16162109375, -41.7919921875, -40.42236328125, -39.052734375, -37.68310546875, -36.3134765625, -34.94384765625, -33.57421875, -32.20458984375, -30.8349609375, -29.46533203125, -28.095703125, -26.72607421875, -25.3564453125, -23.98681640625, -22.6171875, -21.24755859375, -19.8779296875, -18.50830078125, -17.138671875, -15.76904296875, -14.3994140625, -13.02978515625, -11.66015625, -10.29052734375, -8.9208984375, -7.55126953125, -6.181640625, -4.81201171875, -3.4423828125, -2.07275390625, -0.703125, 0.66650390625, 2.0361328125, 3.40576171875, 4.775390625, 6.14501953125, 7.5146484375, 8.88427734375, 10.25390625, 11.62353515625, 12.9931640625, 14.36279296875, 15.732421875, 17.10205078125, 18.4716796875, 19.84130859375, 21.2109375, 22.58056640625, 23.9501953125, 25.31982421875, 26.689453125, 28.05908203125, 29.4287109375, 30.79833984375, 32.16796875, 33.53759765625, 34.9072265625, 36.27685546875, 37.646484375, 39.01611328125, 40.3857421875, 41.75537109375, 43.125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 12.0, 60.0, 154.0, 314.0, 297.0, 124.0, 36.0, 13.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-255.97579956054688, -250.93980407714844, -245.90380859375, -240.86781311035156, -235.83181762695312, -230.79583740234375, -225.75982666015625, -220.72384643554688, -215.68785095214844, -210.65185546875, -205.61585998535156, -200.57986450195312, -195.5438690185547, -190.50787353515625, -185.47189331054688, -180.43589782714844, -175.39990234375, -170.36390686035156, -165.32791137695312, -160.2919158935547, -155.25592041015625, -150.21994018554688, -145.18392944335938, -140.14794921875, -135.1119384765625, -130.07594299316406, -125.03994750976562, -120.00395202636719, -114.96796417236328, -109.93196868896484, -104.8959732055664, -99.8599853515625, -94.82398223876953, -89.7879867553711, -84.75199127197266, -79.71600341796875, -74.68000793457031, -69.64401245117188, -64.60801696777344, -59.572025299072266, -54.53602981567383, -49.50003433227539, -44.46404266357422, -39.42804718017578, -34.392051696777344, -29.356060028076172, -24.320064544677734, -19.284072875976562, -14.248077392578125, -9.21208381652832, -4.176089286804199, 0.8599052429199219, 5.895898818969727, 10.931892395019531, 15.967887878417969, 21.00387954711914, 26.039875030517578, 31.075868606567383, 36.11186218261719, 41.147857666015625, 46.18385314941406, 51.219844818115234, 56.25584030151367, 61.291831970214844, 66.32782745361328]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 12.0, 9.0, 4.0, 13.0, 11.0, 16.0, 18.0, 25.0, 26.0, 18.0, 27.0, 37.0, 32.0, 35.0, 30.0, 37.0, 42.0, 24.0, 33.0, 32.0, 37.0, 43.0, 41.0, 46.0, 29.0, 31.0, 32.0, 27.0, 27.0, 32.0, 25.0, 16.0, 21.0, 20.0, 18.0, 20.0, 15.0, 6.0, 3.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-53.04289245605469, -51.44862747192383, -49.854366302490234, -48.260101318359375, -46.66584014892578, -45.07157516479492, -43.47731018066406, -41.88304901123047, -40.288787841796875, -38.694522857666016, -37.10026168823242, -35.50599670410156, -33.91173553466797, -32.31747055053711, -30.723207473754883, -29.128944396972656, -27.534679412841797, -25.94041633605957, -24.346153259277344, -22.751888275146484, -21.15762710571289, -19.56336212158203, -17.969099044799805, -16.374835968017578, -14.780572891235352, -13.186309814453125, -11.592046737670898, -9.997782707214355, -8.403519630432129, -6.809256553649902, -5.214992523193359, -3.620729446411133, -2.0264663696289062, -0.4322030544281006, 1.162060260772705, 2.75632381439209, 4.350586891174316, 5.944849967956543, 7.539113998413086, 9.133377075195312, 10.727640151977539, 12.321903228759766, 13.916166305541992, 15.510430335998535, 17.104694366455078, 18.698955535888672, 20.29322052001953, 21.887483596801758, 23.481746673583984, 25.07600975036621, 26.670272827148438, 28.264537811279297, 29.85879898071289, 31.45306396484375, 33.047325134277344, 34.6415901184082, 36.23585510253906, 37.83012008666992, 39.424381256103516, 41.018646240234375, 42.61290740966797, 44.20717239379883, 45.80143737792969, 47.39569854736328, 48.989959716796875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 7.0, 14.0, 9.0, 15.0, 20.0, 22.0, 15.0, 24.0, 20.0, 28.0, 30.0, 36.0, 33.0, 32.0, 47.0, 27.0, 51.0, 46.0, 68.0, 40.0, 48.0, 38.0, 42.0, 37.0, 31.0, 29.0, 32.0, 25.0, 26.0, 19.0, 11.0, 16.0, 9.0, 12.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8046875, -11.4566650390625, -11.108642578125, -10.7606201171875, -10.41259765625, -10.0645751953125, -9.716552734375, -9.3685302734375, -9.0205078125, -8.6724853515625, -8.324462890625, -7.9764404296875, -7.62841796875, -7.2803955078125, -6.932373046875, -6.5843505859375, -6.236328125, -5.8883056640625, -5.540283203125, -5.1922607421875, -4.84423828125, -4.4962158203125, -4.148193359375, -3.8001708984375, -3.4521484375, -3.1041259765625, -2.756103515625, -2.4080810546875, -2.06005859375, -1.7120361328125, -1.364013671875, -1.0159912109375, -0.66796875, -0.3199462890625, 0.028076171875, 0.3760986328125, 0.72412109375, 1.0721435546875, 1.420166015625, 1.7681884765625, 2.1162109375, 2.4642333984375, 2.812255859375, 3.1602783203125, 3.50830078125, 3.8563232421875, 4.204345703125, 4.5523681640625, 4.900390625, 5.2484130859375, 5.596435546875, 5.9444580078125, 6.29248046875, 6.6405029296875, 6.988525390625, 7.3365478515625, 7.6845703125, 8.0325927734375, 8.380615234375, 8.7286376953125, 9.07666015625, 9.4246826171875, 9.772705078125, 10.1207275390625, 10.46875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 9.0, 11.0, 36.0, 28.0, 53.0, 59.0, 96.0, 149.0, 192.0, 332.0, 502.0, 677.0, 1051.0, 1527.0, 2415.0, 3548.0, 5632.0, 8826.0, 13919.0, 21754.0, 34889.0, 57345.0, 99579.0, 235560.0, 286180.0, 109529.0, 61700.0, 37719.0, 23518.0, 14735.0, 9466.0, 6041.0, 3853.0, 2587.0, 1692.0, 1066.0, 722.0, 479.0, 353.0, 228.0, 145.0, 112.0, 67.0, 55.0, 40.0, 19.0, 20.0, 10.0, 8.0, 5.0, 2.0, 5.0, 1.0, 2.0], "bins": [-2.404296875, -2.333740234375, -2.26318359375, -2.192626953125, -2.1220703125, -2.051513671875, -1.98095703125, -1.910400390625, -1.83984375, -1.769287109375, -1.69873046875, -1.628173828125, -1.5576171875, -1.487060546875, -1.41650390625, -1.345947265625, -1.275390625, -1.204833984375, -1.13427734375, -1.063720703125, -0.9931640625, -0.922607421875, -0.85205078125, -0.781494140625, -0.7109375, -0.640380859375, -0.56982421875, -0.499267578125, -0.4287109375, -0.358154296875, -0.28759765625, -0.217041015625, -0.146484375, -0.075927734375, -0.00537109375, 0.065185546875, 0.1357421875, 0.206298828125, 0.27685546875, 0.347412109375, 0.41796875, 0.488525390625, 0.55908203125, 0.629638671875, 0.7001953125, 0.770751953125, 0.84130859375, 0.911865234375, 0.982421875, 1.052978515625, 1.12353515625, 1.194091796875, 1.2646484375, 1.335205078125, 1.40576171875, 1.476318359375, 1.546875, 1.617431640625, 1.68798828125, 1.758544921875, 1.8291015625, 1.899658203125, 1.97021484375, 2.040771484375, 2.111328125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 12.0, 11.0, 12.0, 16.0, 11.0, 22.0, 21.0, 31.0, 25.0, 26.0, 40.0, 53.0, 39.0, 35.0, 46.0, 47.0, 35.0, 1069.0, 47.0, 41.0, 48.0, 42.0, 38.0, 38.0, 31.0, 31.0, 22.0, 28.0, 19.0, 21.0, 12.0, 14.0, 7.0, 2.0, 7.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.41119384765625, -8.1739501953125, -7.93670654296875, -7.699462890625, -7.46221923828125, -7.2249755859375, -6.98773193359375, -6.75048828125, -6.51324462890625, -6.2760009765625, -6.03875732421875, -5.801513671875, -5.56427001953125, -5.3270263671875, -5.08978271484375, -4.8525390625, -4.61529541015625, -4.3780517578125, -4.14080810546875, -3.903564453125, -3.66632080078125, -3.4290771484375, -3.19183349609375, -2.95458984375, -2.71734619140625, -2.4801025390625, -2.24285888671875, -2.005615234375, -1.76837158203125, -1.5311279296875, -1.29388427734375, -1.056640625, -0.81939697265625, -0.5821533203125, -0.34490966796875, -0.107666015625, 0.12957763671875, 0.3668212890625, 0.60406494140625, 0.84130859375, 1.07855224609375, 1.3157958984375, 1.55303955078125, 1.790283203125, 2.02752685546875, 2.2647705078125, 2.50201416015625, 2.7392578125, 2.97650146484375, 3.2137451171875, 3.45098876953125, 3.688232421875, 3.92547607421875, 4.1627197265625, 4.39996337890625, 4.63720703125, 4.87445068359375, 5.1116943359375, 5.34893798828125, 5.586181640625, 5.82342529296875, 6.0606689453125, 6.29791259765625, 6.53515625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 8.0, 12.0, 19.0, 25.0, 53.0, 72.0, 114.0, 182.0, 246.0, 407.0, 669.0, 974.0, 1549.0, 2564.0, 4256.0, 6937.0, 11249.0, 18909.0, 31869.0, 55569.0, 102328.0, 224277.0, 1354253.0, 122352.0, 65198.0, 37095.0, 21769.0, 13060.0, 7916.0, 4810.0, 3111.0, 1908.0, 1221.0, 756.0, 483.0, 294.0, 208.0, 150.0, 82.0, 56.0, 42.0, 28.0, 20.0, 12.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.503570556640625, -2.42315673828125, -2.342742919921875, -2.2623291015625, -2.181915283203125, -2.10150146484375, -2.021087646484375, -1.940673828125, -1.860260009765625, -1.77984619140625, -1.699432373046875, -1.6190185546875, -1.538604736328125, -1.45819091796875, -1.377777099609375, -1.29736328125, -1.216949462890625, -1.13653564453125, -1.056121826171875, -0.9757080078125, -0.895294189453125, -0.81488037109375, -0.734466552734375, -0.654052734375, -0.573638916015625, -0.49322509765625, -0.412811279296875, -0.3323974609375, -0.251983642578125, -0.17156982421875, -0.091156005859375, -0.0107421875, 0.069671630859375, 0.15008544921875, 0.230499267578125, 0.3109130859375, 0.391326904296875, 0.47174072265625, 0.552154541015625, 0.632568359375, 0.712982177734375, 0.79339599609375, 0.873809814453125, 0.9542236328125, 1.034637451171875, 1.11505126953125, 1.195465087890625, 1.27587890625, 1.356292724609375, 1.43670654296875, 1.517120361328125, 1.5975341796875, 1.677947998046875, 1.75836181640625, 1.838775634765625, 1.919189453125, 1.999603271484375, 2.08001708984375, 2.160430908203125, 2.2408447265625, 2.321258544921875, 2.40167236328125, 2.482086181640625, 2.5625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 4.0, 8.0, 7.0, 15.0, 19.0, 21.0, 31.0, 40.0, 31.0, 37.0, 55.0, 75.0, 92.0, 90.0, 87.0, 86.0, 53.0, 39.0, 36.0, 25.0, 33.0, 16.0, 12.0, 15.0, 8.0, 11.0, 7.0, 7.0, 6.0, 5.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0012712478637695312, -0.0012309104204177856, -0.00119057297706604, -0.0011502355337142944, -0.0011098980903625488, -0.0010695606470108032, -0.0010292232036590576, -0.000988885760307312, -0.0009485483169555664, -0.0009082108736038208, -0.0008678734302520752, -0.0008275359869003296, -0.000787198543548584, -0.0007468611001968384, -0.0007065236568450928, -0.0006661862134933472, -0.0006258487701416016, -0.000585511326789856, -0.0005451738834381104, -0.0005048364400863647, -0.00046449899673461914, -0.00042416155338287354, -0.00038382411003112793, -0.0003434866666793823, -0.0003031492233276367, -0.0002628117799758911, -0.0002224743366241455, -0.0001821368932723999, -0.0001417994499206543, -0.00010146200656890869, -6.112456321716309e-05, -2.078711986541748e-05, 1.9550323486328125e-05, 5.988776683807373e-05, 0.00010022521018981934, 0.00014056265354156494, 0.00018090009689331055, 0.00022123754024505615, 0.00026157498359680176, 0.00030191242694854736, 0.00034224987030029297, 0.0003825873136520386, 0.0004229247570037842, 0.0004632622003555298, 0.0005035996437072754, 0.000543937087059021, 0.0005842745304107666, 0.0006246119737625122, 0.0006649494171142578, 0.0007052868604660034, 0.000745624303817749, 0.0007859617471694946, 0.0008262991905212402, 0.0008666366338729858, 0.0009069740772247314, 0.000947311520576477, 0.0009876489639282227, 0.0010279864072799683, 0.0010683238506317139, 0.0011086612939834595, 0.001148998737335205, 0.0011893361806869507, 0.0012296736240386963, 0.001270011067390442, 0.0013103485107421875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 5.0, 5.0, 7.0, 9.0, 12.0, 27.0, 10.0, 18.0, 41.0, 57.0, 64.0, 85.0, 142.0, 215.0, 412.0, 1076.0, 754932.0, 289377.0, 965.0, 405.0, 188.0, 113.0, 93.0, 84.0, 60.0, 28.0, 19.0, 22.0, 11.0, 12.0, 11.0, 13.0, 8.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027191162109375, -0.026365995407104492, -0.025540828704833984, -0.024715662002563477, -0.02389049530029297, -0.02306532859802246, -0.022240161895751953, -0.021414995193481445, -0.020589828491210938, -0.01976466178894043, -0.018939495086669922, -0.018114328384399414, -0.017289161682128906, -0.0164639949798584, -0.01563882827758789, -0.014813661575317383, -0.013988494873046875, -0.013163328170776367, -0.01233816146850586, -0.011512994766235352, -0.010687828063964844, -0.009862661361694336, -0.009037494659423828, -0.00821232795715332, -0.0073871612548828125, -0.006561994552612305, -0.005736827850341797, -0.004911661148071289, -0.004086494445800781, -0.0032613277435302734, -0.0024361610412597656, -0.0016109943389892578, -0.00078582763671875, 3.933906555175781e-05, 0.0008645057678222656, 0.0016896724700927734, 0.0025148391723632812, 0.003340005874633789, 0.004165172576904297, 0.004990339279174805, 0.0058155059814453125, 0.00664067268371582, 0.007465839385986328, 0.008291006088256836, 0.009116172790527344, 0.009941339492797852, 0.01076650619506836, 0.011591672897338867, 0.012416839599609375, 0.013242006301879883, 0.01406717300415039, 0.014892339706420898, 0.015717506408691406, 0.016542673110961914, 0.017367839813232422, 0.01819300651550293, 0.019018173217773438, 0.019843339920043945, 0.020668506622314453, 0.02149367332458496, 0.02231884002685547, 0.023144006729125977, 0.023969173431396484, 0.024794340133666992, 0.0256195068359375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 29.0, 186.0, 479.0, 278.0, 32.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015911615919321775, -0.001514102448709309, -0.0014370433054864407, -0.0013599841622635722, -0.0012829250190407038, -0.0012058658758178353, -0.0011288067325949669, -0.0010517475893720984, -0.00097468844614923, -0.0008976293029263616, -0.0008205701597034931, -0.0007435110164806247, -0.0006664518732577562, -0.0005893927300348878, -0.0005123335868120193, -0.0004352744435891509, -0.00035821530036628246, -0.000281156157143414, -0.00020409701392054558, -0.00012703787069767714, -4.997872747480869e-05, 2.708041574805975e-05, 0.00010413955897092819, 0.00018119870219379663, 0.0002582578454166651, 0.0003353169886395335, 0.00041237613186240196, 0.0004894352750852704, 0.0005664944183081388, 0.0006435535615310073, 0.0007206127047538757, 0.0007976718479767442, 0.0008747312240302563, 0.0009517903672531247, 0.0010288495104759932, 0.0011059086536988616, 0.00118296779692173, 0.0012600269401445985, 0.001337086083367467, 0.0014141452265903354, 0.0014912043698132038, 0.0015682635130360723, 0.0016453226562589407, 0.0017223817994818091, 0.0017994409427046776, 0.001876500085927546, 0.0019535592291504145, 0.0020306184887886047, 0.0021076775155961514, 0.002184736542403698, 0.0022617958020418882, 0.0023388550616800785, 0.002415914088487625, 0.0024929731152951717, 0.002570032374933362, 0.0026470916345715523, 0.002724150661379099, 0.0028012096881866455, 0.0028782689478248358, 0.002955328207463026, 0.0030323872342705727, 0.0031094462610781193, 0.0031865055207163095, 0.0032635647803545, 0.0033406238071620464]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 1.0, 5.0, 7.0, 8.0, 7.0, 7.0, 9.0, 13.0, 12.0, 13.0, 15.0, 16.0, 28.0, 26.0, 22.0, 21.0, 22.0, 33.0, 28.0, 40.0, 40.0, 36.0, 40.0, 19.0, 34.0, 41.0, 40.0, 38.0, 32.0, 32.0, 45.0, 27.0, 39.0, 30.0, 23.0, 23.0, 20.0, 21.0, 20.0, 12.0, 15.0, 8.0, 4.0, 3.0, 6.0, 5.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0005944371223449707, -0.0005772272124886513, -0.0005600173026323318, -0.0005428073927760124, -0.000525597482919693, -0.0005083875730633736, -0.0004911776632070541, -0.0004739677533507347, -0.0004567578434944153, -0.00043954793363809586, -0.00042233802378177643, -0.000405128113925457, -0.0003879182040691376, -0.00037070829421281815, -0.0003534983843564987, -0.0003362884745001793, -0.00031907856464385986, -0.00030186865478754044, -0.000284658744931221, -0.0002674488350749016, -0.00025023892521858215, -0.00023302901536226273, -0.0002158191055059433, -0.00019860919564962387, -0.00018139928579330444, -0.00016418937593698502, -0.0001469794660806656, -0.00012976955622434616, -0.00011255964636802673, -9.53497365117073e-05, -7.813982665538788e-05, -6.092991679906845e-05, -4.3720006942749023e-05, -2.6510097086429596e-05, -9.300187230110168e-06, 7.909722626209259e-06, 2.5119632482528687e-05, 4.2329542338848114e-05, 5.953945219516754e-05, 7.674936205148697e-05, 9.39592719078064e-05, 0.00011116918176412582, 0.00012837909162044525, 0.00014558900147676468, 0.0001627989113330841, 0.00018000882118940353, 0.00019721873104572296, 0.0002144286409020424, 0.00023163855075836182, 0.00024884846061468124, 0.00026605837047100067, 0.0002832682803273201, 0.0003004781901836395, 0.00031768810003995895, 0.0003348980098962784, 0.0003521079197525978, 0.00036931782960891724, 0.00038652773946523666, 0.0004037376493215561, 0.0004209475591778755, 0.00043815746903419495, 0.0004553673788905144, 0.0004725772887468338, 0.0004897871986031532, 0.0005069971084594727]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 7.0, 14.0, 9.0, 15.0, 20.0, 22.0, 15.0, 24.0, 20.0, 28.0, 30.0, 36.0, 33.0, 32.0, 47.0, 27.0, 51.0, 46.0, 68.0, 40.0, 48.0, 38.0, 42.0, 37.0, 31.0, 29.0, 32.0, 25.0, 26.0, 19.0, 11.0, 16.0, 9.0, 12.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8046875, -11.4566650390625, -11.108642578125, -10.7606201171875, -10.41259765625, -10.0645751953125, -9.716552734375, -9.3685302734375, -9.0205078125, -8.6724853515625, -8.324462890625, -7.9764404296875, -7.62841796875, -7.2803955078125, -6.932373046875, -6.5843505859375, -6.236328125, -5.8883056640625, -5.540283203125, -5.1922607421875, -4.84423828125, -4.4962158203125, -4.148193359375, -3.8001708984375, -3.4521484375, -3.1041259765625, -2.756103515625, -2.4080810546875, -2.06005859375, -1.7120361328125, -1.364013671875, -1.0159912109375, -0.66796875, -0.3199462890625, 0.028076171875, 0.3760986328125, 0.72412109375, 1.0721435546875, 1.420166015625, 1.7681884765625, 2.1162109375, 2.4642333984375, 2.812255859375, 3.1602783203125, 3.50830078125, 3.8563232421875, 4.204345703125, 4.5523681640625, 4.900390625, 5.2484130859375, 5.596435546875, 5.9444580078125, 6.29248046875, 6.6405029296875, 6.988525390625, 7.3365478515625, 7.6845703125, 8.0325927734375, 8.380615234375, 8.7286376953125, 9.07666015625, 9.4246826171875, 9.772705078125, 10.1207275390625, 10.46875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 4.0, 11.0, 9.0, 7.0, 15.0, 31.0, 29.0, 38.0, 60.0, 79.0, 105.0, 137.0, 205.0, 278.0, 473.0, 971.0, 1914.0, 4323.0, 10800.0, 31078.0, 103465.0, 418380.0, 346598.0, 85959.0, 26587.0, 9239.0, 3758.0, 1706.0, 861.0, 493.0, 274.0, 174.0, 122.0, 94.0, 76.0, 49.0, 35.0, 31.0, 22.0, 21.0, 11.0, 7.0, 11.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.921875, -14.4820556640625, -14.042236328125, -13.6024169921875, -13.16259765625, -12.7227783203125, -12.282958984375, -11.8431396484375, -11.4033203125, -10.9635009765625, -10.523681640625, -10.0838623046875, -9.64404296875, -9.2042236328125, -8.764404296875, -8.3245849609375, -7.884765625, -7.4449462890625, -7.005126953125, -6.5653076171875, -6.12548828125, -5.6856689453125, -5.245849609375, -4.8060302734375, -4.3662109375, -3.9263916015625, -3.486572265625, -3.0467529296875, -2.60693359375, -2.1671142578125, -1.727294921875, -1.2874755859375, -0.84765625, -0.4078369140625, 0.031982421875, 0.4718017578125, 0.91162109375, 1.3514404296875, 1.791259765625, 2.2310791015625, 2.6708984375, 3.1107177734375, 3.550537109375, 3.9903564453125, 4.43017578125, 4.8699951171875, 5.309814453125, 5.7496337890625, 6.189453125, 6.6292724609375, 7.069091796875, 7.5089111328125, 7.94873046875, 8.3885498046875, 8.828369140625, 9.2681884765625, 9.7080078125, 10.1478271484375, 10.587646484375, 11.0274658203125, 11.46728515625, 11.9071044921875, 12.346923828125, 12.7867431640625, 13.2265625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 10.0, 11.0, 16.0, 14.0, 22.0, 17.0, 33.0, 42.0, 52.0, 49.0, 67.0, 66.0, 90.0, 124.0, 1617.0, 250.0, 137.0, 80.0, 59.0, 64.0, 44.0, 46.0, 26.0, 21.0, 21.0, 8.0, 11.0, 9.0, 12.0, 8.0, 4.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.03125, -44.84326171875, -43.6552734375, -42.46728515625, -41.279296875, -40.09130859375, -38.9033203125, -37.71533203125, -36.52734375, -35.33935546875, -34.1513671875, -32.96337890625, -31.775390625, -30.58740234375, -29.3994140625, -28.21142578125, -27.0234375, -25.83544921875, -24.6474609375, -23.45947265625, -22.271484375, -21.08349609375, -19.8955078125, -18.70751953125, -17.51953125, -16.33154296875, -15.1435546875, -13.95556640625, -12.767578125, -11.57958984375, -10.3916015625, -9.20361328125, -8.015625, -6.82763671875, -5.6396484375, -4.45166015625, -3.263671875, -2.07568359375, -0.8876953125, 0.30029296875, 1.48828125, 2.67626953125, 3.8642578125, 5.05224609375, 6.240234375, 7.42822265625, 8.6162109375, 9.80419921875, 10.9921875, 12.18017578125, 13.3681640625, 14.55615234375, 15.744140625, 16.93212890625, 18.1201171875, 19.30810546875, 20.49609375, 21.68408203125, 22.8720703125, 24.06005859375, 25.248046875, 26.43603515625, 27.6240234375, 28.81201171875, 30.0]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 3.0, 5.0, 12.0, 14.0, 16.0, 18.0, 26.0, 33.0, 49.0, 58.0, 61.0, 119.0, 155.0, 296.0, 442.0, 1101.0, 6611.0, 144017.0, 2928181.0, 58571.0, 3847.0, 799.0, 397.0, 286.0, 158.0, 104.0, 78.0, 49.0, 51.0, 30.0, 27.0, 15.0, 13.0, 19.0, 7.0, 6.0, 4.0, 7.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-48.4375, -46.89404296875, -45.3505859375, -43.80712890625, -42.263671875, -40.72021484375, -39.1767578125, -37.63330078125, -36.08984375, -34.54638671875, -33.0029296875, -31.45947265625, -29.916015625, -28.37255859375, -26.8291015625, -25.28564453125, -23.7421875, -22.19873046875, -20.6552734375, -19.11181640625, -17.568359375, -16.02490234375, -14.4814453125, -12.93798828125, -11.39453125, -9.85107421875, -8.3076171875, -6.76416015625, -5.220703125, -3.67724609375, -2.1337890625, -0.59033203125, 0.953125, 2.49658203125, 4.0400390625, 5.58349609375, 7.126953125, 8.67041015625, 10.2138671875, 11.75732421875, 13.30078125, 14.84423828125, 16.3876953125, 17.93115234375, 19.474609375, 21.01806640625, 22.5615234375, 24.10498046875, 25.6484375, 27.19189453125, 28.7353515625, 30.27880859375, 31.822265625, 33.36572265625, 34.9091796875, 36.45263671875, 37.99609375, 39.53955078125, 41.0830078125, 42.62646484375, 44.169921875, 45.71337890625, 47.2568359375, 48.80029296875, 50.34375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 18.0, 93.0, 369.0, 426.0, 98.0, 12.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-216.22935485839844, -211.8181610107422, -207.40696716308594, -202.9957733154297, -198.58457946777344, -194.1733856201172, -189.76219177246094, -185.35101318359375, -180.9398193359375, -176.52862548828125, -172.117431640625, -167.70623779296875, -163.2950439453125, -158.88385009765625, -154.47265625, -150.06146240234375, -145.6502685546875, -141.23907470703125, -136.827880859375, -132.41668701171875, -128.0054931640625, -123.59429931640625, -119.18311309814453, -114.77191925048828, -110.36072540283203, -105.94953155517578, -101.53833770751953, -97.12714385986328, -92.71595764160156, -88.30476379394531, -83.89356994628906, -79.48237609863281, -75.07119750976562, -70.66000366210938, -66.24880981445312, -61.83761978149414, -57.42642593383789, -53.01523208618164, -48.604042053222656, -44.192848205566406, -39.781654357910156, -35.370460510253906, -30.95926856994629, -26.548076629638672, -22.136882781982422, -17.725688934326172, -13.314496994018555, -8.903305053710938, -4.4921112060546875, -0.0809183120727539, 4.33027458190918, 8.741467475891113, 13.152660369873047, 17.563854217529297, 21.975046157836914, 26.38623809814453, 30.79743194580078, 35.20862579345703, 39.61981964111328, 44.031009674072266, 48.442203521728516, 52.853397369384766, 57.26458740234375, 61.67578125, 66.08697509765625]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 3.0, 9.0, 9.0, 12.0, 7.0, 10.0, 11.0, 15.0, 10.0, 20.0, 18.0, 31.0, 32.0, 27.0, 29.0, 53.0, 31.0, 38.0, 33.0, 41.0, 41.0, 32.0, 40.0, 47.0, 38.0, 37.0, 38.0, 28.0, 36.0, 29.0, 19.0, 33.0, 27.0, 21.0, 18.0, 12.0, 12.0, 9.0, 6.0, 10.0, 3.0, 6.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.91752624511719, -58.99882507324219, -57.08012008666992, -55.16141891479492, -53.242713928222656, -51.324012756347656, -49.405311584472656, -47.48660659790039, -45.567901611328125, -43.649200439453125, -41.73049545288086, -39.81179428100586, -37.893089294433594, -35.974388122558594, -34.055686950683594, -32.13698196411133, -30.218280792236328, -28.299577713012695, -26.380874633789062, -24.462173461914062, -22.543468475341797, -20.624767303466797, -18.706064224243164, -16.78736114501953, -14.868658065795898, -12.949954986572266, -11.031251907348633, -9.112549781799316, -7.193846702575684, -5.275143623352051, -3.3564414978027344, -1.4377384185791016, 0.48096466064453125, 2.399667501449585, 4.318370342254639, 6.237072944641113, 8.155776023864746, 10.074479103088379, 11.993181228637695, 13.911884307861328, 15.830587387084961, 17.749290466308594, 19.667993545532227, 21.58669662475586, 23.50539779663086, 25.424102783203125, 27.342803955078125, 29.261507034301758, 31.18021011352539, 33.09891128540039, 35.017616271972656, 36.936317443847656, 38.85502243041992, 40.77372360229492, 42.69242858886719, 44.61112976074219, 46.52983093261719, 48.44853210449219, 50.36723709106445, 52.28593826293945, 54.20464324951172, 56.12334442138672, 58.04204559326172, 59.960750579833984, 61.87945556640625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 7.0, 7.0, 12.0, 12.0, 22.0, 15.0, 14.0, 17.0, 21.0, 29.0, 34.0, 28.0, 35.0, 37.0, 38.0, 45.0, 58.0, 45.0, 51.0, 44.0, 53.0, 49.0, 41.0, 26.0, 33.0, 26.0, 31.0, 32.0, 28.0, 14.0, 18.0, 14.0, 17.0, 12.0, 6.0, 5.0, 5.0, 5.0, 2.0, 5.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.78125, -11.416259765625, -11.05126953125, -10.686279296875, -10.3212890625, -9.956298828125, -9.59130859375, -9.226318359375, -8.861328125, -8.496337890625, -8.13134765625, -7.766357421875, -7.4013671875, -7.036376953125, -6.67138671875, -6.306396484375, -5.94140625, -5.576416015625, -5.21142578125, -4.846435546875, -4.4814453125, -4.116455078125, -3.75146484375, -3.386474609375, -3.021484375, -2.656494140625, -2.29150390625, -1.926513671875, -1.5615234375, -1.196533203125, -0.83154296875, -0.466552734375, -0.1015625, 0.263427734375, 0.62841796875, 0.993408203125, 1.3583984375, 1.723388671875, 2.08837890625, 2.453369140625, 2.818359375, 3.183349609375, 3.54833984375, 3.913330078125, 4.2783203125, 4.643310546875, 5.00830078125, 5.373291015625, 5.73828125, 6.103271484375, 6.46826171875, 6.833251953125, 7.1982421875, 7.563232421875, 7.92822265625, 8.293212890625, 8.658203125, 9.023193359375, 9.38818359375, 9.753173828125, 10.1181640625, 10.483154296875, 10.84814453125, 11.213134765625, 11.578125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 4.0, 6.0, 7.0, 10.0, 12.0, 7.0, 12.0, 12.0, 17.0, 23.0, 16.0, 21.0, 31.0, 45.0, 59.0, 104.0, 211.0, 490.0, 1477.0, 6539.0, 101604.0, 2535766.0, 1498211.0, 42907.0, 4492.0, 1206.0, 433.0, 205.0, 84.0, 62.0, 31.0, 31.0, 29.0, 23.0, 21.0, 13.0, 12.0, 8.0, 12.0, 1.0, 4.0, 7.0, 5.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0], "bins": [-32.46875, -31.537841796875, -30.60693359375, -29.676025390625, -28.7451171875, -27.814208984375, -26.88330078125, -25.952392578125, -25.021484375, -24.090576171875, -23.15966796875, -22.228759765625, -21.2978515625, -20.366943359375, -19.43603515625, -18.505126953125, -17.57421875, -16.643310546875, -15.71240234375, -14.781494140625, -13.8505859375, -12.919677734375, -11.98876953125, -11.057861328125, -10.126953125, -9.196044921875, -8.26513671875, -7.334228515625, -6.4033203125, -5.472412109375, -4.54150390625, -3.610595703125, -2.6796875, -1.748779296875, -0.81787109375, 0.113037109375, 1.0439453125, 1.974853515625, 2.90576171875, 3.836669921875, 4.767578125, 5.698486328125, 6.62939453125, 7.560302734375, 8.4912109375, 9.422119140625, 10.35302734375, 11.283935546875, 12.21484375, 13.145751953125, 14.07666015625, 15.007568359375, 15.9384765625, 16.869384765625, 17.80029296875, 18.731201171875, 19.662109375, 20.593017578125, 21.52392578125, 22.454833984375, 23.3857421875, 24.316650390625, 25.24755859375, 26.178466796875, 27.109375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 8.0, 12.0, 21.0, 18.0, 18.0, 35.0, 55.0, 75.0, 115.0, 192.0, 327.0, 425.0, 605.0, 592.0, 512.0, 396.0, 226.0, 142.0, 97.0, 78.0, 31.0, 28.0, 16.0, 12.0, 9.0, 4.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.654541015625, -17.09033203125, -16.526123046875, -15.9619140625, -15.397705078125, -14.83349609375, -14.269287109375, -13.705078125, -13.140869140625, -12.57666015625, -12.012451171875, -11.4482421875, -10.884033203125, -10.31982421875, -9.755615234375, -9.19140625, -8.627197265625, -8.06298828125, -7.498779296875, -6.9345703125, -6.370361328125, -5.80615234375, -5.241943359375, -4.677734375, -4.113525390625, -3.54931640625, -2.985107421875, -2.4208984375, -1.856689453125, -1.29248046875, -0.728271484375, -0.1640625, 0.400146484375, 0.96435546875, 1.528564453125, 2.0927734375, 2.656982421875, 3.22119140625, 3.785400390625, 4.349609375, 4.913818359375, 5.47802734375, 6.042236328125, 6.6064453125, 7.170654296875, 7.73486328125, 8.299072265625, 8.86328125, 9.427490234375, 9.99169921875, 10.555908203125, 11.1201171875, 11.684326171875, 12.24853515625, 12.812744140625, 13.376953125, 13.941162109375, 14.50537109375, 15.069580078125, 15.6337890625, 16.197998046875, 16.76220703125, 17.326416015625, 17.890625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 6.0, 3.0, 6.0, 9.0, 8.0, 10.0, 17.0, 26.0, 21.0, 46.0, 43.0, 85.0, 154.0, 235.0, 538.0, 1266.0, 4495.0, 23328.0, 231247.0, 3455042.0, 435774.0, 33138.0, 5793.0, 1585.0, 543.0, 303.0, 175.0, 105.0, 69.0, 60.0, 35.0, 23.0, 17.0, 18.0, 10.0, 16.0, 7.0, 7.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.875, -30.897216796875, -29.91943359375, -28.941650390625, -27.9638671875, -26.986083984375, -26.00830078125, -25.030517578125, -24.052734375, -23.074951171875, -22.09716796875, -21.119384765625, -20.1416015625, -19.163818359375, -18.18603515625, -17.208251953125, -16.23046875, -15.252685546875, -14.27490234375, -13.297119140625, -12.3193359375, -11.341552734375, -10.36376953125, -9.385986328125, -8.408203125, -7.430419921875, -6.45263671875, -5.474853515625, -4.4970703125, -3.519287109375, -2.54150390625, -1.563720703125, -0.5859375, 0.391845703125, 1.36962890625, 2.347412109375, 3.3251953125, 4.302978515625, 5.28076171875, 6.258544921875, 7.236328125, 8.214111328125, 9.19189453125, 10.169677734375, 11.1474609375, 12.125244140625, 13.10302734375, 14.080810546875, 15.05859375, 16.036376953125, 17.01416015625, 17.991943359375, 18.9697265625, 19.947509765625, 20.92529296875, 21.903076171875, 22.880859375, 23.858642578125, 24.83642578125, 25.814208984375, 26.7919921875, 27.769775390625, 28.74755859375, 29.725341796875, 30.703125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 37.0, 112.0, 251.0, 272.0, 183.0, 106.0, 26.0, 9.0, 4.0, 2.0, 2.0, 2.0], "bins": [-211.31114196777344, -207.50074768066406, -203.6903533935547, -199.87997436523438, -196.069580078125, -192.25918579101562, -188.44879150390625, -184.63839721679688, -180.82801818847656, -177.0176239013672, -173.2072296142578, -169.3968505859375, -165.58645629882812, -161.77606201171875, -157.96566772460938, -154.1552734375, -150.34487915039062, -146.53448486328125, -142.72409057617188, -138.91371154785156, -135.1033172607422, -131.2929229736328, -127.48252868652344, -123.6721420288086, -119.86175537109375, -116.05136108398438, -112.24097442626953, -108.43058013916016, -104.62019348144531, -100.80979919433594, -96.99940490722656, -93.18901824951172, -89.37863159179688, -85.5682373046875, -81.75785064697266, -77.94745635986328, -74.13706970214844, -70.32667541503906, -66.51628112792969, -62.705894470214844, -58.8955078125, -55.08511734008789, -51.27472686767578, -47.464332580566406, -43.65394592285156, -39.84355163574219, -36.03316116333008, -32.22277069091797, -28.41238021850586, -24.60198974609375, -20.79159927368164, -16.9812068939209, -13.170816421508789, -9.36042594909668, -5.5500335693359375, -1.7396430969238281, 2.0707473754882812, 5.881138324737549, 9.691529273986816, 13.501920700073242, 17.31231117248535, 21.12270164489746, 24.933094024658203, 28.743484497070312, 32.55387496948242]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 5.0, 6.0, 7.0, 10.0, 15.0, 21.0, 15.0, 15.0, 23.0, 16.0, 23.0, 16.0, 29.0, 31.0, 36.0, 48.0, 33.0, 41.0, 49.0, 36.0, 41.0, 36.0, 37.0, 44.0, 32.0, 47.0, 36.0, 36.0, 22.0, 25.0, 24.0, 25.0, 19.0, 22.0, 14.0, 11.0, 13.0, 11.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.987091064453125, -49.46294403076172, -47.93879699707031, -46.41465377807617, -44.890506744384766, -43.36635971069336, -41.84221649169922, -40.31806945800781, -38.793922424316406, -37.269775390625, -35.745628356933594, -34.22148513793945, -32.69733810424805, -31.17319107055664, -29.649045944213867, -28.124900817871094, -26.600753784179688, -25.07660675048828, -23.552461624145508, -22.028316497802734, -20.504169464111328, -18.980022430419922, -17.45587730407715, -15.931731224060059, -14.407585144042969, -12.883439064025879, -11.359292984008789, -9.8351469039917, -8.31100082397461, -6.7868547439575195, -5.26270866394043, -3.73856258392334, -2.21441650390625, -0.6902704238891602, 0.8338756561279297, 2.3580217361450195, 3.8821678161621094, 5.406313896179199, 6.930459976196289, 8.454606056213379, 9.978752136230469, 11.502898216247559, 13.027044296264648, 14.551190376281738, 16.075336456298828, 17.599483489990234, 19.123628616333008, 20.64777374267578, 22.171920776367188, 23.696067810058594, 25.220212936401367, 26.74435806274414, 28.268505096435547, 29.792652130126953, 31.316797256469727, 32.8409423828125, 34.365089416503906, 35.88923645019531, 37.41338348388672, 38.93752670288086, 40.461673736572266, 41.98582077026367, 43.50996398925781, 45.03411102294922, 46.558258056640625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 11.0, 11.0, 8.0, 14.0, 15.0, 21.0, 23.0, 25.0, 28.0, 29.0, 23.0, 39.0, 29.0, 38.0, 44.0, 34.0, 61.0, 35.0, 56.0, 46.0, 40.0, 39.0, 41.0, 36.0, 21.0, 31.0, 21.0, 26.0, 23.0, 18.0, 15.0, 12.0, 17.0, 6.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0], "bins": [-11.1171875, -10.7828369140625, -10.448486328125, -10.1141357421875, -9.77978515625, -9.4454345703125, -9.111083984375, -8.7767333984375, -8.4423828125, -8.1080322265625, -7.773681640625, -7.4393310546875, -7.10498046875, -6.7706298828125, -6.436279296875, -6.1019287109375, -5.767578125, -5.4332275390625, -5.098876953125, -4.7645263671875, -4.43017578125, -4.0958251953125, -3.761474609375, -3.4271240234375, -3.0927734375, -2.7584228515625, -2.424072265625, -2.0897216796875, -1.75537109375, -1.4210205078125, -1.086669921875, -0.7523193359375, -0.41796875, -0.0836181640625, 0.250732421875, 0.5850830078125, 0.91943359375, 1.2537841796875, 1.588134765625, 1.9224853515625, 2.2568359375, 2.5911865234375, 2.925537109375, 3.2598876953125, 3.59423828125, 3.9285888671875, 4.262939453125, 4.5972900390625, 4.931640625, 5.2659912109375, 5.600341796875, 5.9346923828125, 6.26904296875, 6.6033935546875, 6.937744140625, 7.2720947265625, 7.6064453125, 7.9407958984375, 8.275146484375, 8.6094970703125, 8.94384765625, 9.2781982421875, 9.612548828125, 9.9468994140625, 10.28125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [7.0, 4.0, 7.0, 4.0, 14.0, 23.0, 36.0, 44.0, 56.0, 86.0, 101.0, 155.0, 177.0, 254.0, 359.0, 531.0, 734.0, 992.0, 1412.0, 1887.0, 2799.0, 3862.0, 5618.0, 8220.0, 11940.0, 17480.0, 26283.0, 40057.0, 64803.0, 118234.0, 303347.0, 195089.0, 88788.0, 52087.0, 33151.0, 21845.0, 14685.0, 10083.0, 6857.0, 4825.0, 3329.0, 2397.0, 1669.0, 1209.0, 869.0, 619.0, 430.0, 314.0, 221.0, 157.0, 102.0, 104.0, 69.0, 43.0, 39.0, 22.0, 18.0, 14.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.9814453125, -1.9170684814453125, -1.852691650390625, -1.7883148193359375, -1.72393798828125, -1.6595611572265625, -1.595184326171875, -1.5308074951171875, -1.4664306640625, -1.4020538330078125, -1.337677001953125, -1.2733001708984375, -1.20892333984375, -1.1445465087890625, -1.080169677734375, -1.0157928466796875, -0.951416015625, -0.8870391845703125, -0.822662353515625, -0.7582855224609375, -0.69390869140625, -0.6295318603515625, -0.565155029296875, -0.5007781982421875, -0.4364013671875, -0.3720245361328125, -0.307647705078125, -0.2432708740234375, -0.17889404296875, -0.1145172119140625, -0.050140380859375, 0.0142364501953125, 0.07861328125, 0.1429901123046875, 0.207366943359375, 0.2717437744140625, 0.33612060546875, 0.4004974365234375, 0.464874267578125, 0.5292510986328125, 0.5936279296875, 0.6580047607421875, 0.722381591796875, 0.7867584228515625, 0.85113525390625, 0.9155120849609375, 0.979888916015625, 1.0442657470703125, 1.108642578125, 1.1730194091796875, 1.237396240234375, 1.3017730712890625, 1.36614990234375, 1.4305267333984375, 1.494903564453125, 1.5592803955078125, 1.6236572265625, 1.6880340576171875, 1.752410888671875, 1.8167877197265625, 1.88116455078125, 1.9455413818359375, 2.009918212890625, 2.0742950439453125, 2.138671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 7.0, 7.0, 4.0, 8.0, 15.0, 12.0, 17.0, 15.0, 27.0, 16.0, 23.0, 24.0, 28.0, 32.0, 32.0, 32.0, 34.0, 34.0, 40.0, 42.0, 1063.0, 42.0, 37.0, 38.0, 40.0, 46.0, 39.0, 37.0, 31.0, 29.0, 17.0, 22.0, 18.0, 16.0, 22.0, 14.0, 12.0, 17.0, 7.0, 7.0, 6.0, 1.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-7.15234375, -6.9390869140625, -6.725830078125, -6.5125732421875, -6.29931640625, -6.0860595703125, -5.872802734375, -5.6595458984375, -5.4462890625, -5.2330322265625, -5.019775390625, -4.8065185546875, -4.59326171875, -4.3800048828125, -4.166748046875, -3.9534912109375, -3.740234375, -3.5269775390625, -3.313720703125, -3.1004638671875, -2.88720703125, -2.6739501953125, -2.460693359375, -2.2474365234375, -2.0341796875, -1.8209228515625, -1.607666015625, -1.3944091796875, -1.18115234375, -0.9678955078125, -0.754638671875, -0.5413818359375, -0.328125, -0.1148681640625, 0.098388671875, 0.3116455078125, 0.52490234375, 0.7381591796875, 0.951416015625, 1.1646728515625, 1.3779296875, 1.5911865234375, 1.804443359375, 2.0177001953125, 2.23095703125, 2.4442138671875, 2.657470703125, 2.8707275390625, 3.083984375, 3.2972412109375, 3.510498046875, 3.7237548828125, 3.93701171875, 4.1502685546875, 4.363525390625, 4.5767822265625, 4.7900390625, 5.0032958984375, 5.216552734375, 5.4298095703125, 5.64306640625, 5.8563232421875, 6.069580078125, 6.2828369140625, 6.49609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 14.0, 13.0, 19.0, 35.0, 29.0, 66.0, 103.0, 138.0, 209.0, 311.0, 421.0, 640.0, 937.0, 1460.0, 2139.0, 3300.0, 4867.0, 7301.0, 11034.0, 16514.0, 24398.0, 38246.0, 61037.0, 102809.0, 214144.0, 1306399.0, 113999.0, 66524.0, 40876.0, 26292.0, 17577.0, 11789.0, 7855.0, 5277.0, 3436.0, 2293.0, 1485.0, 1054.0, 700.0, 456.0, 283.0, 235.0, 144.0, 83.0, 63.0, 29.0, 40.0, 22.0, 10.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-2.13671875, -2.07012939453125, -2.0035400390625, -1.93695068359375, -1.870361328125, -1.80377197265625, -1.7371826171875, -1.67059326171875, -1.60400390625, -1.53741455078125, -1.4708251953125, -1.40423583984375, -1.337646484375, -1.27105712890625, -1.2044677734375, -1.13787841796875, -1.0712890625, -1.00469970703125, -0.9381103515625, -0.87152099609375, -0.804931640625, -0.73834228515625, -0.6717529296875, -0.60516357421875, -0.53857421875, -0.47198486328125, -0.4053955078125, -0.33880615234375, -0.272216796875, -0.20562744140625, -0.1390380859375, -0.07244873046875, -0.005859375, 0.06072998046875, 0.1273193359375, 0.19390869140625, 0.260498046875, 0.32708740234375, 0.3936767578125, 0.46026611328125, 0.52685546875, 0.59344482421875, 0.6600341796875, 0.72662353515625, 0.793212890625, 0.85980224609375, 0.9263916015625, 0.99298095703125, 1.0595703125, 1.12615966796875, 1.1927490234375, 1.25933837890625, 1.325927734375, 1.39251708984375, 1.4591064453125, 1.52569580078125, 1.59228515625, 1.65887451171875, 1.7254638671875, 1.79205322265625, 1.858642578125, 1.92523193359375, 1.9918212890625, 2.05841064453125, 2.125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 4.0, 5.0, 4.0, 10.0, 5.0, 9.0, 16.0, 6.0, 10.0, 20.0, 30.0, 21.0, 24.0, 35.0, 42.0, 64.0, 65.0, 62.0, 73.0, 65.0, 71.0, 57.0, 62.0, 37.0, 34.0, 22.0, 16.0, 15.0, 17.0, 12.0, 11.0, 8.0, 4.0, 12.0, 11.0, 7.0, 2.0, 1.0, 5.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 3.0], "bins": [-0.0012006759643554688, -0.0011669471859931946, -0.0011332184076309204, -0.0010994896292686462, -0.001065760850906372, -0.001032032072544098, -0.0009983032941818237, -0.0009645745158195496, -0.0009308457374572754, -0.0008971169590950012, -0.000863388180732727, -0.0008296594023704529, -0.0007959306240081787, -0.0007622018456459045, -0.0007284730672836304, -0.0006947442889213562, -0.000661015510559082, -0.0006272867321968079, -0.0005935579538345337, -0.0005598291754722595, -0.0005261003971099854, -0.0004923716187477112, -0.000458642840385437, -0.00042491406202316284, -0.00039118528366088867, -0.0003574565052986145, -0.00032372772693634033, -0.00028999894857406616, -0.000256270170211792, -0.00022254139184951782, -0.00018881261348724365, -0.00015508383512496948, -0.00012135505676269531, -8.762627840042114e-05, -5.389750003814697e-05, -2.0168721675872803e-05, 1.3560056686401367e-05, 4.728883504867554e-05, 8.101761341094971e-05, 0.00011474639177322388, 0.00014847517013549805, 0.00018220394849777222, 0.0002159327268600464, 0.00024966150522232056, 0.0002833902835845947, 0.0003171190619468689, 0.00035084784030914307, 0.00038457661867141724, 0.0004183053970336914, 0.0004520341753959656, 0.00048576295375823975, 0.0005194917321205139, 0.0005532205104827881, 0.0005869492888450623, 0.0006206780672073364, 0.0006544068455696106, 0.0006881356239318848, 0.0007218644022941589, 0.0007555931806564331, 0.0007893219590187073, 0.0008230507373809814, 0.0008567795157432556, 0.0008905082941055298, 0.000924237072467804, 0.0009579658508300781]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 6.0, 7.0, 7.0, 9.0, 11.0, 12.0, 16.0, 18.0, 31.0, 32.0, 37.0, 57.0, 92.0, 107.0, 184.0, 329.0, 652.0, 3276.0, 1031026.0, 10848.0, 722.0, 350.0, 232.0, 142.0, 92.0, 65.0, 36.0, 22.0, 28.0, 16.0, 17.0, 19.0, 10.0, 13.0, 10.0, 7.0, 1.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.029266357421875, -0.028420686721801758, -0.027575016021728516, -0.026729345321655273, -0.02588367462158203, -0.02503800392150879, -0.024192333221435547, -0.023346662521362305, -0.022500991821289062, -0.02165532112121582, -0.020809650421142578, -0.019963979721069336, -0.019118309020996094, -0.01827263832092285, -0.01742696762084961, -0.016581296920776367, -0.015735626220703125, -0.014889955520629883, -0.01404428482055664, -0.013198614120483398, -0.012352943420410156, -0.011507272720336914, -0.010661602020263672, -0.00981593132019043, -0.008970260620117188, -0.008124589920043945, -0.007278919219970703, -0.006433248519897461, -0.005587577819824219, -0.0047419071197509766, -0.0038962364196777344, -0.003050565719604492, -0.00220489501953125, -0.0013592243194580078, -0.0005135536193847656, 0.00033211708068847656, 0.0011777877807617188, 0.002023458480834961, 0.002869129180908203, 0.0037147998809814453, 0.0045604705810546875, 0.00540614128112793, 0.006251811981201172, 0.007097482681274414, 0.007943153381347656, 0.008788824081420898, 0.00963449478149414, 0.010480165481567383, 0.011325836181640625, 0.012171506881713867, 0.01301717758178711, 0.013862848281860352, 0.014708518981933594, 0.015554189682006836, 0.016399860382080078, 0.01724553108215332, 0.018091201782226562, 0.018936872482299805, 0.019782543182373047, 0.02062821388244629, 0.02147388458251953, 0.022319555282592773, 0.023165225982666016, 0.024010896682739258, 0.0248565673828125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 26.0, 505.0, 456.0, 26.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000415960093960166, -0.00027560224407352507, -0.00013524439418688416, 5.1134556997567415e-06, 0.00014547130558639765, 0.000285829184576869, 0.00042618700535967946, 0.0005665448261424899, 0.0007069027051329613, 0.0008472605841234326, 0.000987618463113904, 0.0011279762256890535, 0.001268334104679525, 0.0014086919836699963, 0.0015490497462451458, 0.0016894076252356172, 0.0018297655042260885, 0.001970123266801238, 0.0021104812622070312, 0.002250839024782181, 0.0023911967873573303, 0.0025315547827631235, 0.002671912545338273, 0.0028122705407440662, 0.0029526283033192158, 0.0030929860658943653, 0.0032333440613001585, 0.003373701823875308, 0.0035140598192811012, 0.0036544175818562508, 0.0037947753444314003, 0.00393513310700655, 0.004075490869581699, 0.004215848632156849, 0.0043562063947319984, 0.004496564622968435, 0.004636922385543585, 0.004777280148118734, 0.004917637910693884, 0.005057995673269033, 0.00519835390150547, 0.00533871166408062, 0.005479069426655769, 0.005619427654892206, 0.005759785417467356, 0.005900143180042505, 0.006040500942617655, 0.006180858705192804, 0.006321216467767954, 0.006461574230343103, 0.006601931992918253, 0.00674229022115469, 0.006882647983729839, 0.007023005746304989, 0.007163363508880138, 0.007303721271455288, 0.0074440790340304375, 0.007584436796605587, 0.0077247945591807365, 0.007865152321755886, 0.008005510084331036, 0.00814586877822876, 0.00828622654080391, 0.008426584303379059, 0.008566942065954208]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 8.0, 2.0, 6.0, 5.0, 9.0, 10.0, 9.0, 16.0, 16.0, 19.0, 19.0, 20.0, 27.0, 27.0, 24.0, 44.0, 31.0, 40.0, 54.0, 29.0, 37.0, 36.0, 39.0, 42.0, 36.0, 30.0, 35.0, 39.0, 30.0, 36.0, 32.0, 35.0, 22.0, 28.0, 21.0, 15.0, 12.0, 13.0, 16.0, 12.0, 4.0, 5.0, 3.0, 2.0, 5.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005609989166259766, -0.0005428865551948547, -0.0005247741937637329, -0.0005066618323326111, -0.0004885494709014893, -0.00047043710947036743, -0.0004523247480392456, -0.0004342123866081238, -0.00041610002517700195, -0.0003979876637458801, -0.0003798753023147583, -0.0003617629408836365, -0.00034365057945251465, -0.0003255382180213928, -0.000307425856590271, -0.00028931349515914917, -0.00027120113372802734, -0.0002530887722969055, -0.0002349764108657837, -0.00021686404943466187, -0.00019875168800354004, -0.0001806393265724182, -0.0001625269651412964, -0.00014441460371017456, -0.00012630224227905273, -0.00010818988084793091, -9.007751941680908e-05, -7.196515798568726e-05, -5.385279655456543e-05, -3.5740435123443604e-05, -1.7628073692321777e-05, 4.842877388000488e-07, 1.8596649169921875e-05, 3.67090106010437e-05, 5.482137203216553e-05, 7.293373346328735e-05, 9.104609489440918e-05, 0.000109158456325531, 0.00012727081775665283, 0.00014538317918777466, 0.00016349554061889648, 0.0001816079020500183, 0.00019972026348114014, 0.00021783262491226196, 0.0002359449863433838, 0.0002540573477745056, 0.00027216970920562744, 0.00029028207063674927, 0.0003083944320678711, 0.0003265067934989929, 0.00034461915493011475, 0.00036273151636123657, 0.0003808438777923584, 0.0003989562392234802, 0.00041706860065460205, 0.0004351809620857239, 0.0004532933235168457, 0.00047140568494796753, 0.0004895180463790894, 0.0005076304078102112, 0.000525742769241333, 0.0005438551306724548, 0.0005619674921035767, 0.0005800798535346985, 0.0005981922149658203]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 11.0, 11.0, 8.0, 14.0, 15.0, 21.0, 23.0, 25.0, 28.0, 29.0, 23.0, 39.0, 29.0, 38.0, 44.0, 34.0, 61.0, 35.0, 56.0, 46.0, 40.0, 39.0, 41.0, 36.0, 21.0, 31.0, 21.0, 26.0, 23.0, 18.0, 15.0, 12.0, 17.0, 6.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0], "bins": [-11.1171875, -10.7828369140625, -10.448486328125, -10.1141357421875, -9.77978515625, -9.4454345703125, -9.111083984375, -8.7767333984375, -8.4423828125, -8.1080322265625, -7.773681640625, -7.4393310546875, -7.10498046875, -6.7706298828125, -6.436279296875, -6.1019287109375, -5.767578125, -5.4332275390625, -5.098876953125, -4.7645263671875, -4.43017578125, -4.0958251953125, -3.761474609375, -3.4271240234375, -3.0927734375, -2.7584228515625, -2.424072265625, -2.0897216796875, -1.75537109375, -1.4210205078125, -1.086669921875, -0.7523193359375, -0.41796875, -0.0836181640625, 0.250732421875, 0.5850830078125, 0.91943359375, 1.2537841796875, 1.588134765625, 1.9224853515625, 2.2568359375, 2.5911865234375, 2.925537109375, 3.2598876953125, 3.59423828125, 3.9285888671875, 4.262939453125, 4.5972900390625, 4.931640625, 5.2659912109375, 5.600341796875, 5.9346923828125, 6.26904296875, 6.6033935546875, 6.937744140625, 7.2720947265625, 7.6064453125, 7.9407958984375, 8.275146484375, 8.6094970703125, 8.94384765625, 9.2781982421875, 9.612548828125, 9.9468994140625, 10.28125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 4.0, 5.0, 8.0, 6.0, 9.0, 15.0, 17.0, 29.0, 34.0, 44.0, 75.0, 71.0, 104.0, 152.0, 210.0, 308.0, 445.0, 788.0, 1364.0, 2788.0, 5919.0, 14935.0, 41089.0, 131726.0, 425221.0, 292919.0, 83025.0, 27388.0, 10355.0, 4337.0, 2073.0, 1069.0, 651.0, 384.0, 267.0, 192.0, 139.0, 92.0, 79.0, 56.0, 32.0, 37.0, 32.0, 16.0, 13.0, 11.0, 6.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-12.9921875, -12.583740234375, -12.17529296875, -11.766845703125, -11.3583984375, -10.949951171875, -10.54150390625, -10.133056640625, -9.724609375, -9.316162109375, -8.90771484375, -8.499267578125, -8.0908203125, -7.682373046875, -7.27392578125, -6.865478515625, -6.45703125, -6.048583984375, -5.64013671875, -5.231689453125, -4.8232421875, -4.414794921875, -4.00634765625, -3.597900390625, -3.189453125, -2.781005859375, -2.37255859375, -1.964111328125, -1.5556640625, -1.147216796875, -0.73876953125, -0.330322265625, 0.078125, 0.486572265625, 0.89501953125, 1.303466796875, 1.7119140625, 2.120361328125, 2.52880859375, 2.937255859375, 3.345703125, 3.754150390625, 4.16259765625, 4.571044921875, 4.9794921875, 5.387939453125, 5.79638671875, 6.204833984375, 6.61328125, 7.021728515625, 7.43017578125, 7.838623046875, 8.2470703125, 8.655517578125, 9.06396484375, 9.472412109375, 9.880859375, 10.289306640625, 10.69775390625, 11.106201171875, 11.5146484375, 11.923095703125, 12.33154296875, 12.739990234375, 13.1484375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 7.0, 9.0, 8.0, 11.0, 16.0, 10.0, 18.0, 23.0, 17.0, 17.0, 31.0, 34.0, 38.0, 41.0, 41.0, 53.0, 76.0, 105.0, 192.0, 1431.0, 246.0, 137.0, 79.0, 63.0, 52.0, 32.0, 38.0, 18.0, 22.0, 25.0, 22.0, 16.0, 18.0, 14.0, 10.0, 10.0, 19.0, 7.0, 9.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-24.328125, -23.509033203125, -22.68994140625, -21.870849609375, -21.0517578125, -20.232666015625, -19.41357421875, -18.594482421875, -17.775390625, -16.956298828125, -16.13720703125, -15.318115234375, -14.4990234375, -13.679931640625, -12.86083984375, -12.041748046875, -11.22265625, -10.403564453125, -9.58447265625, -8.765380859375, -7.9462890625, -7.127197265625, -6.30810546875, -5.489013671875, -4.669921875, -3.850830078125, -3.03173828125, -2.212646484375, -1.3935546875, -0.574462890625, 0.24462890625, 1.063720703125, 1.8828125, 2.701904296875, 3.52099609375, 4.340087890625, 5.1591796875, 5.978271484375, 6.79736328125, 7.616455078125, 8.435546875, 9.254638671875, 10.07373046875, 10.892822265625, 11.7119140625, 12.531005859375, 13.35009765625, 14.169189453125, 14.98828125, 15.807373046875, 16.62646484375, 17.445556640625, 18.2646484375, 19.083740234375, 19.90283203125, 20.721923828125, 21.541015625, 22.360107421875, 23.17919921875, 23.998291015625, 24.8173828125, 25.636474609375, 26.45556640625, 27.274658203125, 28.09375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 8.0, 5.0, 11.0, 22.0, 25.0, 22.0, 45.0, 37.0, 60.0, 80.0, 132.0, 148.0, 243.0, 391.0, 787.0, 3349.0, 88778.0, 2985383.0, 61483.0, 2671.0, 702.0, 368.0, 268.0, 172.0, 115.0, 93.0, 78.0, 47.0, 45.0, 24.0, 16.0, 18.0, 19.0, 11.0, 6.0, 10.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.09375, -49.51953125, -47.9453125, -46.37109375, -44.796875, -43.22265625, -41.6484375, -40.07421875, -38.5, -36.92578125, -35.3515625, -33.77734375, -32.203125, -30.62890625, -29.0546875, -27.48046875, -25.90625, -24.33203125, -22.7578125, -21.18359375, -19.609375, -18.03515625, -16.4609375, -14.88671875, -13.3125, -11.73828125, -10.1640625, -8.58984375, -7.015625, -5.44140625, -3.8671875, -2.29296875, -0.71875, 0.85546875, 2.4296875, 4.00390625, 5.578125, 7.15234375, 8.7265625, 10.30078125, 11.875, 13.44921875, 15.0234375, 16.59765625, 18.171875, 19.74609375, 21.3203125, 22.89453125, 24.46875, 26.04296875, 27.6171875, 29.19140625, 30.765625, 32.33984375, 33.9140625, 35.48828125, 37.0625, 38.63671875, 40.2109375, 41.78515625, 43.359375, 44.93359375, 46.5078125, 48.08203125, 49.65625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 206.0, 749.0, 50.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-438.3736267089844, -430.7219543457031, -423.07025146484375, -415.4185791015625, -407.76690673828125, -400.1152038574219, -392.4635314941406, -384.81182861328125, -377.16015625, -369.50848388671875, -361.8567810058594, -354.2051086425781, -346.5534362792969, -338.9017333984375, -331.25006103515625, -323.598388671875, -315.9466857910156, -308.2950134277344, -300.643310546875, -292.99163818359375, -285.3399658203125, -277.6882629394531, -270.0365905761719, -262.3848876953125, -254.7332305908203, -247.08154296875, -239.42987060546875, -231.77818298339844, -224.12649536132812, -216.47482299804688, -208.82313537597656, -201.17144775390625, -193.519775390625, -185.8680877685547, -178.21641540527344, -170.56472778320312, -162.9130401611328, -155.2613525390625, -147.60968017578125, -139.95799255371094, -132.30630493164062, -124.65462493896484, -117.00293731689453, -109.35125732421875, -101.69956970214844, -94.04788970947266, -86.39620971679688, -78.74452209472656, -71.09283447265625, -63.4411506652832, -55.789466857910156, -48.137786865234375, -40.48609924316406, -32.83441925048828, -25.182735443115234, -17.531051635742188, -9.879371643066406, -2.2276883125305176, 5.423995018005371, 13.075677871704102, 20.72736167907715, 28.379043579101562, 36.03072738647461, 43.682411193847656, 51.3340950012207]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 10.0, 8.0, 7.0, 11.0, 17.0, 18.0, 12.0, 19.0, 23.0, 27.0, 21.0, 34.0, 28.0, 29.0, 27.0, 39.0, 33.0, 34.0, 45.0, 38.0, 27.0, 51.0, 36.0, 31.0, 39.0, 26.0, 24.0, 42.0, 20.0, 31.0, 34.0, 30.0, 20.0, 12.0, 16.0, 16.0, 14.0, 10.0, 5.0, 2.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.45185852050781, -56.57313537597656, -54.69441223144531, -52.81568908691406, -50.93696594238281, -49.05824279785156, -47.17952346801758, -45.30080032348633, -43.42207717895508, -41.54335403442383, -39.66463088989258, -37.78590774536133, -35.907188415527344, -34.028465270996094, -32.149742126464844, -30.271018981933594, -28.392295837402344, -26.513572692871094, -24.634849548339844, -22.756128311157227, -20.877405166625977, -18.998682022094727, -17.11996078491211, -15.24123764038086, -13.36251449584961, -11.48379135131836, -9.605069160461426, -7.726346492767334, -5.847623825073242, -3.968900680541992, -2.0901784896850586, -0.211456298828125, 1.6672630310058594, 3.545985698699951, 5.424708366394043, 7.303431034088135, 9.182153701782227, 11.060876846313477, 12.93959903717041, 14.818321228027344, 16.697044372558594, 18.575767517089844, 20.454490661621094, 22.33321189880371, 24.21193504333496, 26.09065818786621, 27.969379425048828, 29.848102569580078, 31.726825714111328, 33.60554885864258, 35.48427200317383, 37.36299514770508, 39.24171447753906, 41.12043762207031, 42.99916076660156, 44.87788391113281, 46.75660705566406, 48.63533020019531, 50.51405334472656, 52.39277648925781, 54.27149963378906, 56.15022277832031, 58.0289421081543, 59.90766525268555, 61.7863883972168]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 9.0, 11.0, 10.0, 9.0, 9.0, 17.0, 16.0, 22.0, 22.0, 27.0, 33.0, 35.0, 27.0, 41.0, 41.0, 52.0, 41.0, 46.0, 53.0, 40.0, 39.0, 52.0, 41.0, 44.0, 45.0, 31.0, 30.0, 19.0, 23.0, 23.0, 18.0, 14.0, 10.0, 14.0, 10.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6824951171875, -11.310302734375, -10.9381103515625, -10.56591796875, -10.1937255859375, -9.821533203125, -9.4493408203125, -9.0771484375, -8.7049560546875, -8.332763671875, -7.9605712890625, -7.58837890625, -7.2161865234375, -6.843994140625, -6.4718017578125, -6.099609375, -5.7274169921875, -5.355224609375, -4.9830322265625, -4.61083984375, -4.2386474609375, -3.866455078125, -3.4942626953125, -3.1220703125, -2.7498779296875, -2.377685546875, -2.0054931640625, -1.63330078125, -1.2611083984375, -0.888916015625, -0.5167236328125, -0.14453125, 0.2276611328125, 0.599853515625, 0.9720458984375, 1.34423828125, 1.7164306640625, 2.088623046875, 2.4608154296875, 2.8330078125, 3.2052001953125, 3.577392578125, 3.9495849609375, 4.32177734375, 4.6939697265625, 5.066162109375, 5.4383544921875, 5.810546875, 6.1827392578125, 6.554931640625, 6.9271240234375, 7.29931640625, 7.6715087890625, 8.043701171875, 8.4158935546875, 8.7880859375, 9.1602783203125, 9.532470703125, 9.9046630859375, 10.27685546875, 10.6490478515625, 11.021240234375, 11.3934326171875, 11.765625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 13.0, 10.0, 9.0, 15.0, 13.0, 16.0, 28.0, 37.0, 28.0, 50.0, 50.0, 86.0, 108.0, 153.0, 195.0, 241.0, 308.0, 431.0, 1472.0, 4186444.0, 2542.0, 510.0, 373.0, 303.0, 208.0, 132.0, 128.0, 90.0, 60.0, 43.0, 34.0, 35.0, 23.0, 17.0, 18.0, 7.0, 10.0, 5.0, 4.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0], "bins": [-280.5, -272.6171875, -264.734375, -256.8515625, -248.96875, -241.0859375, -233.203125, -225.3203125, -217.4375, -209.5546875, -201.671875, -193.7890625, -185.90625, -178.0234375, -170.140625, -162.2578125, -154.375, -146.4921875, -138.609375, -130.7265625, -122.84375, -114.9609375, -107.078125, -99.1953125, -91.3125, -83.4296875, -75.546875, -67.6640625, -59.78125, -51.8984375, -44.015625, -36.1328125, -28.25, -20.3671875, -12.484375, -4.6015625, 3.28125, 11.1640625, 19.046875, 26.9296875, 34.8125, 42.6953125, 50.578125, 58.4609375, 66.34375, 74.2265625, 82.109375, 89.9921875, 97.875, 105.7578125, 113.640625, 121.5234375, 129.40625, 137.2890625, 145.171875, 153.0546875, 160.9375, 168.8203125, 176.703125, 184.5859375, 192.46875, 200.3515625, 208.234375, 216.1171875, 224.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 7.0, 19.0, 14.0, 17.0, 25.0, 34.0, 35.0, 76.0, 80.0, 119.0, 182.0, 311.0, 463.0, 637.0, 638.0, 477.0, 300.0, 193.0, 122.0, 79.0, 63.0, 38.0, 36.0, 24.0, 15.0, 11.0, 11.0, 8.0, 4.0, 5.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.34375, -15.779541015625, -15.21533203125, -14.651123046875, -14.0869140625, -13.522705078125, -12.95849609375, -12.394287109375, -11.830078125, -11.265869140625, -10.70166015625, -10.137451171875, -9.5732421875, -9.009033203125, -8.44482421875, -7.880615234375, -7.31640625, -6.752197265625, -6.18798828125, -5.623779296875, -5.0595703125, -4.495361328125, -3.93115234375, -3.366943359375, -2.802734375, -2.238525390625, -1.67431640625, -1.110107421875, -0.5458984375, 0.018310546875, 0.58251953125, 1.146728515625, 1.7109375, 2.275146484375, 2.83935546875, 3.403564453125, 3.9677734375, 4.531982421875, 5.09619140625, 5.660400390625, 6.224609375, 6.788818359375, 7.35302734375, 7.917236328125, 8.4814453125, 9.045654296875, 9.60986328125, 10.174072265625, 10.73828125, 11.302490234375, 11.86669921875, 12.430908203125, 12.9951171875, 13.559326171875, 14.12353515625, 14.687744140625, 15.251953125, 15.816162109375, 16.38037109375, 16.944580078125, 17.5087890625, 18.072998046875, 18.63720703125, 19.201416015625, 19.765625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 7.0, 10.0, 11.0, 18.0, 10.0, 15.0, 27.0, 17.0, 25.0, 33.0, 32.0, 46.0, 59.0, 69.0, 104.0, 323.0, 3320.0, 4091300.0, 97433.0, 786.0, 204.0, 77.0, 52.0, 46.0, 45.0, 32.0, 25.0, 30.0, 21.0, 17.0, 15.0, 16.0, 8.0, 6.0, 7.0, 9.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.5, -98.521484375, -94.54296875, -90.564453125, -86.5859375, -82.607421875, -78.62890625, -74.650390625, -70.671875, -66.693359375, -62.71484375, -58.736328125, -54.7578125, -50.779296875, -46.80078125, -42.822265625, -38.84375, -34.865234375, -30.88671875, -26.908203125, -22.9296875, -18.951171875, -14.97265625, -10.994140625, -7.015625, -3.037109375, 0.94140625, 4.919921875, 8.8984375, 12.876953125, 16.85546875, 20.833984375, 24.8125, 28.791015625, 32.76953125, 36.748046875, 40.7265625, 44.705078125, 48.68359375, 52.662109375, 56.640625, 60.619140625, 64.59765625, 68.576171875, 72.5546875, 76.533203125, 80.51171875, 84.490234375, 88.46875, 92.447265625, 96.42578125, 100.404296875, 104.3828125, 108.361328125, 112.33984375, 116.318359375, 120.296875, 124.275390625, 128.25390625, 132.232421875, 136.2109375, 140.189453125, 144.16796875, 148.146484375, 152.125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 195.0, 658.0, 152.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-371.9729309082031, -361.7693786621094, -351.5658264160156, -341.3623046875, -331.15875244140625, -320.9552001953125, -310.75164794921875, -300.548095703125, -290.34454345703125, -280.1409912109375, -269.93743896484375, -259.7339172363281, -249.53036499023438, -239.32681274414062, -229.12326049804688, -218.91970825195312, -208.7161865234375, -198.51263427734375, -188.30909729003906, -178.1055450439453, -167.90200805664062, -157.69845581054688, -147.49490356445312, -137.29135131835938, -127.08781433105469, -116.88426971435547, -106.68072509765625, -96.4771728515625, -86.27362823486328, -76.07008361816406, -65.86653137207031, -55.662986755371094, -45.45947265625, -35.25592803955078, -25.052379608154297, -14.848833084106445, -4.645286560058594, 5.558258056640625, 15.76180648803711, 25.965354919433594, 36.16889953613281, 46.37244415283203, 56.575992584228516, 66.779541015625, 76.98308563232422, 87.18663024902344, 97.39018249511719, 107.5937271118164, 117.79727172851562, 128.00082397460938, 138.20436096191406, 148.4079132080078, 158.6114501953125, 168.81500244140625, 179.0185546875, 189.22210693359375, 199.42564392089844, 209.6291961669922, 219.83273315429688, 230.03628540039062, 240.23983764648438, 250.44337463378906, 260.64691162109375, 270.8504638671875, 281.05401611328125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 11.0, 10.0, 9.0, 11.0, 17.0, 30.0, 21.0, 29.0, 37.0, 23.0, 48.0, 37.0, 37.0, 48.0, 47.0, 56.0, 46.0, 47.0, 48.0, 42.0, 60.0, 31.0, 40.0, 41.0, 24.0, 23.0, 22.0, 16.0, 17.0, 12.0, 10.0, 14.0, 8.0, 9.0, 8.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.5775146484375, -58.57398986816406, -56.570465087890625, -54.56694030761719, -52.56341552734375, -50.55989074707031, -48.556365966796875, -46.55284118652344, -44.54931640625, -42.54579162597656, -40.542266845703125, -38.53874206542969, -36.53521728515625, -34.53169250488281, -32.528167724609375, -30.524642944335938, -28.5211181640625, -26.517593383789062, -24.514068603515625, -22.510543823242188, -20.50701904296875, -18.503494262695312, -16.499969482421875, -14.496444702148438, -12.492919921875, -10.489395141601562, -8.485870361328125, -6.4823455810546875, -4.47882080078125, -2.4752960205078125, -0.471771240234375, 1.5317535400390625, 3.5352783203125, 5.5388031005859375, 7.542327880859375, 9.545852661132812, 11.54937744140625, 13.552902221679688, 15.556427001953125, 17.559951782226562, 19.5634765625, 21.567001342773438, 23.570526123046875, 25.574050903320312, 27.57757568359375, 29.581100463867188, 31.584625244140625, 33.58815002441406, 35.5916748046875, 37.59519958496094, 39.598724365234375, 41.60224914550781, 43.60577392578125, 45.60929870605469, 47.612823486328125, 49.61634826660156, 51.619873046875, 53.62339782714844, 55.626922607421875, 57.63044738769531, 59.63397216796875, 61.63749694824219, 63.641021728515625, 65.64454650878906, 67.6480712890625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 10.0, 4.0, 14.0, 15.0, 13.0, 21.0, 16.0, 22.0, 24.0, 43.0, 34.0, 42.0, 44.0, 41.0, 41.0, 50.0, 44.0, 52.0, 42.0, 53.0, 46.0, 29.0, 43.0, 44.0, 21.0, 23.0, 27.0, 18.0, 20.0, 20.0, 15.0, 15.0, 11.0, 8.0, 5.0, 5.0, 2.0, 5.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-12.6796875, -12.3193359375, -11.958984375, -11.5986328125, -11.23828125, -10.8779296875, -10.517578125, -10.1572265625, -9.796875, -9.4365234375, -9.076171875, -8.7158203125, -8.35546875, -7.9951171875, -7.634765625, -7.2744140625, -6.9140625, -6.5537109375, -6.193359375, -5.8330078125, -5.47265625, -5.1123046875, -4.751953125, -4.3916015625, -4.03125, -3.6708984375, -3.310546875, -2.9501953125, -2.58984375, -2.2294921875, -1.869140625, -1.5087890625, -1.1484375, -0.7880859375, -0.427734375, -0.0673828125, 0.29296875, 0.6533203125, 1.013671875, 1.3740234375, 1.734375, 2.0947265625, 2.455078125, 2.8154296875, 3.17578125, 3.5361328125, 3.896484375, 4.2568359375, 4.6171875, 4.9775390625, 5.337890625, 5.6982421875, 6.05859375, 6.4189453125, 6.779296875, 7.1396484375, 7.5, 7.8603515625, 8.220703125, 8.5810546875, 8.94140625, 9.3017578125, 9.662109375, 10.0224609375, 10.3828125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 4.0, 9.0, 17.0, 22.0, 27.0, 35.0, 45.0, 67.0, 108.0, 155.0, 209.0, 327.0, 437.0, 640.0, 950.0, 1375.0, 2116.0, 3258.0, 4931.0, 7236.0, 10837.0, 16987.0, 26770.0, 43650.0, 74401.0, 144206.0, 324245.0, 170056.0, 83205.0, 48363.0, 29300.0, 18771.0, 12128.0, 7921.0, 5181.0, 3427.0, 2309.0, 1581.0, 1113.0, 662.0, 480.0, 307.0, 235.0, 130.0, 106.0, 73.0, 44.0, 34.0, 20.0, 20.0, 9.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.228515625, -2.153228759765625, -2.07794189453125, -2.002655029296875, -1.9273681640625, -1.852081298828125, -1.77679443359375, -1.701507568359375, -1.626220703125, -1.550933837890625, -1.47564697265625, -1.400360107421875, -1.3250732421875, -1.249786376953125, -1.17449951171875, -1.099212646484375, -1.02392578125, -0.948638916015625, -0.87335205078125, -0.798065185546875, -0.7227783203125, -0.647491455078125, -0.57220458984375, -0.496917724609375, -0.421630859375, -0.346343994140625, -0.27105712890625, -0.195770263671875, -0.1204833984375, -0.045196533203125, 0.03009033203125, 0.105377197265625, 0.1806640625, 0.255950927734375, 0.33123779296875, 0.406524658203125, 0.4818115234375, 0.557098388671875, 0.63238525390625, 0.707672119140625, 0.782958984375, 0.858245849609375, 0.93353271484375, 1.008819580078125, 1.0841064453125, 1.159393310546875, 1.23468017578125, 1.309967041015625, 1.38525390625, 1.460540771484375, 1.53582763671875, 1.611114501953125, 1.6864013671875, 1.761688232421875, 1.83697509765625, 1.912261962890625, 1.987548828125, 2.062835693359375, 2.13812255859375, 2.213409423828125, 2.2886962890625, 2.363983154296875, 2.43927001953125, 2.514556884765625, 2.58984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 9.0, 10.0, 12.0, 20.0, 20.0, 20.0, 18.0, 26.0, 21.0, 32.0, 41.0, 48.0, 42.0, 52.0, 47.0, 39.0, 1077.0, 48.0, 50.0, 43.0, 36.0, 38.0, 40.0, 28.0, 36.0, 27.0, 18.0, 24.0, 20.0, 15.0, 8.0, 13.0, 6.0, 5.0, 6.0, 2.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.63543701171875, -6.3997802734375, -6.16412353515625, -5.928466796875, -5.69281005859375, -5.4571533203125, -5.22149658203125, -4.98583984375, -4.75018310546875, -4.5145263671875, -4.27886962890625, -4.043212890625, -3.80755615234375, -3.5718994140625, -3.33624267578125, -3.1005859375, -2.86492919921875, -2.6292724609375, -2.39361572265625, -2.157958984375, -1.92230224609375, -1.6866455078125, -1.45098876953125, -1.21533203125, -0.97967529296875, -0.7440185546875, -0.50836181640625, -0.272705078125, -0.03704833984375, 0.1986083984375, 0.43426513671875, 0.669921875, 0.90557861328125, 1.1412353515625, 1.37689208984375, 1.612548828125, 1.84820556640625, 2.0838623046875, 2.31951904296875, 2.55517578125, 2.79083251953125, 3.0264892578125, 3.26214599609375, 3.497802734375, 3.73345947265625, 3.9691162109375, 4.20477294921875, 4.4404296875, 4.67608642578125, 4.9117431640625, 5.14739990234375, 5.383056640625, 5.61871337890625, 5.8543701171875, 6.09002685546875, 6.32568359375, 6.56134033203125, 6.7969970703125, 7.03265380859375, 7.268310546875, 7.50396728515625, 7.7396240234375, 7.97528076171875, 8.2109375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 9.0, 14.0, 26.0, 30.0, 45.0, 75.0, 99.0, 144.0, 236.0, 340.0, 554.0, 864.0, 1276.0, 2029.0, 3173.0, 5050.0, 8162.0, 13050.0, 21188.0, 34456.0, 59828.0, 111752.0, 1329829.0, 254400.0, 106158.0, 57220.0, 33202.0, 20189.0, 12452.0, 7860.0, 4773.0, 3085.0, 1990.0, 1217.0, 816.0, 509.0, 333.0, 239.0, 150.0, 101.0, 73.0, 42.0, 33.0, 19.0, 17.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.451171875, -2.374481201171875, -2.29779052734375, -2.221099853515625, -2.1444091796875, -2.067718505859375, -1.99102783203125, -1.914337158203125, -1.837646484375, -1.760955810546875, -1.68426513671875, -1.607574462890625, -1.5308837890625, -1.454193115234375, -1.37750244140625, -1.300811767578125, -1.22412109375, -1.147430419921875, -1.07073974609375, -0.994049072265625, -0.9173583984375, -0.840667724609375, -0.76397705078125, -0.687286376953125, -0.610595703125, -0.533905029296875, -0.45721435546875, -0.380523681640625, -0.3038330078125, -0.227142333984375, -0.15045166015625, -0.073760986328125, 0.0029296875, 0.079620361328125, 0.15631103515625, 0.233001708984375, 0.3096923828125, 0.386383056640625, 0.46307373046875, 0.539764404296875, 0.616455078125, 0.693145751953125, 0.76983642578125, 0.846527099609375, 0.9232177734375, 0.999908447265625, 1.07659912109375, 1.153289794921875, 1.22998046875, 1.306671142578125, 1.38336181640625, 1.460052490234375, 1.5367431640625, 1.613433837890625, 1.69012451171875, 1.766815185546875, 1.843505859375, 1.920196533203125, 1.99688720703125, 2.073577880859375, 2.1502685546875, 2.226959228515625, 2.30364990234375, 2.380340576171875, 2.45703125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 5.0, 4.0, 10.0, 14.0, 16.0, 17.0, 36.0, 40.0, 66.0, 102.0, 122.0, 142.0, 109.0, 99.0, 61.0, 45.0, 27.0, 23.0, 16.0, 18.0, 8.0, 8.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0023651123046875, -0.00230194628238678, -0.0022387802600860596, -0.0021756142377853394, -0.002112448215484619, -0.002049282193183899, -0.0019861161708831787, -0.0019229501485824585, -0.0018597841262817383, -0.001796618103981018, -0.0017334520816802979, -0.0016702860593795776, -0.0016071200370788574, -0.0015439540147781372, -0.001480787992477417, -0.0014176219701766968, -0.0013544559478759766, -0.0012912899255752563, -0.0012281239032745361, -0.001164957880973816, -0.0011017918586730957, -0.0010386258363723755, -0.0009754598140716553, -0.0009122937917709351, -0.0008491277694702148, -0.0007859617471694946, -0.0007227957248687744, -0.0006596297025680542, -0.000596463680267334, -0.0005332976579666138, -0.00047013163566589355, -0.00040696561336517334, -0.0003437995910644531, -0.0002806335687637329, -0.0002174675464630127, -0.00015430152416229248, -9.113550186157227e-05, -2.796947956085205e-05, 3.5196542739868164e-05, 9.836256504058838e-05, 0.0001615285873413086, 0.0002246946096420288, 0.000287860631942749, 0.00035102665424346924, 0.00041419267654418945, 0.00047735869884490967, 0.0005405247211456299, 0.0006036907434463501, 0.0006668567657470703, 0.0007300227880477905, 0.0007931888103485107, 0.000856354832649231, 0.0009195208549499512, 0.0009826868772506714, 0.0010458528995513916, 0.0011090189218521118, 0.001172184944152832, 0.0012353509664535522, 0.0012985169887542725, 0.0013616830110549927, 0.0014248490333557129, 0.001488015055656433, 0.0015511810779571533, 0.0016143471002578735, 0.0016775131225585938]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 4.0, 10.0, 16.0, 34.0, 41.0, 53.0, 91.0, 139.0, 261.0, 478.0, 1308.0, 1005466.0, 38851.0, 876.0, 365.0, 203.0, 120.0, 67.0, 49.0, 26.0, 25.0, 19.0, 14.0, 8.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0290069580078125, -0.027925729751586914, -0.026844501495361328, -0.025763273239135742, -0.024682044982910156, -0.02360081672668457, -0.022519588470458984, -0.0214383602142334, -0.020357131958007812, -0.019275903701782227, -0.01819467544555664, -0.017113447189331055, -0.01603221893310547, -0.014950990676879883, -0.013869762420654297, -0.012788534164428711, -0.011707305908203125, -0.010626077651977539, -0.009544849395751953, -0.008463621139526367, -0.007382392883300781, -0.006301164627075195, -0.005219936370849609, -0.0041387081146240234, -0.0030574798583984375, -0.0019762516021728516, -0.0008950233459472656, 0.0001862049102783203, 0.0012674331665039062, 0.002348661422729492, 0.003429889678955078, 0.004511117935180664, 0.00559234619140625, 0.006673574447631836, 0.007754802703857422, 0.008836030960083008, 0.009917259216308594, 0.01099848747253418, 0.012079715728759766, 0.013160943984985352, 0.014242172241210938, 0.015323400497436523, 0.01640462875366211, 0.017485857009887695, 0.01856708526611328, 0.019648313522338867, 0.020729541778564453, 0.02181077003479004, 0.022891998291015625, 0.02397322654724121, 0.025054454803466797, 0.026135683059692383, 0.02721691131591797, 0.028298139572143555, 0.02937936782836914, 0.030460596084594727, 0.03154182434082031, 0.0326230525970459, 0.033704280853271484, 0.03478550910949707, 0.035866737365722656, 0.03694796562194824, 0.03802919387817383, 0.039110422134399414, 0.040191650390625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 59.0, 341.0, 457.0, 134.0, 12.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011018937220796943, -0.0010183961130678654, -0.0009348986204713583, -0.0008514010114595294, -0.0007679034606553614, -0.0006844059098511934, -0.0006009083008393645, -0.0005174107500351965, -0.00043391319923102856, -0.00035041564842686057, -0.00026691806851886213, -0.00018342048861086369, -9.99229378066957e-05, -1.6425387002527714e-05, 6.707222200930119e-05, 0.00015056977281346917, 0.00023406732361763716, 0.00031756487442180514, 0.0004010624543298036, 0.00048456003423780203, 0.00056805758504197, 0.000651555135846138, 0.0007350527448579669, 0.0008185502956621349, 0.0009020478464663029, 0.0009855454554781318, 0.0010690429480746388, 0.0011525405570864677, 0.0012360380496829748, 0.0013195356586948037, 0.0014030332677066326, 0.0014865307603031397, 0.0015700282528996468, 0.0016535258619114757, 0.0017370233545079827, 0.0018205209635198116, 0.0019040184561163187, 0.0019875159487128258, 0.0020710136741399765, 0.0021545111667364836, 0.0022380086593329906, 0.0023215061519294977, 0.0024050038773566484, 0.0024885013699531555, 0.0025719988625496626, 0.0026554963551461697, 0.0027389940805733204, 0.0028224915731698275, 0.002905989298596978, 0.0029894867911934853, 0.003072984516620636, 0.003156482009217143, 0.00323997950181365, 0.003323477227240801, 0.003406974719837308, 0.003490472212433815, 0.0035739699378609657, 0.003657467430457473, 0.0037409651558846235, 0.0038244626484811306, 0.003907960373908281, 0.003991457633674145, 0.0040749553591012955, 0.004158453084528446, 0.00424195034429431]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 15.0, 8.0, 10.0, 27.0, 24.0, 26.0, 28.0, 22.0, 35.0, 34.0, 37.0, 43.0, 52.0, 28.0, 39.0, 44.0, 38.0, 49.0, 42.0, 47.0, 44.0, 36.0, 33.0, 37.0, 28.0, 27.0, 15.0, 16.0, 17.0, 20.0, 12.0, 9.0, 9.0, 6.0, 5.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.000724494457244873, -0.0007041580975055695, -0.0006838217377662659, -0.0006634853780269623, -0.0006431490182876587, -0.0006228126585483551, -0.0006024762988090515, -0.0005821399390697479, -0.0005618035793304443, -0.0005414672195911407, -0.0005211308598518372, -0.0005007945001125336, -0.00048045814037323, -0.0004601217806339264, -0.0004397854208946228, -0.0004194490611553192, -0.0003991127014160156, -0.00037877634167671204, -0.00035843998193740845, -0.00033810362219810486, -0.00031776726245880127, -0.0002974309027194977, -0.0002770945429801941, -0.0002567581832408905, -0.00023642182350158691, -0.00021608546376228333, -0.00019574910402297974, -0.00017541274428367615, -0.00015507638454437256, -0.00013474002480506897, -0.00011440366506576538, -9.406730532646179e-05, -7.37309455871582e-05, -5.3394585847854614e-05, -3.3058226108551025e-05, -1.2721866369247437e-05, 7.614493370056152e-06, 2.795085310935974e-05, 4.828721284866333e-05, 6.862357258796692e-05, 8.895993232727051e-05, 0.0001092962920665741, 0.00012963265180587769, 0.00014996901154518127, 0.00017030537128448486, 0.00019064173102378845, 0.00021097809076309204, 0.00023131445050239563, 0.0002516508102416992, 0.0002719871699810028, 0.0002923235297203064, 0.00031265988945961, 0.0003329962491989136, 0.00035333260893821716, 0.00037366896867752075, 0.00039400532841682434, 0.00041434168815612793, 0.0004346780478954315, 0.0004550144076347351, 0.0004753507673740387, 0.0004956871271133423, 0.0005160234868526459, 0.0005363598465919495, 0.000556696206331253, 0.0005770325660705566]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 10.0, 4.0, 14.0, 15.0, 13.0, 21.0, 16.0, 22.0, 24.0, 43.0, 34.0, 42.0, 44.0, 41.0, 41.0, 50.0, 44.0, 52.0, 42.0, 53.0, 46.0, 29.0, 43.0, 44.0, 21.0, 23.0, 27.0, 18.0, 21.0, 19.0, 15.0, 15.0, 11.0, 8.0, 5.0, 5.0, 2.0, 5.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-12.6796875, -12.3193359375, -11.958984375, -11.5986328125, -11.23828125, -10.8779296875, -10.517578125, -10.1572265625, -9.796875, -9.4365234375, -9.076171875, -8.7158203125, -8.35546875, -7.9951171875, -7.634765625, -7.2744140625, -6.9140625, -6.5537109375, -6.193359375, -5.8330078125, -5.47265625, -5.1123046875, -4.751953125, -4.3916015625, -4.03125, -3.6708984375, -3.310546875, -2.9501953125, -2.58984375, -2.2294921875, -1.869140625, -1.5087890625, -1.1484375, -0.7880859375, -0.427734375, -0.0673828125, 0.29296875, 0.6533203125, 1.013671875, 1.3740234375, 1.734375, 2.0947265625, 2.455078125, 2.8154296875, 3.17578125, 3.5361328125, 3.896484375, 4.2568359375, 4.6171875, 4.9775390625, 5.337890625, 5.6982421875, 6.05859375, 6.4189453125, 6.779296875, 7.1396484375, 7.5, 7.8603515625, 8.220703125, 8.5810546875, 8.94140625, 9.3017578125, 9.662109375, 10.0224609375, 10.3828125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 8.0, 7.0, 14.0, 19.0, 24.0, 44.0, 55.0, 91.0, 109.0, 131.0, 206.0, 301.0, 408.0, 553.0, 745.0, 1109.0, 1645.0, 3571.0, 13413.0, 100194.0, 612909.0, 267951.0, 32206.0, 6098.0, 2272.0, 1268.0, 883.0, 645.0, 449.0, 372.0, 247.0, 174.0, 126.0, 92.0, 52.0, 44.0, 29.0, 31.0, 14.0, 16.0, 10.0, 8.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.865478515625, -18.23095703125, -17.596435546875, -16.9619140625, -16.327392578125, -15.69287109375, -15.058349609375, -14.423828125, -13.789306640625, -13.15478515625, -12.520263671875, -11.8857421875, -11.251220703125, -10.61669921875, -9.982177734375, -9.34765625, -8.713134765625, -8.07861328125, -7.444091796875, -6.8095703125, -6.175048828125, -5.54052734375, -4.906005859375, -4.271484375, -3.636962890625, -3.00244140625, -2.367919921875, -1.7333984375, -1.098876953125, -0.46435546875, 0.170166015625, 0.8046875, 1.439208984375, 2.07373046875, 2.708251953125, 3.3427734375, 3.977294921875, 4.61181640625, 5.246337890625, 5.880859375, 6.515380859375, 7.14990234375, 7.784423828125, 8.4189453125, 9.053466796875, 9.68798828125, 10.322509765625, 10.95703125, 11.591552734375, 12.22607421875, 12.860595703125, 13.4951171875, 14.129638671875, 14.76416015625, 15.398681640625, 16.033203125, 16.667724609375, 17.30224609375, 17.936767578125, 18.5712890625, 19.205810546875, 19.84033203125, 20.474853515625, 21.109375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 6.0, 7.0, 6.0, 14.0, 19.0, 17.0, 23.0, 32.0, 31.0, 44.0, 40.0, 56.0, 56.0, 67.0, 193.0, 1587.0, 293.0, 118.0, 70.0, 64.0, 47.0, 45.0, 32.0, 33.0, 20.0, 22.0, 13.0, 19.0, 9.0, 7.0, 12.0, 8.0, 8.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.40625, -32.38623046875, -31.3662109375, -30.34619140625, -29.326171875, -28.30615234375, -27.2861328125, -26.26611328125, -25.24609375, -24.22607421875, -23.2060546875, -22.18603515625, -21.166015625, -20.14599609375, -19.1259765625, -18.10595703125, -17.0859375, -16.06591796875, -15.0458984375, -14.02587890625, -13.005859375, -11.98583984375, -10.9658203125, -9.94580078125, -8.92578125, -7.90576171875, -6.8857421875, -5.86572265625, -4.845703125, -3.82568359375, -2.8056640625, -1.78564453125, -0.765625, 0.25439453125, 1.2744140625, 2.29443359375, 3.314453125, 4.33447265625, 5.3544921875, 6.37451171875, 7.39453125, 8.41455078125, 9.4345703125, 10.45458984375, 11.474609375, 12.49462890625, 13.5146484375, 14.53466796875, 15.5546875, 16.57470703125, 17.5947265625, 18.61474609375, 19.634765625, 20.65478515625, 21.6748046875, 22.69482421875, 23.71484375, 24.73486328125, 25.7548828125, 26.77490234375, 27.794921875, 28.81494140625, 29.8349609375, 30.85498046875, 31.875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 12.0, 12.0, 19.0, 21.0, 28.0, 31.0, 48.0, 48.0, 75.0, 91.0, 152.0, 233.0, 399.0, 762.0, 2227.0, 2767182.0, 370705.0, 1836.0, 706.0, 349.0, 214.0, 140.0, 103.0, 64.0, 47.0, 35.0, 23.0, 16.0, 23.0, 13.0, 14.0, 17.0, 7.0, 4.0, 5.0, 7.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-84.875, -82.130859375, -79.38671875, -76.642578125, -73.8984375, -71.154296875, -68.41015625, -65.666015625, -62.921875, -60.177734375, -57.43359375, -54.689453125, -51.9453125, -49.201171875, -46.45703125, -43.712890625, -40.96875, -38.224609375, -35.48046875, -32.736328125, -29.9921875, -27.248046875, -24.50390625, -21.759765625, -19.015625, -16.271484375, -13.52734375, -10.783203125, -8.0390625, -5.294921875, -2.55078125, 0.193359375, 2.9375, 5.681640625, 8.42578125, 11.169921875, 13.9140625, 16.658203125, 19.40234375, 22.146484375, 24.890625, 27.634765625, 30.37890625, 33.123046875, 35.8671875, 38.611328125, 41.35546875, 44.099609375, 46.84375, 49.587890625, 52.33203125, 55.076171875, 57.8203125, 60.564453125, 63.30859375, 66.052734375, 68.796875, 71.541015625, 74.28515625, 77.029296875, 79.7734375, 82.517578125, 85.26171875, 88.005859375, 90.75]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 46.0, 756.0, 208.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.02197265625, -182.2162322998047, -173.41049194335938, -164.60475158691406, -155.79901123046875, -146.99327087402344, -138.18753051757812, -129.3817901611328, -120.5760498046875, -111.77030944824219, -102.96456909179688, -94.15882873535156, -85.35308837890625, -76.54734802246094, -67.74160766601562, -58.93586730957031, -50.130126953125, -41.32438659667969, -32.518646240234375, -23.712905883789062, -14.90716552734375, -6.1014251708984375, 2.704315185546875, 11.510055541992188, 20.3157958984375, 29.121536254882812, 37.927276611328125, 46.73301696777344, 55.53875732421875, 64.34449768066406, 73.15023803710938, 81.95597839355469, 90.76168823242188, 99.56742858886719, 108.3731689453125, 117.17890930175781, 125.98464965820312, 134.79039001464844, 143.59613037109375, 152.40187072753906, 161.20761108398438, 170.0133514404297, 178.819091796875, 187.6248321533203, 196.43057250976562, 205.23631286621094, 214.04205322265625, 222.84779357910156, 231.65353393554688, 240.4592742919922, 249.2650146484375, 258.07073974609375, 266.8764953613281, 275.6822509765625, 284.48797607421875, 293.293701171875, 302.0994567871094, 310.90521240234375, 319.7109375, 328.51666259765625, 337.3224182128906, 346.128173828125, 354.93389892578125, 363.7396240234375, 372.5453796386719]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 7.0, 9.0, 4.0, 5.0, 9.0, 16.0, 20.0, 18.0, 21.0, 20.0, 29.0, 23.0, 22.0, 34.0, 34.0, 40.0, 38.0, 41.0, 38.0, 42.0, 47.0, 46.0, 46.0, 33.0, 44.0, 43.0, 41.0, 39.0, 27.0, 24.0, 13.0, 21.0, 27.0, 14.0, 12.0, 11.0, 9.0, 10.0, 11.0, 5.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0], "bins": [-102.64926147460938, -99.95166015625, -97.25405883789062, -94.55645751953125, -91.8588638305664, -89.16126251220703, -86.46366119384766, -83.76605987548828, -81.06846618652344, -78.37086486816406, -75.67326354980469, -72.97566223144531, -70.27806854248047, -67.5804672241211, -64.88286590576172, -62.185264587402344, -59.48766326904297, -56.790061950683594, -54.092464447021484, -51.39486312866211, -48.697265625, -45.999664306640625, -43.30206298828125, -40.604461669921875, -37.906864166259766, -35.20926284790039, -32.51166534423828, -29.814064025878906, -27.116464614868164, -24.418865203857422, -21.721263885498047, -19.023664474487305, -16.326065063476562, -13.62846565246582, -10.930865287780762, -8.233264923095703, -5.535665512084961, -2.8380661010742188, -0.14046478271484375, 2.5571346282958984, 5.254734039306641, 7.952333927154541, 10.649933815002441, 13.3475341796875, 16.045133590698242, 18.742733001708984, 21.44033432006836, 24.1379337310791, 26.835533142089844, 29.533132553100586, 32.23073196411133, 34.9283332824707, 37.62593078613281, 40.32353210449219, 43.02113342285156, 45.71873474121094, 48.41633224487305, 51.11393356323242, 53.81153106689453, 56.509132385253906, 59.20673370361328, 61.90433120727539, 64.6019287109375, 67.29953002929688, 69.99713134765625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 4.0, 9.0, 7.0, 11.0, 15.0, 15.0, 23.0, 21.0, 25.0, 30.0, 26.0, 30.0, 42.0, 43.0, 44.0, 55.0, 43.0, 46.0, 46.0, 50.0, 37.0, 35.0, 43.0, 33.0, 34.0, 30.0, 38.0, 18.0, 28.0, 21.0, 10.0, 14.0, 12.0, 18.0, 7.0, 11.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.5234375, -12.1656494140625, -11.807861328125, -11.4500732421875, -11.09228515625, -10.7344970703125, -10.376708984375, -10.0189208984375, -9.6611328125, -9.3033447265625, -8.945556640625, -8.5877685546875, -8.22998046875, -7.8721923828125, -7.514404296875, -7.1566162109375, -6.798828125, -6.4410400390625, -6.083251953125, -5.7254638671875, -5.36767578125, -5.0098876953125, -4.652099609375, -4.2943115234375, -3.9365234375, -3.5787353515625, -3.220947265625, -2.8631591796875, -2.50537109375, -2.1475830078125, -1.789794921875, -1.4320068359375, -1.07421875, -0.7164306640625, -0.358642578125, -0.0008544921875, 0.35693359375, 0.7147216796875, 1.072509765625, 1.4302978515625, 1.7880859375, 2.1458740234375, 2.503662109375, 2.8614501953125, 3.21923828125, 3.5770263671875, 3.934814453125, 4.2926025390625, 4.650390625, 5.0081787109375, 5.365966796875, 5.7237548828125, 6.08154296875, 6.4393310546875, 6.797119140625, 7.1549072265625, 7.5126953125, 7.8704833984375, 8.228271484375, 8.5860595703125, 8.94384765625, 9.3016357421875, 9.659423828125, 10.0172119140625, 10.375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 9.0, 8.0, 9.0, 15.0, 21.0, 24.0, 36.0, 45.0, 43.0, 76.0, 62.0, 111.0, 110.0, 143.0, 165.0, 243.0, 412.0, 1069.0, 4021.0, 29097.0, 729510.0, 3089464.0, 317869.0, 16569.0, 2853.0, 854.0, 382.0, 233.0, 177.0, 117.0, 131.0, 87.0, 67.0, 50.0, 46.0, 38.0, 27.0, 24.0, 17.0, 12.0, 11.0, 8.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.671875, -28.75537109375, -27.8388671875, -26.92236328125, -26.005859375, -25.08935546875, -24.1728515625, -23.25634765625, -22.33984375, -21.42333984375, -20.5068359375, -19.59033203125, -18.673828125, -17.75732421875, -16.8408203125, -15.92431640625, -15.0078125, -14.09130859375, -13.1748046875, -12.25830078125, -11.341796875, -10.42529296875, -9.5087890625, -8.59228515625, -7.67578125, -6.75927734375, -5.8427734375, -4.92626953125, -4.009765625, -3.09326171875, -2.1767578125, -1.26025390625, -0.34375, 0.57275390625, 1.4892578125, 2.40576171875, 3.322265625, 4.23876953125, 5.1552734375, 6.07177734375, 6.98828125, 7.90478515625, 8.8212890625, 9.73779296875, 10.654296875, 11.57080078125, 12.4873046875, 13.40380859375, 14.3203125, 15.23681640625, 16.1533203125, 17.06982421875, 17.986328125, 18.90283203125, 19.8193359375, 20.73583984375, 21.65234375, 22.56884765625, 23.4853515625, 24.40185546875, 25.318359375, 26.23486328125, 27.1513671875, 28.06787109375, 28.984375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 12.0, 12.0, 21.0, 29.0, 27.0, 49.0, 39.0, 68.0, 101.0, 120.0, 130.0, 215.0, 334.0, 487.0, 653.0, 550.0, 379.0, 247.0, 141.0, 113.0, 84.0, 72.0, 52.0, 48.0, 25.0, 16.0, 14.0, 9.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.46875, -22.81005859375, -22.1513671875, -21.49267578125, -20.833984375, -20.17529296875, -19.5166015625, -18.85791015625, -18.19921875, -17.54052734375, -16.8818359375, -16.22314453125, -15.564453125, -14.90576171875, -14.2470703125, -13.58837890625, -12.9296875, -12.27099609375, -11.6123046875, -10.95361328125, -10.294921875, -9.63623046875, -8.9775390625, -8.31884765625, -7.66015625, -7.00146484375, -6.3427734375, -5.68408203125, -5.025390625, -4.36669921875, -3.7080078125, -3.04931640625, -2.390625, -1.73193359375, -1.0732421875, -0.41455078125, 0.244140625, 0.90283203125, 1.5615234375, 2.22021484375, 2.87890625, 3.53759765625, 4.1962890625, 4.85498046875, 5.513671875, 6.17236328125, 6.8310546875, 7.48974609375, 8.1484375, 8.80712890625, 9.4658203125, 10.12451171875, 10.783203125, 11.44189453125, 12.1005859375, 12.75927734375, 13.41796875, 14.07666015625, 14.7353515625, 15.39404296875, 16.052734375, 16.71142578125, 17.3701171875, 18.02880859375, 18.6875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 13.0, 17.0, 34.0, 46.0, 99.0, 200.0, 549.0, 1828.0, 21600.0, 4060504.0, 105057.0, 2933.0, 791.0, 282.0, 154.0, 75.0, 42.0, 23.0, 16.0, 11.0, 6.0, 1.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-102.3125, -99.7314453125, -97.150390625, -94.5693359375, -91.98828125, -89.4072265625, -86.826171875, -84.2451171875, -81.6640625, -79.0830078125, -76.501953125, -73.9208984375, -71.33984375, -68.7587890625, -66.177734375, -63.5966796875, -61.015625, -58.4345703125, -55.853515625, -53.2724609375, -50.69140625, -48.1103515625, -45.529296875, -42.9482421875, -40.3671875, -37.7861328125, -35.205078125, -32.6240234375, -30.04296875, -27.4619140625, -24.880859375, -22.2998046875, -19.71875, -17.1376953125, -14.556640625, -11.9755859375, -9.39453125, -6.8134765625, -4.232421875, -1.6513671875, 0.9296875, 3.5107421875, 6.091796875, 8.6728515625, 11.25390625, 13.8349609375, 16.416015625, 18.9970703125, 21.578125, 24.1591796875, 26.740234375, 29.3212890625, 31.90234375, 34.4833984375, 37.064453125, 39.6455078125, 42.2265625, 44.8076171875, 47.388671875, 49.9697265625, 52.55078125, 55.1318359375, 57.712890625, 60.2939453125, 62.875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 28.0, 942.0, 45.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.0906982421875, -296.4898986816406, -270.8890686035156, -245.28826904296875, -219.68743896484375, -194.08663940429688, -168.48582458496094, -142.885009765625, -117.28419494628906, -91.68338012695312, -66.08256530761719, -40.48175811767578, -14.880943298339844, 10.719863891601562, 36.3206787109375, 61.92149353027344, 87.52230834960938, 113.12312316894531, 138.72393798828125, 164.32473754882812, 189.92556762695312, 215.5263671875, 241.12718200683594, 266.7279968261719, 292.32879638671875, 317.9295959472656, 343.5304260253906, 369.1312255859375, 394.7320556640625, 420.3328552246094, 445.93365478515625, 471.53448486328125, 497.13531494140625, 522.7361450195312, 548.3369140625, 573.937744140625, 599.53857421875, 625.139404296875, 650.7401733398438, 676.3410034179688, 701.9418334960938, 727.5426635742188, 753.1434326171875, 778.7442626953125, 804.3450927734375, 829.9459228515625, 855.5466918945312, 881.1475219726562, 906.748291015625, 932.34912109375, 957.9498901367188, 983.5507202148438, 1009.1515502929688, 1034.7523193359375, 1060.3531494140625, 1085.9539794921875, 1111.5548095703125, 1137.1556396484375, 1162.7564697265625, 1188.3572998046875, 1213.9580078125, 1239.558837890625, 1265.15966796875, 1290.760498046875, 1316.361328125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 9.0, 4.0, 4.0, 11.0, 3.0, 6.0, 11.0, 14.0, 16.0, 23.0, 17.0, 35.0, 35.0, 23.0, 51.0, 33.0, 32.0, 30.0, 45.0, 40.0, 41.0, 38.0, 40.0, 43.0, 50.0, 29.0, 43.0, 34.0, 31.0, 29.0, 23.0, 26.0, 16.0, 21.0, 14.0, 13.0, 14.0, 11.0, 9.0, 8.0, 6.0, 9.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-76.847412109375, -74.64696502685547, -72.4465103149414, -70.24606323242188, -68.04560852050781, -65.84516143798828, -63.64471435546875, -61.44426345825195, -59.243812561035156, -57.04336166381836, -54.84291076660156, -52.64246368408203, -50.442012786865234, -48.24156188964844, -46.041114807128906, -43.84066390991211, -41.64021301269531, -39.439762115478516, -37.23931121826172, -35.03886413574219, -32.83841323852539, -30.637962341308594, -28.43751335144043, -26.237064361572266, -24.03661346435547, -21.836162567138672, -19.635713577270508, -17.435264587402344, -15.234813690185547, -13.034363746643066, -10.833913803100586, -8.633463859558105, -6.433013916015625, -4.2325639724731445, -2.032114028930664, 0.1683359146118164, 2.368785858154297, 4.569235801696777, 6.769685745239258, 8.970135688781738, 11.170585632324219, 13.3710355758667, 15.57148551940918, 17.771934509277344, 19.97238540649414, 22.172836303710938, 24.3732852935791, 26.573734283447266, 28.774185180664062, 30.97463607788086, 33.175086975097656, 35.37553405761719, 37.575984954833984, 39.77643585205078, 41.97688293457031, 44.17733383178711, 46.377784729003906, 48.5782356262207, 50.7786865234375, 52.97913360595703, 55.17958450317383, 57.380035400390625, 59.580482482910156, 61.78093338012695, 63.98138427734375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 8.0, 16.0, 23.0, 23.0, 30.0, 36.0, 38.0, 48.0, 45.0, 38.0, 44.0, 47.0, 50.0, 54.0, 49.0, 46.0, 55.0, 48.0, 37.0, 33.0, 30.0, 28.0, 26.0, 20.0, 32.0, 19.0, 9.0, 12.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5859375, -8.28466796875, -7.9833984375, -7.68212890625, -7.380859375, -7.07958984375, -6.7783203125, -6.47705078125, -6.17578125, -5.87451171875, -5.5732421875, -5.27197265625, -4.970703125, -4.66943359375, -4.3681640625, -4.06689453125, -3.765625, -3.46435546875, -3.1630859375, -2.86181640625, -2.560546875, -2.25927734375, -1.9580078125, -1.65673828125, -1.35546875, -1.05419921875, -0.7529296875, -0.45166015625, -0.150390625, 0.15087890625, 0.4521484375, 0.75341796875, 1.0546875, 1.35595703125, 1.6572265625, 1.95849609375, 2.259765625, 2.56103515625, 2.8623046875, 3.16357421875, 3.46484375, 3.76611328125, 4.0673828125, 4.36865234375, 4.669921875, 4.97119140625, 5.2724609375, 5.57373046875, 5.875, 6.17626953125, 6.4775390625, 6.77880859375, 7.080078125, 7.38134765625, 7.6826171875, 7.98388671875, 8.28515625, 8.58642578125, 8.8876953125, 9.18896484375, 9.490234375, 9.79150390625, 10.0927734375, 10.39404296875, 10.6953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 8.0, 6.0, 8.0, 23.0, 21.0, 37.0, 60.0, 95.0, 154.0, 296.0, 407.0, 731.0, 1245.0, 2193.0, 3898.0, 7554.0, 15237.0, 30563.0, 65498.0, 164086.0, 458086.0, 167469.0, 67511.0, 30792.0, 15398.0, 7841.0, 3994.0, 2212.0, 1271.0, 715.0, 437.0, 237.0, 159.0, 99.0, 71.0, 39.0, 38.0, 22.0, 12.0, 11.0, 9.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.546875, -2.457550048828125, -2.36822509765625, -2.278900146484375, -2.1895751953125, -2.100250244140625, -2.01092529296875, -1.921600341796875, -1.832275390625, -1.742950439453125, -1.65362548828125, -1.564300537109375, -1.4749755859375, -1.385650634765625, -1.29632568359375, -1.207000732421875, -1.11767578125, -1.028350830078125, -0.93902587890625, -0.849700927734375, -0.7603759765625, -0.671051025390625, -0.58172607421875, -0.492401123046875, -0.403076171875, -0.313751220703125, -0.22442626953125, -0.135101318359375, -0.0457763671875, 0.043548583984375, 0.13287353515625, 0.222198486328125, 0.3115234375, 0.400848388671875, 0.49017333984375, 0.579498291015625, 0.6688232421875, 0.758148193359375, 0.84747314453125, 0.936798095703125, 1.026123046875, 1.115447998046875, 1.20477294921875, 1.294097900390625, 1.3834228515625, 1.472747802734375, 1.56207275390625, 1.651397705078125, 1.74072265625, 1.830047607421875, 1.91937255859375, 2.008697509765625, 2.0980224609375, 2.187347412109375, 2.27667236328125, 2.365997314453125, 2.455322265625, 2.544647216796875, 2.63397216796875, 2.723297119140625, 2.8126220703125, 2.901947021484375, 2.99127197265625, 3.080596923828125, 3.169921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 6.0, 14.0, 9.0, 11.0, 17.0, 19.0, 18.0, 12.0, 18.0, 29.0, 38.0, 25.0, 41.0, 40.0, 34.0, 52.0, 44.0, 43.0, 1074.0, 42.0, 37.0, 40.0, 41.0, 48.0, 36.0, 29.0, 20.0, 17.0, 28.0, 20.0, 21.0, 18.0, 16.0, 8.0, 13.0, 12.0, 1.0, 5.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.4140625, -5.25299072265625, -5.0919189453125, -4.93084716796875, -4.769775390625, -4.60870361328125, -4.4476318359375, -4.28656005859375, -4.12548828125, -3.96441650390625, -3.8033447265625, -3.64227294921875, -3.481201171875, -3.32012939453125, -3.1590576171875, -2.99798583984375, -2.8369140625, -2.67584228515625, -2.5147705078125, -2.35369873046875, -2.192626953125, -2.03155517578125, -1.8704833984375, -1.70941162109375, -1.54833984375, -1.38726806640625, -1.2261962890625, -1.06512451171875, -0.904052734375, -0.74298095703125, -0.5819091796875, -0.42083740234375, -0.259765625, -0.09869384765625, 0.0623779296875, 0.22344970703125, 0.384521484375, 0.54559326171875, 0.7066650390625, 0.86773681640625, 1.02880859375, 1.18988037109375, 1.3509521484375, 1.51202392578125, 1.673095703125, 1.83416748046875, 1.9952392578125, 2.15631103515625, 2.3173828125, 2.47845458984375, 2.6395263671875, 2.80059814453125, 2.961669921875, 3.12274169921875, 3.2838134765625, 3.44488525390625, 3.60595703125, 3.76702880859375, 3.9281005859375, 4.08917236328125, 4.250244140625, 4.41131591796875, 4.5723876953125, 4.73345947265625, 4.89453125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 15.0, 16.0, 16.0, 24.0, 42.0, 69.0, 92.0, 130.0, 191.0, 266.0, 414.0, 591.0, 896.0, 1267.0, 2030.0, 3000.0, 4558.0, 6913.0, 10465.0, 15822.0, 24096.0, 38054.0, 63951.0, 114410.0, 1322586.0, 224742.0, 102968.0, 58022.0, 34991.0, 22578.0, 14899.0, 9651.0, 6430.0, 4196.0, 2813.0, 1946.0, 1283.0, 856.0, 596.0, 393.0, 256.0, 185.0, 139.0, 82.0, 61.0, 36.0, 37.0, 22.0, 9.0, 10.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.609375, -1.5589447021484375, -1.508514404296875, -1.4580841064453125, -1.40765380859375, -1.3572235107421875, -1.306793212890625, -1.2563629150390625, -1.2059326171875, -1.1555023193359375, -1.105072021484375, -1.0546417236328125, -1.00421142578125, -0.9537811279296875, -0.903350830078125, -0.8529205322265625, -0.802490234375, -0.7520599365234375, -0.701629638671875, -0.6511993408203125, -0.60076904296875, -0.5503387451171875, -0.499908447265625, -0.4494781494140625, -0.3990478515625, -0.3486175537109375, -0.298187255859375, -0.2477569580078125, -0.19732666015625, -0.1468963623046875, -0.096466064453125, -0.0460357666015625, 0.00439453125, 0.0548248291015625, 0.105255126953125, 0.1556854248046875, 0.20611572265625, 0.2565460205078125, 0.306976318359375, 0.3574066162109375, 0.4078369140625, 0.4582672119140625, 0.508697509765625, 0.5591278076171875, 0.60955810546875, 0.6599884033203125, 0.710418701171875, 0.7608489990234375, 0.811279296875, 0.8617095947265625, 0.912139892578125, 0.9625701904296875, 1.01300048828125, 1.0634307861328125, 1.113861083984375, 1.1642913818359375, 1.2147216796875, 1.2651519775390625, 1.315582275390625, 1.3660125732421875, 1.41644287109375, 1.4668731689453125, 1.517303466796875, 1.5677337646484375, 1.6181640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 3.0, 2.0, 10.0, 7.0, 7.0, 16.0, 16.0, 15.0, 29.0, 32.0, 49.0, 63.0, 85.0, 108.0, 139.0, 97.0, 72.0, 51.0, 45.0, 31.0, 26.0, 16.0, 19.0, 11.0, 14.0, 9.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014858245849609375, -0.0014480650424957275, -0.0014103055000305176, -0.0013725459575653076, -0.0013347864151000977, -0.0012970268726348877, -0.0012592673301696777, -0.0012215077877044678, -0.0011837482452392578, -0.0011459887027740479, -0.0011082291603088379, -0.001070469617843628, -0.001032710075378418, -0.000994950532913208, -0.000957190990447998, -0.0009194314479827881, -0.0008816719055175781, -0.0008439123630523682, -0.0008061528205871582, -0.0007683932781219482, -0.0007306337356567383, -0.0006928741931915283, -0.0006551146507263184, -0.0006173551082611084, -0.0005795955657958984, -0.0005418360233306885, -0.0005040764808654785, -0.00046631693840026855, -0.0004285573959350586, -0.00039079785346984863, -0.00035303831100463867, -0.0003152787685394287, -0.00027751922607421875, -0.0002397596836090088, -0.00020200014114379883, -0.00016424059867858887, -0.0001264810562133789, -8.872151374816895e-05, -5.0961971282958984e-05, -1.3202428817749023e-05, 2.4557113647460938e-05, 6.23166561126709e-05, 0.00010007619857788086, 0.00013783574104309082, 0.00017559528350830078, 0.00021335482597351074, 0.0002511143684387207, 0.00028887391090393066, 0.0003266334533691406, 0.0003643929958343506, 0.00040215253829956055, 0.0004399120807647705, 0.00047767162322998047, 0.0005154311656951904, 0.0005531907081604004, 0.0005909502506256104, 0.0006287097930908203, 0.0006664693355560303, 0.0007042288780212402, 0.0007419884204864502, 0.0007797479629516602, 0.0008175075054168701, 0.0008552670478820801, 0.00089302659034729, 0.0009307861328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 8.0, 8.0, 8.0, 11.0, 13.0, 19.0, 21.0, 32.0, 39.0, 70.0, 84.0, 130.0, 177.0, 286.0, 534.0, 1109.0, 192336.0, 850794.0, 1293.0, 616.0, 309.0, 184.0, 109.0, 97.0, 65.0, 47.0, 25.0, 25.0, 29.0, 14.0, 9.0, 9.0, 13.0, 5.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0165557861328125, -0.01592087745666504, -0.015285968780517578, -0.014651060104370117, -0.014016151428222656, -0.013381242752075195, -0.012746334075927734, -0.012111425399780273, -0.011476516723632812, -0.010841608047485352, -0.01020669937133789, -0.00957179069519043, -0.008936882019042969, -0.008301973342895508, -0.007667064666748047, -0.007032155990600586, -0.006397247314453125, -0.005762338638305664, -0.005127429962158203, -0.004492521286010742, -0.0038576126098632812, -0.0032227039337158203, -0.0025877952575683594, -0.0019528865814208984, -0.0013179779052734375, -0.0006830692291259766, -4.8160552978515625e-05, 0.0005867481231689453, 0.0012216567993164062, 0.0018565654754638672, 0.002491474151611328, 0.003126382827758789, 0.00376129150390625, 0.004396200180053711, 0.005031108856201172, 0.005666017532348633, 0.006300926208496094, 0.006935834884643555, 0.007570743560791016, 0.008205652236938477, 0.008840560913085938, 0.009475469589233398, 0.01011037826538086, 0.01074528694152832, 0.011380195617675781, 0.012015104293823242, 0.012650012969970703, 0.013284921646118164, 0.013919830322265625, 0.014554738998413086, 0.015189647674560547, 0.015824556350708008, 0.01645946502685547, 0.01709437370300293, 0.01772928237915039, 0.01836419105529785, 0.018999099731445312, 0.019634008407592773, 0.020268917083740234, 0.020903825759887695, 0.021538734436035156, 0.022173643112182617, 0.022808551788330078, 0.02344346046447754, 0.024078369140625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 25.0, 204.0, 443.0, 273.0, 50.0, 12.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024858207907527685, -0.002432500012218952, -0.002379179000854492, -0.002325857989490032, -0.002272537210956216, -0.0022192164324223995, -0.0021658954210579395, -0.0021125744096934795, -0.002059253631159663, -0.002005932852625847, -0.0019526118412613869, -0.0018992909463122487, -0.0018459700513631105, -0.0017926491564139724, -0.0017393282614648342, -0.001686007366515696, -0.0016326864715665579, -0.0015793655766174197, -0.0015260446816682816, -0.0014727237867191434, -0.0014194028917700052, -0.001366081996820867, -0.001312761101871729, -0.0012594402069225907, -0.0012061193119734526, -0.0011527984170243144, -0.0010994775220751762, -0.001046156627126038, -0.0009928357321769, -0.0009395148372277617, -0.0008861939422786236, -0.0008328730473294854, -0.0007795522105880082, -0.00072623131563887, -0.0006729104206897318, -0.0006195895257405937, -0.0005662686307914555, -0.0005129477358423173, -0.0004596268408931792, -0.000406305945944041, -0.00035298505099490285, -0.0002996641560457647, -0.0002463432610966265, -0.00019302236614748836, -0.0001397014711983502, -8.638057624921203e-05, -3.305968130007386e-05, 2.0261213649064302e-05, 7.358210859820247e-05, 0.00012690300354734063, 0.0001802238984964788, 0.00023354479344561696, 0.0002868656883947551, 0.0003401865833438933, 0.00039350747829303145, 0.0004468283732421696, 0.0005001492681913078, 0.000553470163140446, 0.0006067910580895841, 0.0006601119530387223, 0.0007134328479878604, 0.0007667537429369986, 0.0008200746378861368, 0.0008733955328352749, 0.0009267164277844131]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 10.0, 18.0, 11.0, 18.0, 22.0, 13.0, 18.0, 26.0, 42.0, 23.0, 24.0, 29.0, 30.0, 37.0, 36.0, 40.0, 34.0, 50.0, 37.0, 40.0, 55.0, 38.0, 34.0, 28.0, 26.0, 33.0, 19.0, 19.0, 24.0, 24.0, 24.0, 13.0, 23.0, 14.0, 6.0, 13.0, 10.0, 1.0, 5.0, 6.0, 5.0, 1.0, 2.0, 4.0, 4.0, 1.0], "bins": [-0.00047093629837036133, -0.0004577683284878731, -0.0004446003586053848, -0.0004314323887228966, -0.0004182644188404083, -0.0004050964489579201, -0.0003919284790754318, -0.0003787605091929436, -0.0003655925393104553, -0.00035242456942796707, -0.0003392565995454788, -0.00032608862966299057, -0.0003129206597805023, -0.00029975268989801407, -0.0002865847200155258, -0.00027341675013303757, -0.0002602487802505493, -0.00024708081036806107, -0.00023391284048557281, -0.00022074487060308456, -0.0002075769007205963, -0.00019440893083810806, -0.0001812409609556198, -0.00016807299107313156, -0.0001549050211906433, -0.00014173705130815506, -0.0001285690814256668, -0.00011540111154317856, -0.00010223314166069031, -8.906517177820206e-05, -7.58972018957138e-05, -6.272923201322556e-05, -4.9561262130737305e-05, -3.6393292248249054e-05, -2.3225322365760803e-05, -1.0057352483272552e-05, 3.1106173992156982e-06, 1.627858728170395e-05, 2.94465571641922e-05, 4.261452704668045e-05, 5.57824969291687e-05, 6.895046681165695e-05, 8.21184366941452e-05, 9.528640657663345e-05, 0.0001084543764591217, 0.00012162234634160995, 0.0001347903162240982, 0.00014795828610658646, 0.0001611262559890747, 0.00017429422587156296, 0.0001874621957540512, 0.00020063016563653946, 0.0002137981355190277, 0.00022696610540151596, 0.0002401340752840042, 0.00025330204516649246, 0.0002664700150489807, 0.00027963798493146896, 0.0002928059548139572, 0.00030597392469644547, 0.0003191418945789337, 0.00033230986446142197, 0.0003454778343439102, 0.00035864580422639847, 0.0003718137741088867]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 8.0, 16.0, 23.0, 23.0, 30.0, 36.0, 38.0, 48.0, 45.0, 38.0, 44.0, 47.0, 50.0, 54.0, 49.0, 46.0, 55.0, 48.0, 37.0, 33.0, 30.0, 28.0, 26.0, 20.0, 32.0, 18.0, 10.0, 12.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5859375, -8.28466796875, -7.9833984375, -7.68212890625, -7.380859375, -7.07958984375, -6.7783203125, -6.47705078125, -6.17578125, -5.87451171875, -5.5732421875, -5.27197265625, -4.970703125, -4.66943359375, -4.3681640625, -4.06689453125, -3.765625, -3.46435546875, -3.1630859375, -2.86181640625, -2.560546875, -2.25927734375, -1.9580078125, -1.65673828125, -1.35546875, -1.05419921875, -0.7529296875, -0.45166015625, -0.150390625, 0.15087890625, 0.4521484375, 0.75341796875, 1.0546875, 1.35595703125, 1.6572265625, 1.95849609375, 2.259765625, 2.56103515625, 2.8623046875, 3.16357421875, 3.46484375, 3.76611328125, 4.0673828125, 4.36865234375, 4.669921875, 4.97119140625, 5.2724609375, 5.57373046875, 5.875, 6.17626953125, 6.4775390625, 6.77880859375, 7.080078125, 7.38134765625, 7.6826171875, 7.98388671875, 8.28515625, 8.58642578125, 8.8876953125, 9.18896484375, 9.490234375, 9.79150390625, 10.0927734375, 10.39404296875, 10.6953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 10.0, 5.0, 10.0, 13.0, 18.0, 22.0, 32.0, 60.0, 87.0, 112.0, 173.0, 236.0, 401.0, 591.0, 945.0, 1457.0, 2599.0, 5469.0, 23560.0, 322448.0, 630591.0, 44617.0, 7288.0, 2995.0, 1736.0, 1073.0, 692.0, 443.0, 267.0, 184.0, 120.0, 85.0, 86.0, 37.0, 28.0, 20.0, 11.0, 8.0, 8.0, 7.0, 3.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.921875, -26.15576171875, -25.3896484375, -24.62353515625, -23.857421875, -23.09130859375, -22.3251953125, -21.55908203125, -20.79296875, -20.02685546875, -19.2607421875, -18.49462890625, -17.728515625, -16.96240234375, -16.1962890625, -15.43017578125, -14.6640625, -13.89794921875, -13.1318359375, -12.36572265625, -11.599609375, -10.83349609375, -10.0673828125, -9.30126953125, -8.53515625, -7.76904296875, -7.0029296875, -6.23681640625, -5.470703125, -4.70458984375, -3.9384765625, -3.17236328125, -2.40625, -1.64013671875, -0.8740234375, -0.10791015625, 0.658203125, 1.42431640625, 2.1904296875, 2.95654296875, 3.72265625, 4.48876953125, 5.2548828125, 6.02099609375, 6.787109375, 7.55322265625, 8.3193359375, 9.08544921875, 9.8515625, 10.61767578125, 11.3837890625, 12.14990234375, 12.916015625, 13.68212890625, 14.4482421875, 15.21435546875, 15.98046875, 16.74658203125, 17.5126953125, 18.27880859375, 19.044921875, 19.81103515625, 20.5771484375, 21.34326171875, 22.109375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 7.0, 10.0, 11.0, 13.0, 20.0, 20.0, 18.0, 24.0, 30.0, 32.0, 40.0, 50.0, 43.0, 59.0, 84.0, 181.0, 1571.0, 299.0, 109.0, 65.0, 56.0, 45.0, 33.0, 20.0, 21.0, 21.0, 24.0, 25.0, 17.0, 10.0, 9.0, 13.0, 7.0, 3.0, 7.0, 6.0, 2.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-22.828125, -22.1884765625, -21.548828125, -20.9091796875, -20.26953125, -19.6298828125, -18.990234375, -18.3505859375, -17.7109375, -17.0712890625, -16.431640625, -15.7919921875, -15.15234375, -14.5126953125, -13.873046875, -13.2333984375, -12.59375, -11.9541015625, -11.314453125, -10.6748046875, -10.03515625, -9.3955078125, -8.755859375, -8.1162109375, -7.4765625, -6.8369140625, -6.197265625, -5.5576171875, -4.91796875, -4.2783203125, -3.638671875, -2.9990234375, -2.359375, -1.7197265625, -1.080078125, -0.4404296875, 0.19921875, 0.8388671875, 1.478515625, 2.1181640625, 2.7578125, 3.3974609375, 4.037109375, 4.6767578125, 5.31640625, 5.9560546875, 6.595703125, 7.2353515625, 7.875, 8.5146484375, 9.154296875, 9.7939453125, 10.43359375, 11.0732421875, 11.712890625, 12.3525390625, 12.9921875, 13.6318359375, 14.271484375, 14.9111328125, 15.55078125, 16.1904296875, 16.830078125, 17.4697265625, 18.109375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 6.0, 12.0, 9.0, 17.0, 15.0, 19.0, 33.0, 50.0, 49.0, 62.0, 98.0, 99.0, 187.0, 260.0, 500.0, 1186.0, 8252.0, 3122994.0, 9122.0, 1198.0, 536.0, 275.0, 171.0, 118.0, 94.0, 66.0, 63.0, 49.0, 27.0, 29.0, 27.0, 14.0, 18.0, 6.0, 6.0, 5.0, 5.0, 1.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-65.8125, -63.7880859375, -61.763671875, -59.7392578125, -57.71484375, -55.6904296875, -53.666015625, -51.6416015625, -49.6171875, -47.5927734375, -45.568359375, -43.5439453125, -41.51953125, -39.4951171875, -37.470703125, -35.4462890625, -33.421875, -31.3974609375, -29.373046875, -27.3486328125, -25.32421875, -23.2998046875, -21.275390625, -19.2509765625, -17.2265625, -15.2021484375, -13.177734375, -11.1533203125, -9.12890625, -7.1044921875, -5.080078125, -3.0556640625, -1.03125, 0.9931640625, 3.017578125, 5.0419921875, 7.06640625, 9.0908203125, 11.115234375, 13.1396484375, 15.1640625, 17.1884765625, 19.212890625, 21.2373046875, 23.26171875, 25.2861328125, 27.310546875, 29.3349609375, 31.359375, 33.3837890625, 35.408203125, 37.4326171875, 39.45703125, 41.4814453125, 43.505859375, 45.5302734375, 47.5546875, 49.5791015625, 51.603515625, 53.6279296875, 55.65234375, 57.6767578125, 59.701171875, 61.7255859375, 63.75]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 19.0, 50.0, 167.0, 315.0, 287.0, 121.0, 34.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.58602905273438, -143.53041076660156, -140.4747772216797, -137.41915893554688, -134.36354064941406, -131.30792236328125, -128.25228881835938, -125.19667053222656, -122.14104461669922, -119.08541870117188, -116.02980041503906, -112.97417449951172, -109.9185562133789, -106.86293029785156, -103.80731201171875, -100.7516860961914, -97.69606018066406, -94.64043426513672, -91.5848159790039, -88.52919006347656, -85.47357177734375, -82.4179458618164, -79.36231994628906, -76.30670166015625, -73.25108337402344, -70.1954574584961, -67.13983917236328, -64.08421325683594, -61.02859115600586, -57.97296905517578, -54.9173469543457, -51.861724853515625, -48.80609893798828, -45.7504768371582, -42.694854736328125, -39.63922882080078, -36.5836067199707, -33.527984619140625, -30.472362518310547, -27.416738510131836, -24.361116409301758, -21.30549430847168, -18.24987030029297, -15.19424819946289, -12.138625144958496, -9.083002090454102, -6.027379989624023, -2.9717559814453125, 0.08386611938476562, 3.139488935470581, 6.1951117515563965, 9.250734329223633, 12.306357383728027, 15.361980438232422, 18.4176025390625, 21.47322654724121, 24.52884864807129, 27.584470748901367, 30.640094757080078, 33.695716857910156, 36.751338958740234, 39.80696105957031, 42.862586975097656, 45.918209075927734, 48.97383117675781]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 2.0, 7.0, 2.0, 11.0, 18.0, 15.0, 19.0, 23.0, 6.0, 21.0, 20.0, 30.0, 27.0, 26.0, 33.0, 34.0, 28.0, 35.0, 35.0, 50.0, 42.0, 52.0, 40.0, 44.0, 37.0, 34.0, 31.0, 29.0, 36.0, 27.0, 29.0, 22.0, 17.0, 20.0, 13.0, 15.0, 8.0, 10.0, 10.0, 6.0, 7.0, 6.0, 3.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-69.73641967773438, -67.6644058227539, -65.59239196777344, -63.52037811279297, -61.4483642578125, -59.37635040283203, -57.30433654785156, -55.232322692871094, -53.160308837890625, -51.088294982910156, -49.01628112792969, -46.94426727294922, -44.87225341796875, -42.80023956298828, -40.72822570800781, -38.656211853027344, -36.584197998046875, -34.512184143066406, -32.44017028808594, -30.36815643310547, -28.296142578125, -26.22412872314453, -24.152114868164062, -22.080101013183594, -20.008087158203125, -17.936073303222656, -15.864059448242188, -13.792045593261719, -11.72003173828125, -9.648017883300781, -7.5760040283203125, -5.503990173339844, -3.4319725036621094, -1.3599586486816406, 0.7120552062988281, 2.784069061279297, 4.856082916259766, 6.928096771240234, 9.000110626220703, 11.072124481201172, 13.14413833618164, 15.21615219116211, 17.288166046142578, 19.360179901123047, 21.432193756103516, 23.504207611083984, 25.576221466064453, 27.648235321044922, 29.72024917602539, 31.79226303100586, 33.86427688598633, 35.9362907409668, 38.008304595947266, 40.080318450927734, 42.1523323059082, 44.22434616088867, 46.29636001586914, 48.36837387084961, 50.44038772583008, 52.51240158081055, 54.584415435791016, 56.656429290771484, 58.72844314575195, 60.80045700073242, 62.87247085571289]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 6.0, 3.0, 2.0, 7.0, 12.0, 8.0, 10.0, 15.0, 12.0, 19.0, 18.0, 30.0, 33.0, 36.0, 45.0, 38.0, 38.0, 52.0, 48.0, 42.0, 36.0, 50.0, 45.0, 48.0, 37.0, 41.0, 34.0, 38.0, 40.0, 37.0, 13.0, 15.0, 17.0, 24.0, 14.0, 10.0, 5.0, 9.0, 7.0, 1.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.0635986328125, -7.752197265625, -7.4407958984375, -7.12939453125, -6.8179931640625, -6.506591796875, -6.1951904296875, -5.8837890625, -5.5723876953125, -5.260986328125, -4.9495849609375, -4.63818359375, -4.3267822265625, -4.015380859375, -3.7039794921875, -3.392578125, -3.0811767578125, -2.769775390625, -2.4583740234375, -2.14697265625, -1.8355712890625, -1.524169921875, -1.2127685546875, -0.9013671875, -0.5899658203125, -0.278564453125, 0.0328369140625, 0.34423828125, 0.6556396484375, 0.967041015625, 1.2784423828125, 1.58984375, 1.9012451171875, 2.212646484375, 2.5240478515625, 2.83544921875, 3.1468505859375, 3.458251953125, 3.7696533203125, 4.0810546875, 4.3924560546875, 4.703857421875, 5.0152587890625, 5.32666015625, 5.6380615234375, 5.949462890625, 6.2608642578125, 6.572265625, 6.8836669921875, 7.195068359375, 7.5064697265625, 7.81787109375, 8.1292724609375, 8.440673828125, 8.7520751953125, 9.0634765625, 9.3748779296875, 9.686279296875, 9.9976806640625, 10.30908203125, 10.6204833984375, 10.931884765625, 11.2432861328125, 11.5546875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 6.0, 6.0, 7.0, 9.0, 15.0, 13.0, 27.0, 25.0, 36.0, 56.0, 71.0, 129.0, 153.0, 202.0, 329.0, 426.0, 708.0, 1105.0, 1897.0, 3340.0, 7278.0, 17675.0, 59116.0, 268398.0, 1110964.0, 1817904.0, 701493.0, 145786.0, 33556.0, 11377.0, 5127.0, 2649.0, 1545.0, 911.0, 613.0, 398.0, 262.0, 196.0, 129.0, 100.0, 64.0, 52.0, 48.0, 21.0, 18.0, 20.0, 10.0, 11.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.277587890625, -9.91455078125, -9.551513671875, -9.1884765625, -8.825439453125, -8.46240234375, -8.099365234375, -7.736328125, -7.373291015625, -7.01025390625, -6.647216796875, -6.2841796875, -5.921142578125, -5.55810546875, -5.195068359375, -4.83203125, -4.468994140625, -4.10595703125, -3.742919921875, -3.3798828125, -3.016845703125, -2.65380859375, -2.290771484375, -1.927734375, -1.564697265625, -1.20166015625, -0.838623046875, -0.4755859375, -0.112548828125, 0.25048828125, 0.613525390625, 0.9765625, 1.339599609375, 1.70263671875, 2.065673828125, 2.4287109375, 2.791748046875, 3.15478515625, 3.517822265625, 3.880859375, 4.243896484375, 4.60693359375, 4.969970703125, 5.3330078125, 5.696044921875, 6.05908203125, 6.422119140625, 6.78515625, 7.148193359375, 7.51123046875, 7.874267578125, 8.2373046875, 8.600341796875, 8.96337890625, 9.326416015625, 9.689453125, 10.052490234375, 10.41552734375, 10.778564453125, 11.1416015625, 11.504638671875, 11.86767578125, 12.230712890625, 12.59375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 7.0, 12.0, 12.0, 11.0, 14.0, 30.0, 46.0, 74.0, 104.0, 159.0, 236.0, 371.0, 500.0, 667.0, 536.0, 368.0, 276.0, 211.0, 145.0, 93.0, 67.0, 41.0, 33.0, 25.0, 14.0, 8.0, 4.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.921875, -17.318115234375, -16.71435546875, -16.110595703125, -15.5068359375, -14.903076171875, -14.29931640625, -13.695556640625, -13.091796875, -12.488037109375, -11.88427734375, -11.280517578125, -10.6767578125, -10.072998046875, -9.46923828125, -8.865478515625, -8.26171875, -7.657958984375, -7.05419921875, -6.450439453125, -5.8466796875, -5.242919921875, -4.63916015625, -4.035400390625, -3.431640625, -2.827880859375, -2.22412109375, -1.620361328125, -1.0166015625, -0.412841796875, 0.19091796875, 0.794677734375, 1.3984375, 2.002197265625, 2.60595703125, 3.209716796875, 3.8134765625, 4.417236328125, 5.02099609375, 5.624755859375, 6.228515625, 6.832275390625, 7.43603515625, 8.039794921875, 8.6435546875, 9.247314453125, 9.85107421875, 10.454833984375, 11.05859375, 11.662353515625, 12.26611328125, 12.869873046875, 13.4736328125, 14.077392578125, 14.68115234375, 15.284912109375, 15.888671875, 16.492431640625, 17.09619140625, 17.699951171875, 18.3037109375, 18.907470703125, 19.51123046875, 20.114990234375, 20.71875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 16.0, 12.0, 11.0, 39.0, 64.0, 99.0, 165.0, 304.0, 592.0, 1328.0, 3996.0, 307859.0, 3867192.0, 9131.0, 1856.0, 767.0, 327.0, 191.0, 138.0, 61.0, 44.0, 24.0, 11.0, 13.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.25, -54.5029296875, -52.755859375, -51.0087890625, -49.26171875, -47.5146484375, -45.767578125, -44.0205078125, -42.2734375, -40.5263671875, -38.779296875, -37.0322265625, -35.28515625, -33.5380859375, -31.791015625, -30.0439453125, -28.296875, -26.5498046875, -24.802734375, -23.0556640625, -21.30859375, -19.5615234375, -17.814453125, -16.0673828125, -14.3203125, -12.5732421875, -10.826171875, -9.0791015625, -7.33203125, -5.5849609375, -3.837890625, -2.0908203125, -0.34375, 1.4033203125, 3.150390625, 4.8974609375, 6.64453125, 8.3916015625, 10.138671875, 11.8857421875, 13.6328125, 15.3798828125, 17.126953125, 18.8740234375, 20.62109375, 22.3681640625, 24.115234375, 25.8623046875, 27.609375, 29.3564453125, 31.103515625, 32.8505859375, 34.59765625, 36.3447265625, 38.091796875, 39.8388671875, 41.5859375, 43.3330078125, 45.080078125, 46.8271484375, 48.57421875, 50.3212890625, 52.068359375, 53.8154296875, 55.5625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 35.0, 385.0, 556.0, 38.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-462.41070556640625, -452.58111572265625, -442.75152587890625, -432.92193603515625, -423.09234619140625, -413.26275634765625, -403.43316650390625, -393.60357666015625, -383.77398681640625, -373.94439697265625, -364.11480712890625, -354.28521728515625, -344.45562744140625, -334.62603759765625, -324.79644775390625, -314.96685791015625, -305.13726806640625, -295.30767822265625, -285.47808837890625, -275.64849853515625, -265.81890869140625, -255.98931884765625, -246.15972900390625, -236.33013916015625, -226.50054931640625, -216.67095947265625, -206.84136962890625, -197.01177978515625, -187.18218994140625, -177.35260009765625, -167.52301025390625, -157.69342041015625, -147.86386108398438, -138.03427124023438, -128.20468139648438, -118.37509155273438, -108.54550170898438, -98.71591186523438, -88.88632202148438, -79.05673217773438, -69.22714233398438, -59.397552490234375, -49.567962646484375, -39.738372802734375, -29.908782958984375, -20.079193115234375, -10.249603271484375, -0.420013427734375, 9.409576416015625, 19.239166259765625, 29.068756103515625, 38.898345947265625, 48.727935791015625, 58.557525634765625, 68.38711547851562, 78.21670532226562, 88.04629516601562, 97.87588500976562, 107.70547485351562, 117.53506469726562, 127.36465454101562, 137.19424438476562, 147.02383422851562, 156.85342407226562, 166.68301391601562]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 6.0, 6.0, 7.0, 10.0, 13.0, 12.0, 10.0, 17.0, 20.0, 29.0, 24.0, 32.0, 23.0, 31.0, 41.0, 43.0, 47.0, 44.0, 39.0, 36.0, 50.0, 38.0, 48.0, 41.0, 37.0, 40.0, 37.0, 29.0, 32.0, 25.0, 16.0, 20.0, 20.0, 12.0, 12.0, 8.0, 7.0, 11.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-69.17770385742188, -67.22195434570312, -65.26619720458984, -63.310447692871094, -61.35469436645508, -59.39894104003906, -57.44319152832031, -55.4874382019043, -53.53168487548828, -51.575931549072266, -49.62017822265625, -47.6644287109375, -45.708675384521484, -43.75292205810547, -41.79717254638672, -39.8414192199707, -37.88566589355469, -35.92991256713867, -33.974159240722656, -32.018409729003906, -30.06265640258789, -28.106903076171875, -26.151151657104492, -24.19540023803711, -22.239646911621094, -20.283893585205078, -18.328142166137695, -16.372390747070312, -14.416637420654297, -12.460885047912598, -10.505132675170898, -8.5493803024292, -6.5936279296875, -4.637875556945801, -2.6821231842041016, -0.7263708114624023, 1.2293815612792969, 3.185133934020996, 5.140886306762695, 7.0966386795043945, 9.052391052246094, 11.008143424987793, 12.963895797729492, 14.919648170471191, 16.87540054321289, 18.831153869628906, 20.78690528869629, 22.742656707763672, 24.698410034179688, 26.654163360595703, 28.609914779663086, 30.56566619873047, 32.521419525146484, 34.4771728515625, 36.43292236328125, 38.388675689697266, 40.34442901611328, 42.3001823425293, 44.25593566894531, 46.21168518066406, 48.16743850708008, 50.123191833496094, 52.078941345214844, 54.03469467163086, 55.990447998046875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 7.0, 8.0, 3.0, 7.0, 12.0, 12.0, 2.0, 18.0, 27.0, 17.0, 27.0, 23.0, 30.0, 27.0, 26.0, 41.0, 45.0, 33.0, 43.0, 57.0, 45.0, 44.0, 40.0, 51.0, 36.0, 41.0, 26.0, 31.0, 24.0, 29.0, 25.0, 29.0, 22.0, 15.0, 10.0, 17.0, 11.0, 8.0, 7.0, 6.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1015625, -6.8798828125, -6.658203125, -6.4365234375, -6.21484375, -5.9931640625, -5.771484375, -5.5498046875, -5.328125, -5.1064453125, -4.884765625, -4.6630859375, -4.44140625, -4.2197265625, -3.998046875, -3.7763671875, -3.5546875, -3.3330078125, -3.111328125, -2.8896484375, -2.66796875, -2.4462890625, -2.224609375, -2.0029296875, -1.78125, -1.5595703125, -1.337890625, -1.1162109375, -0.89453125, -0.6728515625, -0.451171875, -0.2294921875, -0.0078125, 0.2138671875, 0.435546875, 0.6572265625, 0.87890625, 1.1005859375, 1.322265625, 1.5439453125, 1.765625, 1.9873046875, 2.208984375, 2.4306640625, 2.65234375, 2.8740234375, 3.095703125, 3.3173828125, 3.5390625, 3.7607421875, 3.982421875, 4.2041015625, 4.42578125, 4.6474609375, 4.869140625, 5.0908203125, 5.3125, 5.5341796875, 5.755859375, 5.9775390625, 6.19921875, 6.4208984375, 6.642578125, 6.8642578125, 7.0859375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 10.0, 14.0, 12.0, 18.0, 42.0, 55.0, 80.0, 104.0, 122.0, 237.0, 335.0, 391.0, 666.0, 917.0, 1337.0, 2062.0, 2847.0, 4564.0, 6551.0, 10144.0, 15381.0, 24327.0, 39302.0, 66809.0, 126346.0, 323495.0, 194905.0, 89437.0, 50625.0, 30751.0, 19540.0, 12326.0, 8272.0, 5295.0, 3537.0, 2427.0, 1636.0, 1137.0, 801.0, 547.0, 335.0, 273.0, 164.0, 121.0, 77.0, 55.0, 39.0, 32.0, 18.0, 12.0, 11.0, 8.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.537109375, -1.4886932373046875, -1.440277099609375, -1.3918609619140625, -1.34344482421875, -1.2950286865234375, -1.246612548828125, -1.1981964111328125, -1.1497802734375, -1.1013641357421875, -1.052947998046875, -1.0045318603515625, -0.95611572265625, -0.9076995849609375, -0.859283447265625, -0.8108673095703125, -0.762451171875, -0.7140350341796875, -0.665618896484375, -0.6172027587890625, -0.56878662109375, -0.5203704833984375, -0.471954345703125, -0.4235382080078125, -0.3751220703125, -0.3267059326171875, -0.278289794921875, -0.2298736572265625, -0.18145751953125, -0.1330413818359375, -0.084625244140625, -0.0362091064453125, 0.01220703125, 0.0606231689453125, 0.109039306640625, 0.1574554443359375, 0.20587158203125, 0.2542877197265625, 0.302703857421875, 0.3511199951171875, 0.3995361328125, 0.4479522705078125, 0.496368408203125, 0.5447845458984375, 0.59320068359375, 0.6416168212890625, 0.690032958984375, 0.7384490966796875, 0.786865234375, 0.8352813720703125, 0.883697509765625, 0.9321136474609375, 0.98052978515625, 1.0289459228515625, 1.077362060546875, 1.1257781982421875, 1.1741943359375, 1.2226104736328125, 1.271026611328125, 1.3194427490234375, 1.36785888671875, 1.4162750244140625, 1.464691162109375, 1.5131072998046875, 1.5615234375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 7.0, 9.0, 11.0, 10.0, 14.0, 19.0, 20.0, 21.0, 32.0, 35.0, 40.0, 24.0, 29.0, 37.0, 60.0, 31.0, 45.0, 1061.0, 55.0, 47.0, 37.0, 39.0, 47.0, 32.0, 37.0, 22.0, 20.0, 24.0, 27.0, 26.0, 17.0, 13.0, 2.0, 12.0, 9.0, 8.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40234375, -4.26031494140625, -4.1182861328125, -3.97625732421875, -3.834228515625, -3.69219970703125, -3.5501708984375, -3.40814208984375, -3.26611328125, -3.12408447265625, -2.9820556640625, -2.84002685546875, -2.697998046875, -2.55596923828125, -2.4139404296875, -2.27191162109375, -2.1298828125, -1.98785400390625, -1.8458251953125, -1.70379638671875, -1.561767578125, -1.41973876953125, -1.2777099609375, -1.13568115234375, -0.99365234375, -0.85162353515625, -0.7095947265625, -0.56756591796875, -0.425537109375, -0.28350830078125, -0.1414794921875, 0.00054931640625, 0.142578125, 0.28460693359375, 0.4266357421875, 0.56866455078125, 0.710693359375, 0.85272216796875, 0.9947509765625, 1.13677978515625, 1.27880859375, 1.42083740234375, 1.5628662109375, 1.70489501953125, 1.846923828125, 1.98895263671875, 2.1309814453125, 2.27301025390625, 2.4150390625, 2.55706787109375, 2.6990966796875, 2.84112548828125, 2.983154296875, 3.12518310546875, 3.2672119140625, 3.40924072265625, 3.55126953125, 3.69329833984375, 3.8353271484375, 3.97735595703125, 4.119384765625, 4.26141357421875, 4.4034423828125, 4.54547119140625, 4.6875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 6.0, 12.0, 20.0, 27.0, 30.0, 46.0, 77.0, 102.0, 158.0, 235.0, 323.0, 461.0, 695.0, 1005.0, 1486.0, 2209.0, 3351.0, 4958.0, 7553.0, 11140.0, 17153.0, 27099.0, 42164.0, 69838.0, 126399.0, 1348300.0, 187473.0, 93026.0, 54167.0, 33830.0, 21717.0, 14087.0, 9202.0, 6222.0, 4035.0, 2792.0, 1835.0, 1243.0, 828.0, 569.0, 385.0, 272.0, 198.0, 123.0, 93.0, 59.0, 42.0, 24.0, 19.0, 17.0, 8.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.3876953125, -1.343994140625, -1.30029296875, -1.256591796875, -1.212890625, -1.169189453125, -1.12548828125, -1.081787109375, -1.0380859375, -0.994384765625, -0.95068359375, -0.906982421875, -0.86328125, -0.819580078125, -0.77587890625, -0.732177734375, -0.6884765625, -0.644775390625, -0.60107421875, -0.557373046875, -0.513671875, -0.469970703125, -0.42626953125, -0.382568359375, -0.3388671875, -0.295166015625, -0.25146484375, -0.207763671875, -0.1640625, -0.120361328125, -0.07666015625, -0.032958984375, 0.0107421875, 0.054443359375, 0.09814453125, 0.141845703125, 0.185546875, 0.229248046875, 0.27294921875, 0.316650390625, 0.3603515625, 0.404052734375, 0.44775390625, 0.491455078125, 0.53515625, 0.578857421875, 0.62255859375, 0.666259765625, 0.7099609375, 0.753662109375, 0.79736328125, 0.841064453125, 0.884765625, 0.928466796875, 0.97216796875, 1.015869140625, 1.0595703125, 1.103271484375, 1.14697265625, 1.190673828125, 1.234375, 1.278076171875, 1.32177734375, 1.365478515625, 1.4091796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 6.0, 6.0, 7.0, 18.0, 23.0, 36.0, 50.0, 48.0, 96.0, 147.0, 143.0, 128.0, 88.0, 58.0, 44.0, 26.0, 17.0, 10.0, 4.0, 7.0, 12.0, 3.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012636184692382812, -0.001215815544128418, -0.0011680126190185547, -0.0011202096939086914, -0.0010724067687988281, -0.0010246038436889648, -0.0009768009185791016, -0.0009289979934692383, -0.000881195068359375, -0.0008333921432495117, -0.0007855892181396484, -0.0007377862930297852, -0.0006899833679199219, -0.0006421804428100586, -0.0005943775177001953, -0.000546574592590332, -0.0004987716674804688, -0.00045096874237060547, -0.0004031658172607422, -0.0003553628921508789, -0.0003075599670410156, -0.00025975704193115234, -0.00021195411682128906, -0.00016415119171142578, -0.0001163482666015625, -6.854534149169922e-05, -2.0742416381835938e-05, 2.7060508728027344e-05, 7.486343383789062e-05, 0.0001226663589477539, 0.0001704692840576172, 0.00021827220916748047, 0.00026607513427734375, 0.00031387805938720703, 0.0003616809844970703, 0.0004094839096069336, 0.0004572868347167969, 0.0005050897598266602, 0.0005528926849365234, 0.0006006956100463867, 0.00064849853515625, 0.0006963014602661133, 0.0007441043853759766, 0.0007919073104858398, 0.0008397102355957031, 0.0008875131607055664, 0.0009353160858154297, 0.000983119010925293, 0.0010309219360351562, 0.0010787248611450195, 0.0011265277862548828, 0.001174330711364746, 0.0012221336364746094, 0.0012699365615844727, 0.001317739486694336, 0.0013655424118041992, 0.0014133453369140625, 0.0014611482620239258, 0.001508951187133789, 0.0015567541122436523, 0.0016045570373535156, 0.001652359962463379, 0.0017001628875732422, 0.0017479658126831055, 0.0017957687377929688]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 10.0, 5.0, 13.0, 26.0, 30.0, 42.0, 45.0, 93.0, 131.0, 209.0, 482.0, 1346.0, 1039219.0, 5283.0, 734.0, 324.0, 192.0, 135.0, 68.0, 50.0, 30.0, 18.0, 13.0, 9.0, 10.0, 4.0, 3.0, 7.0, 3.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0310821533203125, -0.030279159545898438, -0.029476165771484375, -0.028673171997070312, -0.02787017822265625, -0.027067184448242188, -0.026264190673828125, -0.025461196899414062, -0.024658203125, -0.023855209350585938, -0.023052215576171875, -0.022249221801757812, -0.02144622802734375, -0.020643234252929688, -0.019840240478515625, -0.019037246704101562, -0.0182342529296875, -0.017431259155273438, -0.016628265380859375, -0.015825271606445312, -0.01502227783203125, -0.014219284057617188, -0.013416290283203125, -0.012613296508789062, -0.011810302734375, -0.011007308959960938, -0.010204315185546875, -0.009401321411132812, -0.00859832763671875, -0.0077953338623046875, -0.006992340087890625, -0.0061893463134765625, -0.0053863525390625, -0.0045833587646484375, -0.003780364990234375, -0.0029773712158203125, -0.00217437744140625, -0.0013713836669921875, -0.000568389892578125, 0.0002346038818359375, 0.00103759765625, 0.0018405914306640625, 0.002643585205078125, 0.0034465789794921875, 0.00424957275390625, 0.0050525665283203125, 0.005855560302734375, 0.0066585540771484375, 0.0074615478515625, 0.008264541625976562, 0.009067535400390625, 0.009870529174804688, 0.01067352294921875, 0.011476516723632812, 0.012279510498046875, 0.013082504272460938, 0.013885498046875, 0.014688491821289062, 0.015491485595703125, 0.016294479370117188, 0.01709747314453125, 0.017900466918945312, 0.018703460693359375, 0.019506454467773438, 0.0203094482421875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 43.0, 485.0, 456.0, 25.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011713054263964295, -0.0011060769902542233, -0.0010408485541120172, -0.0009756201761774719, -0.0009103917400352657, -0.0008451633038930595, -0.0007799349259585142, -0.000714706489816308, -0.0006494780536741018, -0.0005842496175318956, -0.0005190211813896894, -0.00045379280345514417, -0.000388564367312938, -0.0003233359311707318, -0.00025810752413235605, -0.0001928791170939803, -0.00012765068095177412, -6.242225936148316e-05, 2.806162228807807e-06, 6.803458381909877e-05, 0.00013326300540938973, 0.00019849144155159593, 0.00026371984858997166, 0.0003289482556283474, 0.0003941766917705536, 0.0004594051279127598, 0.000524633564054966, 0.0005898619419895113, 0.0006550903781317174, 0.0007203188142739236, 0.0007855471922084689, 0.0008507756283506751, 0.0009160039480775595, 0.0009812323842197657, 0.0010464608203619719, 0.001111689256504178, 0.0011769176926463842, 0.0012421461287885904, 0.0013073744485154748, 0.001372602884657681, 0.0014378313207998872, 0.0015030597569420934, 0.0015682881930842996, 0.0016335166292265058, 0.0016987449489533901, 0.0017639733850955963, 0.0018292018212378025, 0.0018944302573800087, 0.001959658693522215, 0.002024887129664421, 0.0020901155658066273, 0.0021553440019488335, 0.0022205724380910397, 0.002285800874233246, 0.002351029310375452, 0.0024162577465176582, 0.0024814861826598644, 0.0025467146188020706, 0.002611943054944277, 0.002677171491086483, 0.002742399927228689, 0.0028076283633708954, 0.0028728567995131016, 0.0029380852356553078, 0.0030033134389668703]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 10.0, 5.0, 4.0, 6.0, 9.0, 4.0, 9.0, 8.0, 8.0, 23.0, 15.0, 15.0, 27.0, 23.0, 24.0, 20.0, 26.0, 27.0, 40.0, 32.0, 36.0, 41.0, 32.0, 36.0, 44.0, 32.0, 31.0, 41.0, 33.0, 31.0, 32.0, 35.0, 33.0, 22.0, 31.0, 27.0, 24.0, 24.0, 8.0, 13.0, 11.0, 16.0, 13.0, 8.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00046247243881225586, -0.0004483051598072052, -0.00043413788080215454, -0.0004199706017971039, -0.0004058033227920532, -0.00039163604378700256, -0.0003774687647819519, -0.00036330148577690125, -0.0003491342067718506, -0.0003349669277667999, -0.00032079964876174927, -0.0003066323697566986, -0.00029246509075164795, -0.0002782978117465973, -0.00026413053274154663, -0.00024996325373649597, -0.0002357959747314453, -0.00022162869572639465, -0.000207461416721344, -0.00019329413771629333, -0.00017912685871124268, -0.00016495957970619202, -0.00015079230070114136, -0.0001366250216960907, -0.00012245774269104004, -0.00010829046368598938, -9.412318468093872e-05, -7.995590567588806e-05, -6.57886266708374e-05, -5.162134766578674e-05, -3.7454068660736084e-05, -2.3286789655685425e-05, -9.119510650634766e-06, 5.0477683544158936e-06, 1.9215047359466553e-05, 3.338232636451721e-05, 4.754960536956787e-05, 6.171688437461853e-05, 7.588416337966919e-05, 9.005144238471985e-05, 0.00010421872138977051, 0.00011838600039482117, 0.00013255327939987183, 0.00014672055840492249, 0.00016088783740997314, 0.0001750551164150238, 0.00018922239542007446, 0.00020338967442512512, 0.00021755695343017578, 0.00023172423243522644, 0.0002458915114402771, 0.00026005879044532776, 0.0002742260694503784, 0.0002883933484554291, 0.00030256062746047974, 0.0003167279064655304, 0.00033089518547058105, 0.0003450624644756317, 0.0003592297434806824, 0.00037339702248573303, 0.0003875643014907837, 0.00040173158049583435, 0.000415898859500885, 0.00043006613850593567, 0.00044423341751098633]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 7.0, 8.0, 3.0, 7.0, 12.0, 12.0, 2.0, 18.0, 27.0, 17.0, 27.0, 23.0, 30.0, 27.0, 26.0, 41.0, 45.0, 33.0, 43.0, 57.0, 45.0, 44.0, 40.0, 51.0, 36.0, 41.0, 26.0, 31.0, 24.0, 29.0, 25.0, 29.0, 22.0, 15.0, 10.0, 17.0, 11.0, 8.0, 7.0, 6.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1015625, -6.8798828125, -6.658203125, -6.4365234375, -6.21484375, -5.9931640625, -5.771484375, -5.5498046875, -5.328125, -5.1064453125, -4.884765625, -4.6630859375, -4.44140625, -4.2197265625, -3.998046875, -3.7763671875, -3.5546875, -3.3330078125, -3.111328125, -2.8896484375, -2.66796875, -2.4462890625, -2.224609375, -2.0029296875, -1.78125, -1.5595703125, -1.337890625, -1.1162109375, -0.89453125, -0.6728515625, -0.451171875, -0.2294921875, -0.0078125, 0.2138671875, 0.435546875, 0.6572265625, 0.87890625, 1.1005859375, 1.322265625, 1.5439453125, 1.765625, 1.9873046875, 2.208984375, 2.4306640625, 2.65234375, 2.8740234375, 3.095703125, 3.3173828125, 3.5390625, 3.7607421875, 3.982421875, 4.2041015625, 4.42578125, 4.6474609375, 4.869140625, 5.0908203125, 5.3125, 5.5341796875, 5.755859375, 5.9775390625, 6.19921875, 6.4208984375, 6.642578125, 6.8642578125, 7.0859375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 7.0, 10.0, 8.0, 11.0, 17.0, 20.0, 29.0, 49.0, 53.0, 79.0, 113.0, 165.0, 211.0, 337.0, 512.0, 820.0, 1498.0, 2838.0, 6745.0, 20185.0, 83583.0, 556916.0, 300546.0, 49777.0, 13488.0, 4956.0, 2233.0, 1187.0, 740.0, 444.0, 267.0, 195.0, 128.0, 89.0, 82.0, 50.0, 36.0, 32.0, 24.0, 22.0, 10.0, 10.0, 13.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-13.3984375, -12.9903564453125, -12.582275390625, -12.1741943359375, -11.76611328125, -11.3580322265625, -10.949951171875, -10.5418701171875, -10.1337890625, -9.7257080078125, -9.317626953125, -8.9095458984375, -8.50146484375, -8.0933837890625, -7.685302734375, -7.2772216796875, -6.869140625, -6.4610595703125, -6.052978515625, -5.6448974609375, -5.23681640625, -4.8287353515625, -4.420654296875, -4.0125732421875, -3.6044921875, -3.1964111328125, -2.788330078125, -2.3802490234375, -1.97216796875, -1.5640869140625, -1.156005859375, -0.7479248046875, -0.33984375, 0.0682373046875, 0.476318359375, 0.8843994140625, 1.29248046875, 1.7005615234375, 2.108642578125, 2.5167236328125, 2.9248046875, 3.3328857421875, 3.740966796875, 4.1490478515625, 4.55712890625, 4.9652099609375, 5.373291015625, 5.7813720703125, 6.189453125, 6.5975341796875, 7.005615234375, 7.4136962890625, 7.82177734375, 8.2298583984375, 8.637939453125, 9.0460205078125, 9.4541015625, 9.8621826171875, 10.270263671875, 10.6783447265625, 11.08642578125, 11.4945068359375, 11.902587890625, 12.3106689453125, 12.71875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 3.0, 6.0, 12.0, 14.0, 18.0, 20.0, 23.0, 39.0, 40.0, 49.0, 63.0, 73.0, 83.0, 255.0, 1775.0, 166.0, 91.0, 60.0, 50.0, 51.0, 39.0, 29.0, 21.0, 18.0, 17.0, 8.0, 4.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.890625, -26.083740234375, -25.27685546875, -24.469970703125, -23.6630859375, -22.856201171875, -22.04931640625, -21.242431640625, -20.435546875, -19.628662109375, -18.82177734375, -18.014892578125, -17.2080078125, -16.401123046875, -15.59423828125, -14.787353515625, -13.98046875, -13.173583984375, -12.36669921875, -11.559814453125, -10.7529296875, -9.946044921875, -9.13916015625, -8.332275390625, -7.525390625, -6.718505859375, -5.91162109375, -5.104736328125, -4.2978515625, -3.490966796875, -2.68408203125, -1.877197265625, -1.0703125, -0.263427734375, 0.54345703125, 1.350341796875, 2.1572265625, 2.964111328125, 3.77099609375, 4.577880859375, 5.384765625, 6.191650390625, 6.99853515625, 7.805419921875, 8.6123046875, 9.419189453125, 10.22607421875, 11.032958984375, 11.83984375, 12.646728515625, 13.45361328125, 14.260498046875, 15.0673828125, 15.874267578125, 16.68115234375, 17.488037109375, 18.294921875, 19.101806640625, 19.90869140625, 20.715576171875, 21.5224609375, 22.329345703125, 23.13623046875, 23.943115234375, 24.75]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 3.0, 5.0, 8.0, 12.0, 14.0, 20.0, 22.0, 39.0, 51.0, 94.0, 156.0, 358.0, 885.0, 8764.0, 3131510.0, 2347.0, 671.0, 301.0, 148.0, 106.0, 57.0, 33.0, 21.0, 21.0, 10.0, 18.0, 10.0, 5.0, 4.0, 1.0, 1.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.125, -64.8369140625, -62.548828125, -60.2607421875, -57.97265625, -55.6845703125, -53.396484375, -51.1083984375, -48.8203125, -46.5322265625, -44.244140625, -41.9560546875, -39.66796875, -37.3798828125, -35.091796875, -32.8037109375, -30.515625, -28.2275390625, -25.939453125, -23.6513671875, -21.36328125, -19.0751953125, -16.787109375, -14.4990234375, -12.2109375, -9.9228515625, -7.634765625, -5.3466796875, -3.05859375, -0.7705078125, 1.517578125, 3.8056640625, 6.09375, 8.3818359375, 10.669921875, 12.9580078125, 15.24609375, 17.5341796875, 19.822265625, 22.1103515625, 24.3984375, 26.6865234375, 28.974609375, 31.2626953125, 33.55078125, 35.8388671875, 38.126953125, 40.4150390625, 42.703125, 44.9912109375, 47.279296875, 49.5673828125, 51.85546875, 54.1435546875, 56.431640625, 58.7197265625, 61.0078125, 63.2958984375, 65.583984375, 67.8720703125, 70.16015625, 72.4482421875, 74.736328125, 77.0244140625, 79.3125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 46.0, 550.0, 375.0, 34.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.448726654052734, -50.06769561767578, -46.68666076660156, -43.30562973022461, -39.924598693847656, -36.54356384277344, -33.162532806396484, -29.7814998626709, -26.400466918945312, -23.019433975219727, -19.63840103149414, -16.257369995117188, -12.876337051391602, -9.495304107666016, -6.1142730712890625, -2.7332401275634766, 0.6477928161621094, 4.028825283050537, 7.409857749938965, 10.790889739990234, 14.17192268371582, 17.552955627441406, 20.93398666381836, 24.315019607543945, 27.69605255126953, 31.077085494995117, 34.4581184387207, 37.839149475097656, 41.220184326171875, 44.60121536254883, 47.98224639892578, 51.36328125, 54.74430847167969, 58.12533950805664, 61.50637435913086, 64.88740539550781, 68.26844024658203, 71.64947509765625, 75.03050231933594, 78.41153717041016, 81.79257202148438, 85.1736068725586, 88.55463409423828, 91.9356689453125, 95.31670379638672, 98.69773864746094, 102.07876586914062, 105.45980072021484, 108.84082794189453, 112.22186279296875, 115.60289001464844, 118.98392486572266, 122.36495971679688, 125.74598693847656, 129.12701416015625, 132.508056640625, 135.8890838623047, 139.27011108398438, 142.65115356445312, 146.0321807861328, 149.4132080078125, 152.79425048828125, 156.17527770996094, 159.55630493164062, 162.93734741210938]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 6.0, 4.0, 6.0, 3.0, 8.0, 8.0, 13.0, 10.0, 18.0, 24.0, 32.0, 25.0, 28.0, 29.0, 27.0, 43.0, 41.0, 37.0, 48.0, 44.0, 53.0, 37.0, 43.0, 37.0, 37.0, 49.0, 38.0, 27.0, 35.0, 18.0, 31.0, 22.0, 22.0, 11.0, 15.0, 15.0, 10.0, 11.0, 7.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-43.581878662109375, -42.16793441772461, -40.75399398803711, -39.340049743652344, -37.92610549926758, -36.51216125488281, -35.09822082519531, -33.68427658081055, -32.27033233642578, -30.85638999938965, -29.442445755004883, -28.02850341796875, -26.614559173583984, -25.20061683654785, -23.78667449951172, -22.372730255126953, -20.95878791809082, -19.544845581054688, -18.130901336669922, -16.71695899963379, -15.303014755249023, -13.88907241821289, -12.475129127502441, -11.061185836791992, -9.647242546081543, -8.233299255371094, -6.8193559646606445, -5.4054131507873535, -3.9914698600769043, -2.577526569366455, -1.163583755493164, 0.25035953521728516, 1.6643028259277344, 3.0782461166381836, 4.492189407348633, 5.906132221221924, 7.320075511932373, 8.734018325805664, 10.147961616516113, 11.561904907226562, 12.975848197937012, 14.389791488647461, 15.80373477935791, 17.21767807006836, 18.631620407104492, 20.045564651489258, 21.45950698852539, 22.873451232910156, 24.28739356994629, 25.701335906982422, 27.115280151367188, 28.52922248840332, 29.943166732788086, 31.35710906982422, 32.771053314208984, 34.18499755859375, 35.59893798828125, 37.012882232666016, 38.426822662353516, 39.84076690673828, 41.25471115112305, 42.66865539550781, 44.08259582519531, 45.49654006958008, 46.910484313964844]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 4.0, 2.0, 6.0, 8.0, 3.0, 7.0, 10.0, 15.0, 14.0, 11.0, 17.0, 22.0, 21.0, 17.0, 32.0, 28.0, 31.0, 31.0, 37.0, 28.0, 30.0, 47.0, 40.0, 37.0, 39.0, 46.0, 36.0, 37.0, 30.0, 33.0, 35.0, 31.0, 23.0, 28.0, 19.0, 15.0, 21.0, 12.0, 13.0, 15.0, 8.0, 9.0, 8.0, 12.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-7.72265625, -7.48687744140625, -7.2510986328125, -7.01531982421875, -6.779541015625, -6.54376220703125, -6.3079833984375, -6.07220458984375, -5.83642578125, -5.60064697265625, -5.3648681640625, -5.12908935546875, -4.893310546875, -4.65753173828125, -4.4217529296875, -4.18597412109375, -3.9501953125, -3.71441650390625, -3.4786376953125, -3.24285888671875, -3.007080078125, -2.77130126953125, -2.5355224609375, -2.29974365234375, -2.06396484375, -1.82818603515625, -1.5924072265625, -1.35662841796875, -1.120849609375, -0.88507080078125, -0.6492919921875, -0.41351318359375, -0.177734375, 0.05804443359375, 0.2938232421875, 0.52960205078125, 0.765380859375, 1.00115966796875, 1.2369384765625, 1.47271728515625, 1.70849609375, 1.94427490234375, 2.1800537109375, 2.41583251953125, 2.651611328125, 2.88739013671875, 3.1231689453125, 3.35894775390625, 3.5947265625, 3.83050537109375, 4.0662841796875, 4.30206298828125, 4.537841796875, 4.77362060546875, 5.0093994140625, 5.24517822265625, 5.48095703125, 5.71673583984375, 5.9525146484375, 6.18829345703125, 6.424072265625, 6.65985107421875, 6.8956298828125, 7.13140869140625, 7.3671875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 6.0, 16.0, 12.0, 15.0, 17.0, 19.0, 34.0, 42.0, 37.0, 48.0, 54.0, 70.0, 93.0, 131.0, 167.0, 203.0, 305.0, 436.0, 734.0, 1542.0, 5395.0, 619910.0, 3538954.0, 20589.0, 2450.0, 969.0, 550.0, 373.0, 239.0, 179.0, 131.0, 130.0, 85.0, 72.0, 62.0, 38.0, 29.0, 24.0, 23.0, 17.0, 13.0, 16.0, 6.0, 12.0, 6.0, 9.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0], "bins": [-55.09375, -53.484375, -51.875, -50.265625, -48.65625, -47.046875, -45.4375, -43.828125, -42.21875, -40.609375, -39.0, -37.390625, -35.78125, -34.171875, -32.5625, -30.953125, -29.34375, -27.734375, -26.125, -24.515625, -22.90625, -21.296875, -19.6875, -18.078125, -16.46875, -14.859375, -13.25, -11.640625, -10.03125, -8.421875, -6.8125, -5.203125, -3.59375, -1.984375, -0.375, 1.234375, 2.84375, 4.453125, 6.0625, 7.671875, 9.28125, 10.890625, 12.5, 14.109375, 15.71875, 17.328125, 18.9375, 20.546875, 22.15625, 23.765625, 25.375, 26.984375, 28.59375, 30.203125, 31.8125, 33.421875, 35.03125, 36.640625, 38.25, 39.859375, 41.46875, 43.078125, 44.6875, 46.296875, 47.90625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 10.0, 5.0, 14.0, 20.0, 35.0, 55.0, 100.0, 233.0, 455.0, 830.0, 954.0, 676.0, 322.0, 169.0, 85.0, 35.0, 24.0, 18.0, 9.0, 10.0, 5.0, 1.0, 6.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.203125, -27.535400390625, -26.86767578125, -26.199951171875, -25.5322265625, -24.864501953125, -24.19677734375, -23.529052734375, -22.861328125, -22.193603515625, -21.52587890625, -20.858154296875, -20.1904296875, -19.522705078125, -18.85498046875, -18.187255859375, -17.51953125, -16.851806640625, -16.18408203125, -15.516357421875, -14.8486328125, -14.180908203125, -13.51318359375, -12.845458984375, -12.177734375, -11.510009765625, -10.84228515625, -10.174560546875, -9.5068359375, -8.839111328125, -8.17138671875, -7.503662109375, -6.8359375, -6.168212890625, -5.50048828125, -4.832763671875, -4.1650390625, -3.497314453125, -2.82958984375, -2.161865234375, -1.494140625, -0.826416015625, -0.15869140625, 0.509033203125, 1.1767578125, 1.844482421875, 2.51220703125, 3.179931640625, 3.84765625, 4.515380859375, 5.18310546875, 5.850830078125, 6.5185546875, 7.186279296875, 7.85400390625, 8.521728515625, 9.189453125, 9.857177734375, 10.52490234375, 11.192626953125, 11.8603515625, 12.528076171875, 13.19580078125, 13.863525390625, 14.53125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 11.0, 9.0, 13.0, 29.0, 49.0, 136.0, 294.0, 933.0, 4868.0, 105329.0, 3986484.0, 90233.0, 4524.0, 854.0, 272.0, 112.0, 57.0, 30.0, 17.0, 7.0, 7.0, 3.0, 1.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.28125, -37.202392578125, -36.12353515625, -35.044677734375, -33.9658203125, -32.886962890625, -31.80810546875, -30.729248046875, -29.650390625, -28.571533203125, -27.49267578125, -26.413818359375, -25.3349609375, -24.256103515625, -23.17724609375, -22.098388671875, -21.01953125, -19.940673828125, -18.86181640625, -17.782958984375, -16.7041015625, -15.625244140625, -14.54638671875, -13.467529296875, -12.388671875, -11.309814453125, -10.23095703125, -9.152099609375, -8.0732421875, -6.994384765625, -5.91552734375, -4.836669921875, -3.7578125, -2.678955078125, -1.60009765625, -0.521240234375, 0.5576171875, 1.636474609375, 2.71533203125, 3.794189453125, 4.873046875, 5.951904296875, 7.03076171875, 8.109619140625, 9.1884765625, 10.267333984375, 11.34619140625, 12.425048828125, 13.50390625, 14.582763671875, 15.66162109375, 16.740478515625, 17.8193359375, 18.898193359375, 19.97705078125, 21.055908203125, 22.134765625, 23.213623046875, 24.29248046875, 25.371337890625, 26.4501953125, 27.529052734375, 28.60791015625, 29.686767578125, 30.765625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 62.0, 214.0, 358.0, 258.0, 81.0, 17.0, 6.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.35330200195312, -242.5831756591797, -233.81304931640625, -225.04290771484375, -216.2727813720703, -207.50265502929688, -198.73252868652344, -189.96240234375, -181.1922607421875, -172.42213439941406, -163.65200805664062, -154.88186645507812, -146.1117401123047, -137.34161376953125, -128.5714874267578, -119.80136108398438, -111.03123474121094, -102.2611083984375, -93.49097442626953, -84.7208480834961, -75.95071411132812, -67.18058776855469, -58.41046142578125, -49.64033126831055, -40.870201110839844, -32.10007095336914, -23.32994270324707, -14.559814453125, -5.789684295654297, 2.9804458618164062, 11.750572204589844, 20.520702362060547, 29.29083251953125, 38.06096267700195, 46.831092834472656, 55.601219177246094, 64.37135314941406, 73.1414794921875, 81.91160583496094, 90.68173217773438, 99.45186614990234, 108.22199249267578, 116.99212646484375, 125.76225280761719, 134.53237915039062, 143.30252075195312, 152.0726318359375, 160.8427734375, 169.61289978027344, 178.38302612304688, 187.1531524658203, 195.92327880859375, 204.69342041015625, 213.4635467529297, 222.23367309570312, 231.00379943847656, 239.77392578125, 248.54405212402344, 257.3141784667969, 266.0843200683594, 274.85443115234375, 283.62457275390625, 292.39471435546875, 301.1648254394531, 309.9349670410156]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 1.0, 5.0, 4.0, 12.0, 14.0, 11.0, 7.0, 12.0, 20.0, 20.0, 25.0, 17.0, 37.0, 21.0, 32.0, 33.0, 34.0, 32.0, 45.0, 29.0, 47.0, 37.0, 43.0, 40.0, 32.0, 31.0, 46.0, 40.0, 38.0, 31.0, 31.0, 25.0, 20.0, 17.0, 20.0, 19.0, 8.0, 9.0, 10.0, 9.0, 7.0, 5.0, 4.0, 5.0, 6.0, 5.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-40.90593719482422, -39.5831298828125, -38.26032257080078, -36.93751525878906, -35.61470413208008, -34.29189682006836, -32.96908950805664, -31.646282196044922, -30.323474884033203, -29.000667572021484, -27.677858352661133, -26.355051040649414, -25.032243728637695, -23.709434509277344, -22.386627197265625, -21.063819885253906, -19.741010665893555, -18.418203353881836, -17.095394134521484, -15.772586822509766, -14.449779510498047, -13.126971244812012, -11.804162979125977, -10.481355667114258, -9.158547401428223, -7.835739612579346, -6.512931823730469, -5.190123558044434, -3.8673157691955566, -2.5445079803466797, -1.2216997146606445, 0.10110759735107422, 1.4239158630371094, 2.7467236518859863, 4.069531440734863, 5.392339706420898, 6.715147495269775, 8.037955284118652, 9.360763549804688, 10.683570861816406, 12.006379127502441, 13.329187393188477, 14.651994705200195, 15.97480297088623, 17.297611236572266, 18.620418548583984, 19.943225860595703, 21.266033172607422, 22.588842391967773, 23.911649703979492, 25.234458923339844, 26.557266235351562, 27.88007354736328, 29.202880859375, 30.52569007873535, 31.84849739074707, 33.17130661010742, 34.49411392211914, 35.81692123413086, 37.139732360839844, 38.46253967285156, 39.78534698486328, 41.108154296875, 42.43096160888672, 43.75376892089844]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 3.0, 8.0, 7.0, 5.0, 11.0, 13.0, 15.0, 17.0, 22.0, 19.0, 26.0, 28.0, 36.0, 27.0, 44.0, 44.0, 32.0, 40.0, 47.0, 38.0, 40.0, 45.0, 43.0, 39.0, 37.0, 41.0, 45.0, 30.0, 31.0, 28.0, 18.0, 16.0, 17.0, 18.0, 14.0, 6.0, 12.0, 5.0, 4.0, 4.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-70.625, -68.494140625, -66.36328125, -64.232421875, -62.1015625, -59.970703125, -57.83984375, -55.708984375, -53.578125, -51.447265625, -49.31640625, -47.185546875, -45.0546875, -42.923828125, -40.79296875, -38.662109375, -36.53125, -34.400390625, -32.26953125, -30.138671875, -28.0078125, -25.876953125, -23.74609375, -21.615234375, -19.484375, -17.353515625, -15.22265625, -13.091796875, -10.9609375, -8.830078125, -6.69921875, -4.568359375, -2.4375, -0.306640625, 1.82421875, 3.955078125, 6.0859375, 8.216796875, 10.34765625, 12.478515625, 14.609375, 16.740234375, 18.87109375, 21.001953125, 23.1328125, 25.263671875, 27.39453125, 29.525390625, 31.65625, 33.787109375, 35.91796875, 38.048828125, 40.1796875, 42.310546875, 44.44140625, 46.572265625, 48.703125, 50.833984375, 52.96484375, 55.095703125, 57.2265625, 59.357421875, 61.48828125, 63.619140625, 65.75]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 9.0, 12.0, 19.0, 30.0, 41.0, 75.0, 99.0, 134.0, 209.0, 280.0, 386.0, 573.0, 765.0, 1082.0, 1532.0, 2178.0, 3115.0, 4457.0, 6713.0, 9487.0, 14172.0, 21906.0, 33954.0, 55287.0, 95644.0, 207373.0, 289595.0, 117767.0, 65260.0, 39778.0, 25332.0, 16136.0, 10885.0, 7318.0, 5093.0, 3506.0, 2431.0, 1683.0, 1258.0, 892.0, 605.0, 432.0, 325.0, 234.0, 159.0, 111.0, 78.0, 49.0, 31.0, 28.0, 20.0, 8.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-12.3828125, -11.997802734375, -11.61279296875, -11.227783203125, -10.8427734375, -10.457763671875, -10.07275390625, -9.687744140625, -9.302734375, -8.917724609375, -8.53271484375, -8.147705078125, -7.7626953125, -7.377685546875, -6.99267578125, -6.607666015625, -6.22265625, -5.837646484375, -5.45263671875, -5.067626953125, -4.6826171875, -4.297607421875, -3.91259765625, -3.527587890625, -3.142578125, -2.757568359375, -2.37255859375, -1.987548828125, -1.6025390625, -1.217529296875, -0.83251953125, -0.447509765625, -0.0625, 0.322509765625, 0.70751953125, 1.092529296875, 1.4775390625, 1.862548828125, 2.24755859375, 2.632568359375, 3.017578125, 3.402587890625, 3.78759765625, 4.172607421875, 4.5576171875, 4.942626953125, 5.32763671875, 5.712646484375, 6.09765625, 6.482666015625, 6.86767578125, 7.252685546875, 7.6376953125, 8.022705078125, 8.40771484375, 8.792724609375, 9.177734375, 9.562744140625, 9.94775390625, 10.332763671875, 10.7177734375, 11.102783203125, 11.48779296875, 11.872802734375, 12.2578125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 7.0, 8.0, 4.0, 8.0, 13.0, 11.0, 9.0, 21.0, 20.0, 25.0, 16.0, 33.0, 28.0, 28.0, 28.0, 33.0, 33.0, 35.0, 42.0, 27.0, 45.0, 1052.0, 38.0, 40.0, 40.0, 37.0, 33.0, 31.0, 30.0, 32.0, 21.0, 20.0, 21.0, 25.0, 25.0, 14.0, 17.0, 10.0, 7.0, 11.0, 4.0, 9.0, 2.0, 4.0, 7.0, 4.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.84375, -33.6220703125, -32.400390625, -31.1787109375, -29.95703125, -28.7353515625, -27.513671875, -26.2919921875, -25.0703125, -23.8486328125, -22.626953125, -21.4052734375, -20.18359375, -18.9619140625, -17.740234375, -16.5185546875, -15.296875, -14.0751953125, -12.853515625, -11.6318359375, -10.41015625, -9.1884765625, -7.966796875, -6.7451171875, -5.5234375, -4.3017578125, -3.080078125, -1.8583984375, -0.63671875, 0.5849609375, 1.806640625, 3.0283203125, 4.25, 5.4716796875, 6.693359375, 7.9150390625, 9.13671875, 10.3583984375, 11.580078125, 12.8017578125, 14.0234375, 15.2451171875, 16.466796875, 17.6884765625, 18.91015625, 20.1318359375, 21.353515625, 22.5751953125, 23.796875, 25.0185546875, 26.240234375, 27.4619140625, 28.68359375, 29.9052734375, 31.126953125, 32.3486328125, 33.5703125, 34.7919921875, 36.013671875, 37.2353515625, 38.45703125, 39.6787109375, 40.900390625, 42.1220703125, 43.34375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 12.0, 16.0, 24.0, 39.0, 57.0, 88.0, 102.0, 197.0, 217.0, 340.0, 508.0, 703.0, 1048.0, 1605.0, 2344.0, 3489.0, 5155.0, 7548.0, 11332.0, 16963.0, 26139.0, 39450.0, 62657.0, 106024.0, 227351.0, 1289214.0, 109798.0, 64122.0, 40611.0, 26728.0, 17514.0, 11585.0, 7767.0, 5284.0, 3573.0, 2412.0, 1638.0, 1121.0, 747.0, 514.0, 364.0, 237.0, 156.0, 114.0, 78.0, 59.0, 34.0, 19.0, 12.0, 11.0, 8.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.9375, -12.5335693359375, -12.129638671875, -11.7257080078125, -11.32177734375, -10.9178466796875, -10.513916015625, -10.1099853515625, -9.7060546875, -9.3021240234375, -8.898193359375, -8.4942626953125, -8.09033203125, -7.6864013671875, -7.282470703125, -6.8785400390625, -6.474609375, -6.0706787109375, -5.666748046875, -5.2628173828125, -4.85888671875, -4.4549560546875, -4.051025390625, -3.6470947265625, -3.2431640625, -2.8392333984375, -2.435302734375, -2.0313720703125, -1.62744140625, -1.2235107421875, -0.819580078125, -0.4156494140625, -0.01171875, 0.3922119140625, 0.796142578125, 1.2000732421875, 1.60400390625, 2.0079345703125, 2.411865234375, 2.8157958984375, 3.2197265625, 3.6236572265625, 4.027587890625, 4.4315185546875, 4.83544921875, 5.2393798828125, 5.643310546875, 6.0472412109375, 6.451171875, 6.8551025390625, 7.259033203125, 7.6629638671875, 8.06689453125, 8.4708251953125, 8.874755859375, 9.2786865234375, 9.6826171875, 10.0865478515625, 10.490478515625, 10.8944091796875, 11.29833984375, 11.7022705078125, 12.106201171875, 12.5101318359375, 12.9140625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 4.0, 9.0, 17.0, 14.0, 20.0, 21.0, 40.0, 55.0, 74.0, 109.0, 139.0, 127.0, 119.0, 61.0, 38.0, 37.0, 28.0, 15.0, 12.0, 8.0, 8.0, 12.0, 4.0, 0.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01418304443359375, -0.013738632202148438, -0.013294219970703125, -0.012849807739257812, -0.0124053955078125, -0.011960983276367188, -0.011516571044921875, -0.011072158813476562, -0.01062774658203125, -0.010183334350585938, -0.009738922119140625, -0.009294509887695312, -0.00885009765625, -0.008405685424804688, -0.007961273193359375, -0.0075168609619140625, -0.00707244873046875, -0.0066280364990234375, -0.006183624267578125, -0.0057392120361328125, -0.0052947998046875, -0.0048503875732421875, -0.004405975341796875, -0.0039615631103515625, -0.00351715087890625, -0.0030727386474609375, -0.002628326416015625, -0.0021839141845703125, -0.001739501953125, -0.0012950897216796875, -0.000850677490234375, -0.0004062652587890625, 3.814697265625e-05, 0.0004825592041015625, 0.000926971435546875, 0.0013713836669921875, 0.0018157958984375, 0.0022602081298828125, 0.002704620361328125, 0.0031490325927734375, 0.00359344482421875, 0.0040378570556640625, 0.004482269287109375, 0.0049266815185546875, 0.00537109375, 0.0058155059814453125, 0.006259918212890625, 0.0067043304443359375, 0.00714874267578125, 0.0075931549072265625, 0.008037567138671875, 0.008481979370117188, 0.0089263916015625, 0.009370803833007812, 0.009815216064453125, 0.010259628295898438, 0.01070404052734375, 0.011148452758789062, 0.011592864990234375, 0.012037277221679688, 0.012481689453125, 0.012926101684570312, 0.013370513916015625, 0.013814926147460938, 0.01425933837890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 5.0, 8.0, 11.0, 8.0, 11.0, 15.0, 28.0, 31.0, 41.0, 45.0, 82.0, 101.0, 172.0, 277.0, 530.0, 1410.0, 5474.0, 37178.0, 670673.0, 304962.0, 21530.0, 3696.0, 1053.0, 426.0, 213.0, 165.0, 110.0, 75.0, 63.0, 41.0, 25.0, 18.0, 16.0, 8.0, 10.0, 5.0, 10.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.10748291015625, -0.1041107177734375, -0.100738525390625, -0.0973663330078125, -0.093994140625, -0.0906219482421875, -0.087249755859375, -0.0838775634765625, -0.08050537109375, -0.0771331787109375, -0.073760986328125, -0.0703887939453125, -0.0670166015625, -0.0636444091796875, -0.060272216796875, -0.0569000244140625, -0.05352783203125, -0.0501556396484375, -0.046783447265625, -0.0434112548828125, -0.0400390625, -0.0366668701171875, -0.033294677734375, -0.0299224853515625, -0.02655029296875, -0.0231781005859375, -0.019805908203125, -0.0164337158203125, -0.0130615234375, -0.0096893310546875, -0.006317138671875, -0.0029449462890625, 0.00042724609375, 0.0037994384765625, 0.007171630859375, 0.0105438232421875, 0.013916015625, 0.0172882080078125, 0.020660400390625, 0.0240325927734375, 0.02740478515625, 0.0307769775390625, 0.034149169921875, 0.0375213623046875, 0.0408935546875, 0.0442657470703125, 0.047637939453125, 0.0510101318359375, 0.05438232421875, 0.0577545166015625, 0.061126708984375, 0.0644989013671875, 0.06787109375, 0.0712432861328125, 0.074615478515625, 0.0779876708984375, 0.08135986328125, 0.0847320556640625, 0.088104248046875, 0.0914764404296875, 0.0948486328125, 0.0982208251953125, 0.101593017578125, 0.1049652099609375, 0.10833740234375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 7.0, 2.0, 4.0, 9.0, 23.0, 47.0, 62.0, 103.0, 168.0, 176.0, 167.0, 111.0, 62.0, 36.0, 14.0, 11.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010070371441543102, -0.00965904537588358, -0.009247719310224056, -0.008836394175887108, -0.008425068110227585, -0.008013742044568062, -0.007602415978908539, -0.007191089913249016, -0.00677976431325078, -0.006368438247591257, -0.005957112647593021, -0.005545786581933498, -0.005134460516273975, -0.00472313491627574, -0.004311808850616217, -0.0039004830177873373, -0.003489157184958458, -0.0030778313521295786, -0.0026665055193006992, -0.0022551794536411762, -0.0018438536208122969, -0.0014325277879834175, -0.0010212017223238945, -0.0006098758894950151, -0.0001985500566661358, 0.00021277583437040448, 0.0006241017254069448, 0.001035427674651146, 0.0014467535074800253, 0.0018580793403089046, 0.0022694054059684277, 0.002680731238797307, 0.0030920561403036118, 0.003503381973132491, 0.0039147078059613705, 0.0043260338716208935, 0.004737359471619129, 0.005148685537278652, 0.005560011602938175, 0.005971337668597698, 0.006382663268595934, 0.006793989334255457, 0.007205314934253693, 0.007616640999913216, 0.008027967065572739, 0.008439293131232262, 0.008850619196891785, 0.009261944331228733, 0.009673270396888256, 0.010084596462547779, 0.010495922528207302, 0.01090724766254425, 0.011318573728203773, 0.011729899793863297, 0.01214122585952282, 0.012552551925182343, 0.012963877990841866, 0.013375204056501389, 0.013786530122160912, 0.014197856187820435, 0.014609181322157383, 0.015020507387816906, 0.015431833453476429, 0.015843158587813377, 0.0162544846534729]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 6.0, 11.0, 7.0, 14.0, 11.0, 18.0, 17.0, 13.0, 15.0, 18.0, 30.0, 23.0, 31.0, 29.0, 37.0, 26.0, 29.0, 36.0, 42.0, 32.0, 34.0, 47.0, 27.0, 42.0, 29.0, 46.0, 36.0, 28.0, 23.0, 16.0, 30.0, 28.0, 28.0, 22.0, 27.0, 18.0, 5.0, 12.0, 10.0, 9.0, 7.0, 7.0, 6.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004115641117095947, -0.003977554850280285, -0.0038394685834646225, -0.00370138231664896, -0.0035632960498332977, -0.0034252097830176353, -0.003287123516201973, -0.0031490372493863106, -0.003010950982570648, -0.002872864715754986, -0.0027347784489393234, -0.002596692182123661, -0.0024586059153079987, -0.0023205196484923363, -0.002182433381676674, -0.0020443471148610115, -0.0019062608480453491, -0.0017681745812296867, -0.0016300883144140244, -0.001492002047598362, -0.0013539157807826996, -0.0012158295139670372, -0.0010777432471513748, -0.0009396569803357124, -0.00080157071352005, -0.0006634844467043877, -0.0005253981798887253, -0.0003873119130730629, -0.0002492256462574005, -0.00011113937944173813, 2.6946887373924255e-05, 0.00016503315418958664, 0.000303119421005249, 0.0004412056878209114, 0.0005792919546365738, 0.0007173782214522362, 0.0008554644882678986, 0.000993550755083561, 0.0011316370218992233, 0.0012697232887148857, 0.001407809555530548, 0.0015458958223462105, 0.0016839820891618729, 0.0018220683559775352, 0.0019601546227931976, 0.00209824088960886, 0.0022363271564245224, 0.002374413423240185, 0.002512499690055847, 0.0026505859568715096, 0.002788672223687172, 0.0029267584905028343, 0.0030648447573184967, 0.003202931024134159, 0.0033410172909498215, 0.003479103557765484, 0.0036171898245811462, 0.0037552760913968086, 0.003893362358212471, 0.004031448625028133, 0.004169534891843796, 0.004307621158659458, 0.0044457074254751205, 0.004583793692290783, 0.004721879959106445]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 3.0, 8.0, 7.0, 5.0, 11.0, 14.0, 14.0, 17.0, 23.0, 18.0, 27.0, 26.0, 37.0, 27.0, 43.0, 45.0, 32.0, 40.0, 47.0, 38.0, 39.0, 48.0, 41.0, 39.0, 37.0, 41.0, 45.0, 30.0, 31.0, 28.0, 18.0, 16.0, 17.0, 17.0, 15.0, 6.0, 12.0, 5.0, 4.0, 4.0, 7.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-70.625, -68.494140625, -66.36328125, -64.232421875, -62.1015625, -59.970703125, -57.83984375, -55.708984375, -53.578125, -51.447265625, -49.31640625, -47.185546875, -45.0546875, -42.923828125, -40.79296875, -38.662109375, -36.53125, -34.400390625, -32.26953125, -30.138671875, -28.0078125, -25.876953125, -23.74609375, -21.615234375, -19.484375, -17.353515625, -15.22265625, -13.091796875, -10.9609375, -8.830078125, -6.69921875, -4.568359375, -2.4375, -0.306640625, 1.82421875, 3.955078125, 6.0859375, 8.216796875, 10.34765625, 12.478515625, 14.609375, 16.740234375, 18.87109375, 21.001953125, 23.1328125, 25.263671875, 27.39453125, 29.525390625, 31.65625, 33.787109375, 35.91796875, 38.048828125, 40.1796875, 42.310546875, 44.44140625, 46.572265625, 48.703125, 50.833984375, 52.96484375, 55.095703125, 57.2265625, 59.357421875, 61.48828125, 63.619140625, 65.75]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 10.0, 11.0, 16.0, 15.0, 33.0, 23.0, 38.0, 50.0, 72.0, 93.0, 151.0, 210.0, 367.0, 560.0, 906.0, 1570.0, 2981.0, 5924.0, 14715.0, 49529.0, 249419.0, 555051.0, 118931.0, 28122.0, 9759.0, 4288.0, 2261.0, 1319.0, 772.0, 430.0, 290.0, 174.0, 138.0, 72.0, 66.0, 38.0, 40.0, 19.0, 13.0, 17.0, 12.0, 12.0, 8.0, 8.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0], "bins": [-19.3125, -18.749267578125, -18.18603515625, -17.622802734375, -17.0595703125, -16.496337890625, -15.93310546875, -15.369873046875, -14.806640625, -14.243408203125, -13.68017578125, -13.116943359375, -12.5537109375, -11.990478515625, -11.42724609375, -10.864013671875, -10.30078125, -9.737548828125, -9.17431640625, -8.611083984375, -8.0478515625, -7.484619140625, -6.92138671875, -6.358154296875, -5.794921875, -5.231689453125, -4.66845703125, -4.105224609375, -3.5419921875, -2.978759765625, -2.41552734375, -1.852294921875, -1.2890625, -0.725830078125, -0.16259765625, 0.400634765625, 0.9638671875, 1.527099609375, 2.09033203125, 2.653564453125, 3.216796875, 3.780029296875, 4.34326171875, 4.906494140625, 5.4697265625, 6.032958984375, 6.59619140625, 7.159423828125, 7.72265625, 8.285888671875, 8.84912109375, 9.412353515625, 9.9755859375, 10.538818359375, 11.10205078125, 11.665283203125, 12.228515625, 12.791748046875, 13.35498046875, 13.918212890625, 14.4814453125, 15.044677734375, 15.60791015625, 16.171142578125, 16.734375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 7.0, 18.0, 21.0, 32.0, 47.0, 57.0, 86.0, 93.0, 137.0, 2111.0, 80.0, 80.0, 54.0, 52.0, 48.0, 33.0, 22.0, 17.0, 13.0, 7.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.375, -153.498046875, -147.62109375, -141.744140625, -135.8671875, -129.990234375, -124.11328125, -118.236328125, -112.359375, -106.482421875, -100.60546875, -94.728515625, -88.8515625, -82.974609375, -77.09765625, -71.220703125, -65.34375, -59.466796875, -53.58984375, -47.712890625, -41.8359375, -35.958984375, -30.08203125, -24.205078125, -18.328125, -12.451171875, -6.57421875, -0.697265625, 5.1796875, 11.056640625, 16.93359375, 22.810546875, 28.6875, 34.564453125, 40.44140625, 46.318359375, 52.1953125, 58.072265625, 63.94921875, 69.826171875, 75.703125, 81.580078125, 87.45703125, 93.333984375, 99.2109375, 105.087890625, 110.96484375, 116.841796875, 122.71875, 128.595703125, 134.47265625, 140.349609375, 146.2265625, 152.103515625, 157.98046875, 163.857421875, 169.734375, 175.611328125, 181.48828125, 187.365234375, 193.2421875, 199.119140625, 204.99609375, 210.873046875, 216.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 1.0, 7.0, 3.0, 11.0, 14.0, 14.0, 18.0, 28.0, 40.0, 61.0, 101.0, 165.0, 233.0, 365.0, 694.0, 1556.0, 6632.0, 96878.0, 2968554.0, 62214.0, 5179.0, 1336.0, 615.0, 348.0, 211.0, 122.0, 101.0, 55.0, 45.0, 26.0, 23.0, 13.0, 7.0, 16.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-44.1875, -43.007080078125, -41.82666015625, -40.646240234375, -39.4658203125, -38.285400390625, -37.10498046875, -35.924560546875, -34.744140625, -33.563720703125, -32.38330078125, -31.202880859375, -30.0224609375, -28.842041015625, -27.66162109375, -26.481201171875, -25.30078125, -24.120361328125, -22.93994140625, -21.759521484375, -20.5791015625, -19.398681640625, -18.21826171875, -17.037841796875, -15.857421875, -14.677001953125, -13.49658203125, -12.316162109375, -11.1357421875, -9.955322265625, -8.77490234375, -7.594482421875, -6.4140625, -5.233642578125, -4.05322265625, -2.872802734375, -1.6923828125, -0.511962890625, 0.66845703125, 1.848876953125, 3.029296875, 4.209716796875, 5.39013671875, 6.570556640625, 7.7509765625, 8.931396484375, 10.11181640625, 11.292236328125, 12.47265625, 13.653076171875, 14.83349609375, 16.013916015625, 17.1943359375, 18.374755859375, 19.55517578125, 20.735595703125, 21.916015625, 23.096435546875, 24.27685546875, 25.457275390625, 26.6376953125, 27.818115234375, 28.99853515625, 30.178955078125, 31.359375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 9.0, 26.0, 77.0, 516.0, 321.0, 43.0, 17.0, 5.0, 3.0, 1.0], "bins": [-1193.829345703125, -1173.1912841796875, -1152.5533447265625, -1131.915283203125, -1111.2772216796875, -1090.6392822265625, -1070.001220703125, -1049.3631591796875, -1028.7252197265625, -1008.0872192382812, -987.4491577148438, -966.8111572265625, -946.1731567382812, -925.53515625, -904.8970947265625, -884.2590942382812, -863.6210327148438, -842.9830322265625, -822.344970703125, -801.7069702148438, -781.0689697265625, -760.430908203125, -739.7929077148438, -719.1549072265625, -698.516845703125, -677.8788452148438, -657.2407836914062, -636.602783203125, -615.9647827148438, -595.3267822265625, -574.688720703125, -554.0507202148438, -533.4127197265625, -512.7747192382812, -492.1366882324219, -471.4986572265625, -450.86065673828125, -430.2226257324219, -409.5845947265625, -388.94659423828125, -368.30859375, -347.6705627441406, -327.0325622558594, -306.39453125, -285.75653076171875, -265.1184997558594, -244.48046875, -223.8424530029297, -203.2044219970703, -182.56640625, -161.92837524414062, -141.2903594970703, -120.65234375, -100.01432800292969, -79.37630462646484, -58.73828125, -38.10026550292969, -17.46224594116211, 3.1757736206054688, 23.813793182373047, 44.451812744140625, 65.08982849121094, 85.72785186767578, 106.36587524414062, 127.00389099121094]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 3.0, 7.0, 9.0, 7.0, 4.0, 9.0, 17.0, 17.0, 16.0, 23.0, 12.0, 18.0, 25.0, 37.0, 35.0, 41.0, 37.0, 38.0, 40.0, 40.0, 37.0, 47.0, 42.0, 39.0, 46.0, 41.0, 43.0, 33.0, 31.0, 28.0, 20.0, 17.0, 20.0, 16.0, 19.0, 11.0, 12.0, 17.0, 7.0, 5.0, 8.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-120.850830078125, -117.04947662353516, -113.24813079833984, -109.44677734375, -105.64543151855469, -101.84407806396484, -98.04273223876953, -94.24137878417969, -90.44003295898438, -86.63867950439453, -82.83733367919922, -79.03598022460938, -75.23463439941406, -71.43328094482422, -67.6319351196289, -63.83058166503906, -60.029232025146484, -56.227882385253906, -52.42653274536133, -48.62518310546875, -44.82383346557617, -41.022483825683594, -37.22113037109375, -33.41978454589844, -29.618432998657227, -25.81708335876465, -22.01573371887207, -18.21438217163086, -14.413033485412598, -10.611682891845703, -6.810333251953125, -3.008983612060547, 0.7923660278320312, 4.593715667724609, 8.395065307617188, 12.196415901184082, 15.99776554107666, 19.799116134643555, 23.600465774536133, 27.40181541442871, 31.20316505432129, 35.0045166015625, 38.80586624145508, 42.607215881347656, 46.408565521240234, 50.20991516113281, 54.01126480102539, 57.81261444091797, 61.61396408081055, 65.41531372070312, 69.21666717529297, 73.01801300048828, 76.81936645507812, 80.62071228027344, 84.42206573486328, 88.2234115600586, 92.02476501464844, 95.82611846923828, 99.6274642944336, 103.42881774902344, 107.23016357421875, 111.0315170288086, 114.8328628540039, 118.63421630859375, 122.43556213378906]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 1.0, 7.0, 13.0, 15.0, 20.0, 28.0, 28.0, 39.0, 69.0, 86.0, 109.0, 140.0, 224.0, 294.0, 398.0, 516.0, 713.0, 988.0, 1040708.0, 1230.0, 687.0, 587.0, 456.0, 361.0, 215.0, 156.0, 134.0, 92.0, 52.0, 47.0, 31.0, 29.0, 15.0, 14.0, 10.0, 12.0, 6.0, 7.0, 9.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.9215087890625, -56.382286071777344, -54.84306335449219, -53.30384063720703, -51.764617919921875, -50.22539520263672, -48.68617248535156, -47.146949768066406, -45.60772705078125, -44.068504333496094, -42.52928161621094, -40.99005889892578, -39.450836181640625, -37.91161346435547, -36.37239074707031, -34.833168029785156, -33.2939453125, -31.754722595214844, -30.215499877929688, -28.67627716064453, -27.137054443359375, -25.59783172607422, -24.058609008789062, -22.519386291503906, -20.98016357421875, -19.440940856933594, -17.901718139648438, -16.36249542236328, -14.823272705078125, -13.284049987792969, -11.744827270507812, -10.205604553222656, -8.666385650634766, -7.127162933349609, -5.587940216064453, -4.048717498779297, -2.5094947814941406, -0.9702720642089844, 0.5689506530761719, 2.108173370361328, 3.6473960876464844, 5.186618804931641, 6.725841522216797, 8.265064239501953, 9.80428695678711, 11.343509674072266, 12.882732391357422, 14.421955108642578, 15.961177825927734, 17.50040054321289, 19.039623260498047, 20.578845977783203, 22.11806869506836, 23.657291412353516, 25.196514129638672, 26.735736846923828, 28.274959564208984, 29.81418228149414, 31.353404998779297, 32.89262771606445, 34.43185043334961, 35.971073150634766, 37.51029586791992, 39.04951858520508, 40.588741302490234]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 9.0, 14.0, 11.0, 16.0, 12.0, 28.0, 74.0, 388.0, 51462192.0, 215.0, 49.0, 33.0, 22.0, 15.0, 8.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 8.0, 2.0, 10.0, 5.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4534.5048828125, -4323.78173828125, -4113.05810546875, -3902.334716796875, -3691.611328125, -3480.88818359375, -3270.16455078125, -3059.44140625, -2848.7177734375, -2637.994384765625, -2427.27099609375, -2216.547607421875, -2005.82421875, -1795.1009521484375, -1584.3775634765625, -1373.6541748046875, -1162.930908203125, -952.20751953125, -741.484130859375, -530.7608032226562, -320.03741455078125, -109.3140869140625, 101.4093017578125, 312.1326904296875, 522.8560791015625, 733.5794677734375, 944.3028564453125, 1155.026123046875, 1365.74951171875, 1576.472900390625, 1787.1962890625, 1997.919677734375, 2208.64306640625, 2419.366455078125, 2630.08984375, 2840.813232421875, 3051.53662109375, 3262.259765625, 3472.9833984375, 3683.70654296875, 3894.43017578125, 4105.1533203125, 4315.876953125, 4526.60009765625, 4737.32373046875, 4948.046875, 5158.7705078125, 5369.49365234375, 5580.216796875, 5790.93994140625, 6001.66357421875, 6212.38671875, 6423.1103515625, 6633.83349609375, 6844.55712890625, 7055.2802734375, 7266.00390625, 7476.72705078125, 7687.45068359375, 7898.173828125, 8108.8974609375, 8319.62109375, 8530.34375, 8741.0673828125, 8951.791015625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [4.0, 4.0, 6.0, 20.0, 30.0, 31.0, 55.0, 74.0, 110.0, 159.0, 262.0, 386.0, 525.0, 805.0, 1245.0, 1814.0, 2868.0, 4271.0, 6573.0, 10099.0, 15530.0, 24492.0, 38382.0, 61380.0, 100692.0, 173551.0, 339870.0, 3450898.0, 1349936.0, 298772.0, 156733.0, 94264.0, 57992.0, 35608.0, 22687.0, 14332.0, 9309.0, 5918.0, 3896.0, 2582.0, 1662.0, 1169.0, 748.0, 541.0, 385.0, 242.0, 146.0, 113.0, 78.0, 53.0, 45.0, 32.0, 20.0, 19.0, 9.0, 5.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.578125, -6.342529296875, -6.10693359375, -5.871337890625, -5.6357421875, -5.400146484375, -5.16455078125, -4.928955078125, -4.693359375, -4.457763671875, -4.22216796875, -3.986572265625, -3.7509765625, -3.515380859375, -3.27978515625, -3.044189453125, -2.80859375, -2.572998046875, -2.33740234375, -2.101806640625, -1.8662109375, -1.630615234375, -1.39501953125, -1.159423828125, -0.923828125, -0.688232421875, -0.45263671875, -0.217041015625, 0.0185546875, 0.254150390625, 0.48974609375, 0.725341796875, 0.9609375, 1.196533203125, 1.43212890625, 1.667724609375, 1.9033203125, 2.138916015625, 2.37451171875, 2.610107421875, 2.845703125, 3.081298828125, 3.31689453125, 3.552490234375, 3.7880859375, 4.023681640625, 4.25927734375, 4.494873046875, 4.73046875, 4.966064453125, 5.20166015625, 5.437255859375, 5.6728515625, 5.908447265625, 6.14404296875, 6.379638671875, 6.615234375, 6.850830078125, 7.08642578125, 7.322021484375, 7.5576171875, 7.793212890625, 8.02880859375, 8.264404296875, 8.5]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 12.0, 15.0, 8.0, 15.0, 18.0, 14.0, 19.0, 23.0, 24.0, 34.0, 41.0, 35.0, 31.0, 33.0, 48.0, 54.0, 178.0, 657.0, 228.0, 92.0, 65.0, 44.0, 40.0, 23.0, 31.0, 21.0, 27.0, 30.0, 23.0, 25.0, 16.0, 20.0, 11.0, 12.0, 8.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.5823974609375, -16.102294921875, -15.6221923828125, -15.14208984375, -14.6619873046875, -14.181884765625, -13.7017822265625, -13.2216796875, -12.7415771484375, -12.261474609375, -11.7813720703125, -11.30126953125, -10.8211669921875, -10.341064453125, -9.8609619140625, -9.380859375, -8.9007568359375, -8.420654296875, -7.9405517578125, -7.46044921875, -6.9803466796875, -6.500244140625, -6.0201416015625, -5.5400390625, -5.0599365234375, -4.579833984375, -4.0997314453125, -3.61962890625, -3.1395263671875, -2.659423828125, -2.1793212890625, -1.69921875, -1.2191162109375, -0.739013671875, -0.2589111328125, 0.22119140625, 0.7012939453125, 1.181396484375, 1.6614990234375, 2.1416015625, 2.6217041015625, 3.101806640625, 3.5819091796875, 4.06201171875, 4.5421142578125, 5.022216796875, 5.5023193359375, 5.982421875, 6.4625244140625, 6.942626953125, 7.4227294921875, 7.90283203125, 8.3829345703125, 8.863037109375, 9.3431396484375, 9.8232421875, 10.3033447265625, 10.783447265625, 11.2635498046875, 11.74365234375, 12.2237548828125, 12.703857421875, 13.1839599609375, 13.6640625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 3.0, 6.0, 4.0, 12.0, 4.0, 10.0, 12.0, 13.0, 34.0, 57.0, 86.0, 141.0, 172.0, 212.0, 236.0, 394.0, 562.0, 858.0, 1256.0, 1606.0, 2352.0, 3289.0, 4835.0, 7128.0, 10619.0, 16593.0, 25300.0, 40584.0, 66717.0, 115908.0, 213765.0, 505599.0, 4049576.0, 650590.0, 244787.0, 128430.0, 73963.0, 44261.0, 27579.0, 17558.0, 11517.0, 7793.0, 5123.0, 3466.0, 2526.0, 1774.0, 1223.0, 791.0, 582.0, 466.0, 351.0, 248.0, 132.0, 109.0, 65.0, 52.0, 34.0, 26.0, 29.0, 12.0, 8.0, 2.0, 10.0], "bins": [-7.8515625, -7.61785888671875, -7.3841552734375, -7.15045166015625, -6.916748046875, -6.68304443359375, -6.4493408203125, -6.21563720703125, -5.98193359375, -5.74822998046875, -5.5145263671875, -5.28082275390625, -5.047119140625, -4.81341552734375, -4.5797119140625, -4.34600830078125, -4.1123046875, -3.87860107421875, -3.6448974609375, -3.41119384765625, -3.177490234375, -2.94378662109375, -2.7100830078125, -2.47637939453125, -2.24267578125, -2.00897216796875, -1.7752685546875, -1.54156494140625, -1.307861328125, -1.07415771484375, -0.8404541015625, -0.60675048828125, -0.373046875, -0.13934326171875, 0.0943603515625, 0.32806396484375, 0.561767578125, 0.79547119140625, 1.0291748046875, 1.26287841796875, 1.49658203125, 1.73028564453125, 1.9639892578125, 2.19769287109375, 2.431396484375, 2.66510009765625, 2.8988037109375, 3.13250732421875, 3.3662109375, 3.59991455078125, 3.8336181640625, 4.06732177734375, 4.301025390625, 4.53472900390625, 4.7684326171875, 5.00213623046875, 5.23583984375, 5.46954345703125, 5.7032470703125, 5.93695068359375, 6.170654296875, 6.40435791015625, 6.6380615234375, 6.87176513671875, 7.10546875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 12.0, 6.0, 6.0, 9.0, 8.0, 17.0, 16.0, 21.0, 29.0, 25.0, 26.0, 22.0, 34.0, 27.0, 50.0, 49.0, 48.0, 99.0, 273.0, 571.0, 149.0, 89.0, 65.0, 48.0, 36.0, 34.0, 39.0, 35.0, 26.0, 24.0, 20.0, 16.0, 13.0, 16.0, 13.0, 7.0, 6.0, 10.0, 6.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.859375, -9.521728515625, -9.18408203125, -8.846435546875, -8.5087890625, -8.171142578125, -7.83349609375, -7.495849609375, -7.158203125, -6.820556640625, -6.48291015625, -6.145263671875, -5.8076171875, -5.469970703125, -5.13232421875, -4.794677734375, -4.45703125, -4.119384765625, -3.78173828125, -3.444091796875, -3.1064453125, -2.768798828125, -2.43115234375, -2.093505859375, -1.755859375, -1.418212890625, -1.08056640625, -0.742919921875, -0.4052734375, -0.067626953125, 0.27001953125, 0.607666015625, 0.9453125, 1.282958984375, 1.62060546875, 1.958251953125, 2.2958984375, 2.633544921875, 2.97119140625, 3.308837890625, 3.646484375, 3.984130859375, 4.32177734375, 4.659423828125, 4.9970703125, 5.334716796875, 5.67236328125, 6.010009765625, 6.34765625, 6.685302734375, 7.02294921875, 7.360595703125, 7.6982421875, 8.035888671875, 8.37353515625, 8.711181640625, 9.048828125, 9.386474609375, 9.72412109375, 10.061767578125, 10.3994140625, 10.737060546875, 11.07470703125, 11.412353515625, 11.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 21.0, 21.0, 10.0, 9.0, 48.0, 44.0, 45.0, 56.0, 107.0, 175.0, 234.0, 299.0, 413.0, 670.0, 1000.0, 1567.0, 2691.0, 5304.0, 11459.0, 33924.0, 198611.0, 5942523.0, 58777.0, 17367.0, 6972.0, 3416.0, 1892.0, 1255.0, 764.0, 478.0, 355.0, 283.0, 184.0, 118.0, 94.0, 80.0, 27.0, 35.0, 26.0, 37.0, 21.0, 6.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-28.515625, -27.571533203125, -26.62744140625, -25.683349609375, -24.7392578125, -23.795166015625, -22.85107421875, -21.906982421875, -20.962890625, -20.018798828125, -19.07470703125, -18.130615234375, -17.1865234375, -16.242431640625, -15.29833984375, -14.354248046875, -13.41015625, -12.466064453125, -11.52197265625, -10.577880859375, -9.6337890625, -8.689697265625, -7.74560546875, -6.801513671875, -5.857421875, -4.913330078125, -3.96923828125, -3.025146484375, -2.0810546875, -1.136962890625, -0.19287109375, 0.751220703125, 1.6953125, 2.639404296875, 3.58349609375, 4.527587890625, 5.4716796875, 6.415771484375, 7.35986328125, 8.303955078125, 9.248046875, 10.192138671875, 11.13623046875, 12.080322265625, 13.0244140625, 13.968505859375, 14.91259765625, 15.856689453125, 16.80078125, 17.744873046875, 18.68896484375, 19.633056640625, 20.5771484375, 21.521240234375, 22.46533203125, 23.409423828125, 24.353515625, 25.297607421875, 26.24169921875, 27.185791015625, 28.1298828125, 29.073974609375, 30.01806640625, 30.962158203125, 31.90625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 8.0, 11.0, 18.0, 17.0, 16.0, 27.0, 28.0, 34.0, 27.0, 43.0, 44.0, 57.0, 67.0, 97.0, 256.0, 573.0, 196.0, 112.0, 68.0, 45.0, 47.0, 40.0, 35.0, 25.0, 23.0, 12.0, 20.0, 14.0, 8.0, 13.0, 7.0, 5.0, 2.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75, -7.455078125, -7.16015625, -6.865234375, -6.5703125, -6.275390625, -5.98046875, -5.685546875, -5.390625, -5.095703125, -4.80078125, -4.505859375, -4.2109375, -3.916015625, -3.62109375, -3.326171875, -3.03125, -2.736328125, -2.44140625, -2.146484375, -1.8515625, -1.556640625, -1.26171875, -0.966796875, -0.671875, -0.376953125, -0.08203125, 0.212890625, 0.5078125, 0.802734375, 1.09765625, 1.392578125, 1.6875, 1.982421875, 2.27734375, 2.572265625, 2.8671875, 3.162109375, 3.45703125, 3.751953125, 4.046875, 4.341796875, 4.63671875, 4.931640625, 5.2265625, 5.521484375, 5.81640625, 6.111328125, 6.40625, 6.701171875, 6.99609375, 7.291015625, 7.5859375, 7.880859375, 8.17578125, 8.470703125, 8.765625, 9.060546875, 9.35546875, 9.650390625, 9.9453125, 10.240234375, 10.53515625, 10.830078125, 11.125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 15.0, 35.0, 74.0, 175.0, 427.0, 129.0, 66.0, 27.0, 13.0, 10.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.213606834411621, -13.147137641906738, -12.080668449401855, -11.014199256896973, -9.94773006439209, -8.881260871887207, -7.814791679382324, -6.748322486877441, -5.681853294372559, -4.615384101867676, -3.548914909362793, -2.48244571685791, -1.4159765243530273, -0.34950733184814453, 0.7169618606567383, 1.783431053161621, 2.849900245666504, 3.9163694381713867, 4.9828386306762695, 6.049307823181152, 7.115777015686035, 8.182246208190918, 9.2487154006958, 10.315184593200684, 11.381653785705566, 12.44812297821045, 13.514592170715332, 14.581061363220215, 15.647530555725098, 16.714000701904297, 17.780467987060547, 18.846939086914062, 19.913406372070312, 20.979875564575195, 22.046344757080078, 23.11281394958496, 24.179283142089844, 25.245752334594727, 26.31222152709961, 27.378690719604492, 28.445159912109375, 29.511629104614258, 30.57809829711914, 31.644567489624023, 32.711036682128906, 33.777503967285156, 34.84397506713867, 35.91044616699219, 36.97691345214844, 38.04338073730469, 39.1098518371582, 40.17632293701172, 41.24279022216797, 42.30925750732422, 43.375728607177734, 44.44219970703125, 45.5086669921875, 46.57513427734375, 47.641605377197266, 48.70807647705078, 49.77454376220703, 50.84101104736328, 51.9074821472168, 52.97395324707031, 54.04042053222656]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 3.0, 4.0, 5.0, 9.0, 10.0, 17.0, 8.0, 16.0, 16.0, 13.0, 25.0, 26.0, 22.0, 26.0, 33.0, 46.0, 44.0, 45.0, 33.0, 38.0, 57.0, 44.0, 38.0, 39.0, 47.0, 41.0, 40.0, 34.0, 24.0, 26.0, 23.0, 16.0, 10.0, 20.0, 14.0, 13.0, 18.0, 9.0, 11.0, 12.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.54062271118164, -9.2019681930542, -8.863312721252441, -8.524658203125, -8.186002731323242, -7.847348213195801, -7.508693218231201, -7.170038223266602, -6.83138370513916, -6.4927287101745605, -6.154073715209961, -5.8154191970825195, -5.47676420211792, -5.13810920715332, -4.799454212188721, -4.460799217224121, -4.1221442222595215, -3.783489227294922, -3.4448344707489014, -3.1061794757843018, -2.7675247192382812, -2.4288697242736816, -2.090214729309082, -1.7515599727630615, -1.412904977798462, -1.0742501020431519, -0.735595166683197, -0.3969402313232422, -0.05828535556793213, 0.28036952018737793, 0.6190245151519775, 0.957679271697998, 1.2963342666625977, 1.6349891424179077, 1.9736440181732178, 2.3122990131378174, 2.650953769683838, 2.9896087646484375, 3.328263759613037, 3.6669185161590576, 4.005573272705078, 4.344228267669678, 4.682883262634277, 5.021537780761719, 5.360192775726318, 5.698847770690918, 6.037502765655518, 6.376157760620117, 6.714812755584717, 7.053467750549316, 7.392122745513916, 7.730777740478516, 8.069432258605957, 8.408086776733398, 8.746742248535156, 9.085396766662598, 9.424052238464355, 9.762706756591797, 10.101362228393555, 10.440016746520996, 10.778672218322754, 11.117326736450195, 11.455982208251953, 11.794636726379395, 12.133291244506836]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 3.0, 11.0, 10.0, 19.0, 15.0, 35.0, 38.0, 59.0, 74.0, 102.0, 169.0, 278.0, 437.0, 724.0, 1261.0, 2230.0, 5156.0, 13580.0, 90624.0, 4043310.0, 22822.0, 6586.0, 2840.0, 1456.0, 874.0, 485.0, 317.0, 234.0, 143.0, 106.0, 62.0, 63.0, 38.0, 23.0, 28.0, 17.0, 10.0, 8.0, 6.0, 7.0, 3.0, 1.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0323486328125, -0.03127861022949219, -0.030208587646484375, -0.029138565063476562, -0.02806854248046875, -0.026998519897460938, -0.025928497314453125, -0.024858474731445312, -0.0237884521484375, -0.022718429565429688, -0.021648406982421875, -0.020578384399414062, -0.01950836181640625, -0.018438339233398438, -0.017368316650390625, -0.016298294067382812, -0.015228271484375, -0.014158248901367188, -0.013088226318359375, -0.012018203735351562, -0.01094818115234375, -0.009878158569335938, -0.008808135986328125, -0.0077381134033203125, -0.0066680908203125, -0.0055980682373046875, -0.004528045654296875, -0.0034580230712890625, -0.00238800048828125, -0.0013179779052734375, -0.000247955322265625, 0.0008220672607421875, 0.00189208984375, 0.0029621124267578125, 0.004032135009765625, 0.0051021575927734375, 0.00617218017578125, 0.0072422027587890625, 0.008312225341796875, 0.009382247924804688, 0.0104522705078125, 0.011522293090820312, 0.012592315673828125, 0.013662338256835938, 0.01473236083984375, 0.015802383422851562, 0.016872406005859375, 0.017942428588867188, 0.019012451171875, 0.020082473754882812, 0.021152496337890625, 0.022222518920898438, 0.02329254150390625, 0.024362564086914062, 0.025432586669921875, 0.026502609252929688, 0.0275726318359375, 0.028642654418945312, 0.029712677001953125, 0.030782699584960938, 0.03185272216796875, 0.03292274475097656, 0.033992767333984375, 0.03506278991699219, 0.0361328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 12.0, 10.0, 10.0, 15.0, 11.0, 18.0, 26.0, 515.0, 279.0, 13.0, 15.0, 16.0, 6.0, 13.0, 3.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002681732177734375, -0.002581268548965454, -0.002480804920196533, -0.0023803412914276123, -0.0022798776626586914, -0.0021794140338897705, -0.0020789504051208496, -0.0019784867763519287, -0.0018780231475830078, -0.001777559518814087, -0.001677095890045166, -0.0015766322612762451, -0.0014761686325073242, -0.0013757050037384033, -0.0012752413749694824, -0.0011747777462005615, -0.0010743141174316406, -0.0009738504886627197, -0.0008733868598937988, -0.0007729232311248779, -0.000672459602355957, -0.0005719959735870361, -0.00047153234481811523, -0.00037106871604919434, -0.00027060508728027344, -0.00017014145851135254, -6.967782974243164e-05, 3.078579902648926e-05, 0.00013124942779541016, 0.00023171305656433105, 0.00033217668533325195, 0.00043264031410217285, 0.0005331039428710938, 0.0006335675716400146, 0.0007340312004089355, 0.0008344948291778564, 0.0009349584579467773, 0.0010354220867156982, 0.0011358857154846191, 0.00123634934425354, 0.001336812973022461, 0.0014372766017913818, 0.0015377402305603027, 0.0016382038593292236, 0.0017386674880981445, 0.0018391311168670654, 0.0019395947456359863, 0.0020400583744049072, 0.002140522003173828, 0.002240985631942749, 0.00234144926071167, 0.002441912889480591, 0.0025423765182495117, 0.0026428401470184326, 0.0027433037757873535, 0.0028437674045562744, 0.0029442310333251953, 0.003044694662094116, 0.003145158290863037, 0.003245621919631958, 0.003346085548400879, 0.0034465491771698, 0.0035470128059387207, 0.0036474764347076416, 0.0037479400634765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 11.0, 14.0, 24.0, 22.0, 42.0, 56.0, 98.0, 134.0, 197.0, 357.0, 707.0, 1463.0, 4111.0, 20093.0, 1641590.0, 2497982.0, 20228.0, 4026.0, 1432.0, 701.0, 364.0, 208.0, 149.0, 86.0, 66.0, 30.0, 31.0, 17.0, 13.0, 6.0, 10.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03752946853637695, -0.035965919494628906, -0.03440237045288086, -0.03283882141113281, -0.031275272369384766, -0.02971172332763672, -0.028148174285888672, -0.026584625244140625, -0.025021076202392578, -0.02345752716064453, -0.021893978118896484, -0.020330429077148438, -0.01876688003540039, -0.017203330993652344, -0.015639781951904297, -0.01407623291015625, -0.012512683868408203, -0.010949134826660156, -0.00938558578491211, -0.007822036743164062, -0.006258487701416016, -0.004694938659667969, -0.003131389617919922, -0.001567840576171875, -4.291534423828125e-06, 0.0015592575073242188, 0.0031228065490722656, 0.0046863555908203125, 0.006249904632568359, 0.007813453674316406, 0.009377002716064453, 0.0109405517578125, 0.012504100799560547, 0.014067649841308594, 0.01563119888305664, 0.017194747924804688, 0.018758296966552734, 0.02032184600830078, 0.021885395050048828, 0.023448944091796875, 0.025012493133544922, 0.02657604217529297, 0.028139591217041016, 0.029703140258789062, 0.03126668930053711, 0.032830238342285156, 0.0343937873840332, 0.03595733642578125, 0.0375208854675293, 0.039084434509277344, 0.04064798355102539, 0.04221153259277344, 0.043775081634521484, 0.04533863067626953, 0.04690217971801758, 0.048465728759765625, 0.05002927780151367, 0.05159282684326172, 0.053156375885009766, 0.05471992492675781, 0.05628347396850586, 0.057847023010253906, 0.05941057205200195, 0.06097412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 1.0, 8.0, 7.0, 8.0, 16.0, 18.0, 27.0, 31.0, 37.0, 41.0, 48.0, 89.0, 107.0, 171.0, 493.0, 1929.0, 404.0, 158.0, 124.0, 82.0, 59.0, 43.0, 34.0, 28.0, 27.0, 13.0, 20.0, 12.0, 10.0, 10.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00565338134765625, -0.0055024027824401855, -0.005351424217224121, -0.005200445652008057, -0.005049467086791992, -0.004898488521575928, -0.004747509956359863, -0.004596531391143799, -0.004445552825927734, -0.00429457426071167, -0.0041435956954956055, -0.003992617130279541, -0.0038416385650634766, -0.003690659999847412, -0.0035396814346313477, -0.003388702869415283, -0.0032377243041992188, -0.0030867457389831543, -0.00293576717376709, -0.0027847886085510254, -0.002633810043334961, -0.0024828314781188965, -0.002331852912902832, -0.0021808743476867676, -0.002029895782470703, -0.0018789172172546387, -0.0017279386520385742, -0.0015769600868225098, -0.0014259815216064453, -0.0012750029563903809, -0.0011240243911743164, -0.000973045825958252, -0.0008220672607421875, -0.000671088695526123, -0.0005201101303100586, -0.00036913156509399414, -0.0002181529998779297, -6.717443466186523e-05, 8.380413055419922e-05, 0.00023478269577026367, 0.0003857612609863281, 0.0005367398262023926, 0.000687718391418457, 0.0008386969566345215, 0.000989675521850586, 0.0011406540870666504, 0.0012916326522827148, 0.0014426112174987793, 0.0015935897827148438, 0.0017445683479309082, 0.0018955469131469727, 0.002046525478363037, 0.0021975040435791016, 0.002348482608795166, 0.0024994611740112305, 0.002650439739227295, 0.0028014183044433594, 0.002952396869659424, 0.0031033754348754883, 0.0032543540000915527, 0.003405332565307617, 0.0035563111305236816, 0.003707289695739746, 0.0038582682609558105, 0.004009246826171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 17.0, 40.0, 122.0, 346.0, 271.0, 109.0, 41.0, 10.0, 8.0, 8.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05224829167127609, -0.050494417548179626, -0.04874053969979286, -0.046986665576696396, -0.04523279145359993, -0.043478913605213165, -0.0417250394821167, -0.03997116535902023, -0.03821729123592377, -0.0364634171128273, -0.034709539264440536, -0.03295566514134407, -0.031201791018247604, -0.02944791503250599, -0.027694039046764374, -0.025940164923667908, -0.024186288937926292, -0.022432412952184677, -0.02067853882908821, -0.018924662843346596, -0.01717078872025013, -0.015416912734508514, -0.013663037680089474, -0.011909162625670433, -0.010155287571251392, -0.008401412516832352, -0.006647537462413311, -0.004893661942332983, -0.0031397868879139423, -0.0013859113678336143, 0.00036796368658542633, 0.002121838741004467, 0.0038757137954235077, 0.005629588849842548, 0.007383463904261589, 0.009137339890003204, 0.01089121401309967, 0.012645089998841286, 0.014398965053260326, 0.016152840107679367, 0.017906714230775833, 0.01966059021651745, 0.021414464339613914, 0.02316834032535553, 0.024922214448451996, 0.02667609043419361, 0.028429966419935226, 0.030183840543031693, 0.03193771839141846, 0.03369159251451492, 0.03544547036290169, 0.037199344485998154, 0.03895321860909462, 0.040707096457481384, 0.04246097058057785, 0.044214844703674316, 0.04596871882677078, 0.04772259294986725, 0.04947647079825401, 0.05123034492135048, 0.052984219044446945, 0.05473809689283371, 0.056491971015930176, 0.05824584513902664, 0.05999971926212311]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 2.0, 9.0, 11.0, 7.0, 10.0, 18.0, 26.0, 20.0, 37.0, 44.0, 47.0, 51.0, 56.0, 64.0, 63.0, 63.0, 62.0, 75.0, 41.0, 48.0, 48.0, 35.0, 35.0, 27.0, 28.0, 16.0, 16.0, 13.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016832709312438965, -0.01619180105626583, -0.015550892800092697, -0.014909984543919563, -0.01426907628774643, -0.013628168031573296, -0.012987259775400162, -0.012346351519227028, -0.011705443263053894, -0.01106453500688076, -0.010423626750707626, -0.009782718494534492, -0.009141810238361359, -0.008500901982188225, -0.007859993726015091, -0.007219085469841957, -0.006578177213668823, -0.005937268957495689, -0.0052963607013225555, -0.004655452445149422, -0.004014544188976288, -0.003373635932803154, -0.00273272767663002, -0.0020918194204568863, -0.0014509111642837524, -0.0008100029081106186, -0.00016909465193748474, 0.0004718136042356491, 0.001112721860408783, 0.0017536301165819168, 0.0023945383727550507, 0.0030354466289281845, 0.0036763548851013184, 0.004317263141274452, 0.004958171397447586, 0.00559907965362072, 0.006239987909793854, 0.006880896165966988, 0.0075218044221401215, 0.008162712678313255, 0.00880362093448639, 0.009444529190659523, 0.010085437446832657, 0.01072634570300579, 0.011367253959178925, 0.012008162215352058, 0.012649070471525192, 0.013289978727698326, 0.01393088698387146, 0.014571795240044594, 0.015212703496217728, 0.01585361175239086, 0.016494520008563995, 0.01713542826473713, 0.017776336520910263, 0.018417244777083397, 0.01905815303325653, 0.019699061289429665, 0.0203399695456028, 0.020980877801775932, 0.021621786057949066, 0.0222626943141222, 0.022903602570295334, 0.023544510826468468, 0.0241854190826416]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 4.0, 12.0, 5.0, 17.0, 21.0, 27.0, 40.0, 49.0, 75.0, 85.0, 143.0, 207.0, 291.0, 363.0, 578.0, 983.0, 1554.0, 2466.0, 4435.0, 9072.0, 21982.0, 721550.0, 245918.0, 19679.0, 8448.0, 4069.0, 2391.0, 1407.0, 868.0, 537.0, 357.0, 258.0, 171.0, 132.0, 105.0, 72.0, 56.0, 28.0, 30.0, 8.0, 20.0, 12.0, 13.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.035736083984375, -0.03461742401123047, -0.03349876403808594, -0.032380104064941406, -0.031261444091796875, -0.030142784118652344, -0.029024124145507812, -0.02790546417236328, -0.02678680419921875, -0.02566814422607422, -0.024549484252929688, -0.023430824279785156, -0.022312164306640625, -0.021193504333496094, -0.020074844360351562, -0.01895618438720703, -0.0178375244140625, -0.01671886444091797, -0.015600204467773438, -0.014481544494628906, -0.013362884521484375, -0.012244224548339844, -0.011125564575195312, -0.010006904602050781, -0.00888824462890625, -0.007769584655761719, -0.0066509246826171875, -0.005532264709472656, -0.004413604736328125, -0.0032949447631835938, -0.0021762847900390625, -0.0010576248168945312, 6.103515625e-05, 0.0011796951293945312, 0.0022983551025390625, 0.0034170150756835938, 0.004535675048828125, 0.005654335021972656, 0.0067729949951171875, 0.007891654968261719, 0.00901031494140625, 0.010128974914550781, 0.011247634887695312, 0.012366294860839844, 0.013484954833984375, 0.014603614807128906, 0.015722274780273438, 0.01684093475341797, 0.0179595947265625, 0.01907825469970703, 0.020196914672851562, 0.021315574645996094, 0.022434234619140625, 0.023552894592285156, 0.024671554565429688, 0.02579021453857422, 0.02690887451171875, 0.02802753448486328, 0.029146194458007812, 0.030264854431152344, 0.031383514404296875, 0.032502174377441406, 0.03362083435058594, 0.03473949432373047, 0.035858154296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 1.0, 5.0, 13.0, 11.0, 8.0, 13.0, 15.0, 24.0, 121.0, 538.0, 154.0, 18.0, 12.0, 11.0, 8.0, 6.0, 9.0, 8.0, 2.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025787353515625, -0.002480834722518921, -0.002382934093475342, -0.0022850334644317627, -0.0021871328353881836, -0.0020892322063446045, -0.0019913315773010254, -0.0018934309482574463, -0.0017955303192138672, -0.001697629690170288, -0.001599729061126709, -0.0015018284320831299, -0.0014039278030395508, -0.0013060271739959717, -0.0012081265449523926, -0.0011102259159088135, -0.0010123252868652344, -0.0009144246578216553, -0.0008165240287780762, -0.0007186233997344971, -0.000620722770690918, -0.0005228221416473389, -0.00042492151260375977, -0.00032702088356018066, -0.00022912025451660156, -0.00013121962547302246, -3.331899642944336e-05, 6.458163261413574e-05, 0.00016248226165771484, 0.00026038289070129395, 0.00035828351974487305, 0.00045618414878845215, 0.0005540847778320312, 0.0006519854068756104, 0.0007498860359191895, 0.0008477866649627686, 0.0009456872940063477, 0.0010435879230499268, 0.0011414885520935059, 0.001239389181137085, 0.001337289810180664, 0.0014351904392242432, 0.0015330910682678223, 0.0016309916973114014, 0.0017288923263549805, 0.0018267929553985596, 0.0019246935844421387, 0.0020225942134857178, 0.002120494842529297, 0.002218395471572876, 0.002316296100616455, 0.002414196729660034, 0.0025120973587036133, 0.0026099979877471924, 0.0027078986167907715, 0.0028057992458343506, 0.0029036998748779297, 0.003001600503921509, 0.003099501132965088, 0.003197401762008667, 0.003295302391052246, 0.003393203020095825, 0.0034911036491394043, 0.0035890042781829834, 0.0036869049072265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 11.0, 14.0, 18.0, 27.0, 34.0, 45.0, 63.0, 102.0, 117.0, 163.0, 222.0, 337.0, 512.0, 802.0, 1285.0, 2294.0, 4449.0, 10640.0, 46520.0, 839213.0, 112907.0, 15708.0, 5812.0, 2817.0, 1521.0, 946.0, 603.0, 395.0, 274.0, 173.0, 143.0, 105.0, 74.0, 54.0, 43.0, 18.0, 26.0, 8.0, 12.0, 8.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.041412353515625, -0.04001665115356445, -0.038620948791503906, -0.03722524642944336, -0.03582954406738281, -0.034433841705322266, -0.03303813934326172, -0.03164243698120117, -0.030246734619140625, -0.028851032257080078, -0.02745532989501953, -0.026059627532958984, -0.024663925170898438, -0.02326822280883789, -0.021872520446777344, -0.020476818084716797, -0.01908111572265625, -0.017685413360595703, -0.016289710998535156, -0.01489400863647461, -0.013498306274414062, -0.012102603912353516, -0.010706901550292969, -0.009311199188232422, -0.007915496826171875, -0.006519794464111328, -0.005124092102050781, -0.0037283897399902344, -0.0023326873779296875, -0.0009369850158691406, 0.00045871734619140625, 0.0018544197082519531, 0.0032501220703125, 0.004645824432373047, 0.006041526794433594, 0.007437229156494141, 0.008832931518554688, 0.010228633880615234, 0.011624336242675781, 0.013020038604736328, 0.014415740966796875, 0.015811443328857422, 0.01720714569091797, 0.018602848052978516, 0.019998550415039062, 0.02139425277709961, 0.022789955139160156, 0.024185657501220703, 0.02558135986328125, 0.026977062225341797, 0.028372764587402344, 0.02976846694946289, 0.031164169311523438, 0.032559871673583984, 0.03395557403564453, 0.03535127639770508, 0.036746978759765625, 0.03814268112182617, 0.03953838348388672, 0.040934085845947266, 0.04232978820800781, 0.04372549057006836, 0.045121192932128906, 0.04651689529418945, 0.04791259765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 3.0, 5.0, 12.0, 9.0, 9.0, 15.0, 20.0, 12.0, 25.0, 17.0, 20.0, 33.0, 31.0, 26.0, 38.0, 42.0, 31.0, 30.0, 46.0, 31.0, 45.0, 44.0, 37.0, 41.0, 41.0, 38.0, 41.0, 26.0, 32.0, 29.0, 22.0, 23.0, 26.0, 14.0, 17.0, 15.0, 5.0, 15.0, 7.0, 4.0, 5.0, 2.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009063720703125, -0.008743643760681152, -0.008423566818237305, -0.008103489875793457, -0.007783412933349609, -0.007463335990905762, -0.007143259048461914, -0.006823182106018066, -0.006503105163574219, -0.006183028221130371, -0.0058629512786865234, -0.005542874336242676, -0.005222797393798828, -0.0049027204513549805, -0.004582643508911133, -0.004262566566467285, -0.0039424896240234375, -0.00362241268157959, -0.003302335739135742, -0.0029822587966918945, -0.002662181854248047, -0.0023421049118041992, -0.0020220279693603516, -0.001701951026916504, -0.0013818740844726562, -0.0010617971420288086, -0.0007417201995849609, -0.0004216432571411133, -0.00010156631469726562, 0.00021851062774658203, 0.0005385875701904297, 0.0008586645126342773, 0.001178741455078125, 0.0014988183975219727, 0.0018188953399658203, 0.002138972282409668, 0.0024590492248535156, 0.0027791261672973633, 0.003099203109741211, 0.0034192800521850586, 0.0037393569946289062, 0.004059433937072754, 0.0043795108795166016, 0.004699587821960449, 0.005019664764404297, 0.0053397417068481445, 0.005659818649291992, 0.00597989559173584, 0.0062999725341796875, 0.006620049476623535, 0.006940126419067383, 0.0072602033615112305, 0.007580280303955078, 0.007900357246398926, 0.008220434188842773, 0.008540511131286621, 0.008860588073730469, 0.009180665016174316, 0.009500741958618164, 0.009820818901062012, 0.01014089584350586, 0.010460972785949707, 0.010781049728393555, 0.011101126670837402, 0.01142120361328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 0.0, 8.0, 9.0, 4.0, 12.0, 10.0, 11.0, 28.0, 37.0, 63.0, 77.0, 137.0, 169.0, 321.0, 616.0, 1485.0, 4722.0, 38534.0, 977956.0, 18394.0, 3396.0, 1182.0, 545.0, 281.0, 166.0, 110.0, 79.0, 50.0, 36.0, 30.0, 18.0, 14.0, 7.0, 7.0, 7.0, 3.0, 2.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0304412841796875, -0.029404878616333008, -0.028368473052978516, -0.027332067489624023, -0.02629566192626953, -0.02525925636291504, -0.024222850799560547, -0.023186445236206055, -0.022150039672851562, -0.02111363410949707, -0.020077228546142578, -0.019040822982788086, -0.018004417419433594, -0.0169680118560791, -0.01593160629272461, -0.014895200729370117, -0.013858795166015625, -0.012822389602661133, -0.01178598403930664, -0.010749578475952148, -0.009713172912597656, -0.008676767349243164, -0.007640361785888672, -0.00660395622253418, -0.0055675506591796875, -0.004531145095825195, -0.003494739532470703, -0.002458333969116211, -0.0014219284057617188, -0.00038552284240722656, 0.0006508827209472656, 0.0016872882843017578, 0.00272369384765625, 0.003760099411010742, 0.004796504974365234, 0.0058329105377197266, 0.006869316101074219, 0.007905721664428711, 0.008942127227783203, 0.009978532791137695, 0.011014938354492188, 0.01205134391784668, 0.013087749481201172, 0.014124155044555664, 0.015160560607910156, 0.01619696617126465, 0.01723337173461914, 0.018269777297973633, 0.019306182861328125, 0.020342588424682617, 0.02137899398803711, 0.0224153995513916, 0.023451805114746094, 0.024488210678100586, 0.025524616241455078, 0.02656102180480957, 0.027597427368164062, 0.028633832931518555, 0.029670238494873047, 0.03070664405822754, 0.03174304962158203, 0.03277945518493652, 0.033815860748291016, 0.03485226631164551, 0.035888671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 5.0, 8.0, 7.0, 8.0, 17.0, 16.0, 24.0, 20.0, 37.0, 54.0, 134.0, 151.0, 173.0, 119.0, 59.0, 48.0, 27.0, 21.0, 12.0, 17.0, 11.0, 7.0, 12.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2172927856445312e-05, -2.1434389054775238e-05, -2.0695850253105164e-05, -1.995731145143509e-05, -1.9218772649765015e-05, -1.848023384809494e-05, -1.7741695046424866e-05, -1.700315624475479e-05, -1.6264617443084717e-05, -1.5526078641414642e-05, -1.4787539839744568e-05, -1.4049001038074493e-05, -1.3310462236404419e-05, -1.2571923434734344e-05, -1.183338463306427e-05, -1.1094845831394196e-05, -1.0356307029724121e-05, -9.617768228054047e-06, -8.879229426383972e-06, -8.140690624713898e-06, -7.402151823043823e-06, -6.663613021373749e-06, -5.925074219703674e-06, -5.1865354180336e-06, -4.447996616363525e-06, -3.709457814693451e-06, -2.9709190130233765e-06, -2.232380211353302e-06, -1.4938414096832275e-06, -7.553026080131531e-07, -1.6763806343078613e-08, 7.217749953269958e-07, 1.4603137969970703e-06, 2.1988525986671448e-06, 2.9373914003372192e-06, 3.6759302020072937e-06, 4.414469003677368e-06, 5.153007805347443e-06, 5.891546607017517e-06, 6.6300854086875916e-06, 7.368624210357666e-06, 8.10716301202774e-06, 8.845701813697815e-06, 9.58424061536789e-06, 1.0322779417037964e-05, 1.1061318218708038e-05, 1.1799857020378113e-05, 1.2538395822048187e-05, 1.3276934623718262e-05, 1.4015473425388336e-05, 1.475401222705841e-05, 1.5492551028728485e-05, 1.623108983039856e-05, 1.6969628632068634e-05, 1.770816743373871e-05, 1.8446706235408783e-05, 1.9185245037078857e-05, 1.9923783838748932e-05, 2.0662322640419006e-05, 2.140086144208908e-05, 2.2139400243759155e-05, 2.287793904542923e-05, 2.3616477847099304e-05, 2.435501664876938e-05, 2.5093555450439453e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 14.0, 9.0, 18.0, 20.0, 21.0, 41.0, 58.0, 98.0, 121.0, 216.0, 421.0, 709.0, 1786.0, 5771.0, 98111.0, 928892.0, 8303.0, 1957.0, 911.0, 408.0, 223.0, 143.0, 90.0, 67.0, 37.0, 22.0, 17.0, 14.0, 12.0, 8.0, 7.0, 9.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.123046875, -0.11981773376464844, -0.11658859252929688, -0.11335945129394531, -0.11013031005859375, -0.10690116882324219, -0.10367202758789062, -0.10044288635253906, -0.0972137451171875, -0.09398460388183594, -0.09075546264648438, -0.08752632141113281, -0.08429718017578125, -0.08106803894042969, -0.07783889770507812, -0.07460975646972656, -0.071380615234375, -0.06815147399902344, -0.06492233276367188, -0.06169319152832031, -0.05846405029296875, -0.05523490905761719, -0.052005767822265625, -0.04877662658691406, -0.0455474853515625, -0.04231834411621094, -0.039089202880859375, -0.03586006164550781, -0.03263092041015625, -0.029401779174804688, -0.026172637939453125, -0.022943496704101562, -0.01971435546875, -0.016485214233398438, -0.013256072998046875, -0.010026931762695312, -0.00679779052734375, -0.0035686492919921875, -0.000339508056640625, 0.0028896331787109375, 0.0061187744140625, 0.009347915649414062, 0.012577056884765625, 0.015806198120117188, 0.01903533935546875, 0.022264480590820312, 0.025493621826171875, 0.028722763061523438, 0.031951904296875, 0.03518104553222656, 0.038410186767578125, 0.04163932800292969, 0.04486846923828125, 0.04809761047363281, 0.051326751708984375, 0.05455589294433594, 0.0577850341796875, 0.06101417541503906, 0.06424331665039062, 0.06747245788574219, 0.07070159912109375, 0.07393074035644531, 0.07715988159179688, 0.08038902282714844, 0.0836181640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 1.0, 7.0, 3.0, 6.0, 13.0, 14.0, 15.0, 23.0, 21.0, 23.0, 27.0, 174.0, 515.0, 48.0, 25.0, 12.0, 18.0, 17.0, 12.0, 4.0, 6.0, 7.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0262451171875, -0.02528095245361328, -0.024316787719726562, -0.023352622985839844, -0.022388458251953125, -0.021424293518066406, -0.020460128784179688, -0.01949596405029297, -0.01853179931640625, -0.01756763458251953, -0.016603469848632812, -0.015639305114746094, -0.014675140380859375, -0.013710975646972656, -0.012746810913085938, -0.011782646179199219, -0.0108184814453125, -0.009854316711425781, -0.008890151977539062, -0.007925987243652344, -0.006961822509765625, -0.005997657775878906, -0.0050334930419921875, -0.004069328308105469, -0.00310516357421875, -0.0021409988403320312, -0.0011768341064453125, -0.00021266937255859375, 0.000751495361328125, 0.0017156600952148438, 0.0026798248291015625, 0.0036439895629882812, 0.004608154296875, 0.005572319030761719, 0.0065364837646484375, 0.007500648498535156, 0.008464813232421875, 0.009428977966308594, 0.010393142700195312, 0.011357307434082031, 0.01232147216796875, 0.013285636901855469, 0.014249801635742188, 0.015213966369628906, 0.016178131103515625, 0.017142295837402344, 0.018106460571289062, 0.01907062530517578, 0.0200347900390625, 0.02099895477294922, 0.021963119506835938, 0.022927284240722656, 0.023891448974609375, 0.024855613708496094, 0.025819778442382812, 0.02678394317626953, 0.02774810791015625, 0.02871227264404297, 0.029676437377929688, 0.030640602111816406, 0.031604766845703125, 0.032568931579589844, 0.03353309631347656, 0.03449726104736328, 0.03546142578125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 12.0, 17.0, 84.0, 675.0, 132.0, 31.0, 12.0, 8.0, 4.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7512502670288086, -0.7306615114212036, -0.7100727558135986, -0.6894840002059937, -0.6688952445983887, -0.6483065485954285, -0.6277177929878235, -0.6071290373802185, -0.5865402817726135, -0.5659515261650085, -0.5453627705574036, -0.5247740149497986, -0.5041853189468384, -0.483596533536911, -0.4630078077316284, -0.44241905212402344, -0.42183029651641846, -0.4012415409088135, -0.3806527853012085, -0.3600640594959259, -0.3394753038883209, -0.31888654828071594, -0.29829782247543335, -0.27770906686782837, -0.2571203112602234, -0.2365315556526184, -0.21594281494617462, -0.19535407423973083, -0.17476531863212585, -0.15417656302452087, -0.1335878223180771, -0.1129990816116333, -0.09241032600402832, -0.07182157784700394, -0.05123282968997955, -0.03064408153295517, -0.010055333375930786, 0.010533414781093597, 0.03112216293811798, 0.05171090364456177, 0.07229965925216675, 0.09288840740919113, 0.11347715556621552, 0.1340658962726593, 0.15465465188026428, 0.17524340748786926, 0.19583214819431305, 0.21642088890075684, 0.23700964450836182, 0.2575984001159668, 0.2781871557235718, 0.29877588152885437, 0.31936463713645935, 0.33995339274406433, 0.3605421185493469, 0.3811308741569519, 0.4017196297645569, 0.42230838537216187, 0.44289714097976685, 0.46348586678504944, 0.4840746223926544, 0.504663348197937, 0.525252103805542, 0.545840859413147, 0.566429615020752]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 4.0, 2.0, 5.0, 5.0, 7.0, 11.0, 12.0, 26.0, 44.0, 64.0, 89.0, 114.0, 129.0, 148.0, 107.0, 79.0, 44.0, 30.0, 19.0, 15.0, 10.0, 11.0, 6.0, 3.0, 2.0, 3.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26447778940200806, -0.2566041648387909, -0.24873054027557373, -0.24085691571235657, -0.2329832911491394, -0.22510966658592224, -0.21723602712154388, -0.20936240255832672, -0.20148877799510956, -0.1936151534318924, -0.18574152886867523, -0.17786790430545807, -0.1699942648410797, -0.16212064027786255, -0.15424701571464539, -0.14637339115142822, -0.13849976658821106, -0.1306261420249939, -0.12275251746177673, -0.11487888544797897, -0.10700526088476181, -0.09913163632154465, -0.09125800430774689, -0.08338437974452972, -0.07551075518131256, -0.0676371306180954, -0.059763502329587936, -0.051889874041080475, -0.04401624947786331, -0.03614262491464615, -0.028268996626138687, -0.020395368337631226, -0.012521743774414062, -0.00464811734855175, 0.003225509077310562, 0.011099135503172874, 0.018972761929035187, 0.02684638649225235, 0.03472001478075981, 0.04259364306926727, 0.050467267632484436, 0.0583408921957016, 0.06621451675891876, 0.07408814877271652, 0.08196177333593369, 0.08983539789915085, 0.09770902991294861, 0.10558265447616577, 0.11345627903938293, 0.1213299036026001, 0.12920352816581726, 0.13707715272903442, 0.1449507772922516, 0.15282440185546875, 0.1606980413198471, 0.16857166588306427, 0.17644529044628143, 0.1843189150094986, 0.19219253957271576, 0.20006616413593292, 0.20793980360031128, 0.21581342816352844, 0.2236870527267456, 0.23156067728996277, 0.23943430185317993]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 8.0, 11.0, 9.0, 13.0, 10.0, 22.0, 29.0, 45.0, 77.0, 371.0, 14793.0, 4173785.0, 4588.0, 317.0, 70.0, 31.0, 24.0, 18.0, 10.0, 12.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.78125, -2.67578125, -2.5703125, -2.46484375, -2.359375, -2.25390625, -2.1484375, -2.04296875, -1.9375, -1.83203125, -1.7265625, -1.62109375, -1.515625, -1.41015625, -1.3046875, -1.19921875, -1.09375, -0.98828125, -0.8828125, -0.77734375, -0.671875, -0.56640625, -0.4609375, -0.35546875, -0.25, -0.14453125, -0.0390625, 0.06640625, 0.171875, 0.27734375, 0.3828125, 0.48828125, 0.59375, 0.69921875, 0.8046875, 0.91015625, 1.015625, 1.12109375, 1.2265625, 1.33203125, 1.4375, 1.54296875, 1.6484375, 1.75390625, 1.859375, 1.96484375, 2.0703125, 2.17578125, 2.28125, 2.38671875, 2.4921875, 2.59765625, 2.703125, 2.80859375, 2.9140625, 3.01953125, 3.125, 3.23046875, 3.3359375, 3.44140625, 3.546875, 3.65234375, 3.7578125, 3.86328125, 3.96875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 8.0, 4.0, 9.0, 8.0, 11.0, 18.0, 16.0, 29.0, 136.0, 382.0, 236.0, 47.0, 16.0, 14.0, 9.0, 5.0, 4.0, 8.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021495819091796875, -0.0020741522312164307, -0.001998722553253174, -0.001923292875289917, -0.0018478631973266602, -0.0017724335193634033, -0.0016970038414001465, -0.0016215741634368896, -0.0015461444854736328, -0.001470714807510376, -0.0013952851295471191, -0.0013198554515838623, -0.0012444257736206055, -0.0011689960956573486, -0.0010935664176940918, -0.001018136739730835, -0.0009427070617675781, -0.0008672773838043213, -0.0007918477058410645, -0.0007164180278778076, -0.0006409883499145508, -0.0005655586719512939, -0.0004901289939880371, -0.0004146993160247803, -0.00033926963806152344, -0.0002638399600982666, -0.00018841028213500977, -0.00011298060417175293, -3.7550926208496094e-05, 3.787875175476074e-05, 0.00011330842971801758, 0.00018873810768127441, 0.00026416778564453125, 0.0003395974636077881, 0.0004150271415710449, 0.0004904568195343018, 0.0005658864974975586, 0.0006413161754608154, 0.0007167458534240723, 0.0007921755313873291, 0.0008676052093505859, 0.0009430348873138428, 0.0010184645652770996, 0.0010938942432403564, 0.0011693239212036133, 0.0012447535991668701, 0.001320183277130127, 0.0013956129550933838, 0.0014710426330566406, 0.0015464723110198975, 0.0016219019889831543, 0.0016973316669464111, 0.001772761344909668, 0.0018481910228729248, 0.0019236207008361816, 0.0019990503787994385, 0.0020744800567626953, 0.002149909734725952, 0.002225339412689209, 0.002300769090652466, 0.0023761987686157227, 0.0024516284465789795, 0.0025270581245422363, 0.002602487802505493, 0.00267791748046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 12.0, 18.0, 15.0, 22.0, 38.0, 33.0, 58.0, 84.0, 115.0, 137.0, 241.0, 1165.0, 4171489.0, 19850.0, 352.0, 192.0, 110.0, 94.0, 56.0, 52.0, 39.0, 21.0, 30.0, 19.0, 7.0, 16.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.9306640625, -0.9066543579101562, -0.8826446533203125, -0.8586349487304688, -0.834625244140625, -0.8106155395507812, -0.7866058349609375, -0.7625961303710938, -0.73858642578125, -0.7145767211914062, -0.6905670166015625, -0.6665573120117188, -0.642547607421875, -0.6185379028320312, -0.5945281982421875, -0.5705184936523438, -0.5465087890625, -0.5224990844726562, -0.4984893798828125, -0.47447967529296875, -0.450469970703125, -0.42646026611328125, -0.4024505615234375, -0.37844085693359375, -0.35443115234375, -0.33042144775390625, -0.3064117431640625, -0.28240203857421875, -0.258392333984375, -0.23438262939453125, -0.2103729248046875, -0.18636322021484375, -0.162353515625, -0.13834381103515625, -0.1143341064453125, -0.09032440185546875, -0.066314697265625, -0.04230499267578125, -0.0182952880859375, 0.00571441650390625, 0.02972412109375, 0.05373382568359375, 0.0777435302734375, 0.10175323486328125, 0.125762939453125, 0.14977264404296875, 0.1737823486328125, 0.19779205322265625, 0.2218017578125, 0.24581146240234375, 0.2698211669921875, 0.29383087158203125, 0.317840576171875, 0.34185028076171875, 0.3658599853515625, 0.38986968994140625, 0.41387939453125, 0.43788909912109375, 0.4618988037109375, 0.48590850830078125, 0.509918212890625, 0.5339279174804688, 0.5579376220703125, 0.5819473266601562, 0.60595703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 16.0, 16.0, 28.0, 39.0, 43.0, 58.0, 89.0, 135.0, 185.0, 254.0, 352.0, 1475.0, 409.0, 257.0, 199.0, 135.0, 102.0, 76.0, 58.0, 32.0, 38.0, 26.0, 9.0, 13.0, 8.0, 1.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007480621337890625, -0.007281780242919922, -0.007082939147949219, -0.006884098052978516, -0.0066852569580078125, -0.006486415863037109, -0.006287574768066406, -0.006088733673095703, -0.005889892578125, -0.005691051483154297, -0.005492210388183594, -0.005293369293212891, -0.0050945281982421875, -0.004895687103271484, -0.004696846008300781, -0.004498004913330078, -0.004299163818359375, -0.004100322723388672, -0.0039014816284179688, -0.0037026405334472656, -0.0035037994384765625, -0.0033049583435058594, -0.0031061172485351562, -0.002907276153564453, -0.00270843505859375, -0.002509593963623047, -0.0023107528686523438, -0.0021119117736816406, -0.0019130706787109375, -0.0017142295837402344, -0.0015153884887695312, -0.0013165473937988281, -0.001117706298828125, -0.0009188652038574219, -0.0007200241088867188, -0.0005211830139160156, -0.0003223419189453125, -0.00012350082397460938, 7.534027099609375e-05, 0.0002741813659667969, 0.0004730224609375, 0.0006718635559082031, 0.0008707046508789062, 0.0010695457458496094, 0.0012683868408203125, 0.0014672279357910156, 0.0016660690307617188, 0.0018649101257324219, 0.002063751220703125, 0.002262592315673828, 0.0024614334106445312, 0.0026602745056152344, 0.0028591156005859375, 0.0030579566955566406, 0.0032567977905273438, 0.003455638885498047, 0.00365447998046875, 0.003853321075439453, 0.004052162170410156, 0.004251003265380859, 0.0044498443603515625, 0.004648685455322266, 0.004847526550292969, 0.005046367645263672, 0.005245208740234375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 15.0, 89.0, 802.0, 96.0, 2.0, 2.0, 2.0], "bins": [-0.7880571484565735, -0.7748634815216064, -0.7616698145866394, -0.7484761476516724, -0.7352824807167053, -0.7220888137817383, -0.7088951468467712, -0.6957014799118042, -0.6825078129768372, -0.6693141460418701, -0.6561204791069031, -0.642926812171936, -0.629733145236969, -0.616539478302002, -0.6033458113670349, -0.5901521444320679, -0.576958417892456, -0.563764750957489, -0.550571084022522, -0.5373774170875549, -0.5241837501525879, -0.5109900832176208, -0.4977964162826538, -0.48460274934768677, -0.4714090824127197, -0.4582154154777527, -0.44502174854278564, -0.4318280816078186, -0.41863441467285156, -0.4054407477378845, -0.3922470808029175, -0.37905341386795044, -0.3658597469329834, -0.35266607999801636, -0.3394724130630493, -0.3262787461280823, -0.31308507919311523, -0.2998914122581482, -0.28669774532318115, -0.2735040783882141, -0.26031041145324707, -0.24711674451828003, -0.233923077583313, -0.22072941064834595, -0.2075357437133789, -0.19434207677841187, -0.18114839494228363, -0.1679547280073166, -0.15476104617118835, -0.1415673792362213, -0.12837371230125427, -0.11518003791570663, -0.1019863709807396, -0.08879270404577255, -0.07559902966022491, -0.062405362725257874, -0.04921169951558113, -0.03601802885532379, -0.02282436192035675, -0.009630691260099411, 0.00356297567486763, 0.01675664260983467, 0.02995031699538231, 0.04314398393034935, 0.05633765086531639]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 5.0, 12.0, 16.0, 17.0, 19.0, 36.0, 37.0, 37.0, 46.0, 49.0, 60.0, 58.0, 55.0, 65.0, 64.0, 53.0, 56.0, 52.0, 39.0, 41.0, 43.0, 31.0, 21.0, 18.0, 13.0, 10.0, 12.0, 8.0, 5.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04609936475753784, -0.044866159558296204, -0.043632958084344864, -0.042399756610393524, -0.041166551411151886, -0.03993334621191025, -0.03870014473795891, -0.03746694326400757, -0.03623373806476593, -0.03500053286552429, -0.03376733139157295, -0.03253412991762161, -0.031300924718379974, -0.030067721381783485, -0.028834518045186996, -0.027601314708590508, -0.02636811137199402, -0.02513490803539753, -0.02390170469880104, -0.02266850136220455, -0.021435298025608063, -0.020202094689011574, -0.018968891352415085, -0.017735688015818596, -0.016502484679222107, -0.015269281342625618, -0.014036078006029129, -0.01280287466943264, -0.011569671332836151, -0.010336467996239662, -0.009103264659643173, -0.007870061323046684, -0.006636857986450195, -0.005403654649853706, -0.004170451313257217, -0.0029372479766607285, -0.0017040446400642395, -0.00047084130346775055, 0.0007623620331287384, 0.0019955653697252274, 0.0032287687063217163, 0.004461972042918205, 0.005695175379514694, 0.006928378716111183, 0.008161582052707672, 0.009394785389304161, 0.01062798872590065, 0.011861192062497139, 0.013094395399093628, 0.014327598735690117, 0.015560802072286606, 0.016794005408883095, 0.018027208745479584, 0.019260412082076073, 0.02049361541867256, 0.02172681875526905, 0.02296002209186554, 0.02419322542846203, 0.025426428765058517, 0.026659632101655006, 0.027892835438251495, 0.029126038774847984, 0.030359242111444473, 0.03159244358539581, 0.03282564878463745]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 9.0, 4.0, 13.0, 13.0, 25.0, 24.0, 30.0, 36.0, 66.0, 76.0, 91.0, 138.0, 245.0, 282.0, 375.0, 650.0, 898.0, 1364.0, 1956.0, 2907.0, 4817.0, 7821.0, 14824.0, 43110.0, 775639.0, 142145.0, 22821.0, 10651.0, 6056.0, 3811.0, 2417.0, 1660.0, 1090.0, 752.0, 483.0, 346.0, 244.0, 171.0, 140.0, 96.0, 60.0, 51.0, 41.0, 26.0, 28.0, 20.0, 8.0, 5.0, 3.0, 11.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.033935546875, -0.03289937973022461, -0.03186321258544922, -0.030827045440673828, -0.029790878295898438, -0.028754711151123047, -0.027718544006347656, -0.026682376861572266, -0.025646209716796875, -0.024610042572021484, -0.023573875427246094, -0.022537708282470703, -0.021501541137695312, -0.020465373992919922, -0.01942920684814453, -0.01839303970336914, -0.01735687255859375, -0.01632070541381836, -0.015284538269042969, -0.014248371124267578, -0.013212203979492188, -0.012176036834716797, -0.011139869689941406, -0.010103702545166016, -0.009067535400390625, -0.008031368255615234, -0.006995201110839844, -0.005959033966064453, -0.0049228668212890625, -0.003886699676513672, -0.0028505325317382812, -0.0018143653869628906, -0.0007781982421875, 0.0002579689025878906, 0.0012941360473632812, 0.002330303192138672, 0.0033664703369140625, 0.004402637481689453, 0.005438804626464844, 0.006474971771240234, 0.007511138916015625, 0.008547306060791016, 0.009583473205566406, 0.010619640350341797, 0.011655807495117188, 0.012691974639892578, 0.013728141784667969, 0.01476430892944336, 0.01580047607421875, 0.01683664321899414, 0.01787281036376953, 0.018908977508544922, 0.019945144653320312, 0.020981311798095703, 0.022017478942871094, 0.023053646087646484, 0.024089813232421875, 0.025125980377197266, 0.026162147521972656, 0.027198314666748047, 0.028234481811523438, 0.029270648956298828, 0.03030681610107422, 0.03134298324584961, 0.032379150390625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 5.0, 5.0, 5.0, 12.0, 3.0, 11.0, 12.0, 35.0, 120.0, 223.0, 257.0, 151.0, 54.0, 17.0, 11.0, 7.0, 6.0, 5.0, 5.0, 6.0, 7.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00167083740234375, -0.0016111135482788086, -0.0015513896942138672, -0.0014916658401489258, -0.0014319419860839844, -0.001372218132019043, -0.0013124942779541016, -0.0012527704238891602, -0.0011930465698242188, -0.0011333227157592773, -0.001073598861694336, -0.0010138750076293945, -0.0009541511535644531, -0.0008944272994995117, -0.0008347034454345703, -0.0007749795913696289, -0.0007152557373046875, -0.0006555318832397461, -0.0005958080291748047, -0.0005360841751098633, -0.0004763603210449219, -0.00041663646697998047, -0.00035691261291503906, -0.00029718875885009766, -0.00023746490478515625, -0.00017774105072021484, -0.00011801719665527344, -5.829334259033203e-05, 1.430511474609375e-06, 6.115436553955078e-05, 0.00012087821960449219, 0.0001806020736694336, 0.000240325927734375, 0.0003000497817993164, 0.0003597736358642578, 0.0004194974899291992, 0.0004792213439941406, 0.000538945198059082, 0.0005986690521240234, 0.0006583929061889648, 0.0007181167602539062, 0.0007778406143188477, 0.0008375644683837891, 0.0008972883224487305, 0.0009570121765136719, 0.0010167360305786133, 0.0010764598846435547, 0.001136183738708496, 0.0011959075927734375, 0.001255631446838379, 0.0013153553009033203, 0.0013750791549682617, 0.0014348030090332031, 0.0014945268630981445, 0.001554250717163086, 0.0016139745712280273, 0.0016736984252929688, 0.0017334222793579102, 0.0017931461334228516, 0.001852869987487793, 0.0019125938415527344, 0.0019723176956176758, 0.002032041549682617, 0.0020917654037475586, 0.0021514892578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 6.0, 3.0, 6.0, 6.0, 10.0, 11.0, 13.0, 11.0, 16.0, 33.0, 21.0, 28.0, 25.0, 46.0, 48.0, 40.0, 121.0, 409.0, 3244.0, 184173.0, 853906.0, 5377.0, 547.0, 110.0, 54.0, 48.0, 24.0, 31.0, 34.0, 27.0, 23.0, 18.0, 14.0, 18.0, 8.0, 7.0, 9.0, 7.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.114013671875, -0.1108551025390625, -0.107696533203125, -0.1045379638671875, -0.10137939453125, -0.0982208251953125, -0.095062255859375, -0.0919036865234375, -0.0887451171875, -0.0855865478515625, -0.082427978515625, -0.0792694091796875, -0.07611083984375, -0.0729522705078125, -0.069793701171875, -0.0666351318359375, -0.0634765625, -0.0603179931640625, -0.057159423828125, -0.0540008544921875, -0.05084228515625, -0.0476837158203125, -0.044525146484375, -0.0413665771484375, -0.0382080078125, -0.0350494384765625, -0.031890869140625, -0.0287322998046875, -0.02557373046875, -0.0224151611328125, -0.019256591796875, -0.0160980224609375, -0.012939453125, -0.0097808837890625, -0.006622314453125, -0.0034637451171875, -0.00030517578125, 0.0028533935546875, 0.006011962890625, 0.0091705322265625, 0.0123291015625, 0.0154876708984375, 0.018646240234375, 0.0218048095703125, 0.02496337890625, 0.0281219482421875, 0.031280517578125, 0.0344390869140625, 0.03759765625, 0.0407562255859375, 0.043914794921875, 0.0470733642578125, 0.05023193359375, 0.0533905029296875, 0.056549072265625, 0.0597076416015625, 0.0628662109375, 0.0660247802734375, 0.069183349609375, 0.0723419189453125, 0.07550048828125, 0.0786590576171875, 0.081817626953125, 0.0849761962890625, 0.088134765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 8.0, 8.0, 8.0, 15.0, 12.0, 13.0, 16.0, 18.0, 29.0, 27.0, 32.0, 37.0, 37.0, 40.0, 53.0, 49.0, 34.0, 55.0, 42.0, 44.0, 47.0, 50.0, 44.0, 36.0, 27.0, 40.0, 35.0, 24.0, 25.0, 14.0, 21.0, 11.0, 10.0, 7.0, 3.0, 7.0, 5.0, 8.0, 2.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00597381591796875, -0.005772113800048828, -0.005570411682128906, -0.005368709564208984, -0.0051670074462890625, -0.004965305328369141, -0.004763603210449219, -0.004561901092529297, -0.004360198974609375, -0.004158496856689453, -0.003956794738769531, -0.0037550926208496094, -0.0035533905029296875, -0.0033516883850097656, -0.0031499862670898438, -0.002948284149169922, -0.00274658203125, -0.002544879913330078, -0.0023431777954101562, -0.0021414756774902344, -0.0019397735595703125, -0.0017380714416503906, -0.0015363693237304688, -0.0013346672058105469, -0.001132965087890625, -0.0009312629699707031, -0.0007295608520507812, -0.0005278587341308594, -0.0003261566162109375, -0.00012445449829101562, 7.724761962890625e-05, 0.0002789497375488281, 0.00048065185546875, 0.0006823539733886719, 0.0008840560913085938, 0.0010857582092285156, 0.0012874603271484375, 0.0014891624450683594, 0.0016908645629882812, 0.0018925666809082031, 0.002094268798828125, 0.002295970916748047, 0.0024976730346679688, 0.0026993751525878906, 0.0029010772705078125, 0.0031027793884277344, 0.0033044815063476562, 0.003506183624267578, 0.0037078857421875, 0.003909587860107422, 0.004111289978027344, 0.004312992095947266, 0.0045146942138671875, 0.004716396331787109, 0.004918098449707031, 0.005119800567626953, 0.005321502685546875, 0.005523204803466797, 0.005724906921386719, 0.005926609039306641, 0.0061283111572265625, 0.006330013275146484, 0.006531715393066406, 0.006733417510986328, 0.00693511962890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 6.0, 18.0, 43.0, 67.0, 120.0, 1720.0, 1045040.0, 1283.0, 126.0, 62.0, 32.0, 14.0, 9.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.17992448806762695, -0.1761331558227539, -0.17234182357788086, -0.1685504913330078, -0.16475915908813477, -0.16096782684326172, -0.15717649459838867, -0.15338516235351562, -0.14959383010864258, -0.14580249786376953, -0.14201116561889648, -0.13821983337402344, -0.1344285011291504, -0.13063716888427734, -0.1268458366394043, -0.12305450439453125, -0.1192631721496582, -0.11547183990478516, -0.11168050765991211, -0.10788917541503906, -0.10409784317016602, -0.10030651092529297, -0.09651517868041992, -0.09272384643554688, -0.08893251419067383, -0.08514118194580078, -0.08134984970092773, -0.07755851745605469, -0.07376718521118164, -0.0699758529663086, -0.06618452072143555, -0.0623931884765625, -0.05860185623168945, -0.054810523986816406, -0.05101919174194336, -0.04722785949707031, -0.043436527252197266, -0.03964519500732422, -0.03585386276245117, -0.032062530517578125, -0.028271198272705078, -0.02447986602783203, -0.020688533782958984, -0.016897201538085938, -0.01310586929321289, -0.009314537048339844, -0.005523204803466797, -0.00173187255859375, 0.002059459686279297, 0.005850791931152344, 0.00964212417602539, 0.013433456420898438, 0.017224788665771484, 0.02101612091064453, 0.024807453155517578, 0.028598785400390625, 0.03239011764526367, 0.03618144989013672, 0.039972782135009766, 0.04376411437988281, 0.04755544662475586, 0.051346778869628906, 0.05513811111450195, 0.058929443359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 9.0, 3.0, 5.0, 7.0, 9.0, 8.0, 17.0, 20.0, 32.0, 24.0, 76.0, 257.0, 272.0, 99.0, 49.0, 28.0, 24.0, 14.0, 16.0, 5.0, 4.0, 9.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013518333435058594, -0.00013109296560287476, -0.00012700259685516357, -0.0001229122281074524, -0.00011882185935974121, -0.00011473149061203003, -0.00011064112186431885, -0.00010655075311660767, -0.00010246038436889648, -9.83700156211853e-05, -9.427964687347412e-05, -9.018927812576294e-05, -8.609890937805176e-05, -8.200854063034058e-05, -7.79181718826294e-05, -7.382780313491821e-05, -6.973743438720703e-05, -6.564706563949585e-05, -6.155669689178467e-05, -5.7466328144073486e-05, -5.3375959396362305e-05, -4.928559064865112e-05, -4.519522190093994e-05, -4.110485315322876e-05, -3.701448440551758e-05, -3.2924115657806396e-05, -2.8833746910095215e-05, -2.4743378162384033e-05, -2.065300941467285e-05, -1.656264066696167e-05, -1.2472271919250488e-05, -8.381903171539307e-06, -4.291534423828125e-06, -2.0116567611694336e-07, 3.889203071594238e-06, 7.97957181930542e-06, 1.2069940567016602e-05, 1.6160309314727783e-05, 2.0250678062438965e-05, 2.4341046810150146e-05, 2.8431415557861328e-05, 3.252178430557251e-05, 3.661215305328369e-05, 4.070252180099487e-05, 4.4792890548706055e-05, 4.8883259296417236e-05, 5.297362804412842e-05, 5.70639967918396e-05, 6.115436553955078e-05, 6.524473428726196e-05, 6.933510303497314e-05, 7.342547178268433e-05, 7.751584053039551e-05, 8.160620927810669e-05, 8.569657802581787e-05, 8.978694677352905e-05, 9.387731552124023e-05, 9.796768426895142e-05, 0.0001020580530166626, 0.00010614842176437378, 0.00011023879051208496, 0.00011432915925979614, 0.00011841952800750732, 0.0001225098967552185, 0.0001266002655029297]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 16.0, 9.0, 9.0, 12.0, 29.0, 61.0, 117.0, 273.0, 949.0, 7300.0, 931858.0, 103287.0, 3502.0, 688.0, 191.0, 86.0, 41.0, 34.0, 21.0, 19.0, 17.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043548583984375, -0.04213714599609375, -0.0407257080078125, -0.03931427001953125, -0.03790283203125, -0.03649139404296875, -0.0350799560546875, -0.03366851806640625, -0.032257080078125, -0.03084564208984375, -0.0294342041015625, -0.02802276611328125, -0.026611328125, -0.02519989013671875, -0.0237884521484375, -0.02237701416015625, -0.020965576171875, -0.01955413818359375, -0.0181427001953125, -0.01673126220703125, -0.01531982421875, -0.01390838623046875, -0.0124969482421875, -0.01108551025390625, -0.009674072265625, -0.00826263427734375, -0.0068511962890625, -0.00543975830078125, -0.0040283203125, -0.00261688232421875, -0.0012054443359375, 0.00020599365234375, 0.001617431640625, 0.00302886962890625, 0.0044403076171875, 0.00585174560546875, 0.00726318359375, 0.00867462158203125, 0.0100860595703125, 0.01149749755859375, 0.012908935546875, 0.01432037353515625, 0.0157318115234375, 0.01714324951171875, 0.0185546875, 0.01996612548828125, 0.0213775634765625, 0.02278900146484375, 0.024200439453125, 0.02561187744140625, 0.0270233154296875, 0.02843475341796875, 0.02984619140625, 0.03125762939453125, 0.0326690673828125, 0.03408050537109375, 0.035491943359375, 0.03690338134765625, 0.0383148193359375, 0.03972625732421875, 0.0411376953125, 0.04254913330078125, 0.0439605712890625, 0.04537200927734375, 0.046783447265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 2.0, 2.0, 8.0, 6.0, 9.0, 29.0, 33.0, 41.0, 70.0, 181.0, 360.0, 99.0, 35.0, 40.0, 29.0, 14.0, 13.0, 12.0, 7.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01091766357421875, -0.010517358779907227, -0.010117053985595703, -0.00971674919128418, -0.009316444396972656, -0.008916139602661133, -0.00851583480834961, -0.008115530014038086, -0.0077152252197265625, -0.007314920425415039, -0.006914615631103516, -0.006514310836791992, -0.006114006042480469, -0.005713701248168945, -0.005313396453857422, -0.0049130916595458984, -0.004512786865234375, -0.0041124820709228516, -0.003712177276611328, -0.0033118724822998047, -0.0029115676879882812, -0.002511262893676758, -0.0021109580993652344, -0.001710653305053711, -0.0013103485107421875, -0.0009100437164306641, -0.0005097389221191406, -0.00010943412780761719, 0.00029087066650390625, 0.0006911754608154297, 0.0010914802551269531, 0.0014917850494384766, 0.00189208984375, 0.0022923946380615234, 0.002692699432373047, 0.0030930042266845703, 0.0034933090209960938, 0.003893613815307617, 0.004293918609619141, 0.004694223403930664, 0.0050945281982421875, 0.005494832992553711, 0.005895137786865234, 0.006295442581176758, 0.006695747375488281, 0.007096052169799805, 0.007496356964111328, 0.007896661758422852, 0.008296966552734375, 0.008697271347045898, 0.009097576141357422, 0.009497880935668945, 0.009898185729980469, 0.010298490524291992, 0.010698795318603516, 0.011099100112915039, 0.011499404907226562, 0.011899709701538086, 0.01230001449584961, 0.012700319290161133, 0.013100624084472656, 0.01350092887878418, 0.013901233673095703, 0.014301538467407227, 0.01470184326171875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 5.0, 9.0, 11.0, 32.0, 75.0, 338.0, 334.0, 97.0, 36.0, 15.0, 8.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10782767832279205, -0.10367798805236816, -0.09952829033136368, -0.09537859261035919, -0.0912289023399353, -0.08707921206951141, -0.08292951434850693, -0.07877981662750244, -0.07463012635707855, -0.07048043608665466, -0.06633073836565018, -0.06218104436993599, -0.0580313503742218, -0.053881656378507614, -0.049731962382793427, -0.04558226838707924, -0.04143257439136505, -0.037282880395650864, -0.033133186399936676, -0.02898349240422249, -0.0248337984085083, -0.020684104412794113, -0.016534410417079926, -0.012384716421365738, -0.00823502242565155, -0.004085328429937363, 6.436556577682495e-05, 0.004214059561491013, 0.0083637535572052, 0.012513447552919388, 0.016663141548633575, 0.020812835544347763, 0.02496252954006195, 0.02911222353577614, 0.033261917531490326, 0.037411611527204514, 0.0415613055229187, 0.04571099951863289, 0.049860693514347076, 0.054010387510061264, 0.05816008150577545, 0.06230977550148964, 0.06645946949720383, 0.07060916721820831, 0.0747588574886322, 0.07890854775905609, 0.08305824548006058, 0.08720794320106506, 0.09135763347148895, 0.09550732374191284, 0.09965702146291733, 0.10380671918392181, 0.1079564094543457, 0.11210609972476959, 0.11625579744577408, 0.12040549516677856, 0.12455518543720245, 0.12870487570762634, 0.13285458087921143, 0.13700427114963531, 0.1411539614200592, 0.1453036516904831, 0.14945334196090698, 0.15360304713249207, 0.15775273740291595]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 4.0, 4.0, 4.0, 5.0, 7.0, 6.0, 11.0, 22.0, 31.0, 39.0, 41.0, 52.0, 66.0, 88.0, 86.0, 78.0, 75.0, 94.0, 75.0, 48.0, 43.0, 34.0, 20.0, 18.0, 5.0, 6.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.07622992992401123, -0.0742097720503807, -0.07218962162733078, -0.07016946375370026, -0.06814931333065033, -0.0661291554570198, -0.06410899758338928, -0.06208884343504906, -0.06006868928670883, -0.05804853513836861, -0.05602838099002838, -0.05400822311639786, -0.05198806896805763, -0.04996791481971741, -0.047947756946086884, -0.04592760279774666, -0.04390744864940643, -0.04188729450106621, -0.03986714035272598, -0.03784698247909546, -0.035826828330755234, -0.03380667418241501, -0.031786516308784485, -0.02976636216044426, -0.027746208012104034, -0.02572605386376381, -0.023705897852778435, -0.02168574184179306, -0.019665587693452835, -0.01764543354511261, -0.015625277534127235, -0.013605122454464436, -0.011584967374801636, -0.009564812295138836, -0.007544657215476036, -0.005524502135813236, -0.0035043470561504364, -0.0014841919764876366, 0.0005359631031751633, 0.002556118182837963, 0.004576273262500763, 0.006596428342163563, 0.008616583421826363, 0.010636738501489162, 0.012656893581151962, 0.014677048660814762, 0.016697203740477562, 0.018717359751462936, 0.02073751389980316, 0.022757668048143387, 0.02477782405912876, 0.026797980070114136, 0.02881813421845436, 0.030838288366794586, 0.03285844624042511, 0.034878600388765335, 0.03689875453710556, 0.038918908685445786, 0.04093906283378601, 0.042959220707416534, 0.04497937485575676, 0.046999529004096985, 0.04901968687772751, 0.051039841026067734, 0.05305999517440796]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 2.0, 2.0, 8.0, 14.0, 8.0, 16.0, 12.0, 14.0, 36.0, 28.0, 44.0, 122.0, 4161392.0, 32198.0, 186.0, 35.0, 29.0, 14.0, 18.0, 10.0, 10.0, 22.0, 6.0, 8.0, 2.0, 4.0, 2.0, 6.0, 2.0, 6.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8134765625, -1.7408599853515625, -1.668243408203125, -1.5956268310546875, -1.52301025390625, -1.4503936767578125, -1.377777099609375, -1.3051605224609375, -1.2325439453125, -1.1599273681640625, -1.087310791015625, -1.0146942138671875, -0.94207763671875, -0.8694610595703125, -0.796844482421875, -0.7242279052734375, -0.651611328125, -0.5789947509765625, -0.506378173828125, -0.4337615966796875, -0.36114501953125, -0.2885284423828125, -0.215911865234375, -0.1432952880859375, -0.0706787109375, 0.0019378662109375, 0.074554443359375, 0.1471710205078125, 0.21978759765625, 0.2924041748046875, 0.365020751953125, 0.4376373291015625, 0.51025390625, 0.5828704833984375, 0.655487060546875, 0.7281036376953125, 0.80072021484375, 0.8733367919921875, 0.945953369140625, 1.0185699462890625, 1.0911865234375, 1.1638031005859375, 1.236419677734375, 1.3090362548828125, 1.38165283203125, 1.4542694091796875, 1.526885986328125, 1.5995025634765625, 1.672119140625, 1.7447357177734375, 1.817352294921875, 1.8899688720703125, 1.96258544921875, 2.0352020263671875, 2.107818603515625, 2.1804351806640625, 2.2530517578125, 2.3256683349609375, 2.398284912109375, 2.4709014892578125, 2.54351806640625, 2.6161346435546875, 2.688751220703125, 2.7613677978515625, 2.833984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 6.0, 4.0, 4.0, 8.0, 5.0, 9.0, 8.0, 11.0, 10.0, 13.0, 31.0, 89.0, 176.0, 231.0, 183.0, 100.0, 37.0, 20.0, 11.0, 8.0, 6.0, 5.0, 6.0, 2.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0020046234130859375, -0.001942664384841919, -0.0018807053565979004, -0.0018187463283538818, -0.0017567873001098633, -0.0016948282718658447, -0.0016328692436218262, -0.0015709102153778076, -0.001508951187133789, -0.0014469921588897705, -0.001385033130645752, -0.0013230741024017334, -0.0012611150741577148, -0.0011991560459136963, -0.0011371970176696777, -0.0010752379894256592, -0.0010132789611816406, -0.0009513199329376221, -0.0008893609046936035, -0.000827401876449585, -0.0007654428482055664, -0.0007034838199615479, -0.0006415247917175293, -0.0005795657634735107, -0.0005176067352294922, -0.00045564770698547363, -0.0003936886787414551, -0.0003317296504974365, -0.00026977062225341797, -0.00020781159400939941, -0.00014585256576538086, -8.38935375213623e-05, -2.193450927734375e-05, 4.0024518966674805e-05, 0.00010198354721069336, 0.00016394257545471191, 0.00022590160369873047, 0.000287860631942749, 0.0003498196601867676, 0.00041177868843078613, 0.0004737377166748047, 0.0005356967449188232, 0.0005976557731628418, 0.0006596148014068604, 0.0007215738296508789, 0.0007835328578948975, 0.000845491886138916, 0.0009074509143829346, 0.0009694099426269531, 0.0010313689708709717, 0.0010933279991149902, 0.0011552870273590088, 0.0012172460556030273, 0.001279205083847046, 0.0013411641120910645, 0.001403123140335083, 0.0014650821685791016, 0.0015270411968231201, 0.0015890002250671387, 0.0016509592533111572, 0.0017129182815551758, 0.0017748773097991943, 0.0018368363380432129, 0.0018987953662872314, 0.00196075439453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 7.0, 8.0, 9.0, 18.0, 30.0, 34.0, 71.0, 101.0, 188.0, 586.0, 4191302.0, 1334.0, 235.0, 113.0, 76.0, 48.0, 31.0, 24.0, 21.0, 11.0, 12.0, 5.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5107421875, -0.49350738525390625, -0.4762725830078125, -0.45903778076171875, -0.441802978515625, -0.42456817626953125, -0.4073333740234375, -0.39009857177734375, -0.37286376953125, -0.35562896728515625, -0.3383941650390625, -0.32115936279296875, -0.303924560546875, -0.28668975830078125, -0.2694549560546875, -0.25222015380859375, -0.2349853515625, -0.21775054931640625, -0.2005157470703125, -0.18328094482421875, -0.166046142578125, -0.14881134033203125, -0.1315765380859375, -0.11434173583984375, -0.09710693359375, -0.07987213134765625, -0.0626373291015625, -0.04540252685546875, -0.028167724609375, -0.01093292236328125, 0.0063018798828125, 0.02353668212890625, 0.040771484375, 0.05800628662109375, 0.0752410888671875, 0.09247589111328125, 0.109710693359375, 0.12694549560546875, 0.1441802978515625, 0.16141510009765625, 0.17864990234375, 0.19588470458984375, 0.2131195068359375, 0.23035430908203125, 0.247589111328125, 0.26482391357421875, 0.2820587158203125, 0.29929351806640625, 0.3165283203125, 0.33376312255859375, 0.3509979248046875, 0.36823272705078125, 0.385467529296875, 0.40270233154296875, 0.4199371337890625, 0.43717193603515625, 0.45440673828125, 0.47164154052734375, 0.4888763427734375, 0.5061111450195312, 0.523345947265625, 0.5405807495117188, 0.5578155517578125, 0.5750503540039062, 0.59228515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 8.0, 9.0, 18.0, 20.0, 38.0, 71.0, 121.0, 199.0, 456.0, 1766.0, 663.0, 294.0, 147.0, 94.0, 59.0, 25.0, 26.0, 22.0, 12.0, 10.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00408172607421875, -0.003922879695892334, -0.003764033317565918, -0.003605186939239502, -0.003446340560913086, -0.00328749418258667, -0.003128647804260254, -0.002969801425933838, -0.002810955047607422, -0.002652108669281006, -0.00249326229095459, -0.002334415912628174, -0.002175569534301758, -0.002016723155975342, -0.0018578767776489258, -0.0016990303993225098, -0.0015401840209960938, -0.0013813376426696777, -0.0012224912643432617, -0.0010636448860168457, -0.0009047985076904297, -0.0007459521293640137, -0.0005871057510375977, -0.00042825937271118164, -0.0002694129943847656, -0.00011056661605834961, 4.8279762268066406e-05, 0.00020712614059448242, 0.00036597251892089844, 0.0005248188972473145, 0.0006836652755737305, 0.0008425116539001465, 0.0010013580322265625, 0.0011602044105529785, 0.0013190507888793945, 0.0014778971672058105, 0.0016367435455322266, 0.0017955899238586426, 0.0019544363021850586, 0.0021132826805114746, 0.0022721290588378906, 0.0024309754371643066, 0.0025898218154907227, 0.0027486681938171387, 0.0029075145721435547, 0.0030663609504699707, 0.0032252073287963867, 0.0033840537071228027, 0.0035429000854492188, 0.0037017464637756348, 0.0038605928421020508, 0.004019439220428467, 0.004178285598754883, 0.004337131977081299, 0.004495978355407715, 0.004654824733734131, 0.004813671112060547, 0.004972517490386963, 0.005131363868713379, 0.005290210247039795, 0.005449056625366211, 0.005607903003692627, 0.005766749382019043, 0.005925595760345459, 0.006084442138671875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 10.0, 987.0, 22.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11288654804229736, -0.08866234868764877, -0.06443814933300018, -0.040213942527770996, -0.015989743173122406, 0.008234456181526184, 0.03245866298675537, 0.056682854890823364, 0.08090706169605255, 0.10513126105070114, 0.12935546040534973, 0.15357966721057892, 0.1778038740158081, 0.2020280659198761, 0.22625227272510529, 0.2504764795303345, 0.27470067143440247, 0.29892486333847046, 0.32314908504486084, 0.34737327694892883, 0.3715974688529968, 0.3958216905593872, 0.4200458824634552, 0.4442700743675232, 0.4684942960739136, 0.49271848797798157, 0.5169426798820496, 0.5411669015884399, 0.5653911232948303, 0.5896152853965759, 0.6138395071029663, 0.6380636692047119, 0.6622878909111023, 0.6865121126174927, 0.7107362747192383, 0.7349604964256287, 0.759184718132019, 0.7834088802337646, 0.807633101940155, 0.8318573236465454, 0.856081485748291, 0.8803057074546814, 0.904529869556427, 0.9287540912628174, 0.9529783129692078, 0.9772024750709534, 1.0014266967773438, 1.0256508588790894, 1.0498751401901245, 1.0740993022918701, 1.0983235836029053, 1.1225477457046509, 1.1467719078063965, 1.1709961891174316, 1.1952203512191772, 1.2194445133209229, 1.2436686754226685, 1.267892837524414, 1.2921171188354492, 1.3163412809371948, 1.3405654430389404, 1.3647897243499756, 1.3890138864517212, 1.4132380485534668, 1.437462329864502]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 16.0, 38.0, 93.0, 138.0, 185.0, 191.0, 175.0, 83.0, 49.0, 22.0, 14.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04213511943817139, -0.039557844400405884, -0.03698056936264038, -0.034403298050165176, -0.03182602301239967, -0.02924874797463417, -0.026671474799513817, -0.024094201624393463, -0.02151692658662796, -0.018939651548862457, -0.016362378373742104, -0.013785104267299175, -0.011207830160856247, -0.008630556054413319, -0.00605328194797039, -0.0034760087728500366, -0.0008987337350845337, 0.0016785403713583946, 0.004255814477801323, 0.006833088584244251, 0.00941036269068718, 0.011987636797130108, 0.014564910903573036, 0.01714218407869339, 0.019719459116458893, 0.022296734154224396, 0.02487400732934475, 0.027451280504465103, 0.030028555542230606, 0.03260583057999611, 0.035183101892471313, 0.037760376930236816, 0.04033765196800232, 0.04291492700576782, 0.045492202043533325, 0.04806947335600853, 0.05064674839377403, 0.053224023431539536, 0.05580129474401474, 0.05837856978178024, 0.060955844819545746, 0.06353311985731125, 0.06611039489507675, 0.06868766993284225, 0.07126493752002716, 0.07384221255779266, 0.07641948759555817, 0.07899676263332367, 0.08157403767108917, 0.08415131270885468, 0.08672858774662018, 0.08930586278438568, 0.09188313782215118, 0.09446040540933609, 0.09703768044710159, 0.0996149554848671, 0.1021922305226326, 0.1047695055603981, 0.1073467805981636, 0.10992405563592911, 0.11250132322311401, 0.11507859826087952, 0.11765587329864502, 0.12023314833641052, 0.12281042337417603]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 6.0, 5.0, 12.0, 10.0, 9.0, 11.0, 13.0, 19.0, 23.0, 22.0, 36.0, 26.0, 33.0, 37.0, 35.0, 41.0, 45.0, 132.0, 33869.0, 1013297.0, 409.0, 80.0, 46.0, 46.0, 40.0, 26.0, 28.0, 29.0, 28.0, 28.0, 15.0, 21.0, 7.0, 14.0, 12.0, 11.0, 8.0, 8.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.219482421875, -0.21306610107421875, -0.2066497802734375, -0.20023345947265625, -0.193817138671875, -0.18740081787109375, -0.1809844970703125, -0.17456817626953125, -0.16815185546875, -0.16173553466796875, -0.1553192138671875, -0.14890289306640625, -0.142486572265625, -0.13607025146484375, -0.1296539306640625, -0.12323760986328125, -0.1168212890625, -0.11040496826171875, -0.1039886474609375, -0.09757232666015625, -0.091156005859375, -0.08473968505859375, -0.0783233642578125, -0.07190704345703125, -0.06549072265625, -0.05907440185546875, -0.0526580810546875, -0.04624176025390625, -0.039825439453125, -0.03340911865234375, -0.0269927978515625, -0.02057647705078125, -0.01416015625, -0.00774383544921875, -0.0013275146484375, 0.00508880615234375, 0.011505126953125, 0.01792144775390625, 0.0243377685546875, 0.03075408935546875, 0.03717041015625, 0.04358673095703125, 0.0500030517578125, 0.05641937255859375, 0.062835693359375, 0.06925201416015625, 0.0756683349609375, 0.08208465576171875, 0.0885009765625, 0.09491729736328125, 0.1013336181640625, 0.10774993896484375, 0.114166259765625, 0.12058258056640625, 0.1269989013671875, 0.13341522216796875, 0.13983154296875, 0.14624786376953125, 0.1526641845703125, 0.15908050537109375, 0.165496826171875, 0.17191314697265625, 0.1783294677734375, 0.18474578857421875, 0.191162109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 12.0, 120.0, 440.0, 366.0, 77.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003528594970703125, -0.002933681011199951, -0.0023387670516967773, -0.0017438530921936035, -0.0011489391326904297, -0.0005540251731872559, 4.088878631591797e-05, 0.0006358027458190918, 0.0012307167053222656, 0.0018256306648254395, 0.0024205446243286133, 0.003015458583831787, 0.003610372543334961, 0.004205286502838135, 0.004800200462341309, 0.005395114421844482, 0.005990028381347656, 0.00658494234085083, 0.007179856300354004, 0.007774770259857178, 0.008369684219360352, 0.008964598178863525, 0.0095595121383667, 0.010154426097869873, 0.010749340057373047, 0.01134425401687622, 0.011939167976379395, 0.012534081935882568, 0.013128995895385742, 0.013723909854888916, 0.01431882381439209, 0.014913737773895264, 0.015508651733398438, 0.01610356569290161, 0.016698479652404785, 0.01729339361190796, 0.017888307571411133, 0.018483221530914307, 0.01907813549041748, 0.019673049449920654, 0.020267963409423828, 0.020862877368927002, 0.021457791328430176, 0.02205270528793335, 0.022647619247436523, 0.023242533206939697, 0.02383744716644287, 0.024432361125946045, 0.02502727508544922, 0.025622189044952393, 0.026217103004455566, 0.02681201696395874, 0.027406930923461914, 0.028001844882965088, 0.02859675884246826, 0.029191672801971436, 0.02978658676147461, 0.030381500720977783, 0.030976414680480957, 0.03157132863998413, 0.032166242599487305, 0.03276115655899048, 0.03335607051849365, 0.033950984477996826, 0.0345458984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 4.0, 4.0, 12.0, 17.0, 16.0, 20.0, 24.0, 55.0, 75.0, 103.0, 221.0, 383.0, 833.0, 2470.0, 10333.0, 68808.0, 770537.0, 169866.0, 18434.0, 4040.0, 1171.0, 477.0, 215.0, 127.0, 90.0, 47.0, 34.0, 30.0, 23.0, 18.0, 14.0, 9.0, 9.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08154296875, -0.07919120788574219, -0.07683944702148438, -0.07448768615722656, -0.07213592529296875, -0.06978416442871094, -0.06743240356445312, -0.06508064270019531, -0.0627288818359375, -0.06037712097167969, -0.058025360107421875, -0.05567359924316406, -0.05332183837890625, -0.05097007751464844, -0.048618316650390625, -0.04626655578613281, -0.043914794921875, -0.04156303405761719, -0.039211273193359375, -0.03685951232910156, -0.03450775146484375, -0.03215599060058594, -0.029804229736328125, -0.027452468872070312, -0.0251007080078125, -0.022748947143554688, -0.020397186279296875, -0.018045425415039062, -0.01569366455078125, -0.013341903686523438, -0.010990142822265625, -0.008638381958007812, -0.00628662109375, -0.0039348602294921875, -0.001583099365234375, 0.0007686614990234375, 0.00312042236328125, 0.0054721832275390625, 0.007823944091796875, 0.010175704956054688, 0.0125274658203125, 0.014879226684570312, 0.017230987548828125, 0.019582748413085938, 0.02193450927734375, 0.024286270141601562, 0.026638031005859375, 0.028989791870117188, 0.031341552734375, 0.03369331359863281, 0.036045074462890625, 0.03839683532714844, 0.04074859619140625, 0.04310035705566406, 0.045452117919921875, 0.04780387878417969, 0.0501556396484375, 0.05250740051269531, 0.054859161376953125, 0.05721092224121094, 0.05956268310546875, 0.06191444396972656, 0.06426620483398438, 0.06661796569824219, 0.0689697265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 7.0, 11.0, 9.0, 13.0, 20.0, 17.0, 14.0, 27.0, 31.0, 40.0, 43.0, 48.0, 59.0, 55.0, 61.0, 63.0, 62.0, 62.0, 68.0, 44.0, 35.0, 32.0, 32.0, 25.0, 25.0, 17.0, 18.0, 12.0, 15.0, 8.0, 7.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.0309906005859375, -0.030187606811523438, -0.029384613037109375, -0.028581619262695312, -0.02777862548828125, -0.026975631713867188, -0.026172637939453125, -0.025369644165039062, -0.024566650390625, -0.023763656616210938, -0.022960662841796875, -0.022157669067382812, -0.02135467529296875, -0.020551681518554688, -0.019748687744140625, -0.018945693969726562, -0.0181427001953125, -0.017339706420898438, -0.016536712646484375, -0.015733718872070312, -0.01493072509765625, -0.014127731323242188, -0.013324737548828125, -0.012521743774414062, -0.01171875, -0.010915756225585938, -0.010112762451171875, -0.009309768676757812, -0.00850677490234375, -0.0077037811279296875, -0.006900787353515625, -0.0060977935791015625, -0.0052947998046875, -0.0044918060302734375, -0.003688812255859375, -0.0028858184814453125, -0.00208282470703125, -0.0012798309326171875, -0.000476837158203125, 0.0003261566162109375, 0.001129150390625, 0.0019321441650390625, 0.002735137939453125, 0.0035381317138671875, 0.00434112548828125, 0.0051441192626953125, 0.005947113037109375, 0.0067501068115234375, 0.0075531005859375, 0.008356094360351562, 0.009159088134765625, 0.009962081909179688, 0.01076507568359375, 0.011568069458007812, 0.012371063232421875, 0.013174057006835938, 0.01397705078125, 0.014780044555664062, 0.015583038330078125, 0.016386032104492188, 0.01718902587890625, 0.017992019653320312, 0.018795013427734375, 0.019598007202148438, 0.0204010009765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 1.0, 7.0, 4.0, 5.0, 14.0, 11.0, 14.0, 19.0, 26.0, 51.0, 82.0, 126.0, 216.0, 545.0, 1441.0, 5136.0, 29524.0, 942332.0, 58883.0, 6874.0, 1883.0, 658.0, 294.0, 151.0, 68.0, 49.0, 35.0, 27.0, 21.0, 19.0, 7.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1016845703125, -0.0982503890991211, -0.09481620788574219, -0.09138202667236328, -0.08794784545898438, -0.08451366424560547, -0.08107948303222656, -0.07764530181884766, -0.07421112060546875, -0.07077693939208984, -0.06734275817871094, -0.06390857696533203, -0.060474395751953125, -0.05704021453857422, -0.05360603332519531, -0.050171852111816406, -0.0467376708984375, -0.043303489685058594, -0.03986930847167969, -0.03643512725830078, -0.033000946044921875, -0.02956676483154297, -0.026132583618164062, -0.022698402404785156, -0.01926422119140625, -0.015830039978027344, -0.012395858764648438, -0.008961677551269531, -0.005527496337890625, -0.0020933151245117188, 0.0013408660888671875, 0.004775047302246094, 0.008209228515625, 0.011643409729003906, 0.015077590942382812, 0.01851177215576172, 0.021945953369140625, 0.02538013458251953, 0.028814315795898438, 0.032248497009277344, 0.03568267822265625, 0.039116859436035156, 0.04255104064941406, 0.04598522186279297, 0.049419403076171875, 0.05285358428955078, 0.05628776550292969, 0.059721946716308594, 0.0631561279296875, 0.0665903091430664, 0.07002449035644531, 0.07345867156982422, 0.07689285278320312, 0.08032703399658203, 0.08376121520996094, 0.08719539642333984, 0.09062957763671875, 0.09406375885009766, 0.09749794006347656, 0.10093212127685547, 0.10436630249023438, 0.10780048370361328, 0.11123466491699219, 0.1146688461303711, 0.11810302734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 2.0, 9.0, 9.0, 10.0, 21.0, 19.0, 28.0, 55.0, 124.0, 142.0, 166.0, 168.0, 93.0, 52.0, 29.0, 21.0, 11.0, 13.0, 8.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.09808349609375e-05, -2.0330771803855896e-05, -1.9680708646774292e-05, -1.9030645489692688e-05, -1.8380582332611084e-05, -1.773051917552948e-05, -1.7080456018447876e-05, -1.6430392861366272e-05, -1.5780329704284668e-05, -1.5130266547203064e-05, -1.448020339012146e-05, -1.3830140233039856e-05, -1.3180077075958252e-05, -1.2530013918876648e-05, -1.1879950761795044e-05, -1.122988760471344e-05, -1.0579824447631836e-05, -9.929761290550232e-06, -9.279698133468628e-06, -8.629634976387024e-06, -7.97957181930542e-06, -7.329508662223816e-06, -6.679445505142212e-06, -6.029382348060608e-06, -5.379319190979004e-06, -4.7292560338974e-06, -4.079192876815796e-06, -3.429129719734192e-06, -2.779066562652588e-06, -2.129003405570984e-06, -1.4789402484893799e-06, -8.288770914077759e-07, -1.7881393432617188e-07, 4.7124922275543213e-07, 1.1213123798370361e-06, 1.7713755369186401e-06, 2.421438694000244e-06, 3.071501851081848e-06, 3.721565008163452e-06, 4.371628165245056e-06, 5.02169132232666e-06, 5.671754479408264e-06, 6.321817636489868e-06, 6.971880793571472e-06, 7.621943950653076e-06, 8.27200710773468e-06, 8.922070264816284e-06, 9.572133421897888e-06, 1.0222196578979492e-05, 1.0872259736061096e-05, 1.15223228931427e-05, 1.2172386050224304e-05, 1.2822449207305908e-05, 1.3472512364387512e-05, 1.4122575521469116e-05, 1.477263867855072e-05, 1.5422701835632324e-05, 1.6072764992713928e-05, 1.6722828149795532e-05, 1.7372891306877136e-05, 1.802295446395874e-05, 1.8673017621040344e-05, 1.9323080778121948e-05, 1.9973143935203552e-05, 2.0623207092285156e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 8.0, 11.0, 12.0, 26.0, 32.0, 37.0, 70.0, 118.0, 161.0, 325.0, 748.0, 1854.0, 6709.0, 56469.0, 956006.0, 19682.0, 3868.0, 1258.0, 523.0, 239.0, 139.0, 79.0, 51.0, 40.0, 21.0, 23.0, 9.0, 7.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1689453125, -0.16402244567871094, -0.15909957885742188, -0.1541767120361328, -0.14925384521484375, -0.1443309783935547, -0.13940811157226562, -0.13448524475097656, -0.1295623779296875, -0.12463951110839844, -0.11971664428710938, -0.11479377746582031, -0.10987091064453125, -0.10494804382324219, -0.10002517700195312, -0.09510231018066406, -0.090179443359375, -0.08525657653808594, -0.08033370971679688, -0.07541084289550781, -0.07048797607421875, -0.06556510925292969, -0.060642242431640625, -0.05571937561035156, -0.0507965087890625, -0.04587364196777344, -0.040950775146484375, -0.03602790832519531, -0.03110504150390625, -0.026182174682617188, -0.021259307861328125, -0.016336441040039062, -0.01141357421875, -0.0064907073974609375, -0.001567840576171875, 0.0033550262451171875, 0.00827789306640625, 0.013200759887695312, 0.018123626708984375, 0.023046493530273438, 0.0279693603515625, 0.03289222717285156, 0.037815093994140625, 0.04273796081542969, 0.04766082763671875, 0.05258369445800781, 0.057506561279296875, 0.06242942810058594, 0.067352294921875, 0.07227516174316406, 0.07719802856445312, 0.08212089538574219, 0.08704376220703125, 0.09196662902832031, 0.09688949584960938, 0.10181236267089844, 0.1067352294921875, 0.11165809631347656, 0.11658096313476562, 0.12150382995605469, 0.12642669677734375, 0.1313495635986328, 0.13627243041992188, 0.14119529724121094, 0.1461181640625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 8.0, 8.0, 11.0, 20.0, 32.0, 76.0, 125.0, 226.0, 225.0, 111.0, 64.0, 19.0, 21.0, 15.0, 8.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07562255859375, -0.07368040084838867, -0.07173824310302734, -0.06979608535766602, -0.06785392761230469, -0.06591176986694336, -0.06396961212158203, -0.0620274543762207, -0.060085296630859375, -0.05814313888549805, -0.05620098114013672, -0.05425882339477539, -0.05231666564941406, -0.050374507904052734, -0.048432350158691406, -0.04649019241333008, -0.04454803466796875, -0.04260587692260742, -0.040663719177246094, -0.038721561431884766, -0.03677940368652344, -0.03483724594116211, -0.03289508819580078, -0.030952930450439453, -0.029010772705078125, -0.027068614959716797, -0.02512645721435547, -0.02318429946899414, -0.021242141723632812, -0.019299983978271484, -0.017357826232910156, -0.015415668487548828, -0.0134735107421875, -0.011531352996826172, -0.009589195251464844, -0.007647037506103516, -0.0057048797607421875, -0.0037627220153808594, -0.0018205642700195312, 0.00012159347534179688, 0.002063751220703125, 0.004005908966064453, 0.005948066711425781, 0.00789022445678711, 0.009832382202148438, 0.011774539947509766, 0.013716697692871094, 0.015658855438232422, 0.01760101318359375, 0.019543170928955078, 0.021485328674316406, 0.023427486419677734, 0.025369644165039062, 0.02731180191040039, 0.02925395965576172, 0.031196117401123047, 0.033138275146484375, 0.0350804328918457, 0.03702259063720703, 0.03896474838256836, 0.04090690612792969, 0.042849063873291016, 0.044791221618652344, 0.04673337936401367, 0.048675537109375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [10.0, 721.0, 286.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23293253779411316, -0.11313716322183609, 0.006658211350440979, 0.12645357847213745, 0.24624896049499512, 0.3660443127155304, 0.48583969473838806, 0.6056350469589233, 0.7254304885864258, 0.8452258706092834, 0.9650212526321411, 1.084816575050354, 1.2046120166778564, 1.3244073390960693, 1.4442026615142822, 1.5639981031417847, 1.6837934255599976, 1.8035887479782104, 1.923384189605713, 2.043179512023926, 2.1629748344421387, 2.2827701568603516, 2.4025657176971436, 2.5223610401153564, 2.6421563625335693, 2.7619516849517822, 2.881747007369995, 3.001542568206787, 3.121337890625, 3.241133213043213, 3.360928535461426, 3.4807238578796387, 3.6005194187164307, 3.7203147411346436, 3.8401100635528564, 3.9599056243896484, 4.079700946807861, 4.199496269226074, 4.319291591644287, 4.4390869140625, 4.558882236480713, 4.678677558898926, 4.798472881317139, 4.918268203735352, 5.0380635261535645, 5.157858848571777, 5.277654647827148, 5.397449970245361, 5.517245292663574, 5.637040615081787, 5.7568359375, 5.876631259918213, 5.996426582336426, 6.116222381591797, 6.23601770401001, 6.355813026428223, 6.4756083488464355, 6.595403671264648, 6.715198993682861, 6.834994316101074, 6.954789638519287, 7.0745849609375, 7.194380760192871, 7.314176082611084, 7.433971405029297]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 11.0, 21.0, 39.0, 46.0, 74.0, 90.0, 118.0, 125.0, 128.0, 99.0, 86.0, 75.0, 36.0, 30.0, 16.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.186595618724823, -0.17369957268238068, -0.16080352663993835, -0.14790749549865723, -0.1350114494562149, -0.12211540341377258, -0.10921935737133026, -0.09632331877946854, -0.08342727273702621, -0.07053122669458389, -0.05763518810272217, -0.044739142060279846, -0.03184309974312782, -0.0189470574259758, -0.006051011383533478, 0.006845027208328247, 0.01974107325077057, 0.03263711556792259, 0.045533157885074615, 0.05842920392751694, 0.07132524251937866, 0.08422128856182098, 0.0971173346042633, 0.11001337319612503, 0.12290941923856735, 0.13580545783042908, 0.1487015038728714, 0.16159754991531372, 0.17449359595775604, 0.18738964200019836, 0.2002856731414795, 0.21318171918392181, 0.22607776522636414, 0.23897381126880646, 0.2518698573112488, 0.2647658884525299, 0.2776619493961334, 0.29055798053741455, 0.30345404148101807, 0.3163500726222992, 0.3292461037635803, 0.34214213490486145, 0.35503819584846497, 0.3679342269897461, 0.3808302879333496, 0.39372631907463074, 0.40662235021591187, 0.4195184111595154, 0.4324144721031189, 0.4453105032444, 0.45820656418800354, 0.47110259532928467, 0.4839986562728882, 0.4968946874141693, 0.5097907185554504, 0.522686779499054, 0.5355827808380127, 0.5484788417816162, 0.561374843120575, 0.5742709040641785, 0.587166965007782, 0.6000629663467407, 0.6129590272903442, 0.6258550882339478, 0.6387511491775513]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 23.0, 150.0, 998.0, 4190286.0, 2207.0, 350.0, 129.0, 54.0, 33.0, 24.0, 14.0, 12.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2459716796875, -0.2227649688720703, -0.19955825805664062, -0.17635154724121094, -0.15314483642578125, -0.12993812561035156, -0.10673141479492188, -0.08352470397949219, -0.0603179931640625, -0.03711128234863281, -0.013904571533203125, 0.009302139282226562, 0.03250885009765625, 0.05571556091308594, 0.07892227172851562, 0.10212898254394531, 0.125335693359375, 0.1485424041748047, 0.17174911499023438, 0.19495582580566406, 0.21816253662109375, 0.24136924743652344, 0.2645759582519531, 0.2877826690673828, 0.3109893798828125, 0.3341960906982422, 0.3574028015136719, 0.38060951232910156, 0.40381622314453125, 0.42702293395996094, 0.4502296447753906, 0.4734363555908203, 0.49664306640625, 0.5198497772216797, 0.5430564880371094, 0.5662631988525391, 0.5894699096679688, 0.6126766204833984, 0.6358833312988281, 0.6590900421142578, 0.6822967529296875, 0.7055034637451172, 0.7287101745605469, 0.7519168853759766, 0.7751235961914062, 0.7983303070068359, 0.8215370178222656, 0.8447437286376953, 0.867950439453125, 0.8911571502685547, 0.9143638610839844, 0.9375705718994141, 0.9607772827148438, 0.9839839935302734, 1.0071907043457031, 1.0303974151611328, 1.0536041259765625, 1.0768108367919922, 1.1000175476074219, 1.1232242584228516, 1.1464309692382812, 1.169637680053711, 1.1928443908691406, 1.2160511016845703, 1.2392578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 20.0, 97.0, 249.0, 340.0, 221.0, 68.0, 21.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003814697265625, -0.0031189918518066406, -0.0024232864379882812, -0.0017275810241699219, -0.0010318756103515625, -0.0003361701965332031, 0.00035953521728515625, 0.0010552406311035156, 0.001750946044921875, 0.0024466514587402344, 0.0031423568725585938, 0.003838062286376953, 0.0045337677001953125, 0.005229473114013672, 0.005925178527832031, 0.006620883941650391, 0.00731658935546875, 0.00801229476928711, 0.008708000183105469, 0.009403705596923828, 0.010099411010742188, 0.010795116424560547, 0.011490821838378906, 0.012186527252197266, 0.012882232666015625, 0.013577938079833984, 0.014273643493652344, 0.014969348907470703, 0.015665054321289062, 0.016360759735107422, 0.01705646514892578, 0.01775217056274414, 0.0184478759765625, 0.01914358139038086, 0.01983928680419922, 0.020534992218017578, 0.021230697631835938, 0.021926403045654297, 0.022622108459472656, 0.023317813873291016, 0.024013519287109375, 0.024709224700927734, 0.025404930114746094, 0.026100635528564453, 0.026796340942382812, 0.027492046356201172, 0.02818775177001953, 0.02888345718383789, 0.02957916259765625, 0.03027486801147461, 0.03097057342529297, 0.03166627883911133, 0.03236198425292969, 0.03305768966674805, 0.033753395080566406, 0.034449100494384766, 0.035144805908203125, 0.035840511322021484, 0.036536216735839844, 0.0372319221496582, 0.03792762756347656, 0.03862333297729492, 0.03931903839111328, 0.04001474380493164, 0.04071044921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 13.0, 25.0, 32.0, 61.0, 80.0, 121.0, 240.0, 498.0, 42117.0, 4149635.0, 648.0, 271.0, 142.0, 116.0, 103.0, 61.0, 39.0, 35.0, 26.0, 11.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9521484375, -0.915679931640625, -0.87921142578125, -0.842742919921875, -0.8062744140625, -0.769805908203125, -0.73333740234375, -0.696868896484375, -0.660400390625, -0.623931884765625, -0.58746337890625, -0.550994873046875, -0.5145263671875, -0.478057861328125, -0.44158935546875, -0.405120849609375, -0.36865234375, -0.332183837890625, -0.29571533203125, -0.259246826171875, -0.2227783203125, -0.186309814453125, -0.14984130859375, -0.113372802734375, -0.076904296875, -0.040435791015625, -0.00396728515625, 0.032501220703125, 0.0689697265625, 0.105438232421875, 0.14190673828125, 0.178375244140625, 0.21484375, 0.251312255859375, 0.28778076171875, 0.324249267578125, 0.3607177734375, 0.397186279296875, 0.43365478515625, 0.470123291015625, 0.506591796875, 0.543060302734375, 0.57952880859375, 0.615997314453125, 0.6524658203125, 0.688934326171875, 0.72540283203125, 0.761871337890625, 0.79833984375, 0.834808349609375, 0.87127685546875, 0.907745361328125, 0.9442138671875, 0.980682373046875, 1.01715087890625, 1.053619384765625, 1.090087890625, 1.126556396484375, 1.16302490234375, 1.199493408203125, 1.2359619140625, 1.272430419921875, 1.30889892578125, 1.345367431640625, 1.3818359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 19.0, 156.0, 3757.0, 139.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055328369140625, -0.050527095794677734, -0.04572582244873047, -0.0409245491027832, -0.03612327575683594, -0.03132200241088867, -0.026520729064941406, -0.02171945571899414, -0.016918182373046875, -0.01211690902709961, -0.007315635681152344, -0.002514362335205078, 0.0022869110107421875, 0.007088184356689453, 0.011889457702636719, 0.016690731048583984, 0.02149200439453125, 0.026293277740478516, 0.03109455108642578, 0.03589582443237305, 0.04069709777832031, 0.04549837112426758, 0.050299644470214844, 0.05510091781616211, 0.059902191162109375, 0.06470346450805664, 0.0695047378540039, 0.07430601119995117, 0.07910728454589844, 0.0839085578918457, 0.08870983123779297, 0.09351110458374023, 0.0983123779296875, 0.10311365127563477, 0.10791492462158203, 0.1127161979675293, 0.11751747131347656, 0.12231874465942383, 0.1271200180053711, 0.13192129135131836, 0.13672256469726562, 0.1415238380432129, 0.14632511138916016, 0.15112638473510742, 0.1559276580810547, 0.16072893142700195, 0.16553020477294922, 0.17033147811889648, 0.17513275146484375, 0.17993402481079102, 0.18473529815673828, 0.18953657150268555, 0.1943378448486328, 0.19913911819458008, 0.20394039154052734, 0.2087416648864746, 0.21354293823242188, 0.21834421157836914, 0.2231454849243164, 0.22794675827026367, 0.23274803161621094, 0.2375493049621582, 0.24235057830810547, 0.24715185165405273, 0.251953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 9.0, 53.0, 615.0, 309.0, 21.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7131343483924866, -0.6577354073524475, -0.6023364663124084, -0.5469375252723694, -0.4915385842323303, -0.43613964319229126, -0.3807407021522522, -0.32534176111221313, -0.2699428200721741, -0.214543879032135, -0.15914493799209595, -0.10374599695205688, -0.04834705591201782, 0.00705188512802124, 0.0624508261680603, 0.11784976720809937, 0.17324870824813843, 0.2286476492881775, 0.28404659032821655, 0.3394455313682556, 0.3948444724082947, 0.45024341344833374, 0.5056423544883728, 0.5610412955284119, 0.6164402365684509, 0.67183917760849, 0.727238118648529, 0.7826370596885681, 0.8380360007286072, 0.8934349417686462, 0.9488338828086853, 1.0042328834533691, 1.0596318244934082, 1.1150307655334473, 1.1704297065734863, 1.2258286476135254, 1.2812275886535645, 1.3366265296936035, 1.3920254707336426, 1.4474244117736816, 1.5028233528137207, 1.5582222938537598, 1.6136212348937988, 1.669020175933838, 1.724419116973877, 1.779818058013916, 1.835216999053955, 1.8906159400939941, 1.9460148811340332, 2.0014138221740723, 2.0568127632141113, 2.1122117042541504, 2.1676106452941895, 2.2230095863342285, 2.2784085273742676, 2.3338074684143066, 2.3892064094543457, 2.4446053504943848, 2.500004291534424, 2.555403232574463, 2.610802173614502, 2.666201114654541, 2.72160005569458, 2.776998996734619, 2.832397937774658]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 16.0, 42.0, 61.0, 87.0, 116.0, 134.0, 178.0, 127.0, 108.0, 54.0, 43.0, 13.0, 12.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6850806474685669, -0.6631802320480347, -0.6412798166275024, -0.6193794012069702, -0.5974789261817932, -0.575578510761261, -0.5536780953407288, -0.5317776799201965, -0.5098772048950195, -0.4879767894744873, -0.4660763442516327, -0.44417592883110046, -0.42227548360824585, -0.4003750681877136, -0.3784746527671814, -0.35657423734664917, -0.33467382192611694, -0.3127734065055847, -0.2908729612827301, -0.2689725458621979, -0.24707211554050446, -0.22517168521881104, -0.2032712697982788, -0.1813708394765854, -0.15947040915489197, -0.13756997883319855, -0.11566955596208572, -0.0937691330909729, -0.07186870276927948, -0.04996827244758606, -0.028067857027053833, -0.006167426705360413, 0.015732944011688232, 0.037633370608091354, 0.059533797204494476, 0.0814342200756073, 0.10333465039730072, 0.12523508071899414, 0.14713549613952637, 0.1690359264612198, 0.1909363567829132, 0.21283678710460663, 0.23473721742630005, 0.2566376328468323, 0.2785380482673645, 0.3004384934902191, 0.32233890891075134, 0.34423935413360596, 0.3661397695541382, 0.3880401849746704, 0.409940630197525, 0.43184104561805725, 0.45374149084091187, 0.4756419062614441, 0.4975423216819763, 0.5194427371025085, 0.5413432121276855, 0.5632436275482178, 0.58514404296875, 0.6070444583892822, 0.6289449334144592, 0.6508453488349915, 0.6727457642555237, 0.6946461796760559, 0.7165465950965881]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 4.0, 6.0, 9.0, 4.0, 9.0, 15.0, 7.0, 17.0, 30.0, 25.0, 38.0, 60.0, 104.0, 169.0, 356.0, 834.0, 3261.0, 27217.0, 848380.0, 156367.0, 8770.0, 1658.0, 532.0, 246.0, 125.0, 99.0, 49.0, 33.0, 26.0, 16.0, 20.0, 14.0, 11.0, 9.0, 6.0, 4.0, 4.0, 4.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.3349609375, -0.3255958557128906, -0.31623077392578125, -0.3068656921386719, -0.2975006103515625, -0.2881355285644531, -0.27877044677734375, -0.2694053649902344, -0.260040283203125, -0.2506752014160156, -0.24131011962890625, -0.23194503784179688, -0.2225799560546875, -0.21321487426757812, -0.20384979248046875, -0.19448471069335938, -0.18511962890625, -0.17575454711914062, -0.16638946533203125, -0.15702438354492188, -0.1476593017578125, -0.13829421997070312, -0.12892913818359375, -0.11956405639648438, -0.110198974609375, -0.10083389282226562, -0.09146881103515625, -0.08210372924804688, -0.0727386474609375, -0.06337356567382812, -0.05400848388671875, -0.044643402099609375, -0.0352783203125, -0.025913238525390625, -0.01654815673828125, -0.007183074951171875, 0.0021820068359375, 0.011547088623046875, 0.02091217041015625, 0.030277252197265625, 0.039642333984375, 0.049007415771484375, 0.05837249755859375, 0.06773757934570312, 0.0771026611328125, 0.08646774291992188, 0.09583282470703125, 0.10519790649414062, 0.11456298828125, 0.12392807006835938, 0.13329315185546875, 0.14265823364257812, 0.1520233154296875, 0.16138839721679688, 0.17075347900390625, 0.18011856079101562, 0.189483642578125, 0.19884872436523438, 0.20821380615234375, 0.21757888793945312, 0.2269439697265625, 0.23630905151367188, 0.24567413330078125, 0.2550392150878906, 0.264404296875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 11.0, 15.0, 48.0, 84.0, 118.0, 180.0, 201.0, 146.0, 96.0, 54.0, 33.0, 13.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210418701171875, -0.019826173782348633, -0.018610477447509766, -0.0173947811126709, -0.01617908477783203, -0.014963388442993164, -0.013747692108154297, -0.01253199577331543, -0.011316299438476562, -0.010100603103637695, -0.008884906768798828, -0.007669210433959961, -0.006453514099121094, -0.0052378177642822266, -0.004022121429443359, -0.002806425094604492, -0.001590728759765625, -0.0003750324249267578, 0.0008406639099121094, 0.0020563602447509766, 0.0032720565795898438, 0.004487752914428711, 0.005703449249267578, 0.006919145584106445, 0.008134841918945312, 0.00935053825378418, 0.010566234588623047, 0.011781930923461914, 0.012997627258300781, 0.014213323593139648, 0.015429019927978516, 0.016644716262817383, 0.01786041259765625, 0.019076108932495117, 0.020291805267333984, 0.02150750160217285, 0.02272319793701172, 0.023938894271850586, 0.025154590606689453, 0.02637028694152832, 0.027585983276367188, 0.028801679611206055, 0.030017375946044922, 0.03123307228088379, 0.032448768615722656, 0.03366446495056152, 0.03488016128540039, 0.03609585762023926, 0.037311553955078125, 0.03852725028991699, 0.03974294662475586, 0.04095864295959473, 0.042174339294433594, 0.04339003562927246, 0.04460573196411133, 0.045821428298950195, 0.04703712463378906, 0.04825282096862793, 0.0494685173034668, 0.050684213638305664, 0.05189990997314453, 0.0531156063079834, 0.054331302642822266, 0.05554699897766113, 0.0567626953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 2.0, 7.0, 3.0, 6.0, 12.0, 9.0, 8.0, 15.0, 14.0, 26.0, 23.0, 45.0, 90.0, 127.0, 325.0, 932.0, 3488.0, 20133.0, 286191.0, 688892.0, 39879.0, 5974.0, 1384.0, 467.0, 171.0, 111.0, 55.0, 39.0, 25.0, 16.0, 14.0, 12.0, 10.0, 10.0, 7.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.146728515625, -0.1418628692626953, -0.13699722290039062, -0.13213157653808594, -0.12726593017578125, -0.12240028381347656, -0.11753463745117188, -0.11266899108886719, -0.1078033447265625, -0.10293769836425781, -0.09807205200195312, -0.09320640563964844, -0.08834075927734375, -0.08347511291503906, -0.07860946655273438, -0.07374382019042969, -0.068878173828125, -0.06401252746582031, -0.059146881103515625, -0.05428123474121094, -0.04941558837890625, -0.04454994201660156, -0.039684295654296875, -0.03481864929199219, -0.0299530029296875, -0.025087356567382812, -0.020221710205078125, -0.015356063842773438, -0.01049041748046875, -0.0056247711181640625, -0.000759124755859375, 0.0041065216064453125, 0.00897216796875, 0.013837814331054688, 0.018703460693359375, 0.023569107055664062, 0.02843475341796875, 0.03330039978027344, 0.038166046142578125, 0.04303169250488281, 0.0478973388671875, 0.05276298522949219, 0.057628631591796875, 0.06249427795410156, 0.06735992431640625, 0.07222557067871094, 0.07709121704101562, 0.08195686340332031, 0.086822509765625, 0.09168815612792969, 0.09655380249023438, 0.10141944885253906, 0.10628509521484375, 0.11115074157714844, 0.11601638793945312, 0.12088203430175781, 0.1257476806640625, 0.1306133270263672, 0.13547897338867188, 0.14034461975097656, 0.14521026611328125, 0.15007591247558594, 0.15494155883789062, 0.1598072052001953, 0.1646728515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 14.0, 7.0, 10.0, 18.0, 16.0, 16.0, 23.0, 16.0, 37.0, 38.0, 27.0, 45.0, 60.0, 44.0, 53.0, 53.0, 59.0, 61.0, 49.0, 45.0, 38.0, 47.0, 36.0, 28.0, 23.0, 17.0, 17.0, 13.0, 14.0, 8.0, 16.0, 6.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 5.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.050933837890625, -0.0492243766784668, -0.047514915466308594, -0.04580545425415039, -0.04409599304199219, -0.042386531829833984, -0.04067707061767578, -0.03896760940551758, -0.037258148193359375, -0.03554868698120117, -0.03383922576904297, -0.032129764556884766, -0.030420303344726562, -0.02871084213256836, -0.027001380920410156, -0.025291919708251953, -0.02358245849609375, -0.021872997283935547, -0.020163536071777344, -0.01845407485961914, -0.016744613647460938, -0.015035152435302734, -0.013325691223144531, -0.011616230010986328, -0.009906768798828125, -0.008197307586669922, -0.006487846374511719, -0.004778385162353516, -0.0030689239501953125, -0.0013594627380371094, 0.00034999847412109375, 0.002059459686279297, 0.0037689208984375, 0.005478382110595703, 0.007187843322753906, 0.00889730453491211, 0.010606765747070312, 0.012316226959228516, 0.014025688171386719, 0.015735149383544922, 0.017444610595703125, 0.019154071807861328, 0.02086353302001953, 0.022572994232177734, 0.024282455444335938, 0.02599191665649414, 0.027701377868652344, 0.029410839080810547, 0.03112030029296875, 0.03282976150512695, 0.034539222717285156, 0.03624868392944336, 0.03795814514160156, 0.039667606353759766, 0.04137706756591797, 0.04308652877807617, 0.044795989990234375, 0.04650545120239258, 0.04821491241455078, 0.049924373626708984, 0.05163383483886719, 0.05334329605102539, 0.055052757263183594, 0.0567622184753418, 0.0584716796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 9.0, 14.0, 15.0, 23.0, 25.0, 47.0, 77.0, 143.0, 294.0, 697.0, 1981.0, 7587.0, 104388.0, 892064.0, 34024.0, 4677.0, 1431.0, 518.0, 233.0, 114.0, 71.0, 33.0, 26.0, 9.0, 10.0, 10.0, 3.0, 14.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08782958984375, -0.08461761474609375, -0.0814056396484375, -0.07819366455078125, -0.074981689453125, -0.07176971435546875, -0.0685577392578125, -0.06534576416015625, -0.0621337890625, -0.05892181396484375, -0.0557098388671875, -0.05249786376953125, -0.049285888671875, -0.04607391357421875, -0.0428619384765625, -0.03964996337890625, -0.03643798828125, -0.03322601318359375, -0.0300140380859375, -0.02680206298828125, -0.023590087890625, -0.02037811279296875, -0.0171661376953125, -0.01395416259765625, -0.0107421875, -0.00753021240234375, -0.0043182373046875, -0.00110626220703125, 0.002105712890625, 0.00531768798828125, 0.0085296630859375, 0.01174163818359375, 0.01495361328125, 0.01816558837890625, 0.0213775634765625, 0.02458953857421875, 0.027801513671875, 0.03101348876953125, 0.0342254638671875, 0.03743743896484375, 0.0406494140625, 0.04386138916015625, 0.0470733642578125, 0.05028533935546875, 0.053497314453125, 0.05670928955078125, 0.0599212646484375, 0.06313323974609375, 0.06634521484375, 0.06955718994140625, 0.0727691650390625, 0.07598114013671875, 0.079193115234375, 0.08240509033203125, 0.0856170654296875, 0.08882904052734375, 0.092041015625, 0.09525299072265625, 0.0984649658203125, 0.10167694091796875, 0.104888916015625, 0.10810089111328125, 0.1113128662109375, 0.11452484130859375, 0.11773681640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 10.0, 12.0, 19.0, 23.0, 36.0, 50.0, 60.0, 65.0, 76.0, 77.0, 96.0, 75.0, 92.0, 62.0, 60.0, 48.0, 30.0, 31.0, 27.0, 11.0, 10.0, 4.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2576580047607422e-05, -1.2267380952835083e-05, -1.1958181858062744e-05, -1.1648982763290405e-05, -1.1339783668518066e-05, -1.1030584573745728e-05, -1.0721385478973389e-05, -1.041218638420105e-05, -1.0102987289428711e-05, -9.793788194656372e-06, -9.484589099884033e-06, -9.175390005111694e-06, -8.866190910339355e-06, -8.556991815567017e-06, -8.247792720794678e-06, -7.938593626022339e-06, -7.62939453125e-06, -7.320195436477661e-06, -7.010996341705322e-06, -6.701797246932983e-06, -6.3925981521606445e-06, -6.083399057388306e-06, -5.774199962615967e-06, -5.465000867843628e-06, -5.155801773071289e-06, -4.84660267829895e-06, -4.537403583526611e-06, -4.2282044887542725e-06, -3.919005393981934e-06, -3.6098062992095947e-06, -3.300607204437256e-06, -2.991408109664917e-06, -2.682209014892578e-06, -2.3730099201202393e-06, -2.0638108253479004e-06, -1.7546117305755615e-06, -1.4454126358032227e-06, -1.1362135410308838e-06, -8.270144462585449e-07, -5.178153514862061e-07, -2.086162567138672e-07, 1.0058283805847168e-07, 4.0978193283081055e-07, 7.189810276031494e-07, 1.0281801223754883e-06, 1.3373792171478271e-06, 1.646578311920166e-06, 1.955777406692505e-06, 2.2649765014648438e-06, 2.5741755962371826e-06, 2.8833746910095215e-06, 3.1925737857818604e-06, 3.5017728805541992e-06, 3.810971975326538e-06, 4.120171070098877e-06, 4.429370164871216e-06, 4.738569259643555e-06, 5.0477683544158936e-06, 5.356967449188232e-06, 5.666166543960571e-06, 5.97536563873291e-06, 6.284564733505249e-06, 6.593763828277588e-06, 6.902962923049927e-06, 7.212162017822266e-06]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 14.0, 18.0, 28.0, 67.0, 135.0, 340.0, 1307.0, 17506.0, 1012128.0, 15123.0, 1216.0, 372.0, 142.0, 73.0, 43.0, 16.0, 10.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1759033203125, -0.1699371337890625, -0.163970947265625, -0.1580047607421875, -0.15203857421875, -0.1460723876953125, -0.140106201171875, -0.1341400146484375, -0.128173828125, -0.1222076416015625, -0.116241455078125, -0.1102752685546875, -0.10430908203125, -0.0983428955078125, -0.092376708984375, -0.0864105224609375, -0.0804443359375, -0.0744781494140625, -0.068511962890625, -0.0625457763671875, -0.05657958984375, -0.0506134033203125, -0.044647216796875, -0.0386810302734375, -0.03271484375, -0.0267486572265625, -0.020782470703125, -0.0148162841796875, -0.00885009765625, -0.0028839111328125, 0.003082275390625, 0.0090484619140625, 0.0150146484375, 0.0209808349609375, 0.026947021484375, 0.0329132080078125, 0.03887939453125, 0.0448455810546875, 0.050811767578125, 0.0567779541015625, 0.062744140625, 0.0687103271484375, 0.074676513671875, 0.0806427001953125, 0.08660888671875, 0.0925750732421875, 0.098541259765625, 0.1045074462890625, 0.1104736328125, 0.1164398193359375, 0.122406005859375, 0.1283721923828125, 0.13433837890625, 0.1403045654296875, 0.146270751953125, 0.1522369384765625, 0.158203125, 0.1641693115234375, 0.170135498046875, 0.1761016845703125, 0.18206787109375, 0.1880340576171875, 0.194000244140625, 0.1999664306640625, 0.2059326171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 11.0, 29.0, 49.0, 99.0, 198.0, 235.0, 192.0, 84.0, 43.0, 23.0, 10.0, 11.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050506591796875, -0.04759836196899414, -0.04469013214111328, -0.04178190231323242, -0.03887367248535156, -0.0359654426574707, -0.033057212829589844, -0.030148983001708984, -0.027240753173828125, -0.024332523345947266, -0.021424293518066406, -0.018516063690185547, -0.015607833862304688, -0.012699604034423828, -0.009791374206542969, -0.006883144378662109, -0.00397491455078125, -0.0010666847229003906, 0.0018415451049804688, 0.004749774932861328, 0.0076580047607421875, 0.010566234588623047, 0.013474464416503906, 0.016382694244384766, 0.019290924072265625, 0.022199153900146484, 0.025107383728027344, 0.028015613555908203, 0.030923843383789062, 0.03383207321166992, 0.03674030303955078, 0.03964853286743164, 0.0425567626953125, 0.04546499252319336, 0.04837322235107422, 0.05128145217895508, 0.05418968200683594, 0.0570979118347168, 0.060006141662597656, 0.06291437149047852, 0.06582260131835938, 0.06873083114624023, 0.0716390609741211, 0.07454729080200195, 0.07745552062988281, 0.08036375045776367, 0.08327198028564453, 0.08618021011352539, 0.08908843994140625, 0.09199666976928711, 0.09490489959716797, 0.09781312942504883, 0.10072135925292969, 0.10362958908081055, 0.1065378189086914, 0.10944604873657227, 0.11235427856445312, 0.11526250839233398, 0.11817073822021484, 0.1210789680480957, 0.12398719787597656, 0.12689542770385742, 0.12980365753173828, 0.13271188735961914, 0.1356201171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 43.0, 390.0, 539.0, 33.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2392401695251465, -1.1626038551330566, -1.0859675407409668, -1.0093313455581665, -0.9326950311660767, -0.8560587167739868, -0.7794224619865417, -0.7027862071990967, -0.6261498928070068, -0.549513578414917, -0.4728773236274719, -0.39624103903770447, -0.319604754447937, -0.24296846985816956, -0.1663321852684021, -0.08969593048095703, -0.013059616088867188, 0.06357666850090027, 0.14021295309066772, 0.21684923768043518, 0.29348552227020264, 0.3701218068599701, 0.44675809144973755, 0.5233943462371826, 0.6000306606292725, 0.6766669750213623, 0.7533032298088074, 0.8299394845962524, 0.9065757989883423, 0.9832121133804321, 1.0598483085632324, 1.1364846229553223, 1.2131211757659912, 1.289757490158081, 1.366393804550171, 1.4430299997329712, 1.519666314125061, 1.5963026285171509, 1.6729388236999512, 1.749575138092041, 1.8262114524841309, 1.9028477668762207, 1.9794840812683105, 2.0561203956604004, 2.1327567100524902, 2.209392786026001, 2.286029100418091, 2.3626654148101807, 2.4393017292022705, 2.5159380435943604, 2.59257435798645, 2.66921067237854, 2.745846748352051, 2.8224830627441406, 2.8991193771362305, 2.9757556915283203, 3.05239200592041, 3.1290283203125, 3.20566463470459, 3.2823009490966797, 3.3589372634887695, 3.4355733394622803, 3.51220965385437, 3.58884596824646, 3.66548228263855]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 10.0, 8.0, 8.0, 7.0, 13.0, 17.0, 15.0, 26.0, 18.0, 34.0, 46.0, 40.0, 34.0, 39.0, 43.0, 40.0, 50.0, 45.0, 50.0, 50.0, 43.0, 46.0, 34.0, 45.0, 37.0, 27.0, 25.0, 21.0, 19.0, 23.0, 12.0, 10.0, 12.0, 7.0, 4.0, 9.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.3503272533416748, -0.33959850668907166, -0.3288697302341461, -0.31814098358154297, -0.3074122369289398, -0.29668349027633667, -0.28595471382141113, -0.275225967168808, -0.26449722051620483, -0.2537684738636017, -0.24303971230983734, -0.232310950756073, -0.22158220410346985, -0.2108534425497055, -0.20012468099594116, -0.189395934343338, -0.17866715788841248, -0.16793839633464813, -0.15720964968204498, -0.14648088812828064, -0.1357521414756775, -0.12502337992191315, -0.1142946183681488, -0.10356586426496506, -0.09283711016178131, -0.08210835605859756, -0.07137960195541382, -0.060650840401649475, -0.04992208629846573, -0.03919333219528198, -0.02846457064151764, -0.017735816538333893, -0.0070070624351501465, 0.003721693530678749, 0.014450449496507645, 0.02517920732498169, 0.035907961428165436, 0.04663671553134918, 0.057365477085113525, 0.06809423118829727, 0.07882298529148102, 0.08955173939466476, 0.10028049349784851, 0.11100925505161285, 0.1217380091547966, 0.13246676325798035, 0.1431955248117447, 0.15392428636550903, 0.16465303301811218, 0.17538179457187653, 0.18611054122447968, 0.19683930277824402, 0.20756804943084717, 0.2182968109846115, 0.22902557253837585, 0.239754319190979, 0.25048309564590454, 0.2612118422985077, 0.2719406187534332, 0.2826693654060364, 0.2933981120586395, 0.3041268587112427, 0.3148556351661682, 0.32558438181877136, 0.3363131284713745]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 12.0, 15.0, 45.0, 106.0, 234.0, 710.0, 2605.0, 15306.0, 302965.0, 3820093.0, 43715.0, 5547.0, 1443.0, 582.0, 299.0, 150.0, 99.0, 66.0, 58.0, 42.0, 33.0, 34.0, 25.0, 22.0, 14.0, 14.0, 13.0, 6.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11370849609375, -0.10670185089111328, -0.09969520568847656, -0.09268856048583984, -0.08568191528320312, -0.0786752700805664, -0.07166862487792969, -0.06466197967529297, -0.05765533447265625, -0.05064868927001953, -0.04364204406738281, -0.036635398864746094, -0.029628753662109375, -0.022622108459472656, -0.015615463256835938, -0.008608818054199219, -0.0016021728515625, 0.005404472351074219, 0.012411117553710938, 0.019417762756347656, 0.026424407958984375, 0.033431053161621094, 0.04043769836425781, 0.04744434356689453, 0.05445098876953125, 0.06145763397216797, 0.06846427917480469, 0.0754709243774414, 0.08247756958007812, 0.08948421478271484, 0.09649085998535156, 0.10349750518798828, 0.110504150390625, 0.11751079559326172, 0.12451744079589844, 0.13152408599853516, 0.13853073120117188, 0.1455373764038086, 0.1525440216064453, 0.15955066680908203, 0.16655731201171875, 0.17356395721435547, 0.1805706024169922, 0.1875772476196289, 0.19458389282226562, 0.20159053802490234, 0.20859718322753906, 0.21560382843017578, 0.2226104736328125, 0.22961711883544922, 0.23662376403808594, 0.24363040924072266, 0.2506370544433594, 0.2576436996459961, 0.2646503448486328, 0.27165699005126953, 0.27866363525390625, 0.28567028045654297, 0.2926769256591797, 0.2996835708618164, 0.3066902160644531, 0.31369686126708984, 0.32070350646972656, 0.3277101516723633, 0.334716796875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 22.0, 53.0, 89.0, 125.0, 164.0, 149.0, 136.0, 118.0, 70.0, 29.0, 20.0, 4.0, 9.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01428985595703125, -0.013133406639099121, -0.011976957321166992, -0.010820508003234863, -0.009664058685302734, -0.008507609367370605, -0.0073511600494384766, -0.006194710731506348, -0.005038261413574219, -0.00388181209564209, -0.002725362777709961, -0.001568913459777832, -0.0004124641418457031, 0.0007439851760864258, 0.0019004344940185547, 0.0030568838119506836, 0.0042133331298828125, 0.005369782447814941, 0.00652623176574707, 0.007682681083679199, 0.008839130401611328, 0.009995579719543457, 0.011152029037475586, 0.012308478355407715, 0.013464927673339844, 0.014621376991271973, 0.0157778263092041, 0.01693427562713623, 0.01809072494506836, 0.01924717426300049, 0.020403623580932617, 0.021560072898864746, 0.022716522216796875, 0.023872971534729004, 0.025029420852661133, 0.02618587017059326, 0.02734231948852539, 0.02849876880645752, 0.02965521812438965, 0.030811667442321777, 0.031968116760253906, 0.033124566078186035, 0.034281015396118164, 0.03543746471405029, 0.03659391403198242, 0.03775036334991455, 0.03890681266784668, 0.04006326198577881, 0.04121971130371094, 0.042376160621643066, 0.043532609939575195, 0.044689059257507324, 0.04584550857543945, 0.04700195789337158, 0.04815840721130371, 0.04931485652923584, 0.05047130584716797, 0.0516277551651001, 0.05278420448303223, 0.053940653800964355, 0.055097103118896484, 0.05625355243682861, 0.05741000175476074, 0.05856645107269287, 0.059722900390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 27.0, 41.0, 135.0, 565.0, 284005.0, 3908094.0, 970.0, 259.0, 110.0, 40.0, 23.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91259765625, -0.8646469116210938, -0.8166961669921875, -0.7687454223632812, -0.720794677734375, -0.6728439331054688, -0.6248931884765625, -0.5769424438476562, -0.52899169921875, -0.48104095458984375, -0.4330902099609375, -0.38513946533203125, -0.337188720703125, -0.28923797607421875, -0.2412872314453125, -0.19333648681640625, -0.1453857421875, -0.09743499755859375, -0.0494842529296875, -0.00153350830078125, 0.046417236328125, 0.09436798095703125, 0.1423187255859375, 0.19026947021484375, 0.23822021484375, 0.28617095947265625, 0.3341217041015625, 0.38207244873046875, 0.430023193359375, 0.47797393798828125, 0.5259246826171875, 0.5738754272460938, 0.621826171875, 0.6697769165039062, 0.7177276611328125, 0.7656784057617188, 0.813629150390625, 0.8615798950195312, 0.9095306396484375, 0.9574813842773438, 1.00543212890625, 1.0533828735351562, 1.1013336181640625, 1.1492843627929688, 1.197235107421875, 1.2451858520507812, 1.2931365966796875, 1.3410873413085938, 1.3890380859375, 1.4369888305664062, 1.4849395751953125, 1.5328903198242188, 1.580841064453125, 1.6287918090820312, 1.6767425537109375, 1.7246932983398438, 1.77264404296875, 1.8205947875976562, 1.8685455322265625, 1.9164962768554688, 1.964447021484375, 2.0123977661132812, 2.0603485107421875, 2.1082992553710938, 2.15625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 16.0, 54.0, 238.0, 3440.0, 271.0, 40.0, 16.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046417236328125, -0.0415339469909668, -0.036650657653808594, -0.03176736831665039, -0.026884078979492188, -0.022000789642333984, -0.01711750030517578, -0.012234210968017578, -0.007350921630859375, -0.002467632293701172, 0.0024156570434570312, 0.007298946380615234, 0.012182235717773438, 0.01706552505493164, 0.021948814392089844, 0.026832103729248047, 0.03171539306640625, 0.03659868240356445, 0.041481971740722656, 0.04636526107788086, 0.05124855041503906, 0.056131839752197266, 0.06101512908935547, 0.06589841842651367, 0.07078170776367188, 0.07566499710083008, 0.08054828643798828, 0.08543157577514648, 0.09031486511230469, 0.09519815444946289, 0.1000814437866211, 0.1049647331237793, 0.1098480224609375, 0.1147313117980957, 0.1196146011352539, 0.12449789047241211, 0.1293811798095703, 0.13426446914672852, 0.13914775848388672, 0.14403104782104492, 0.14891433715820312, 0.15379762649536133, 0.15868091583251953, 0.16356420516967773, 0.16844749450683594, 0.17333078384399414, 0.17821407318115234, 0.18309736251831055, 0.18798065185546875, 0.19286394119262695, 0.19774723052978516, 0.20263051986694336, 0.20751380920410156, 0.21239709854125977, 0.21728038787841797, 0.22216367721557617, 0.22704696655273438, 0.23193025588989258, 0.23681354522705078, 0.24169683456420898, 0.2465801239013672, 0.2514634132385254, 0.2563467025756836, 0.2612299919128418, 0.26611328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 16.0, 266.0, 701.0, 25.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5084495544433594, -3.4370200634002686, -3.3655905723571777, -3.294160842895508, -3.222731351852417, -3.151301860809326, -3.0798721313476562, -3.0084426403045654, -2.9370131492614746, -2.865583658218384, -2.794154167175293, -2.722724437713623, -2.6512949466705322, -2.5798654556274414, -2.5084357261657715, -2.4370062351226807, -2.36557674407959, -2.294147253036499, -2.222717761993408, -2.1512880325317383, -2.0798585414886475, -2.0084290504455566, -1.9369994401931763, -1.865569829940796, -1.794140338897705, -1.7227108478546143, -1.6512812376022339, -1.5798516273498535, -1.5084221363067627, -1.4369926452636719, -1.3655630350112915, -1.2941334247589111, -1.2227036952972412, -1.1512742042541504, -1.07984459400177, -1.0084149837493896, -0.9369854927062988, -0.8655559420585632, -0.7941263914108276, -0.722696840763092, -0.6512672901153564, -0.5798377394676208, -0.5084081888198853, -0.43697863817214966, -0.36554908752441406, -0.29411953687667847, -0.22268998622894287, -0.15126043558120728, -0.07983088493347168, -0.008401334285736084, 0.06302821636199951, 0.1344577670097351, 0.2058873176574707, 0.2773168683052063, 0.3487464189529419, 0.4201759696006775, 0.4916055202484131, 0.5630350708961487, 0.6344646215438843, 0.7058941721916199, 0.7773237228393555, 0.8487532734870911, 0.9201828241348267, 0.9916123747825623, 1.0630419254302979]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 10.0, 25.0, 27.0, 49.0, 67.0, 98.0, 123.0, 120.0, 109.0, 87.0, 86.0, 70.0, 58.0, 28.0, 25.0, 2.0, 2.0, 7.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5035858154296875, -0.4864669144153595, -0.4693479835987091, -0.4522290825843811, -0.4351101517677307, -0.4179912507534027, -0.4008723497390747, -0.3837534189224243, -0.3666345179080963, -0.3495156168937683, -0.3323966860771179, -0.3152777850627899, -0.2981588840484619, -0.2810399532318115, -0.2639210522174835, -0.24680213630199432, -0.22968322038650513, -0.21256430447101593, -0.19544538855552673, -0.17832648754119873, -0.16120757162570953, -0.14408865571022034, -0.12696975469589233, -0.10985083878040314, -0.09273192286491394, -0.07561300694942474, -0.058494098484516144, -0.041375186294317245, -0.024256274104118347, -0.00713735818862915, 0.00998155027627945, 0.02710045874118805, 0.04421931505203247, 0.06133822724223137, 0.07845713943243027, 0.09557604789733887, 0.11269496381282806, 0.12981387972831726, 0.14693278074264526, 0.16405169665813446, 0.18117061257362366, 0.19828952848911285, 0.21540844440460205, 0.23252734541893005, 0.24964626133441925, 0.26676517724990845, 0.28388407826423645, 0.30100297927856445, 0.31812191009521484, 0.33524081110954285, 0.35235974192619324, 0.36947864294052124, 0.38659757375717163, 0.40371647477149963, 0.42083537578582764, 0.437954306602478, 0.45507320761680603, 0.47219210863113403, 0.4893110394477844, 0.5064299702644348, 0.5235488414764404, 0.5406677722930908, 0.5577867031097412, 0.5749055743217468, 0.5920245051383972]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 10.0, 6.0, 16.0, 13.0, 18.0, 27.0, 49.0, 45.0, 73.0, 102.0, 160.0, 221.0, 368.0, 675.0, 1522.0, 4806.0, 21025.0, 149862.0, 744629.0, 102067.0, 16156.0, 3723.0, 1367.0, 596.0, 340.0, 201.0, 119.0, 90.0, 64.0, 41.0, 38.0, 23.0, 24.0, 12.0, 14.0, 10.0, 3.0, 2.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 6.0, 2.0], "bins": [-0.2320556640625, -0.22568321228027344, -0.21931076049804688, -0.2129383087158203, -0.20656585693359375, -0.2001934051513672, -0.19382095336914062, -0.18744850158691406, -0.1810760498046875, -0.17470359802246094, -0.16833114624023438, -0.1619586944580078, -0.15558624267578125, -0.1492137908935547, -0.14284133911132812, -0.13646888732910156, -0.130096435546875, -0.12372398376464844, -0.11735153198242188, -0.11097908020019531, -0.10460662841796875, -0.09823417663574219, -0.09186172485351562, -0.08548927307128906, -0.0791168212890625, -0.07274436950683594, -0.06637191772460938, -0.05999946594238281, -0.05362701416015625, -0.04725456237792969, -0.040882110595703125, -0.03450965881347656, -0.02813720703125, -0.021764755249023438, -0.015392303466796875, -0.009019851684570312, -0.00264739990234375, 0.0037250518798828125, 0.010097503662109375, 0.016469955444335938, 0.0228424072265625, 0.029214859008789062, 0.035587310791015625, 0.04195976257324219, 0.04833221435546875, 0.05470466613769531, 0.061077117919921875, 0.06744956970214844, 0.073822021484375, 0.08019447326660156, 0.08656692504882812, 0.09293937683105469, 0.09931182861328125, 0.10568428039550781, 0.11205673217773438, 0.11842918395996094, 0.1248016357421875, 0.13117408752441406, 0.13754653930664062, 0.1439189910888672, 0.15029144287109375, 0.1566638946533203, 0.16303634643554688, 0.16940879821777344, 0.17578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 11.0, 17.0, 39.0, 49.0, 78.0, 82.0, 99.0, 150.0, 132.0, 98.0, 88.0, 54.0, 40.0, 31.0, 16.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0263519287109375, -0.025025129318237305, -0.02369832992553711, -0.022371530532836914, -0.02104473114013672, -0.019717931747436523, -0.018391132354736328, -0.017064332962036133, -0.015737533569335938, -0.014410734176635742, -0.013083934783935547, -0.011757135391235352, -0.010430335998535156, -0.009103536605834961, -0.007776737213134766, -0.00644993782043457, -0.005123138427734375, -0.0037963390350341797, -0.0024695396423339844, -0.001142740249633789, 0.00018405914306640625, 0.0015108585357666016, 0.002837657928466797, 0.004164457321166992, 0.0054912567138671875, 0.006818056106567383, 0.008144855499267578, 0.009471654891967773, 0.010798454284667969, 0.012125253677368164, 0.01345205307006836, 0.014778852462768555, 0.01610565185546875, 0.017432451248168945, 0.01875925064086914, 0.020086050033569336, 0.02141284942626953, 0.022739648818969727, 0.024066448211669922, 0.025393247604370117, 0.026720046997070312, 0.028046846389770508, 0.029373645782470703, 0.0307004451751709, 0.032027244567871094, 0.03335404396057129, 0.034680843353271484, 0.03600764274597168, 0.037334442138671875, 0.03866124153137207, 0.039988040924072266, 0.04131484031677246, 0.042641639709472656, 0.04396843910217285, 0.04529523849487305, 0.04662203788757324, 0.04794883728027344, 0.04927563667297363, 0.05060243606567383, 0.05192923545837402, 0.05325603485107422, 0.054582834243774414, 0.05590963363647461, 0.057236433029174805, 0.058563232421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 13.0, 9.0, 14.0, 25.0, 34.0, 51.0, 110.0, 199.0, 437.0, 1060.0, 3563.0, 14797.0, 92985.0, 729888.0, 175133.0, 22524.0, 5088.0, 1506.0, 537.0, 244.0, 132.0, 58.0, 38.0, 29.0, 18.0, 9.0, 10.0, 8.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1529541015625, -0.14796066284179688, -0.14296722412109375, -0.13797378540039062, -0.1329803466796875, -0.12798690795898438, -0.12299346923828125, -0.11800003051757812, -0.113006591796875, -0.10801315307617188, -0.10301971435546875, -0.09802627563476562, -0.0930328369140625, -0.08803939819335938, -0.08304595947265625, -0.07805252075195312, -0.07305908203125, -0.06806564331054688, -0.06307220458984375, -0.058078765869140625, -0.0530853271484375, -0.048091888427734375, -0.04309844970703125, -0.038105010986328125, -0.033111572265625, -0.028118133544921875, -0.02312469482421875, -0.018131256103515625, -0.0131378173828125, -0.008144378662109375, -0.00315093994140625, 0.001842498779296875, 0.0068359375, 0.011829376220703125, 0.01682281494140625, 0.021816253662109375, 0.0268096923828125, 0.031803131103515625, 0.03679656982421875, 0.041790008544921875, 0.046783447265625, 0.051776885986328125, 0.05677032470703125, 0.061763763427734375, 0.0667572021484375, 0.07175064086914062, 0.07674407958984375, 0.08173751831054688, 0.08673095703125, 0.09172439575195312, 0.09671783447265625, 0.10171127319335938, 0.1067047119140625, 0.11169815063476562, 0.11669158935546875, 0.12168502807617188, 0.126678466796875, 0.13167190551757812, 0.13666534423828125, 0.14165878295898438, 0.1466522216796875, 0.15164566040039062, 0.15663909912109375, 0.16163253784179688, 0.1666259765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 9.0, 7.0, 5.0, 8.0, 11.0, 17.0, 11.0, 21.0, 29.0, 29.0, 38.0, 35.0, 44.0, 55.0, 65.0, 62.0, 53.0, 55.0, 60.0, 66.0, 53.0, 52.0, 36.0, 24.0, 32.0, 21.0, 20.0, 25.0, 14.0, 15.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09063720703125, -0.08772659301757812, -0.08481597900390625, -0.08190536499023438, -0.0789947509765625, -0.07608413696289062, -0.07317352294921875, -0.07026290893554688, -0.067352294921875, -0.06444168090820312, -0.06153106689453125, -0.058620452880859375, -0.0557098388671875, -0.052799224853515625, -0.04988861083984375, -0.046977996826171875, -0.0440673828125, -0.041156768798828125, -0.03824615478515625, -0.035335540771484375, -0.0324249267578125, -0.029514312744140625, -0.02660369873046875, -0.023693084716796875, -0.020782470703125, -0.017871856689453125, -0.01496124267578125, -0.012050628662109375, -0.0091400146484375, -0.006229400634765625, -0.00331878662109375, -0.000408172607421875, 0.00250244140625, 0.005413055419921875, 0.00832366943359375, 0.011234283447265625, 0.0141448974609375, 0.017055511474609375, 0.01996612548828125, 0.022876739501953125, 0.025787353515625, 0.028697967529296875, 0.03160858154296875, 0.034519195556640625, 0.0374298095703125, 0.040340423583984375, 0.04325103759765625, 0.046161651611328125, 0.049072265625, 0.051982879638671875, 0.05489349365234375, 0.057804107666015625, 0.0607147216796875, 0.06362533569335938, 0.06653594970703125, 0.06944656372070312, 0.072357177734375, 0.07526779174804688, 0.07817840576171875, 0.08108901977539062, 0.0839996337890625, 0.08691024780273438, 0.08982086181640625, 0.09273147583007812, 0.09564208984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 5.0, 5.0, 14.0, 18.0, 38.0, 81.0, 150.0, 505.0, 1637.0, 11071.0, 872539.0, 156204.0, 4784.0, 925.0, 293.0, 137.0, 72.0, 28.0, 13.0, 14.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.123046875, -0.11877632141113281, -0.11450576782226562, -0.11023521423339844, -0.10596466064453125, -0.10169410705566406, -0.09742355346679688, -0.09315299987792969, -0.0888824462890625, -0.08461189270019531, -0.08034133911132812, -0.07607078552246094, -0.07180023193359375, -0.06752967834472656, -0.06325912475585938, -0.05898857116699219, -0.054718017578125, -0.05044746398925781, -0.046176910400390625, -0.04190635681152344, -0.03763580322265625, -0.03336524963378906, -0.029094696044921875, -0.024824142456054688, -0.0205535888671875, -0.016283035278320312, -0.012012481689453125, -0.0077419281005859375, -0.00347137451171875, 0.0007991790771484375, 0.005069732666015625, 0.009340286254882812, 0.01361083984375, 0.017881393432617188, 0.022151947021484375, 0.026422500610351562, 0.03069305419921875, 0.03496360778808594, 0.039234161376953125, 0.04350471496582031, 0.0477752685546875, 0.05204582214355469, 0.056316375732421875, 0.06058692932128906, 0.06485748291015625, 0.06912803649902344, 0.07339859008789062, 0.07766914367675781, 0.081939697265625, 0.08621025085449219, 0.09048080444335938, 0.09475135803222656, 0.09902191162109375, 0.10329246520996094, 0.10756301879882812, 0.11183357238769531, 0.1161041259765625, 0.12037467956542969, 0.12464523315429688, 0.12891578674316406, 0.13318634033203125, 0.13745689392089844, 0.14172744750976562, 0.1459980010986328, 0.1502685546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 7.0, 16.0, 18.0, 16.0, 26.0, 26.0, 24.0, 39.0, 36.0, 39.0, 54.0, 47.0, 55.0, 64.0, 52.0, 88.0, 45.0, 40.0, 40.0, 35.0, 33.0, 45.0, 23.0, 19.0, 20.0, 17.0, 9.0, 15.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.450580596923828e-06, -7.2503462433815e-06, -7.050111889839172e-06, -6.8498775362968445e-06, -6.649643182754517e-06, -6.449408829212189e-06, -6.249174475669861e-06, -6.048940122127533e-06, -5.848705768585205e-06, -5.648471415042877e-06, -5.448237061500549e-06, -5.2480027079582214e-06, -5.0477683544158936e-06, -4.847534000873566e-06, -4.647299647331238e-06, -4.44706529378891e-06, -4.246830940246582e-06, -4.046596586704254e-06, -3.846362233161926e-06, -3.6461278796195984e-06, -3.4458935260772705e-06, -3.2456591725349426e-06, -3.0454248189926147e-06, -2.845190465450287e-06, -2.644956111907959e-06, -2.444721758365631e-06, -2.2444874048233032e-06, -2.0442530512809753e-06, -1.8440186977386475e-06, -1.6437843441963196e-06, -1.4435499906539917e-06, -1.2433156371116638e-06, -1.043081283569336e-06, -8.428469300270081e-07, -6.426125764846802e-07, -4.423782229423523e-07, -2.421438694000244e-07, -4.190951585769653e-08, 1.5832483768463135e-07, 3.5855919122695923e-07, 5.587935447692871e-07, 7.59027898311615e-07, 9.592622518539429e-07, 1.1594966053962708e-06, 1.3597309589385986e-06, 1.5599653124809265e-06, 1.7601996660232544e-06, 1.9604340195655823e-06, 2.16066837310791e-06, 2.360902726650238e-06, 2.561137080192566e-06, 2.761371433734894e-06, 2.9616057872772217e-06, 3.1618401408195496e-06, 3.3620744943618774e-06, 3.5623088479042053e-06, 3.762543201446533e-06, 3.962777554988861e-06, 4.163011908531189e-06, 4.363246262073517e-06, 4.563480615615845e-06, 4.763714969158173e-06, 4.9639493227005005e-06, 5.164183676242828e-06, 5.364418029785156e-06]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 11.0, 13.0, 22.0, 21.0, 51.0, 71.0, 158.0, 238.0, 612.0, 1887.0, 10347.0, 246342.0, 760571.0, 23330.0, 3273.0, 861.0, 342.0, 150.0, 82.0, 57.0, 36.0, 24.0, 15.0, 12.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06903076171875, -0.06639385223388672, -0.06375694274902344, -0.061120033264160156, -0.058483123779296875, -0.055846214294433594, -0.05320930480957031, -0.05057239532470703, -0.04793548583984375, -0.04529857635498047, -0.04266166687011719, -0.040024757385253906, -0.037387847900390625, -0.034750938415527344, -0.03211402893066406, -0.02947711944580078, -0.0268402099609375, -0.02420330047607422, -0.021566390991210938, -0.018929481506347656, -0.016292572021484375, -0.013655662536621094, -0.011018753051757812, -0.008381843566894531, -0.00574493408203125, -0.0031080245971679688, -0.0004711151123046875, 0.0021657943725585938, 0.004802703857421875, 0.007439613342285156, 0.010076522827148438, 0.012713432312011719, 0.015350341796875, 0.01798725128173828, 0.020624160766601562, 0.023261070251464844, 0.025897979736328125, 0.028534889221191406, 0.031171798706054688, 0.03380870819091797, 0.03644561767578125, 0.03908252716064453, 0.04171943664550781, 0.044356346130371094, 0.046993255615234375, 0.049630165100097656, 0.05226707458496094, 0.05490398406982422, 0.0575408935546875, 0.06017780303955078, 0.06281471252441406, 0.06545162200927734, 0.06808853149414062, 0.0707254409790039, 0.07336235046386719, 0.07599925994873047, 0.07863616943359375, 0.08127307891845703, 0.08390998840332031, 0.0865468978881836, 0.08918380737304688, 0.09182071685791016, 0.09445762634277344, 0.09709453582763672, 0.0997314453125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 7.0, 9.0, 15.0, 15.0, 24.0, 34.0, 57.0, 85.0, 83.0, 107.0, 121.0, 116.0, 102.0, 72.0, 40.0, 30.0, 19.0, 18.0, 15.0, 12.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046173095703125, -0.04455280303955078, -0.04293251037597656, -0.041312217712402344, -0.039691925048828125, -0.038071632385253906, -0.03645133972167969, -0.03483104705810547, -0.03321075439453125, -0.03159046173095703, -0.029970169067382812, -0.028349876403808594, -0.026729583740234375, -0.025109291076660156, -0.023488998413085938, -0.02186870574951172, -0.0202484130859375, -0.01862812042236328, -0.017007827758789062, -0.015387535095214844, -0.013767242431640625, -0.012146949768066406, -0.010526657104492188, -0.008906364440917969, -0.00728607177734375, -0.005665779113769531, -0.0040454864501953125, -0.0024251937866210938, -0.000804901123046875, 0.0008153915405273438, 0.0024356842041015625, 0.004055976867675781, 0.00567626953125, 0.007296562194824219, 0.008916854858398438, 0.010537147521972656, 0.012157440185546875, 0.013777732849121094, 0.015398025512695312, 0.01701831817626953, 0.01863861083984375, 0.02025890350341797, 0.021879196166992188, 0.023499488830566406, 0.025119781494140625, 0.026740074157714844, 0.028360366821289062, 0.02998065948486328, 0.0316009521484375, 0.03322124481201172, 0.03484153747558594, 0.036461830139160156, 0.038082122802734375, 0.039702415466308594, 0.04132270812988281, 0.04294300079345703, 0.04456329345703125, 0.04618358612060547, 0.04780387878417969, 0.049424171447753906, 0.051044464111328125, 0.052664756774902344, 0.05428504943847656, 0.05590534210205078, 0.057525634765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 10.0, 30.0, 106.0, 388.0, 332.0, 96.0, 24.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1637670993804932, -1.1189684867858887, -1.0741699934005737, -1.0293713808059692, -0.9845727682113647, -0.939774215221405, -0.8949756622314453, -0.8501770496368408, -0.8053784966468811, -0.7605799436569214, -0.7157813310623169, -0.6709827780723572, -0.6261842250823975, -0.581385612487793, -0.5365870594978333, -0.49178847670555115, -0.44698989391326904, -0.40219131112098694, -0.35739272832870483, -0.3125941753387451, -0.267795592546463, -0.2229970097541809, -0.1781984567642212, -0.1333998739719391, -0.08860129117965698, -0.043802715837955475, 0.0009958595037460327, 0.04579442739486694, 0.09059301018714905, 0.13539159297943115, 0.18019014596939087, 0.22498872876167297, 0.2697873115539551, 0.3145858943462372, 0.3593844771385193, 0.404183030128479, 0.4489816129207611, 0.4937801957130432, 0.5385787487030029, 0.5833773612976074, 0.6281759142875671, 0.6729744672775269, 0.7177730798721313, 0.7625716328620911, 0.8073701858520508, 0.8521687984466553, 0.896967351436615, 0.9417659044265747, 0.9865645170211792, 1.0313631296157837, 1.0761616230010986, 1.1209602355957031, 1.1657588481903076, 1.210557460784912, 1.255355954170227, 1.3001545667648315, 1.3449530601501465, 1.389751672744751, 1.434550166130066, 1.4793487787246704, 1.524147391319275, 1.5689458847045898, 1.6137444972991943, 1.6585431098937988, 1.7033417224884033]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 2.0, 4.0, 7.0, 9.0, 17.0, 14.0, 18.0, 18.0, 28.0, 25.0, 36.0, 48.0, 41.0, 51.0, 50.0, 56.0, 71.0, 50.0, 59.0, 39.0, 46.0, 47.0, 38.0, 26.0, 31.0, 27.0, 24.0, 23.0, 25.0, 15.0, 8.0, 9.0, 11.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48197221755981445, -0.46676188707351685, -0.45155155658721924, -0.43634122610092163, -0.421130895614624, -0.4059205651283264, -0.3907102048397064, -0.3754998743534088, -0.3602895438671112, -0.3450792133808136, -0.329868882894516, -0.3146585524082184, -0.2994481921195984, -0.2842378616333008, -0.2690275311470032, -0.25381720066070557, -0.23860687017440796, -0.22339653968811035, -0.20818620920181274, -0.19297586381435394, -0.17776553332805634, -0.16255520284175873, -0.14734485745429993, -0.13213452696800232, -0.11692419648170471, -0.1017138659954071, -0.0865035280585289, -0.0712931901216507, -0.05608285963535309, -0.04087252914905548, -0.025662191212177277, -0.010451853275299072, 0.004758477210998535, 0.01996881142258644, 0.03517914563417435, 0.05038947984576225, 0.06559981405735016, 0.08081014454364777, 0.09602048248052597, 0.11123082041740417, 0.12644115090370178, 0.1416514813899994, 0.156861811876297, 0.1720721572637558, 0.1872824877500534, 0.202492818236351, 0.21770316362380981, 0.23291349411010742, 0.24812382459640503, 0.26333415508270264, 0.27854448556900024, 0.29375481605529785, 0.30896514654159546, 0.32417547702789307, 0.33938583731651306, 0.35459616780281067, 0.3698064982891083, 0.3850168287754059, 0.4002271592617035, 0.4154374897480011, 0.4306478500366211, 0.4458581805229187, 0.4610685110092163, 0.4762788414955139, 0.4914891719818115]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 7.0, 9.0, 12.0, 5.0, 18.0, 33.0, 59.0, 108.0, 187.0, 290.0, 692.0, 1571.0, 4289.0, 16398.0, 140189.0, 3856591.0, 148783.0, 16629.0, 4498.0, 1684.0, 870.0, 469.0, 263.0, 174.0, 112.0, 86.0, 55.0, 44.0, 30.0, 28.0, 22.0, 20.0, 7.0, 13.0, 7.0, 9.0, 5.0, 1.0, 3.0, 5.0, 0.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.1160888671875, -0.11069297790527344, -0.10529708862304688, -0.09990119934082031, -0.09450531005859375, -0.08910942077636719, -0.08371353149414062, -0.07831764221191406, -0.0729217529296875, -0.06752586364746094, -0.062129974365234375, -0.05673408508300781, -0.05133819580078125, -0.04594230651855469, -0.040546417236328125, -0.03515052795410156, -0.029754638671875, -0.024358749389648438, -0.018962860107421875, -0.013566970825195312, -0.00817108154296875, -0.0027751922607421875, 0.002620697021484375, 0.008016586303710938, 0.0134124755859375, 0.018808364868164062, 0.024204254150390625, 0.029600143432617188, 0.03499603271484375, 0.04039192199707031, 0.045787811279296875, 0.05118370056152344, 0.05657958984375, 0.06197547912597656, 0.06737136840820312, 0.07276725769042969, 0.07816314697265625, 0.08355903625488281, 0.08895492553710938, 0.09435081481933594, 0.0997467041015625, 0.10514259338378906, 0.11053848266601562, 0.11593437194824219, 0.12133026123046875, 0.1267261505126953, 0.13212203979492188, 0.13751792907714844, 0.142913818359375, 0.14830970764160156, 0.15370559692382812, 0.1591014862060547, 0.16449737548828125, 0.1698932647705078, 0.17528915405273438, 0.18068504333496094, 0.1860809326171875, 0.19147682189941406, 0.19687271118164062, 0.2022686004638672, 0.20766448974609375, 0.2130603790283203, 0.21845626831054688, 0.22385215759277344, 0.229248046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 16.0, 28.0, 42.0, 48.0, 82.0, 77.0, 107.0, 133.0, 105.0, 96.0, 76.0, 60.0, 47.0, 31.0, 14.0, 10.0, 6.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0208740234375, -0.019629478454589844, -0.018384933471679688, -0.01714038848876953, -0.015895843505859375, -0.014651298522949219, -0.013406753540039062, -0.012162208557128906, -0.01091766357421875, -0.009673118591308594, -0.008428573608398438, -0.007184028625488281, -0.005939483642578125, -0.004694938659667969, -0.0034503936767578125, -0.0022058486938476562, -0.0009613037109375, 0.00028324127197265625, 0.0015277862548828125, 0.0027723312377929688, 0.004016876220703125, 0.005261421203613281, 0.0065059661865234375, 0.007750511169433594, 0.00899505615234375, 0.010239601135253906, 0.011484146118164062, 0.012728691101074219, 0.013973236083984375, 0.015217781066894531, 0.016462326049804688, 0.017706871032714844, 0.018951416015625, 0.020195960998535156, 0.021440505981445312, 0.02268505096435547, 0.023929595947265625, 0.02517414093017578, 0.026418685913085938, 0.027663230895996094, 0.02890777587890625, 0.030152320861816406, 0.03139686584472656, 0.03264141082763672, 0.033885955810546875, 0.03513050079345703, 0.03637504577636719, 0.037619590759277344, 0.0388641357421875, 0.040108680725097656, 0.04135322570800781, 0.04259777069091797, 0.043842315673828125, 0.04508686065673828, 0.04633140563964844, 0.047575950622558594, 0.04882049560546875, 0.050065040588378906, 0.05130958557128906, 0.05255413055419922, 0.053798675537109375, 0.05504322052001953, 0.05628776550292969, 0.057532310485839844, 0.05877685546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 12.0, 25.0, 50.0, 77.0, 99.0, 163.0, 434.0, 344738.0, 3847920.0, 460.0, 144.0, 67.0, 43.0, 27.0, 10.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.189453125, -2.1447982788085938, -2.1001434326171875, -2.0554885864257812, -2.010833740234375, -1.9661788940429688, -1.9215240478515625, -1.8768692016601562, -1.83221435546875, -1.7875595092773438, -1.7429046630859375, -1.6982498168945312, -1.653594970703125, -1.6089401245117188, -1.5642852783203125, -1.5196304321289062, -1.4749755859375, -1.4303207397460938, -1.3856658935546875, -1.3410110473632812, -1.296356201171875, -1.2517013549804688, -1.2070465087890625, -1.1623916625976562, -1.11773681640625, -1.0730819702148438, -1.0284271240234375, -0.9837722778320312, -0.939117431640625, -0.8944625854492188, -0.8498077392578125, -0.8051528930664062, -0.760498046875, -0.7158432006835938, -0.6711883544921875, -0.6265335083007812, -0.581878662109375, -0.5372238159179688, -0.4925689697265625, -0.44791412353515625, -0.40325927734375, -0.35860443115234375, -0.3139495849609375, -0.26929473876953125, -0.224639892578125, -0.17998504638671875, -0.1353302001953125, -0.09067535400390625, -0.0460205078125, -0.00136566162109375, 0.0432891845703125, 0.08794403076171875, 0.132598876953125, 0.17725372314453125, 0.2219085693359375, 0.26656341552734375, 0.31121826171875, 0.35587310791015625, 0.4005279541015625, 0.44518280029296875, 0.489837646484375, 0.5344924926757812, 0.5791473388671875, 0.6238021850585938, 0.66845703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 12.0, 119.0, 3427.0, 475.0, 40.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333740234375, -0.3274106979370117, -0.32108116149902344, -0.31475162506103516, -0.3084220886230469, -0.3020925521850586, -0.2957630157470703, -0.28943347930908203, -0.28310394287109375, -0.27677440643310547, -0.2704448699951172, -0.2641153335571289, -0.2577857971191406, -0.25145626068115234, -0.24512672424316406, -0.23879718780517578, -0.2324676513671875, -0.22613811492919922, -0.21980857849121094, -0.21347904205322266, -0.20714950561523438, -0.2008199691772461, -0.1944904327392578, -0.18816089630126953, -0.18183135986328125, -0.17550182342529297, -0.1691722869873047, -0.1628427505493164, -0.15651321411132812, -0.15018367767333984, -0.14385414123535156, -0.13752460479736328, -0.131195068359375, -0.12486553192138672, -0.11853599548339844, -0.11220645904541016, -0.10587692260742188, -0.0995473861694336, -0.09321784973144531, -0.08688831329345703, -0.08055877685546875, -0.07422924041748047, -0.06789970397949219, -0.061570167541503906, -0.055240631103515625, -0.048911094665527344, -0.04258155822753906, -0.03625202178955078, -0.0299224853515625, -0.02359294891357422, -0.017263412475585938, -0.010933876037597656, -0.004604339599609375, 0.0017251968383789062, 0.008054733276367188, 0.014384269714355469, 0.02071380615234375, 0.02704334259033203, 0.03337287902832031, 0.039702415466308594, 0.046031951904296875, 0.052361488342285156, 0.05869102478027344, 0.06502056121826172, 0.07135009765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 9.0, 983.0, 24.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3385868072509766, -2.2248640060424805, -2.1111412048339844, -1.9974181652069092, -1.883695363998413, -1.769972562789917, -1.6562496423721313, -1.5425267219543457, -1.4288039207458496, -1.3150811195373535, -1.2013581991195679, -1.0876352787017822, -0.9739124774932861, -0.8601896166801453, -0.7464667558670044, -0.6327438950538635, -0.5190210342407227, -0.4052981734275818, -0.2915753126144409, -0.17785245180130005, -0.06412959098815918, 0.04959326982498169, 0.16331613063812256, 0.2770389914512634, 0.3907618522644043, 0.5044847130775452, 0.618207573890686, 0.7319304347038269, 0.8456532955169678, 0.9593761563301086, 1.0730990171432495, 1.1868219375610352, 1.3005447387695312, 1.4142675399780273, 1.527990460395813, 1.6417133808135986, 1.7554361820220947, 1.8691589832305908, 1.9828819036483765, 2.096604824066162, 2.210327625274658, 2.3240504264831543, 2.4377732276916504, 2.5514962673187256, 2.6652190685272217, 2.7789418697357178, 2.892664909362793, 3.006387710571289, 3.120110511779785, 3.2338333129882812, 3.3475561141967773, 3.4612791538238525, 3.5750019550323486, 3.6887247562408447, 3.80244779586792, 3.916170597076416, 4.029893398284912, 4.143616199493408, 4.257339000701904, 4.3710618019104, 4.484785079956055, 4.598507881164551, 4.712230682373047, 4.825953483581543, 4.939676284790039]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 26.0, 55.0, 105.0, 157.0, 204.0, 175.0, 133.0, 94.0, 34.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4285390377044678, -0.41109713912010193, -0.3936552405357361, -0.37621334195137024, -0.3587714433670044, -0.34132957458496094, -0.3238876760005951, -0.30644577741622925, -0.2890038788318634, -0.27156198024749756, -0.2541200816631317, -0.23667819797992706, -0.21923629939556122, -0.20179440081119537, -0.18435251712799072, -0.16691061854362488, -0.14946871995925903, -0.1320268213748932, -0.11458493024110794, -0.09714303910732269, -0.07970114052295685, -0.062259241938591, -0.044817350804805756, -0.027375459671020508, -0.009933561086654663, 0.007508333772420883, 0.02495022863149643, 0.042392123490571976, 0.05983401834964752, 0.07727591693401337, 0.09471780806779861, 0.11215969920158386, 0.12960165739059448, 0.14704355597496033, 0.16448545455932617, 0.18192733824253082, 0.19936923682689667, 0.2168111354112625, 0.23425301909446716, 0.251694917678833, 0.26913681626319885, 0.2865787148475647, 0.30402061343193054, 0.3214625120162964, 0.33890438079833984, 0.3563463091850281, 0.37378817796707153, 0.3912300765514374, 0.4086719751358032, 0.42611387372016907, 0.4435557723045349, 0.46099767088890076, 0.4784395694732666, 0.49588143825531006, 0.5133233666419983, 0.5307652354240417, 0.54820716381073, 0.5656490325927734, 0.5830909609794617, 0.6005328297615051, 0.6179747581481934, 0.6354166269302368, 0.652858555316925, 0.6703004240989685, 0.687742292881012]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 2.0, 15.0, 5.0, 10.0, 19.0, 23.0, 34.0, 51.0, 64.0, 98.0, 132.0, 245.0, 378.0, 696.0, 1478.0, 4193.0, 15914.0, 85418.0, 601999.0, 284470.0, 39475.0, 8862.0, 2629.0, 1050.0, 485.0, 302.0, 159.0, 104.0, 69.0, 46.0, 41.0, 21.0, 14.0, 19.0, 9.0, 8.0, 7.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.14066314697265625, -0.1359405517578125, -0.13121795654296875, -0.126495361328125, -0.12177276611328125, -0.1170501708984375, -0.11232757568359375, -0.10760498046875, -0.10288238525390625, -0.0981597900390625, -0.09343719482421875, -0.088714599609375, -0.08399200439453125, -0.0792694091796875, -0.07454681396484375, -0.06982421875, -0.06510162353515625, -0.0603790283203125, -0.05565643310546875, -0.050933837890625, -0.04621124267578125, -0.0414886474609375, -0.03676605224609375, -0.03204345703125, -0.02732086181640625, -0.0225982666015625, -0.01787567138671875, -0.013153076171875, -0.00843048095703125, -0.0037078857421875, 0.00101470947265625, 0.0057373046875, 0.01045989990234375, 0.0151824951171875, 0.01990509033203125, 0.024627685546875, 0.02935028076171875, 0.0340728759765625, 0.03879547119140625, 0.04351806640625, 0.04824066162109375, 0.0529632568359375, 0.05768585205078125, 0.062408447265625, 0.06713104248046875, 0.0718536376953125, 0.07657623291015625, 0.081298828125, 0.08602142333984375, 0.0907440185546875, 0.09546661376953125, 0.100189208984375, 0.10491180419921875, 0.1096343994140625, 0.11435699462890625, 0.11907958984375, 0.12380218505859375, 0.1285247802734375, 0.13324737548828125, 0.137969970703125, 0.14269256591796875, 0.1474151611328125, 0.15213775634765625, 0.1568603515625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 23.0, 23.0, 40.0, 56.0, 64.0, 75.0, 81.0, 104.0, 100.0, 93.0, 88.0, 63.0, 49.0, 42.0, 28.0, 21.0, 17.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0225982666015625, -0.02158379554748535, -0.020569324493408203, -0.019554853439331055, -0.018540382385253906, -0.017525911331176758, -0.01651144027709961, -0.015496969223022461, -0.014482498168945312, -0.013468027114868164, -0.012453556060791016, -0.011439085006713867, -0.010424613952636719, -0.00941014289855957, -0.008395671844482422, -0.0073812007904052734, -0.006366729736328125, -0.0053522586822509766, -0.004337787628173828, -0.0033233165740966797, -0.0023088455200195312, -0.0012943744659423828, -0.0002799034118652344, 0.0007345676422119141, 0.0017490386962890625, 0.002763509750366211, 0.0037779808044433594, 0.004792451858520508, 0.005806922912597656, 0.006821393966674805, 0.007835865020751953, 0.008850336074829102, 0.00986480712890625, 0.010879278182983398, 0.011893749237060547, 0.012908220291137695, 0.013922691345214844, 0.014937162399291992, 0.01595163345336914, 0.01696610450744629, 0.017980575561523438, 0.018995046615600586, 0.020009517669677734, 0.021023988723754883, 0.02203845977783203, 0.02305293083190918, 0.024067401885986328, 0.025081872940063477, 0.026096343994140625, 0.027110815048217773, 0.028125286102294922, 0.02913975715637207, 0.03015422821044922, 0.031168699264526367, 0.032183170318603516, 0.033197641372680664, 0.03421211242675781, 0.03522658348083496, 0.03624105453491211, 0.03725552558898926, 0.038269996643066406, 0.039284467697143555, 0.0402989387512207, 0.04131340980529785, 0.042327880859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 11.0, 24.0, 32.0, 32.0, 55.0, 83.0, 146.0, 279.0, 550.0, 1141.0, 2753.0, 8324.0, 33027.0, 226226.0, 647993.0, 99742.0, 18808.0, 5474.0, 1989.0, 857.0, 414.0, 220.0, 136.0, 62.0, 38.0, 36.0, 21.0, 18.0, 9.0, 3.0, 6.0, 4.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1171875, -0.11304855346679688, -0.10890960693359375, -0.10477066040039062, -0.1006317138671875, -0.09649276733398438, -0.09235382080078125, -0.08821487426757812, -0.084075927734375, -0.07993698120117188, -0.07579803466796875, -0.07165908813476562, -0.0675201416015625, -0.06338119506835938, -0.05924224853515625, -0.055103302001953125, -0.05096435546875, -0.046825408935546875, -0.04268646240234375, -0.038547515869140625, -0.0344085693359375, -0.030269622802734375, -0.02613067626953125, -0.021991729736328125, -0.017852783203125, -0.013713836669921875, -0.00957489013671875, -0.005435943603515625, -0.0012969970703125, 0.002841949462890625, 0.00698089599609375, 0.011119842529296875, 0.0152587890625, 0.019397735595703125, 0.02353668212890625, 0.027675628662109375, 0.0318145751953125, 0.035953521728515625, 0.04009246826171875, 0.044231414794921875, 0.048370361328125, 0.052509307861328125, 0.05664825439453125, 0.060787200927734375, 0.0649261474609375, 0.06906509399414062, 0.07320404052734375, 0.07734298706054688, 0.08148193359375, 0.08562088012695312, 0.08975982666015625, 0.09389877319335938, 0.0980377197265625, 0.10217666625976562, 0.10631561279296875, 0.11045455932617188, 0.114593505859375, 0.11873245239257812, 0.12287139892578125, 0.12701034545898438, 0.1311492919921875, 0.13528823852539062, 0.13942718505859375, 0.14356613159179688, 0.147705078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 4.0, 14.0, 11.0, 12.0, 13.0, 14.0, 31.0, 20.0, 35.0, 42.0, 57.0, 66.0, 69.0, 51.0, 77.0, 64.0, 62.0, 48.0, 49.0, 47.0, 39.0, 31.0, 29.0, 20.0, 23.0, 16.0, 8.0, 11.0, 3.0, 6.0, 1.0, 6.0, 5.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08587646484375, -0.08277606964111328, -0.07967567443847656, -0.07657527923583984, -0.07347488403320312, -0.0703744888305664, -0.06727409362792969, -0.06417369842529297, -0.06107330322265625, -0.05797290802001953, -0.05487251281738281, -0.051772117614746094, -0.048671722412109375, -0.045571327209472656, -0.04247093200683594, -0.03937053680419922, -0.0362701416015625, -0.03316974639892578, -0.030069351196289062, -0.026968955993652344, -0.023868560791015625, -0.020768165588378906, -0.017667770385742188, -0.014567375183105469, -0.01146697998046875, -0.008366584777832031, -0.0052661895751953125, -0.0021657943725585938, 0.000934600830078125, 0.004034996032714844, 0.0071353912353515625, 0.010235786437988281, 0.013336181640625, 0.01643657684326172, 0.019536972045898438, 0.022637367248535156, 0.025737762451171875, 0.028838157653808594, 0.03193855285644531, 0.03503894805908203, 0.03813934326171875, 0.04123973846435547, 0.04434013366699219, 0.047440528869628906, 0.050540924072265625, 0.053641319274902344, 0.05674171447753906, 0.05984210968017578, 0.0629425048828125, 0.06604290008544922, 0.06914329528808594, 0.07224369049072266, 0.07534408569335938, 0.0784444808959961, 0.08154487609863281, 0.08464527130126953, 0.08774566650390625, 0.09084606170654297, 0.09394645690917969, 0.0970468521118164, 0.10014724731445312, 0.10324764251708984, 0.10634803771972656, 0.10944843292236328, 0.112548828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 6.0, 16.0, 29.0, 30.0, 77.0, 136.0, 220.0, 399.0, 819.0, 2308.0, 11705.0, 269234.0, 733091.0, 24695.0, 3552.0, 1134.0, 490.0, 264.0, 136.0, 68.0, 65.0, 33.0, 12.0, 5.0, 10.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.10894775390625, -0.10630083084106445, -0.1036539077758789, -0.10100698471069336, -0.09836006164550781, -0.09571313858032227, -0.09306621551513672, -0.09041929244995117, -0.08777236938476562, -0.08512544631958008, -0.08247852325439453, -0.07983160018920898, -0.07718467712402344, -0.07453775405883789, -0.07189083099365234, -0.0692439079284668, -0.06659698486328125, -0.0639500617980957, -0.061303138732910156, -0.05865621566772461, -0.05600929260253906, -0.053362369537353516, -0.05071544647216797, -0.04806852340698242, -0.045421600341796875, -0.04277467727661133, -0.04012775421142578, -0.037480831146240234, -0.03483390808105469, -0.03218698501586914, -0.029540061950683594, -0.026893138885498047, -0.0242462158203125, -0.021599292755126953, -0.018952369689941406, -0.01630544662475586, -0.013658523559570312, -0.011011600494384766, -0.008364677429199219, -0.005717754364013672, -0.003070831298828125, -0.0004239082336425781, 0.0022230148315429688, 0.004869937896728516, 0.0075168609619140625, 0.01016378402709961, 0.012810707092285156, 0.015457630157470703, 0.01810455322265625, 0.020751476287841797, 0.023398399353027344, 0.02604532241821289, 0.028692245483398438, 0.031339168548583984, 0.03398609161376953, 0.03663301467895508, 0.039279937744140625, 0.04192686080932617, 0.04457378387451172, 0.047220706939697266, 0.04986763000488281, 0.05251455307006836, 0.055161476135253906, 0.05780839920043945, 0.060455322265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 10.0, 20.0, 26.0, 41.0, 37.0, 78.0, 91.0, 68.0, 99.0, 90.0, 88.0, 112.0, 57.0, 61.0, 42.0, 26.0, 21.0, 10.0, 8.0, 11.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.417533874511719e-06, -9.082257747650146e-06, -8.746981620788574e-06, -8.411705493927002e-06, -8.07642936706543e-06, -7.741153240203857e-06, -7.405877113342285e-06, -7.070600986480713e-06, -6.735324859619141e-06, -6.400048732757568e-06, -6.064772605895996e-06, -5.729496479034424e-06, -5.3942203521728516e-06, -5.058944225311279e-06, -4.723668098449707e-06, -4.388391971588135e-06, -4.0531158447265625e-06, -3.7178397178649902e-06, -3.382563591003418e-06, -3.0472874641418457e-06, -2.7120113372802734e-06, -2.376735210418701e-06, -2.041459083557129e-06, -1.7061829566955566e-06, -1.3709068298339844e-06, -1.0356307029724121e-06, -7.003545761108398e-07, -3.650784492492676e-07, -2.9802322387695312e-08, 3.0547380447387695e-07, 6.407499313354492e-07, 9.760260581970215e-07, 1.3113021850585938e-06, 1.646578311920166e-06, 1.9818544387817383e-06, 2.3171305656433105e-06, 2.652406692504883e-06, 2.987682819366455e-06, 3.3229589462280273e-06, 3.6582350730895996e-06, 3.993511199951172e-06, 4.328787326812744e-06, 4.664063453674316e-06, 4.999339580535889e-06, 5.334615707397461e-06, 5.669891834259033e-06, 6.0051679611206055e-06, 6.340444087982178e-06, 6.67572021484375e-06, 7.010996341705322e-06, 7.3462724685668945e-06, 7.681548595428467e-06, 8.016824722290039e-06, 8.352100849151611e-06, 8.687376976013184e-06, 9.022653102874756e-06, 9.357929229736328e-06, 9.6932053565979e-06, 1.0028481483459473e-05, 1.0363757610321045e-05, 1.0699033737182617e-05, 1.103430986404419e-05, 1.1369585990905762e-05, 1.1704862117767334e-05, 1.2040138244628906e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 3.0, 5.0, 4.0, 9.0, 16.0, 26.0, 31.0, 64.0, 106.0, 225.0, 515.0, 1525.0, 7237.0, 149597.0, 849834.0, 34048.0, 3617.0, 962.0, 355.0, 162.0, 73.0, 52.0, 31.0, 24.0, 11.0, 9.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.0687112808227539, -0.06619453430175781, -0.06367778778076172, -0.061161041259765625, -0.05864429473876953, -0.05612754821777344, -0.053610801696777344, -0.05109405517578125, -0.048577308654785156, -0.04606056213378906, -0.04354381561279297, -0.041027069091796875, -0.03851032257080078, -0.03599357604980469, -0.033476829528808594, -0.0309600830078125, -0.028443336486816406, -0.025926589965820312, -0.02340984344482422, -0.020893096923828125, -0.01837635040283203, -0.015859603881835938, -0.013342857360839844, -0.01082611083984375, -0.008309364318847656, -0.0057926177978515625, -0.0032758712768554688, -0.000759124755859375, 0.0017576217651367188, 0.0042743682861328125, 0.006791114807128906, 0.009307861328125, 0.011824607849121094, 0.014341354370117188, 0.01685810089111328, 0.019374847412109375, 0.02189159393310547, 0.024408340454101562, 0.026925086975097656, 0.02944183349609375, 0.031958580017089844, 0.03447532653808594, 0.03699207305908203, 0.039508819580078125, 0.04202556610107422, 0.04454231262207031, 0.047059059143066406, 0.0495758056640625, 0.052092552185058594, 0.05460929870605469, 0.05712604522705078, 0.059642791748046875, 0.06215953826904297, 0.06467628479003906, 0.06719303131103516, 0.06970977783203125, 0.07222652435302734, 0.07474327087402344, 0.07726001739501953, 0.07977676391601562, 0.08229351043701172, 0.08481025695800781, 0.0873270034790039, 0.08984375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 10.0, 21.0, 19.0, 42.0, 37.0, 77.0, 94.0, 131.0, 119.0, 121.0, 87.0, 74.0, 47.0, 38.0, 19.0, 15.0, 13.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.046630859375, -0.044928550720214844, -0.04322624206542969, -0.04152393341064453, -0.039821624755859375, -0.03811931610107422, -0.03641700744628906, -0.034714698791503906, -0.03301239013671875, -0.031310081481933594, -0.029607772827148438, -0.02790546417236328, -0.026203155517578125, -0.02450084686279297, -0.022798538208007812, -0.021096229553222656, -0.0193939208984375, -0.017691612243652344, -0.015989303588867188, -0.014286994934082031, -0.012584686279296875, -0.010882377624511719, -0.009180068969726562, -0.007477760314941406, -0.00577545166015625, -0.004073143005371094, -0.0023708343505859375, -0.0006685256958007812, 0.001033782958984375, 0.0027360916137695312, 0.0044384002685546875, 0.006140708923339844, 0.007843017578125, 0.009545326232910156, 0.011247634887695312, 0.012949943542480469, 0.014652252197265625, 0.01635456085205078, 0.018056869506835938, 0.019759178161621094, 0.02146148681640625, 0.023163795471191406, 0.024866104125976562, 0.02656841278076172, 0.028270721435546875, 0.02997303009033203, 0.03167533874511719, 0.033377647399902344, 0.0350799560546875, 0.036782264709472656, 0.03848457336425781, 0.04018688201904297, 0.041889190673828125, 0.04359149932861328, 0.04529380798339844, 0.046996116638183594, 0.04869842529296875, 0.050400733947753906, 0.05210304260253906, 0.05380535125732422, 0.055507659912109375, 0.05720996856689453, 0.05891227722167969, 0.060614585876464844, 0.06231689453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 9.0, 9.0, 36.0, 59.0, 128.0, 219.0, 239.0, 147.0, 77.0, 32.0, 20.0, 10.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5815286636352539, -0.5524561405181885, -0.523383617401123, -0.49431106448173523, -0.4652385115623474, -0.436165988445282, -0.40709346532821655, -0.37802091240882874, -0.3489483594894409, -0.3198758363723755, -0.29080328345298767, -0.26173076033592224, -0.23265820741653442, -0.203585684299469, -0.17451314628124237, -0.14544060826301575, -0.11636808514595032, -0.0872955471277237, -0.05822301283478737, -0.029150478541851044, -7.794052362442017e-05, 0.028994590044021606, 0.05806712806224823, 0.08713966608047485, 0.11621220409870148, 0.1452847421169281, 0.17435728013515472, 0.20342981815338135, 0.23250234127044678, 0.2615748643875122, 0.2906474173069, 0.31971997022628784, 0.34879249334335327, 0.3778650164604187, 0.4069375693798065, 0.43601009249687195, 0.46508264541625977, 0.4941551685333252, 0.5232276916503906, 0.552300214767456, 0.5813727974891663, 0.6104453206062317, 0.6395178437232971, 0.6685904264450073, 0.6976629495620728, 0.7267354726791382, 0.7558079957962036, 0.784880518913269, 0.8139530420303345, 0.8430255651473999, 0.8720980882644653, 0.9011706709861755, 0.930243194103241, 0.9593157172203064, 0.9883882403373718, 1.017460823059082, 1.0465333461761475, 1.075605869293213, 1.1046783924102783, 1.1337509155273438, 1.1628234386444092, 1.1918959617614746, 1.2209686040878296, 1.250041127204895, 1.2791136503219604]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 2.0, 7.0, 3.0, 13.0, 6.0, 9.0, 11.0, 17.0, 17.0, 18.0, 18.0, 33.0, 28.0, 35.0, 29.0, 46.0, 46.0, 48.0, 40.0, 37.0, 34.0, 48.0, 36.0, 51.0, 40.0, 38.0, 49.0, 25.0, 34.0, 32.0, 21.0, 15.0, 22.0, 19.0, 17.0, 15.0, 13.0, 7.0, 5.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4302947521209717, -0.4167306125164032, -0.4031664729118347, -0.3896023631095886, -0.37603822350502014, -0.36247408390045166, -0.34890997409820557, -0.3353458344936371, -0.3217816948890686, -0.3082175552845001, -0.29465341567993164, -0.28108930587768555, -0.26752516627311707, -0.2539610266685486, -0.2403969019651413, -0.226832777261734, -0.21326863765716553, -0.19970449805259705, -0.18614037334918976, -0.17257624864578247, -0.159012109041214, -0.1454479694366455, -0.13188384473323822, -0.11831971257925034, -0.10475558042526245, -0.09119144827127457, -0.07762731611728668, -0.0640631839632988, -0.05049905180931091, -0.03693491965532303, -0.023370787501335144, -0.00980665534734726, 0.003757476806640625, 0.01732160896062851, 0.030885741114616394, 0.04444987326860428, 0.05801400542259216, 0.07157813757658005, 0.08514226973056793, 0.09870640188455582, 0.1122705340385437, 0.12583467364311218, 0.13939879834651947, 0.15296292304992676, 0.16652706265449524, 0.18009120225906372, 0.193655326962471, 0.2072194516658783, 0.22078359127044678, 0.23434773087501526, 0.24791185557842255, 0.26147598028182983, 0.2750401198863983, 0.2886042594909668, 0.3021683692932129, 0.31573250889778137, 0.32929664850234985, 0.34286078810691833, 0.3564249277114868, 0.3699890375137329, 0.3835531771183014, 0.3971173167228699, 0.41068142652511597, 0.42424556612968445, 0.43780970573425293]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 5.0, 12.0, 16.0, 37.0, 37.0, 82.0, 142.0, 300.0, 563.0, 1275.0, 3608.0, 11754.0, 58955.0, 2442958.0, 1606814.0, 50584.0, 10607.0, 3502.0, 1398.0, 675.0, 340.0, 210.0, 124.0, 75.0, 66.0, 37.0, 22.0, 26.0, 14.0, 11.0, 8.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1551513671875, -0.14997482299804688, -0.14479827880859375, -0.13962173461914062, -0.1344451904296875, -0.12926864624023438, -0.12409210205078125, -0.11891555786132812, -0.113739013671875, -0.10856246948242188, -0.10338592529296875, -0.09820938110351562, -0.0930328369140625, -0.08785629272460938, -0.08267974853515625, -0.07750320434570312, -0.07232666015625, -0.06715011596679688, -0.06197357177734375, -0.056797027587890625, -0.0516204833984375, -0.046443939208984375, -0.04126739501953125, -0.036090850830078125, -0.030914306640625, -0.025737762451171875, -0.02056121826171875, -0.015384674072265625, -0.0102081298828125, -0.005031585693359375, 0.00014495849609375, 0.005321502685546875, 0.010498046875, 0.015674591064453125, 0.02085113525390625, 0.026027679443359375, 0.0312042236328125, 0.036380767822265625, 0.04155731201171875, 0.046733856201171875, 0.051910400390625, 0.057086944580078125, 0.06226348876953125, 0.06744003295898438, 0.0726165771484375, 0.07779312133789062, 0.08296966552734375, 0.08814620971679688, 0.09332275390625, 0.09849929809570312, 0.10367584228515625, 0.10885238647460938, 0.1140289306640625, 0.11920547485351562, 0.12438201904296875, 0.12955856323242188, 0.134735107421875, 0.13991165161132812, 0.14508819580078125, 0.15026473999023438, 0.1554412841796875, 0.16061782836914062, 0.16579437255859375, 0.17097091674804688, 0.1761474609375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 9.0, 18.0, 21.0, 39.0, 52.0, 57.0, 69.0, 99.0, 97.0, 99.0, 102.0, 86.0, 80.0, 47.0, 38.0, 36.0, 19.0, 14.0, 10.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0254058837890625, -0.024319887161254883, -0.023233890533447266, -0.02214789390563965, -0.02106189727783203, -0.019975900650024414, -0.018889904022216797, -0.01780390739440918, -0.016717910766601562, -0.015631914138793945, -0.014545917510986328, -0.013459920883178711, -0.012373924255371094, -0.011287927627563477, -0.01020193099975586, -0.009115934371948242, -0.008029937744140625, -0.006943941116333008, -0.005857944488525391, -0.0047719478607177734, -0.0036859512329101562, -0.002599954605102539, -0.0015139579772949219, -0.0004279613494873047, 0.0006580352783203125, 0.0017440319061279297, 0.002830028533935547, 0.003916025161743164, 0.005002021789550781, 0.0060880184173583984, 0.007174015045166016, 0.008260011672973633, 0.00934600830078125, 0.010432004928588867, 0.011518001556396484, 0.012603998184204102, 0.013689994812011719, 0.014775991439819336, 0.015861988067626953, 0.01694798469543457, 0.018033981323242188, 0.019119977951049805, 0.020205974578857422, 0.02129197120666504, 0.022377967834472656, 0.023463964462280273, 0.02454996109008789, 0.025635957717895508, 0.026721954345703125, 0.027807950973510742, 0.02889394760131836, 0.029979944229125977, 0.031065940856933594, 0.03215193748474121, 0.03323793411254883, 0.034323930740356445, 0.03540992736816406, 0.03649592399597168, 0.0375819206237793, 0.038667917251586914, 0.03975391387939453, 0.04083991050720215, 0.041925907135009766, 0.04301190376281738, 0.044097900390625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 7.0, 13.0, 25.0, 26.0, 45.0, 99.0, 169.0, 567.0, 2736.0, 20567.0, 4074971.0, 88580.0, 4936.0, 917.0, 300.0, 144.0, 66.0, 44.0, 27.0, 17.0, 12.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343994140625, -0.3320045471191406, -0.32001495361328125, -0.3080253601074219, -0.2960357666015625, -0.2840461730957031, -0.27205657958984375, -0.2600669860839844, -0.248077392578125, -0.23608779907226562, -0.22409820556640625, -0.21210861206054688, -0.2001190185546875, -0.18812942504882812, -0.17613983154296875, -0.16415023803710938, -0.15216064453125, -0.14017105102539062, -0.12818145751953125, -0.11619186401367188, -0.1042022705078125, -0.09221267700195312, -0.08022308349609375, -0.06823348999023438, -0.056243896484375, -0.044254302978515625, -0.03226470947265625, -0.020275115966796875, -0.0082855224609375, 0.003704071044921875, 0.01569366455078125, 0.027683258056640625, 0.0396728515625, 0.051662445068359375, 0.06365203857421875, 0.07564163208007812, 0.0876312255859375, 0.09962081909179688, 0.11161041259765625, 0.12360000610351562, 0.135589599609375, 0.14757919311523438, 0.15956878662109375, 0.17155838012695312, 0.1835479736328125, 0.19553756713867188, 0.20752716064453125, 0.21951675415039062, 0.23150634765625, 0.24349594116210938, 0.25548553466796875, 0.2674751281738281, 0.2794647216796875, 0.2914543151855469, 0.30344390869140625, 0.3154335021972656, 0.327423095703125, 0.3394126892089844, 0.35140228271484375, 0.3633918762207031, 0.3753814697265625, 0.3873710632324219, 0.39936065673828125, 0.4113502502441406, 0.42333984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 16.0, 27.0, 44.0, 89.0, 275.0, 1256.0, 1814.0, 327.0, 105.0, 48.0, 13.0, 14.0, 8.0, 10.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0887451171875, -0.0855855941772461, -0.08242607116699219, -0.07926654815673828, -0.07610702514648438, -0.07294750213623047, -0.06978797912597656, -0.06662845611572266, -0.06346893310546875, -0.060309410095214844, -0.05714988708496094, -0.05399036407470703, -0.050830841064453125, -0.04767131805419922, -0.04451179504394531, -0.041352272033691406, -0.0381927490234375, -0.035033226013183594, -0.03187370300292969, -0.02871417999267578, -0.025554656982421875, -0.02239513397216797, -0.019235610961914062, -0.016076087951660156, -0.01291656494140625, -0.009757041931152344, -0.0065975189208984375, -0.0034379959106445312, -0.000278472900390625, 0.0028810501098632812, 0.0060405731201171875, 0.009200096130371094, 0.012359619140625, 0.015519142150878906, 0.018678665161132812, 0.02183818817138672, 0.024997711181640625, 0.02815723419189453, 0.03131675720214844, 0.034476280212402344, 0.03763580322265625, 0.040795326232910156, 0.04395484924316406, 0.04711437225341797, 0.050273895263671875, 0.05343341827392578, 0.05659294128417969, 0.059752464294433594, 0.0629119873046875, 0.0660715103149414, 0.06923103332519531, 0.07239055633544922, 0.07555007934570312, 0.07870960235595703, 0.08186912536621094, 0.08502864837646484, 0.08818817138671875, 0.09134769439697266, 0.09450721740722656, 0.09766674041748047, 0.10082626342773438, 0.10398578643798828, 0.10714530944824219, 0.1103048324584961, 0.11346435546875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 28.0, 153.0, 564.0, 220.0, 31.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8084172606468201, -0.7710904479026794, -0.733763575553894, -0.6964367628097534, -0.6591099500656128, -0.6217831373214722, -0.5844562649726868, -0.5471294522285461, -0.5098025798797607, -0.47247573733329773, -0.4351489245891571, -0.3978220820426941, -0.36049526929855347, -0.32316842675209045, -0.28584158420562744, -0.24851477146148682, -0.2111879587173462, -0.17386113107204437, -0.13653430342674255, -0.09920746088027954, -0.06188063323497772, -0.024553805589675903, 0.01277303695678711, 0.050099849700927734, 0.08742669224739075, 0.12475351989269257, 0.16208034753799438, 0.1994071900844574, 0.23673401772975922, 0.27406084537506104, 0.31138768792152405, 0.3487145006656647, 0.38604140281677246, 0.4233682453632355, 0.4606950581073761, 0.4980219006538391, 0.5353487133979797, 0.5726755857467651, 0.6100023984909058, 0.6473292112350464, 0.684656023979187, 0.7219828367233276, 0.759309709072113, 0.7966365218162537, 0.8339633345603943, 0.8712902069091797, 0.9086170196533203, 0.9459438323974609, 0.9832707047462463, 1.0205975770950317, 1.0579243898391724, 1.095251202583313, 1.1325780153274536, 1.1699048280715942, 1.2072317600250244, 1.244558572769165, 1.2818853855133057, 1.3192121982574463, 1.356539011001587, 1.3938658237457275, 1.4311927556991577, 1.4685195684432983, 1.505846381187439, 1.5431731939315796, 1.5805000066757202]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 8.0, 4.0, 17.0, 12.0, 17.0, 35.0, 43.0, 44.0, 67.0, 79.0, 72.0, 75.0, 92.0, 72.0, 83.0, 62.0, 59.0, 40.0, 35.0, 27.0, 16.0, 11.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2521904706954956, -0.2429962158203125, -0.2338019609451294, -0.2246077060699463, -0.21541345119476318, -0.20621919631958008, -0.19702495634555817, -0.18783070147037506, -0.17863644659519196, -0.16944219172000885, -0.16024793684482574, -0.15105368196964264, -0.14185944199562073, -0.13266518712043762, -0.12347093224525452, -0.11427667737007141, -0.1050824224948883, -0.0958881676197052, -0.0866939127445221, -0.07749966531991959, -0.06830541044473648, -0.059111155569553375, -0.04991690441966057, -0.04072265326976776, -0.031528398394584656, -0.0223341453820467, -0.013139892369508743, -0.003945639356970787, 0.005248613655567169, 0.014442868530750275, 0.02363711968064308, 0.03283137083053589, 0.042025625705718994, 0.0512198805809021, 0.06041413173079491, 0.06960838288068771, 0.07880263775587082, 0.08799689263105392, 0.09719114005565643, 0.10638539493083954, 0.11557964980602264, 0.12477390468120575, 0.13396815955638885, 0.14316241443157196, 0.15235665440559387, 0.16155090928077698, 0.17074516415596008, 0.1799394190311432, 0.1891336739063263, 0.1983279287815094, 0.2075221836566925, 0.2167164385318756, 0.22591069340705872, 0.23510494828224182, 0.24429918825626373, 0.25349342823028564, 0.26268768310546875, 0.27188193798065186, 0.28107619285583496, 0.29027044773101807, 0.29946470260620117, 0.3086589574813843, 0.3178532123565674, 0.3270474672317505, 0.3362417221069336]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 2.0, 8.0, 16.0, 11.0, 16.0, 26.0, 36.0, 43.0, 45.0, 73.0, 121.0, 202.0, 257.0, 421.0, 907.0, 2186.0, 6031.0, 21550.0, 109828.0, 580492.0, 267478.0, 42360.0, 10054.0, 3394.0, 1382.0, 614.0, 352.0, 185.0, 126.0, 85.0, 64.0, 45.0, 41.0, 26.0, 19.0, 9.0, 12.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12286376953125, -0.11899089813232422, -0.11511802673339844, -0.11124515533447266, -0.10737228393554688, -0.1034994125366211, -0.09962654113769531, -0.09575366973876953, -0.09188079833984375, -0.08800792694091797, -0.08413505554199219, -0.0802621841430664, -0.07638931274414062, -0.07251644134521484, -0.06864356994628906, -0.06477069854736328, -0.0608978271484375, -0.05702495574951172, -0.05315208435058594, -0.049279212951660156, -0.045406341552734375, -0.041533470153808594, -0.03766059875488281, -0.03378772735595703, -0.02991485595703125, -0.02604198455810547, -0.022169113159179688, -0.018296241760253906, -0.014423370361328125, -0.010550498962402344, -0.0066776275634765625, -0.0028047561645507812, 0.001068115234375, 0.004940986633300781, 0.008813858032226562, 0.012686729431152344, 0.016559600830078125, 0.020432472229003906, 0.024305343627929688, 0.02817821502685547, 0.03205108642578125, 0.03592395782470703, 0.03979682922363281, 0.043669700622558594, 0.047542572021484375, 0.051415443420410156, 0.05528831481933594, 0.05916118621826172, 0.0630340576171875, 0.06690692901611328, 0.07077980041503906, 0.07465267181396484, 0.07852554321289062, 0.0823984146118164, 0.08627128601074219, 0.09014415740966797, 0.09401702880859375, 0.09788990020751953, 0.10176277160644531, 0.1056356430053711, 0.10950851440429688, 0.11338138580322266, 0.11725425720214844, 0.12112712860107422, 0.125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 2.0, 6.0, 5.0, 7.0, 12.0, 22.0, 29.0, 26.0, 51.0, 52.0, 72.0, 77.0, 89.0, 92.0, 86.0, 73.0, 84.0, 49.0, 47.0, 35.0, 34.0, 16.0, 21.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0238800048828125, -0.022980928421020508, -0.022081851959228516, -0.021182775497436523, -0.02028369903564453, -0.01938462257385254, -0.018485546112060547, -0.017586469650268555, -0.016687393188476562, -0.01578831672668457, -0.014889240264892578, -0.013990163803100586, -0.013091087341308594, -0.012192010879516602, -0.01129293441772461, -0.010393857955932617, -0.009494781494140625, -0.008595705032348633, -0.007696628570556641, -0.0067975521087646484, -0.005898475646972656, -0.004999399185180664, -0.004100322723388672, -0.0032012462615966797, -0.0023021697998046875, -0.0014030933380126953, -0.0005040168762207031, 0.00039505958557128906, 0.0012941360473632812, 0.0021932125091552734, 0.0030922889709472656, 0.003991365432739258, 0.00489044189453125, 0.005789518356323242, 0.006688594818115234, 0.0075876712799072266, 0.008486747741699219, 0.009385824203491211, 0.010284900665283203, 0.011183977127075195, 0.012083053588867188, 0.01298213005065918, 0.013881206512451172, 0.014780282974243164, 0.015679359436035156, 0.01657843589782715, 0.01747751235961914, 0.018376588821411133, 0.019275665283203125, 0.020174741744995117, 0.02107381820678711, 0.0219728946685791, 0.022871971130371094, 0.023771047592163086, 0.024670124053955078, 0.02556920051574707, 0.026468276977539062, 0.027367353439331055, 0.028266429901123047, 0.02916550636291504, 0.03006458282470703, 0.030963659286499023, 0.031862735748291016, 0.03276181221008301, 0.033660888671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 5.0, 12.0, 13.0, 12.0, 14.0, 30.0, 39.0, 62.0, 84.0, 146.0, 231.0, 371.0, 611.0, 1020.0, 1686.0, 3062.0, 5741.0, 11122.0, 22682.0, 49779.0, 116082.0, 243773.0, 291444.0, 165355.0, 71303.0, 31837.0, 15002.0, 7580.0, 4064.0, 2122.0, 1316.0, 741.0, 463.0, 258.0, 170.0, 115.0, 61.0, 35.0, 35.0, 20.0, 18.0, 9.0, 8.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.04681396484375, -0.04540443420410156, -0.043994903564453125, -0.04258537292480469, -0.04117584228515625, -0.03976631164550781, -0.038356781005859375, -0.03694725036621094, -0.0355377197265625, -0.03412818908691406, -0.032718658447265625, -0.03130912780761719, -0.02989959716796875, -0.028490066528320312, -0.027080535888671875, -0.025671005249023438, -0.024261474609375, -0.022851943969726562, -0.021442413330078125, -0.020032882690429688, -0.01862335205078125, -0.017213821411132812, -0.015804290771484375, -0.014394760131835938, -0.0129852294921875, -0.011575698852539062, -0.010166168212890625, -0.008756637573242188, -0.00734710693359375, -0.0059375762939453125, -0.004528045654296875, -0.0031185150146484375, -0.001708984375, -0.0002994537353515625, 0.001110076904296875, 0.0025196075439453125, 0.00392913818359375, 0.0053386688232421875, 0.006748199462890625, 0.008157730102539062, 0.0095672607421875, 0.010976791381835938, 0.012386322021484375, 0.013795852661132812, 0.01520538330078125, 0.016614913940429688, 0.018024444580078125, 0.019433975219726562, 0.020843505859375, 0.022253036499023438, 0.023662567138671875, 0.025072097778320312, 0.02648162841796875, 0.027891159057617188, 0.029300689697265625, 0.030710220336914062, 0.0321197509765625, 0.03352928161621094, 0.034938812255859375, 0.03634834289550781, 0.03775787353515625, 0.03916740417480469, 0.040576934814453125, 0.04198646545410156, 0.04339599609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 6.0, 3.0, 0.0, 6.0, 6.0, 15.0, 15.0, 20.0, 17.0, 17.0, 22.0, 25.0, 31.0, 42.0, 35.0, 40.0, 39.0, 47.0, 41.0, 52.0, 44.0, 49.0, 43.0, 45.0, 37.0, 33.0, 32.0, 38.0, 33.0, 32.0, 22.0, 20.0, 23.0, 7.0, 12.0, 9.0, 9.0, 18.0, 9.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.060821533203125, -0.05873537063598633, -0.056649208068847656, -0.054563045501708984, -0.05247688293457031, -0.05039072036743164, -0.04830455780029297, -0.0462183952331543, -0.044132232666015625, -0.04204607009887695, -0.03995990753173828, -0.03787374496459961, -0.03578758239746094, -0.033701419830322266, -0.031615257263183594, -0.029529094696044922, -0.02744293212890625, -0.025356769561767578, -0.023270606994628906, -0.021184444427490234, -0.019098281860351562, -0.01701211929321289, -0.014925956726074219, -0.012839794158935547, -0.010753631591796875, -0.008667469024658203, -0.006581306457519531, -0.004495143890380859, -0.0024089813232421875, -0.0003228187561035156, 0.0017633438110351562, 0.003849506378173828, 0.0059356689453125, 0.008021831512451172, 0.010107994079589844, 0.012194156646728516, 0.014280319213867188, 0.01636648178100586, 0.01845264434814453, 0.020538806915283203, 0.022624969482421875, 0.024711132049560547, 0.02679729461669922, 0.02888345718383789, 0.030969619750976562, 0.033055782318115234, 0.035141944885253906, 0.03722810745239258, 0.03931427001953125, 0.04140043258666992, 0.043486595153808594, 0.045572757720947266, 0.04765892028808594, 0.04974508285522461, 0.05183124542236328, 0.05391740798950195, 0.056003570556640625, 0.0580897331237793, 0.06017589569091797, 0.06226205825805664, 0.06434822082519531, 0.06643438339233398, 0.06852054595947266, 0.07060670852661133, 0.07269287109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 10.0, 11.0, 12.0, 29.0, 42.0, 62.0, 97.0, 133.0, 266.0, 395.0, 699.0, 1297.0, 3079.0, 9655.0, 50326.0, 315711.0, 514096.0, 124306.0, 19146.0, 4943.0, 1968.0, 921.0, 500.0, 316.0, 188.0, 128.0, 74.0, 44.0, 24.0, 20.0, 13.0, 10.0, 11.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0285797119140625, -0.027634382247924805, -0.02668905258178711, -0.025743722915649414, -0.02479839324951172, -0.023853063583374023, -0.022907733917236328, -0.021962404251098633, -0.021017074584960938, -0.020071744918823242, -0.019126415252685547, -0.01818108558654785, -0.017235755920410156, -0.01629042625427246, -0.015345096588134766, -0.01439976692199707, -0.013454437255859375, -0.01250910758972168, -0.011563777923583984, -0.010618448257446289, -0.009673118591308594, -0.008727788925170898, -0.007782459259033203, -0.006837129592895508, -0.0058917999267578125, -0.004946470260620117, -0.004001140594482422, -0.0030558109283447266, -0.0021104812622070312, -0.001165151596069336, -0.00021982192993164062, 0.0007255077362060547, 0.00167083740234375, 0.0026161670684814453, 0.0035614967346191406, 0.004506826400756836, 0.005452156066894531, 0.0063974857330322266, 0.007342815399169922, 0.008288145065307617, 0.009233474731445312, 0.010178804397583008, 0.011124134063720703, 0.012069463729858398, 0.013014793395996094, 0.013960123062133789, 0.014905452728271484, 0.01585078239440918, 0.016796112060546875, 0.01774144172668457, 0.018686771392822266, 0.01963210105895996, 0.020577430725097656, 0.02152276039123535, 0.022468090057373047, 0.023413419723510742, 0.024358749389648438, 0.025304079055786133, 0.026249408721923828, 0.027194738388061523, 0.02814006805419922, 0.029085397720336914, 0.03003072738647461, 0.030976057052612305, 0.03192138671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 13.0, 22.0, 23.0, 52.0, 55.0, 65.0, 85.0, 119.0, 110.0, 100.0, 95.0, 78.0, 64.0, 34.0, 33.0, 27.0, 13.0, 10.0, 5.0, 0.0, 1.0, 2.0], "bins": [-1.817941665649414e-05, -1.7819926142692566e-05, -1.746043562889099e-05, -1.7100945115089417e-05, -1.6741454601287842e-05, -1.6381964087486267e-05, -1.6022473573684692e-05, -1.5662983059883118e-05, -1.5303492546081543e-05, -1.4944002032279968e-05, -1.4584511518478394e-05, -1.4225021004676819e-05, -1.3865530490875244e-05, -1.350603997707367e-05, -1.3146549463272095e-05, -1.278705894947052e-05, -1.2427568435668945e-05, -1.206807792186737e-05, -1.1708587408065796e-05, -1.1349096894264221e-05, -1.0989606380462646e-05, -1.0630115866661072e-05, -1.0270625352859497e-05, -9.911134839057922e-06, -9.551644325256348e-06, -9.192153811454773e-06, -8.832663297653198e-06, -8.473172783851624e-06, -8.113682270050049e-06, -7.754191756248474e-06, -7.394701242446899e-06, -7.035210728645325e-06, -6.67572021484375e-06, -6.316229701042175e-06, -5.956739187240601e-06, -5.597248673439026e-06, -5.237758159637451e-06, -4.8782676458358765e-06, -4.518777132034302e-06, -4.159286618232727e-06, -3.7997961044311523e-06, -3.4403055906295776e-06, -3.080815076828003e-06, -2.7213245630264282e-06, -2.3618340492248535e-06, -2.002343535423279e-06, -1.642853021621704e-06, -1.2833625078201294e-06, -9.238719940185547e-07, -5.6438148021698e-07, -2.0489096641540527e-07, 1.5459954738616943e-07, 5.140900611877441e-07, 8.735805749893188e-07, 1.2330710887908936e-06, 1.5925616025924683e-06, 1.952052116394043e-06, 2.3115426301956177e-06, 2.6710331439971924e-06, 3.030523657798767e-06, 3.390014171600342e-06, 3.7495046854019165e-06, 4.108995199203491e-06, 4.468485713005066e-06, 4.827976226806641e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 18.0, 17.0, 38.0, 79.0, 154.0, 399.0, 983.0, 3322.0, 28408.0, 514316.0, 470708.0, 25424.0, 3119.0, 910.0, 356.0, 138.0, 71.0, 37.0, 17.0, 14.0, 9.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0499267578125, -0.04841279983520508, -0.046898841857910156, -0.045384883880615234, -0.04387092590332031, -0.04235696792602539, -0.04084300994873047, -0.03932905197143555, -0.037815093994140625, -0.0363011360168457, -0.03478717803955078, -0.03327322006225586, -0.03175926208496094, -0.030245304107666016, -0.028731346130371094, -0.027217388153076172, -0.02570343017578125, -0.024189472198486328, -0.022675514221191406, -0.021161556243896484, -0.019647598266601562, -0.01813364028930664, -0.01661968231201172, -0.015105724334716797, -0.013591766357421875, -0.012077808380126953, -0.010563850402832031, -0.00904989242553711, -0.0075359344482421875, -0.006021976470947266, -0.004508018493652344, -0.002994060516357422, -0.0014801025390625, 3.3855438232421875e-05, 0.0015478134155273438, 0.0030617713928222656, 0.0045757293701171875, 0.006089687347412109, 0.007603645324707031, 0.009117603302001953, 0.010631561279296875, 0.012145519256591797, 0.013659477233886719, 0.01517343521118164, 0.016687393188476562, 0.018201351165771484, 0.019715309143066406, 0.021229267120361328, 0.02274322509765625, 0.024257183074951172, 0.025771141052246094, 0.027285099029541016, 0.028799057006835938, 0.03031301498413086, 0.03182697296142578, 0.0333409309387207, 0.034854888916015625, 0.03636884689331055, 0.03788280487060547, 0.03939676284790039, 0.04091072082519531, 0.042424678802490234, 0.043938636779785156, 0.04545259475708008, 0.046966552734375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 9.0, 10.0, 22.0, 21.0, 37.0, 52.0, 66.0, 65.0, 91.0, 112.0, 112.0, 86.0, 69.0, 71.0, 45.0, 49.0, 30.0, 19.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.03619194030761719, -0.035030364990234375, -0.03386878967285156, -0.03270721435546875, -0.03154563903808594, -0.030384063720703125, -0.029222488403320312, -0.0280609130859375, -0.026899337768554688, -0.025737762451171875, -0.024576187133789062, -0.02341461181640625, -0.022253036499023438, -0.021091461181640625, -0.019929885864257812, -0.018768310546875, -0.017606735229492188, -0.016445159912109375, -0.015283584594726562, -0.01412200927734375, -0.012960433959960938, -0.011798858642578125, -0.010637283325195312, -0.0094757080078125, -0.008314132690429688, -0.007152557373046875, -0.0059909820556640625, -0.00482940673828125, -0.0036678314208984375, -0.002506256103515625, -0.0013446807861328125, -0.00018310546875, 0.0009784698486328125, 0.002140045166015625, 0.0033016204833984375, 0.00446319580078125, 0.0056247711181640625, 0.006786346435546875, 0.007947921752929688, 0.0091094970703125, 0.010271072387695312, 0.011432647705078125, 0.012594223022460938, 0.01375579833984375, 0.014917373657226562, 0.016078948974609375, 0.017240524291992188, 0.018402099609375, 0.019563674926757812, 0.020725250244140625, 0.021886825561523438, 0.02304840087890625, 0.024209976196289062, 0.025371551513671875, 0.026533126831054688, 0.0276947021484375, 0.028856277465820312, 0.030017852783203125, 0.031179428100585938, 0.03234100341796875, 0.03350257873535156, 0.034664154052734375, 0.03582572937011719, 0.0369873046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 10.0, 9.0, 14.0, 24.0, 77.0, 106.0, 215.0, 215.0, 136.0, 81.0, 56.0, 21.0, 16.0, 7.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8354989290237427, -0.8147929310798645, -0.7940868735313416, -0.7733808755874634, -0.7526748180389404, -0.7319688200950623, -0.7112628221511841, -0.6905567646026611, -0.669850766658783, -0.6491447687149048, -0.6284387111663818, -0.6077327132225037, -0.5870267152786255, -0.5663206577301025, -0.5456146597862244, -0.5249086618423462, -0.5042026042938232, -0.4834965765476227, -0.4627905488014221, -0.44208455085754395, -0.4213785231113434, -0.4006724953651428, -0.37996649742126465, -0.3592604696750641, -0.3385544419288635, -0.31784841418266296, -0.2971423864364624, -0.27643638849258423, -0.25573036074638367, -0.2350243330001831, -0.21431832015514374, -0.19361230731010437, -0.17290621995925903, -0.15220019221305847, -0.1314941793680191, -0.11078815907239914, -0.09008213877677917, -0.06937611848115921, -0.048670098185539246, -0.027964085340499878, -0.007258057594299316, 0.013447962701320648, 0.03415398299694061, 0.05486000329256058, 0.07556602358818054, 0.0962720438838005, 0.11697806417942047, 0.13768407702445984, 0.1583901047706604, 0.17909613251686096, 0.19980214536190033, 0.2205081582069397, 0.24121418595314026, 0.2619202136993408, 0.282626211643219, 0.30333223938941956, 0.3240382671356201, 0.3447442948818207, 0.36545032262802124, 0.3861563205718994, 0.4068623483181, 0.42756837606430054, 0.4482743740081787, 0.4689804017543793, 0.48968642950057983]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 2.0, 5.0, 2.0, 8.0, 7.0, 12.0, 9.0, 10.0, 19.0, 31.0, 28.0, 29.0, 34.0, 47.0, 35.0, 46.0, 57.0, 44.0, 66.0, 46.0, 50.0, 50.0, 48.0, 38.0, 39.0, 32.0, 36.0, 34.0, 17.0, 20.0, 18.0, 15.0, 13.0, 15.0, 11.0, 8.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4434008002281189, -0.42979100346565247, -0.41618117690086365, -0.4025713801383972, -0.3889615833759308, -0.37535178661346436, -0.36174196004867554, -0.3481321632862091, -0.3345223665237427, -0.32091256976127625, -0.3073027431964874, -0.293692946434021, -0.28008314967155457, -0.26647335290908813, -0.2528635263442993, -0.23925372958183289, -0.22564391791820526, -0.21203410625457764, -0.1984243094921112, -0.18481449782848358, -0.17120470106601715, -0.15759488940238953, -0.1439850926399231, -0.13037528097629547, -0.11676547676324844, -0.10315567255020142, -0.08954586833715439, -0.07593606412410736, -0.062326256185770035, -0.04871644824743271, -0.03510664403438568, -0.021496839821338654, -0.007887035608291626, 0.005722769536077976, 0.01933257468044758, 0.032942380756139755, 0.04655218496918678, 0.06016199290752411, 0.07377179712057114, 0.08738160133361816, 0.10099140554666519, 0.11460120975971222, 0.12821102142333984, 0.14182081818580627, 0.1554306298494339, 0.16904044151306152, 0.18265023827552795, 0.19626003503799438, 0.209869846701622, 0.22347965836524963, 0.23708945512771606, 0.2506992518901825, 0.2643090784549713, 0.27791887521743774, 0.2915286719799042, 0.3051384687423706, 0.3187482953071594, 0.33235809206962585, 0.3459679186344147, 0.3595777153968811, 0.37318751215934753, 0.38679730892181396, 0.4004071354866028, 0.4140169322490692, 0.42762672901153564]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 9.0, 13.0, 26.0, 33.0, 56.0, 94.0, 180.0, 329.0, 665.0, 1539.0, 3867.0, 13720.0, 82328.0, 3236107.0, 795457.0, 45089.0, 9243.0, 2936.0, 1188.0, 571.0, 290.0, 187.0, 109.0, 70.0, 38.0, 38.0, 17.0, 30.0, 12.0, 13.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06298828125, -0.06010627746582031, -0.057224273681640625, -0.05434226989746094, -0.05146026611328125, -0.04857826232910156, -0.045696258544921875, -0.04281425476074219, -0.0399322509765625, -0.03705024719238281, -0.034168243408203125, -0.03128623962402344, -0.02840423583984375, -0.025522232055664062, -0.022640228271484375, -0.019758224487304688, -0.016876220703125, -0.013994216918945312, -0.011112213134765625, -0.008230209350585938, -0.00534820556640625, -0.0024662017822265625, 0.000415802001953125, 0.0032978057861328125, 0.0061798095703125, 0.009061813354492188, 0.011943817138671875, 0.014825820922851562, 0.01770782470703125, 0.020589828491210938, 0.023471832275390625, 0.026353836059570312, 0.02923583984375, 0.03211784362792969, 0.034999847412109375, 0.03788185119628906, 0.04076385498046875, 0.04364585876464844, 0.046527862548828125, 0.04940986633300781, 0.0522918701171875, 0.05517387390136719, 0.058055877685546875, 0.06093788146972656, 0.06381988525390625, 0.06670188903808594, 0.06958389282226562, 0.07246589660644531, 0.075347900390625, 0.07822990417480469, 0.08111190795898438, 0.08399391174316406, 0.08687591552734375, 0.08975791931152344, 0.09263992309570312, 0.09552192687988281, 0.0984039306640625, 0.10128593444824219, 0.10416793823242188, 0.10704994201660156, 0.10993194580078125, 0.11281394958496094, 0.11569595336914062, 0.11857795715332031, 0.1214599609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 6.0, 17.0, 24.0, 27.0, 27.0, 52.0, 47.0, 54.0, 70.0, 73.0, 78.0, 71.0, 68.0, 76.0, 57.0, 47.0, 40.0, 36.0, 27.0, 26.0, 18.0, 14.0, 8.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.024627685546875, -0.023814678192138672, -0.023001670837402344, -0.022188663482666016, -0.021375656127929688, -0.02056264877319336, -0.01974964141845703, -0.018936634063720703, -0.018123626708984375, -0.017310619354248047, -0.01649761199951172, -0.01568460464477539, -0.014871597290039062, -0.014058589935302734, -0.013245582580566406, -0.012432575225830078, -0.01161956787109375, -0.010806560516357422, -0.009993553161621094, -0.009180545806884766, -0.008367538452148438, -0.007554531097412109, -0.006741523742675781, -0.005928516387939453, -0.005115509033203125, -0.004302501678466797, -0.0034894943237304688, -0.0026764869689941406, -0.0018634796142578125, -0.0010504722595214844, -0.00023746490478515625, 0.0005755424499511719, 0.0013885498046875, 0.002201557159423828, 0.0030145645141601562, 0.0038275718688964844, 0.0046405792236328125, 0.005453586578369141, 0.006266593933105469, 0.007079601287841797, 0.007892608642578125, 0.008705615997314453, 0.009518623352050781, 0.01033163070678711, 0.011144638061523438, 0.011957645416259766, 0.012770652770996094, 0.013583660125732422, 0.01439666748046875, 0.015209674835205078, 0.016022682189941406, 0.016835689544677734, 0.017648696899414062, 0.01846170425415039, 0.01927471160888672, 0.020087718963623047, 0.020900726318359375, 0.021713733673095703, 0.02252674102783203, 0.02333974838256836, 0.024152755737304688, 0.024965763092041016, 0.025778770446777344, 0.026591777801513672, 0.02740478515625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 14.0, 28.0, 52.0, 92.0, 135.0, 204.0, 449.0, 1280.0, 9667.0, 3379905.0, 794552.0, 6267.0, 920.0, 321.0, 164.0, 101.0, 50.0, 34.0, 24.0, 10.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.156494140625, -0.14995193481445312, -0.14340972900390625, -0.13686752319335938, -0.1303253173828125, -0.12378311157226562, -0.11724090576171875, -0.11069869995117188, -0.104156494140625, -0.09761428833007812, -0.09107208251953125, -0.08452987670898438, -0.0779876708984375, -0.07144546508789062, -0.06490325927734375, -0.058361053466796875, -0.05181884765625, -0.045276641845703125, -0.03873443603515625, -0.032192230224609375, -0.0256500244140625, -0.019107818603515625, -0.01256561279296875, -0.006023406982421875, 0.000518798828125, 0.007061004638671875, 0.01360321044921875, 0.020145416259765625, 0.0266876220703125, 0.033229827880859375, 0.03977203369140625, 0.046314239501953125, 0.0528564453125, 0.059398651123046875, 0.06594085693359375, 0.07248306274414062, 0.0790252685546875, 0.08556747436523438, 0.09210968017578125, 0.09865188598632812, 0.105194091796875, 0.11173629760742188, 0.11827850341796875, 0.12482070922851562, 0.1313629150390625, 0.13790512084960938, 0.14444732666015625, 0.15098953247070312, 0.15753173828125, 0.16407394409179688, 0.17061614990234375, 0.17715835571289062, 0.1837005615234375, 0.19024276733398438, 0.19678497314453125, 0.20332717895507812, 0.209869384765625, 0.21641159057617188, 0.22295379638671875, 0.22949600219726562, 0.2360382080078125, 0.24258041381835938, 0.24912261962890625, 0.2556648254394531, 0.26220703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 8.0, 12.0, 27.0, 55.0, 108.0, 345.0, 1204.0, 1634.0, 437.0, 124.0, 51.0, 22.0, 14.0, 7.0, 8.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0718994140625, -0.07037353515625, -0.06884765625, -0.06732177734375, -0.0657958984375, -0.06427001953125, -0.062744140625, -0.06121826171875, -0.0596923828125, -0.05816650390625, -0.056640625, -0.05511474609375, -0.0535888671875, -0.05206298828125, -0.050537109375, -0.04901123046875, -0.0474853515625, -0.04595947265625, -0.04443359375, -0.04290771484375, -0.0413818359375, -0.03985595703125, -0.038330078125, -0.03680419921875, -0.0352783203125, -0.03375244140625, -0.0322265625, -0.03070068359375, -0.0291748046875, -0.02764892578125, -0.026123046875, -0.02459716796875, -0.0230712890625, -0.02154541015625, -0.02001953125, -0.01849365234375, -0.0169677734375, -0.01544189453125, -0.013916015625, -0.01239013671875, -0.0108642578125, -0.00933837890625, -0.0078125, -0.00628662109375, -0.0047607421875, -0.00323486328125, -0.001708984375, -0.00018310546875, 0.0013427734375, 0.00286865234375, 0.00439453125, 0.00592041015625, 0.0074462890625, 0.00897216796875, 0.010498046875, 0.01202392578125, 0.0135498046875, 0.01507568359375, 0.0166015625, 0.01812744140625, 0.0196533203125, 0.02117919921875, 0.022705078125, 0.02423095703125, 0.0257568359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 30.0, 454.0, 478.0, 35.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1256685256958008, -1.0953459739685059, -1.0650235414505005, -1.0347009897232056, -1.0043784379959106, -0.9740559458732605, -0.9437334537506104, -0.9134109020233154, -0.8830883502960205, -0.8527658581733704, -0.8224433064460754, -0.7921208143234253, -0.7617982625961304, -0.7314757704734802, -0.7011532783508301, -0.6708307266235352, -0.640508234500885, -0.6101857423782349, -0.5798631906509399, -0.5495406985282898, -0.5192181468009949, -0.4888956546783447, -0.4585731327533722, -0.42825061082839966, -0.3979280889034271, -0.3676055669784546, -0.33728304505348206, -0.3069605231285095, -0.2766380310058594, -0.24631549417972565, -0.2159929871559143, -0.18567046523094177, -0.155348002910614, -0.12502548098564148, -0.09470296651124954, -0.0643804520368576, -0.03405793011188507, -0.0037354081869125366, 0.026587098836898804, 0.05690962076187134, 0.08723214268684387, 0.1175546646118164, 0.14787718653678894, 0.17819969356060028, 0.20852221548557281, 0.23884473741054535, 0.2691672444343567, 0.2994897663593292, 0.32981228828430176, 0.3601348102092743, 0.3904573321342468, 0.420779824256897, 0.4511023759841919, 0.48142486810684204, 0.5117473602294922, 0.5420699119567871, 0.572392463684082, 0.6027149558067322, 0.6330375075340271, 0.6633599996566772, 0.6936825513839722, 0.7240050435066223, 0.7543275356292725, 0.7846500873565674, 0.8149725794792175]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 7.0, 15.0, 27.0, 23.0, 52.0, 58.0, 75.0, 74.0, 97.0, 115.0, 86.0, 95.0, 85.0, 56.0, 44.0, 36.0, 21.0, 14.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23254454135894775, -0.22534097731113434, -0.21813739836215973, -0.2109338343143463, -0.2037302702665329, -0.19652670621871948, -0.18932312726974487, -0.18211956322193146, -0.17491599917411804, -0.16771243512630463, -0.16050885617733002, -0.1533052921295166, -0.14610172808170319, -0.13889816403388977, -0.13169458508491516, -0.12449102103710175, -0.11728744208812714, -0.11008387058973312, -0.10288030654191971, -0.0956767350435257, -0.08847317099571228, -0.08126959949731827, -0.07406602799892426, -0.06686246395111084, -0.05965889245271683, -0.05245532467961311, -0.0452517569065094, -0.03804818540811539, -0.030844617635011673, -0.02364104986190796, -0.016437478363513947, -0.009233910590410233, -0.0020303428173065186, 0.00517322588711977, 0.012376794591546059, 0.019580364227294922, 0.026783932000398636, 0.03398749977350235, 0.04119107127189636, 0.048394639045000076, 0.05559820681810379, 0.0628017783164978, 0.07000534236431122, 0.07720891386270523, 0.08441248536109924, 0.09161604940891266, 0.09881962090730667, 0.10602319240570068, 0.1132267564535141, 0.12043032795190811, 0.12763389945030212, 0.13483746349811554, 0.14204102754592896, 0.14924460649490356, 0.15644817054271698, 0.1636517345905304, 0.170855313539505, 0.17805887758731842, 0.18526245653629303, 0.19246602058410645, 0.19966958463191986, 0.20687314867973328, 0.21407672762870789, 0.2212802916765213, 0.22848385572433472]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 3.0, 4.0, 3.0, 10.0, 14.0, 11.0, 24.0, 31.0, 38.0, 48.0, 96.0, 128.0, 191.0, 321.0, 529.0, 956.0, 1860.0, 4180.0, 11600.0, 38724.0, 171374.0, 500006.0, 240830.0, 52706.0, 14922.0, 5175.0, 2176.0, 1041.0, 548.0, 355.0, 225.0, 122.0, 100.0, 56.0, 36.0, 28.0, 20.0, 9.0, 11.0, 14.0, 12.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.08673095703125, -0.08398723602294922, -0.08124351501464844, -0.07849979400634766, -0.07575607299804688, -0.0730123519897461, -0.07026863098144531, -0.06752490997314453, -0.06478118896484375, -0.06203746795654297, -0.05929374694824219, -0.056550025939941406, -0.053806304931640625, -0.051062583923339844, -0.04831886291503906, -0.04557514190673828, -0.0428314208984375, -0.04008769989013672, -0.03734397888183594, -0.034600257873535156, -0.031856536865234375, -0.029112815856933594, -0.026369094848632812, -0.02362537384033203, -0.02088165283203125, -0.01813793182373047, -0.015394210815429688, -0.012650489807128906, -0.009906768798828125, -0.007163047790527344, -0.0044193267822265625, -0.0016756057739257812, 0.001068115234375, 0.0038118362426757812, 0.0065555572509765625, 0.009299278259277344, 0.012042999267578125, 0.014786720275878906, 0.017530441284179688, 0.02027416229248047, 0.02301788330078125, 0.02576160430908203, 0.028505325317382812, 0.031249046325683594, 0.033992767333984375, 0.036736488342285156, 0.03948020935058594, 0.04222393035888672, 0.0449676513671875, 0.04771137237548828, 0.05045509338378906, 0.053198814392089844, 0.055942535400390625, 0.058686256408691406, 0.06142997741699219, 0.06417369842529297, 0.06691741943359375, 0.06966114044189453, 0.07240486145019531, 0.0751485824584961, 0.07789230346679688, 0.08063602447509766, 0.08337974548339844, 0.08612346649169922, 0.0888671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 10.0, 13.0, 31.0, 25.0, 27.0, 36.0, 44.0, 64.0, 68.0, 71.0, 86.0, 71.0, 63.0, 80.0, 56.0, 52.0, 51.0, 37.0, 18.0, 20.0, 21.0, 16.0, 13.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249176025390625, -0.024096965789794922, -0.023276329040527344, -0.022455692291259766, -0.021635055541992188, -0.02081441879272461, -0.01999378204345703, -0.019173145294189453, -0.018352508544921875, -0.017531871795654297, -0.01671123504638672, -0.01589059829711914, -0.015069961547851562, -0.014249324798583984, -0.013428688049316406, -0.012608051300048828, -0.01178741455078125, -0.010966777801513672, -0.010146141052246094, -0.009325504302978516, -0.008504867553710938, -0.007684230804443359, -0.006863594055175781, -0.006042957305908203, -0.005222320556640625, -0.004401683807373047, -0.0035810470581054688, -0.0027604103088378906, -0.0019397735595703125, -0.0011191368103027344, -0.00029850006103515625, 0.0005221366882324219, 0.0013427734375, 0.002163410186767578, 0.0029840469360351562, 0.0038046836853027344, 0.0046253204345703125, 0.005445957183837891, 0.006266593933105469, 0.007087230682373047, 0.007907867431640625, 0.008728504180908203, 0.009549140930175781, 0.01036977767944336, 0.011190414428710938, 0.012011051177978516, 0.012831687927246094, 0.013652324676513672, 0.01447296142578125, 0.015293598175048828, 0.016114234924316406, 0.016934871673583984, 0.017755508422851562, 0.01857614517211914, 0.01939678192138672, 0.020217418670654297, 0.021038055419921875, 0.021858692169189453, 0.02267932891845703, 0.02349996566772461, 0.024320602416992188, 0.025141239166259766, 0.025961875915527344, 0.026782512664794922, 0.0276031494140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 1.0, 9.0, 9.0, 11.0, 11.0, 14.0, 20.0, 31.0, 37.0, 40.0, 92.0, 121.0, 178.0, 262.0, 422.0, 687.0, 1173.0, 2059.0, 3785.0, 7214.0, 14894.0, 31702.0, 73130.0, 169647.0, 295376.0, 241603.0, 113593.0, 48157.0, 21876.0, 10404.0, 5269.0, 2791.0, 1512.0, 932.0, 527.0, 338.0, 208.0, 115.0, 111.0, 55.0, 40.0, 27.0, 16.0, 14.0, 8.0, 9.0, 11.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.041290283203125, -0.03998994827270508, -0.038689613342285156, -0.037389278411865234, -0.03608894348144531, -0.03478860855102539, -0.03348827362060547, -0.03218793869018555, -0.030887603759765625, -0.029587268829345703, -0.02828693389892578, -0.02698659896850586, -0.025686264038085938, -0.024385929107666016, -0.023085594177246094, -0.021785259246826172, -0.02048492431640625, -0.019184589385986328, -0.017884254455566406, -0.016583919525146484, -0.015283584594726562, -0.01398324966430664, -0.012682914733886719, -0.011382579803466797, -0.010082244873046875, -0.008781909942626953, -0.007481575012207031, -0.006181240081787109, -0.0048809051513671875, -0.0035805702209472656, -0.0022802352905273438, -0.0009799003601074219, 0.0003204345703125, 0.0016207695007324219, 0.0029211044311523438, 0.004221439361572266, 0.0055217742919921875, 0.006822109222412109, 0.008122444152832031, 0.009422779083251953, 0.010723114013671875, 0.012023448944091797, 0.013323783874511719, 0.01462411880493164, 0.015924453735351562, 0.017224788665771484, 0.018525123596191406, 0.019825458526611328, 0.02112579345703125, 0.022426128387451172, 0.023726463317871094, 0.025026798248291016, 0.026327133178710938, 0.02762746810913086, 0.02892780303955078, 0.030228137969970703, 0.031528472900390625, 0.03282880783081055, 0.03412914276123047, 0.03542947769165039, 0.03672981262207031, 0.038030147552490234, 0.039330482482910156, 0.04063081741333008, 0.04193115234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 5.0, 1.0, 5.0, 3.0, 18.0, 11.0, 10.0, 15.0, 16.0, 19.0, 36.0, 33.0, 38.0, 38.0, 30.0, 47.0, 38.0, 53.0, 42.0, 41.0, 43.0, 46.0, 49.0, 38.0, 33.0, 31.0, 27.0, 31.0, 29.0, 33.0, 33.0, 16.0, 20.0, 17.0, 10.0, 8.0, 11.0, 10.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0648193359375, -0.06276798248291016, -0.06071662902832031, -0.05866527557373047, -0.056613922119140625, -0.05456256866455078, -0.05251121520996094, -0.050459861755371094, -0.04840850830078125, -0.046357154846191406, -0.04430580139160156, -0.04225444793701172, -0.040203094482421875, -0.03815174102783203, -0.03610038757324219, -0.034049034118652344, -0.0319976806640625, -0.029946327209472656, -0.027894973754882812, -0.02584362030029297, -0.023792266845703125, -0.02174091339111328, -0.019689559936523438, -0.017638206481933594, -0.01558685302734375, -0.013535499572753906, -0.011484146118164062, -0.009432792663574219, -0.007381439208984375, -0.005330085754394531, -0.0032787322998046875, -0.0012273788452148438, 0.000823974609375, 0.0028753280639648438, 0.0049266815185546875, 0.006978034973144531, 0.009029388427734375, 0.011080741882324219, 0.013132095336914062, 0.015183448791503906, 0.01723480224609375, 0.019286155700683594, 0.021337509155273438, 0.02338886260986328, 0.025440216064453125, 0.02749156951904297, 0.029542922973632812, 0.031594276428222656, 0.0336456298828125, 0.035696983337402344, 0.03774833679199219, 0.03979969024658203, 0.041851043701171875, 0.04390239715576172, 0.04595375061035156, 0.048005104064941406, 0.05005645751953125, 0.052107810974121094, 0.05415916442871094, 0.05621051788330078, 0.058261871337890625, 0.06031322479248047, 0.06236457824707031, 0.06441593170166016, 0.06646728515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 12.0, 16.0, 14.0, 32.0, 54.0, 77.0, 118.0, 203.0, 415.0, 707.0, 1537.0, 4287.0, 17647.0, 118704.0, 542153.0, 306513.0, 43161.0, 8050.0, 2597.0, 1036.0, 498.0, 300.0, 151.0, 94.0, 57.0, 41.0, 19.0, 22.0, 11.0, 7.0, 6.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0299530029296875, -0.029038429260253906, -0.028123855590820312, -0.02720928192138672, -0.026294708251953125, -0.02538013458251953, -0.024465560913085938, -0.023550987243652344, -0.02263641357421875, -0.021721839904785156, -0.020807266235351562, -0.01989269256591797, -0.018978118896484375, -0.01806354522705078, -0.017148971557617188, -0.016234397888183594, -0.01531982421875, -0.014405250549316406, -0.013490676879882812, -0.012576103210449219, -0.011661529541015625, -0.010746955871582031, -0.009832382202148438, -0.008917808532714844, -0.00800323486328125, -0.007088661193847656, -0.0061740875244140625, -0.005259513854980469, -0.004344940185546875, -0.0034303665161132812, -0.0025157928466796875, -0.0016012191772460938, -0.0006866455078125, 0.00022792816162109375, 0.0011425018310546875, 0.0020570755004882812, 0.002971649169921875, 0.0038862228393554688, 0.0048007965087890625, 0.005715370178222656, 0.00662994384765625, 0.007544517517089844, 0.008459091186523438, 0.009373664855957031, 0.010288238525390625, 0.011202812194824219, 0.012117385864257812, 0.013031959533691406, 0.013946533203125, 0.014861106872558594, 0.015775680541992188, 0.01669025421142578, 0.017604827880859375, 0.01851940155029297, 0.019433975219726562, 0.020348548889160156, 0.02126312255859375, 0.022177696228027344, 0.023092269897460938, 0.02400684356689453, 0.024921417236328125, 0.02583599090576172, 0.026750564575195312, 0.027665138244628906, 0.0285797119140625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 6.0, 8.0, 18.0, 15.0, 29.0, 39.0, 56.0, 58.0, 90.0, 78.0, 71.0, 118.0, 68.0, 100.0, 51.0, 47.0, 34.0, 36.0, 24.0, 18.0, 16.0, 6.0, 9.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.761882781982422e-06, -8.49645584821701e-06, -8.231028914451599e-06, -7.965601980686188e-06, -7.700175046920776e-06, -7.434748113155365e-06, -7.169321179389954e-06, -6.903894245624542e-06, -6.638467311859131e-06, -6.3730403780937195e-06, -6.107613444328308e-06, -5.842186510562897e-06, -5.576759576797485e-06, -5.311332643032074e-06, -5.045905709266663e-06, -4.780478775501251e-06, -4.51505184173584e-06, -4.2496249079704285e-06, -3.984197974205017e-06, -3.7187710404396057e-06, -3.4533441066741943e-06, -3.187917172908783e-06, -2.9224902391433716e-06, -2.65706330537796e-06, -2.391636371612549e-06, -2.1262094378471375e-06, -1.860782504081726e-06, -1.5953555703163147e-06, -1.3299286365509033e-06, -1.064501702785492e-06, -7.990747690200806e-07, -5.336478352546692e-07, -2.682209014892578e-07, -2.7939677238464355e-09, 2.6263296604156494e-07, 5.280598998069763e-07, 7.934868335723877e-07, 1.058913767337799e-06, 1.3243407011032104e-06, 1.5897676348686218e-06, 1.8551945686340332e-06, 2.1206215023994446e-06, 2.386048436164856e-06, 2.6514753699302673e-06, 2.9169023036956787e-06, 3.18232923746109e-06, 3.4477561712265015e-06, 3.713183104991913e-06, 3.978610038757324e-06, 4.244036972522736e-06, 4.509463906288147e-06, 4.774890840053558e-06, 5.04031777381897e-06, 5.305744707584381e-06, 5.5711716413497925e-06, 5.836598575115204e-06, 6.102025508880615e-06, 6.367452442646027e-06, 6.632879376411438e-06, 6.898306310176849e-06, 7.163733243942261e-06, 7.429160177707672e-06, 7.694587111473083e-06, 7.960014045238495e-06, 8.225440979003906e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 7.0, 5.0, 15.0, 20.0, 13.0, 38.0, 43.0, 63.0, 124.0, 208.0, 408.0, 835.0, 2219.0, 9659.0, 82120.0, 550179.0, 355311.0, 38776.0, 5515.0, 1556.0, 675.0, 321.0, 152.0, 88.0, 60.0, 50.0, 22.0, 17.0, 21.0, 6.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031951904296875, -0.03091573715209961, -0.02987957000732422, -0.028843402862548828, -0.027807235717773438, -0.026771068572998047, -0.025734901428222656, -0.024698734283447266, -0.023662567138671875, -0.022626399993896484, -0.021590232849121094, -0.020554065704345703, -0.019517898559570312, -0.018481731414794922, -0.01744556427001953, -0.01640939712524414, -0.01537322998046875, -0.01433706283569336, -0.013300895690917969, -0.012264728546142578, -0.011228561401367188, -0.010192394256591797, -0.009156227111816406, -0.008120059967041016, -0.007083892822265625, -0.006047725677490234, -0.005011558532714844, -0.003975391387939453, -0.0029392242431640625, -0.0019030570983886719, -0.0008668899536132812, 0.00016927719116210938, 0.0012054443359375, 0.0022416114807128906, 0.0032777786254882812, 0.004313945770263672, 0.0053501129150390625, 0.006386280059814453, 0.007422447204589844, 0.008458614349365234, 0.009494781494140625, 0.010530948638916016, 0.011567115783691406, 0.012603282928466797, 0.013639450073242188, 0.014675617218017578, 0.01571178436279297, 0.01674795150756836, 0.01778411865234375, 0.01882028579711914, 0.01985645294189453, 0.020892620086669922, 0.021928787231445312, 0.022964954376220703, 0.024001121520996094, 0.025037288665771484, 0.026073455810546875, 0.027109622955322266, 0.028145790100097656, 0.029181957244873047, 0.030218124389648438, 0.03125429153442383, 0.03229045867919922, 0.03332662582397461, 0.03436279296875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 10.0, 6.0, 8.0, 15.0, 17.0, 25.0, 29.0, 23.0, 37.0, 57.0, 63.0, 65.0, 62.0, 78.0, 79.0, 74.0, 74.0, 68.0, 45.0, 38.0, 26.0, 22.0, 15.0, 14.0, 12.0, 6.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02801513671875, -0.027238845825195312, -0.026462554931640625, -0.025686264038085938, -0.02490997314453125, -0.024133682250976562, -0.023357391357421875, -0.022581100463867188, -0.0218048095703125, -0.021028518676757812, -0.020252227783203125, -0.019475936889648438, -0.01869964599609375, -0.017923355102539062, -0.017147064208984375, -0.016370773315429688, -0.015594482421875, -0.014818191528320312, -0.014041900634765625, -0.013265609741210938, -0.01248931884765625, -0.011713027954101562, -0.010936737060546875, -0.010160446166992188, -0.0093841552734375, -0.008607864379882812, -0.007831573486328125, -0.0070552825927734375, -0.00627899169921875, -0.0055027008056640625, -0.004726409912109375, -0.0039501190185546875, -0.003173828125, -0.0023975372314453125, -0.001621246337890625, -0.0008449554443359375, -6.866455078125e-05, 0.0007076263427734375, 0.001483917236328125, 0.0022602081298828125, 0.0030364990234375, 0.0038127899169921875, 0.004589080810546875, 0.0053653717041015625, 0.00614166259765625, 0.0069179534912109375, 0.007694244384765625, 0.008470535278320312, 0.009246826171875, 0.010023117065429688, 0.010799407958984375, 0.011575698852539062, 0.01235198974609375, 0.013128280639648438, 0.013904571533203125, 0.014680862426757812, 0.0154571533203125, 0.016233444213867188, 0.017009735107421875, 0.017786026000976562, 0.01856231689453125, 0.019338607788085938, 0.020114898681640625, 0.020891189575195312, 0.02166748046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 40.0, 309.0, 574.0, 76.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.738105833530426, -0.6659846305847168, -0.5938633680343628, -0.5217421650886536, -0.44962096214294434, -0.3774997591972351, -0.3053785264492035, -0.23325729370117188, -0.16113609075546265, -0.08901487290859222, -0.016893655061721802, 0.05522756278514862, 0.12734878063201904, 0.19946998357772827, 0.2715912163257599, 0.3437124490737915, 0.41583365201950073, 0.48795485496520996, 0.560076117515564, 0.6321973204612732, 0.7043185234069824, 0.7764397263526917, 0.8485609292984009, 0.9206821918487549, 0.9928033947944641, 1.0649245977401733, 1.1370458602905273, 1.2091670036315918, 1.2812882661819458, 1.3534095287322998, 1.4255306720733643, 1.4976519346237183, 1.5697731971740723, 1.6418944597244263, 1.7140156030654907, 1.7861368656158447, 1.8582580089569092, 1.9303792715072632, 2.002500534057617, 2.0746216773986816, 2.146742820739746, 2.2188639640808105, 2.290985345840454, 2.3631064891815186, 2.435227632522583, 2.5073490142822266, 2.579470157623291, 2.6515913009643555, 2.723712682723999, 2.7958338260650635, 2.867955207824707, 2.9400763511657715, 3.012197494506836, 3.0843186378479004, 3.156440019607544, 3.2285611629486084, 3.300682544708252, 3.3728036880493164, 3.44492506980896, 3.5170462131500244, 3.589167356491089, 3.6612887382507324, 3.733409881591797, 3.8055310249328613, 3.877652168273926]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 11.0, 11.0, 13.0, 13.0, 14.0, 11.0, 20.0, 20.0, 19.0, 23.0, 34.0, 25.0, 34.0, 43.0, 28.0, 45.0, 45.0, 42.0, 38.0, 53.0, 54.0, 46.0, 36.0, 35.0, 30.0, 37.0, 27.0, 33.0, 19.0, 12.0, 22.0, 16.0, 22.0, 9.0, 14.0, 7.0, 9.0, 4.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32423484325408936, -0.3133905231952667, -0.3025461733341217, -0.2917018532752991, -0.28085750341415405, -0.2700131833553314, -0.2591688632965088, -0.24832452833652496, -0.23748019337654114, -0.2266358584165573, -0.2157915234565735, -0.20494720339775085, -0.19410286843776703, -0.1832585334777832, -0.17241421341896057, -0.16156987845897675, -0.15072554349899292, -0.1398812085390091, -0.12903687357902527, -0.11819255352020264, -0.10734821856021881, -0.09650388360023499, -0.08565955609083176, -0.07481522858142853, -0.0639708936214447, -0.053126562386751175, -0.04228223115205765, -0.03143789991736412, -0.020593568682670593, -0.009749237447977066, 0.0010950937867164612, 0.01193942129611969, 0.022783756256103516, 0.03362808749079704, 0.04447241872549057, 0.0553167499601841, 0.06616108119487762, 0.07700541615486145, 0.08784974366426468, 0.09869407117366791, 0.10953840613365173, 0.12038274109363556, 0.13122707605361938, 0.14207139611244202, 0.15291573107242584, 0.16376006603240967, 0.1746043860912323, 0.18544872105121613, 0.19629305601119995, 0.20713739097118378, 0.2179817259311676, 0.22882604598999023, 0.23967038094997406, 0.2505147159099579, 0.2613590359687805, 0.27220338582992554, 0.28304770588874817, 0.2938920259475708, 0.3047363758087158, 0.31558069586753845, 0.3264250159263611, 0.3372693657875061, 0.34811368584632874, 0.35895800590515137, 0.3698023557662964]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 6.0, 9.0, 20.0, 55.0, 119.0, 568.0, 9071.0, 4146251.0, 36936.0, 942.0, 183.0, 60.0, 30.0, 16.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2276611328125, -0.21607017517089844, -0.20447921752929688, -0.1928882598876953, -0.18129730224609375, -0.1697063446044922, -0.15811538696289062, -0.14652442932128906, -0.1349334716796875, -0.12334251403808594, -0.11175155639648438, -0.10016059875488281, -0.08856964111328125, -0.07697868347167969, -0.06538772583007812, -0.05379676818847656, -0.042205810546875, -0.030614852905273438, -0.019023895263671875, -0.0074329376220703125, 0.00415802001953125, 0.015748977661132812, 0.027339935302734375, 0.03893089294433594, 0.0505218505859375, 0.06211280822753906, 0.07370376586914062, 0.08529472351074219, 0.09688568115234375, 0.10847663879394531, 0.12006759643554688, 0.13165855407714844, 0.14324951171875, 0.15484046936035156, 0.16643142700195312, 0.1780223846435547, 0.18961334228515625, 0.2012042999267578, 0.21279525756835938, 0.22438621520996094, 0.2359771728515625, 0.24756813049316406, 0.2591590881347656, 0.2707500457763672, 0.28234100341796875, 0.2939319610595703, 0.3055229187011719, 0.31711387634277344, 0.328704833984375, 0.34029579162597656, 0.3518867492675781, 0.3634777069091797, 0.37506866455078125, 0.3866596221923828, 0.3982505798339844, 0.40984153747558594, 0.4214324951171875, 0.43302345275878906, 0.4446144104003906, 0.4562053680419922, 0.46779632568359375, 0.4793872833251953, 0.4909782409667969, 0.5025691986083984, 0.51416015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 11.0, 10.0, 20.0, 19.0, 33.0, 30.0, 33.0, 40.0, 35.0, 51.0, 52.0, 62.0, 55.0, 73.0, 64.0, 60.0, 63.0, 41.0, 47.0, 37.0, 33.0, 21.0, 17.0, 28.0, 18.0, 7.0, 8.0, 6.0, 4.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0242767333984375, -0.02352738380432129, -0.022778034210205078, -0.022028684616088867, -0.021279335021972656, -0.020529985427856445, -0.019780635833740234, -0.019031286239624023, -0.018281936645507812, -0.0175325870513916, -0.01678323745727539, -0.01603388786315918, -0.015284538269042969, -0.014535188674926758, -0.013785839080810547, -0.013036489486694336, -0.012287139892578125, -0.011537790298461914, -0.010788440704345703, -0.010039091110229492, -0.009289741516113281, -0.00854039192199707, -0.007791042327880859, -0.0070416927337646484, -0.0062923431396484375, -0.0055429935455322266, -0.004793643951416016, -0.004044294357299805, -0.0032949447631835938, -0.002545595169067383, -0.0017962455749511719, -0.001046895980834961, -0.00029754638671875, 0.00045180320739746094, 0.0012011528015136719, 0.0019505023956298828, 0.0026998519897460938, 0.0034492015838623047, 0.004198551177978516, 0.0049479007720947266, 0.0056972503662109375, 0.0064465999603271484, 0.007195949554443359, 0.00794529914855957, 0.008694648742675781, 0.009443998336791992, 0.010193347930908203, 0.010942697525024414, 0.011692047119140625, 0.012441396713256836, 0.013190746307373047, 0.013940095901489258, 0.014689445495605469, 0.01543879508972168, 0.01618814468383789, 0.0169374942779541, 0.017686843872070312, 0.018436193466186523, 0.019185543060302734, 0.019934892654418945, 0.020684242248535156, 0.021433591842651367, 0.022182941436767578, 0.02293229103088379, 0.023681640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 8.0, 14.0, 21.0, 25.0, 54.0, 81.0, 163.0, 247.0, 485.0, 1127.0, 3939.0, 25930.0, 1187441.0, 2927649.0, 39723.0, 5052.0, 1260.0, 502.0, 238.0, 119.0, 78.0, 49.0, 26.0, 20.0, 9.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10601806640625, -0.1023721694946289, -0.09872627258300781, -0.09508037567138672, -0.09143447875976562, -0.08778858184814453, -0.08414268493652344, -0.08049678802490234, -0.07685089111328125, -0.07320499420166016, -0.06955909729003906, -0.06591320037841797, -0.062267303466796875, -0.05862140655517578, -0.05497550964355469, -0.051329612731933594, -0.0476837158203125, -0.044037818908691406, -0.04039192199707031, -0.03674602508544922, -0.033100128173828125, -0.02945423126220703, -0.025808334350585938, -0.022162437438964844, -0.01851654052734375, -0.014870643615722656, -0.011224746704101562, -0.007578849792480469, -0.003932952880859375, -0.00028705596923828125, 0.0033588409423828125, 0.007004737854003906, 0.010650634765625, 0.014296531677246094, 0.017942428588867188, 0.02158832550048828, 0.025234222412109375, 0.02888011932373047, 0.03252601623535156, 0.036171913146972656, 0.03981781005859375, 0.043463706970214844, 0.04710960388183594, 0.05075550079345703, 0.054401397705078125, 0.05804729461669922, 0.06169319152832031, 0.0653390884399414, 0.0689849853515625, 0.0726308822631836, 0.07627677917480469, 0.07992267608642578, 0.08356857299804688, 0.08721446990966797, 0.09086036682128906, 0.09450626373291016, 0.09815216064453125, 0.10179805755615234, 0.10544395446777344, 0.10908985137939453, 0.11273574829101562, 0.11638164520263672, 0.12002754211425781, 0.1236734390258789, 0.1273193359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 16.0, 20.0, 55.0, 128.0, 340.0, 1319.0, 1488.0, 414.0, 161.0, 59.0, 22.0, 15.0, 7.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.070556640625, -0.06879520416259766, -0.06703376770019531, -0.06527233123779297, -0.06351089477539062, -0.06174945831298828, -0.05998802185058594, -0.058226585388183594, -0.05646514892578125, -0.054703712463378906, -0.05294227600097656, -0.05118083953857422, -0.049419403076171875, -0.04765796661376953, -0.04589653015136719, -0.044135093688964844, -0.0423736572265625, -0.040612220764160156, -0.03885078430175781, -0.03708934783935547, -0.035327911376953125, -0.03356647491455078, -0.03180503845214844, -0.030043601989746094, -0.02828216552734375, -0.026520729064941406, -0.024759292602539062, -0.02299785614013672, -0.021236419677734375, -0.01947498321533203, -0.017713546752929688, -0.015952110290527344, -0.014190673828125, -0.012429237365722656, -0.010667800903320312, -0.008906364440917969, -0.007144927978515625, -0.005383491516113281, -0.0036220550537109375, -0.0018606185913085938, -9.918212890625e-05, 0.0016622543334960938, 0.0034236907958984375, 0.005185127258300781, 0.006946563720703125, 0.008708000183105469, 0.010469436645507812, 0.012230873107910156, 0.0139923095703125, 0.015753746032714844, 0.017515182495117188, 0.01927661895751953, 0.021038055419921875, 0.02279949188232422, 0.024560928344726562, 0.026322364807128906, 0.02808380126953125, 0.029845237731933594, 0.03160667419433594, 0.03336811065673828, 0.035129547119140625, 0.03689098358154297, 0.03865242004394531, 0.040413856506347656, 0.04217529296875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 10.0, 11.0, 44.0, 164.0, 396.0, 279.0, 88.0, 16.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5058526992797852, -0.48882973194122314, -0.47180676460266113, -0.4547837972640991, -0.4377608299255371, -0.4207378625869751, -0.4037148952484131, -0.3866919279098511, -0.36966896057128906, -0.35264599323272705, -0.33562302589416504, -0.318600058555603, -0.301577091217041, -0.284554123878479, -0.267531156539917, -0.250508189201355, -0.23348522186279297, -0.21646225452423096, -0.19943928718566895, -0.18241631984710693, -0.16539335250854492, -0.1483703851699829, -0.1313474178314209, -0.11432445049285889, -0.09730148315429688, -0.08027851581573486, -0.06325554847717285, -0.04623258113861084, -0.029209613800048828, -0.012186646461486816, 0.004836320877075195, 0.021859288215637207, 0.03888225555419922, 0.05590522289276123, 0.07292819023132324, 0.08995115756988525, 0.10697412490844727, 0.12399709224700928, 0.1410200595855713, 0.1580430269241333, 0.1750659942626953, 0.19208896160125732, 0.20911192893981934, 0.22613489627838135, 0.24315786361694336, 0.26018083095550537, 0.2772037982940674, 0.2942267656326294, 0.3112497329711914, 0.3282727003097534, 0.34529566764831543, 0.36231863498687744, 0.37934160232543945, 0.39636456966400146, 0.4133875370025635, 0.4304105043411255, 0.4474334716796875, 0.4644564390182495, 0.4814794063568115, 0.49850237369537354, 0.5155253410339355, 0.5325483083724976, 0.5495712757110596, 0.5665942430496216, 0.5836172103881836]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 8.0, 21.0, 22.0, 27.0, 39.0, 45.0, 47.0, 73.0, 60.0, 80.0, 80.0, 89.0, 67.0, 76.0, 59.0, 48.0, 45.0, 30.0, 23.0, 16.0, 13.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2014034390449524, -0.19624276459217072, -0.19108209013938904, -0.18592143058776855, -0.18076075613498688, -0.1756000816822052, -0.17043940722942352, -0.16527873277664185, -0.16011807322502136, -0.15495739877223969, -0.149796724319458, -0.14463606476783752, -0.13947539031505585, -0.13431471586227417, -0.1291540414094925, -0.12399336695671082, -0.11883269250392914, -0.11367201805114746, -0.10851135104894638, -0.1033506765961647, -0.09819000959396362, -0.09302933514118195, -0.08786866068840027, -0.08270798623561859, -0.07754731923341751, -0.07238664478063583, -0.06722597777843475, -0.062065303325653076, -0.0569046325981617, -0.05174396187067032, -0.04658328741788864, -0.04142261669039726, -0.036261945962905884, -0.031101275235414505, -0.025940602645277977, -0.02077993005514145, -0.01561925932765007, -0.010458588600158691, -0.005297916010022163, -0.00013724341988563538, 0.005023427307605743, 0.010184098966419697, 0.01534477062523365, 0.020505443215370178, 0.025666113942861557, 0.030826784670352936, 0.03598745912313461, 0.04114812985062599, 0.04630880057811737, 0.05146947130560875, 0.05663014203310013, 0.061790816485881805, 0.06695148348808289, 0.07211215794086456, 0.07727283239364624, 0.08243350684642792, 0.087594173848629, 0.09275484830141068, 0.09791551530361176, 0.10307618975639343, 0.10823686420917511, 0.11339753121137619, 0.11855820566415787, 0.12371887266635895, 0.12887954711914062]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 5.0, 4.0, 6.0, 17.0, 26.0, 35.0, 47.0, 85.0, 140.0, 246.0, 452.0, 902.0, 1978.0, 4590.0, 12826.0, 45429.0, 224997.0, 547775.0, 157695.0, 33957.0, 10143.0, 3785.0, 1713.0, 790.0, 366.0, 217.0, 118.0, 76.0, 46.0, 40.0, 22.0, 6.0, 8.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.099853515625, -0.09667301177978516, -0.09349250793457031, -0.09031200408935547, -0.08713150024414062, -0.08395099639892578, -0.08077049255371094, -0.0775899887084961, -0.07440948486328125, -0.0712289810180664, -0.06804847717285156, -0.06486797332763672, -0.061687469482421875, -0.05850696563720703, -0.05532646179199219, -0.052145957946777344, -0.0489654541015625, -0.045784950256347656, -0.04260444641113281, -0.03942394256591797, -0.036243438720703125, -0.03306293487548828, -0.029882431030273438, -0.026701927185058594, -0.02352142333984375, -0.020340919494628906, -0.017160415649414062, -0.013979911804199219, -0.010799407958984375, -0.007618904113769531, -0.0044384002685546875, -0.0012578964233398438, 0.001922607421875, 0.005103111267089844, 0.008283615112304688, 0.011464118957519531, 0.014644622802734375, 0.01782512664794922, 0.021005630493164062, 0.024186134338378906, 0.02736663818359375, 0.030547142028808594, 0.03372764587402344, 0.03690814971923828, 0.040088653564453125, 0.04326915740966797, 0.04644966125488281, 0.049630165100097656, 0.0528106689453125, 0.055991172790527344, 0.05917167663574219, 0.06235218048095703, 0.06553268432617188, 0.06871318817138672, 0.07189369201660156, 0.0750741958618164, 0.07825469970703125, 0.0814352035522461, 0.08461570739746094, 0.08779621124267578, 0.09097671508789062, 0.09415721893310547, 0.09733772277832031, 0.10051822662353516, 0.10369873046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 6.0, 11.0, 8.0, 18.0, 19.0, 34.0, 34.0, 34.0, 60.0, 46.0, 56.0, 64.0, 71.0, 79.0, 73.0, 60.0, 57.0, 53.0, 45.0, 36.0, 29.0, 22.0, 16.0, 22.0, 11.0, 6.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252227783203125, -0.02439117431640625, -0.0235595703125, -0.02272796630859375, -0.0218963623046875, -0.02106475830078125, -0.020233154296875, -0.01940155029296875, -0.0185699462890625, -0.01773834228515625, -0.01690673828125, -0.01607513427734375, -0.0152435302734375, -0.01441192626953125, -0.013580322265625, -0.01274871826171875, -0.0119171142578125, -0.01108551025390625, -0.01025390625, -0.00942230224609375, -0.0085906982421875, -0.00775909423828125, -0.006927490234375, -0.00609588623046875, -0.0052642822265625, -0.00443267822265625, -0.00360107421875, -0.00276947021484375, -0.0019378662109375, -0.00110626220703125, -0.000274658203125, 0.00055694580078125, 0.0013885498046875, 0.00222015380859375, 0.0030517578125, 0.00388336181640625, 0.0047149658203125, 0.00554656982421875, 0.006378173828125, 0.00720977783203125, 0.0080413818359375, 0.00887298583984375, 0.00970458984375, 0.01053619384765625, 0.0113677978515625, 0.01219940185546875, 0.013031005859375, 0.01386260986328125, 0.0146942138671875, 0.01552581787109375, 0.016357421875, 0.01718902587890625, 0.0180206298828125, 0.01885223388671875, 0.019683837890625, 0.02051544189453125, 0.0213470458984375, 0.02217864990234375, 0.02301025390625, 0.02384185791015625, 0.0246734619140625, 0.02550506591796875, 0.026336669921875, 0.02716827392578125, 0.0279998779296875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 12.0, 22.0, 21.0, 42.0, 51.0, 90.0, 158.0, 311.0, 638.0, 1461.0, 3751.0, 10633.0, 34402.0, 137273.0, 447671.0, 306357.0, 74311.0, 20108.0, 6653.0, 2460.0, 1050.0, 459.0, 239.0, 137.0, 99.0, 50.0, 29.0, 11.0, 13.0, 3.0, 7.0, 7.0, 3.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06976318359375, -0.06749725341796875, -0.0652313232421875, -0.06296539306640625, -0.060699462890625, -0.05843353271484375, -0.0561676025390625, -0.05390167236328125, -0.0516357421875, -0.04936981201171875, -0.0471038818359375, -0.04483795166015625, -0.042572021484375, -0.04030609130859375, -0.0380401611328125, -0.03577423095703125, -0.03350830078125, -0.03124237060546875, -0.0289764404296875, -0.02671051025390625, -0.024444580078125, -0.02217864990234375, -0.0199127197265625, -0.01764678955078125, -0.015380859375, -0.01311492919921875, -0.0108489990234375, -0.00858306884765625, -0.006317138671875, -0.00405120849609375, -0.0017852783203125, 0.00048065185546875, 0.00274658203125, 0.00501251220703125, 0.0072784423828125, 0.00954437255859375, 0.011810302734375, 0.01407623291015625, 0.0163421630859375, 0.01860809326171875, 0.0208740234375, 0.02313995361328125, 0.0254058837890625, 0.02767181396484375, 0.029937744140625, 0.03220367431640625, 0.0344696044921875, 0.03673553466796875, 0.03900146484375, 0.04126739501953125, 0.0435333251953125, 0.04579925537109375, 0.048065185546875, 0.05033111572265625, 0.0525970458984375, 0.05486297607421875, 0.05712890625, 0.05939483642578125, 0.0616607666015625, 0.06392669677734375, 0.066192626953125, 0.06845855712890625, 0.0707244873046875, 0.07299041748046875, 0.07525634765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 13.0, 6.0, 7.0, 7.0, 12.0, 23.0, 18.0, 14.0, 26.0, 31.0, 33.0, 48.0, 42.0, 35.0, 58.0, 34.0, 46.0, 48.0, 56.0, 53.0, 43.0, 48.0, 41.0, 30.0, 35.0, 45.0, 30.0, 21.0, 22.0, 15.0, 13.0, 11.0, 11.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0802001953125, -0.0776662826538086, -0.07513236999511719, -0.07259845733642578, -0.07006454467773438, -0.06753063201904297, -0.06499671936035156, -0.062462806701660156, -0.05992889404296875, -0.057394981384277344, -0.05486106872558594, -0.05232715606689453, -0.049793243408203125, -0.04725933074951172, -0.04472541809082031, -0.042191505432128906, -0.0396575927734375, -0.037123680114746094, -0.03458976745605469, -0.03205585479736328, -0.029521942138671875, -0.02698802947998047, -0.024454116821289062, -0.021920204162597656, -0.01938629150390625, -0.016852378845214844, -0.014318466186523438, -0.011784553527832031, -0.009250640869140625, -0.006716728210449219, -0.0041828155517578125, -0.0016489028930664062, 0.000885009765625, 0.0034189224243164062, 0.0059528350830078125, 0.008486747741699219, 0.011020660400390625, 0.013554573059082031, 0.016088485717773438, 0.018622398376464844, 0.02115631103515625, 0.023690223693847656, 0.026224136352539062, 0.02875804901123047, 0.031291961669921875, 0.03382587432861328, 0.03635978698730469, 0.038893699645996094, 0.0414276123046875, 0.043961524963378906, 0.04649543762207031, 0.04902935028076172, 0.051563262939453125, 0.05409717559814453, 0.05663108825683594, 0.059165000915527344, 0.06169891357421875, 0.06423282623291016, 0.06676673889160156, 0.06930065155029297, 0.07183456420898438, 0.07436847686767578, 0.07690238952636719, 0.0794363021850586, 0.08197021484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 10.0, 6.0, 14.0, 18.0, 33.0, 75.0, 126.0, 244.0, 458.0, 1029.0, 3278.0, 90982.0, 924512.0, 24028.0, 2135.0, 786.0, 378.0, 199.0, 100.0, 76.0, 34.0, 20.0, 9.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08056640625, -0.0779123306274414, -0.07525825500488281, -0.07260417938232422, -0.06995010375976562, -0.06729602813720703, -0.06464195251464844, -0.061987876892089844, -0.05933380126953125, -0.056679725646972656, -0.05402565002441406, -0.05137157440185547, -0.048717498779296875, -0.04606342315673828, -0.04340934753417969, -0.040755271911621094, -0.0381011962890625, -0.035447120666503906, -0.03279304504394531, -0.03013896942138672, -0.027484893798828125, -0.02483081817626953, -0.022176742553710938, -0.019522666931152344, -0.01686859130859375, -0.014214515686035156, -0.011560440063476562, -0.008906364440917969, -0.006252288818359375, -0.0035982131958007812, -0.0009441375732421875, 0.0017099380493164062, 0.004364013671875, 0.007018089294433594, 0.009672164916992188, 0.012326240539550781, 0.014980316162109375, 0.01763439178466797, 0.020288467407226562, 0.022942543029785156, 0.02559661865234375, 0.028250694274902344, 0.030904769897460938, 0.03355884552001953, 0.036212921142578125, 0.03886699676513672, 0.04152107238769531, 0.044175148010253906, 0.0468292236328125, 0.049483299255371094, 0.05213737487792969, 0.05479145050048828, 0.057445526123046875, 0.06009960174560547, 0.06275367736816406, 0.06540775299072266, 0.06806182861328125, 0.07071590423583984, 0.07336997985839844, 0.07602405548095703, 0.07867813110351562, 0.08133220672607422, 0.08398628234863281, 0.0866403579711914, 0.08929443359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 17.0, 16.0, 39.0, 76.0, 109.0, 118.0, 139.0, 147.0, 115.0, 83.0, 49.0, 47.0, 23.0, 9.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3589859008789062e-05, -1.3163313269615173e-05, -1.2736767530441284e-05, -1.2310221791267395e-05, -1.1883676052093506e-05, -1.1457130312919617e-05, -1.1030584573745728e-05, -1.0604038834571838e-05, -1.017749309539795e-05, -9.75094735622406e-06, -9.324401617050171e-06, -8.897855877876282e-06, -8.471310138702393e-06, -8.044764399528503e-06, -7.618218660354614e-06, -7.191672921180725e-06, -6.765127182006836e-06, -6.338581442832947e-06, -5.912035703659058e-06, -5.4854899644851685e-06, -5.058944225311279e-06, -4.63239848613739e-06, -4.205852746963501e-06, -3.779307007789612e-06, -3.3527612686157227e-06, -2.9262155294418335e-06, -2.4996697902679443e-06, -2.073124051094055e-06, -1.646578311920166e-06, -1.2200325727462769e-06, -7.934868335723877e-07, -3.6694109439849854e-07, 5.960464477539063e-08, 4.861503839492798e-07, 9.126961231231689e-07, 1.339241862297058e-06, 1.7657876014709473e-06, 2.1923333406448364e-06, 2.6188790798187256e-06, 3.0454248189926147e-06, 3.471970558166504e-06, 3.898516297340393e-06, 4.325062036514282e-06, 4.751607775688171e-06, 5.1781535148620605e-06, 5.60469925403595e-06, 6.031244993209839e-06, 6.457790732383728e-06, 6.884336471557617e-06, 7.310882210731506e-06, 7.737427949905396e-06, 8.163973689079285e-06, 8.590519428253174e-06, 9.017065167427063e-06, 9.443610906600952e-06, 9.870156645774841e-06, 1.029670238494873e-05, 1.072324812412262e-05, 1.1149793863296509e-05, 1.1576339602470398e-05, 1.2002885341644287e-05, 1.2429431080818176e-05, 1.2855976819992065e-05, 1.3282522559165955e-05, 1.3709068298339844e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 3.0, 5.0, 21.0, 25.0, 35.0, 61.0, 116.0, 200.0, 418.0, 1135.0, 4938.0, 72451.0, 865959.0, 95351.0, 5693.0, 1168.0, 418.0, 217.0, 137.0, 63.0, 61.0, 18.0, 20.0, 14.0, 9.0, 0.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06390380859375, -0.06193971633911133, -0.059975624084472656, -0.058011531829833984, -0.05604743957519531, -0.05408334732055664, -0.05211925506591797, -0.0501551628112793, -0.048191070556640625, -0.04622697830200195, -0.04426288604736328, -0.04229879379272461, -0.04033470153808594, -0.038370609283447266, -0.036406517028808594, -0.03444242477416992, -0.03247833251953125, -0.030514240264892578, -0.028550148010253906, -0.026586055755615234, -0.024621963500976562, -0.02265787124633789, -0.02069377899169922, -0.018729686737060547, -0.016765594482421875, -0.014801502227783203, -0.012837409973144531, -0.01087331771850586, -0.008909225463867188, -0.006945133209228516, -0.004981040954589844, -0.003016948699951172, -0.0010528564453125, 0.0009112358093261719, 0.0028753280639648438, 0.004839420318603516, 0.0068035125732421875, 0.00876760482788086, 0.010731697082519531, 0.012695789337158203, 0.014659881591796875, 0.016623973846435547, 0.01858806610107422, 0.02055215835571289, 0.022516250610351562, 0.024480342864990234, 0.026444435119628906, 0.028408527374267578, 0.03037261962890625, 0.03233671188354492, 0.034300804138183594, 0.036264896392822266, 0.03822898864746094, 0.04019308090209961, 0.04215717315673828, 0.04412126541137695, 0.046085357666015625, 0.0480494499206543, 0.05001354217529297, 0.05197763442993164, 0.05394172668457031, 0.055905818939208984, 0.057869911193847656, 0.05983400344848633, 0.061798095703125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 13.0, 31.0, 33.0, 42.0, 69.0, 109.0, 133.0, 120.0, 136.0, 98.0, 75.0, 53.0, 33.0, 20.0, 15.0, 11.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0506591796875, -0.04866218566894531, -0.046665191650390625, -0.04466819763183594, -0.04267120361328125, -0.04067420959472656, -0.038677215576171875, -0.03668022155761719, -0.0346832275390625, -0.03268623352050781, -0.030689239501953125, -0.028692245483398438, -0.02669525146484375, -0.024698257446289062, -0.022701263427734375, -0.020704269409179688, -0.018707275390625, -0.016710281372070312, -0.014713287353515625, -0.012716293334960938, -0.01071929931640625, -0.008722305297851562, -0.006725311279296875, -0.0047283172607421875, -0.0027313232421875, -0.0007343292236328125, 0.001262664794921875, 0.0032596588134765625, 0.00525665283203125, 0.0072536468505859375, 0.009250640869140625, 0.011247634887695312, 0.01324462890625, 0.015241622924804688, 0.017238616943359375, 0.019235610961914062, 0.02123260498046875, 0.023229598999023438, 0.025226593017578125, 0.027223587036132812, 0.0292205810546875, 0.031217575073242188, 0.033214569091796875, 0.03521156311035156, 0.03720855712890625, 0.03920555114746094, 0.041202545166015625, 0.04319953918457031, 0.045196533203125, 0.04719352722167969, 0.049190521240234375, 0.05118751525878906, 0.05318450927734375, 0.05518150329589844, 0.057178497314453125, 0.05917549133300781, 0.0611724853515625, 0.06316947937011719, 0.06516647338867188, 0.06716346740722656, 0.06916046142578125, 0.07115745544433594, 0.07315444946289062, 0.07515144348144531, 0.0771484375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 26.0, 48.0, 99.0, 197.0, 245.0, 194.0, 93.0, 49.0, 16.0, 11.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35292643308639526, -0.3271464705467224, -0.30136650800704956, -0.2755865752696991, -0.24980661273002625, -0.2240266501903534, -0.19824670255184174, -0.17246675491333008, -0.14668679237365723, -0.12090683728456497, -0.09512688219547272, -0.06934692710638046, -0.04356697201728821, -0.017787009477615356, 0.007992938160896301, 0.03377288579940796, 0.05955284833908081, 0.08533280342817307, 0.11111275851726532, 0.13689270615577698, 0.16267266869544983, 0.18845263123512268, 0.21423257887363434, 0.240012526512146, 0.26579248905181885, 0.2915724515914917, 0.31735241413116455, 0.343132346868515, 0.36891230940818787, 0.3946922719478607, 0.4204722046852112, 0.44625216722488403, 0.4720320701599121, 0.49781203269958496, 0.5235919952392578, 0.5493719577789307, 0.5751519203186035, 0.6009318828582764, 0.6267117857933044, 0.6524917483329773, 0.6782717108726501, 0.704051673412323, 0.7298316359519958, 0.7556115984916687, 0.7813915014266968, 0.8071714639663696, 0.8329514265060425, 0.8587313890457153, 0.8845113515853882, 0.910291314125061, 0.9360712766647339, 0.9618512392044067, 0.9876312017440796, 1.0134111642837524, 1.0391911268234253, 1.0649709701538086, 1.0907509326934814, 1.1165308952331543, 1.1423108577728271, 1.1680908203125, 1.1938707828521729, 1.2196507453918457, 1.2454307079315186, 1.2712106704711914, 1.2969906330108643]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 3.0, 2.0, 3.0, 8.0, 6.0, 15.0, 11.0, 14.0, 14.0, 10.0, 24.0, 26.0, 23.0, 32.0, 25.0, 28.0, 33.0, 37.0, 34.0, 48.0, 40.0, 40.0, 30.0, 41.0, 36.0, 30.0, 43.0, 37.0, 40.0, 29.0, 33.0, 29.0, 26.0, 30.0, 18.0, 20.0, 13.0, 18.0, 4.0, 8.0, 7.0, 5.0, 6.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31715041399002075, -0.3067113161087036, -0.2962721884250641, -0.28583309054374695, -0.2753939628601074, -0.2649548649787903, -0.25451573729515076, -0.24407663941383362, -0.2336375117301941, -0.22319839894771576, -0.21275928616523743, -0.2023201733827591, -0.19188106060028076, -0.18144194781780243, -0.1710028350353241, -0.16056373715400696, -0.15012462437152863, -0.1396855115890503, -0.12924639880657196, -0.11880728602409363, -0.1083681732416153, -0.09792906045913696, -0.08748995512723923, -0.0770508423447609, -0.06661172956228256, -0.05617261677980423, -0.0457335039973259, -0.03529439494013786, -0.02485528215765953, -0.014416169375181198, -0.003977060317993164, 0.0064620524644851685, 0.0169011652469635, 0.027340278029441833, 0.037779390811920166, 0.0482184998691082, 0.05865761265158653, 0.06909672915935516, 0.0795358344912529, 0.08997494727373123, 0.10041406005620956, 0.1108531728386879, 0.12129228562116623, 0.13173139095306396, 0.1421705037355423, 0.15260961651802063, 0.16304872930049896, 0.1734878420829773, 0.18392695486545563, 0.19436606764793396, 0.2048051804304123, 0.21524429321289062, 0.22568340599536896, 0.2361225187778473, 0.24656161665916443, 0.25700074434280396, 0.2674398422241211, 0.27787894010543823, 0.28831806778907776, 0.2987571656703949, 0.3091962933540344, 0.31963539123535156, 0.3300745189189911, 0.3405136168003082, 0.35095274448394775]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 12.0, 25.0, 28.0, 43.0, 55.0, 114.0, 172.0, 384.0, 759.0, 1747.0, 5221.0, 24567.0, 491087.0, 3596033.0, 60748.0, 8732.0, 2508.0, 1025.0, 475.0, 235.0, 123.0, 73.0, 36.0, 22.0, 16.0, 13.0, 3.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08306884765625, -0.0797719955444336, -0.07647514343261719, -0.07317829132080078, -0.06988143920898438, -0.06658458709716797, -0.06328773498535156, -0.059990882873535156, -0.05669403076171875, -0.053397178649902344, -0.05010032653808594, -0.04680347442626953, -0.043506622314453125, -0.04020977020263672, -0.03691291809082031, -0.033616065979003906, -0.0303192138671875, -0.027022361755371094, -0.023725509643554688, -0.02042865753173828, -0.017131805419921875, -0.013834953308105469, -0.010538101196289062, -0.007241249084472656, -0.00394439697265625, -0.0006475448608398438, 0.0026493072509765625, 0.005946159362792969, 0.009243011474609375, 0.012539863586425781, 0.015836715698242188, 0.019133567810058594, 0.022430419921875, 0.025727272033691406, 0.029024124145507812, 0.03232097625732422, 0.035617828369140625, 0.03891468048095703, 0.04221153259277344, 0.045508384704589844, 0.04880523681640625, 0.052102088928222656, 0.05539894104003906, 0.05869579315185547, 0.061992645263671875, 0.06528949737548828, 0.06858634948730469, 0.0718832015991211, 0.0751800537109375, 0.0784769058227539, 0.08177375793457031, 0.08507061004638672, 0.08836746215820312, 0.09166431427001953, 0.09496116638183594, 0.09825801849365234, 0.10155487060546875, 0.10485172271728516, 0.10814857482910156, 0.11144542694091797, 0.11474227905273438, 0.11803913116455078, 0.12133598327636719, 0.1246328353881836, 0.1279296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 13.0, 17.0, 24.0, 28.0, 39.0, 37.0, 46.0, 63.0, 63.0, 64.0, 67.0, 76.0, 69.0, 60.0, 48.0, 47.0, 38.0, 38.0, 38.0, 27.0, 21.0, 19.0, 12.0, 8.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025360107421875, -0.024494409561157227, -0.023628711700439453, -0.02276301383972168, -0.021897315979003906, -0.021031618118286133, -0.02016592025756836, -0.019300222396850586, -0.018434524536132812, -0.01756882667541504, -0.016703128814697266, -0.015837430953979492, -0.014971733093261719, -0.014106035232543945, -0.013240337371826172, -0.012374639511108398, -0.011508941650390625, -0.010643243789672852, -0.009777545928955078, -0.008911848068237305, -0.008046150207519531, -0.007180452346801758, -0.006314754486083984, -0.005449056625366211, -0.0045833587646484375, -0.003717660903930664, -0.0028519630432128906, -0.001986265182495117, -0.0011205673217773438, -0.0002548694610595703, 0.0006108283996582031, 0.0014765262603759766, 0.00234222412109375, 0.0032079219818115234, 0.004073619842529297, 0.00493931770324707, 0.005805015563964844, 0.006670713424682617, 0.007536411285400391, 0.008402109146118164, 0.009267807006835938, 0.010133504867553711, 0.010999202728271484, 0.011864900588989258, 0.012730598449707031, 0.013596296310424805, 0.014461994171142578, 0.015327692031860352, 0.016193389892578125, 0.0170590877532959, 0.017924785614013672, 0.018790483474731445, 0.01965618133544922, 0.020521879196166992, 0.021387577056884766, 0.02225327491760254, 0.023118972778320312, 0.023984670639038086, 0.02485036849975586, 0.025716066360473633, 0.026581764221191406, 0.02744746208190918, 0.028313159942626953, 0.029178857803344727, 0.0300445556640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 5.0, 2.0, 8.0, 18.0, 30.0, 38.0, 80.0, 135.0, 243.0, 412.0, 952.0, 2272.0, 8916.0, 90018.0, 3745177.0, 322603.0, 17426.0, 3563.0, 1229.0, 541.0, 262.0, 167.0, 94.0, 42.0, 28.0, 18.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103271484375, -0.09990501403808594, -0.09653854370117188, -0.09317207336425781, -0.08980560302734375, -0.08643913269042969, -0.08307266235351562, -0.07970619201660156, -0.0763397216796875, -0.07297325134277344, -0.06960678100585938, -0.06624031066894531, -0.06287384033203125, -0.05950736999511719, -0.056140899658203125, -0.05277442932128906, -0.049407958984375, -0.04604148864746094, -0.042675018310546875, -0.03930854797363281, -0.03594207763671875, -0.03257560729980469, -0.029209136962890625, -0.025842666625976562, -0.0224761962890625, -0.019109725952148438, -0.015743255615234375, -0.012376785278320312, -0.00901031494140625, -0.0056438446044921875, -0.002277374267578125, 0.0010890960693359375, 0.00445556640625, 0.007822036743164062, 0.011188507080078125, 0.014554977416992188, 0.01792144775390625, 0.021287918090820312, 0.024654388427734375, 0.028020858764648438, 0.0313873291015625, 0.03475379943847656, 0.038120269775390625, 0.04148674011230469, 0.04485321044921875, 0.04821968078613281, 0.051586151123046875, 0.05495262145996094, 0.058319091796875, 0.06168556213378906, 0.06505203247070312, 0.06841850280761719, 0.07178497314453125, 0.07515144348144531, 0.07851791381835938, 0.08188438415527344, 0.0852508544921875, 0.08861732482910156, 0.09198379516601562, 0.09535026550292969, 0.09871673583984375, 0.10208320617675781, 0.10544967651367188, 0.10881614685058594, 0.1121826171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 14.0, 13.0, 26.0, 37.0, 79.0, 165.0, 347.0, 922.0, 1569.0, 476.0, 195.0, 101.0, 47.0, 25.0, 19.0, 11.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.046630859375, -0.045497894287109375, -0.04436492919921875, -0.043231964111328125, -0.0420989990234375, -0.040966033935546875, -0.03983306884765625, -0.038700103759765625, -0.037567138671875, -0.036434173583984375, -0.03530120849609375, -0.034168243408203125, -0.0330352783203125, -0.031902313232421875, -0.03076934814453125, -0.029636383056640625, -0.02850341796875, -0.027370452880859375, -0.02623748779296875, -0.025104522705078125, -0.0239715576171875, -0.022838592529296875, -0.02170562744140625, -0.020572662353515625, -0.019439697265625, -0.018306732177734375, -0.01717376708984375, -0.016040802001953125, -0.0149078369140625, -0.013774871826171875, -0.01264190673828125, -0.011508941650390625, -0.0103759765625, -0.009243011474609375, -0.00811004638671875, -0.006977081298828125, -0.0058441162109375, -0.004711151123046875, -0.00357818603515625, -0.002445220947265625, -0.001312255859375, -0.000179290771484375, 0.00095367431640625, 0.002086639404296875, 0.0032196044921875, 0.004352569580078125, 0.00548553466796875, 0.006618499755859375, 0.00775146484375, 0.008884429931640625, 0.01001739501953125, 0.011150360107421875, 0.0122833251953125, 0.013416290283203125, 0.01454925537109375, 0.015682220458984375, 0.016815185546875, 0.017948150634765625, 0.01908111572265625, 0.020214080810546875, 0.0213470458984375, 0.022480010986328125, 0.02361297607421875, 0.024745941162109375, 0.02587890625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 11.0, 34.0, 115.0, 239.0, 327.0, 187.0, 56.0, 18.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5148007869720459, -0.5034155249595642, -0.4920302927494049, -0.4806450307369232, -0.4692597985267639, -0.4578745365142822, -0.44648927450180054, -0.43510401248931885, -0.42371878027915955, -0.41233351826667786, -0.40094828605651855, -0.38956302404403687, -0.3781777620315552, -0.3667925298213959, -0.3554072678089142, -0.3440220355987549, -0.3326367735862732, -0.3212515115737915, -0.3098662793636322, -0.2984810173511505, -0.2870957851409912, -0.2757105231285095, -0.26432526111602783, -0.25293999910354614, -0.24155476689338684, -0.23016951978206635, -0.21878427267074585, -0.20739901065826416, -0.19601376354694366, -0.18462851643562317, -0.17324325442314148, -0.16185800731182098, -0.1504727303981781, -0.1390874832868576, -0.1277022361755371, -0.11631697416305542, -0.10493172705173492, -0.09354647994041443, -0.08216122537851334, -0.07077597081661224, -0.05939072370529175, -0.048005472868680954, -0.03662022203207016, -0.025234971195459366, -0.013849720358848572, -0.0024644695222377777, 0.008920781314373016, 0.02030603587627411, 0.031691282987594604, 0.0430765338242054, 0.05446178466081619, 0.06584703922271729, 0.07723228633403778, 0.08861753344535828, 0.10000278800725937, 0.11138804256916046, 0.12277328968048096, 0.13415853679180145, 0.14554378390312195, 0.15692904591560364, 0.16831429302692413, 0.17969954013824463, 0.19108480215072632, 0.20247004926204681, 0.2138552963733673]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 26.0, 29.0, 55.0, 56.0, 79.0, 78.0, 112.0, 105.0, 102.0, 92.0, 85.0, 62.0, 38.0, 33.0, 21.0, 7.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22590118646621704, -0.2201852649450302, -0.21446934342384338, -0.20875342190265656, -0.20303750038146973, -0.1973215639591217, -0.19160564243793488, -0.18588972091674805, -0.18017379939556122, -0.1744578778743744, -0.16874195635318756, -0.16302603483200073, -0.1573100984096527, -0.15159417688846588, -0.14587825536727905, -0.14016233384609222, -0.1344464123249054, -0.12873049080371857, -0.12301456928253174, -0.11729864031076431, -0.11158271878957748, -0.10586679726839066, -0.10015086829662323, -0.0944349467754364, -0.08871902525424957, -0.08300310373306274, -0.07728718221187592, -0.07157125324010849, -0.06585533171892166, -0.06013941019773483, -0.054423484951257706, -0.04870755970478058, -0.04299163818359375, -0.03727571666240692, -0.031559791415929794, -0.025843868032097816, -0.02012794464826584, -0.01441202126443386, -0.008696097880601883, -0.002980172634124756, 0.0027357488870620728, 0.00845167227089405, 0.014167595654726028, 0.019883519038558006, 0.025599442422389984, 0.03131536394357681, 0.03703128919005394, 0.04274721443653107, 0.048463135957717896, 0.054179057478904724, 0.05989498272538185, 0.06561090797185898, 0.0713268294930458, 0.07704275101423264, 0.08275867998600006, 0.08847460150718689, 0.09419052302837372, 0.09990644454956055, 0.10562236607074738, 0.1113382950425148, 0.11705421656370163, 0.12277013808488846, 0.12848606705665588, 0.1342019885778427, 0.13991791009902954]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 9.0, 12.0, 9.0, 27.0, 22.0, 35.0, 61.0, 98.0, 157.0, 268.0, 409.0, 787.0, 1609.0, 3706.0, 9362.0, 29007.0, 121211.0, 455793.0, 322955.0, 71751.0, 19100.0, 6617.0, 2687.0, 1241.0, 647.0, 367.0, 211.0, 142.0, 89.0, 46.0, 36.0, 24.0, 23.0, 13.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.10107421875, -0.09808635711669922, -0.09509849548339844, -0.09211063385009766, -0.08912277221679688, -0.0861349105834961, -0.08314704895019531, -0.08015918731689453, -0.07717132568359375, -0.07418346405029297, -0.07119560241699219, -0.0682077407836914, -0.06521987915039062, -0.062232017517089844, -0.05924415588378906, -0.05625629425048828, -0.0532684326171875, -0.05028057098388672, -0.04729270935058594, -0.044304847717285156, -0.041316986083984375, -0.038329124450683594, -0.03534126281738281, -0.03235340118408203, -0.02936553955078125, -0.02637767791748047, -0.023389816284179688, -0.020401954650878906, -0.017414093017578125, -0.014426231384277344, -0.011438369750976562, -0.008450508117675781, -0.005462646484375, -0.0024747848510742188, 0.0005130767822265625, 0.0035009384155273438, 0.006488800048828125, 0.009476661682128906, 0.012464523315429688, 0.015452384948730469, 0.01844024658203125, 0.02142810821533203, 0.024415969848632812, 0.027403831481933594, 0.030391693115234375, 0.033379554748535156, 0.03636741638183594, 0.03935527801513672, 0.0423431396484375, 0.04533100128173828, 0.04831886291503906, 0.051306724548339844, 0.054294586181640625, 0.057282447814941406, 0.06027030944824219, 0.06325817108154297, 0.06624603271484375, 0.06923389434814453, 0.07222175598144531, 0.0752096176147461, 0.07819747924804688, 0.08118534088134766, 0.08417320251464844, 0.08716106414794922, 0.09014892578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 7.0, 14.0, 15.0, 14.0, 32.0, 44.0, 40.0, 37.0, 46.0, 51.0, 60.0, 66.0, 70.0, 63.0, 71.0, 55.0, 46.0, 51.0, 44.0, 37.0, 25.0, 29.0, 17.0, 11.0, 15.0, 12.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0246124267578125, -0.023759841918945312, -0.022907257080078125, -0.022054672241210938, -0.02120208740234375, -0.020349502563476562, -0.019496917724609375, -0.018644332885742188, -0.017791748046875, -0.016939163208007812, -0.016086578369140625, -0.015233993530273438, -0.01438140869140625, -0.013528823852539062, -0.012676239013671875, -0.011823654174804688, -0.0109710693359375, -0.010118484497070312, -0.009265899658203125, -0.008413314819335938, -0.00756072998046875, -0.0067081451416015625, -0.005855560302734375, -0.0050029754638671875, -0.004150390625, -0.0032978057861328125, -0.002445220947265625, -0.0015926361083984375, -0.00074005126953125, 0.0001125335693359375, 0.000965118408203125, 0.0018177032470703125, 0.0026702880859375, 0.0035228729248046875, 0.004375457763671875, 0.0052280426025390625, 0.00608062744140625, 0.0069332122802734375, 0.007785797119140625, 0.008638381958007812, 0.009490966796875, 0.010343551635742188, 0.011196136474609375, 0.012048721313476562, 0.01290130615234375, 0.013753890991210938, 0.014606475830078125, 0.015459060668945312, 0.0163116455078125, 0.017164230346679688, 0.018016815185546875, 0.018869400024414062, 0.01972198486328125, 0.020574569702148438, 0.021427154541015625, 0.022279739379882812, 0.02313232421875, 0.023984909057617188, 0.024837493896484375, 0.025690078735351562, 0.02654266357421875, 0.027395248413085938, 0.028247833251953125, 0.029100418090820312, 0.0299530029296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 0.0, 4.0, 6.0, 6.0, 4.0, 13.0, 18.0, 21.0, 21.0, 28.0, 44.0, 81.0, 92.0, 167.0, 346.0, 564.0, 1163.0, 2319.0, 4870.0, 11299.0, 27476.0, 73766.0, 194687.0, 343120.0, 235426.0, 93158.0, 34405.0, 13736.0, 5992.0, 2794.0, 1342.0, 644.0, 345.0, 243.0, 115.0, 88.0, 50.0, 19.0, 20.0, 14.0, 14.0, 10.0, 8.0, 6.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.053070068359375, -0.05153703689575195, -0.050004005432128906, -0.04847097396850586, -0.04693794250488281, -0.045404911041259766, -0.04387187957763672, -0.04233884811401367, -0.040805816650390625, -0.03927278518676758, -0.03773975372314453, -0.036206722259521484, -0.03467369079589844, -0.03314065933227539, -0.031607627868652344, -0.030074596405029297, -0.02854156494140625, -0.027008533477783203, -0.025475502014160156, -0.02394247055053711, -0.022409439086914062, -0.020876407623291016, -0.01934337615966797, -0.017810344696044922, -0.016277313232421875, -0.014744281768798828, -0.013211250305175781, -0.011678218841552734, -0.010145187377929688, -0.00861215591430664, -0.007079124450683594, -0.005546092987060547, -0.0040130615234375, -0.002480030059814453, -0.0009469985961914062, 0.0005860328674316406, 0.0021190643310546875, 0.0036520957946777344, 0.005185127258300781, 0.006718158721923828, 0.008251190185546875, 0.009784221649169922, 0.011317253112792969, 0.012850284576416016, 0.014383316040039062, 0.01591634750366211, 0.017449378967285156, 0.018982410430908203, 0.02051544189453125, 0.022048473358154297, 0.023581504821777344, 0.02511453628540039, 0.026647567749023438, 0.028180599212646484, 0.02971363067626953, 0.031246662139892578, 0.032779693603515625, 0.03431272506713867, 0.03584575653076172, 0.037378787994384766, 0.03891181945800781, 0.04044485092163086, 0.041977882385253906, 0.04351091384887695, 0.0450439453125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 9.0, 11.0, 7.0, 8.0, 19.0, 11.0, 18.0, 23.0, 23.0, 24.0, 27.0, 31.0, 30.0, 43.0, 34.0, 45.0, 41.0, 27.0, 40.0, 46.0, 33.0, 45.0, 48.0, 33.0, 29.0, 36.0, 43.0, 27.0, 36.0, 25.0, 19.0, 12.0, 11.0, 19.0, 16.0, 7.0, 6.0, 5.0, 6.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06414794921875, -0.062064170837402344, -0.05998039245605469, -0.05789661407470703, -0.055812835693359375, -0.05372905731201172, -0.05164527893066406, -0.049561500549316406, -0.04747772216796875, -0.045393943786621094, -0.04331016540527344, -0.04122638702392578, -0.039142608642578125, -0.03705883026123047, -0.03497505187988281, -0.032891273498535156, -0.0308074951171875, -0.028723716735839844, -0.026639938354492188, -0.02455615997314453, -0.022472381591796875, -0.02038860321044922, -0.018304824829101562, -0.016221046447753906, -0.01413726806640625, -0.012053489685058594, -0.009969711303710938, -0.007885932922363281, -0.005802154541015625, -0.0037183761596679688, -0.0016345977783203125, 0.00044918060302734375, 0.002532958984375, 0.004616737365722656, 0.0067005157470703125, 0.008784294128417969, 0.010868072509765625, 0.012951850891113281, 0.015035629272460938, 0.017119407653808594, 0.01920318603515625, 0.021286964416503906, 0.023370742797851562, 0.02545452117919922, 0.027538299560546875, 0.02962207794189453, 0.03170585632324219, 0.033789634704589844, 0.0358734130859375, 0.037957191467285156, 0.04004096984863281, 0.04212474822998047, 0.044208526611328125, 0.04629230499267578, 0.04837608337402344, 0.050459861755371094, 0.05254364013671875, 0.054627418518066406, 0.05671119689941406, 0.05879497528076172, 0.060878753662109375, 0.06296253204345703, 0.06504631042480469, 0.06713008880615234, 0.0692138671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 6.0, 9.0, 11.0, 10.0, 16.0, 24.0, 27.0, 35.0, 43.0, 49.0, 74.0, 110.0, 127.0, 210.0, 375.0, 788.0, 2001.0, 7685.0, 51481.0, 527467.0, 410565.0, 37738.0, 6141.0, 1756.0, 678.0, 334.0, 202.0, 156.0, 87.0, 80.0, 47.0, 39.0, 33.0, 30.0, 20.0, 12.0, 14.0, 14.0, 3.0, 10.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.042572021484375, -0.041100502014160156, -0.03962898254394531, -0.03815746307373047, -0.036685943603515625, -0.03521442413330078, -0.03374290466308594, -0.032271385192871094, -0.03079986572265625, -0.029328346252441406, -0.027856826782226562, -0.02638530731201172, -0.024913787841796875, -0.02344226837158203, -0.021970748901367188, -0.020499229431152344, -0.0190277099609375, -0.017556190490722656, -0.016084671020507812, -0.014613151550292969, -0.013141632080078125, -0.011670112609863281, -0.010198593139648438, -0.008727073669433594, -0.00725555419921875, -0.005784034729003906, -0.0043125152587890625, -0.0028409957885742188, -0.001369476318359375, 0.00010204315185546875, 0.0015735626220703125, 0.0030450820922851562, 0.0045166015625, 0.005988121032714844, 0.0074596405029296875, 0.008931159973144531, 0.010402679443359375, 0.011874198913574219, 0.013345718383789062, 0.014817237854003906, 0.01628875732421875, 0.017760276794433594, 0.019231796264648438, 0.02070331573486328, 0.022174835205078125, 0.02364635467529297, 0.025117874145507812, 0.026589393615722656, 0.0280609130859375, 0.029532432556152344, 0.031003952026367188, 0.03247547149658203, 0.033946990966796875, 0.03541851043701172, 0.03689002990722656, 0.038361549377441406, 0.03983306884765625, 0.041304588317871094, 0.04277610778808594, 0.04424762725830078, 0.045719146728515625, 0.04719066619873047, 0.04866218566894531, 0.050133705139160156, 0.051605224609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 11.0, 22.0, 27.0, 50.0, 63.0, 84.0, 84.0, 116.0, 90.0, 95.0, 106.0, 69.0, 61.0, 41.0, 22.0, 19.0, 15.0, 9.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.238719940185547e-06, -8.874572813510895e-06, -8.510425686836243e-06, -8.14627856016159e-06, -7.782131433486938e-06, -7.417984306812286e-06, -7.053837180137634e-06, -6.689690053462982e-06, -6.32554292678833e-06, -5.961395800113678e-06, -5.597248673439026e-06, -5.233101546764374e-06, -4.868954420089722e-06, -4.50480729341507e-06, -4.1406601667404175e-06, -3.7765130400657654e-06, -3.4123659133911133e-06, -3.048218786716461e-06, -2.684071660041809e-06, -2.319924533367157e-06, -1.955777406692505e-06, -1.5916302800178528e-06, -1.2274831533432007e-06, -8.633360266685486e-07, -4.991888999938965e-07, -1.3504177331924438e-07, 2.2910535335540771e-07, 5.932524800300598e-07, 9.57399606704712e-07, 1.321546733379364e-06, 1.6856938600540161e-06, 2.0498409867286682e-06, 2.4139881134033203e-06, 2.7781352400779724e-06, 3.1422823667526245e-06, 3.5064294934272766e-06, 3.870576620101929e-06, 4.234723746776581e-06, 4.598870873451233e-06, 4.963018000125885e-06, 5.327165126800537e-06, 5.691312253475189e-06, 6.055459380149841e-06, 6.419606506824493e-06, 6.7837536334991455e-06, 7.147900760173798e-06, 7.51204788684845e-06, 7.876195013523102e-06, 8.240342140197754e-06, 8.604489266872406e-06, 8.968636393547058e-06, 9.33278352022171e-06, 9.696930646896362e-06, 1.0061077773571014e-05, 1.0425224900245667e-05, 1.0789372026920319e-05, 1.115351915359497e-05, 1.1517666280269623e-05, 1.1881813406944275e-05, 1.2245960533618927e-05, 1.2610107660293579e-05, 1.2974254786968231e-05, 1.3338401913642883e-05, 1.3702549040317535e-05, 1.4066696166992188e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 20.0, 32.0, 98.0, 216.0, 825.0, 10405.0, 911252.0, 122647.0, 2425.0, 403.0, 132.0, 43.0, 27.0, 13.0, 11.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134765625, -0.1311960220336914, -0.1276264190673828, -0.12405681610107422, -0.12048721313476562, -0.11691761016845703, -0.11334800720214844, -0.10977840423583984, -0.10620880126953125, -0.10263919830322266, -0.09906959533691406, -0.09549999237060547, -0.09193038940429688, -0.08836078643798828, -0.08479118347167969, -0.0812215805053711, -0.0776519775390625, -0.0740823745727539, -0.07051277160644531, -0.06694316864013672, -0.06337356567382812, -0.05980396270751953, -0.05623435974121094, -0.052664756774902344, -0.04909515380859375, -0.045525550842285156, -0.04195594787597656, -0.03838634490966797, -0.034816741943359375, -0.03124713897705078, -0.027677536010742188, -0.024107933044433594, -0.020538330078125, -0.016968727111816406, -0.013399124145507812, -0.009829521179199219, -0.006259918212890625, -0.0026903152465820312, 0.0008792877197265625, 0.004448890686035156, 0.00801849365234375, 0.011588096618652344, 0.015157699584960938, 0.01872730255126953, 0.022296905517578125, 0.02586650848388672, 0.029436111450195312, 0.033005714416503906, 0.0365753173828125, 0.040144920349121094, 0.04371452331542969, 0.04728412628173828, 0.050853729248046875, 0.05442333221435547, 0.05799293518066406, 0.061562538146972656, 0.06513214111328125, 0.06870174407958984, 0.07227134704589844, 0.07584095001220703, 0.07941055297851562, 0.08298015594482422, 0.08654975891113281, 0.0901193618774414, 0.09368896484375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 8.0, 17.0, 25.0, 40.0, 60.0, 120.0, 165.0, 157.0, 175.0, 107.0, 62.0, 38.0, 18.0, 10.0, 5.0, 4.0, 0.0, 4.0], "bins": [-0.1195068359375, -0.11726880073547363, -0.11503076553344727, -0.1127927303314209, -0.11055469512939453, -0.10831665992736816, -0.1060786247253418, -0.10384058952331543, -0.10160255432128906, -0.0993645191192627, -0.09712648391723633, -0.09488844871520996, -0.0926504135131836, -0.09041237831115723, -0.08817434310913086, -0.08593630790710449, -0.08369827270507812, -0.08146023750305176, -0.07922220230102539, -0.07698416709899902, -0.07474613189697266, -0.07250809669494629, -0.07027006149291992, -0.06803202629089355, -0.06579399108886719, -0.06355595588684082, -0.06131792068481445, -0.059079885482788086, -0.05684185028076172, -0.05460381507873535, -0.052365779876708984, -0.05012774467468262, -0.04788970947265625, -0.04565167427062988, -0.043413639068603516, -0.04117560386657715, -0.03893756866455078, -0.036699533462524414, -0.03446149826049805, -0.03222346305847168, -0.029985427856445312, -0.027747392654418945, -0.025509357452392578, -0.02327132225036621, -0.021033287048339844, -0.018795251846313477, -0.01655721664428711, -0.014319181442260742, -0.012081146240234375, -0.009843111038208008, -0.007605075836181641, -0.0053670406341552734, -0.0031290054321289062, -0.0008909702301025391, 0.0013470649719238281, 0.0035851001739501953, 0.0058231353759765625, 0.00806117057800293, 0.010299205780029297, 0.012537240982055664, 0.014775276184082031, 0.0170133113861084, 0.019251346588134766, 0.021489381790161133, 0.0237274169921875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 29.0, 62.0, 124.0, 222.0, 243.0, 181.0, 78.0, 36.0, 16.0, 9.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2709808349609375, -1.2423155307769775, -1.2136502265930176, -1.1849849224090576, -1.156319499015808, -1.1276541948318481, -1.0989888906478882, -1.0703235864639282, -1.0416582822799683, -1.0129929780960083, -0.9843276143074036, -0.9556623101234436, -0.9269970059394836, -0.8983316421508789, -0.869666337966919, -0.841001033782959, -0.812335729598999, -0.7836704254150391, -0.7550050616264343, -0.7263397574424744, -0.6976744532585144, -0.6690090894699097, -0.6403437852859497, -0.6116784811019897, -0.583013117313385, -0.554347813129425, -0.5256824493408203, -0.49701714515686035, -0.4683518409729004, -0.43968650698661804, -0.4110211730003357, -0.38235586881637573, -0.35369056463241577, -0.3250252306461334, -0.29635992646217346, -0.2676945924758911, -0.23902928829193115, -0.2103639543056488, -0.18169863522052765, -0.1530333161354065, -0.12436799705028534, -0.09570267796516418, -0.06703735888004303, -0.03837203234434128, -0.009706713259220123, 0.01895861327648163, 0.04762393236160278, 0.07628925144672394, 0.10495457053184509, 0.13361988961696625, 0.1622852087020874, 0.19095054268836975, 0.2196158468723297, 0.24828118085861206, 0.276946485042572, 0.30561181902885437, 0.3342771530151367, 0.36294248700141907, 0.39160779118537903, 0.4202731251716614, 0.44893842935562134, 0.4776037633419037, 0.506269097328186, 0.534934401512146, 0.563599705696106]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 3.0, 8.0, 4.0, 5.0, 10.0, 13.0, 13.0, 7.0, 12.0, 18.0, 14.0, 25.0, 25.0, 38.0, 23.0, 35.0, 50.0, 42.0, 44.0, 41.0, 56.0, 40.0, 41.0, 35.0, 45.0, 43.0, 39.0, 34.0, 44.0, 21.0, 31.0, 28.0, 18.0, 24.0, 11.0, 14.0, 9.0, 9.0, 8.0, 3.0, 3.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.3749595284461975, -0.3644661009311676, -0.3539726734161377, -0.3434792459011078, -0.3329858183860779, -0.322492390871048, -0.31199896335601807, -0.30150553584098816, -0.29101210832595825, -0.28051868081092834, -0.27002525329589844, -0.25953182578086853, -0.24903839826583862, -0.23854497075080872, -0.2280515432357788, -0.2175581157207489, -0.2070646733045578, -0.1965712457895279, -0.18607781827449799, -0.17558439075946808, -0.16509096324443817, -0.15459753572940826, -0.14410409331321716, -0.13361066579818726, -0.12311724573373795, -0.11262381821870804, -0.10213039070367813, -0.09163695573806763, -0.08114352822303772, -0.07065010070800781, -0.060156673192977905, -0.049663245677948, -0.03916981816291809, -0.028676390647888184, -0.018182961270213127, -0.007689531892538071, 0.0028038956224918365, 0.013297323137521744, 0.02379075437784195, 0.03428418189287186, 0.044777609407901764, 0.05527103692293167, 0.06576446443796158, 0.07625789940357208, 0.08675132691860199, 0.0972447544336319, 0.1077381819486618, 0.11823160946369171, 0.12872503697872162, 0.13921846449375153, 0.14971189200878143, 0.16020531952381134, 0.17069874703884125, 0.18119217455387115, 0.19168561697006226, 0.20217904448509216, 0.21267247200012207, 0.22316589951515198, 0.23365932703018188, 0.2441527545452118, 0.2546461820602417, 0.2651396095752716, 0.2756330370903015, 0.2861264646053314, 0.29661989212036133]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 9.0, 9.0, 15.0, 31.0, 44.0, 45.0, 75.0, 84.0, 96.0, 154.0, 228.0, 395.0, 623.0, 1283.0, 2964.0, 8721.0, 45001.0, 3249447.0, 837600.0, 34920.0, 7381.0, 2520.0, 1103.0, 563.0, 283.0, 185.0, 144.0, 96.0, 66.0, 59.0, 26.0, 25.0, 21.0, 13.0, 12.0, 9.0, 6.0, 6.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1014404296875, -0.097808837890625, -0.09417724609375, -0.090545654296875, -0.0869140625, -0.083282470703125, -0.07965087890625, -0.076019287109375, -0.0723876953125, -0.068756103515625, -0.06512451171875, -0.061492919921875, -0.057861328125, -0.054229736328125, -0.05059814453125, -0.046966552734375, -0.0433349609375, -0.039703369140625, -0.03607177734375, -0.032440185546875, -0.02880859375, -0.025177001953125, -0.02154541015625, -0.017913818359375, -0.0142822265625, -0.010650634765625, -0.00701904296875, -0.003387451171875, 0.000244140625, 0.003875732421875, 0.00750732421875, 0.011138916015625, 0.0147705078125, 0.018402099609375, 0.02203369140625, 0.025665283203125, 0.029296875, 0.032928466796875, 0.03656005859375, 0.040191650390625, 0.0438232421875, 0.047454833984375, 0.05108642578125, 0.054718017578125, 0.058349609375, 0.061981201171875, 0.06561279296875, 0.069244384765625, 0.0728759765625, 0.076507568359375, 0.08013916015625, 0.083770751953125, 0.08740234375, 0.091033935546875, 0.09466552734375, 0.098297119140625, 0.1019287109375, 0.105560302734375, 0.10919189453125, 0.112823486328125, 0.116455078125, 0.120086669921875, 0.12371826171875, 0.127349853515625, 0.1309814453125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 5.0, 7.0, 8.0, 9.0, 18.0, 17.0, 21.0, 28.0, 35.0, 36.0, 39.0, 70.0, 54.0, 65.0, 57.0, 62.0, 62.0, 55.0, 61.0, 50.0, 45.0, 40.0, 39.0, 24.0, 28.0, 17.0, 16.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024566650390625, -0.02370595932006836, -0.02284526824951172, -0.021984577178955078, -0.021123886108398438, -0.020263195037841797, -0.019402503967285156, -0.018541812896728516, -0.017681121826171875, -0.016820430755615234, -0.015959739685058594, -0.015099048614501953, -0.014238357543945312, -0.013377666473388672, -0.012516975402832031, -0.01165628433227539, -0.01079559326171875, -0.00993490219116211, -0.009074211120605469, -0.008213520050048828, -0.0073528289794921875, -0.006492137908935547, -0.005631446838378906, -0.004770755767822266, -0.003910064697265625, -0.0030493736267089844, -0.0021886825561523438, -0.0013279914855957031, -0.0004673004150390625, 0.0003933906555175781, 0.0012540817260742188, 0.0021147727966308594, 0.0029754638671875, 0.0038361549377441406, 0.004696846008300781, 0.005557537078857422, 0.0064182281494140625, 0.007278919219970703, 0.008139610290527344, 0.009000301361083984, 0.009860992431640625, 0.010721683502197266, 0.011582374572753906, 0.012443065643310547, 0.013303756713867188, 0.014164447784423828, 0.015025138854980469, 0.01588582992553711, 0.01674652099609375, 0.01760721206665039, 0.01846790313720703, 0.019328594207763672, 0.020189285278320312, 0.021049976348876953, 0.021910667419433594, 0.022771358489990234, 0.023632049560546875, 0.024492740631103516, 0.025353431701660156, 0.026214122772216797, 0.027074813842773438, 0.027935504913330078, 0.02879619598388672, 0.02965688705444336, 0.030517578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 8.0, 16.0, 24.0, 19.0, 49.0, 60.0, 119.0, 202.0, 315.0, 574.0, 1088.0, 2467.0, 6661.0, 26367.0, 271324.0, 3730191.0, 128415.0, 17527.0, 4949.0, 1918.0, 885.0, 432.0, 265.0, 134.0, 99.0, 61.0, 47.0, 12.0, 19.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.109619140625, -0.10660552978515625, -0.1035919189453125, -0.10057830810546875, -0.097564697265625, -0.09455108642578125, -0.0915374755859375, -0.08852386474609375, -0.08551025390625, -0.08249664306640625, -0.0794830322265625, -0.07646942138671875, -0.073455810546875, -0.07044219970703125, -0.0674285888671875, -0.06441497802734375, -0.0614013671875, -0.05838775634765625, -0.0553741455078125, -0.05236053466796875, -0.049346923828125, -0.04633331298828125, -0.0433197021484375, -0.04030609130859375, -0.03729248046875, -0.03427886962890625, -0.0312652587890625, -0.02825164794921875, -0.025238037109375, -0.02222442626953125, -0.0192108154296875, -0.01619720458984375, -0.01318359375, -0.01016998291015625, -0.0071563720703125, -0.00414276123046875, -0.001129150390625, 0.00188446044921875, 0.0048980712890625, 0.00791168212890625, 0.01092529296875, 0.01393890380859375, 0.0169525146484375, 0.01996612548828125, 0.022979736328125, 0.02599334716796875, 0.0290069580078125, 0.03202056884765625, 0.0350341796875, 0.03804779052734375, 0.0410614013671875, 0.04407501220703125, 0.047088623046875, 0.05010223388671875, 0.0531158447265625, 0.05612945556640625, 0.05914306640625, 0.06215667724609375, 0.0651702880859375, 0.06818389892578125, 0.071197509765625, 0.07421112060546875, 0.0772247314453125, 0.08023834228515625, 0.083251953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 8.0, 22.0, 37.0, 98.0, 220.0, 911.0, 2147.0, 354.0, 126.0, 57.0, 24.0, 22.0, 7.0, 4.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061187744140625, -0.059586524963378906, -0.05798530578613281, -0.05638408660888672, -0.054782867431640625, -0.05318164825439453, -0.05158042907714844, -0.049979209899902344, -0.04837799072265625, -0.046776771545410156, -0.04517555236816406, -0.04357433319091797, -0.041973114013671875, -0.04037189483642578, -0.03877067565917969, -0.037169456481933594, -0.0355682373046875, -0.033967018127441406, -0.03236579895019531, -0.03076457977294922, -0.029163360595703125, -0.02756214141845703, -0.025960922241210938, -0.024359703063964844, -0.02275848388671875, -0.021157264709472656, -0.019556045532226562, -0.01795482635498047, -0.016353607177734375, -0.014752388000488281, -0.013151168823242188, -0.011549949645996094, -0.00994873046875, -0.008347511291503906, -0.0067462921142578125, -0.005145072937011719, -0.003543853759765625, -0.0019426345825195312, -0.0003414154052734375, 0.0012598037719726562, 0.00286102294921875, 0.004462242126464844, 0.0060634613037109375, 0.007664680480957031, 0.009265899658203125, 0.010867118835449219, 0.012468338012695312, 0.014069557189941406, 0.0156707763671875, 0.017271995544433594, 0.018873214721679688, 0.02047443389892578, 0.022075653076171875, 0.02367687225341797, 0.025278091430664062, 0.026879310607910156, 0.02848052978515625, 0.030081748962402344, 0.03168296813964844, 0.03328418731689453, 0.034885406494140625, 0.03648662567138672, 0.03808784484863281, 0.039689064025878906, 0.041290283203125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 13.0, 67.0, 255.0, 456.0, 174.0, 24.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8411245346069336, -0.8244690299034119, -0.8078134655952454, -0.7911579608917236, -0.7745023965835571, -0.7578468918800354, -0.7411913871765137, -0.7245358228683472, -0.7078803181648254, -0.6912248134613037, -0.6745692491531372, -0.6579137444496155, -0.6412582397460938, -0.6246026754379272, -0.6079471707344055, -0.591291606426239, -0.5746361017227173, -0.5579805970191956, -0.541325032711029, -0.5246695280075073, -0.5080139636993408, -0.4913584589958191, -0.47470295429229736, -0.45804741978645325, -0.44139188528060913, -0.424736350774765, -0.4080808162689209, -0.39142531156539917, -0.37476977705955505, -0.35811424255371094, -0.3414587378501892, -0.3248032033443451, -0.30814769864082336, -0.29149216413497925, -0.2748366594314575, -0.2581811249256134, -0.2415255904197693, -0.22487005591392517, -0.20821453630924225, -0.19155901670455933, -0.1749034821987152, -0.1582479476928711, -0.14159242808818817, -0.12493690103292465, -0.10828137397766113, -0.09162584692239761, -0.0749703198671341, -0.058314792811870575, -0.041659265756607056, -0.025003738701343536, -0.008348211646080017, 0.008307315409183502, 0.02496284246444702, 0.04161836951971054, 0.05827389657497406, 0.07492942363023758, 0.0915849506855011, 0.10824047774076462, 0.12489600479602814, 0.14155152440071106, 0.15820705890655518, 0.1748625934123993, 0.19151811301708221, 0.20817363262176514, 0.22482916712760925]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 5.0, 9.0, 14.0, 10.0, 9.0, 13.0, 22.0, 29.0, 39.0, 54.0, 42.0, 75.0, 83.0, 59.0, 60.0, 63.0, 74.0, 50.0, 60.0, 45.0, 39.0, 33.0, 30.0, 22.0, 13.0, 14.0, 6.0, 8.0, 9.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12491750717163086, -0.12103912234306335, -0.11716074496507645, -0.11328236758708954, -0.10940398275852203, -0.10552559792995453, -0.10164722055196762, -0.09776884317398071, -0.09389045834541321, -0.0900120735168457, -0.0861336961388588, -0.08225531876087189, -0.07837693393230438, -0.07449854910373688, -0.07062017172574997, -0.06674179434776306, -0.06286340951919556, -0.05898502841591835, -0.055106647312641144, -0.05122826620936394, -0.04734988510608673, -0.043471504002809525, -0.03959312289953232, -0.03571474179625511, -0.031836360692977905, -0.0279579795897007, -0.024079598486423492, -0.020201217383146286, -0.01632283627986908, -0.012444455176591873, -0.008566074073314667, -0.00468769297003746, -0.0008093118667602539, 0.0030690692365169525, 0.006947450339794159, 0.010825831443071365, 0.014704212546348572, 0.018582593649625778, 0.022460974752902985, 0.02633935585618019, 0.030217736959457397, 0.034096118062734604, 0.03797449916601181, 0.04185288026928902, 0.04573126137256622, 0.04960964247584343, 0.053488023579120636, 0.05736640468239784, 0.06124478578567505, 0.06512317061424255, 0.06900154799222946, 0.07287992537021637, 0.07675831019878387, 0.08063669502735138, 0.08451507240533829, 0.0883934497833252, 0.0922718346118927, 0.0961502194404602, 0.10002859681844711, 0.10390697419643402, 0.10778535902500153, 0.11166374385356903, 0.11554212123155594, 0.11942049860954285, 0.12329888343811035]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 16.0, 19.0, 32.0, 58.0, 115.0, 169.0, 348.0, 671.0, 1395.0, 3253.0, 8892.0, 26951.0, 98922.0, 332079.0, 390108.0, 131750.0, 35363.0, 11089.0, 4057.0, 1684.0, 711.0, 362.0, 176.0, 111.0, 81.0, 40.0, 36.0, 29.0, 10.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.08941650390625, -0.08679485321044922, -0.08417320251464844, -0.08155155181884766, -0.07892990112304688, -0.0763082504272461, -0.07368659973144531, -0.07106494903564453, -0.06844329833984375, -0.06582164764404297, -0.06319999694824219, -0.060578346252441406, -0.057956695556640625, -0.055335044860839844, -0.05271339416503906, -0.05009174346923828, -0.0474700927734375, -0.04484844207763672, -0.04222679138183594, -0.039605140686035156, -0.036983489990234375, -0.034361839294433594, -0.03174018859863281, -0.02911853790283203, -0.02649688720703125, -0.02387523651123047, -0.021253585815429688, -0.018631935119628906, -0.016010284423828125, -0.013388633728027344, -0.010766983032226562, -0.008145332336425781, -0.005523681640625, -0.0029020309448242188, -0.0002803802490234375, 0.0023412704467773438, 0.004962921142578125, 0.007584571838378906, 0.010206222534179688, 0.012827873229980469, 0.01544952392578125, 0.01807117462158203, 0.020692825317382812, 0.023314476013183594, 0.025936126708984375, 0.028557777404785156, 0.031179428100585938, 0.03380107879638672, 0.0364227294921875, 0.03904438018798828, 0.04166603088378906, 0.044287681579589844, 0.046909332275390625, 0.049530982971191406, 0.05215263366699219, 0.05477428436279297, 0.05739593505859375, 0.06001758575439453, 0.06263923645019531, 0.0652608871459961, 0.06788253784179688, 0.07050418853759766, 0.07312583923339844, 0.07574748992919922, 0.078369140625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 11.0, 10.0, 15.0, 28.0, 23.0, 31.0, 41.0, 40.0, 52.0, 67.0, 62.0, 68.0, 62.0, 51.0, 53.0, 62.0, 51.0, 52.0, 39.0, 30.0, 26.0, 22.0, 28.0, 19.0, 12.0, 6.0, 6.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.026947021484375, -0.02604389190673828, -0.025140762329101562, -0.024237632751464844, -0.023334503173828125, -0.022431373596191406, -0.021528244018554688, -0.02062511444091797, -0.01972198486328125, -0.01881885528564453, -0.017915725708007812, -0.017012596130371094, -0.016109466552734375, -0.015206336975097656, -0.014303207397460938, -0.013400077819824219, -0.0124969482421875, -0.011593818664550781, -0.010690689086914062, -0.009787559509277344, -0.008884429931640625, -0.007981300354003906, -0.0070781707763671875, -0.006175041198730469, -0.00527191162109375, -0.004368782043457031, -0.0034656524658203125, -0.0025625228881835938, -0.001659393310546875, -0.0007562637329101562, 0.0001468658447265625, 0.0010499954223632812, 0.001953125, 0.0028562545776367188, 0.0037593841552734375, 0.004662513732910156, 0.005565643310546875, 0.006468772888183594, 0.0073719024658203125, 0.008275032043457031, 0.00917816162109375, 0.010081291198730469, 0.010984420776367188, 0.011887550354003906, 0.012790679931640625, 0.013693809509277344, 0.014596939086914062, 0.015500068664550781, 0.0164031982421875, 0.01730632781982422, 0.018209457397460938, 0.019112586975097656, 0.020015716552734375, 0.020918846130371094, 0.021821975708007812, 0.02272510528564453, 0.02362823486328125, 0.02453136444091797, 0.025434494018554688, 0.026337623596191406, 0.027240753173828125, 0.028143882751464844, 0.029047012329101562, 0.02995014190673828, 0.030853271484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 17.0, 16.0, 37.0, 51.0, 61.0, 89.0, 129.0, 246.0, 385.0, 857.0, 1864.0, 5232.0, 16321.0, 56663.0, 199228.0, 426584.0, 240714.0, 69561.0, 19860.0, 6334.0, 2207.0, 879.0, 435.0, 267.0, 169.0, 112.0, 67.0, 43.0, 31.0, 22.0, 16.0, 9.0, 6.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049407958984375, -0.04739809036254883, -0.045388221740722656, -0.043378353118896484, -0.04136848449707031, -0.03935861587524414, -0.03734874725341797, -0.0353388786315918, -0.033329010009765625, -0.03131914138793945, -0.02930927276611328, -0.02729940414428711, -0.025289535522460938, -0.023279666900634766, -0.021269798278808594, -0.019259929656982422, -0.01725006103515625, -0.015240192413330078, -0.013230323791503906, -0.011220455169677734, -0.009210586547851562, -0.007200717926025391, -0.005190849304199219, -0.003180980682373047, -0.001171112060546875, 0.0008387565612792969, 0.0028486251831054688, 0.004858493804931641, 0.0068683624267578125, 0.008878231048583984, 0.010888099670410156, 0.012897968292236328, 0.0149078369140625, 0.016917705535888672, 0.018927574157714844, 0.020937442779541016, 0.022947311401367188, 0.02495718002319336, 0.02696704864501953, 0.028976917266845703, 0.030986785888671875, 0.03299665451049805, 0.03500652313232422, 0.03701639175415039, 0.03902626037597656, 0.041036128997802734, 0.043045997619628906, 0.04505586624145508, 0.04706573486328125, 0.04907560348510742, 0.051085472106933594, 0.053095340728759766, 0.05510520935058594, 0.05711507797241211, 0.05912494659423828, 0.06113481521606445, 0.06314468383789062, 0.0651545524597168, 0.06716442108154297, 0.06917428970336914, 0.07118415832519531, 0.07319402694702148, 0.07520389556884766, 0.07721376419067383, 0.0792236328125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 9.0, 3.0, 5.0, 6.0, 5.0, 10.0, 12.0, 8.0, 18.0, 19.0, 23.0, 27.0, 14.0, 30.0, 35.0, 31.0, 36.0, 33.0, 38.0, 50.0, 37.0, 54.0, 51.0, 44.0, 33.0, 48.0, 38.0, 23.0, 36.0, 33.0, 28.0, 33.0, 28.0, 16.0, 12.0, 18.0, 9.0, 12.0, 9.0, 6.0, 9.0, 2.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07745361328125, -0.07486629486083984, -0.07227897644042969, -0.06969165802001953, -0.06710433959960938, -0.06451702117919922, -0.06192970275878906, -0.059342384338378906, -0.05675506591796875, -0.054167747497558594, -0.05158042907714844, -0.04899311065673828, -0.046405792236328125, -0.04381847381591797, -0.04123115539550781, -0.038643836975097656, -0.0360565185546875, -0.033469200134277344, -0.030881881713867188, -0.02829456329345703, -0.025707244873046875, -0.02311992645263672, -0.020532608032226562, -0.017945289611816406, -0.01535797119140625, -0.012770652770996094, -0.010183334350585938, -0.007596015930175781, -0.005008697509765625, -0.0024213790893554688, 0.0001659393310546875, 0.0027532577514648438, 0.005340576171875, 0.007927894592285156, 0.010515213012695312, 0.013102531433105469, 0.015689849853515625, 0.01827716827392578, 0.020864486694335938, 0.023451805114746094, 0.02603912353515625, 0.028626441955566406, 0.031213760375976562, 0.03380107879638672, 0.036388397216796875, 0.03897571563720703, 0.04156303405761719, 0.044150352478027344, 0.0467376708984375, 0.049324989318847656, 0.05191230773925781, 0.05449962615966797, 0.057086944580078125, 0.05967426300048828, 0.06226158142089844, 0.0648488998413086, 0.06743621826171875, 0.0700235366821289, 0.07261085510253906, 0.07519817352294922, 0.07778549194335938, 0.08037281036376953, 0.08296012878417969, 0.08554744720458984, 0.088134765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 14.0, 25.0, 24.0, 60.0, 102.0, 204.0, 395.0, 1043.0, 2934.0, 11864.0, 103468.0, 726269.0, 178954.0, 17163.0, 3697.0, 1280.0, 540.0, 246.0, 113.0, 63.0, 39.0, 21.0, 11.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044708251953125, -0.04329347610473633, -0.041878700256347656, -0.040463924407958984, -0.03904914855957031, -0.03763437271118164, -0.03621959686279297, -0.0348048210144043, -0.033390045166015625, -0.03197526931762695, -0.03056049346923828, -0.02914571762084961, -0.027730941772460938, -0.026316165924072266, -0.024901390075683594, -0.023486614227294922, -0.02207183837890625, -0.020657062530517578, -0.019242286682128906, -0.017827510833740234, -0.016412734985351562, -0.01499795913696289, -0.013583183288574219, -0.012168407440185547, -0.010753631591796875, -0.009338855743408203, -0.007924079895019531, -0.006509304046630859, -0.0050945281982421875, -0.0036797523498535156, -0.0022649765014648438, -0.0008502006530761719, 0.0005645751953125, 0.001979351043701172, 0.0033941268920898438, 0.004808902740478516, 0.0062236785888671875, 0.007638454437255859, 0.009053230285644531, 0.010468006134033203, 0.011882781982421875, 0.013297557830810547, 0.014712333679199219, 0.01612710952758789, 0.017541885375976562, 0.018956661224365234, 0.020371437072753906, 0.021786212921142578, 0.02320098876953125, 0.024615764617919922, 0.026030540466308594, 0.027445316314697266, 0.028860092163085938, 0.03027486801147461, 0.03168964385986328, 0.03310441970825195, 0.034519195556640625, 0.0359339714050293, 0.03734874725341797, 0.03876352310180664, 0.04017829895019531, 0.041593074798583984, 0.043007850646972656, 0.04442262649536133, 0.04583740234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 7.0, 8.0, 23.0, 28.0, 49.0, 60.0, 77.0, 100.0, 129.0, 119.0, 114.0, 104.0, 61.0, 48.0, 33.0, 16.0, 14.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.239776611328125e-05, -1.2021511793136597e-05, -1.1645257472991943e-05, -1.126900315284729e-05, -1.0892748832702637e-05, -1.0516494512557983e-05, -1.014024019241333e-05, -9.763985872268677e-06, -9.387731552124023e-06, -9.01147723197937e-06, -8.635222911834717e-06, -8.258968591690063e-06, -7.88271427154541e-06, -7.506459951400757e-06, -7.1302056312561035e-06, -6.75395131111145e-06, -6.377696990966797e-06, -6.0014426708221436e-06, -5.62518835067749e-06, -5.248934030532837e-06, -4.872679710388184e-06, -4.49642539024353e-06, -4.120171070098877e-06, -3.7439167499542236e-06, -3.3676624298095703e-06, -2.991408109664917e-06, -2.6151537895202637e-06, -2.2388994693756104e-06, -1.862645149230957e-06, -1.4863908290863037e-06, -1.1101365089416504e-06, -7.338821887969971e-07, -3.5762786865234375e-07, 1.862645149230957e-08, 3.948807716369629e-07, 7.711350917816162e-07, 1.1473894119262695e-06, 1.5236437320709229e-06, 1.8998980522155762e-06, 2.2761523723602295e-06, 2.652406692504883e-06, 3.028661012649536e-06, 3.4049153327941895e-06, 3.7811696529388428e-06, 4.157423973083496e-06, 4.533678293228149e-06, 4.909932613372803e-06, 5.286186933517456e-06, 5.662441253662109e-06, 6.038695573806763e-06, 6.414949893951416e-06, 6.791204214096069e-06, 7.167458534240723e-06, 7.543712854385376e-06, 7.91996717453003e-06, 8.296221494674683e-06, 8.672475814819336e-06, 9.04873013496399e-06, 9.424984455108643e-06, 9.801238775253296e-06, 1.017749309539795e-05, 1.0553747415542603e-05, 1.0930001735687256e-05, 1.130625605583191e-05, 1.1682510375976562e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 17.0, 20.0, 16.0, 30.0, 43.0, 63.0, 84.0, 153.0, 245.0, 522.0, 1114.0, 2790.0, 8376.0, 34152.0, 177786.0, 493462.0, 259561.0, 52219.0, 11601.0, 3520.0, 1353.0, 592.0, 319.0, 183.0, 102.0, 56.0, 54.0, 34.0, 21.0, 15.0, 14.0, 5.0, 4.0, 9.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.022705078125, -0.021819114685058594, -0.020933151245117188, -0.02004718780517578, -0.019161224365234375, -0.01827526092529297, -0.017389297485351562, -0.016503334045410156, -0.01561737060546875, -0.014731407165527344, -0.013845443725585938, -0.012959480285644531, -0.012073516845703125, -0.011187553405761719, -0.010301589965820312, -0.009415626525878906, -0.0085296630859375, -0.007643699645996094, -0.0067577362060546875, -0.005871772766113281, -0.004985809326171875, -0.004099845886230469, -0.0032138824462890625, -0.0023279190063476562, -0.00144195556640625, -0.0005559921264648438, 0.0003299713134765625, 0.0012159347534179688, 0.002101898193359375, 0.0029878616333007812, 0.0038738250732421875, 0.004759788513183594, 0.005645751953125, 0.006531715393066406, 0.0074176788330078125, 0.008303642272949219, 0.009189605712890625, 0.010075569152832031, 0.010961532592773438, 0.011847496032714844, 0.01273345947265625, 0.013619422912597656, 0.014505386352539062, 0.015391349792480469, 0.016277313232421875, 0.01716327667236328, 0.018049240112304688, 0.018935203552246094, 0.0198211669921875, 0.020707130432128906, 0.021593093872070312, 0.02247905731201172, 0.023365020751953125, 0.02425098419189453, 0.025136947631835938, 0.026022911071777344, 0.02690887451171875, 0.027794837951660156, 0.028680801391601562, 0.02956676483154297, 0.030452728271484375, 0.03133869171142578, 0.03222465515136719, 0.033110618591308594, 0.03399658203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 14.0, 18.0, 33.0, 45.0, 60.0, 74.0, 94.0, 110.0, 119.0, 114.0, 99.0, 81.0, 52.0, 35.0, 21.0, 14.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0386962890625, -0.03716325759887695, -0.035630226135253906, -0.03409719467163086, -0.03256416320800781, -0.031031131744384766, -0.02949810028076172, -0.027965068817138672, -0.026432037353515625, -0.024899005889892578, -0.02336597442626953, -0.021832942962646484, -0.020299911499023438, -0.01876688003540039, -0.017233848571777344, -0.015700817108154297, -0.01416778564453125, -0.012634754180908203, -0.011101722717285156, -0.00956869125366211, -0.008035659790039062, -0.006502628326416016, -0.004969596862792969, -0.003436565399169922, -0.001903533935546875, -0.0003705024719238281, 0.0011625289916992188, 0.0026955604553222656, 0.0042285919189453125, 0.005761623382568359, 0.007294654846191406, 0.008827686309814453, 0.0103607177734375, 0.011893749237060547, 0.013426780700683594, 0.01495981216430664, 0.016492843627929688, 0.018025875091552734, 0.01955890655517578, 0.021091938018798828, 0.022624969482421875, 0.024158000946044922, 0.02569103240966797, 0.027224063873291016, 0.028757095336914062, 0.03029012680053711, 0.031823158264160156, 0.0333561897277832, 0.03488922119140625, 0.0364222526550293, 0.037955284118652344, 0.03948831558227539, 0.04102134704589844, 0.042554378509521484, 0.04408740997314453, 0.04562044143676758, 0.047153472900390625, 0.04868650436401367, 0.05021953582763672, 0.051752567291259766, 0.05328559875488281, 0.05481863021850586, 0.056351661682128906, 0.05788469314575195, 0.059417724609375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 12.0, 25.0, 37.0, 91.0, 203.0, 248.0, 200.0, 115.0, 49.0, 14.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4271184206008911, -1.397168755531311, -1.367219090461731, -1.3372694253921509, -1.3073197603225708, -1.2773700952529907, -1.2474204301834106, -1.2174708843231201, -1.18752121925354, -1.15757155418396, -1.1276218891143799, -1.0976722240447998, -1.0677225589752197, -1.0377728939056396, -1.0078232288360596, -0.9778736233711243, -0.9479238986968994, -0.9179742336273193, -0.8880245685577393, -0.8580749034881592, -0.8281252384185791, -0.798175573348999, -0.7682259678840637, -0.7382763028144836, -0.7083266377449036, -0.6783769726753235, -0.6484273076057434, -0.6184776425361633, -0.588528037071228, -0.558578372001648, -0.5286287069320679, -0.4986790418624878, -0.4687294065952301, -0.43877974152565, -0.40883010625839233, -0.37888044118881226, -0.3489307761192322, -0.3189811110496521, -0.289031445980072, -0.25908181071281433, -0.22913214564323425, -0.19918248057365417, -0.1692328304052353, -0.1392831802368164, -0.10933351516723633, -0.07938385009765625, -0.049434199929237366, -0.01948454976081848, 0.010465115308761597, 0.04041477292776108, 0.07036443054676056, 0.10031408816576004, 0.13026374578475952, 0.1602134108543396, 0.19016306102275848, 0.22011271119117737, 0.25006237626075745, 0.2800120413303375, 0.3099616765975952, 0.3399113416671753, 0.36986100673675537, 0.39981067180633545, 0.4297603368759155, 0.4597099721431732, 0.4896596372127533]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 6.0, 14.0, 14.0, 18.0, 28.0, 23.0, 27.0, 36.0, 24.0, 32.0, 26.0, 37.0, 38.0, 52.0, 46.0, 50.0, 42.0, 36.0, 41.0, 48.0, 33.0, 44.0, 30.0, 26.0, 38.0, 24.0, 25.0, 18.0, 12.0, 22.0, 15.0, 14.0, 9.0, 12.0, 4.0, 4.0, 2.0, 4.0, 6.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44073212146759033, -0.4274516701698303, -0.4141712486743927, -0.4008907973766327, -0.38761037588119507, -0.37432992458343506, -0.36104947328567505, -0.34776902198791504, -0.3344886004924774, -0.3212081491947174, -0.3079277276992798, -0.2946472764015198, -0.28136682510375977, -0.26808640360832214, -0.25480595231056213, -0.24152551591396332, -0.2282450795173645, -0.21496464312076569, -0.20168420672416687, -0.18840375542640686, -0.17512331902980804, -0.16184288263320923, -0.14856243133544922, -0.1352819949388504, -0.12200155854225159, -0.10872112214565277, -0.09544067829847336, -0.08216023445129395, -0.06887979805469513, -0.055599361658096313, -0.0423189178109169, -0.029038473963737488, -0.015758037567138672, -0.0024775974452495575, 0.010802842676639557, 0.02408328279852867, 0.037363722920417786, 0.0506441593170166, 0.06392460316419601, 0.07720504701137543, 0.09048548340797424, 0.10376591980457306, 0.11704636365175247, 0.13032680749893188, 0.1436072438955307, 0.15688768029212952, 0.17016813158988953, 0.18344856798648834, 0.19672900438308716, 0.21000944077968597, 0.2232898771762848, 0.2365703284740448, 0.24985076487064362, 0.26313120126724243, 0.27641165256500244, 0.28969210386276245, 0.3029725253582001, 0.3162529766559601, 0.3295333981513977, 0.3428138494491577, 0.3560943007469177, 0.36937472224235535, 0.38265517354011536, 0.395935595035553, 0.409216046333313]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 11.0, 27.0, 30.0, 33.0, 60.0, 83.0, 125.0, 207.0, 293.0, 542.0, 934.0, 1926.0, 4408.0, 14432.0, 91960.0, 3835812.0, 210604.0, 22192.0, 5929.0, 2267.0, 995.0, 532.0, 310.0, 188.0, 113.0, 87.0, 45.0, 40.0, 26.0, 16.0, 17.0, 10.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.10595703125, -0.10280704498291016, -0.09965705871582031, -0.09650707244873047, -0.09335708618164062, -0.09020709991455078, -0.08705711364746094, -0.0839071273803711, -0.08075714111328125, -0.0776071548461914, -0.07445716857910156, -0.07130718231201172, -0.06815719604492188, -0.06500720977783203, -0.06185722351074219, -0.058707237243652344, -0.0555572509765625, -0.052407264709472656, -0.04925727844238281, -0.04610729217529297, -0.042957305908203125, -0.03980731964111328, -0.03665733337402344, -0.033507347106933594, -0.03035736083984375, -0.027207374572753906, -0.024057388305664062, -0.02090740203857422, -0.017757415771484375, -0.014607429504394531, -0.011457443237304688, -0.008307456970214844, -0.005157470703125, -0.0020074844360351562, 0.0011425018310546875, 0.004292488098144531, 0.007442474365234375, 0.010592460632324219, 0.013742446899414062, 0.016892433166503906, 0.02004241943359375, 0.023192405700683594, 0.026342391967773438, 0.02949237823486328, 0.032642364501953125, 0.03579235076904297, 0.03894233703613281, 0.042092323303222656, 0.0452423095703125, 0.048392295837402344, 0.05154228210449219, 0.05469226837158203, 0.057842254638671875, 0.06099224090576172, 0.06414222717285156, 0.0672922134399414, 0.07044219970703125, 0.0735921859741211, 0.07674217224121094, 0.07989215850830078, 0.08304214477539062, 0.08619213104248047, 0.08934211730957031, 0.09249210357666016, 0.09564208984375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 4.0, 7.0, 8.0, 8.0, 10.0, 7.0, 11.0, 21.0, 21.0, 23.0, 30.0, 23.0, 38.0, 48.0, 45.0, 55.0, 70.0, 60.0, 51.0, 68.0, 47.0, 57.0, 38.0, 57.0, 41.0, 35.0, 26.0, 21.0, 18.0, 8.0, 11.0, 13.0, 6.0, 6.0, 7.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0276336669921875, -0.02672123908996582, -0.02580881118774414, -0.02489638328552246, -0.02398395538330078, -0.0230715274810791, -0.022159099578857422, -0.021246671676635742, -0.020334243774414062, -0.019421815872192383, -0.018509387969970703, -0.017596960067749023, -0.016684532165527344, -0.015772104263305664, -0.014859676361083984, -0.013947248458862305, -0.013034820556640625, -0.012122392654418945, -0.011209964752197266, -0.010297536849975586, -0.009385108947753906, -0.008472681045532227, -0.007560253143310547, -0.006647825241088867, -0.0057353973388671875, -0.004822969436645508, -0.003910541534423828, -0.0029981136322021484, -0.0020856857299804688, -0.001173257827758789, -0.0002608299255371094, 0.0006515979766845703, 0.00156402587890625, 0.0024764537811279297, 0.0033888816833496094, 0.004301309585571289, 0.005213737487792969, 0.0061261653900146484, 0.007038593292236328, 0.007951021194458008, 0.008863449096679688, 0.009775876998901367, 0.010688304901123047, 0.011600732803344727, 0.012513160705566406, 0.013425588607788086, 0.014338016510009766, 0.015250444412231445, 0.016162872314453125, 0.017075300216674805, 0.017987728118896484, 0.018900156021118164, 0.019812583923339844, 0.020725011825561523, 0.021637439727783203, 0.022549867630004883, 0.023462295532226562, 0.024374723434448242, 0.025287151336669922, 0.0261995792388916, 0.02711200714111328, 0.02802443504333496, 0.02893686294555664, 0.02984929084777832, 0.03076171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 2.0, 6.0, 9.0, 17.0, 22.0, 32.0, 38.0, 63.0, 107.0, 203.0, 334.0, 727.0, 1516.0, 3952.0, 18748.0, 444321.0, 3675526.0, 38486.0, 6164.0, 2042.0, 964.0, 429.0, 219.0, 117.0, 80.0, 50.0, 43.0, 16.0, 23.0, 11.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.1443347930908203, -0.14011001586914062, -0.13588523864746094, -0.13166046142578125, -0.12743568420410156, -0.12321090698242188, -0.11898612976074219, -0.1147613525390625, -0.11053657531738281, -0.10631179809570312, -0.10208702087402344, -0.09786224365234375, -0.09363746643066406, -0.08941268920898438, -0.08518791198730469, -0.080963134765625, -0.07673835754394531, -0.07251358032226562, -0.06828880310058594, -0.06406402587890625, -0.05983924865722656, -0.055614471435546875, -0.05138969421386719, -0.0471649169921875, -0.04294013977050781, -0.038715362548828125, -0.03449058532714844, -0.03026580810546875, -0.026041030883789062, -0.021816253662109375, -0.017591476440429688, -0.01336669921875, -0.009141921997070312, -0.004917144775390625, -0.0006923675537109375, 0.00353240966796875, 0.0077571868896484375, 0.011981964111328125, 0.016206741333007812, 0.0204315185546875, 0.024656295776367188, 0.028881072998046875, 0.03310585021972656, 0.03733062744140625, 0.04155540466308594, 0.045780181884765625, 0.05000495910644531, 0.054229736328125, 0.05845451354980469, 0.06267929077148438, 0.06690406799316406, 0.07112884521484375, 0.07535362243652344, 0.07957839965820312, 0.08380317687988281, 0.0880279541015625, 0.09225273132324219, 0.09647750854492188, 0.10070228576660156, 0.10492706298828125, 0.10915184020996094, 0.11337661743164062, 0.11760139465332031, 0.121826171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 12.0, 26.0, 32.0, 77.0, 384.0, 2763.0, 544.0, 125.0, 42.0, 21.0, 18.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10894775390625, -0.10644865036010742, -0.10394954681396484, -0.10145044326782227, -0.09895133972167969, -0.09645223617553711, -0.09395313262939453, -0.09145402908325195, -0.08895492553710938, -0.0864558219909668, -0.08395671844482422, -0.08145761489868164, -0.07895851135253906, -0.07645940780639648, -0.0739603042602539, -0.07146120071411133, -0.06896209716796875, -0.06646299362182617, -0.0639638900756836, -0.061464786529541016, -0.05896568298339844, -0.05646657943725586, -0.05396747589111328, -0.0514683723449707, -0.048969268798828125, -0.04647016525268555, -0.04397106170654297, -0.04147195816040039, -0.03897285461425781, -0.036473751068115234, -0.033974647521972656, -0.03147554397583008, -0.0289764404296875, -0.026477336883544922, -0.023978233337402344, -0.021479129791259766, -0.018980026245117188, -0.01648092269897461, -0.013981819152832031, -0.011482715606689453, -0.008983612060546875, -0.006484508514404297, -0.003985404968261719, -0.0014863014221191406, 0.0010128021240234375, 0.0035119056701660156, 0.006011009216308594, 0.008510112762451172, 0.01100921630859375, 0.013508319854736328, 0.016007423400878906, 0.018506526947021484, 0.021005630493164062, 0.02350473403930664, 0.02600383758544922, 0.028502941131591797, 0.031002044677734375, 0.03350114822387695, 0.03600025177001953, 0.03849935531616211, 0.04099845886230469, 0.043497562408447266, 0.045996665954589844, 0.04849576950073242, 0.050994873046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 3.0, 13.0, 25.0, 40.0, 76.0, 142.0, 199.0, 170.0, 136.0, 82.0, 42.0, 25.0, 18.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24553218483924866, -0.23781095445156097, -0.23008973896503448, -0.2223685085773468, -0.21464727818965912, -0.20692604780197144, -0.19920483231544495, -0.19148360192775726, -0.18376237154006958, -0.1760411411523819, -0.1683199256658554, -0.16059869527816772, -0.15287746489048004, -0.14515623450279236, -0.13743501901626587, -0.12971378862857819, -0.1219925731420517, -0.11427135020494461, -0.10655011981725693, -0.09882889688014984, -0.09110766649246216, -0.08338644355535507, -0.07566522061824799, -0.0679439902305603, -0.06022276729345322, -0.05250154063105583, -0.04478031396865845, -0.03705909103155136, -0.029337864369153976, -0.021616637706756592, -0.013895414769649506, -0.006174188107252121, 0.0015470385551452637, 0.009268264286220074, 0.016989490017294884, 0.02471071481704712, 0.032431941479444504, 0.04015316814184189, 0.047874391078948975, 0.05559561774134636, 0.06331684440374374, 0.07103806734085083, 0.07875929772853851, 0.0864805206656456, 0.09420174360275269, 0.10192297399044037, 0.10964419692754745, 0.11736541986465454, 0.12508665025234222, 0.1328078806400299, 0.1405290961265564, 0.14825032651424408, 0.15597155690193176, 0.16369277238845825, 0.17141400277614594, 0.17913523316383362, 0.1868564486503601, 0.1945776790380478, 0.20229889452457428, 0.21002012491226196, 0.21774135529994965, 0.22546258568763733, 0.23318380117416382, 0.2409050315618515, 0.24862626194953918]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 5.0, 11.0, 29.0, 48.0, 51.0, 74.0, 101.0, 112.0, 94.0, 87.0, 101.0, 65.0, 62.0, 47.0, 35.0, 24.0, 16.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2644222378730774, -0.25635817646980286, -0.24829411506652832, -0.24023005366325378, -0.23216600716114044, -0.2241019457578659, -0.21603788435459137, -0.20797382295131683, -0.1999097764492035, -0.19184571504592896, -0.18378165364265442, -0.17571759223937988, -0.16765354573726654, -0.159589484333992, -0.15152542293071747, -0.14346136152744293, -0.1353973001241684, -0.12733323872089386, -0.11926918476819992, -0.11120512336492538, -0.10314106941223145, -0.09507700800895691, -0.08701294660568237, -0.07894888520240784, -0.0708848312497139, -0.06282076984643936, -0.05475671589374542, -0.046692654490470886, -0.03862859681248665, -0.03056453913450241, -0.022500477731227875, -0.014436420053243637, -0.006372362375259399, 0.0016916962340474129, 0.009755754843354225, 0.017819814383983612, 0.02588387206196785, 0.03394792973995209, 0.042011991143226624, 0.05007604882121086, 0.0581401064991951, 0.06620416790246964, 0.07426822185516357, 0.08233228325843811, 0.09039634466171265, 0.09846039861440659, 0.10652446001768112, 0.11458851397037506, 0.1226525753736496, 0.13071663677692413, 0.13878069818019867, 0.146844744682312, 0.15490880608558655, 0.16297286748886108, 0.17103692889213562, 0.17910099029541016, 0.1871650516986847, 0.19522911310195923, 0.20329317450523376, 0.2113572359085083, 0.21942128241062164, 0.22748534381389618, 0.23554940521717072, 0.24361346662044525, 0.2516775131225586]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 9.0, 9.0, 5.0, 21.0, 24.0, 40.0, 88.0, 96.0, 190.0, 355.0, 556.0, 1144.0, 2485.0, 5931.0, 16859.0, 55399.0, 201990.0, 444133.0, 226027.0, 62547.0, 18684.0, 6516.0, 2616.0, 1279.0, 640.0, 378.0, 192.0, 128.0, 70.0, 48.0, 34.0, 23.0, 12.0, 10.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068359375, -0.0659646987915039, -0.06357002258300781, -0.06117534637451172, -0.058780670166015625, -0.05638599395751953, -0.05399131774902344, -0.051596641540527344, -0.04920196533203125, -0.046807289123535156, -0.04441261291503906, -0.04201793670654297, -0.039623260498046875, -0.03722858428955078, -0.03483390808105469, -0.032439231872558594, -0.0300445556640625, -0.027649879455566406, -0.025255203247070312, -0.02286052703857422, -0.020465850830078125, -0.01807117462158203, -0.015676498413085938, -0.013281822204589844, -0.01088714599609375, -0.008492469787597656, -0.0060977935791015625, -0.0037031173706054688, -0.001308441162109375, 0.0010862350463867188, 0.0034809112548828125, 0.005875587463378906, 0.008270263671875, 0.010664939880371094, 0.013059616088867188, 0.015454292297363281, 0.017848968505859375, 0.02024364471435547, 0.022638320922851562, 0.025032997131347656, 0.02742767333984375, 0.029822349548339844, 0.03221702575683594, 0.03461170196533203, 0.037006378173828125, 0.03940105438232422, 0.04179573059082031, 0.044190406799316406, 0.0465850830078125, 0.048979759216308594, 0.05137443542480469, 0.05376911163330078, 0.056163787841796875, 0.05855846405029297, 0.06095314025878906, 0.06334781646728516, 0.06574249267578125, 0.06813716888427734, 0.07053184509277344, 0.07292652130126953, 0.07532119750976562, 0.07771587371826172, 0.08011054992675781, 0.0825052261352539, 0.08489990234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 11.0, 3.0, 8.0, 11.0, 16.0, 24.0, 22.0, 29.0, 39.0, 40.0, 63.0, 55.0, 65.0, 72.0, 73.0, 58.0, 55.0, 61.0, 61.0, 51.0, 50.0, 29.0, 18.0, 20.0, 16.0, 14.0, 10.0, 6.0, 8.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030426025390625, -0.029325485229492188, -0.028224945068359375, -0.027124404907226562, -0.02602386474609375, -0.024923324584960938, -0.023822784423828125, -0.022722244262695312, -0.0216217041015625, -0.020521163940429688, -0.019420623779296875, -0.018320083618164062, -0.01721954345703125, -0.016119003295898438, -0.015018463134765625, -0.013917922973632812, -0.0128173828125, -0.011716842651367188, -0.010616302490234375, -0.009515762329101562, -0.00841522216796875, -0.0073146820068359375, -0.006214141845703125, -0.0051136016845703125, -0.0040130615234375, -0.0029125213623046875, -0.001811981201171875, -0.0007114410400390625, 0.00038909912109375, 0.0014896392822265625, 0.002590179443359375, 0.0036907196044921875, 0.004791259765625, 0.0058917999267578125, 0.006992340087890625, 0.008092880249023438, 0.00919342041015625, 0.010293960571289062, 0.011394500732421875, 0.012495040893554688, 0.0135955810546875, 0.014696121215820312, 0.015796661376953125, 0.016897201538085938, 0.01799774169921875, 0.019098281860351562, 0.020198822021484375, 0.021299362182617188, 0.02239990234375, 0.023500442504882812, 0.024600982666015625, 0.025701522827148438, 0.02680206298828125, 0.027902603149414062, 0.029003143310546875, 0.030103683471679688, 0.0312042236328125, 0.03230476379394531, 0.033405303955078125, 0.03450584411621094, 0.03560638427734375, 0.03670692443847656, 0.037807464599609375, 0.03890800476074219, 0.040008544921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 22.0, 19.0, 36.0, 49.0, 92.0, 129.0, 219.0, 376.0, 933.0, 2784.0, 10387.0, 49946.0, 319766.0, 539617.0, 98756.0, 18254.0, 4413.0, 1443.0, 561.0, 284.0, 134.0, 75.0, 64.0, 55.0, 34.0, 18.0, 26.0, 10.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09283447265625, -0.0899505615234375, -0.087066650390625, -0.0841827392578125, -0.081298828125, -0.0784149169921875, -0.075531005859375, -0.0726470947265625, -0.06976318359375, -0.0668792724609375, -0.063995361328125, -0.0611114501953125, -0.0582275390625, -0.0553436279296875, -0.052459716796875, -0.0495758056640625, -0.04669189453125, -0.0438079833984375, -0.040924072265625, -0.0380401611328125, -0.03515625, -0.0322723388671875, -0.029388427734375, -0.0265045166015625, -0.02362060546875, -0.0207366943359375, -0.017852783203125, -0.0149688720703125, -0.0120849609375, -0.0092010498046875, -0.006317138671875, -0.0034332275390625, -0.00054931640625, 0.0023345947265625, 0.005218505859375, 0.0081024169921875, 0.010986328125, 0.0138702392578125, 0.016754150390625, 0.0196380615234375, 0.02252197265625, 0.0254058837890625, 0.028289794921875, 0.0311737060546875, 0.0340576171875, 0.0369415283203125, 0.039825439453125, 0.0427093505859375, 0.04559326171875, 0.0484771728515625, 0.051361083984375, 0.0542449951171875, 0.05712890625, 0.0600128173828125, 0.062896728515625, 0.0657806396484375, 0.06866455078125, 0.0715484619140625, 0.074432373046875, 0.0773162841796875, 0.0802001953125, 0.0830841064453125, 0.085968017578125, 0.0888519287109375, 0.09173583984375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 5.0, 9.0, 5.0, 9.0, 8.0, 11.0, 18.0, 22.0, 27.0, 26.0, 30.0, 32.0, 37.0, 35.0, 44.0, 41.0, 47.0, 34.0, 59.0, 52.0, 57.0, 37.0, 48.0, 43.0, 37.0, 36.0, 30.0, 27.0, 24.0, 29.0, 16.0, 13.0, 14.0, 8.0, 9.0, 3.0, 7.0, 3.0, 5.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09954833984375, -0.09619903564453125, -0.0928497314453125, -0.08950042724609375, -0.086151123046875, -0.08280181884765625, -0.0794525146484375, -0.07610321044921875, -0.07275390625, -0.06940460205078125, -0.0660552978515625, -0.06270599365234375, -0.059356689453125, -0.05600738525390625, -0.0526580810546875, -0.04930877685546875, -0.04595947265625, -0.04261016845703125, -0.0392608642578125, -0.03591156005859375, -0.032562255859375, -0.02921295166015625, -0.0258636474609375, -0.02251434326171875, -0.0191650390625, -0.01581573486328125, -0.0124664306640625, -0.00911712646484375, -0.005767822265625, -0.00241851806640625, 0.0009307861328125, 0.00428009033203125, 0.00762939453125, 0.01097869873046875, 0.0143280029296875, 0.01767730712890625, 0.021026611328125, 0.02437591552734375, 0.0277252197265625, 0.03107452392578125, 0.034423828125, 0.03777313232421875, 0.0411224365234375, 0.04447174072265625, 0.047821044921875, 0.05117034912109375, 0.0545196533203125, 0.05786895751953125, 0.06121826171875, 0.06456756591796875, 0.0679168701171875, 0.07126617431640625, 0.074615478515625, 0.07796478271484375, 0.0813140869140625, 0.08466339111328125, 0.0880126953125, 0.09136199951171875, 0.0947113037109375, 0.09806060791015625, 0.101409912109375, 0.10475921630859375, 0.1081085205078125, 0.11145782470703125, 0.11480712890625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 9.0, 17.0, 27.0, 30.0, 44.0, 59.0, 88.0, 154.0, 240.0, 433.0, 812.0, 1723.0, 4479.0, 19193.0, 235643.0, 724481.0, 48157.0, 8000.0, 2482.0, 1121.0, 574.0, 298.0, 155.0, 98.0, 68.0, 58.0, 39.0, 21.0, 23.0, 14.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05096435546875, -0.04902076721191406, -0.047077178955078125, -0.04513359069824219, -0.04319000244140625, -0.04124641418457031, -0.039302825927734375, -0.03735923767089844, -0.0354156494140625, -0.03347206115722656, -0.031528472900390625, -0.029584884643554688, -0.02764129638671875, -0.025697708129882812, -0.023754119873046875, -0.021810531616210938, -0.019866943359375, -0.017923355102539062, -0.015979766845703125, -0.014036178588867188, -0.01209259033203125, -0.010149002075195312, -0.008205413818359375, -0.0062618255615234375, -0.0043182373046875, -0.0023746490478515625, -0.000431060791015625, 0.0015125274658203125, 0.00345611572265625, 0.0053997039794921875, 0.007343292236328125, 0.009286880493164062, 0.01123046875, 0.013174057006835938, 0.015117645263671875, 0.017061233520507812, 0.01900482177734375, 0.020948410034179688, 0.022891998291015625, 0.024835586547851562, 0.0267791748046875, 0.028722763061523438, 0.030666351318359375, 0.03260993957519531, 0.03455352783203125, 0.03649711608886719, 0.038440704345703125, 0.04038429260253906, 0.042327880859375, 0.04427146911621094, 0.046215057373046875, 0.04815864562988281, 0.05010223388671875, 0.05204582214355469, 0.053989410400390625, 0.05593299865722656, 0.0578765869140625, 0.05982017517089844, 0.061763763427734375, 0.06370735168457031, 0.06565093994140625, 0.06759452819824219, 0.06953811645507812, 0.07148170471191406, 0.07342529296875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 9.0, 17.0, 28.0, 28.0, 38.0, 50.0, 50.0, 65.0, 59.0, 76.0, 79.0, 70.0, 68.0, 69.0, 80.0, 44.0, 38.0, 34.0, 16.0, 14.0, 11.0, 18.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-1.055002212524414e-05, -1.0295771062374115e-05, -1.004151999950409e-05, -9.787268936634064e-06, -9.533017873764038e-06, -9.278766810894012e-06, -9.024515748023987e-06, -8.770264685153961e-06, -8.516013622283936e-06, -8.26176255941391e-06, -8.007511496543884e-06, -7.753260433673859e-06, -7.499009370803833e-06, -7.244758307933807e-06, -6.990507245063782e-06, -6.736256182193756e-06, -6.4820051193237305e-06, -6.227754056453705e-06, -5.973502993583679e-06, -5.7192519307136536e-06, -5.465000867843628e-06, -5.210749804973602e-06, -4.956498742103577e-06, -4.702247679233551e-06, -4.447996616363525e-06, -4.1937455534935e-06, -3.939494490623474e-06, -3.6852434277534485e-06, -3.430992364883423e-06, -3.1767413020133972e-06, -2.9224902391433716e-06, -2.668239176273346e-06, -2.4139881134033203e-06, -2.1597370505332947e-06, -1.905485987663269e-06, -1.6512349247932434e-06, -1.3969838619232178e-06, -1.1427327990531921e-06, -8.884817361831665e-07, -6.342306733131409e-07, -3.7997961044311523e-07, -1.257285475730896e-07, 1.2852251529693604e-07, 3.8277357816696167e-07, 6.370246410369873e-07, 8.912757039070129e-07, 1.1455267667770386e-06, 1.3997778296470642e-06, 1.6540288925170898e-06, 1.9082799553871155e-06, 2.162531018257141e-06, 2.4167820811271667e-06, 2.6710331439971924e-06, 2.925284206867218e-06, 3.1795352697372437e-06, 3.4337863326072693e-06, 3.688037395477295e-06, 3.9422884583473206e-06, 4.196539521217346e-06, 4.450790584087372e-06, 4.7050416469573975e-06, 4.959292709827423e-06, 5.213543772697449e-06, 5.467794835567474e-06, 5.7220458984375e-06]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 10.0, 10.0, 11.0, 18.0, 37.0, 60.0, 121.0, 187.0, 323.0, 596.0, 1502.0, 4835.0, 44426.0, 883975.0, 101499.0, 7401.0, 1897.0, 772.0, 380.0, 208.0, 107.0, 61.0, 43.0, 29.0, 14.0, 8.0, 8.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.077880859375, -0.07525157928466797, -0.07262229919433594, -0.0699930191040039, -0.06736373901367188, -0.06473445892333984, -0.06210517883300781, -0.05947589874267578, -0.05684661865234375, -0.05421733856201172, -0.05158805847167969, -0.048958778381347656, -0.046329498291015625, -0.043700218200683594, -0.04107093811035156, -0.03844165802001953, -0.0358123779296875, -0.03318309783935547, -0.030553817749023438, -0.027924537658691406, -0.025295257568359375, -0.022665977478027344, -0.020036697387695312, -0.01740741729736328, -0.01477813720703125, -0.012148857116699219, -0.009519577026367188, -0.006890296936035156, -0.004261016845703125, -0.0016317367553710938, 0.0009975433349609375, 0.0036268234252929688, 0.006256103515625, 0.008885383605957031, 0.011514663696289062, 0.014143943786621094, 0.016773223876953125, 0.019402503967285156, 0.022031784057617188, 0.02466106414794922, 0.02729034423828125, 0.02991962432861328, 0.03254890441894531, 0.035178184509277344, 0.037807464599609375, 0.040436744689941406, 0.04306602478027344, 0.04569530487060547, 0.0483245849609375, 0.05095386505126953, 0.05358314514160156, 0.056212425231933594, 0.058841705322265625, 0.061470985412597656, 0.06410026550292969, 0.06672954559326172, 0.06935882568359375, 0.07198810577392578, 0.07461738586425781, 0.07724666595458984, 0.07987594604492188, 0.0825052261352539, 0.08513450622558594, 0.08776378631591797, 0.09039306640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 12.0, 19.0, 31.0, 111.0, 256.0, 285.0, 169.0, 74.0, 16.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1109619140625, -0.10689163208007812, -0.10282135009765625, -0.09875106811523438, -0.0946807861328125, -0.09061050415039062, -0.08654022216796875, -0.08246994018554688, -0.078399658203125, -0.07432937622070312, -0.07025909423828125, -0.06618881225585938, -0.0621185302734375, -0.058048248291015625, -0.05397796630859375, -0.049907684326171875, -0.04583740234375, -0.041767120361328125, -0.03769683837890625, -0.033626556396484375, -0.0295562744140625, -0.025485992431640625, -0.02141571044921875, -0.017345428466796875, -0.013275146484375, -0.009204864501953125, -0.00513458251953125, -0.001064300537109375, 0.0030059814453125, 0.007076263427734375, 0.01114654541015625, 0.015216827392578125, 0.019287109375, 0.023357391357421875, 0.02742767333984375, 0.031497955322265625, 0.0355682373046875, 0.039638519287109375, 0.04370880126953125, 0.047779083251953125, 0.051849365234375, 0.055919647216796875, 0.05998992919921875, 0.06406021118164062, 0.0681304931640625, 0.07220077514648438, 0.07627105712890625, 0.08034133911132812, 0.08441162109375, 0.08848190307617188, 0.09255218505859375, 0.09662246704101562, 0.1006927490234375, 0.10476303100585938, 0.10883331298828125, 0.11290359497070312, 0.116973876953125, 0.12104415893554688, 0.12511444091796875, 0.12918472290039062, 0.1332550048828125, 0.13732528686523438, 0.14139556884765625, 0.14546585083007812, 0.1495361328125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 13.0, 16.0, 37.0, 111.0, 168.0, 230.0, 197.0, 121.0, 55.0, 30.0, 15.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9257702827453613, -0.8955456018447876, -0.8653209209442139, -0.8350961804389954, -0.8048714995384216, -0.7746468186378479, -0.7444220781326294, -0.7141973972320557, -0.6839727163314819, -0.6537480354309082, -0.6235233545303345, -0.593298614025116, -0.5630739331245422, -0.5328492522239685, -0.50262451171875, -0.47239983081817627, -0.44217514991760254, -0.4119504690170288, -0.3817257583141327, -0.3515010476112366, -0.32127636671066284, -0.2910516858100891, -0.260826975107193, -0.23060227930545807, -0.20037758350372314, -0.17015288770198822, -0.1399281919002533, -0.10970349609851837, -0.07947880029678345, -0.04925410449504852, -0.0190294086933136, 0.011195287108421326, 0.04141998291015625, 0.07164467871189117, 0.1018693745136261, 0.13209407031536102, 0.16231876611709595, 0.19254346191883087, 0.2227681577205658, 0.2529928684234619, 0.28321754932403564, 0.3134422302246094, 0.3436669409275055, 0.3738916516304016, 0.40411633253097534, 0.4343410134315491, 0.4645657241344452, 0.4947904348373413, 0.525015115737915, 0.5552397966384888, 0.5854644775390625, 0.615689218044281, 0.6459138989448547, 0.6761385798454285, 0.706363320350647, 0.7365880012512207, 0.7668126821517944, 0.7970373630523682, 0.8272620439529419, 0.8574867844581604, 0.8877114653587341, 0.9179361462593079, 0.9481608867645264, 0.9783855676651001, 1.0086102485656738]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 8.0, 5.0, 10.0, 12.0, 7.0, 9.0, 16.0, 21.0, 27.0, 26.0, 34.0, 34.0, 31.0, 38.0, 45.0, 45.0, 48.0, 39.0, 53.0, 58.0, 50.0, 46.0, 44.0, 33.0, 40.0, 33.0, 29.0, 35.0, 22.0, 17.0, 18.0, 9.0, 13.0, 12.0, 9.0, 0.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6328655481338501, -0.6157649755477905, -0.5986643433570862, -0.5815637707710266, -0.564463198184967, -0.5473625659942627, -0.5302619934082031, -0.5131614208221436, -0.4960608184337616, -0.47896021604537964, -0.46185964345932007, -0.4447590410709381, -0.42765843868255615, -0.4105578660964966, -0.3934572637081146, -0.37635666131973267, -0.3592560887336731, -0.34215548634529114, -0.32505491375923157, -0.3079543113708496, -0.29085373878479004, -0.2737531363964081, -0.2566525340080261, -0.23955194652080536, -0.2224513590335846, -0.20535077154636383, -0.18825018405914307, -0.1711495816707611, -0.15404899418354034, -0.13694840669631958, -0.11984781175851822, -0.10274721682071686, -0.0856466293334961, -0.06854604184627533, -0.05144544690847397, -0.034344855695962906, -0.017244264483451843, -0.0001436769962310791, 0.016956917941570282, 0.03405751287937164, 0.05115810036659241, 0.06825868785381317, 0.08535928279161453, 0.1024598777294159, 0.11956046521663666, 0.13666105270385742, 0.15376165509223938, 0.17086224257946014, 0.1879628300666809, 0.20506341755390167, 0.22216400504112244, 0.2392646074295044, 0.25636518001556396, 0.2734657824039459, 0.2905663847923279, 0.30766695737838745, 0.3247675597667694, 0.34186816215515137, 0.35896873474121094, 0.3760693371295929, 0.39316993951797485, 0.4102705121040344, 0.4273711144924164, 0.44447171688079834, 0.4615722894668579]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 9.0, 8.0, 16.0, 34.0, 37.0, 91.0, 166.0, 298.0, 658.0, 3342.0, 100203.0, 4081822.0, 5903.0, 937.0, 333.0, 167.0, 97.0, 63.0, 44.0, 21.0, 10.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.26868629455566406, -0.2612495422363281, -0.2538127899169922, -0.24637603759765625, -0.2389392852783203, -0.23150253295898438, -0.22406578063964844, -0.2166290283203125, -0.20919227600097656, -0.20175552368164062, -0.1943187713623047, -0.18688201904296875, -0.1794452667236328, -0.17200851440429688, -0.16457176208496094, -0.157135009765625, -0.14969825744628906, -0.14226150512695312, -0.1348247528076172, -0.12738800048828125, -0.11995124816894531, -0.11251449584960938, -0.10507774353027344, -0.0976409912109375, -0.09020423889160156, -0.08276748657226562, -0.07533073425292969, -0.06789398193359375, -0.06045722961425781, -0.053020477294921875, -0.04558372497558594, -0.03814697265625, -0.030710220336914062, -0.023273468017578125, -0.015836715698242188, -0.00839996337890625, -0.0009632110595703125, 0.006473541259765625, 0.013910293579101562, 0.0213470458984375, 0.028783798217773438, 0.036220550537109375, 0.04365730285644531, 0.05109405517578125, 0.05853080749511719, 0.06596755981445312, 0.07340431213378906, 0.080841064453125, 0.08827781677246094, 0.09571456909179688, 0.10315132141113281, 0.11058807373046875, 0.11802482604980469, 0.12546157836914062, 0.13289833068847656, 0.1403350830078125, 0.14777183532714844, 0.15520858764648438, 0.1626453399658203, 0.17008209228515625, 0.1775188446044922, 0.18495559692382812, 0.19239234924316406, 0.1998291015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 8.0, 5.0, 13.0, 15.0, 22.0, 26.0, 25.0, 38.0, 44.0, 52.0, 59.0, 59.0, 53.0, 67.0, 76.0, 50.0, 55.0, 53.0, 38.0, 41.0, 36.0, 38.0, 22.0, 25.0, 12.0, 11.0, 17.0, 6.0, 6.0, 3.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02886962890625, -0.027765274047851562, -0.026660919189453125, -0.025556564331054688, -0.02445220947265625, -0.023347854614257812, -0.022243499755859375, -0.021139144897460938, -0.0200347900390625, -0.018930435180664062, -0.017826080322265625, -0.016721725463867188, -0.01561737060546875, -0.014513015747070312, -0.013408660888671875, -0.012304306030273438, -0.011199951171875, -0.010095596313476562, -0.008991241455078125, -0.007886886596679688, -0.00678253173828125, -0.0056781768798828125, -0.004573822021484375, -0.0034694671630859375, -0.0023651123046875, -0.0012607574462890625, -0.000156402587890625, 0.0009479522705078125, 0.00205230712890625, 0.0031566619873046875, 0.004261016845703125, 0.0053653717041015625, 0.0064697265625, 0.0075740814208984375, 0.008678436279296875, 0.009782791137695312, 0.01088714599609375, 0.011991500854492188, 0.013095855712890625, 0.014200210571289062, 0.0153045654296875, 0.016408920288085938, 0.017513275146484375, 0.018617630004882812, 0.01972198486328125, 0.020826339721679688, 0.021930694580078125, 0.023035049438476562, 0.024139404296875, 0.025243759155273438, 0.026348114013671875, 0.027452468872070312, 0.02855682373046875, 0.029661178588867188, 0.030765533447265625, 0.03186988830566406, 0.0329742431640625, 0.03407859802246094, 0.035182952880859375, 0.03628730773925781, 0.03739166259765625, 0.03849601745605469, 0.039600372314453125, 0.04070472717285156, 0.04180908203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 6.0, 17.0, 11.0, 26.0, 26.0, 35.0, 45.0, 87.0, 146.0, 232.0, 554.0, 1508.0, 5461.0, 105282.0, 4065370.0, 11871.0, 2287.0, 644.0, 270.0, 137.0, 80.0, 59.0, 29.0, 19.0, 17.0, 19.0, 5.0, 7.0, 7.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1729736328125, -0.16724586486816406, -0.16151809692382812, -0.1557903289794922, -0.15006256103515625, -0.1443347930908203, -0.13860702514648438, -0.13287925720214844, -0.1271514892578125, -0.12142372131347656, -0.11569595336914062, -0.10996818542480469, -0.10424041748046875, -0.09851264953613281, -0.09278488159179688, -0.08705711364746094, -0.081329345703125, -0.07560157775878906, -0.06987380981445312, -0.06414604187011719, -0.05841827392578125, -0.05269050598144531, -0.046962738037109375, -0.04123497009277344, -0.0355072021484375, -0.029779434204101562, -0.024051666259765625, -0.018323898315429688, -0.01259613037109375, -0.0068683624267578125, -0.001140594482421875, 0.0045871734619140625, 0.01031494140625, 0.016042709350585938, 0.021770477294921875, 0.027498245239257812, 0.03322601318359375, 0.03895378112792969, 0.044681549072265625, 0.05040931701660156, 0.0561370849609375, 0.06186485290527344, 0.06759262084960938, 0.07332038879394531, 0.07904815673828125, 0.08477592468261719, 0.09050369262695312, 0.09623146057128906, 0.101959228515625, 0.10768699645996094, 0.11341476440429688, 0.11914253234863281, 0.12487030029296875, 0.1305980682373047, 0.13632583618164062, 0.14205360412597656, 0.1477813720703125, 0.15350914001464844, 0.15923690795898438, 0.1649646759033203, 0.17069244384765625, 0.1764202117919922, 0.18214797973632812, 0.18787574768066406, 0.193603515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 17.0, 26.0, 64.0, 229.0, 3470.0, 158.0, 56.0, 16.0, 10.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035308837890625, -0.03451383113861084, -0.03371882438659668, -0.03292381763458252, -0.03212881088256836, -0.0313338041305542, -0.03053879737854004, -0.02974379062652588, -0.02894878387451172, -0.02815377712249756, -0.0273587703704834, -0.02656376361846924, -0.025768756866455078, -0.024973750114440918, -0.024178743362426758, -0.023383736610412598, -0.022588729858398438, -0.021793723106384277, -0.020998716354370117, -0.020203709602355957, -0.019408702850341797, -0.018613696098327637, -0.017818689346313477, -0.017023682594299316, -0.016228675842285156, -0.015433669090270996, -0.014638662338256836, -0.013843655586242676, -0.013048648834228516, -0.012253642082214355, -0.011458635330200195, -0.010663628578186035, -0.009868621826171875, -0.009073615074157715, -0.008278608322143555, -0.0074836015701293945, -0.006688594818115234, -0.005893588066101074, -0.005098581314086914, -0.004303574562072754, -0.0035085678100585938, -0.0027135610580444336, -0.0019185543060302734, -0.0011235475540161133, -0.0003285408020019531, 0.00046646595001220703, 0.0012614727020263672, 0.0020564794540405273, 0.0028514862060546875, 0.0036464929580688477, 0.004441499710083008, 0.005236506462097168, 0.006031513214111328, 0.006826519966125488, 0.0076215267181396484, 0.008416533470153809, 0.009211540222167969, 0.010006546974182129, 0.010801553726196289, 0.01159656047821045, 0.01239156723022461, 0.01318657398223877, 0.01398158073425293, 0.01477658748626709, 0.01557159423828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 7.0, 29.0, 88.0, 180.0, 303.0, 273.0, 93.0, 20.0, 9.0, 3.0, 3.0], "bins": [-0.3543626666069031, -0.3482592701911926, -0.3421558439731598, -0.33605244755744934, -0.3299490213394165, -0.32384562492370605, -0.3177422285079956, -0.31163880228996277, -0.3055354058742523, -0.29943200945854187, -0.29332858324050903, -0.2872251868247986, -0.28112176060676575, -0.2750183641910553, -0.26891496777534485, -0.262811541557312, -0.25670814514160156, -0.2506047487258911, -0.24450132250785828, -0.23839792609214783, -0.23229451477527618, -0.22619110345840454, -0.2200876921415329, -0.21398428082466125, -0.2078808695077896, -0.20177745819091797, -0.19567404687404633, -0.18957065045833588, -0.18346723914146423, -0.1773638278245926, -0.17126041650772095, -0.1651570200920105, -0.15905362367630005, -0.1529502123594284, -0.14684680104255676, -0.1407434046268463, -0.13463999330997467, -0.12853658199310303, -0.12243317067623138, -0.11632976680994034, -0.1102263554930687, -0.10412294417619705, -0.098019540309906, -0.09191612899303436, -0.08581272512674332, -0.07970931380987167, -0.07360590994358063, -0.06750249862670898, -0.06139909103512764, -0.055295683443546295, -0.04919227585196495, -0.043088868260383606, -0.03698545694351196, -0.030882051214575768, -0.024778641760349274, -0.01867523416876793, -0.012571826577186584, -0.0064684185199439526, -0.00036501046270132065, 0.005738398060202599, 0.011841805651783943, 0.017945213243365288, 0.02404862269759178, 0.030152030289173126, 0.03625543788075447]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 11.0, 10.0, 20.0, 13.0, 23.0, 16.0, 29.0, 37.0, 27.0, 28.0, 36.0, 40.0, 48.0, 51.0, 45.0, 39.0, 45.0, 54.0, 52.0, 51.0, 36.0, 31.0, 37.0, 24.0, 28.0, 34.0, 20.0, 25.0, 19.0, 11.0, 12.0, 12.0, 5.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.06473273038864136, -0.06307819485664368, -0.06142366677522659, -0.05976913124322891, -0.05811459943652153, -0.05646006762981415, -0.05480553209781647, -0.053151000291109085, -0.0514964684844017, -0.04984193667769432, -0.04818740487098694, -0.04653286933898926, -0.044878337532281876, -0.04322380572557449, -0.04156927019357681, -0.03991473838686943, -0.03826020658016205, -0.036605674773454666, -0.034951142966747284, -0.0332966074347496, -0.03164207562804222, -0.02998754382133484, -0.028333010151982307, -0.026678476482629776, -0.025023944675922394, -0.02336941286921501, -0.02171487919986248, -0.02006034553050995, -0.018405813723802567, -0.016751281917095184, -0.015096748247742653, -0.013442215509712696, -0.01178768277168274, -0.010133150033652782, -0.008478617295622826, -0.006824084557592869, -0.005169551819562912, -0.003515019081532955, -0.0018604863435029984, -0.00020595360547304153, 0.0014485791325569153, 0.003103111870586872, 0.004757644608616829, 0.006412177346646786, 0.008066710084676743, 0.0097212428227067, 0.011375775560736656, 0.013030308298766613, 0.01468484103679657, 0.016339372843503952, 0.017993906512856483, 0.019648440182209015, 0.021302971988916397, 0.02295750379562378, 0.02461203746497631, 0.026266571134328842, 0.027921102941036224, 0.029575634747743607, 0.031230168417096138, 0.03288470208644867, 0.03453923389315605, 0.036193765699863434, 0.037848301231861115, 0.0395028330385685, 0.04115736484527588]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 8.0, 3.0, 8.0, 9.0, 14.0, 14.0, 35.0, 62.0, 84.0, 102.0, 200.0, 273.0, 424.0, 769.0, 1295.0, 2504.0, 4800.0, 10111.0, 21928.0, 50984.0, 121090.0, 259910.0, 297476.0, 157019.0, 65668.0, 28175.0, 12699.0, 5881.0, 2995.0, 1621.0, 908.0, 525.0, 341.0, 209.0, 131.0, 91.0, 81.0, 40.0, 26.0, 11.0, 6.0, 11.0, 3.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.05487060546875, -0.053109169006347656, -0.05134773254394531, -0.04958629608154297, -0.047824859619140625, -0.04606342315673828, -0.04430198669433594, -0.042540550231933594, -0.04077911376953125, -0.039017677307128906, -0.03725624084472656, -0.03549480438232422, -0.033733367919921875, -0.03197193145751953, -0.030210494995117188, -0.028449058532714844, -0.0266876220703125, -0.024926185607910156, -0.023164749145507812, -0.02140331268310547, -0.019641876220703125, -0.01788043975830078, -0.016119003295898438, -0.014357566833496094, -0.01259613037109375, -0.010834693908691406, -0.009073257446289062, -0.007311820983886719, -0.005550384521484375, -0.0037889480590820312, -0.0020275115966796875, -0.00026607513427734375, 0.001495361328125, 0.0032567977905273438, 0.0050182342529296875, 0.006779670715332031, 0.008541107177734375, 0.010302543640136719, 0.012063980102539062, 0.013825416564941406, 0.01558685302734375, 0.017348289489746094, 0.019109725952148438, 0.02087116241455078, 0.022632598876953125, 0.02439403533935547, 0.026155471801757812, 0.027916908264160156, 0.0296783447265625, 0.031439781188964844, 0.03320121765136719, 0.03496265411376953, 0.036724090576171875, 0.03848552703857422, 0.04024696350097656, 0.042008399963378906, 0.04376983642578125, 0.045531272888183594, 0.04729270935058594, 0.04905414581298828, 0.050815582275390625, 0.05257701873779297, 0.05433845520019531, 0.056099891662597656, 0.057861328125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 13.0, 7.0, 19.0, 11.0, 17.0, 21.0, 17.0, 26.0, 46.0, 38.0, 46.0, 50.0, 56.0, 41.0, 58.0, 41.0, 58.0, 51.0, 41.0, 37.0, 46.0, 47.0, 34.0, 25.0, 24.0, 26.0, 18.0, 15.0, 13.0, 13.0, 12.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03155517578125, -0.030458927154541016, -0.02936267852783203, -0.028266429901123047, -0.027170181274414062, -0.026073932647705078, -0.024977684020996094, -0.02388143539428711, -0.022785186767578125, -0.02168893814086914, -0.020592689514160156, -0.019496440887451172, -0.018400192260742188, -0.017303943634033203, -0.01620769500732422, -0.015111446380615234, -0.01401519775390625, -0.012918949127197266, -0.011822700500488281, -0.010726451873779297, -0.009630203247070312, -0.008533954620361328, -0.007437705993652344, -0.006341457366943359, -0.005245208740234375, -0.004148960113525391, -0.0030527114868164062, -0.001956462860107422, -0.0008602142333984375, 0.00023603439331054688, 0.0013322830200195312, 0.0024285316467285156, 0.0035247802734375, 0.004621028900146484, 0.005717277526855469, 0.006813526153564453, 0.007909774780273438, 0.009006023406982422, 0.010102272033691406, 0.01119852066040039, 0.012294769287109375, 0.01339101791381836, 0.014487266540527344, 0.015583515167236328, 0.016679763793945312, 0.017776012420654297, 0.01887226104736328, 0.019968509674072266, 0.02106475830078125, 0.022161006927490234, 0.02325725555419922, 0.024353504180908203, 0.025449752807617188, 0.026546001434326172, 0.027642250061035156, 0.02873849868774414, 0.029834747314453125, 0.03093099594116211, 0.032027244567871094, 0.03312349319458008, 0.03421974182128906, 0.03531599044799805, 0.03641223907470703, 0.037508487701416016, 0.038604736328125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 5.0, 15.0, 16.0, 46.0, 73.0, 133.0, 179.0, 294.0, 696.0, 2481.0, 16052.0, 210272.0, 736010.0, 72695.0, 6984.0, 1413.0, 514.0, 246.0, 156.0, 103.0, 57.0, 39.0, 28.0, 19.0, 15.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.1730947494506836, -0.1684551239013672, -0.16381549835205078, -0.15917587280273438, -0.15453624725341797, -0.14989662170410156, -0.14525699615478516, -0.14061737060546875, -0.13597774505615234, -0.13133811950683594, -0.12669849395751953, -0.12205886840820312, -0.11741924285888672, -0.11277961730957031, -0.1081399917602539, -0.1035003662109375, -0.0988607406616211, -0.09422111511230469, -0.08958148956298828, -0.08494186401367188, -0.08030223846435547, -0.07566261291503906, -0.07102298736572266, -0.06638336181640625, -0.061743736267089844, -0.05710411071777344, -0.05246448516845703, -0.047824859619140625, -0.04318523406982422, -0.03854560852050781, -0.033905982971191406, -0.029266357421875, -0.024626731872558594, -0.019987106323242188, -0.015347480773925781, -0.010707855224609375, -0.006068229675292969, -0.0014286041259765625, 0.0032110214233398438, 0.00785064697265625, 0.012490272521972656, 0.017129898071289062, 0.02176952362060547, 0.026409149169921875, 0.03104877471923828, 0.03568840026855469, 0.040328025817871094, 0.0449676513671875, 0.049607276916503906, 0.05424690246582031, 0.05888652801513672, 0.06352615356445312, 0.06816577911376953, 0.07280540466308594, 0.07744503021240234, 0.08208465576171875, 0.08672428131103516, 0.09136390686035156, 0.09600353240966797, 0.10064315795898438, 0.10528278350830078, 0.10992240905761719, 0.1145620346069336, 0.11920166015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 15.0, 17.0, 27.0, 46.0, 56.0, 52.0, 73.0, 64.0, 83.0, 96.0, 79.0, 71.0, 70.0, 68.0, 43.0, 57.0, 32.0, 14.0, 12.0, 9.0, 11.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2763671875, -0.2687797546386719, -0.26119232177734375, -0.2536048889160156, -0.2460174560546875, -0.23843002319335938, -0.23084259033203125, -0.22325515747070312, -0.215667724609375, -0.20808029174804688, -0.20049285888671875, -0.19290542602539062, -0.1853179931640625, -0.17773056030273438, -0.17014312744140625, -0.16255569458007812, -0.15496826171875, -0.14738082885742188, -0.13979339599609375, -0.13220596313476562, -0.1246185302734375, -0.11703109741210938, -0.10944366455078125, -0.10185623168945312, -0.094268798828125, -0.08668136596679688, -0.07909393310546875, -0.07150650024414062, -0.0639190673828125, -0.056331634521484375, -0.04874420166015625, -0.041156768798828125, -0.0335693359375, -0.025981903076171875, -0.01839447021484375, -0.010807037353515625, -0.0032196044921875, 0.004367828369140625, 0.01195526123046875, 0.019542694091796875, 0.027130126953125, 0.034717559814453125, 0.04230499267578125, 0.049892425537109375, 0.0574798583984375, 0.06506729125976562, 0.07265472412109375, 0.08024215698242188, 0.08782958984375, 0.09541702270507812, 0.10300445556640625, 0.11059188842773438, 0.1181793212890625, 0.12576675415039062, 0.13335418701171875, 0.14094161987304688, 0.148529052734375, 0.15611648559570312, 0.16370391845703125, 0.17129135131835938, 0.1788787841796875, 0.18646621704101562, 0.19405364990234375, 0.20164108276367188, 0.209228515625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 8.0, 7.0, 9.0, 12.0, 20.0, 26.0, 47.0, 86.0, 193.0, 464.0, 1540.0, 6925.0, 48350.0, 617808.0, 339189.0, 27571.0, 4448.0, 1144.0, 360.0, 150.0, 80.0, 48.0, 22.0, 11.0, 13.0, 3.0, 4.0, 8.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05877685546875, -0.05709123611450195, -0.055405616760253906, -0.05371999740600586, -0.05203437805175781, -0.050348758697509766, -0.04866313934326172, -0.04697751998901367, -0.045291900634765625, -0.04360628128051758, -0.04192066192626953, -0.040235042572021484, -0.03854942321777344, -0.03686380386352539, -0.035178184509277344, -0.0334925651550293, -0.03180694580078125, -0.030121326446533203, -0.028435707092285156, -0.02675008773803711, -0.025064468383789062, -0.023378849029541016, -0.02169322967529297, -0.020007610321044922, -0.018321990966796875, -0.016636371612548828, -0.014950752258300781, -0.013265132904052734, -0.011579513549804688, -0.00989389419555664, -0.008208274841308594, -0.006522655487060547, -0.0048370361328125, -0.003151416778564453, -0.0014657974243164062, 0.00021982192993164062, 0.0019054412841796875, 0.0035910606384277344, 0.005276679992675781, 0.006962299346923828, 0.008647918701171875, 0.010333538055419922, 0.012019157409667969, 0.013704776763916016, 0.015390396118164062, 0.01707601547241211, 0.018761634826660156, 0.020447254180908203, 0.02213287353515625, 0.023818492889404297, 0.025504112243652344, 0.02718973159790039, 0.028875350952148438, 0.030560970306396484, 0.03224658966064453, 0.03393220901489258, 0.035617828369140625, 0.03730344772338867, 0.03898906707763672, 0.040674686431884766, 0.04236030578613281, 0.04404592514038086, 0.045731544494628906, 0.04741716384887695, 0.049102783203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 6.0, 12.0, 8.0, 20.0, 31.0, 34.0, 39.0, 39.0, 41.0, 73.0, 67.0, 76.0, 69.0, 60.0, 79.0, 57.0, 51.0, 39.0, 39.0, 41.0, 19.0, 23.0, 17.0, 12.0, 13.0, 9.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.165836334228516e-06, -7.915310561656952e-06, -7.664784789085388e-06, -7.4142590165138245e-06, -7.163733243942261e-06, -6.913207471370697e-06, -6.662681698799133e-06, -6.41215592622757e-06, -6.161630153656006e-06, -5.911104381084442e-06, -5.660578608512878e-06, -5.410052835941315e-06, -5.159527063369751e-06, -4.909001290798187e-06, -4.6584755182266235e-06, -4.40794974565506e-06, -4.157423973083496e-06, -3.906898200511932e-06, -3.6563724279403687e-06, -3.405846655368805e-06, -3.155320882797241e-06, -2.9047951102256775e-06, -2.6542693376541138e-06, -2.40374356508255e-06, -2.1532177925109863e-06, -1.9026920199394226e-06, -1.6521662473678589e-06, -1.4016404747962952e-06, -1.1511147022247314e-06, -9.005889296531677e-07, -6.50063157081604e-07, -3.995373845100403e-07, -1.4901161193847656e-07, 1.0151416063308716e-07, 3.520399332046509e-07, 6.025657057762146e-07, 8.530914783477783e-07, 1.103617250919342e-06, 1.3541430234909058e-06, 1.6046687960624695e-06, 1.8551945686340332e-06, 2.105720341205597e-06, 2.3562461137771606e-06, 2.6067718863487244e-06, 2.857297658920288e-06, 3.107823431491852e-06, 3.3583492040634155e-06, 3.6088749766349792e-06, 3.859400749206543e-06, 4.109926521778107e-06, 4.36045229434967e-06, 4.610978066921234e-06, 4.861503839492798e-06, 5.1120296120643616e-06, 5.362555384635925e-06, 5.613081157207489e-06, 5.863606929779053e-06, 6.1141327023506165e-06, 6.36465847492218e-06, 6.615184247493744e-06, 6.865710020065308e-06, 7.116235792636871e-06, 7.366761565208435e-06, 7.617287337779999e-06, 7.867813110351562e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 5.0, 14.0, 18.0, 28.0, 30.0, 35.0, 79.0, 109.0, 184.0, 259.0, 574.0, 1071.0, 2383.0, 6006.0, 18221.0, 69730.0, 328798.0, 469875.0, 110824.0, 26080.0, 8144.0, 3119.0, 1408.0, 653.0, 318.0, 205.0, 133.0, 85.0, 58.0, 37.0, 19.0, 10.0, 9.0, 14.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0282745361328125, -0.027270078659057617, -0.026265621185302734, -0.02526116371154785, -0.02425670623779297, -0.023252248764038086, -0.022247791290283203, -0.02124333381652832, -0.020238876342773438, -0.019234418869018555, -0.018229961395263672, -0.01722550392150879, -0.016221046447753906, -0.015216588973999023, -0.01421213150024414, -0.013207674026489258, -0.012203216552734375, -0.011198759078979492, -0.01019430160522461, -0.009189844131469727, -0.008185386657714844, -0.007180929183959961, -0.006176471710205078, -0.005172014236450195, -0.0041675567626953125, -0.0031630992889404297, -0.002158641815185547, -0.001154184341430664, -0.00014972686767578125, 0.0008547306060791016, 0.0018591880798339844, 0.002863645553588867, 0.00386810302734375, 0.004872560501098633, 0.005877017974853516, 0.0068814754486083984, 0.007885932922363281, 0.008890390396118164, 0.009894847869873047, 0.01089930534362793, 0.011903762817382812, 0.012908220291137695, 0.013912677764892578, 0.014917135238647461, 0.015921592712402344, 0.016926050186157227, 0.01793050765991211, 0.018934965133666992, 0.019939422607421875, 0.020943880081176758, 0.02194833755493164, 0.022952795028686523, 0.023957252502441406, 0.02496170997619629, 0.025966167449951172, 0.026970624923706055, 0.027975082397460938, 0.02897953987121582, 0.029983997344970703, 0.030988454818725586, 0.03199291229248047, 0.03299736976623535, 0.034001827239990234, 0.03500628471374512, 0.0360107421875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 0.0, 3.0, 6.0, 15.0, 14.0, 28.0, 51.0, 82.0, 100.0, 117.0, 144.0, 129.0, 95.0, 79.0, 43.0, 34.0, 27.0, 14.0, 8.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041168212890625, -0.039327144622802734, -0.03748607635498047, -0.0356450080871582, -0.03380393981933594, -0.03196287155151367, -0.030121803283691406, -0.02828073501586914, -0.026439666748046875, -0.02459859848022461, -0.022757530212402344, -0.020916461944580078, -0.019075393676757812, -0.017234325408935547, -0.015393257141113281, -0.013552188873291016, -0.01171112060546875, -0.009870052337646484, -0.008028984069824219, -0.006187915802001953, -0.0043468475341796875, -0.002505779266357422, -0.0006647109985351562, 0.0011763572692871094, 0.003017425537109375, 0.004858493804931641, 0.006699562072753906, 0.008540630340576172, 0.010381698608398438, 0.012222766876220703, 0.014063835144042969, 0.015904903411865234, 0.0177459716796875, 0.019587039947509766, 0.02142810821533203, 0.023269176483154297, 0.025110244750976562, 0.026951313018798828, 0.028792381286621094, 0.03063344955444336, 0.032474517822265625, 0.03431558609008789, 0.036156654357910156, 0.03799772262573242, 0.03983879089355469, 0.04167985916137695, 0.04352092742919922, 0.045361995697021484, 0.04720306396484375, 0.049044132232666016, 0.05088520050048828, 0.05272626876831055, 0.05456733703613281, 0.05640840530395508, 0.058249473571777344, 0.06009054183959961, 0.061931610107421875, 0.06377267837524414, 0.0656137466430664, 0.06745481491088867, 0.06929588317871094, 0.0711369514465332, 0.07297801971435547, 0.07481908798217773, 0.07666015625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [3.0, 11.0, 48.0, 121.0, 303.0, 315.0, 156.0, 40.0, 18.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28202515840530396, -0.2264825403690338, -0.17093992233276367, -0.11539728939533234, -0.059854671359062195, -0.004312038421630859, 0.05123057961463928, 0.10677319765090942, 0.16231581568717957, 0.2178584337234497, 0.27340105175971985, 0.32894366979599, 0.3844863176345825, 0.44002893567085266, 0.4955715537071228, 0.5511142015457153, 0.6066567897796631, 0.6621994376182556, 0.7177420258522034, 0.7732846736907959, 0.8288272619247437, 0.8843699097633362, 0.9399125576019287, 0.9954551458358765, 1.0509977340698242, 1.106540322303772, 1.1620830297470093, 1.217625617980957, 1.2731682062149048, 1.3287107944488525, 1.3842535018920898, 1.4397960901260376, 1.495338797569275, 1.5508813858032227, 1.60642409324646, 1.6619666814804077, 1.7175092697143555, 1.7730519771575928, 1.8285945653915405, 1.8841371536254883, 1.939679741859436, 1.9952223300933838, 2.050765037536621, 2.1063075065612793, 2.1618502140045166, 2.217392921447754, 2.272935390472412, 2.3284780979156494, 2.3840208053588867, 2.439563512802124, 2.4951059818267822, 2.5506486892700195, 2.606191396713257, 2.661733865737915, 2.7172765731811523, 2.7728190422058105, 2.828361749649048, 2.883904457092285, 2.9394469261169434, 2.9949896335601807, 3.050532341003418, 3.106074810028076, 3.1616175174713135, 3.217160224914551, 3.272702693939209]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 17.0, 10.0, 11.0, 21.0, 20.0, 17.0, 31.0, 26.0, 38.0, 40.0, 48.0, 30.0, 45.0, 50.0, 48.0, 41.0, 46.0, 50.0, 36.0, 45.0, 41.0, 41.0, 26.0, 36.0, 23.0, 25.0, 15.0, 23.0, 18.0, 13.0, 6.0, 8.0, 8.0, 8.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.7527416944503784, -0.7315936088562012, -0.7104455232620239, -0.6892974376678467, -0.6681493520736694, -0.6470012664794922, -0.6258531808853149, -0.6047050952911377, -0.5835570096969604, -0.5624089241027832, -0.541260838508606, -0.5201127529144287, -0.49896466732025146, -0.4778165817260742, -0.456668496131897, -0.4355204105377197, -0.4143723249435425, -0.39322423934936523, -0.372076153755188, -0.35092806816101074, -0.3297799825668335, -0.30863189697265625, -0.287483811378479, -0.26633572578430176, -0.2451876401901245, -0.22403955459594727, -0.20289146900177002, -0.18174338340759277, -0.16059529781341553, -0.13944721221923828, -0.11829912662506104, -0.09715104103088379, -0.07600289583206177, -0.05485481023788452, -0.033706724643707275, -0.01255863904953003, 0.008589446544647217, 0.029737532138824463, 0.05088561773300171, 0.07203370332717896, 0.0931817889213562, 0.11432987451553345, 0.1354779601097107, 0.15662604570388794, 0.17777413129806519, 0.19892221689224243, 0.22007030248641968, 0.24121838808059692, 0.26236647367477417, 0.2835145592689514, 0.30466264486312866, 0.3258107304573059, 0.34695881605148315, 0.3681069016456604, 0.38925498723983765, 0.4104030728340149, 0.43155115842819214, 0.4526992440223694, 0.47384732961654663, 0.4949954152107239, 0.5161435008049011, 0.5372915863990784, 0.5584396719932556, 0.5795877575874329, 0.6007358431816101]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 15.0, 22.0, 31.0, 51.0, 121.0, 221.0, 477.0, 1136.0, 3644.0, 22536.0, 4079913.0, 76152.0, 6905.0, 1774.0, 675.0, 275.0, 137.0, 84.0, 44.0, 17.0, 13.0, 7.0, 14.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1177978515625, -0.1143026351928711, -0.11080741882324219, -0.10731220245361328, -0.10381698608398438, -0.10032176971435547, -0.09682655334472656, -0.09333133697509766, -0.08983612060546875, -0.08634090423583984, -0.08284568786621094, -0.07935047149658203, -0.07585525512695312, -0.07236003875732422, -0.06886482238769531, -0.0653696060180664, -0.0618743896484375, -0.058379173278808594, -0.05488395690917969, -0.05138874053955078, -0.047893524169921875, -0.04439830780029297, -0.04090309143066406, -0.037407875061035156, -0.03391265869140625, -0.030417442321777344, -0.026922225952148438, -0.02342700958251953, -0.019931793212890625, -0.01643657684326172, -0.012941360473632812, -0.009446144104003906, -0.005950927734375, -0.0024557113647460938, 0.0010395050048828125, 0.004534721374511719, 0.008029937744140625, 0.011525154113769531, 0.015020370483398438, 0.018515586853027344, 0.02201080322265625, 0.025506019592285156, 0.029001235961914062, 0.03249645233154297, 0.035991668701171875, 0.03948688507080078, 0.04298210144042969, 0.046477317810058594, 0.0499725341796875, 0.053467750549316406, 0.05696296691894531, 0.06045818328857422, 0.06395339965820312, 0.06744861602783203, 0.07094383239746094, 0.07443904876708984, 0.07793426513671875, 0.08142948150634766, 0.08492469787597656, 0.08841991424560547, 0.09191513061523438, 0.09541034698486328, 0.09890556335449219, 0.1024007797241211, 0.10589599609375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 11.0, 13.0, 13.0, 19.0, 25.0, 33.0, 37.0, 35.0, 44.0, 52.0, 50.0, 51.0, 51.0, 43.0, 55.0, 46.0, 58.0, 40.0, 48.0, 36.0, 41.0, 31.0, 34.0, 20.0, 13.0, 16.0, 12.0, 10.0, 8.0, 10.0, 7.0, 6.0, 0.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0308685302734375, -0.029770612716674805, -0.02867269515991211, -0.027574777603149414, -0.02647686004638672, -0.025378942489624023, -0.024281024932861328, -0.023183107376098633, -0.022085189819335938, -0.020987272262573242, -0.019889354705810547, -0.01879143714904785, -0.017693519592285156, -0.01659560203552246, -0.015497684478759766, -0.01439976692199707, -0.013301849365234375, -0.01220393180847168, -0.011106014251708984, -0.010008096694946289, -0.008910179138183594, -0.0078122615814208984, -0.006714344024658203, -0.005616426467895508, -0.0045185089111328125, -0.003420591354370117, -0.002322673797607422, -0.0012247562408447266, -0.00012683868408203125, 0.0009710788726806641, 0.0020689964294433594, 0.0031669139862060547, 0.00426483154296875, 0.005362749099731445, 0.006460666656494141, 0.007558584213256836, 0.008656501770019531, 0.009754419326782227, 0.010852336883544922, 0.011950254440307617, 0.013048171997070312, 0.014146089553833008, 0.015244007110595703, 0.0163419246673584, 0.017439842224121094, 0.01853775978088379, 0.019635677337646484, 0.02073359489440918, 0.021831512451171875, 0.02292943000793457, 0.024027347564697266, 0.02512526512145996, 0.026223182678222656, 0.02732110023498535, 0.028419017791748047, 0.029516935348510742, 0.030614852905273438, 0.03171277046203613, 0.03281068801879883, 0.03390860557556152, 0.03500652313232422, 0.036104440689086914, 0.03720235824584961, 0.038300275802612305, 0.039398193359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 8.0, 6.0, 6.0, 15.0, 19.0, 27.0, 24.0, 38.0, 75.0, 92.0, 139.0, 234.0, 407.0, 709.0, 1270.0, 2351.0, 5015.0, 14332.0, 71928.0, 3916986.0, 145996.0, 21561.0, 6750.0, 2935.0, 1454.0, 737.0, 404.0, 242.0, 158.0, 101.0, 70.0, 45.0, 46.0, 21.0, 16.0, 17.0, 9.0, 2.0, 7.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0716552734375, -0.06964540481567383, -0.06763553619384766, -0.06562566757202148, -0.06361579895019531, -0.06160593032836914, -0.05959606170654297, -0.0575861930847168, -0.055576324462890625, -0.05356645584106445, -0.05155658721923828, -0.04954671859741211, -0.04753684997558594, -0.045526981353759766, -0.043517112731933594, -0.04150724411010742, -0.03949737548828125, -0.03748750686645508, -0.035477638244628906, -0.033467769622802734, -0.03145790100097656, -0.02944803237915039, -0.02743816375732422, -0.025428295135498047, -0.023418426513671875, -0.021408557891845703, -0.01939868927001953, -0.01738882064819336, -0.015378952026367188, -0.013369083404541016, -0.011359214782714844, -0.009349346160888672, -0.0073394775390625, -0.005329608917236328, -0.0033197402954101562, -0.0013098716735839844, 0.0006999969482421875, 0.0027098655700683594, 0.004719734191894531, 0.006729602813720703, 0.008739471435546875, 0.010749340057373047, 0.012759208679199219, 0.01476907730102539, 0.016778945922851562, 0.018788814544677734, 0.020798683166503906, 0.022808551788330078, 0.02481842041015625, 0.026828289031982422, 0.028838157653808594, 0.030848026275634766, 0.03285789489746094, 0.03486776351928711, 0.03687763214111328, 0.03888750076293945, 0.040897369384765625, 0.0429072380065918, 0.04491710662841797, 0.04692697525024414, 0.04893684387207031, 0.050946712493896484, 0.052956581115722656, 0.05496644973754883, 0.056976318359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 8.0, 8.0, 12.0, 17.0, 47.0, 78.0, 196.0, 3248.0, 191.0, 79.0, 62.0, 37.0, 20.0, 12.0, 15.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0109710693359375, -0.010483026504516602, -0.009994983673095703, -0.009506940841674805, -0.009018898010253906, -0.008530855178833008, -0.00804281234741211, -0.007554769515991211, -0.0070667266845703125, -0.006578683853149414, -0.006090641021728516, -0.005602598190307617, -0.005114555358886719, -0.00462651252746582, -0.004138469696044922, -0.0036504268646240234, -0.003162384033203125, -0.0026743412017822266, -0.002186298370361328, -0.0016982555389404297, -0.0012102127075195312, -0.0007221698760986328, -0.00023412704467773438, 0.00025391578674316406, 0.0007419586181640625, 0.001230001449584961, 0.0017180442810058594, 0.002206087112426758, 0.0026941299438476562, 0.0031821727752685547, 0.003670215606689453, 0.0041582584381103516, 0.00464630126953125, 0.0051343441009521484, 0.005622386932373047, 0.006110429763793945, 0.006598472595214844, 0.007086515426635742, 0.007574558258056641, 0.008062601089477539, 0.008550643920898438, 0.009038686752319336, 0.009526729583740234, 0.010014772415161133, 0.010502815246582031, 0.01099085807800293, 0.011478900909423828, 0.011966943740844727, 0.012454986572265625, 0.012943029403686523, 0.013431072235107422, 0.01391911506652832, 0.014407157897949219, 0.014895200729370117, 0.015383243560791016, 0.015871286392211914, 0.016359329223632812, 0.01684737205505371, 0.01733541488647461, 0.017823457717895508, 0.018311500549316406, 0.018799543380737305, 0.019287586212158203, 0.0197756290435791, 0.020263671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 16.0, 135.0, 477.0, 302.0, 69.0, 12.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.058001577854156494, -0.04751954972743988, -0.03703752160072327, -0.026555489748716354, -0.01607346162199974, -0.005591433495283127, 0.004890598356723785, 0.0153726264834404, 0.025854654610157013, 0.03633668273687363, 0.04681871086359024, 0.05730074271559715, 0.06778277456760406, 0.07826480269432068, 0.08874683082103729, 0.0992288589477539, 0.10971088707447052, 0.12019291520118713, 0.13067494332790375, 0.14115697145462036, 0.15163899958133698, 0.1621210277080536, 0.1726030707359314, 0.18308508396148682, 0.19356712698936462, 0.20404915511608124, 0.21453118324279785, 0.22501321136951447, 0.23549523949623108, 0.2459772676229477, 0.2564592957496643, 0.2669413387775421, 0.27742335200309753, 0.28790539503097534, 0.29838740825653076, 0.30886945128440857, 0.319351464509964, 0.3298335075378418, 0.3403155207633972, 0.350797563791275, 0.36127957701683044, 0.37176162004470825, 0.38224363327026367, 0.3927256762981415, 0.4032076895236969, 0.4136897325515747, 0.4241717457771301, 0.43465378880500793, 0.44513583183288574, 0.45561787486076355, 0.46609988808631897, 0.4765819311141968, 0.4870639443397522, 0.49754598736763, 0.5080280303955078, 0.5185100436210632, 0.5289920568466187, 0.5394740700721741, 0.5499561429023743, 0.5604381561279297, 0.5709201693534851, 0.5814021825790405, 0.5918842554092407, 0.6023662686347961, 0.6128482818603516]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 10.0, 8.0, 17.0, 12.0, 19.0, 26.0, 35.0, 22.0, 43.0, 46.0, 52.0, 31.0, 58.0, 65.0, 48.0, 56.0, 57.0, 53.0, 49.0, 47.0, 55.0, 44.0, 31.0, 34.0, 23.0, 17.0, 17.0, 14.0, 8.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05031031370162964, -0.04824412241578102, -0.046177931129932404, -0.044111739844083786, -0.04204554855823517, -0.03997935727238655, -0.03791316598653793, -0.035846974700689316, -0.0337807834148407, -0.03171459212899208, -0.029648400843143463, -0.027582209557294846, -0.025516018271446228, -0.02344982698559761, -0.021383635699748993, -0.019317444413900375, -0.017251253128051758, -0.01518506184220314, -0.013118870556354523, -0.011052679270505905, -0.008986487984657288, -0.00692029669880867, -0.0048541054129600525, -0.002787914127111435, -0.0007217228412628174, 0.0013444684445858002, 0.0034106597304344177, 0.005476851016283035, 0.007543042302131653, 0.00960923358798027, 0.011675424873828888, 0.013741616159677505, 0.015807807445526123, 0.01787399873137474, 0.019940190017223358, 0.022006381303071976, 0.024072572588920593, 0.02613876387476921, 0.02820495516061783, 0.030271146446466446, 0.032337337732315063, 0.03440352901816368, 0.0364697203040123, 0.038535911589860916, 0.040602102875709534, 0.04266829416155815, 0.04473448544740677, 0.046800676733255386, 0.048866868019104004, 0.05093305930495262, 0.05299925059080124, 0.05506544187664986, 0.057131633162498474, 0.05919782444834709, 0.06126401573419571, 0.06333020329475403, 0.06539639830589294, 0.06746259331703186, 0.06952878087759018, 0.0715949684381485, 0.07366116344928741, 0.07572735846042633, 0.07779354602098465, 0.07985973358154297, 0.08192592859268188]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 15.0, 15.0, 13.0, 21.0, 47.0, 58.0, 93.0, 115.0, 188.0, 264.0, 407.0, 727.0, 1207.0, 2182.0, 4034.0, 7863.0, 16499.0, 36043.0, 82755.0, 189743.0, 304487.0, 220147.0, 99153.0, 43085.0, 19532.0, 9310.0, 4615.0, 2429.0, 1356.0, 763.0, 464.0, 300.0, 186.0, 142.0, 92.0, 61.0, 42.0, 23.0, 26.0, 10.0, 11.0, 7.0, 5.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043487548828125, -0.04196739196777344, -0.040447235107421875, -0.03892707824707031, -0.03740692138671875, -0.03588676452636719, -0.034366607666015625, -0.03284645080566406, -0.0313262939453125, -0.029806137084960938, -0.028285980224609375, -0.026765823364257812, -0.02524566650390625, -0.023725509643554688, -0.022205352783203125, -0.020685195922851562, -0.0191650390625, -0.017644882202148438, -0.016124725341796875, -0.014604568481445312, -0.01308441162109375, -0.011564254760742188, -0.010044097900390625, -0.008523941040039062, -0.0070037841796875, -0.0054836273193359375, -0.003963470458984375, -0.0024433135986328125, -0.00092315673828125, 0.0005970001220703125, 0.002117156982421875, 0.0036373138427734375, 0.005157470703125, 0.0066776275634765625, 0.008197784423828125, 0.009717941284179688, 0.01123809814453125, 0.012758255004882812, 0.014278411865234375, 0.015798568725585938, 0.0173187255859375, 0.018838882446289062, 0.020359039306640625, 0.021879196166992188, 0.02339935302734375, 0.024919509887695312, 0.026439666748046875, 0.027959823608398438, 0.02947998046875, 0.031000137329101562, 0.032520294189453125, 0.03404045104980469, 0.03556060791015625, 0.03708076477050781, 0.038600921630859375, 0.04012107849121094, 0.0416412353515625, 0.04316139221191406, 0.044681549072265625, 0.04620170593261719, 0.04772186279296875, 0.04924201965332031, 0.050762176513671875, 0.05228233337402344, 0.053802490234375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 1.0, 6.0, 3.0, 11.0, 8.0, 15.0, 15.0, 20.0, 21.0, 18.0, 30.0, 36.0, 50.0, 42.0, 57.0, 50.0, 43.0, 56.0, 44.0, 49.0, 45.0, 41.0, 49.0, 43.0, 47.0, 42.0, 37.0, 19.0, 14.0, 15.0, 8.0, 12.0, 12.0, 10.0, 7.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0299224853515625, -0.0288388729095459, -0.027755260467529297, -0.026671648025512695, -0.025588035583496094, -0.024504423141479492, -0.02342081069946289, -0.02233719825744629, -0.021253585815429688, -0.020169973373413086, -0.019086360931396484, -0.018002748489379883, -0.01691913604736328, -0.01583552360534668, -0.014751911163330078, -0.013668298721313477, -0.012584686279296875, -0.011501073837280273, -0.010417461395263672, -0.00933384895324707, -0.008250236511230469, -0.007166624069213867, -0.006083011627197266, -0.004999399185180664, -0.0039157867431640625, -0.002832174301147461, -0.0017485618591308594, -0.0006649494171142578, 0.00041866302490234375, 0.0015022754669189453, 0.002585887908935547, 0.0036695003509521484, 0.00475311279296875, 0.0058367252349853516, 0.006920337677001953, 0.008003950119018555, 0.009087562561035156, 0.010171175003051758, 0.01125478744506836, 0.012338399887084961, 0.013422012329101562, 0.014505624771118164, 0.015589237213134766, 0.016672849655151367, 0.01775646209716797, 0.01884007453918457, 0.019923686981201172, 0.021007299423217773, 0.022090911865234375, 0.023174524307250977, 0.024258136749267578, 0.02534174919128418, 0.02642536163330078, 0.027508974075317383, 0.028592586517333984, 0.029676198959350586, 0.030759811401367188, 0.03184342384338379, 0.03292703628540039, 0.03401064872741699, 0.035094261169433594, 0.036177873611450195, 0.0372614860534668, 0.0383450984954834, 0.0394287109375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 11.0, 11.0, 15.0, 17.0, 28.0, 32.0, 47.0, 54.0, 77.0, 95.0, 184.0, 280.0, 507.0, 963.0, 2464.0, 7229.0, 29836.0, 169969.0, 626470.0, 168213.0, 29597.0, 7513.0, 2563.0, 1012.0, 530.0, 263.0, 157.0, 100.0, 84.0, 51.0, 38.0, 29.0, 21.0, 17.0, 18.0, 4.0, 10.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1007080078125, -0.09778881072998047, -0.09486961364746094, -0.0919504165649414, -0.08903121948242188, -0.08611202239990234, -0.08319282531738281, -0.08027362823486328, -0.07735443115234375, -0.07443523406982422, -0.07151603698730469, -0.06859683990478516, -0.06567764282226562, -0.0627584457397461, -0.05983924865722656, -0.05692005157470703, -0.0540008544921875, -0.05108165740966797, -0.04816246032714844, -0.045243263244628906, -0.042324066162109375, -0.039404869079589844, -0.03648567199707031, -0.03356647491455078, -0.03064727783203125, -0.02772808074951172, -0.024808883666992188, -0.021889686584472656, -0.018970489501953125, -0.016051292419433594, -0.013132095336914062, -0.010212898254394531, -0.007293701171875, -0.004374504089355469, -0.0014553070068359375, 0.0014638900756835938, 0.004383087158203125, 0.007302284240722656, 0.010221481323242188, 0.013140678405761719, 0.01605987548828125, 0.01897907257080078, 0.021898269653320312, 0.024817466735839844, 0.027736663818359375, 0.030655860900878906, 0.03357505798339844, 0.03649425506591797, 0.0394134521484375, 0.04233264923095703, 0.04525184631347656, 0.048171043395996094, 0.051090240478515625, 0.054009437561035156, 0.05692863464355469, 0.05984783172607422, 0.06276702880859375, 0.06568622589111328, 0.06860542297363281, 0.07152462005615234, 0.07444381713867188, 0.0773630142211914, 0.08028221130371094, 0.08320140838623047, 0.08612060546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 6.0, 8.0, 8.0, 9.0, 16.0, 13.0, 13.0, 19.0, 17.0, 26.0, 20.0, 28.0, 34.0, 30.0, 45.0, 48.0, 44.0, 36.0, 43.0, 37.0, 42.0, 37.0, 38.0, 38.0, 39.0, 37.0, 36.0, 27.0, 27.0, 32.0, 18.0, 15.0, 15.0, 15.0, 15.0, 18.0, 5.0, 3.0, 4.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1219482421875, -0.1182708740234375, -0.114593505859375, -0.1109161376953125, -0.10723876953125, -0.1035614013671875, -0.099884033203125, -0.0962066650390625, -0.092529296875, -0.0888519287109375, -0.085174560546875, -0.0814971923828125, -0.07781982421875, -0.0741424560546875, -0.070465087890625, -0.0667877197265625, -0.0631103515625, -0.0594329833984375, -0.055755615234375, -0.0520782470703125, -0.04840087890625, -0.0447235107421875, -0.041046142578125, -0.0373687744140625, -0.03369140625, -0.0300140380859375, -0.026336669921875, -0.0226593017578125, -0.01898193359375, -0.0153045654296875, -0.011627197265625, -0.0079498291015625, -0.0042724609375, -0.0005950927734375, 0.003082275390625, 0.0067596435546875, 0.01043701171875, 0.0141143798828125, 0.017791748046875, 0.0214691162109375, 0.025146484375, 0.0288238525390625, 0.032501220703125, 0.0361785888671875, 0.03985595703125, 0.0435333251953125, 0.047210693359375, 0.0508880615234375, 0.0545654296875, 0.0582427978515625, 0.061920166015625, 0.0655975341796875, 0.06927490234375, 0.0729522705078125, 0.076629638671875, 0.0803070068359375, 0.083984375, 0.0876617431640625, 0.091339111328125, 0.0950164794921875, 0.09869384765625, 0.1023712158203125, 0.106048583984375, 0.1097259521484375, 0.1134033203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 13.0, 8.0, 21.0, 33.0, 62.0, 167.0, 458.0, 1670.0, 12782.0, 313425.0, 688995.0, 27225.0, 2657.0, 638.0, 218.0, 78.0, 51.0, 20.0, 14.0, 12.0, 8.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.063720703125, -0.061957359313964844, -0.06019401550292969, -0.05843067169189453, -0.056667327880859375, -0.05490398406982422, -0.05314064025878906, -0.051377296447753906, -0.04961395263671875, -0.047850608825683594, -0.04608726501464844, -0.04432392120361328, -0.042560577392578125, -0.04079723358154297, -0.03903388977050781, -0.037270545959472656, -0.0355072021484375, -0.033743858337402344, -0.03198051452636719, -0.03021717071533203, -0.028453826904296875, -0.02669048309326172, -0.024927139282226562, -0.023163795471191406, -0.02140045166015625, -0.019637107849121094, -0.017873764038085938, -0.01611042022705078, -0.014347076416015625, -0.012583732604980469, -0.010820388793945312, -0.009057044982910156, -0.007293701171875, -0.005530357360839844, -0.0037670135498046875, -0.0020036697387695312, -0.000240325927734375, 0.0015230178833007812, 0.0032863616943359375, 0.005049705505371094, 0.00681304931640625, 0.008576393127441406, 0.010339736938476562, 0.012103080749511719, 0.013866424560546875, 0.01562976837158203, 0.017393112182617188, 0.019156455993652344, 0.0209197998046875, 0.022683143615722656, 0.024446487426757812, 0.02620983123779297, 0.027973175048828125, 0.02973651885986328, 0.03149986267089844, 0.033263206481933594, 0.03502655029296875, 0.036789894104003906, 0.03855323791503906, 0.04031658172607422, 0.042079925537109375, 0.04384326934814453, 0.04560661315917969, 0.047369956970214844, 0.04913330078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 9.0, 5.0, 17.0, 16.0, 18.0, 26.0, 49.0, 56.0, 70.0, 82.0, 82.0, 103.0, 88.0, 75.0, 75.0, 60.0, 51.0, 39.0, 26.0, 23.0, 11.0, 3.0, 5.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4373016357421875e-06, -6.141141057014465e-06, -5.844980478286743e-06, -5.548819899559021e-06, -5.252659320831299e-06, -4.956498742103577e-06, -4.6603381633758545e-06, -4.364177584648132e-06, -4.06801700592041e-06, -3.771856427192688e-06, -3.475695848464966e-06, -3.1795352697372437e-06, -2.8833746910095215e-06, -2.5872141122817993e-06, -2.291053533554077e-06, -1.994892954826355e-06, -1.6987323760986328e-06, -1.4025717973709106e-06, -1.1064112186431885e-06, -8.102506399154663e-07, -5.140900611877441e-07, -2.1792948246002197e-07, 7.82310962677002e-08, 3.7439167499542236e-07, 6.705522537231445e-07, 9.667128324508667e-07, 1.2628734111785889e-06, 1.559033989906311e-06, 1.8551945686340332e-06, 2.1513551473617554e-06, 2.4475157260894775e-06, 2.7436763048171997e-06, 3.039836883544922e-06, 3.335997462272644e-06, 3.632158041000366e-06, 3.928318619728088e-06, 4.2244791984558105e-06, 4.520639777183533e-06, 4.816800355911255e-06, 5.112960934638977e-06, 5.409121513366699e-06, 5.705282092094421e-06, 6.0014426708221436e-06, 6.297603249549866e-06, 6.593763828277588e-06, 6.88992440700531e-06, 7.186084985733032e-06, 7.482245564460754e-06, 7.778406143188477e-06, 8.074566721916199e-06, 8.370727300643921e-06, 8.666887879371643e-06, 8.963048458099365e-06, 9.259209036827087e-06, 9.55536961555481e-06, 9.851530194282532e-06, 1.0147690773010254e-05, 1.0443851351737976e-05, 1.0740011930465698e-05, 1.103617250919342e-05, 1.1332333087921143e-05, 1.1628493666648865e-05, 1.1924654245376587e-05, 1.2220814824104309e-05, 1.2516975402832031e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 12.0, 20.0, 26.0, 44.0, 55.0, 103.0, 163.0, 285.0, 595.0, 1441.0, 5024.0, 33905.0, 396260.0, 551287.0, 49414.0, 6763.0, 1714.0, 628.0, 337.0, 167.0, 104.0, 67.0, 46.0, 21.0, 15.0, 11.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0313720703125, -0.030069351196289062, -0.028766632080078125, -0.027463912963867188, -0.02616119384765625, -0.024858474731445312, -0.023555755615234375, -0.022253036499023438, -0.0209503173828125, -0.019647598266601562, -0.018344879150390625, -0.017042160034179688, -0.01573944091796875, -0.014436721801757812, -0.013134002685546875, -0.011831283569335938, -0.010528564453125, -0.009225845336914062, -0.007923126220703125, -0.0066204071044921875, -0.00531768798828125, -0.0040149688720703125, -0.002712249755859375, -0.0014095306396484375, -0.0001068115234375, 0.0011959075927734375, 0.002498626708984375, 0.0038013458251953125, 0.00510406494140625, 0.0064067840576171875, 0.007709503173828125, 0.009012222290039062, 0.01031494140625, 0.011617660522460938, 0.012920379638671875, 0.014223098754882812, 0.01552581787109375, 0.016828536987304688, 0.018131256103515625, 0.019433975219726562, 0.0207366943359375, 0.022039413452148438, 0.023342132568359375, 0.024644851684570312, 0.02594757080078125, 0.027250289916992188, 0.028553009033203125, 0.029855728149414062, 0.031158447265625, 0.03246116638183594, 0.033763885498046875, 0.03506660461425781, 0.03636932373046875, 0.03767204284667969, 0.038974761962890625, 0.04027748107910156, 0.0415802001953125, 0.04288291931152344, 0.044185638427734375, 0.04548835754394531, 0.04679107666015625, 0.04809379577636719, 0.049396514892578125, 0.05069923400878906, 0.052001953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 8.0, 13.0, 24.0, 36.0, 62.0, 78.0, 114.0, 121.0, 136.0, 120.0, 105.0, 69.0, 37.0, 26.0, 23.0, 14.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039276123046875, -0.037427425384521484, -0.03557872772216797, -0.03373003005981445, -0.03188133239746094, -0.030032634735107422, -0.028183937072753906, -0.02633523941040039, -0.024486541748046875, -0.02263784408569336, -0.020789146423339844, -0.018940448760986328, -0.017091751098632812, -0.015243053436279297, -0.013394355773925781, -0.011545658111572266, -0.00969696044921875, -0.007848262786865234, -0.005999565124511719, -0.004150867462158203, -0.0023021697998046875, -0.0004534721374511719, 0.0013952255249023438, 0.0032439231872558594, 0.005092620849609375, 0.006941318511962891, 0.008790016174316406, 0.010638713836669922, 0.012487411499023438, 0.014336109161376953, 0.01618480682373047, 0.018033504486083984, 0.0198822021484375, 0.021730899810791016, 0.02357959747314453, 0.025428295135498047, 0.027276992797851562, 0.029125690460205078, 0.030974388122558594, 0.03282308578491211, 0.034671783447265625, 0.03652048110961914, 0.038369178771972656, 0.04021787643432617, 0.04206657409667969, 0.0439152717590332, 0.04576396942138672, 0.047612667083740234, 0.04946136474609375, 0.051310062408447266, 0.05315876007080078, 0.0550074577331543, 0.05685615539550781, 0.05870485305786133, 0.060553550720214844, 0.06240224838256836, 0.06425094604492188, 0.06609964370727539, 0.0679483413696289, 0.06979703903198242, 0.07164573669433594, 0.07349443435668945, 0.07534313201904297, 0.07719182968139648, 0.07904052734375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 15.0, 34.0, 41.0, 77.0, 120.0, 115.0, 155.0, 150.0, 110.0, 63.0, 48.0, 25.0, 19.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5223500728607178, -0.49903082847595215, -0.4757115840911865, -0.4523923397064209, -0.4290730953216553, -0.40575385093688965, -0.38243457674980164, -0.359115332365036, -0.3357960879802704, -0.31247684359550476, -0.28915759921073914, -0.2658383250236511, -0.2425190955400467, -0.21919985115528107, -0.19588059186935425, -0.17256134748458862, -0.149242103099823, -0.12592285871505737, -0.10260360687971115, -0.07928435504436493, -0.055965110659599304, -0.03264586627483368, -0.00932660698890686, 0.013992637395858765, 0.03731188178062439, 0.06063112989068031, 0.08395037800073624, 0.10726962983608246, 0.13058887422084808, 0.1539081186056137, 0.17722737789154053, 0.20054662227630615, 0.22386586666107178, 0.2471851110458374, 0.270504355430603, 0.29382359981536865, 0.3171428442001343, 0.3404620885848999, 0.3637813627719879, 0.38710060715675354, 0.41041985154151917, 0.4337390959262848, 0.4570583403110504, 0.4803776144981384, 0.503696858882904, 0.5270161032676697, 0.5503353476524353, 0.5736545920372009, 0.5969738364219666, 0.6202930808067322, 0.6436123251914978, 0.6669315695762634, 0.690250813961029, 0.7135700583457947, 0.7368893623352051, 0.7602086067199707, 0.7835278511047363, 0.806847095489502, 0.8301663398742676, 0.8534855842590332, 0.8768048286437988, 0.9001240730285645, 0.9234433174133301, 0.9467625617980957, 0.9700818061828613]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 6.0, 14.0, 13.0, 9.0, 16.0, 25.0, 19.0, 20.0, 42.0, 44.0, 38.0, 40.0, 54.0, 58.0, 50.0, 63.0, 69.0, 61.0, 56.0, 47.0, 44.0, 36.0, 32.0, 26.0, 25.0, 17.0, 11.0, 17.0, 11.0, 5.0, 9.0, 4.0, 5.0, 4.0, 0.0, 1.0, 3.0, 2.0], "bins": [-1.0178167819976807, -0.9932148456573486, -0.9686128497123718, -0.9440109133720398, -0.9194089770317078, -0.894806981086731, -0.8702050447463989, -0.8456031084060669, -0.8210011720657349, -0.7963992357254028, -0.771797239780426, -0.747195303440094, -0.722593367099762, -0.6979913711547852, -0.6733894348144531, -0.6487874984741211, -0.6241855025291443, -0.5995835661888123, -0.5749815702438354, -0.5503796339035034, -0.5257776975631714, -0.5011757612228394, -0.47657376527786255, -0.4519718289375305, -0.4273698627948761, -0.4027678966522217, -0.37816596031188965, -0.35356399416923523, -0.3289620280265808, -0.3043600916862488, -0.27975812554359436, -0.25515615940093994, -0.2305542230606079, -0.20595227181911469, -0.18135032057762146, -0.15674835443496704, -0.13214640319347382, -0.10754445195198059, -0.08294248580932617, -0.05834053456783295, -0.03373858332633972, -0.009136628359556198, 0.015465326607227325, 0.04006728529930115, 0.06466923654079437, 0.0892711877822876, 0.11387315392494202, 0.13847510516643524, 0.16307705640792847, 0.1876790076494217, 0.21228095889091492, 0.23688292503356934, 0.26148486137390137, 0.2860868275165558, 0.3106887936592102, 0.33529072999954224, 0.35989269614219666, 0.3844946622848511, 0.4090965986251831, 0.4336985647678375, 0.45830053091049194, 0.482902467250824, 0.5075044631958008, 0.5321063995361328, 0.5567083358764648]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 12.0, 16.0, 13.0, 26.0, 36.0, 32.0, 46.0, 78.0, 186.0, 941.0, 20978.0, 4167256.0, 3905.0, 381.0, 118.0, 76.0, 52.0, 36.0, 34.0, 16.0, 12.0, 12.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.380615234375, -0.3713951110839844, -0.36217498779296875, -0.3529548645019531, -0.3437347412109375, -0.3345146179199219, -0.32529449462890625, -0.3160743713378906, -0.306854248046875, -0.2976341247558594, -0.28841400146484375, -0.2791938781738281, -0.2699737548828125, -0.2607536315917969, -0.25153350830078125, -0.24231338500976562, -0.23309326171875, -0.22387313842773438, -0.21465301513671875, -0.20543289184570312, -0.1962127685546875, -0.18699264526367188, -0.17777252197265625, -0.16855239868164062, -0.159332275390625, -0.15011215209960938, -0.14089202880859375, -0.13167190551757812, -0.1224517822265625, -0.11323165893554688, -0.10401153564453125, -0.09479141235351562, -0.0855712890625, -0.07635116577148438, -0.06713104248046875, -0.057910919189453125, -0.0486907958984375, -0.039470672607421875, -0.03025054931640625, -0.021030426025390625, -0.011810302734375, -0.002590179443359375, 0.00662994384765625, 0.015850067138671875, 0.0250701904296875, 0.034290313720703125, 0.04351043701171875, 0.052730560302734375, 0.06195068359375, 0.07117080688476562, 0.08039093017578125, 0.08961105346679688, 0.0988311767578125, 0.10805130004882812, 0.11727142333984375, 0.12649154663085938, 0.135711669921875, 0.14493179321289062, 0.15415191650390625, 0.16337203979492188, 0.1725921630859375, 0.18181228637695312, 0.19103240966796875, 0.20025253295898438, 0.20947265625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 5.0, 12.0, 13.0, 11.0, 24.0, 19.0, 11.0, 23.0, 29.0, 30.0, 46.0, 36.0, 52.0, 51.0, 57.0, 39.0, 52.0, 65.0, 48.0, 42.0, 44.0, 40.0, 39.0, 33.0, 26.0, 30.0, 17.0, 25.0, 10.0, 8.0, 10.0, 6.0, 9.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0310211181640625, -0.029928922653198242, -0.028836727142333984, -0.027744531631469727, -0.02665233612060547, -0.02556014060974121, -0.024467945098876953, -0.023375749588012695, -0.022283554077148438, -0.02119135856628418, -0.020099163055419922, -0.019006967544555664, -0.017914772033691406, -0.01682257652282715, -0.01573038101196289, -0.014638185501098633, -0.013545989990234375, -0.012453794479370117, -0.01136159896850586, -0.010269403457641602, -0.009177207946777344, -0.008085012435913086, -0.006992816925048828, -0.00590062141418457, -0.0048084259033203125, -0.0037162303924560547, -0.002624034881591797, -0.001531839370727539, -0.00043964385986328125, 0.0006525516510009766, 0.0017447471618652344, 0.002836942672729492, 0.00392913818359375, 0.005021333694458008, 0.006113529205322266, 0.0072057247161865234, 0.008297920227050781, 0.009390115737915039, 0.010482311248779297, 0.011574506759643555, 0.012666702270507812, 0.01375889778137207, 0.014851093292236328, 0.015943288803100586, 0.017035484313964844, 0.0181276798248291, 0.01921987533569336, 0.020312070846557617, 0.021404266357421875, 0.022496461868286133, 0.02358865737915039, 0.02468085289001465, 0.025773048400878906, 0.026865243911743164, 0.027957439422607422, 0.02904963493347168, 0.030141830444335938, 0.031234025955200195, 0.03232622146606445, 0.03341841697692871, 0.03451061248779297, 0.03560280799865723, 0.036695003509521484, 0.03778719902038574, 0.03887939453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 2.0, 5.0, 10.0, 13.0, 12.0, 11.0, 25.0, 31.0, 33.0, 39.0, 52.0, 69.0, 72.0, 114.0, 182.0, 242.0, 473.0, 1196.0, 5928.0, 195088.0, 3980673.0, 7202.0, 1354.0, 531.0, 242.0, 158.0, 114.0, 73.0, 75.0, 47.0, 44.0, 34.0, 30.0, 23.0, 17.0, 15.0, 12.0, 6.0, 9.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1593017578125, -0.15433120727539062, -0.14936065673828125, -0.14439010620117188, -0.1394195556640625, -0.13444900512695312, -0.12947845458984375, -0.12450790405273438, -0.119537353515625, -0.11456680297851562, -0.10959625244140625, -0.10462570190429688, -0.0996551513671875, -0.09468460083007812, -0.08971405029296875, -0.08474349975585938, -0.07977294921875, -0.07480239868164062, -0.06983184814453125, -0.06486129760742188, -0.0598907470703125, -0.054920196533203125, -0.04994964599609375, -0.044979095458984375, -0.040008544921875, -0.035037994384765625, -0.03006744384765625, -0.025096893310546875, -0.0201263427734375, -0.015155792236328125, -0.01018524169921875, -0.005214691162109375, -0.000244140625, 0.004726409912109375, 0.00969696044921875, 0.014667510986328125, 0.0196380615234375, 0.024608612060546875, 0.02957916259765625, 0.034549713134765625, 0.039520263671875, 0.044490814208984375, 0.04946136474609375, 0.054431915283203125, 0.0594024658203125, 0.06437301635742188, 0.06934356689453125, 0.07431411743164062, 0.07928466796875, 0.08425521850585938, 0.08922576904296875, 0.09419631958007812, 0.0991668701171875, 0.10413742065429688, 0.10910797119140625, 0.11407852172851562, 0.119049072265625, 0.12401962280273438, 0.12899017333984375, 0.13396072387695312, 0.1389312744140625, 0.14390182495117188, 0.14887237548828125, 0.15384292602539062, 0.1588134765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 10.0, 27.0, 119.0, 3814.0, 83.0, 20.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04498291015625, -0.04333829879760742, -0.041693687438964844, -0.040049076080322266, -0.03840446472167969, -0.03675985336303711, -0.03511524200439453, -0.03347063064575195, -0.031826019287109375, -0.030181407928466797, -0.02853679656982422, -0.02689218521118164, -0.025247573852539062, -0.023602962493896484, -0.021958351135253906, -0.020313739776611328, -0.01866912841796875, -0.017024517059326172, -0.015379905700683594, -0.013735294342041016, -0.012090682983398438, -0.01044607162475586, -0.008801460266113281, -0.007156848907470703, -0.005512237548828125, -0.003867626190185547, -0.0022230148315429688, -0.0005784034729003906, 0.0010662078857421875, 0.0027108192443847656, 0.004355430603027344, 0.006000041961669922, 0.0076446533203125, 0.009289264678955078, 0.010933876037597656, 0.012578487396240234, 0.014223098754882812, 0.01586771011352539, 0.01751232147216797, 0.019156932830810547, 0.020801544189453125, 0.022446155548095703, 0.02409076690673828, 0.02573537826538086, 0.027379989624023438, 0.029024600982666016, 0.030669212341308594, 0.03231382369995117, 0.03395843505859375, 0.03560304641723633, 0.037247657775878906, 0.038892269134521484, 0.04053688049316406, 0.04218149185180664, 0.04382610321044922, 0.0454707145690918, 0.047115325927734375, 0.04875993728637695, 0.05040454864501953, 0.05204916000366211, 0.05369377136230469, 0.055338382720947266, 0.056982994079589844, 0.05862760543823242, 0.060272216796875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 15.0, 17.0, 147.0, 331.0, 319.0, 120.0, 40.0, 13.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24801190197467804, -0.24067266285419464, -0.23333340883255005, -0.22599416971206665, -0.21865493059158325, -0.21131569147109985, -0.20397645235061646, -0.19663719832897186, -0.18929795920848846, -0.18195872008800507, -0.17461946606636047, -0.16728022694587708, -0.15994098782539368, -0.15260174870491028, -0.14526250958442688, -0.1379232555627823, -0.1305840164422989, -0.12324477732181549, -0.1159055307507515, -0.1085662841796875, -0.1012270450592041, -0.0938878059387207, -0.08654855936765671, -0.07920931279659271, -0.07187007367610931, -0.06453083455562592, -0.05719158798456192, -0.04985234513878822, -0.042513102293014526, -0.03517385944724083, -0.027834616601467133, -0.020495373755693436, -0.013156116008758545, -0.005816873162984848, 0.0015223696827888489, 0.008861612528562546, 0.016200855374336243, 0.02354009822010994, 0.030879341065883636, 0.03821858391165733, 0.04555782675743103, 0.05289706960320473, 0.060236312448978424, 0.06757555902004242, 0.07491479814052582, 0.08225403726100922, 0.08959328383207321, 0.09693253040313721, 0.1042717695236206, 0.111611008644104, 0.118950255215168, 0.126289501786232, 0.1336287409067154, 0.1409679800271988, 0.14830723404884338, 0.15564647316932678, 0.16298571228981018, 0.17032495141029358, 0.17766419053077698, 0.18500344455242157, 0.19234268367290497, 0.19968192279338837, 0.20702117681503296, 0.21436041593551636, 0.22169965505599976]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 9.0, 10.0, 8.0, 7.0, 11.0, 13.0, 22.0, 18.0, 18.0, 22.0, 26.0, 31.0, 38.0, 29.0, 32.0, 34.0, 37.0, 39.0, 45.0, 41.0, 49.0, 35.0, 34.0, 47.0, 38.0, 32.0, 35.0, 31.0, 29.0, 28.0, 22.0, 22.0, 14.0, 17.0, 11.0, 8.0, 4.0, 11.0, 5.0, 3.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.04955697059631348, -0.048129647970199585, -0.04670232534408569, -0.0452749989926815, -0.04384767636656761, -0.04242035374045372, -0.04099302738904953, -0.03956570476293564, -0.03813838213682175, -0.036711059510707855, -0.035283736884593964, -0.033856410533189774, -0.03242908790707588, -0.03100176528096199, -0.02957444079220295, -0.02814711630344391, -0.026719793677330017, -0.025292471051216125, -0.023865146562457085, -0.022437822073698044, -0.021010499447584152, -0.01958317682147026, -0.01815585233271122, -0.01672852784395218, -0.015301205217838287, -0.013873881660401821, -0.012446558102965355, -0.011019234545528889, -0.009591910988092422, -0.008164587430655956, -0.00673726387321949, -0.005309940315783024, -0.0038826167583465576, -0.0024552932009100914, -0.0010279696434736252, 0.00039935391396284103, 0.0018266774713993073, 0.0032540010288357735, 0.00468132458627224, 0.006108648143708706, 0.007535971701145172, 0.008963295258581638, 0.010390618816018105, 0.01181794237345457, 0.013245265930891037, 0.014672589488327503, 0.01609991304576397, 0.01752723753452301, 0.018954560160636902, 0.020381882786750793, 0.021809207275509834, 0.023236531764268875, 0.024663854390382767, 0.02609117701649666, 0.0275185015052557, 0.02894582599401474, 0.03037314862012863, 0.03180047124624252, 0.033227793872356415, 0.034655120223760605, 0.036082442849874496, 0.03750976547598839, 0.03893709182739258, 0.04036441445350647, 0.04179173707962036]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 6.0, 4.0, 13.0, 9.0, 13.0, 20.0, 29.0, 38.0, 63.0, 71.0, 92.0, 145.0, 229.0, 319.0, 451.0, 653.0, 1054.0, 1779.0, 3562.0, 10215.0, 55447.0, 439722.0, 456103.0, 59113.0, 10754.0, 3623.0, 1802.0, 1006.0, 735.0, 453.0, 243.0, 217.0, 176.0, 113.0, 91.0, 58.0, 35.0, 26.0, 21.0, 14.0, 12.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0960693359375, -0.09263992309570312, -0.08921051025390625, -0.08578109741210938, -0.0823516845703125, -0.07892227172851562, -0.07549285888671875, -0.07206344604492188, -0.068634033203125, -0.06520462036132812, -0.06177520751953125, -0.058345794677734375, -0.0549163818359375, -0.051486968994140625, -0.04805755615234375, -0.044628143310546875, -0.04119873046875, -0.037769317626953125, -0.03433990478515625, -0.030910491943359375, -0.0274810791015625, -0.024051666259765625, -0.02062225341796875, -0.017192840576171875, -0.013763427734375, -0.010334014892578125, -0.00690460205078125, -0.003475189208984375, -4.57763671875e-05, 0.003383636474609375, 0.00681304931640625, 0.010242462158203125, 0.013671875, 0.017101287841796875, 0.02053070068359375, 0.023960113525390625, 0.0273895263671875, 0.030818939208984375, 0.03424835205078125, 0.037677764892578125, 0.041107177734375, 0.044536590576171875, 0.04796600341796875, 0.051395416259765625, 0.0548248291015625, 0.058254241943359375, 0.06168365478515625, 0.06511306762695312, 0.06854248046875, 0.07197189331054688, 0.07540130615234375, 0.07883071899414062, 0.0822601318359375, 0.08568954467773438, 0.08911895751953125, 0.09254837036132812, 0.095977783203125, 0.09940719604492188, 0.10283660888671875, 0.10626602172851562, 0.1096954345703125, 0.11312484741210938, 0.11655426025390625, 0.11998367309570312, 0.1234130859375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 3.0, 8.0, 16.0, 8.0, 15.0, 16.0, 16.0, 12.0, 26.0, 22.0, 26.0, 43.0, 34.0, 36.0, 51.0, 33.0, 45.0, 59.0, 50.0, 42.0, 50.0, 41.0, 43.0, 45.0, 39.0, 36.0, 21.0, 25.0, 23.0, 24.0, 14.0, 13.0, 6.0, 11.0, 9.0, 8.0, 8.0, 6.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.032623291015625, -0.03148174285888672, -0.030340194702148438, -0.029198646545410156, -0.028057098388671875, -0.026915550231933594, -0.025774002075195312, -0.02463245391845703, -0.02349090576171875, -0.02234935760498047, -0.021207809448242188, -0.020066261291503906, -0.018924713134765625, -0.017783164978027344, -0.016641616821289062, -0.015500068664550781, -0.0143585205078125, -0.013216972351074219, -0.012075424194335938, -0.010933876037597656, -0.009792327880859375, -0.008650779724121094, -0.0075092315673828125, -0.006367683410644531, -0.00522613525390625, -0.004084587097167969, -0.0029430389404296875, -0.0018014907836914062, -0.000659942626953125, 0.00048160552978515625, 0.0016231536865234375, 0.0027647018432617188, 0.00390625, 0.005047798156738281, 0.0061893463134765625, 0.007330894470214844, 0.008472442626953125, 0.009613990783691406, 0.010755538940429688, 0.011897087097167969, 0.01303863525390625, 0.014180183410644531, 0.015321731567382812, 0.016463279724121094, 0.017604827880859375, 0.018746376037597656, 0.019887924194335938, 0.02102947235107422, 0.0221710205078125, 0.02331256866455078, 0.024454116821289062, 0.025595664978027344, 0.026737213134765625, 0.027878761291503906, 0.029020309448242188, 0.03016185760498047, 0.03130340576171875, 0.03244495391845703, 0.03358650207519531, 0.034728050231933594, 0.035869598388671875, 0.037011146545410156, 0.03815269470214844, 0.03929424285888672, 0.040435791015625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 10.0, 8.0, 18.0, 36.0, 49.0, 79.0, 164.0, 317.0, 565.0, 1095.0, 2286.0, 7103.0, 149463.0, 862113.0, 18533.0, 3499.0, 1565.0, 749.0, 378.0, 227.0, 127.0, 64.0, 37.0, 20.0, 12.0, 9.0, 3.0, 4.0, 6.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2313232421875, -0.22414588928222656, -0.21696853637695312, -0.2097911834716797, -0.20261383056640625, -0.1954364776611328, -0.18825912475585938, -0.18108177185058594, -0.1739044189453125, -0.16672706604003906, -0.15954971313476562, -0.1523723602294922, -0.14519500732421875, -0.1380176544189453, -0.13084030151367188, -0.12366294860839844, -0.116485595703125, -0.10930824279785156, -0.10213088989257812, -0.09495353698730469, -0.08777618408203125, -0.08059883117675781, -0.07342147827148438, -0.06624412536621094, -0.0590667724609375, -0.05188941955566406, -0.044712066650390625, -0.03753471374511719, -0.03035736083984375, -0.023180007934570312, -0.016002655029296875, -0.008825302124023438, -0.00164794921875, 0.0055294036865234375, 0.012706756591796875, 0.019884109497070312, 0.02706146240234375, 0.03423881530761719, 0.041416168212890625, 0.04859352111816406, 0.0557708740234375, 0.06294822692871094, 0.07012557983398438, 0.07730293273925781, 0.08448028564453125, 0.09165763854980469, 0.09883499145507812, 0.10601234436035156, 0.113189697265625, 0.12036705017089844, 0.12754440307617188, 0.1347217559814453, 0.14189910888671875, 0.1490764617919922, 0.15625381469726562, 0.16343116760253906, 0.1706085205078125, 0.17778587341308594, 0.18496322631835938, 0.1921405792236328, 0.19931793212890625, 0.2064952850341797, 0.21367263793945312, 0.22084999084472656, 0.22802734375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 8.0, 6.0, 7.0, 14.0, 18.0, 23.0, 25.0, 27.0, 31.0, 33.0, 40.0, 64.0, 54.0, 59.0, 64.0, 59.0, 75.0, 64.0, 57.0, 53.0, 44.0, 47.0, 35.0, 24.0, 15.0, 15.0, 14.0, 9.0, 3.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.178466796875, -0.17183303833007812, -0.16519927978515625, -0.15856552124023438, -0.1519317626953125, -0.14529800415039062, -0.13866424560546875, -0.13203048706054688, -0.125396728515625, -0.11876296997070312, -0.11212921142578125, -0.10549545288085938, -0.0988616943359375, -0.09222793579101562, -0.08559417724609375, -0.07896041870117188, -0.07232666015625, -0.06569290161132812, -0.05905914306640625, -0.052425384521484375, -0.0457916259765625, -0.039157867431640625, -0.03252410888671875, -0.025890350341796875, -0.019256591796875, -0.012622833251953125, -0.00598907470703125, 0.000644683837890625, 0.0072784423828125, 0.013912200927734375, 0.02054595947265625, 0.027179718017578125, 0.0338134765625, 0.040447235107421875, 0.04708099365234375, 0.053714752197265625, 0.0603485107421875, 0.06698226928710938, 0.07361602783203125, 0.08024978637695312, 0.086883544921875, 0.09351730346679688, 0.10015106201171875, 0.10678482055664062, 0.1134185791015625, 0.12005233764648438, 0.12668609619140625, 0.13331985473632812, 0.13995361328125, 0.14658737182617188, 0.15322113037109375, 0.15985488891601562, 0.1664886474609375, 0.17312240600585938, 0.17975616455078125, 0.18638992309570312, 0.193023681640625, 0.19965744018554688, 0.20629119873046875, 0.21292495727539062, 0.2195587158203125, 0.22619247436523438, 0.23282623291015625, 0.23945999145507812, 0.24609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 9.0, 7.0, 15.0, 26.0, 52.0, 83.0, 170.0, 254.0, 560.0, 1406.0, 4212.0, 27737.0, 826129.0, 173322.0, 10359.0, 2470.0, 857.0, 447.0, 172.0, 99.0, 67.0, 38.0, 15.0, 11.0, 10.0, 5.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06231689453125, -0.060151100158691406, -0.05798530578613281, -0.05581951141357422, -0.053653717041015625, -0.05148792266845703, -0.04932212829589844, -0.047156333923339844, -0.04499053955078125, -0.042824745178222656, -0.04065895080566406, -0.03849315643310547, -0.036327362060546875, -0.03416156768798828, -0.03199577331542969, -0.029829978942871094, -0.0276641845703125, -0.025498390197753906, -0.023332595825195312, -0.02116680145263672, -0.019001007080078125, -0.01683521270751953, -0.014669418334960938, -0.012503623962402344, -0.01033782958984375, -0.008172035217285156, -0.0060062408447265625, -0.0038404464721679688, -0.001674652099609375, 0.0004911422729492188, 0.0026569366455078125, 0.004822731018066406, 0.006988525390625, 0.009154319763183594, 0.011320114135742188, 0.013485908508300781, 0.015651702880859375, 0.01781749725341797, 0.019983291625976562, 0.022149085998535156, 0.02431488037109375, 0.026480674743652344, 0.028646469116210938, 0.03081226348876953, 0.032978057861328125, 0.03514385223388672, 0.03730964660644531, 0.039475440979003906, 0.0416412353515625, 0.043807029724121094, 0.04597282409667969, 0.04813861846923828, 0.050304412841796875, 0.05247020721435547, 0.05463600158691406, 0.056801795959472656, 0.05896759033203125, 0.061133384704589844, 0.06329917907714844, 0.06546497344970703, 0.06763076782226562, 0.06979656219482422, 0.07196235656738281, 0.0741281509399414, 0.0762939453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 13.0, 11.0, 32.0, 69.0, 103.0, 166.0, 187.0, 173.0, 115.0, 42.0, 41.0, 21.0, 9.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7762184143066406e-05, -1.7231330275535583e-05, -1.670047640800476e-05, -1.6169622540473938e-05, -1.5638768672943115e-05, -1.5107914805412292e-05, -1.457706093788147e-05, -1.4046207070350647e-05, -1.3515353202819824e-05, -1.2984499335289001e-05, -1.2453645467758179e-05, -1.1922791600227356e-05, -1.1391937732696533e-05, -1.086108386516571e-05, -1.0330229997634888e-05, -9.799376130104065e-06, -9.268522262573242e-06, -8.73766839504242e-06, -8.206814527511597e-06, -7.675960659980774e-06, -7.145106792449951e-06, -6.614252924919128e-06, -6.083399057388306e-06, -5.552545189857483e-06, -5.02169132232666e-06, -4.490837454795837e-06, -3.959983587265015e-06, -3.429129719734192e-06, -2.898275852203369e-06, -2.3674219846725464e-06, -1.8365681171417236e-06, -1.3057142496109009e-06, -7.748603820800781e-07, -2.4400651454925537e-07, 2.868473529815674e-07, 8.177012205123901e-07, 1.3485550880432129e-06, 1.8794089555740356e-06, 2.4102628231048584e-06, 2.941116690635681e-06, 3.471970558166504e-06, 4.002824425697327e-06, 4.533678293228149e-06, 5.064532160758972e-06, 5.595386028289795e-06, 6.126239895820618e-06, 6.6570937633514404e-06, 7.187947630882263e-06, 7.718801498413086e-06, 8.249655365943909e-06, 8.780509233474731e-06, 9.311363101005554e-06, 9.842216968536377e-06, 1.03730708360672e-05, 1.0903924703598022e-05, 1.1434778571128845e-05, 1.1965632438659668e-05, 1.249648630619049e-05, 1.3027340173721313e-05, 1.3558194041252136e-05, 1.4089047908782959e-05, 1.4619901776313782e-05, 1.5150755643844604e-05, 1.5681609511375427e-05, 1.621246337890625e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 14.0, 16.0, 49.0, 84.0, 171.0, 360.0, 859.0, 2323.0, 9814.0, 576677.0, 445536.0, 8775.0, 2140.0, 860.0, 398.0, 212.0, 104.0, 50.0, 33.0, 20.0, 20.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1197509765625, -0.11642265319824219, -0.11309432983398438, -0.10976600646972656, -0.10643768310546875, -0.10310935974121094, -0.09978103637695312, -0.09645271301269531, -0.0931243896484375, -0.08979606628417969, -0.08646774291992188, -0.08313941955566406, -0.07981109619140625, -0.07648277282714844, -0.07315444946289062, -0.06982612609863281, -0.066497802734375, -0.06316947937011719, -0.059841156005859375, -0.05651283264160156, -0.05318450927734375, -0.04985618591308594, -0.046527862548828125, -0.04319953918457031, -0.0398712158203125, -0.03654289245605469, -0.033214569091796875, -0.029886245727539062, -0.02655792236328125, -0.023229598999023438, -0.019901275634765625, -0.016572952270507812, -0.01324462890625, -0.009916305541992188, -0.006587982177734375, -0.0032596588134765625, 6.866455078125e-05, 0.0033969879150390625, 0.006725311279296875, 0.010053634643554688, 0.0133819580078125, 0.016710281372070312, 0.020038604736328125, 0.023366928100585938, 0.02669525146484375, 0.030023574829101562, 0.033351898193359375, 0.03668022155761719, 0.040008544921875, 0.04333686828613281, 0.046665191650390625, 0.04999351501464844, 0.05332183837890625, 0.05665016174316406, 0.059978485107421875, 0.06330680847167969, 0.0666351318359375, 0.06996345520019531, 0.07329177856445312, 0.07662010192871094, 0.07994842529296875, 0.08327674865722656, 0.08660507202148438, 0.08993339538574219, 0.09326171875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 4.0, 6.0, 9.0, 17.0, 35.0, 106.0, 306.0, 273.0, 137.0, 41.0, 17.0, 12.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12224388122558594, -0.11716842651367188, -0.11209297180175781, -0.10701751708984375, -0.10194206237792969, -0.09686660766601562, -0.09179115295410156, -0.0867156982421875, -0.08164024353027344, -0.07656478881835938, -0.07148933410644531, -0.06641387939453125, -0.06133842468261719, -0.056262969970703125, -0.05118751525878906, -0.046112060546875, -0.04103660583496094, -0.035961151123046875, -0.030885696411132812, -0.02581024169921875, -0.020734786987304688, -0.015659332275390625, -0.010583877563476562, -0.0055084228515625, -0.0004329681396484375, 0.004642486572265625, 0.009717941284179688, 0.01479339599609375, 0.019868850708007812, 0.024944305419921875, 0.030019760131835938, 0.03509521484375, 0.04017066955566406, 0.045246124267578125, 0.05032157897949219, 0.05539703369140625, 0.06047248840332031, 0.06554794311523438, 0.07062339782714844, 0.0756988525390625, 0.08077430725097656, 0.08584976196289062, 0.09092521667480469, 0.09600067138671875, 0.10107612609863281, 0.10615158081054688, 0.11122703552246094, 0.116302490234375, 0.12137794494628906, 0.12645339965820312, 0.1315288543701172, 0.13660430908203125, 0.1416797637939453, 0.14675521850585938, 0.15183067321777344, 0.1569061279296875, 0.16198158264160156, 0.16705703735351562, 0.1721324920654297, 0.17720794677734375, 0.1822834014892578, 0.18735885620117188, 0.19243431091308594, 0.197509765625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 12.0, 17.0, 28.0, 60.0, 98.0, 156.0, 183.0, 149.0, 109.0, 66.0, 45.0, 43.0, 8.0, 14.0, 9.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28918594121932983, -0.2577432096004486, -0.22630049288272858, -0.19485777616500854, -0.16341504454612732, -0.1319723129272461, -0.10052959620952606, -0.06908687949180603, -0.037644147872924805, -0.006201423704624176, 0.025241300463676453, 0.05668402463197708, 0.08812674880027771, 0.11956948041915894, 0.15101219713687897, 0.182454913854599, 0.21389764547348022, 0.24534037709236145, 0.2767831087112427, 0.3082258105278015, 0.33966854214668274, 0.37111127376556396, 0.4025539755821228, 0.43399670720100403, 0.46543943881988525, 0.4968821704387665, 0.5283249020576477, 0.5597676038742065, 0.5912103652954102, 0.622653067111969, 0.6540957689285278, 0.6855385303497314, 0.7169811725616455, 0.7484238743782043, 0.779866635799408, 0.8113093376159668, 0.8427520990371704, 0.8741948008537292, 0.9056375026702881, 0.9370802640914917, 0.9685229659080505, 0.9999656677246094, 1.031408429145813, 1.0628511905670166, 1.0942938327789307, 1.1257365942001343, 1.157179355621338, 1.188621997833252, 1.2200647592544556, 1.2515075206756592, 1.2829501628875732, 1.3143929243087769, 1.3458356857299805, 1.3772783279418945, 1.4087210893630981, 1.4401638507843018, 1.4716064929962158, 1.5030492544174194, 1.5344918966293335, 1.565934658050537, 1.5973774194717407, 1.6288201808929443, 1.6602628231048584, 1.691705584526062, 1.7231483459472656]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 3.0, 7.0, 13.0, 10.0, 10.0, 15.0, 20.0, 27.0, 27.0, 24.0, 29.0, 36.0, 36.0, 46.0, 52.0, 40.0, 52.0, 46.0, 56.0, 36.0, 43.0, 49.0, 35.0, 39.0, 25.0, 26.0, 23.0, 27.0, 19.0, 16.0, 17.0, 19.0, 10.0, 14.0, 15.0, 9.0, 10.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.7512623071670532, -0.729004979133606, -0.7067477107048035, -0.6844903826713562, -0.6622331142425537, -0.6399757862091064, -0.617718517780304, -0.5954611897468567, -0.5732039213180542, -0.5509465932846069, -0.5286893248558044, -0.5064319968223572, -0.4841747283935547, -0.4619174301624298, -0.43966013193130493, -0.41740280389785767, -0.3951455056667328, -0.3728882074356079, -0.35063090920448303, -0.32837361097335815, -0.3061163127422333, -0.2838590145111084, -0.26160168647766113, -0.23934440314769745, -0.21708710491657257, -0.1948298066854477, -0.17257250845432281, -0.15031519532203674, -0.12805789709091187, -0.10580060631036758, -0.08354330062866211, -0.06128600239753723, -0.039028704166412354, -0.016771404072642326, 0.005485896021127701, 0.027743197977542877, 0.050000496208667755, 0.07225779443979263, 0.09451510012149811, 0.11677239835262299, 0.13902969658374786, 0.16128699481487274, 0.18354429304599762, 0.2058016061782837, 0.22805890440940857, 0.25031620264053345, 0.2725735008716583, 0.2948307991027832, 0.3170880973339081, 0.33934539556503296, 0.36160269379615784, 0.3838599920272827, 0.4061172902584076, 0.42837458848953247, 0.45063191652297974, 0.4728891849517822, 0.4951465129852295, 0.5174038410186768, 0.5396611094474792, 0.5619184374809265, 0.584175705909729, 0.6064330339431763, 0.6286903023719788, 0.650947630405426, 0.6732048988342285]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 6.0, 2.0, 6.0, 9.0, 18.0, 22.0, 24.0, 37.0, 58.0, 75.0, 86.0, 114.0, 200.0, 469.0, 1610.0, 18195.0, 4155536.0, 15123.0, 1564.0, 459.0, 213.0, 113.0, 82.0, 70.0, 43.0, 32.0, 19.0, 14.0, 25.0, 15.0, 5.0, 10.0, 7.0, 6.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.232666015625, -0.226287841796875, -0.21990966796875, -0.213531494140625, -0.2071533203125, -0.200775146484375, -0.19439697265625, -0.188018798828125, -0.181640625, -0.175262451171875, -0.16888427734375, -0.162506103515625, -0.1561279296875, -0.149749755859375, -0.14337158203125, -0.136993408203125, -0.130615234375, -0.124237060546875, -0.11785888671875, -0.111480712890625, -0.1051025390625, -0.098724365234375, -0.09234619140625, -0.085968017578125, -0.07958984375, -0.073211669921875, -0.06683349609375, -0.060455322265625, -0.0540771484375, -0.047698974609375, -0.04132080078125, -0.034942626953125, -0.028564453125, -0.022186279296875, -0.01580810546875, -0.009429931640625, -0.0030517578125, 0.003326416015625, 0.00970458984375, 0.016082763671875, 0.0224609375, 0.028839111328125, 0.03521728515625, 0.041595458984375, 0.0479736328125, 0.054351806640625, 0.06072998046875, 0.067108154296875, 0.073486328125, 0.079864501953125, 0.08624267578125, 0.092620849609375, 0.0989990234375, 0.105377197265625, 0.11175537109375, 0.118133544921875, 0.12451171875, 0.130889892578125, 0.13726806640625, 0.143646240234375, 0.1500244140625, 0.156402587890625, 0.16278076171875, 0.169158935546875, 0.175537109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 12.0, 12.0, 11.0, 11.0, 15.0, 26.0, 25.0, 26.0, 33.0, 42.0, 43.0, 55.0, 40.0, 42.0, 47.0, 60.0, 42.0, 57.0, 44.0, 40.0, 47.0, 39.0, 39.0, 26.0, 31.0, 19.0, 17.0, 15.0, 9.0, 10.0, 15.0, 3.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.032928466796875, -0.03178739547729492, -0.030646324157714844, -0.029505252838134766, -0.028364181518554688, -0.02722311019897461, -0.02608203887939453, -0.024940967559814453, -0.023799896240234375, -0.022658824920654297, -0.02151775360107422, -0.02037668228149414, -0.019235610961914062, -0.018094539642333984, -0.016953468322753906, -0.015812397003173828, -0.01467132568359375, -0.013530254364013672, -0.012389183044433594, -0.011248111724853516, -0.010107040405273438, -0.00896596908569336, -0.007824897766113281, -0.006683826446533203, -0.005542755126953125, -0.004401683807373047, -0.0032606124877929688, -0.0021195411682128906, -0.0009784698486328125, 0.00016260147094726562, 0.0013036727905273438, 0.002444744110107422, 0.0035858154296875, 0.004726886749267578, 0.005867958068847656, 0.007009029388427734, 0.008150100708007812, 0.00929117202758789, 0.010432243347167969, 0.011573314666748047, 0.012714385986328125, 0.013855457305908203, 0.014996528625488281, 0.01613759994506836, 0.017278671264648438, 0.018419742584228516, 0.019560813903808594, 0.020701885223388672, 0.02184295654296875, 0.022984027862548828, 0.024125099182128906, 0.025266170501708984, 0.026407241821289062, 0.02754831314086914, 0.02868938446044922, 0.029830455780029297, 0.030971527099609375, 0.03211259841918945, 0.03325366973876953, 0.03439474105834961, 0.03553581237792969, 0.036676883697509766, 0.037817955017089844, 0.03895902633666992, 0.04010009765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 5.0, 8.0, 5.0, 21.0, 15.0, 29.0, 37.0, 46.0, 64.0, 98.0, 107.0, 161.0, 261.0, 400.0, 709.0, 1750.0, 6109.0, 171490.0, 3999112.0, 9460.0, 2162.0, 833.0, 482.0, 251.0, 160.0, 138.0, 86.0, 69.0, 47.0, 40.0, 39.0, 14.0, 22.0, 8.0, 8.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.1934814453125, -0.18781089782714844, -0.18214035034179688, -0.1764698028564453, -0.17079925537109375, -0.1651287078857422, -0.15945816040039062, -0.15378761291503906, -0.1481170654296875, -0.14244651794433594, -0.13677597045898438, -0.1311054229736328, -0.12543487548828125, -0.11976432800292969, -0.11409378051757812, -0.10842323303222656, -0.102752685546875, -0.09708213806152344, -0.09141159057617188, -0.08574104309082031, -0.08007049560546875, -0.07439994812011719, -0.06872940063476562, -0.06305885314941406, -0.0573883056640625, -0.05171775817871094, -0.046047210693359375, -0.04037666320800781, -0.03470611572265625, -0.029035568237304688, -0.023365020751953125, -0.017694473266601562, -0.01202392578125, -0.0063533782958984375, -0.000682830810546875, 0.0049877166748046875, 0.01065826416015625, 0.016328811645507812, 0.021999359130859375, 0.027669906616210938, 0.0333404541015625, 0.03901100158691406, 0.044681549072265625, 0.05035209655761719, 0.05602264404296875, 0.06169319152832031, 0.06736373901367188, 0.07303428649902344, 0.078704833984375, 0.08437538146972656, 0.09004592895507812, 0.09571647644042969, 0.10138702392578125, 0.10705757141113281, 0.11272811889648438, 0.11839866638183594, 0.1240692138671875, 0.12973976135253906, 0.13541030883789062, 0.1410808563232422, 0.14675140380859375, 0.1524219512939453, 0.15809249877929688, 0.16376304626464844, 0.16943359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 8.0, 10.0, 28.0, 130.0, 3654.0, 187.0, 41.0, 9.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10504150390625, -0.1020059585571289, -0.09897041320800781, -0.09593486785888672, -0.09289932250976562, -0.08986377716064453, -0.08682823181152344, -0.08379268646240234, -0.08075714111328125, -0.07772159576416016, -0.07468605041503906, -0.07165050506591797, -0.06861495971679688, -0.06557941436767578, -0.06254386901855469, -0.059508323669433594, -0.0564727783203125, -0.053437232971191406, -0.05040168762207031, -0.04736614227294922, -0.044330596923828125, -0.04129505157470703, -0.03825950622558594, -0.035223960876464844, -0.03218841552734375, -0.029152870178222656, -0.026117324829101562, -0.02308177947998047, -0.020046234130859375, -0.01701068878173828, -0.013975143432617188, -0.010939598083496094, -0.007904052734375, -0.004868507385253906, -0.0018329620361328125, 0.0012025833129882812, 0.004238128662109375, 0.007273674011230469, 0.010309219360351562, 0.013344764709472656, 0.01638031005859375, 0.019415855407714844, 0.022451400756835938, 0.02548694610595703, 0.028522491455078125, 0.03155803680419922, 0.03459358215332031, 0.037629127502441406, 0.0406646728515625, 0.043700218200683594, 0.04673576354980469, 0.04977130889892578, 0.052806854248046875, 0.05584239959716797, 0.05887794494628906, 0.061913490295410156, 0.06494903564453125, 0.06798458099365234, 0.07102012634277344, 0.07405567169189453, 0.07709121704101562, 0.08012676239013672, 0.08316230773925781, 0.0861978530883789, 0.0892333984375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 16.0, 23.0, 41.0, 68.0, 86.0, 142.0, 155.0, 140.0, 103.0, 85.0, 43.0, 31.0, 15.0, 14.0, 3.0, 8.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2550264000892639, -0.24864712357521057, -0.24226786196231842, -0.23588858544826508, -0.22950930893421173, -0.22313004732131958, -0.21675077080726624, -0.2103714942932129, -0.20399221777915955, -0.1976129412651062, -0.19123367965221405, -0.1848544031381607, -0.17847512662410736, -0.1720958650112152, -0.16571658849716187, -0.15933731198310852, -0.15295805037021637, -0.14657877385616302, -0.14019951224327087, -0.13382023572921753, -0.12744095921516418, -0.12106169015169144, -0.11468242108821869, -0.10830314457416534, -0.1019238755106926, -0.09554460644721985, -0.0891653299331665, -0.08278606086969376, -0.07640679180622101, -0.07002751529216766, -0.06364824622869492, -0.05726897343993187, -0.05088970065116882, -0.04451042786240578, -0.03813115507364273, -0.03175188601016998, -0.025372613221406937, -0.01899334043264389, -0.012614071369171143, -0.006234798580408096, 0.00014447420835494995, 0.006523746065795422, 0.012903017923235893, 0.01928228884935379, 0.025661561638116837, 0.03204083442687988, 0.03842010349035263, 0.04479937627911568, 0.05117864906787872, 0.05755792185664177, 0.06393719464540482, 0.07031646370887756, 0.07669574022293091, 0.08307500928640366, 0.0894542783498764, 0.09583355486392975, 0.1022128239274025, 0.10859209299087524, 0.11497136950492859, 0.12135063856840134, 0.12772990763187408, 0.13410918414592743, 0.14048844575881958, 0.14686772227287292, 0.15324699878692627]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 9.0, 7.0, 14.0, 21.0, 17.0, 19.0, 25.0, 36.0, 20.0, 33.0, 50.0, 51.0, 46.0, 51.0, 46.0, 52.0, 53.0, 48.0, 47.0, 41.0, 47.0, 33.0, 31.0, 37.0, 32.0, 24.0, 16.0, 13.0, 12.0, 5.0, 9.0, 13.0, 5.0, 5.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1212194561958313, -0.1174180805683136, -0.1136167123913765, -0.10981534421443939, -0.10601396858692169, -0.10221259295940399, -0.09841122478246689, -0.09460985660552979, -0.09080848097801208, -0.08700710535049438, -0.08320573717355728, -0.07940436899662018, -0.07560299336910248, -0.07180161774158478, -0.06800024956464767, -0.06419888138771057, -0.06039750576019287, -0.05659613385796547, -0.05279476195573807, -0.048993390053510666, -0.045192018151283264, -0.04139064624905586, -0.03758927434682846, -0.03378790244460106, -0.029986530542373657, -0.026185158640146255, -0.022383786737918854, -0.018582414835691452, -0.01478104293346405, -0.010979671031236649, -0.007178299129009247, -0.003376927226781845, 0.00042444467544555664, 0.004225816577672958, 0.00802718847990036, 0.011828560382127762, 0.015629932284355164, 0.019431304186582565, 0.023232676088809967, 0.02703404799103737, 0.03083541989326477, 0.03463679179549217, 0.038438163697719574, 0.042239535599946976, 0.04604090750217438, 0.04984227940440178, 0.05364365130662918, 0.05744502320885658, 0.061246395111083984, 0.06504777073860168, 0.06884913891553879, 0.07265050709247589, 0.07645188271999359, 0.08025325834751129, 0.0840546265244484, 0.0878559947013855, 0.0916573703289032, 0.0954587459564209, 0.099260114133358, 0.1030614823102951, 0.1068628579378128, 0.1106642335653305, 0.11446560174226761, 0.11826696991920471, 0.12206834554672241]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 5.0, 7.0, 11.0, 17.0, 22.0, 20.0, 32.0, 42.0, 51.0, 72.0, 112.0, 170.0, 282.0, 428.0, 691.0, 1211.0, 2253.0, 4236.0, 8505.0, 17893.0, 39863.0, 96644.0, 232246.0, 324282.0, 184627.0, 74649.0, 30915.0, 14361.0, 6922.0, 3369.0, 1833.0, 1073.0, 609.0, 371.0, 231.0, 141.0, 90.0, 73.0, 45.0, 37.0, 22.0, 18.0, 19.0, 19.0, 8.0, 4.0, 6.0, 1.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.046661376953125, -0.04517316818237305, -0.043684959411621094, -0.04219675064086914, -0.04070854187011719, -0.039220333099365234, -0.03773212432861328, -0.03624391555786133, -0.034755706787109375, -0.03326749801635742, -0.03177928924560547, -0.030291080474853516, -0.028802871704101562, -0.02731466293334961, -0.025826454162597656, -0.024338245391845703, -0.02285003662109375, -0.021361827850341797, -0.019873619079589844, -0.01838541030883789, -0.016897201538085938, -0.015408992767333984, -0.013920783996582031, -0.012432575225830078, -0.010944366455078125, -0.009456157684326172, -0.007967948913574219, -0.006479740142822266, -0.0049915313720703125, -0.0035033226013183594, -0.0020151138305664062, -0.0005269050598144531, 0.0009613037109375, 0.002449512481689453, 0.003937721252441406, 0.005425930023193359, 0.0069141387939453125, 0.008402347564697266, 0.009890556335449219, 0.011378765106201172, 0.012866973876953125, 0.014355182647705078, 0.01584339141845703, 0.017331600189208984, 0.018819808959960938, 0.02030801773071289, 0.021796226501464844, 0.023284435272216797, 0.02477264404296875, 0.026260852813720703, 0.027749061584472656, 0.02923727035522461, 0.030725479125976562, 0.032213687896728516, 0.03370189666748047, 0.03519010543823242, 0.036678314208984375, 0.03816652297973633, 0.03965473175048828, 0.041142940521240234, 0.04263114929199219, 0.04411935806274414, 0.045607566833496094, 0.04709577560424805, 0.048583984375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 2.0, 5.0, 12.0, 13.0, 10.0, 11.0, 32.0, 32.0, 32.0, 42.0, 35.0, 46.0, 39.0, 35.0, 61.0, 37.0, 45.0, 54.0, 47.0, 42.0, 48.0, 49.0, 41.0, 37.0, 25.0, 27.0, 25.0, 18.0, 8.0, 13.0, 15.0, 15.0, 9.0, 1.0, 6.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.034332275390625, -0.033145904541015625, -0.03195953369140625, -0.030773162841796875, -0.0295867919921875, -0.028400421142578125, -0.02721405029296875, -0.026027679443359375, -0.02484130859375, -0.023654937744140625, -0.02246856689453125, -0.021282196044921875, -0.0200958251953125, -0.018909454345703125, -0.01772308349609375, -0.016536712646484375, -0.015350341796875, -0.014163970947265625, -0.01297760009765625, -0.011791229248046875, -0.0106048583984375, -0.009418487548828125, -0.00823211669921875, -0.007045745849609375, -0.005859375, -0.004673004150390625, -0.00348663330078125, -0.002300262451171875, -0.0011138916015625, 7.2479248046875e-05, 0.00125885009765625, 0.002445220947265625, 0.003631591796875, 0.004817962646484375, 0.00600433349609375, 0.007190704345703125, 0.0083770751953125, 0.009563446044921875, 0.01074981689453125, 0.011936187744140625, 0.01312255859375, 0.014308929443359375, 0.01549530029296875, 0.016681671142578125, 0.0178680419921875, 0.019054412841796875, 0.02024078369140625, 0.021427154541015625, 0.022613525390625, 0.023799896240234375, 0.02498626708984375, 0.026172637939453125, 0.0273590087890625, 0.028545379638671875, 0.02973175048828125, 0.030918121337890625, 0.0321044921875, 0.033290863037109375, 0.03447723388671875, 0.035663604736328125, 0.0368499755859375, 0.038036346435546875, 0.03922271728515625, 0.040409088134765625, 0.041595458984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 3.0, 4.0, 10.0, 16.0, 24.0, 27.0, 36.0, 45.0, 50.0, 78.0, 140.0, 211.0, 384.0, 775.0, 2030.0, 7932.0, 46882.0, 479962.0, 454144.0, 44567.0, 7460.0, 2054.0, 757.0, 351.0, 156.0, 122.0, 96.0, 47.0, 48.0, 22.0, 31.0, 19.0, 12.0, 10.0, 9.0, 6.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.111083984375, -0.10771656036376953, -0.10434913635253906, -0.1009817123413086, -0.09761428833007812, -0.09424686431884766, -0.09087944030761719, -0.08751201629638672, -0.08414459228515625, -0.08077716827392578, -0.07740974426269531, -0.07404232025146484, -0.07067489624023438, -0.0673074722290039, -0.06394004821777344, -0.06057262420654297, -0.0572052001953125, -0.05383777618408203, -0.05047035217285156, -0.047102928161621094, -0.043735504150390625, -0.040368080139160156, -0.03700065612792969, -0.03363323211669922, -0.03026580810546875, -0.02689838409423828, -0.023530960083007812, -0.020163536071777344, -0.016796112060546875, -0.013428688049316406, -0.010061264038085938, -0.006693840026855469, -0.003326416015625, 4.100799560546875e-05, 0.0034084320068359375, 0.006775856018066406, 0.010143280029296875, 0.013510704040527344, 0.016878128051757812, 0.02024555206298828, 0.02361297607421875, 0.02698040008544922, 0.030347824096679688, 0.033715248107910156, 0.037082672119140625, 0.040450096130371094, 0.04381752014160156, 0.04718494415283203, 0.0505523681640625, 0.05391979217529297, 0.05728721618652344, 0.060654640197753906, 0.06402206420898438, 0.06738948822021484, 0.07075691223144531, 0.07412433624267578, 0.07749176025390625, 0.08085918426513672, 0.08422660827636719, 0.08759403228759766, 0.09096145629882812, 0.0943288803100586, 0.09769630432128906, 0.10106372833251953, 0.10443115234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 2.0, 5.0, 3.0, 9.0, 16.0, 18.0, 17.0, 12.0, 27.0, 27.0, 23.0, 26.0, 35.0, 51.0, 42.0, 42.0, 44.0, 48.0, 51.0, 66.0, 45.0, 40.0, 46.0, 51.0, 42.0, 43.0, 33.0, 16.0, 28.0, 14.0, 15.0, 13.0, 11.0, 10.0, 7.0, 11.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.1700439453125, -0.1654338836669922, -0.16082382202148438, -0.15621376037597656, -0.15160369873046875, -0.14699363708496094, -0.14238357543945312, -0.1377735137939453, -0.1331634521484375, -0.1285533905029297, -0.12394332885742188, -0.11933326721191406, -0.11472320556640625, -0.11011314392089844, -0.10550308227539062, -0.10089302062988281, -0.096282958984375, -0.09167289733886719, -0.08706283569335938, -0.08245277404785156, -0.07784271240234375, -0.07323265075683594, -0.06862258911132812, -0.06401252746582031, -0.0594024658203125, -0.05479240417480469, -0.050182342529296875, -0.04557228088378906, -0.04096221923828125, -0.03635215759277344, -0.031742095947265625, -0.027132034301757812, -0.02252197265625, -0.017911911010742188, -0.013301849365234375, -0.008691787719726562, -0.00408172607421875, 0.0005283355712890625, 0.005138397216796875, 0.009748458862304688, 0.0143585205078125, 0.018968582153320312, 0.023578643798828125, 0.028188705444335938, 0.03279876708984375, 0.03740882873535156, 0.042018890380859375, 0.04662895202636719, 0.051239013671875, 0.05584907531738281, 0.060459136962890625, 0.06506919860839844, 0.06967926025390625, 0.07428932189941406, 0.07889938354492188, 0.08350944519042969, 0.0881195068359375, 0.09272956848144531, 0.09733963012695312, 0.10194969177246094, 0.10655975341796875, 0.11116981506347656, 0.11577987670898438, 0.12038993835449219, 0.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 6.0, 6.0, 11.0, 11.0, 24.0, 38.0, 63.0, 127.0, 209.0, 494.0, 1281.0, 5072.0, 39721.0, 714799.0, 265619.0, 16509.0, 2879.0, 879.0, 367.0, 183.0, 98.0, 65.0, 25.0, 15.0, 15.0, 8.0, 7.0, 4.0, 6.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04010009765625, -0.03891420364379883, -0.037728309631347656, -0.036542415618896484, -0.03535652160644531, -0.03417062759399414, -0.03298473358154297, -0.0317988395690918, -0.030612945556640625, -0.029427051544189453, -0.02824115753173828, -0.02705526351928711, -0.025869369506835938, -0.024683475494384766, -0.023497581481933594, -0.022311687469482422, -0.02112579345703125, -0.019939899444580078, -0.018754005432128906, -0.017568111419677734, -0.016382217407226562, -0.01519632339477539, -0.014010429382324219, -0.012824535369873047, -0.011638641357421875, -0.010452747344970703, -0.009266853332519531, -0.00808095932006836, -0.0068950653076171875, -0.005709171295166016, -0.004523277282714844, -0.003337383270263672, -0.0021514892578125, -0.0009655952453613281, 0.00022029876708984375, 0.0014061927795410156, 0.0025920867919921875, 0.0037779808044433594, 0.004963874816894531, 0.006149768829345703, 0.007335662841796875, 0.008521556854248047, 0.009707450866699219, 0.01089334487915039, 0.012079238891601562, 0.013265132904052734, 0.014451026916503906, 0.015636920928955078, 0.01682281494140625, 0.018008708953857422, 0.019194602966308594, 0.020380496978759766, 0.021566390991210938, 0.02275228500366211, 0.02393817901611328, 0.025124073028564453, 0.026309967041015625, 0.027495861053466797, 0.02868175506591797, 0.02986764907836914, 0.031053543090820312, 0.032239437103271484, 0.033425331115722656, 0.03461122512817383, 0.035797119140625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 9.0, 7.0, 19.0, 23.0, 21.0, 37.0, 45.0, 45.0, 67.0, 79.0, 85.0, 69.0, 72.0, 80.0, 59.0, 54.0, 52.0, 38.0, 24.0, 22.0, 20.0, 16.0, 15.0, 9.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.735324859619141e-06, -6.514601409435272e-06, -6.293877959251404e-06, -6.073154509067535e-06, -5.852431058883667e-06, -5.631707608699799e-06, -5.41098415851593e-06, -5.190260708332062e-06, -4.969537258148193e-06, -4.748813807964325e-06, -4.5280903577804565e-06, -4.307366907596588e-06, -4.08664345741272e-06, -3.865920007228851e-06, -3.645196557044983e-06, -3.4244731068611145e-06, -3.203749656677246e-06, -2.9830262064933777e-06, -2.7623027563095093e-06, -2.541579306125641e-06, -2.3208558559417725e-06, -2.100132405757904e-06, -1.8794089555740356e-06, -1.6586855053901672e-06, -1.4379620552062988e-06, -1.2172386050224304e-06, -9.96515154838562e-07, -7.757917046546936e-07, -5.550682544708252e-07, -3.343448042869568e-07, -1.1362135410308838e-07, 1.0710209608078003e-07, 3.2782554626464844e-07, 5.485489964485168e-07, 7.692724466323853e-07, 9.899958968162537e-07, 1.210719347000122e-06, 1.4314427971839905e-06, 1.6521662473678589e-06, 1.8728896975517273e-06, 2.0936131477355957e-06, 2.314336597919464e-06, 2.5350600481033325e-06, 2.755783498287201e-06, 2.9765069484710693e-06, 3.1972303986549377e-06, 3.417953848838806e-06, 3.6386772990226746e-06, 3.859400749206543e-06, 4.080124199390411e-06, 4.30084764957428e-06, 4.521571099758148e-06, 4.742294549942017e-06, 4.963018000125885e-06, 5.183741450309753e-06, 5.404464900493622e-06, 5.62518835067749e-06, 5.845911800861359e-06, 6.066635251045227e-06, 6.2873587012290955e-06, 6.508082151412964e-06, 6.728805601596832e-06, 6.949529051780701e-06, 7.170252501964569e-06, 7.3909759521484375e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 13.0, 30.0, 55.0, 113.0, 316.0, 1967.0, 130484.0, 909037.0, 5768.0, 543.0, 115.0, 62.0, 27.0, 12.0, 9.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08441162109375, -0.08130645751953125, -0.0782012939453125, -0.07509613037109375, -0.071990966796875, -0.06888580322265625, -0.0657806396484375, -0.06267547607421875, -0.0595703125, -0.05646514892578125, -0.0533599853515625, -0.05025482177734375, -0.047149658203125, -0.04404449462890625, -0.0409393310546875, -0.03783416748046875, -0.03472900390625, -0.03162384033203125, -0.0285186767578125, -0.02541351318359375, -0.022308349609375, -0.01920318603515625, -0.0160980224609375, -0.01299285888671875, -0.0098876953125, -0.00678253173828125, -0.0036773681640625, -0.00057220458984375, 0.002532958984375, 0.00563812255859375, 0.0087432861328125, 0.01184844970703125, 0.01495361328125, 0.01805877685546875, 0.0211639404296875, 0.02426910400390625, 0.027374267578125, 0.03047943115234375, 0.0335845947265625, 0.03668975830078125, 0.039794921875, 0.04290008544921875, 0.0460052490234375, 0.04911041259765625, 0.052215576171875, 0.05532073974609375, 0.0584259033203125, 0.06153106689453125, 0.06463623046875, 0.06774139404296875, 0.0708465576171875, 0.07395172119140625, 0.077056884765625, 0.08016204833984375, 0.0832672119140625, 0.08637237548828125, 0.0894775390625, 0.09258270263671875, 0.0956878662109375, 0.09879302978515625, 0.101898193359375, 0.10500335693359375, 0.1081085205078125, 0.11121368408203125, 0.11431884765625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 10.0, 7.0, 19.0, 42.0, 70.0, 111.0, 183.0, 192.0, 164.0, 100.0, 55.0, 24.0, 21.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1180419921875, -0.11565589904785156, -0.11326980590820312, -0.11088371276855469, -0.10849761962890625, -0.10611152648925781, -0.10372543334960938, -0.10133934020996094, -0.0989532470703125, -0.09656715393066406, -0.09418106079101562, -0.09179496765136719, -0.08940887451171875, -0.08702278137207031, -0.08463668823242188, -0.08225059509277344, -0.079864501953125, -0.07747840881347656, -0.07509231567382812, -0.07270622253417969, -0.07032012939453125, -0.06793403625488281, -0.06554794311523438, -0.06316184997558594, -0.0607757568359375, -0.05838966369628906, -0.056003570556640625, -0.05361747741699219, -0.05123138427734375, -0.04884529113769531, -0.046459197998046875, -0.04407310485839844, -0.04168701171875, -0.03930091857910156, -0.036914825439453125, -0.03452873229980469, -0.03214263916015625, -0.029756546020507812, -0.027370452880859375, -0.024984359741210938, -0.0225982666015625, -0.020212173461914062, -0.017826080322265625, -0.015439987182617188, -0.01305389404296875, -0.010667800903320312, -0.008281707763671875, -0.0058956146240234375, -0.003509521484375, -0.0011234283447265625, 0.001262664794921875, 0.0036487579345703125, 0.00603485107421875, 0.008420944213867188, 0.010807037353515625, 0.013193130493164062, 0.0155792236328125, 0.017965316772460938, 0.020351409912109375, 0.022737503051757812, 0.02512359619140625, 0.027509689331054688, 0.029895782470703125, 0.03228187561035156, 0.03466796875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 18.0, 42.0, 85.0, 173.0, 202.0, 178.0, 130.0, 92.0, 36.0, 22.0, 10.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3255603611469269, -0.29497021436691284, -0.2643800973892212, -0.23378996551036835, -0.2031998336315155, -0.17260970175266266, -0.14201956987380981, -0.11142943799495697, -0.08083930611610413, -0.05024917423725128, -0.019659042358398438, 0.010931089520454407, 0.04152122139930725, 0.0721113532781601, 0.10270148515701294, 0.13329161703586578, 0.16388174891471863, 0.19447188079357147, 0.22506201267242432, 0.25565212965011597, 0.28624227643013, 0.31683242321014404, 0.3474225401878357, 0.37801265716552734, 0.4086028039455414, 0.4391929507255554, 0.46978306770324707, 0.5003731846809387, 0.5309633016586304, 0.5615534782409668, 0.5921435952186584, 0.6227337121963501, 0.6533238887786865, 0.6839140057563782, 0.7145041227340698, 0.7450942993164062, 0.7756844162940979, 0.8062745332717896, 0.836864709854126, 0.8674548268318176, 0.8980449438095093, 0.9286350607872009, 0.9592251777648926, 0.989815354347229, 1.0204055309295654, 1.0509955883026123, 1.0815857648849487, 1.1121758222579956, 1.142765998840332, 1.1733561754226685, 1.2039462327957153, 1.2345364093780518, 1.2651264667510986, 1.295716643333435, 1.3263068199157715, 1.3568968772888184, 1.3874870538711548, 1.4180772304534912, 1.448667287826538, 1.4792574644088745, 1.509847640991211, 1.5404376983642578, 1.5710278749465942, 1.6016179323196411, 1.6322081089019775]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 6.0, 7.0, 7.0, 11.0, 9.0, 12.0, 11.0, 18.0, 19.0, 24.0, 25.0, 28.0, 29.0, 28.0, 27.0, 31.0, 41.0, 31.0, 36.0, 47.0, 33.0, 41.0, 40.0, 48.0, 44.0, 27.0, 36.0, 30.0, 29.0, 29.0, 26.0, 20.0, 22.0, 15.0, 16.0, 22.0, 13.0, 7.0, 11.0, 3.0, 7.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.5592297315597534, -0.5424671769142151, -0.5257046222686768, -0.5089421272277832, -0.4921795725822449, -0.47541701793670654, -0.4586544632911682, -0.44189193844795227, -0.42512941360473633, -0.408366858959198, -0.39160433411598206, -0.3748417794704437, -0.3580792546272278, -0.34131669998168945, -0.3245541453361511, -0.3077916204929352, -0.29102906584739685, -0.2742665112018585, -0.2575039863586426, -0.24074143171310425, -0.2239789068698883, -0.20721635222434998, -0.19045381247997284, -0.1736912727355957, -0.15692873299121857, -0.14016619324684143, -0.1234036535024643, -0.10664110630750656, -0.08987856656312943, -0.07311602681875229, -0.056353479623794556, -0.03959093987941742, -0.022828400135040283, -0.006065858528017998, 0.010696683079004288, 0.027459226548671722, 0.04422176629304886, 0.060984306037425995, 0.07774685323238373, 0.09450939297676086, 0.111271932721138, 0.12803447246551514, 0.14479701220989227, 0.1615595519542694, 0.17832210659980774, 0.19508463144302368, 0.211847186088562, 0.22860972583293915, 0.24537226557731628, 0.2621348202228546, 0.27889734506607056, 0.2956598997116089, 0.31242242455482483, 0.32918497920036316, 0.3459475040435791, 0.36271005868911743, 0.37947261333465576, 0.3962351679801941, 0.41299769282341003, 0.42976024746894836, 0.4465227723121643, 0.46328532695770264, 0.48004788160324097, 0.4968104064464569, 0.5135729312896729]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 18.0, 29.0, 56.0, 75.0, 184.0, 354.0, 674.0, 1545.0, 3892.0, 11669.0, 51841.0, 1646907.0, 2399507.0, 57366.0, 12659.0, 4407.0, 1654.0, 744.0, 332.0, 189.0, 87.0, 35.0, 22.0, 17.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05126953125, -0.048709869384765625, -0.04615020751953125, -0.043590545654296875, -0.0410308837890625, -0.038471221923828125, -0.03591156005859375, -0.033351898193359375, -0.030792236328125, -0.028232574462890625, -0.02567291259765625, -0.023113250732421875, -0.0205535888671875, -0.017993927001953125, -0.01543426513671875, -0.012874603271484375, -0.01031494140625, -0.007755279541015625, -0.00519561767578125, -0.002635955810546875, -7.62939453125e-05, 0.002483367919921875, 0.00504302978515625, 0.007602691650390625, 0.010162353515625, 0.012722015380859375, 0.01528167724609375, 0.017841339111328125, 0.0204010009765625, 0.022960662841796875, 0.02552032470703125, 0.028079986572265625, 0.0306396484375, 0.033199310302734375, 0.03575897216796875, 0.038318634033203125, 0.0408782958984375, 0.043437957763671875, 0.04599761962890625, 0.048557281494140625, 0.051116943359375, 0.053676605224609375, 0.05623626708984375, 0.058795928955078125, 0.0613555908203125, 0.06391525268554688, 0.06647491455078125, 0.06903457641601562, 0.07159423828125, 0.07415390014648438, 0.07671356201171875, 0.07927322387695312, 0.0818328857421875, 0.08439254760742188, 0.08695220947265625, 0.08951187133789062, 0.092071533203125, 0.09463119506835938, 0.09719085693359375, 0.09975051879882812, 0.1023101806640625, 0.10486984252929688, 0.10742950439453125, 0.10998916625976562, 0.112548828125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 7.0, 12.0, 18.0, 11.0, 15.0, 26.0, 25.0, 37.0, 37.0, 47.0, 41.0, 55.0, 34.0, 59.0, 47.0, 47.0, 59.0, 53.0, 55.0, 33.0, 37.0, 37.0, 34.0, 33.0, 20.0, 14.0, 21.0, 10.0, 13.0, 18.0, 11.0, 4.0, 3.0, 4.0, 2.0, 2.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03729248046875, -0.03614044189453125, -0.0349884033203125, -0.03383636474609375, -0.032684326171875, -0.03153228759765625, -0.0303802490234375, -0.02922821044921875, -0.028076171875, -0.02692413330078125, -0.0257720947265625, -0.02462005615234375, -0.023468017578125, -0.02231597900390625, -0.0211639404296875, -0.02001190185546875, -0.01885986328125, -0.01770782470703125, -0.0165557861328125, -0.01540374755859375, -0.014251708984375, -0.01309967041015625, -0.0119476318359375, -0.01079559326171875, -0.0096435546875, -0.00849151611328125, -0.0073394775390625, -0.00618743896484375, -0.005035400390625, -0.00388336181640625, -0.0027313232421875, -0.00157928466796875, -0.00042724609375, 0.00072479248046875, 0.0018768310546875, 0.00302886962890625, 0.004180908203125, 0.00533294677734375, 0.0064849853515625, 0.00763702392578125, 0.0087890625, 0.00994110107421875, 0.0110931396484375, 0.01224517822265625, 0.013397216796875, 0.01454925537109375, 0.0157012939453125, 0.01685333251953125, 0.01800537109375, 0.01915740966796875, 0.0203094482421875, 0.02146148681640625, 0.022613525390625, 0.02376556396484375, 0.0249176025390625, 0.02606964111328125, 0.0272216796875, 0.02837371826171875, 0.0295257568359375, 0.03067779541015625, 0.031829833984375, 0.03298187255859375, 0.0341339111328125, 0.03528594970703125, 0.03643798828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 6.0, 5.0, 5.0, 10.0, 14.0, 27.0, 32.0, 50.0, 80.0, 224.0, 664.0, 4555.0, 69339.0, 4050896.0, 63127.0, 4215.0, 608.0, 205.0, 89.0, 47.0, 24.0, 16.0, 13.0, 13.0, 8.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11907958984375, -0.11353778839111328, -0.10799598693847656, -0.10245418548583984, -0.09691238403320312, -0.0913705825805664, -0.08582878112792969, -0.08028697967529297, -0.07474517822265625, -0.06920337677001953, -0.06366157531738281, -0.058119773864746094, -0.052577972412109375, -0.047036170959472656, -0.04149436950683594, -0.03595256805419922, -0.0304107666015625, -0.02486896514892578, -0.019327163696289062, -0.013785362243652344, -0.008243560791015625, -0.0027017593383789062, 0.0028400421142578125, 0.008381843566894531, 0.01392364501953125, 0.01946544647216797, 0.025007247924804688, 0.030549049377441406, 0.036090850830078125, 0.041632652282714844, 0.04717445373535156, 0.05271625518798828, 0.058258056640625, 0.06379985809326172, 0.06934165954589844, 0.07488346099853516, 0.08042526245117188, 0.0859670639038086, 0.09150886535644531, 0.09705066680908203, 0.10259246826171875, 0.10813426971435547, 0.11367607116699219, 0.1192178726196289, 0.12475967407226562, 0.13030147552490234, 0.13584327697753906, 0.14138507843017578, 0.1469268798828125, 0.15246868133544922, 0.15801048278808594, 0.16355228424072266, 0.16909408569335938, 0.1746358871459961, 0.1801776885986328, 0.18571949005126953, 0.19126129150390625, 0.19680309295654297, 0.2023448944091797, 0.2078866958618164, 0.21342849731445312, 0.21897029876708984, 0.22451210021972656, 0.23005390167236328, 0.235595703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 9.0, 7.0, 9.0, 25.0, 16.0, 29.0, 36.0, 68.0, 167.0, 556.0, 1643.0, 929.0, 279.0, 107.0, 49.0, 34.0, 25.0, 15.0, 12.0, 13.0, 5.0, 5.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10888671875, -0.105926513671875, -0.10296630859375, -0.100006103515625, -0.0970458984375, -0.094085693359375, -0.09112548828125, -0.088165283203125, -0.085205078125, -0.082244873046875, -0.07928466796875, -0.076324462890625, -0.0733642578125, -0.070404052734375, -0.06744384765625, -0.064483642578125, -0.0615234375, -0.058563232421875, -0.05560302734375, -0.052642822265625, -0.0496826171875, -0.046722412109375, -0.04376220703125, -0.040802001953125, -0.037841796875, -0.034881591796875, -0.03192138671875, -0.028961181640625, -0.0260009765625, -0.023040771484375, -0.02008056640625, -0.017120361328125, -0.01416015625, -0.011199951171875, -0.00823974609375, -0.005279541015625, -0.0023193359375, 0.000640869140625, 0.00360107421875, 0.006561279296875, 0.009521484375, 0.012481689453125, 0.01544189453125, 0.018402099609375, 0.0213623046875, 0.024322509765625, 0.02728271484375, 0.030242919921875, 0.033203125, 0.036163330078125, 0.03912353515625, 0.042083740234375, 0.0450439453125, 0.048004150390625, 0.05096435546875, 0.053924560546875, 0.056884765625, 0.059844970703125, 0.06280517578125, 0.065765380859375, 0.0687255859375, 0.071685791015625, 0.07464599609375, 0.077606201171875, 0.08056640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 26.0, 49.0, 113.0, 256.0, 252.0, 176.0, 68.0, 16.0, 15.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3399028778076172, -1.3089771270751953, -1.2780513763427734, -1.247125506401062, -1.2161997556686401, -1.1852740049362183, -1.1543481349945068, -1.123422384262085, -1.092496633529663, -1.0615708827972412, -1.0306451320648193, -0.9997192621231079, -0.968793511390686, -0.9378677606582642, -0.9069419503211975, -0.8760161399841309, -0.845090389251709, -0.8141646385192871, -0.7832388281822205, -0.7523130178451538, -0.7213872671127319, -0.6904615163803101, -0.6595357060432434, -0.6286098957061768, -0.5976841449737549, -0.566758394241333, -0.5358325839042664, -0.5049067735671997, -0.47398102283477783, -0.44305524230003357, -0.4121294617652893, -0.38120368123054504, -0.3502779006958008, -0.3193521201610565, -0.28842633962631226, -0.257500559091568, -0.22657477855682373, -0.19564899802207947, -0.1647232174873352, -0.13379743695259094, -0.10287165641784668, -0.07194587588310242, -0.041020095348358154, -0.010094314813613892, 0.02083146572113037, 0.051757246255874634, 0.0826830267906189, 0.11360880732536316, 0.14453458786010742, 0.17546036839485168, 0.20638614892959595, 0.2373119294643402, 0.2682377099990845, 0.29916349053382874, 0.330089271068573, 0.36101505160331726, 0.3919408321380615, 0.4228666126728058, 0.45379239320755005, 0.4847181737422943, 0.5156439542770386, 0.5465697050094604, 0.5774955153465271, 0.6084213256835938, 0.6393470764160156]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 7.0, 7.0, 6.0, 9.0, 6.0, 13.0, 17.0, 13.0, 20.0, 28.0, 23.0, 25.0, 35.0, 27.0, 37.0, 45.0, 44.0, 47.0, 43.0, 61.0, 48.0, 43.0, 30.0, 46.0, 42.0, 32.0, 31.0, 31.0, 30.0, 34.0, 15.0, 22.0, 12.0, 17.0, 6.0, 10.0, 10.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.31617963314056396, -0.3059959411621094, -0.2958122491836548, -0.2856285870075226, -0.275444895029068, -0.2652612030506134, -0.2550775110721588, -0.24489383399486542, -0.23471015691757202, -0.22452646493911743, -0.21434278786182404, -0.20415909588336945, -0.19397541880607605, -0.18379172682762146, -0.17360803484916687, -0.16342435777187347, -0.15324066579341888, -0.1430569738149643, -0.1328732967376709, -0.12268960475921631, -0.11250592768192291, -0.10232223570346832, -0.09213855117559433, -0.08195486664772034, -0.07177118211984634, -0.06158749759197235, -0.05140381306409836, -0.04122012481093407, -0.031036440283060074, -0.02085275575518608, -0.01066906750202179, -0.00048538297414779663, 0.009698301553726196, 0.01988198608160019, 0.03006567247211933, 0.040249358862638474, 0.050433043390512466, 0.06061672791838646, 0.07080041617155075, 0.08098410069942474, 0.09116778522729874, 0.10135146975517273, 0.11153515428304672, 0.12171883881092072, 0.1319025307893753, 0.1420862078666687, 0.1522698998451233, 0.16245359182357788, 0.17263726890087128, 0.18282096087932587, 0.19300463795661926, 0.20318832993507385, 0.21337200701236725, 0.22355569899082184, 0.23373937606811523, 0.24392306804656982, 0.2541067600250244, 0.264290452003479, 0.2744741439819336, 0.2846578061580658, 0.2948414981365204, 0.305025190114975, 0.31520888209342957, 0.32539254426956177, 0.33557623624801636]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 16.0, 22.0, 42.0, 51.0, 79.0, 154.0, 286.0, 551.0, 1193.0, 2578.0, 5705.0, 14425.0, 38044.0, 105782.0, 255827.0, 332405.0, 181474.0, 68315.0, 24688.0, 9414.0, 3888.0, 1812.0, 856.0, 412.0, 220.0, 122.0, 62.0, 47.0, 28.0, 14.0, 12.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.054046630859375, -0.05237245559692383, -0.050698280334472656, -0.049024105072021484, -0.04734992980957031, -0.04567575454711914, -0.04400157928466797, -0.0423274040222168, -0.040653228759765625, -0.03897905349731445, -0.03730487823486328, -0.03563070297241211, -0.03395652770996094, -0.032282352447509766, -0.030608177185058594, -0.028934001922607422, -0.02725982666015625, -0.025585651397705078, -0.023911476135253906, -0.022237300872802734, -0.020563125610351562, -0.01888895034790039, -0.01721477508544922, -0.015540599822998047, -0.013866424560546875, -0.012192249298095703, -0.010518074035644531, -0.00884389877319336, -0.0071697235107421875, -0.005495548248291016, -0.0038213729858398438, -0.002147197723388672, -0.0004730224609375, 0.0012011528015136719, 0.0028753280639648438, 0.004549503326416016, 0.0062236785888671875, 0.00789785385131836, 0.009572029113769531, 0.011246204376220703, 0.012920379638671875, 0.014594554901123047, 0.01626873016357422, 0.01794290542602539, 0.019617080688476562, 0.021291255950927734, 0.022965431213378906, 0.024639606475830078, 0.02631378173828125, 0.027987957000732422, 0.029662132263183594, 0.031336307525634766, 0.03301048278808594, 0.03468465805053711, 0.03635883331298828, 0.03803300857543945, 0.039707183837890625, 0.0413813591003418, 0.04305553436279297, 0.04472970962524414, 0.04640388488769531, 0.048078060150146484, 0.049752235412597656, 0.05142641067504883, 0.0531005859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 10.0, 4.0, 8.0, 8.0, 16.0, 18.0, 17.0, 30.0, 32.0, 37.0, 37.0, 31.0, 47.0, 46.0, 37.0, 51.0, 62.0, 49.0, 52.0, 52.0, 48.0, 46.0, 45.0, 34.0, 30.0, 16.0, 30.0, 22.0, 21.0, 10.0, 9.0, 13.0, 11.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0364990234375, -0.03532695770263672, -0.03415489196777344, -0.032982826232910156, -0.031810760498046875, -0.030638694763183594, -0.029466629028320312, -0.02829456329345703, -0.02712249755859375, -0.02595043182373047, -0.024778366088867188, -0.023606300354003906, -0.022434234619140625, -0.021262168884277344, -0.020090103149414062, -0.01891803741455078, -0.0177459716796875, -0.01657390594482422, -0.015401840209960938, -0.014229774475097656, -0.013057708740234375, -0.011885643005371094, -0.010713577270507812, -0.009541511535644531, -0.00836944580078125, -0.007197380065917969, -0.0060253143310546875, -0.004853248596191406, -0.003681182861328125, -0.0025091171264648438, -0.0013370513916015625, -0.00016498565673828125, 0.001007080078125, 0.0021791458129882812, 0.0033512115478515625, 0.004523277282714844, 0.005695343017578125, 0.006867408752441406, 0.008039474487304688, 0.009211540222167969, 0.01038360595703125, 0.011555671691894531, 0.012727737426757812, 0.013899803161621094, 0.015071868896484375, 0.016243934631347656, 0.017416000366210938, 0.01858806610107422, 0.0197601318359375, 0.02093219757080078, 0.022104263305664062, 0.023276329040527344, 0.024448394775390625, 0.025620460510253906, 0.026792526245117188, 0.02796459197998047, 0.02913665771484375, 0.03030872344970703, 0.03148078918457031, 0.032652854919433594, 0.033824920654296875, 0.034996986389160156, 0.03616905212402344, 0.03734111785888672, 0.03851318359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 13.0, 7.0, 15.0, 28.0, 32.0, 36.0, 51.0, 98.0, 176.0, 286.0, 538.0, 1150.0, 3573.0, 25684.0, 553225.0, 435780.0, 22215.0, 3398.0, 1092.0, 473.0, 229.0, 153.0, 105.0, 56.0, 49.0, 29.0, 20.0, 10.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.163818359375, -0.15961456298828125, -0.1554107666015625, -0.15120697021484375, -0.147003173828125, -0.14279937744140625, -0.1385955810546875, -0.13439178466796875, -0.13018798828125, -0.12598419189453125, -0.1217803955078125, -0.11757659912109375, -0.113372802734375, -0.10916900634765625, -0.1049652099609375, -0.10076141357421875, -0.0965576171875, -0.09235382080078125, -0.0881500244140625, -0.08394622802734375, -0.079742431640625, -0.07553863525390625, -0.0713348388671875, -0.06713104248046875, -0.06292724609375, -0.05872344970703125, -0.0545196533203125, -0.05031585693359375, -0.046112060546875, -0.04190826416015625, -0.0377044677734375, -0.03350067138671875, -0.029296875, -0.02509307861328125, -0.0208892822265625, -0.01668548583984375, -0.012481689453125, -0.00827789306640625, -0.0040740966796875, 0.00012969970703125, 0.00433349609375, 0.00853729248046875, 0.0127410888671875, 0.01694488525390625, 0.021148681640625, 0.02535247802734375, 0.0295562744140625, 0.03376007080078125, 0.0379638671875, 0.04216766357421875, 0.0463714599609375, 0.05057525634765625, 0.054779052734375, 0.05898284912109375, 0.0631866455078125, 0.06739044189453125, 0.07159423828125, 0.07579803466796875, 0.0800018310546875, 0.08420562744140625, 0.088409423828125, 0.09261322021484375, 0.0968170166015625, 0.10102081298828125, 0.105224609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 9.0, 6.0, 5.0, 16.0, 13.0, 15.0, 19.0, 17.0, 31.0, 14.0, 45.0, 42.0, 41.0, 48.0, 36.0, 37.0, 51.0, 51.0, 51.0, 51.0, 53.0, 41.0, 52.0, 36.0, 44.0, 32.0, 28.0, 24.0, 17.0, 14.0, 13.0, 12.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.1297130584716797, -0.12539291381835938, -0.12107276916503906, -0.11675262451171875, -0.11243247985839844, -0.10811233520507812, -0.10379219055175781, -0.0994720458984375, -0.09515190124511719, -0.09083175659179688, -0.08651161193847656, -0.08219146728515625, -0.07787132263183594, -0.07355117797851562, -0.06923103332519531, -0.064910888671875, -0.06059074401855469, -0.056270599365234375, -0.05195045471191406, -0.04763031005859375, -0.04331016540527344, -0.038990020751953125, -0.03466987609863281, -0.0303497314453125, -0.026029586791992188, -0.021709442138671875, -0.017389297485351562, -0.01306915283203125, -0.008749008178710938, -0.004428863525390625, -0.0001087188720703125, 0.00421142578125, 0.008531570434570312, 0.012851715087890625, 0.017171859741210938, 0.02149200439453125, 0.025812149047851562, 0.030132293701171875, 0.03445243835449219, 0.0387725830078125, 0.04309272766113281, 0.047412872314453125, 0.05173301696777344, 0.05605316162109375, 0.06037330627441406, 0.06469345092773438, 0.06901359558105469, 0.073333740234375, 0.07765388488769531, 0.08197402954101562, 0.08629417419433594, 0.09061431884765625, 0.09493446350097656, 0.09925460815429688, 0.10357475280761719, 0.1078948974609375, 0.11221504211425781, 0.11653518676757812, 0.12085533142089844, 0.12517547607421875, 0.12949562072753906, 0.13381576538085938, 0.1381359100341797, 0.1424560546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 8.0, 4.0, 7.0, 9.0, 10.0, 23.0, 23.0, 25.0, 47.0, 68.0, 89.0, 131.0, 171.0, 276.0, 403.0, 664.0, 1193.0, 2227.0, 4924.0, 13972.0, 71540.0, 671337.0, 236776.0, 29131.0, 8106.0, 3344.0, 1574.0, 896.0, 505.0, 313.0, 229.0, 165.0, 107.0, 61.0, 48.0, 33.0, 24.0, 15.0, 17.0, 12.0, 10.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.033477783203125, -0.03242349624633789, -0.03136920928955078, -0.030314922332763672, -0.029260635375976562, -0.028206348419189453, -0.027152061462402344, -0.026097774505615234, -0.025043487548828125, -0.023989200592041016, -0.022934913635253906, -0.021880626678466797, -0.020826339721679688, -0.019772052764892578, -0.01871776580810547, -0.01766347885131836, -0.01660919189453125, -0.01555490493774414, -0.014500617980957031, -0.013446331024169922, -0.012392044067382812, -0.011337757110595703, -0.010283470153808594, -0.009229183197021484, -0.008174896240234375, -0.007120609283447266, -0.006066322326660156, -0.005012035369873047, -0.0039577484130859375, -0.002903461456298828, -0.0018491744995117188, -0.0007948875427246094, 0.0002593994140625, 0.0013136863708496094, 0.0023679733276367188, 0.003422260284423828, 0.0044765472412109375, 0.005530834197998047, 0.006585121154785156, 0.007639408111572266, 0.008693695068359375, 0.009747982025146484, 0.010802268981933594, 0.011856555938720703, 0.012910842895507812, 0.013965129852294922, 0.015019416809082031, 0.01607370376586914, 0.01712799072265625, 0.01818227767944336, 0.01923656463623047, 0.020290851593017578, 0.021345138549804688, 0.022399425506591797, 0.023453712463378906, 0.024507999420166016, 0.025562286376953125, 0.026616573333740234, 0.027670860290527344, 0.028725147247314453, 0.029779434204101562, 0.030833721160888672, 0.03188800811767578, 0.03294229507446289, 0.03399658203125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 13.0, 12.0, 25.0, 38.0, 73.0, 108.0, 170.0, 144.0, 150.0, 108.0, 60.0, 36.0, 21.0, 10.0, 5.0, 6.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6033649444580078e-05, -1.5469267964363098e-05, -1.4904886484146118e-05, -1.4340505003929138e-05, -1.3776123523712158e-05, -1.3211742043495178e-05, -1.2647360563278198e-05, -1.2082979083061218e-05, -1.1518597602844238e-05, -1.0954216122627258e-05, -1.0389834642410278e-05, -9.825453162193298e-06, -9.261071681976318e-06, -8.696690201759338e-06, -8.132308721542358e-06, -7.567927241325378e-06, -7.0035457611083984e-06, -6.4391642808914185e-06, -5.8747828006744385e-06, -5.3104013204574585e-06, -4.7460198402404785e-06, -4.1816383600234985e-06, -3.6172568798065186e-06, -3.0528753995895386e-06, -2.4884939193725586e-06, -1.9241124391555786e-06, -1.3597309589385986e-06, -7.953494787216187e-07, -2.3096799850463867e-07, 3.334134817123413e-07, 8.977949619293213e-07, 1.4621764421463013e-06, 2.0265579223632812e-06, 2.5909394025802612e-06, 3.155320882797241e-06, 3.719702363014221e-06, 4.284083843231201e-06, 4.848465323448181e-06, 5.412846803665161e-06, 5.977228283882141e-06, 6.541609764099121e-06, 7.105991244316101e-06, 7.670372724533081e-06, 8.234754204750061e-06, 8.799135684967041e-06, 9.363517165184021e-06, 9.927898645401001e-06, 1.0492280125617981e-05, 1.1056661605834961e-05, 1.1621043086051941e-05, 1.2185424566268921e-05, 1.2749806046485901e-05, 1.3314187526702881e-05, 1.387856900691986e-05, 1.444295048713684e-05, 1.500733196735382e-05, 1.55717134475708e-05, 1.613609492778778e-05, 1.670047640800476e-05, 1.726485788822174e-05, 1.782923936843872e-05, 1.83936208486557e-05, 1.895800232887268e-05, 1.952238380908966e-05, 2.008676528930664e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 9.0, 4.0, 11.0, 6.0, 27.0, 21.0, 42.0, 54.0, 74.0, 138.0, 212.0, 380.0, 822.0, 1794.0, 5034.0, 20442.0, 178971.0, 729875.0, 90790.0, 13283.0, 3669.0, 1437.0, 617.0, 345.0, 178.0, 113.0, 60.0, 43.0, 29.0, 20.0, 13.0, 9.0, 8.0, 10.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.037872314453125, -0.03670215606689453, -0.03553199768066406, -0.034361839294433594, -0.033191680908203125, -0.032021522521972656, -0.030851364135742188, -0.02968120574951172, -0.02851104736328125, -0.02734088897705078, -0.026170730590820312, -0.025000572204589844, -0.023830413818359375, -0.022660255432128906, -0.021490097045898438, -0.02031993865966797, -0.0191497802734375, -0.01797962188720703, -0.016809463500976562, -0.015639305114746094, -0.014469146728515625, -0.013298988342285156, -0.012128829956054688, -0.010958671569824219, -0.00978851318359375, -0.008618354797363281, -0.0074481964111328125, -0.006278038024902344, -0.005107879638671875, -0.003937721252441406, -0.0027675628662109375, -0.0015974044799804688, -0.00042724609375, 0.0007429122924804688, 0.0019130706787109375, 0.0030832290649414062, 0.004253387451171875, 0.005423545837402344, 0.0065937042236328125, 0.007763862609863281, 0.00893402099609375, 0.010104179382324219, 0.011274337768554688, 0.012444496154785156, 0.013614654541015625, 0.014784812927246094, 0.015954971313476562, 0.01712512969970703, 0.0182952880859375, 0.01946544647216797, 0.020635604858398438, 0.021805763244628906, 0.022975921630859375, 0.024146080017089844, 0.025316238403320312, 0.02648639678955078, 0.02765655517578125, 0.02882671356201172, 0.029996871948242188, 0.031167030334472656, 0.032337188720703125, 0.033507347106933594, 0.03467750549316406, 0.03584766387939453, 0.037017822265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 6.0, 8.0, 5.0, 10.0, 10.0, 17.0, 21.0, 26.0, 19.0, 34.0, 38.0, 51.0, 48.0, 64.0, 55.0, 54.0, 53.0, 72.0, 54.0, 55.0, 41.0, 39.0, 35.0, 31.0, 35.0, 30.0, 14.0, 10.0, 15.0, 8.0, 6.0, 11.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0302734375, -0.029396533966064453, -0.028519630432128906, -0.02764272689819336, -0.026765823364257812, -0.025888919830322266, -0.02501201629638672, -0.024135112762451172, -0.023258209228515625, -0.022381305694580078, -0.02150440216064453, -0.020627498626708984, -0.019750595092773438, -0.01887369155883789, -0.017996788024902344, -0.017119884490966797, -0.01624298095703125, -0.015366077423095703, -0.014489173889160156, -0.01361227035522461, -0.012735366821289062, -0.011858463287353516, -0.010981559753417969, -0.010104656219482422, -0.009227752685546875, -0.008350849151611328, -0.007473945617675781, -0.006597042083740234, -0.0057201385498046875, -0.004843235015869141, -0.003966331481933594, -0.003089427947998047, -0.0022125244140625, -0.0013356208801269531, -0.00045871734619140625, 0.0004181861877441406, 0.0012950897216796875, 0.0021719932556152344, 0.0030488967895507812, 0.003925800323486328, 0.004802703857421875, 0.005679607391357422, 0.006556510925292969, 0.007433414459228516, 0.008310317993164062, 0.00918722152709961, 0.010064125061035156, 0.010941028594970703, 0.01181793212890625, 0.012694835662841797, 0.013571739196777344, 0.01444864273071289, 0.015325546264648438, 0.016202449798583984, 0.01707935333251953, 0.017956256866455078, 0.018833160400390625, 0.019710063934326172, 0.02058696746826172, 0.021463871002197266, 0.022340774536132812, 0.02321767807006836, 0.024094581604003906, 0.024971485137939453, 0.025848388671875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 9.0, 22.0, 53.0, 222.0, 378.0, 224.0, 59.0, 15.0, 9.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8675267696380615, -1.8201826810836792, -1.7728385925292969, -1.7254945039749146, -1.6781504154205322, -1.63080632686615, -1.5834622383117676, -1.5361181497573853, -1.488774061203003, -1.4414299726486206, -1.3940858840942383, -1.346741795539856, -1.2993977069854736, -1.2520536184310913, -1.204709529876709, -1.1573654413223267, -1.1100213527679443, -1.062677264213562, -1.0153331756591797, -0.9679890871047974, -0.920644998550415, -0.8733009099960327, -0.8259568214416504, -0.7786127328872681, -0.7312687635421753, -0.683924674987793, -0.6365805864334106, -0.5892364978790283, -0.541892409324646, -0.49454832077026367, -0.44720426201820374, -0.3998601734638214, -0.3525160551071167, -0.3051719665527344, -0.25782787799835205, -0.21048380434513092, -0.1631397157907486, -0.11579562723636627, -0.06845155358314514, -0.021107465028762817, 0.026236623525619507, 0.07358071208000183, 0.12092479318380356, 0.16826887428760529, 0.2156129628419876, 0.26295703649520874, 0.31030112504959106, 0.3576452136039734, 0.4049893021583557, 0.45233339071273804, 0.49967747926712036, 0.5470215678215027, 0.594365656375885, 0.6417097449302673, 0.6890537738800049, 0.7363978624343872, 0.7837419509887695, 0.8310860395431519, 0.8784301280975342, 0.9257742166519165, 0.9731183052062988, 1.0204623937606812, 1.0678064823150635, 1.1151505708694458, 1.1624946594238281]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 5.0, 5.0, 9.0, 12.0, 11.0, 14.0, 24.0, 31.0, 23.0, 31.0, 46.0, 36.0, 52.0, 45.0, 39.0, 57.0, 72.0, 67.0, 59.0, 47.0, 42.0, 44.0, 40.0, 40.0, 28.0, 26.0, 20.0, 27.0, 12.0, 16.0, 11.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.595794141292572, -0.5758812427520752, -0.5559683442115784, -0.5360554456710815, -0.5161425471305847, -0.4962296485900879, -0.47631675004959106, -0.45640385150909424, -0.4364909529685974, -0.4165780544281006, -0.39666515588760376, -0.37675225734710693, -0.3568393588066101, -0.3369264602661133, -0.31701356172561646, -0.29710066318511963, -0.2771877646446228, -0.257274866104126, -0.23736196756362915, -0.21744906902313232, -0.1975361704826355, -0.17762327194213867, -0.15771037340164185, -0.13779747486114502, -0.1178845763206482, -0.09797167778015137, -0.07805877923965454, -0.058145880699157715, -0.03823298215866089, -0.018320083618164062, 0.0015928149223327637, 0.02150571346282959, 0.04141855239868164, 0.06133145093917847, 0.08124434947967529, 0.10115724802017212, 0.12107014656066895, 0.14098304510116577, 0.1608959436416626, 0.18080884218215942, 0.20072174072265625, 0.22063463926315308, 0.2405475378036499, 0.26046043634414673, 0.28037333488464355, 0.3002862334251404, 0.3201991319656372, 0.34011203050613403, 0.36002492904663086, 0.3799378275871277, 0.3998507261276245, 0.41976362466812134, 0.43967652320861816, 0.459589421749115, 0.4795023202896118, 0.49941521883010864, 0.5193281173706055, 0.5392410159111023, 0.5591539144515991, 0.579066812992096, 0.5989797115325928, 0.6188926100730896, 0.6388055086135864, 0.6587184071540833, 0.6786313056945801]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 5.0, 8.0, 13.0, 10.0, 14.0, 32.0, 52.0, 72.0, 123.0, 192.0, 329.0, 3844.0, 4187925.0, 908.0, 287.0, 167.0, 101.0, 72.0, 44.0, 26.0, 17.0, 15.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6826171875, -0.6585311889648438, -0.6344451904296875, -0.6103591918945312, -0.586273193359375, -0.5621871948242188, -0.5381011962890625, -0.5140151977539062, -0.48992919921875, -0.46584320068359375, -0.4417572021484375, -0.41767120361328125, -0.393585205078125, -0.36949920654296875, -0.3454132080078125, -0.32132720947265625, -0.2972412109375, -0.27315521240234375, -0.2490692138671875, -0.22498321533203125, -0.200897216796875, -0.17681121826171875, -0.1527252197265625, -0.12863922119140625, -0.10455322265625, -0.08046722412109375, -0.0563812255859375, -0.03229522705078125, -0.008209228515625, 0.01587677001953125, 0.0399627685546875, 0.06404876708984375, 0.088134765625, 0.11222076416015625, 0.1363067626953125, 0.16039276123046875, 0.184478759765625, 0.20856475830078125, 0.2326507568359375, 0.25673675537109375, 0.28082275390625, 0.30490875244140625, 0.3289947509765625, 0.35308074951171875, 0.377166748046875, 0.40125274658203125, 0.4253387451171875, 0.44942474365234375, 0.4735107421875, 0.49759674072265625, 0.5216827392578125, 0.5457687377929688, 0.569854736328125, 0.5939407348632812, 0.6180267333984375, 0.6421127319335938, 0.66619873046875, 0.6902847290039062, 0.7143707275390625, 0.7384567260742188, 0.762542724609375, 0.7866287231445312, 0.8107147216796875, 0.8348007202148438, 0.85888671875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 7.0, 22.0, 26.0, 46.0, 62.0, 58.0, 98.0, 84.0, 109.0, 108.0, 72.0, 80.0, 62.0, 49.0, 29.0, 21.0, 22.0, 17.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037017822265625, -0.03494977951049805, -0.032881736755371094, -0.03081369400024414, -0.028745651245117188, -0.026677608489990234, -0.02460956573486328, -0.022541522979736328, -0.020473480224609375, -0.018405437469482422, -0.01633739471435547, -0.014269351959228516, -0.012201309204101562, -0.01013326644897461, -0.008065223693847656, -0.005997180938720703, -0.00392913818359375, -0.0018610954284667969, 0.00020694732666015625, 0.0022749900817871094, 0.0043430328369140625, 0.006411075592041016, 0.008479118347167969, 0.010547161102294922, 0.012615203857421875, 0.014683246612548828, 0.01675128936767578, 0.018819332122802734, 0.020887374877929688, 0.02295541763305664, 0.025023460388183594, 0.027091503143310547, 0.0291595458984375, 0.031227588653564453, 0.033295631408691406, 0.03536367416381836, 0.03743171691894531, 0.039499759674072266, 0.04156780242919922, 0.04363584518432617, 0.045703887939453125, 0.04777193069458008, 0.04983997344970703, 0.051908016204833984, 0.05397605895996094, 0.05604410171508789, 0.058112144470214844, 0.0601801872253418, 0.06224822998046875, 0.0643162727355957, 0.06638431549072266, 0.06845235824584961, 0.07052040100097656, 0.07258844375610352, 0.07465648651123047, 0.07672452926635742, 0.07879257202148438, 0.08086061477661133, 0.08292865753173828, 0.08499670028686523, 0.08706474304199219, 0.08913278579711914, 0.0912008285522461, 0.09326887130737305, 0.0953369140625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 12.0, 20.0, 51.0, 62.0, 143.0, 330.0, 731.0, 1921.0, 6038.0, 26202.0, 294293.0, 3745207.0, 98632.0, 15256.0, 3551.0, 1050.0, 379.0, 178.0, 74.0, 51.0, 28.0, 20.0, 12.0, 10.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07684326171875, -0.07380962371826172, -0.07077598571777344, -0.06774234771728516, -0.06470870971679688, -0.061675071716308594, -0.05864143371582031, -0.05560779571533203, -0.05257415771484375, -0.04954051971435547, -0.04650688171386719, -0.043473243713378906, -0.040439605712890625, -0.037405967712402344, -0.03437232971191406, -0.03133869171142578, -0.0283050537109375, -0.02527141571044922, -0.022237777709960938, -0.019204139709472656, -0.016170501708984375, -0.013136863708496094, -0.010103225708007812, -0.007069587707519531, -0.00403594970703125, -0.0010023117065429688, 0.0020313262939453125, 0.005064964294433594, 0.008098602294921875, 0.011132240295410156, 0.014165878295898438, 0.01719951629638672, 0.020233154296875, 0.02326679229736328, 0.026300430297851562, 0.029334068298339844, 0.032367706298828125, 0.035401344299316406, 0.03843498229980469, 0.04146862030029297, 0.04450225830078125, 0.04753589630126953, 0.05056953430175781, 0.053603172302246094, 0.056636810302734375, 0.059670448303222656, 0.06270408630371094, 0.06573772430419922, 0.0687713623046875, 0.07180500030517578, 0.07483863830566406, 0.07787227630615234, 0.08090591430664062, 0.0839395523071289, 0.08697319030761719, 0.09000682830810547, 0.09304046630859375, 0.09607410430908203, 0.09910774230957031, 0.1021413803100586, 0.10517501831054688, 0.10820865631103516, 0.11124229431152344, 0.11427593231201172, 0.1173095703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 8.0, 9.0, 7.0, 6.0, 13.0, 16.0, 12.0, 22.0, 34.0, 48.0, 91.0, 173.0, 374.0, 755.0, 1141.0, 660.0, 284.0, 160.0, 72.0, 52.0, 20.0, 20.0, 18.0, 11.0, 13.0, 7.0, 9.0, 10.0, 6.0, 1.0, 3.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07989501953125, -0.07786703109741211, -0.07583904266357422, -0.07381105422973633, -0.07178306579589844, -0.06975507736206055, -0.06772708892822266, -0.06569910049438477, -0.06367111206054688, -0.061643123626708984, -0.059615135192871094, -0.0575871467590332, -0.05555915832519531, -0.05353116989135742, -0.05150318145751953, -0.04947519302368164, -0.04744720458984375, -0.04541921615600586, -0.04339122772216797, -0.04136323928833008, -0.03933525085449219, -0.0373072624206543, -0.035279273986816406, -0.033251285552978516, -0.031223297119140625, -0.029195308685302734, -0.027167320251464844, -0.025139331817626953, -0.023111343383789062, -0.021083354949951172, -0.01905536651611328, -0.01702737808227539, -0.0149993896484375, -0.01297140121459961, -0.010943412780761719, -0.008915424346923828, -0.0068874359130859375, -0.004859447479248047, -0.0028314590454101562, -0.0008034706115722656, 0.001224517822265625, 0.0032525062561035156, 0.005280494689941406, 0.007308483123779297, 0.009336471557617188, 0.011364459991455078, 0.013392448425292969, 0.01542043685913086, 0.01744842529296875, 0.01947641372680664, 0.02150440216064453, 0.023532390594482422, 0.025560379028320312, 0.027588367462158203, 0.029616355895996094, 0.031644344329833984, 0.033672332763671875, 0.035700321197509766, 0.037728309631347656, 0.03975629806518555, 0.04178428649902344, 0.04381227493286133, 0.04584026336669922, 0.04786825180053711, 0.049896240234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 15.0, 26.0, 50.0, 97.0, 141.0, 179.0, 154.0, 132.0, 64.0, 48.0, 36.0, 16.0, 9.0, 6.0, 3.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28014251589775085, -0.2633552551269531, -0.2465679794549942, -0.22978070378303528, -0.21299344301223755, -0.19620616734027863, -0.1794188916683197, -0.16263163089752197, -0.14584435522556305, -0.12905707955360413, -0.1122698187828064, -0.09548254311084747, -0.07869527488946915, -0.06190800666809082, -0.0451207309961319, -0.02833346277475357, -0.011546194553375244, 0.0052410755306482315, 0.022028345614671707, 0.03881561756134033, 0.05560288578271866, 0.07239015400409698, 0.08917742967605591, 0.10596469789743423, 0.12275196611881256, 0.13953924179077148, 0.1563265025615692, 0.17311377823352814, 0.18990105390548706, 0.2066883146762848, 0.2234755903482437, 0.24026286602020264, 0.25705015659332275, 0.2738374173641205, 0.2906247079372406, 0.30741196870803833, 0.32419922947883606, 0.3409864902496338, 0.3577737808227539, 0.37456104159355164, 0.39134830236434937, 0.4081355631351471, 0.4249228537082672, 0.44171011447906494, 0.45849737524986267, 0.4752846360206604, 0.4920719265937805, 0.5088592171669006, 0.525646448135376, 0.5424337387084961, 0.5592209696769714, 0.5760082602500916, 0.5927955508232117, 0.609582781791687, 0.6263700723648071, 0.6431573629379272, 0.6599446535110474, 0.6767319440841675, 0.6935191750526428, 0.7103064656257629, 0.7270937561988831, 0.7438809871673584, 0.7606682777404785, 0.7774555683135986, 0.794242799282074]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 16.0, 10.0, 14.0, 15.0, 23.0, 27.0, 35.0, 22.0, 33.0, 57.0, 49.0, 47.0, 39.0, 58.0, 43.0, 57.0, 58.0, 70.0, 36.0, 44.0, 32.0, 42.0, 25.0, 20.0, 22.0, 7.0, 17.0, 7.0, 11.0, 7.0, 14.0, 5.0, 9.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.3658565282821655, -0.35613828897476196, -0.3464200496673584, -0.3367018401622772, -0.32698360085487366, -0.3172653615474701, -0.3075471520423889, -0.29782891273498535, -0.2881106734275818, -0.2783924341201782, -0.26867419481277466, -0.2589559853076935, -0.24923774600028992, -0.23951950669288635, -0.22980128228664398, -0.2200830578804016, -0.21036481857299805, -0.20064657926559448, -0.1909283548593521, -0.18121013045310974, -0.17149189114570618, -0.1617736518383026, -0.15205542743206024, -0.14233720302581787, -0.1326189637184143, -0.12290073186159134, -0.11318250000476837, -0.1034642681479454, -0.09374603629112244, -0.08402780443429947, -0.0743095725774765, -0.06459134072065353, -0.054873108863830566, -0.0451548770070076, -0.03543664515018463, -0.025718413293361664, -0.016000181436538696, -0.006281949579715729, 0.0034362822771072388, 0.013154514133930206, 0.022872745990753174, 0.03259097784757614, 0.04230920970439911, 0.052027441561222076, 0.061745673418045044, 0.07146390527486801, 0.08118213713169098, 0.09090036898851395, 0.10061860084533691, 0.11033683270215988, 0.12005506455898285, 0.12977328896522522, 0.13949152827262878, 0.14920976758003235, 0.15892799198627472, 0.1686462163925171, 0.17836445569992065, 0.18808269500732422, 0.1978009194135666, 0.20751914381980896, 0.21723738312721252, 0.2269556224346161, 0.23667384684085846, 0.24639207124710083, 0.2561103105545044]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 9.0, 8.0, 6.0, 10.0, 17.0, 22.0, 30.0, 38.0, 105.0, 109.0, 213.0, 432.0, 867.0, 1815.0, 4620.0, 12929.0, 40728.0, 137383.0, 358499.0, 324814.0, 113936.0, 33671.0, 10839.0, 4103.0, 1676.0, 758.0, 396.0, 223.0, 113.0, 62.0, 40.0, 25.0, 17.0, 14.0, 11.0, 9.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055511474609375, -0.053369998931884766, -0.05122852325439453, -0.0490870475769043, -0.04694557189941406, -0.04480409622192383, -0.042662620544433594, -0.04052114486694336, -0.038379669189453125, -0.03623819351196289, -0.034096717834472656, -0.03195524215698242, -0.029813766479492188, -0.027672290802001953, -0.02553081512451172, -0.023389339447021484, -0.02124786376953125, -0.019106388092041016, -0.01696491241455078, -0.014823436737060547, -0.012681961059570312, -0.010540485382080078, -0.008399009704589844, -0.006257534027099609, -0.004116058349609375, -0.0019745826721191406, 0.00016689300537109375, 0.002308368682861328, 0.0044498443603515625, 0.006591320037841797, 0.008732795715332031, 0.010874271392822266, 0.0130157470703125, 0.015157222747802734, 0.01729869842529297, 0.019440174102783203, 0.021581649780273438, 0.023723125457763672, 0.025864601135253906, 0.02800607681274414, 0.030147552490234375, 0.03228902816772461, 0.034430503845214844, 0.03657197952270508, 0.03871345520019531, 0.04085493087768555, 0.04299640655517578, 0.045137882232666016, 0.04727935791015625, 0.049420833587646484, 0.05156230926513672, 0.05370378494262695, 0.05584526062011719, 0.05798673629760742, 0.060128211975097656, 0.06226968765258789, 0.06441116333007812, 0.06655263900756836, 0.0686941146850586, 0.07083559036254883, 0.07297706604003906, 0.0751185417175293, 0.07726001739501953, 0.07940149307250977, 0.08154296875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 6.0, 5.0, 11.0, 9.0, 21.0, 18.0, 31.0, 20.0, 35.0, 33.0, 43.0, 56.0, 67.0, 57.0, 58.0, 53.0, 56.0, 53.0, 63.0, 50.0, 39.0, 34.0, 26.0, 29.0, 22.0, 25.0, 18.0, 13.0, 15.0, 8.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035552978515625, -0.034316062927246094, -0.03307914733886719, -0.03184223175048828, -0.030605316162109375, -0.02936840057373047, -0.028131484985351562, -0.026894569396972656, -0.02565765380859375, -0.024420738220214844, -0.023183822631835938, -0.02194690704345703, -0.020709991455078125, -0.01947307586669922, -0.018236160278320312, -0.016999244689941406, -0.0157623291015625, -0.014525413513183594, -0.013288497924804688, -0.012051582336425781, -0.010814666748046875, -0.009577751159667969, -0.008340835571289062, -0.007103919982910156, -0.00586700439453125, -0.004630088806152344, -0.0033931732177734375, -0.0021562576293945312, -0.000919342041015625, 0.00031757354736328125, 0.0015544891357421875, 0.0027914047241210938, 0.0040283203125, 0.005265235900878906, 0.0065021514892578125, 0.007739067077636719, 0.008975982666015625, 0.010212898254394531, 0.011449813842773438, 0.012686729431152344, 0.01392364501953125, 0.015160560607910156, 0.016397476196289062, 0.01763439178466797, 0.018871307373046875, 0.02010822296142578, 0.021345138549804688, 0.022582054138183594, 0.0238189697265625, 0.025055885314941406, 0.026292800903320312, 0.02752971649169922, 0.028766632080078125, 0.03000354766845703, 0.031240463256835938, 0.032477378845214844, 0.03371429443359375, 0.034951210021972656, 0.03618812561035156, 0.03742504119873047, 0.038661956787109375, 0.03989887237548828, 0.04113578796386719, 0.042372703552246094, 0.043609619140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 1.0, 4.0, 7.0, 8.0, 4.0, 9.0, 15.0, 23.0, 48.0, 58.0, 119.0, 261.0, 547.0, 1472.0, 6009.0, 47484.0, 634098.0, 327799.0, 24600.0, 4038.0, 1036.0, 472.0, 186.0, 99.0, 65.0, 36.0, 18.0, 15.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.12827301025390625, -0.1239776611328125, -0.11968231201171875, -0.115386962890625, -0.11109161376953125, -0.1067962646484375, -0.10250091552734375, -0.09820556640625, -0.09391021728515625, -0.0896148681640625, -0.08531951904296875, -0.081024169921875, -0.07672882080078125, -0.0724334716796875, -0.06813812255859375, -0.0638427734375, -0.05954742431640625, -0.0552520751953125, -0.05095672607421875, -0.046661376953125, -0.04236602783203125, -0.0380706787109375, -0.03377532958984375, -0.02947998046875, -0.02518463134765625, -0.0208892822265625, -0.01659393310546875, -0.012298583984375, -0.00800323486328125, -0.0037078857421875, 0.00058746337890625, 0.0048828125, 0.00917816162109375, 0.0134735107421875, 0.01776885986328125, 0.022064208984375, 0.02635955810546875, 0.0306549072265625, 0.03495025634765625, 0.03924560546875, 0.04354095458984375, 0.0478363037109375, 0.05213165283203125, 0.056427001953125, 0.06072235107421875, 0.0650177001953125, 0.06931304931640625, 0.0736083984375, 0.07790374755859375, 0.0821990966796875, 0.08649444580078125, 0.090789794921875, 0.09508514404296875, 0.0993804931640625, 0.10367584228515625, 0.10797119140625, 0.11226654052734375, 0.1165618896484375, 0.12085723876953125, 0.125152587890625, 0.12944793701171875, 0.1337432861328125, 0.13803863525390625, 0.142333984375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 8.0, 6.0, 7.0, 4.0, 9.0, 14.0, 9.0, 11.0, 22.0, 24.0, 29.0, 30.0, 18.0, 28.0, 38.0, 32.0, 35.0, 46.0, 42.0, 35.0, 45.0, 53.0, 38.0, 48.0, 40.0, 27.0, 34.0, 49.0, 25.0, 35.0, 19.0, 14.0, 24.0, 14.0, 18.0, 17.0, 9.0, 9.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0989990234375, -0.09574604034423828, -0.09249305725097656, -0.08924007415771484, -0.08598709106445312, -0.0827341079711914, -0.07948112487792969, -0.07622814178466797, -0.07297515869140625, -0.06972217559814453, -0.06646919250488281, -0.0632162094116211, -0.059963226318359375, -0.056710243225097656, -0.05345726013183594, -0.05020427703857422, -0.0469512939453125, -0.04369831085205078, -0.04044532775878906, -0.037192344665527344, -0.033939361572265625, -0.030686378479003906, -0.027433395385742188, -0.02418041229248047, -0.02092742919921875, -0.01767444610595703, -0.014421463012695312, -0.011168479919433594, -0.007915496826171875, -0.004662513732910156, -0.0014095306396484375, 0.0018434524536132812, 0.005096435546875, 0.008349418640136719, 0.011602401733398438, 0.014855384826660156, 0.018108367919921875, 0.021361351013183594, 0.024614334106445312, 0.02786731719970703, 0.03112030029296875, 0.03437328338623047, 0.03762626647949219, 0.040879249572753906, 0.044132232666015625, 0.047385215759277344, 0.05063819885253906, 0.05389118194580078, 0.0571441650390625, 0.06039714813232422, 0.06365013122558594, 0.06690311431884766, 0.07015609741210938, 0.0734090805053711, 0.07666206359863281, 0.07991504669189453, 0.08316802978515625, 0.08642101287841797, 0.08967399597167969, 0.0929269790649414, 0.09617996215820312, 0.09943294525146484, 0.10268592834472656, 0.10593891143798828, 0.10919189453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 4.0, 15.0, 21.0, 23.0, 39.0, 60.0, 74.0, 159.0, 332.0, 736.0, 2323.0, 12422.0, 938508.0, 86181.0, 5224.0, 1304.0, 505.0, 256.0, 134.0, 70.0, 47.0, 35.0, 28.0, 21.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.182861328125, -0.17691993713378906, -0.17097854614257812, -0.1650371551513672, -0.15909576416015625, -0.1531543731689453, -0.14721298217773438, -0.14127159118652344, -0.1353302001953125, -0.12938880920410156, -0.12344741821289062, -0.11750602722167969, -0.11156463623046875, -0.10562324523925781, -0.09968185424804688, -0.09374046325683594, -0.087799072265625, -0.08185768127441406, -0.07591629028320312, -0.06997489929199219, -0.06403350830078125, -0.05809211730957031, -0.052150726318359375, -0.04620933532714844, -0.0402679443359375, -0.03432655334472656, -0.028385162353515625, -0.022443771362304688, -0.01650238037109375, -0.010560989379882812, -0.004619598388671875, 0.0013217926025390625, 0.00726318359375, 0.013204574584960938, 0.019145965576171875, 0.025087356567382812, 0.03102874755859375, 0.03697013854980469, 0.042911529541015625, 0.04885292053222656, 0.0547943115234375, 0.06073570251464844, 0.06667709350585938, 0.07261848449707031, 0.07855987548828125, 0.08450126647949219, 0.09044265747070312, 0.09638404846191406, 0.102325439453125, 0.10826683044433594, 0.11420822143554688, 0.12014961242675781, 0.12609100341796875, 0.1320323944091797, 0.13797378540039062, 0.14391517639160156, 0.1498565673828125, 0.15579795837402344, 0.16173934936523438, 0.1676807403564453, 0.17362213134765625, 0.1795635223388672, 0.18550491333007812, 0.19144630432128906, 0.1973876953125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 10.0, 24.0, 98.0, 500.0, 280.0, 60.0, 7.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.775161743164062e-05, -9.502191096544266e-05, -9.229220449924469e-05, -8.956249803304672e-05, -8.683279156684875e-05, -8.410308510065079e-05, -8.137337863445282e-05, -7.864367216825485e-05, -7.591396570205688e-05, -7.318425923585892e-05, -7.045455276966095e-05, -6.772484630346298e-05, -6.499513983726501e-05, -6.226543337106705e-05, -5.953572690486908e-05, -5.680602043867111e-05, -5.4076313972473145e-05, -5.134660750627518e-05, -4.861690104007721e-05, -4.588719457387924e-05, -4.3157488107681274e-05, -4.042778164148331e-05, -3.769807517528534e-05, -3.496836870908737e-05, -3.2238662242889404e-05, -2.9508955776691437e-05, -2.677924931049347e-05, -2.4049542844295502e-05, -2.1319836378097534e-05, -1.8590129911899567e-05, -1.58604234457016e-05, -1.3130716979503632e-05, -1.0401010513305664e-05, -7.671304047107697e-06, -4.941597580909729e-06, -2.2118911147117615e-06, 5.178153514862061e-07, 3.2475218176841736e-06, 5.977228283882141e-06, 8.706934750080109e-06, 1.1436641216278076e-05, 1.4166347682476044e-05, 1.689605414867401e-05, 1.962576061487198e-05, 2.2355467081069946e-05, 2.5085173547267914e-05, 2.781488001346588e-05, 3.054458647966385e-05, 3.3274292945861816e-05, 3.6003999412059784e-05, 3.873370587825775e-05, 4.146341234445572e-05, 4.4193118810653687e-05, 4.6922825276851654e-05, 4.965253174304962e-05, 5.238223820924759e-05, 5.511194467544556e-05, 5.7841651141643524e-05, 6.057135760784149e-05, 6.330106407403946e-05, 6.603077054023743e-05, 6.87604770064354e-05, 7.149018347263336e-05, 7.421988993883133e-05, 7.69495964050293e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 9.0, 8.0, 23.0, 21.0, 62.0, 99.0, 231.0, 499.0, 1403.0, 4937.0, 34258.0, 920747.0, 76223.0, 7060.0, 1766.0, 657.0, 227.0, 129.0, 62.0, 32.0, 26.0, 19.0, 14.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.131103515625, -0.12731647491455078, -0.12352943420410156, -0.11974239349365234, -0.11595535278320312, -0.1121683120727539, -0.10838127136230469, -0.10459423065185547, -0.10080718994140625, -0.09702014923095703, -0.09323310852050781, -0.0894460678100586, -0.08565902709960938, -0.08187198638916016, -0.07808494567871094, -0.07429790496826172, -0.0705108642578125, -0.06672382354736328, -0.06293678283691406, -0.059149742126464844, -0.055362701416015625, -0.051575660705566406, -0.04778861999511719, -0.04400157928466797, -0.04021453857421875, -0.03642749786376953, -0.03264045715332031, -0.028853416442871094, -0.025066375732421875, -0.021279335021972656, -0.017492294311523438, -0.013705253601074219, -0.009918212890625, -0.006131172180175781, -0.0023441314697265625, 0.0014429092407226562, 0.005229949951171875, 0.009016990661621094, 0.012804031372070312, 0.01659107208251953, 0.02037811279296875, 0.02416515350341797, 0.027952194213867188, 0.031739234924316406, 0.035526275634765625, 0.039313316345214844, 0.04310035705566406, 0.04688739776611328, 0.0506744384765625, 0.05446147918701172, 0.05824851989746094, 0.062035560607910156, 0.06582260131835938, 0.0696096420288086, 0.07339668273925781, 0.07718372344970703, 0.08097076416015625, 0.08475780487060547, 0.08854484558105469, 0.0923318862915039, 0.09611892700195312, 0.09990596771240234, 0.10369300842285156, 0.10748004913330078, 0.11126708984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 12.0, 23.0, 31.0, 50.0, 77.0, 100.0, 122.0, 108.0, 124.0, 97.0, 80.0, 53.0, 31.0, 18.0, 18.0, 7.0, 9.0, 6.0, 1.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06597900390625, -0.06382083892822266, -0.06166267395019531, -0.05950450897216797, -0.057346343994140625, -0.05518817901611328, -0.05303001403808594, -0.050871849060058594, -0.04871368408203125, -0.046555519104003906, -0.04439735412597656, -0.04223918914794922, -0.040081024169921875, -0.03792285919189453, -0.03576469421386719, -0.033606529235839844, -0.0314483642578125, -0.029290199279785156, -0.027132034301757812, -0.02497386932373047, -0.022815704345703125, -0.02065753936767578, -0.018499374389648438, -0.016341209411621094, -0.01418304443359375, -0.012024879455566406, -0.009866714477539062, -0.007708549499511719, -0.005550384521484375, -0.0033922195434570312, -0.0012340545654296875, 0.0009241104125976562, 0.003082275390625, 0.005240440368652344, 0.0073986053466796875, 0.009556770324707031, 0.011714935302734375, 0.013873100280761719, 0.016031265258789062, 0.018189430236816406, 0.02034759521484375, 0.022505760192871094, 0.024663925170898438, 0.02682209014892578, 0.028980255126953125, 0.03113842010498047, 0.03329658508300781, 0.035454750061035156, 0.0376129150390625, 0.039771080017089844, 0.04192924499511719, 0.04408740997314453, 0.046245574951171875, 0.04840373992919922, 0.05056190490722656, 0.052720069885253906, 0.05487823486328125, 0.057036399841308594, 0.05919456481933594, 0.06135272979736328, 0.06351089477539062, 0.06566905975341797, 0.06782722473144531, 0.06998538970947266, 0.0721435546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 11.0, 14.0, 41.0, 102.0, 224.0, 330.0, 174.0, 68.0, 18.0, 11.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1976585388183594, -2.1443958282470703, -2.0911331176757812, -2.037870168685913, -1.984607458114624, -1.931344747543335, -1.8780819177627563, -1.8248192071914673, -1.7715563774108887, -1.7182936668395996, -1.665030837059021, -1.611768126487732, -1.5585052967071533, -1.5052425861358643, -1.4519797563552856, -1.3987170457839966, -1.345454216003418, -1.292191505432129, -1.2389286756515503, -1.1856659650802612, -1.1324031352996826, -1.0791404247283936, -1.025877594947815, -0.9726148843765259, -0.9193521738052368, -0.866089403629303, -0.8128266334533691, -0.7595638632774353, -0.7063010931015015, -0.6530383825302124, -0.5997755527496338, -0.5465128421783447, -0.4932500123977661, -0.4399872422218323, -0.38672447204589844, -0.3334617018699646, -0.28019893169403076, -0.2269361913204193, -0.17367342114448547, -0.12041065096855164, -0.0671478807926178, -0.013885114341974258, 0.03937765210866928, 0.09264041483402252, 0.14590318500995636, 0.199165940284729, 0.25242871046066284, 0.3056914806365967, 0.3589542508125305, 0.41221702098846436, 0.4654797911643982, 0.518742561340332, 0.5720053315162659, 0.6252681016921997, 0.6785308122634888, 0.7317936420440674, 0.7850563526153564, 0.8383191227912903, 0.8915818929672241, 0.944844663143158, 0.9981074333190918, 1.0513701438903809, 1.1046329736709595, 1.1578956842422485, 1.2111585140228271]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 1.0, 3.0, 7.0, 7.0, 9.0, 9.0, 13.0, 23.0, 23.0, 21.0, 30.0, 24.0, 41.0, 28.0, 42.0, 51.0, 49.0, 63.0, 61.0, 73.0, 50.0, 59.0, 46.0, 33.0, 40.0, 25.0, 25.0, 24.0, 20.0, 26.0, 12.0, 16.0, 12.0, 12.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5501708388328552, -0.5324216485023499, -0.5146724581718445, -0.4969232976436615, -0.47917410731315613, -0.46142494678497314, -0.4436757564544678, -0.4259265661239624, -0.40817737579345703, -0.39042818546295166, -0.3726790249347687, -0.3549298346042633, -0.33718064427375793, -0.31943148374557495, -0.3016822934150696, -0.2839331030845642, -0.2661839425563812, -0.24843476712703705, -0.23068557679653168, -0.2129364013671875, -0.19518721103668213, -0.17743803560733795, -0.15968886017799377, -0.1419396698474884, -0.12419049441814423, -0.10644131153821945, -0.08869212865829468, -0.0709429532289505, -0.053193770349025726, -0.03544458746910095, -0.017695412039756775, 5.377084016799927e-05, 0.017802953720092773, 0.03555213660001755, 0.05330131575465202, 0.0710504949092865, 0.08879967778921127, 0.10654886066913605, 0.12429803609848022, 0.1420472264289856, 0.15979640185832977, 0.17754557728767395, 0.19529476761817932, 0.2130439430475235, 0.23079311847686768, 0.24854230880737305, 0.2662914991378784, 0.2840406596660614, 0.3017898499965668, 0.31953904032707214, 0.3372882008552551, 0.3550373911857605, 0.37278658151626587, 0.39053577184677124, 0.4082849323749542, 0.4260341227054596, 0.4437832832336426, 0.46153247356414795, 0.47928163409233093, 0.4970308244228363, 0.5147799849510193, 0.5325291752815247, 0.55027836561203, 0.5680275559425354, 0.5857767462730408]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 8.0, 3.0, 4.0, 6.0, 10.0, 20.0, 24.0, 36.0, 42.0, 105.0, 236.0, 671.0, 3504.0, 62274.0, 3929089.0, 190122.0, 6518.0, 972.0, 289.0, 137.0, 84.0, 55.0, 24.0, 15.0, 14.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1474609375, -0.14264678955078125, -0.1378326416015625, -0.13301849365234375, -0.128204345703125, -0.12339019775390625, -0.1185760498046875, -0.11376190185546875, -0.10894775390625, -0.10413360595703125, -0.0993194580078125, -0.09450531005859375, -0.089691162109375, -0.08487701416015625, -0.0800628662109375, -0.07524871826171875, -0.0704345703125, -0.06562042236328125, -0.0608062744140625, -0.05599212646484375, -0.051177978515625, -0.04636383056640625, -0.0415496826171875, -0.03673553466796875, -0.03192138671875, -0.02710723876953125, -0.0222930908203125, -0.01747894287109375, -0.012664794921875, -0.00785064697265625, -0.0030364990234375, 0.00177764892578125, 0.006591796875, 0.01140594482421875, 0.0162200927734375, 0.02103424072265625, 0.025848388671875, 0.03066253662109375, 0.0354766845703125, 0.04029083251953125, 0.04510498046875, 0.04991912841796875, 0.0547332763671875, 0.05954742431640625, 0.064361572265625, 0.06917572021484375, 0.0739898681640625, 0.07880401611328125, 0.0836181640625, 0.08843231201171875, 0.0932464599609375, 0.09806060791015625, 0.102874755859375, 0.10768890380859375, 0.1125030517578125, 0.11731719970703125, 0.12213134765625, 0.12694549560546875, 0.1317596435546875, 0.13657379150390625, 0.141387939453125, 0.14620208740234375, 0.1510162353515625, 0.15583038330078125, 0.16064453125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 7.0, 5.0, 7.0, 4.0, 6.0, 10.0, 12.0, 15.0, 17.0, 24.0, 20.0, 33.0, 24.0, 34.0, 44.0, 39.0, 53.0, 53.0, 48.0, 51.0, 47.0, 40.0, 51.0, 56.0, 42.0, 32.0, 34.0, 30.0, 29.0, 17.0, 22.0, 10.0, 19.0, 10.0, 13.0, 12.0, 13.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.030792236328125, -0.0298306941986084, -0.028869152069091797, -0.027907609939575195, -0.026946067810058594, -0.025984525680541992, -0.02502298355102539, -0.02406144142150879, -0.023099899291992188, -0.022138357162475586, -0.021176815032958984, -0.020215272903442383, -0.01925373077392578, -0.01829218864440918, -0.017330646514892578, -0.016369104385375977, -0.015407562255859375, -0.014446020126342773, -0.013484477996826172, -0.01252293586730957, -0.011561393737792969, -0.010599851608276367, -0.009638309478759766, -0.008676767349243164, -0.0077152252197265625, -0.006753683090209961, -0.005792140960693359, -0.004830598831176758, -0.0038690567016601562, -0.0029075145721435547, -0.0019459724426269531, -0.0009844303131103516, -2.288818359375e-05, 0.0009386539459228516, 0.0019001960754394531, 0.0028617382049560547, 0.0038232803344726562, 0.004784822463989258, 0.005746364593505859, 0.006707906723022461, 0.0076694488525390625, 0.008630990982055664, 0.009592533111572266, 0.010554075241088867, 0.011515617370605469, 0.01247715950012207, 0.013438701629638672, 0.014400243759155273, 0.015361785888671875, 0.016323328018188477, 0.017284870147705078, 0.01824641227722168, 0.01920795440673828, 0.020169496536254883, 0.021131038665771484, 0.022092580795288086, 0.023054122924804688, 0.02401566505432129, 0.02497720718383789, 0.025938749313354492, 0.026900291442871094, 0.027861833572387695, 0.028823375701904297, 0.0297849178314209, 0.0307464599609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 15.0, 30.0, 46.0, 80.0, 145.0, 448.0, 3206.0, 212830.0, 3966977.0, 9322.0, 726.0, 207.0, 91.0, 47.0, 37.0, 20.0, 13.0, 10.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.38916015625, -0.37993812561035156, -0.3707160949707031, -0.3614940643310547, -0.35227203369140625, -0.3430500030517578, -0.3338279724121094, -0.32460594177246094, -0.3153839111328125, -0.30616188049316406, -0.2969398498535156, -0.2877178192138672, -0.27849578857421875, -0.2692737579345703, -0.2600517272949219, -0.25082969665527344, -0.241607666015625, -0.23238563537597656, -0.22316360473632812, -0.2139415740966797, -0.20471954345703125, -0.1954975128173828, -0.18627548217773438, -0.17705345153808594, -0.1678314208984375, -0.15860939025878906, -0.14938735961914062, -0.1401653289794922, -0.13094329833984375, -0.12172126770019531, -0.11249923706054688, -0.10327720642089844, -0.09405517578125, -0.08483314514160156, -0.07561111450195312, -0.06638908386230469, -0.05716705322265625, -0.04794502258300781, -0.038722991943359375, -0.029500961303710938, -0.0202789306640625, -0.011056900024414062, -0.001834869384765625, 0.0073871612548828125, 0.01660919189453125, 0.025831222534179688, 0.035053253173828125, 0.04427528381347656, 0.053497314453125, 0.06271934509277344, 0.07194137573242188, 0.08116340637207031, 0.09038543701171875, 0.09960746765136719, 0.10882949829101562, 0.11805152893066406, 0.1272735595703125, 0.13649559020996094, 0.14571762084960938, 0.1549396514892578, 0.16416168212890625, 0.1733837127685547, 0.18260574340820312, 0.19182777404785156, 0.2010498046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 10.0, 6.0, 8.0, 14.0, 14.0, 16.0, 25.0, 39.0, 50.0, 70.0, 124.0, 217.0, 427.0, 740.0, 928.0, 567.0, 267.0, 183.0, 112.0, 68.0, 42.0, 30.0, 26.0, 17.0, 17.0, 10.0, 10.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.1077880859375, -0.10529422760009766, -0.10280036926269531, -0.10030651092529297, -0.09781265258789062, -0.09531879425048828, -0.09282493591308594, -0.0903310775756836, -0.08783721923828125, -0.0853433609008789, -0.08284950256347656, -0.08035564422607422, -0.07786178588867188, -0.07536792755126953, -0.07287406921386719, -0.07038021087646484, -0.0678863525390625, -0.06539249420166016, -0.06289863586425781, -0.06040477752685547, -0.057910919189453125, -0.05541706085205078, -0.05292320251464844, -0.050429344177246094, -0.04793548583984375, -0.045441627502441406, -0.04294776916503906, -0.04045391082763672, -0.037960052490234375, -0.03546619415283203, -0.03297233581542969, -0.030478477478027344, -0.027984619140625, -0.025490760803222656, -0.022996902465820312, -0.02050304412841797, -0.018009185791015625, -0.015515327453613281, -0.013021469116210938, -0.010527610778808594, -0.00803375244140625, -0.005539894104003906, -0.0030460357666015625, -0.0005521774291992188, 0.001941680908203125, 0.004435539245605469, 0.0069293975830078125, 0.009423255920410156, 0.0119171142578125, 0.014410972595214844, 0.016904830932617188, 0.01939868927001953, 0.021892547607421875, 0.02438640594482422, 0.026880264282226562, 0.029374122619628906, 0.03186798095703125, 0.034361839294433594, 0.03685569763183594, 0.03934955596923828, 0.041843414306640625, 0.04433727264404297, 0.04683113098144531, 0.049324989318847656, 0.05181884765625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 9.0, 7.0, 17.0, 45.0, 71.0, 135.0, 196.0, 193.0, 148.0, 72.0, 36.0, 26.0, 13.0, 7.0, 9.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8570115566253662, -0.8162966370582581, -0.7755817770957947, -0.7348668575286865, -0.6941519975662231, -0.653437077999115, -0.6127221584320068, -0.5720072984695435, -0.5312923789024353, -0.49057748913764954, -0.44986259937286377, -0.4091476798057556, -0.36843279004096985, -0.3277179002761841, -0.2870029807090759, -0.24628809094429016, -0.2055732011795044, -0.16485831141471863, -0.12414340674877167, -0.0834285095334053, -0.04271361231803894, -0.001998722553253174, 0.03871618211269379, 0.07943108677864075, 0.12014597654342651, 0.16086086630821228, 0.20157577097415924, 0.2422906756401062, 0.28300556540489197, 0.32372045516967773, 0.3644353747367859, 0.40515026450157166, 0.44586503505706787, 0.48657992482185364, 0.5272948145866394, 0.5680097341537476, 0.6087245941162109, 0.6494395136833191, 0.6901544332504272, 0.7308692932128906, 0.7715842127799988, 0.8122991323471069, 0.8530139923095703, 0.8937289118766785, 0.9344438314437866, 0.97515869140625, 1.0158735513687134, 1.0565885305404663, 1.0973033905029297, 1.138018250465393, 1.178733229637146, 1.2194480895996094, 1.2601629495620728, 1.3008778095245361, 1.341592788696289, 1.3823076486587524, 1.4230225086212158, 1.4637373685836792, 1.5044523477554321, 1.5451672077178955, 1.5858820676803589, 1.6265969276428223, 1.6673119068145752, 1.7080267667770386, 1.7487417459487915]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 9.0, 6.0, 11.0, 7.0, 10.0, 12.0, 15.0, 19.0, 30.0, 33.0, 25.0, 48.0, 38.0, 51.0, 52.0, 53.0, 51.0, 67.0, 54.0, 66.0, 46.0, 61.0, 44.0, 38.0, 32.0, 32.0, 13.0, 18.0, 20.0, 10.0, 9.0, 10.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4171532392501831, -0.40451580286026, -0.3918783962726593, -0.3792409598827362, -0.3666035234928131, -0.3539661169052124, -0.3413286805152893, -0.3286912441253662, -0.3160538077354431, -0.30341637134552, -0.2907789647579193, -0.2781415283679962, -0.2655040919780731, -0.2528666853904724, -0.24022924900054932, -0.22759181261062622, -0.2149544060230255, -0.2023169845342636, -0.18967954814434052, -0.1770421266555786, -0.16440469026565552, -0.15176726877689362, -0.1391298472881317, -0.12649241089820862, -0.11385498940944672, -0.10121756047010422, -0.08858013153076172, -0.07594271004199982, -0.06330528110265732, -0.05066785216331482, -0.03803043067455292, -0.02539300173521042, -0.01275557279586792, -0.00011814571917057037, 0.01251928135752678, 0.02515670657157898, 0.03779413551092148, 0.05043156445026398, 0.06306898593902588, 0.07570641487836838, 0.08834384381771088, 0.10098127275705338, 0.11361870169639587, 0.12625612318515778, 0.13889354467391968, 0.15153098106384277, 0.16416840255260468, 0.17680582404136658, 0.18944326043128967, 0.20208068192005157, 0.21471811830997467, 0.22735553979873657, 0.23999297618865967, 0.25263041257858276, 0.26526781916618347, 0.27790525555610657, 0.2905426621437073, 0.30318009853363037, 0.3158175051212311, 0.3284549415111542, 0.34109237790107727, 0.353729784488678, 0.3663672208786011, 0.37900465726852417, 0.39164209365844727]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 11.0, 16.0, 18.0, 23.0, 36.0, 57.0, 91.0, 159.0, 310.0, 608.0, 1195.0, 2781.0, 6426.0, 15935.0, 42498.0, 113709.0, 262152.0, 322887.0, 171553.0, 66153.0, 24658.0, 9659.0, 4017.0, 1790.0, 858.0, 399.0, 223.0, 118.0, 80.0, 51.0, 26.0, 14.0, 10.0, 7.0, 12.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057830810546875, -0.05578184127807617, -0.053732872009277344, -0.051683902740478516, -0.04963493347167969, -0.04758596420288086, -0.04553699493408203, -0.0434880256652832, -0.041439056396484375, -0.03939008712768555, -0.03734111785888672, -0.03529214859008789, -0.03324317932128906, -0.031194210052490234, -0.029145240783691406, -0.027096271514892578, -0.02504730224609375, -0.022998332977294922, -0.020949363708496094, -0.018900394439697266, -0.016851425170898438, -0.01480245590209961, -0.012753486633300781, -0.010704517364501953, -0.008655548095703125, -0.006606578826904297, -0.004557609558105469, -0.0025086402893066406, -0.0004596710205078125, 0.0015892982482910156, 0.0036382675170898438, 0.005687236785888672, 0.0077362060546875, 0.009785175323486328, 0.011834144592285156, 0.013883113861083984, 0.015932083129882812, 0.01798105239868164, 0.02003002166748047, 0.022078990936279297, 0.024127960205078125, 0.026176929473876953, 0.02822589874267578, 0.03027486801147461, 0.03232383728027344, 0.034372806549072266, 0.036421775817871094, 0.03847074508666992, 0.04051971435546875, 0.04256868362426758, 0.044617652893066406, 0.046666622161865234, 0.04871559143066406, 0.05076456069946289, 0.05281352996826172, 0.05486249923706055, 0.056911468505859375, 0.0589604377746582, 0.06100940704345703, 0.06305837631225586, 0.06510734558105469, 0.06715631484985352, 0.06920528411865234, 0.07125425338745117, 0.07330322265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 7.0, 5.0, 14.0, 10.0, 15.0, 28.0, 31.0, 34.0, 42.0, 49.0, 51.0, 46.0, 60.0, 58.0, 58.0, 58.0, 59.0, 56.0, 47.0, 52.0, 40.0, 36.0, 33.0, 24.0, 27.0, 12.0, 9.0, 12.0, 6.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03717041015625, -0.035916805267333984, -0.03466320037841797, -0.03340959548950195, -0.03215599060058594, -0.030902385711669922, -0.029648780822753906, -0.02839517593383789, -0.027141571044921875, -0.02588796615600586, -0.024634361267089844, -0.023380756378173828, -0.022127151489257812, -0.020873546600341797, -0.01961994171142578, -0.018366336822509766, -0.01711273193359375, -0.015859127044677734, -0.014605522155761719, -0.013351917266845703, -0.012098312377929688, -0.010844707489013672, -0.009591102600097656, -0.00833749771118164, -0.007083892822265625, -0.005830287933349609, -0.004576683044433594, -0.003323078155517578, -0.0020694732666015625, -0.0008158683776855469, 0.00043773651123046875, 0.0016913414001464844, 0.0029449462890625, 0.004198551177978516, 0.005452156066894531, 0.006705760955810547, 0.007959365844726562, 0.009212970733642578, 0.010466575622558594, 0.01172018051147461, 0.012973785400390625, 0.01422739028930664, 0.015480995178222656, 0.016734600067138672, 0.017988204956054688, 0.019241809844970703, 0.02049541473388672, 0.021749019622802734, 0.02300262451171875, 0.024256229400634766, 0.02550983428955078, 0.026763439178466797, 0.028017044067382812, 0.029270648956298828, 0.030524253845214844, 0.03177785873413086, 0.033031463623046875, 0.03428506851196289, 0.035538673400878906, 0.03679227828979492, 0.03804588317871094, 0.03929948806762695, 0.04055309295654297, 0.041806697845458984, 0.043060302734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 6.0, 4.0, 9.0, 17.0, 15.0, 20.0, 43.0, 76.0, 103.0, 212.0, 387.0, 762.0, 1851.0, 5986.0, 46155.0, 826399.0, 150518.0, 11109.0, 2692.0, 1036.0, 506.0, 268.0, 123.0, 79.0, 50.0, 35.0, 25.0, 14.0, 15.0, 8.0, 8.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2073974609375, -0.2004108428955078, -0.19342422485351562, -0.18643760681152344, -0.17945098876953125, -0.17246437072753906, -0.16547775268554688, -0.1584911346435547, -0.1515045166015625, -0.1445178985595703, -0.13753128051757812, -0.13054466247558594, -0.12355804443359375, -0.11657142639160156, -0.10958480834960938, -0.10259819030761719, -0.095611572265625, -0.08862495422363281, -0.08163833618164062, -0.07465171813964844, -0.06766510009765625, -0.06067848205566406, -0.053691864013671875, -0.04670524597167969, -0.0397186279296875, -0.03273200988769531, -0.025745391845703125, -0.018758773803710938, -0.01177215576171875, -0.0047855377197265625, 0.002201080322265625, 0.009187698364257812, 0.01617431640625, 0.023160934448242188, 0.030147552490234375, 0.03713417053222656, 0.04412078857421875, 0.05110740661621094, 0.058094024658203125, 0.06508064270019531, 0.0720672607421875, 0.07905387878417969, 0.08604049682617188, 0.09302711486816406, 0.10001373291015625, 0.10700035095214844, 0.11398696899414062, 0.12097358703613281, 0.127960205078125, 0.1349468231201172, 0.14193344116210938, 0.14892005920410156, 0.15590667724609375, 0.16289329528808594, 0.16987991333007812, 0.1768665313720703, 0.1838531494140625, 0.1908397674560547, 0.19782638549804688, 0.20481300354003906, 0.21179962158203125, 0.21878623962402344, 0.22577285766601562, 0.2327594757080078, 0.23974609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 3.0, 3.0, 3.0, 6.0, 10.0, 12.0, 12.0, 20.0, 18.0, 13.0, 21.0, 30.0, 22.0, 29.0, 29.0, 40.0, 35.0, 46.0, 43.0, 50.0, 35.0, 43.0, 53.0, 45.0, 49.0, 35.0, 30.0, 38.0, 30.0, 31.0, 31.0, 25.0, 19.0, 21.0, 15.0, 11.0, 14.0, 4.0, 11.0, 2.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.12646484375, -0.12265682220458984, -0.11884880065917969, -0.11504077911376953, -0.11123275756835938, -0.10742473602294922, -0.10361671447753906, -0.0998086929321289, -0.09600067138671875, -0.0921926498413086, -0.08838462829589844, -0.08457660675048828, -0.08076858520507812, -0.07696056365966797, -0.07315254211425781, -0.06934452056884766, -0.0655364990234375, -0.061728477478027344, -0.05792045593261719, -0.05411243438720703, -0.050304412841796875, -0.04649639129638672, -0.04268836975097656, -0.038880348205566406, -0.03507232666015625, -0.031264305114746094, -0.027456283569335938, -0.02364826202392578, -0.019840240478515625, -0.01603221893310547, -0.012224197387695312, -0.008416175842285156, -0.004608154296875, -0.0008001327514648438, 0.0030078887939453125, 0.006815910339355469, 0.010623931884765625, 0.014431953430175781, 0.018239974975585938, 0.022047996520996094, 0.02585601806640625, 0.029664039611816406, 0.03347206115722656, 0.03728008270263672, 0.041088104248046875, 0.04489612579345703, 0.04870414733886719, 0.052512168884277344, 0.0563201904296875, 0.060128211975097656, 0.06393623352050781, 0.06774425506591797, 0.07155227661132812, 0.07536029815673828, 0.07916831970214844, 0.0829763412475586, 0.08678436279296875, 0.0905923843383789, 0.09440040588378906, 0.09820842742919922, 0.10201644897460938, 0.10582447052001953, 0.10963249206542969, 0.11344051361083984, 0.11724853515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 12.0, 9.0, 11.0, 16.0, 20.0, 27.0, 32.0, 55.0, 102.0, 156.0, 242.0, 495.0, 815.0, 1570.0, 3197.0, 7785.0, 24573.0, 797512.0, 182565.0, 17509.0, 6202.0, 2694.0, 1255.0, 669.0, 383.0, 206.0, 152.0, 84.0, 54.0, 48.0, 32.0, 12.0, 18.0, 9.0, 4.0, 8.0, 4.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1656494140625, -0.16061019897460938, -0.15557098388671875, -0.15053176879882812, -0.1454925537109375, -0.14045333862304688, -0.13541412353515625, -0.13037490844726562, -0.125335693359375, -0.12029647827148438, -0.11525726318359375, -0.11021804809570312, -0.1051788330078125, -0.10013961791992188, -0.09510040283203125, -0.09006118774414062, -0.08502197265625, -0.07998275756835938, -0.07494354248046875, -0.06990432739257812, -0.0648651123046875, -0.059825897216796875, -0.05478668212890625, -0.049747467041015625, -0.044708251953125, -0.039669036865234375, -0.03462982177734375, -0.029590606689453125, -0.0245513916015625, -0.019512176513671875, -0.01447296142578125, -0.009433746337890625, -0.00439453125, 0.000644683837890625, 0.00568389892578125, 0.010723114013671875, 0.0157623291015625, 0.020801544189453125, 0.02584075927734375, 0.030879974365234375, 0.035919189453125, 0.040958404541015625, 0.04599761962890625, 0.051036834716796875, 0.0560760498046875, 0.061115264892578125, 0.06615447998046875, 0.07119369506835938, 0.07623291015625, 0.08127212524414062, 0.08631134033203125, 0.09135055541992188, 0.0963897705078125, 0.10142898559570312, 0.10646820068359375, 0.11150741577148438, 0.116546630859375, 0.12158584594726562, 0.12662506103515625, 0.13166427612304688, 0.1367034912109375, 0.14174270629882812, 0.14678192138671875, 0.15182113647460938, 0.1568603515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 10.0, 6.0, 20.0, 28.0, 69.0, 298.0, 393.0, 93.0, 24.0, 16.0, 14.0, 3.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.706880569458008e-05, -7.442384958267212e-05, -7.177889347076416e-05, -6.91339373588562e-05, -6.648898124694824e-05, -6.384402513504028e-05, -6.119906902313232e-05, -5.8554112911224365e-05, -5.5909156799316406e-05, -5.326420068740845e-05, -5.061924457550049e-05, -4.797428846359253e-05, -4.532933235168457e-05, -4.268437623977661e-05, -4.003942012786865e-05, -3.739446401596069e-05, -3.4749507904052734e-05, -3.2104551792144775e-05, -2.9459595680236816e-05, -2.6814639568328857e-05, -2.41696834564209e-05, -2.152472734451294e-05, -1.887977123260498e-05, -1.623481512069702e-05, -1.3589859008789062e-05, -1.0944902896881104e-05, -8.299946784973145e-06, -5.6549906730651855e-06, -3.0100345611572266e-06, -3.650784492492676e-07, 2.2798776626586914e-06, 4.92483377456665e-06, 7.569789886474609e-06, 1.0214745998382568e-05, 1.2859702110290527e-05, 1.5504658222198486e-05, 1.8149614334106445e-05, 2.0794570446014404e-05, 2.3439526557922363e-05, 2.6084482669830322e-05, 2.872943878173828e-05, 3.137439489364624e-05, 3.40193510055542e-05, 3.666430711746216e-05, 3.930926322937012e-05, 4.1954219341278076e-05, 4.4599175453186035e-05, 4.7244131565093994e-05, 4.988908767700195e-05, 5.253404378890991e-05, 5.517899990081787e-05, 5.782395601272583e-05, 6.046891212463379e-05, 6.311386823654175e-05, 6.575882434844971e-05, 6.840378046035767e-05, 7.104873657226562e-05, 7.369369268417358e-05, 7.633864879608154e-05, 7.89836049079895e-05, 8.162856101989746e-05, 8.427351713180542e-05, 8.691847324371338e-05, 8.956342935562134e-05, 9.22083854675293e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 9.0, 5.0, 7.0, 12.0, 23.0, 29.0, 43.0, 52.0, 122.0, 209.0, 312.0, 656.0, 1333.0, 3265.0, 9127.0, 36803.0, 924639.0, 53771.0, 11088.0, 3880.0, 1559.0, 732.0, 367.0, 176.0, 111.0, 64.0, 43.0, 35.0, 20.0, 18.0, 9.0, 14.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15966796875, -0.1544475555419922, -0.14922714233398438, -0.14400672912597656, -0.13878631591796875, -0.13356590270996094, -0.12834548950195312, -0.12312507629394531, -0.1179046630859375, -0.11268424987792969, -0.10746383666992188, -0.10224342346191406, -0.09702301025390625, -0.09180259704589844, -0.08658218383789062, -0.08136177062988281, -0.076141357421875, -0.07092094421386719, -0.06570053100585938, -0.06048011779785156, -0.05525970458984375, -0.05003929138183594, -0.044818878173828125, -0.03959846496582031, -0.0343780517578125, -0.029157638549804688, -0.023937225341796875, -0.018716812133789062, -0.01349639892578125, -0.008275985717773438, -0.003055572509765625, 0.0021648406982421875, 0.00738525390625, 0.012605667114257812, 0.017826080322265625, 0.023046493530273438, 0.02826690673828125, 0.03348731994628906, 0.038707733154296875, 0.04392814636230469, 0.0491485595703125, 0.05436897277832031, 0.059589385986328125, 0.06480979919433594, 0.07003021240234375, 0.07525062561035156, 0.08047103881835938, 0.08569145202636719, 0.090911865234375, 0.09613227844238281, 0.10135269165039062, 0.10657310485839844, 0.11179351806640625, 0.11701393127441406, 0.12223434448242188, 0.1274547576904297, 0.1326751708984375, 0.1378955841064453, 0.14311599731445312, 0.14833641052246094, 0.15355682373046875, 0.15877723693847656, 0.16399765014648438, 0.1692180633544922, 0.1744384765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 3.0, 4.0, 6.0, 15.0, 14.0, 38.0, 60.0, 104.0, 191.0, 200.0, 151.0, 77.0, 44.0, 21.0, 10.0, 8.0, 8.0, 3.0, 5.0, 1.0, 2.0, 7.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1131591796875, -0.109405517578125, -0.10565185546875, -0.101898193359375, -0.09814453125, -0.094390869140625, -0.09063720703125, -0.086883544921875, -0.0831298828125, -0.079376220703125, -0.07562255859375, -0.071868896484375, -0.068115234375, -0.064361572265625, -0.06060791015625, -0.056854248046875, -0.0531005859375, -0.049346923828125, -0.04559326171875, -0.041839599609375, -0.0380859375, -0.034332275390625, -0.03057861328125, -0.026824951171875, -0.0230712890625, -0.019317626953125, -0.01556396484375, -0.011810302734375, -0.008056640625, -0.004302978515625, -0.00054931640625, 0.003204345703125, 0.0069580078125, 0.010711669921875, 0.01446533203125, 0.018218994140625, 0.02197265625, 0.025726318359375, 0.02947998046875, 0.033233642578125, 0.0369873046875, 0.040740966796875, 0.04449462890625, 0.048248291015625, 0.052001953125, 0.055755615234375, 0.05950927734375, 0.063262939453125, 0.0670166015625, 0.070770263671875, 0.07452392578125, 0.078277587890625, 0.08203125, 0.085784912109375, 0.08953857421875, 0.093292236328125, 0.0970458984375, 0.100799560546875, 0.10455322265625, 0.108306884765625, 0.112060546875, 0.115814208984375, 0.11956787109375, 0.123321533203125, 0.1270751953125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 18.0, 23.0, 73.0, 183.0, 353.0, 210.0, 85.0, 35.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7009124755859375, -4.6061811447143555, -4.511449813842773, -4.416718482971191, -4.321986675262451, -4.227255344390869, -4.132524013519287, -4.037792682647705, -3.943061351776123, -3.848330020904541, -3.75359845161438, -3.658867120742798, -3.564135789871216, -3.4694042205810547, -3.3746728897094727, -3.2799415588378906, -3.1852099895477295, -3.0904786586761475, -2.9957470893859863, -2.9010157585144043, -2.8062844276428223, -2.7115530967712402, -2.616821527481079, -2.522090196609497, -2.427358627319336, -2.332627296447754, -2.2378957271575928, -2.1431643962860107, -2.0484330654144287, -1.9537016153335571, -1.8589701652526855, -1.7642388343811035, -1.6695072650909424, -1.5747758150100708, -1.4800444841384888, -1.3853130340576172, -1.2905817031860352, -1.1958502531051636, -1.101118803024292, -1.00638747215271, -0.9116560220718384, -0.8169246315956116, -0.7221932411193848, -0.6274617910385132, -0.5327304005622864, -0.43799901008605957, -0.343267560005188, -0.24853616952896118, -0.15380477905273438, -0.059073373675346375, 0.035658031702041626, 0.13038945198059082, 0.22512084245681763, 0.31985223293304443, 0.414583683013916, 0.5093150734901428, 0.6040464639663696, 0.6987778544425964, 0.7935092449188232, 0.8882406949996948, 0.9829720854759216, 1.0777034759521484, 1.17243492603302, 1.2671663761138916, 1.3618977069854736]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 6.0, 5.0, 18.0, 11.0, 10.0, 12.0, 15.0, 17.0, 29.0, 26.0, 33.0, 36.0, 41.0, 30.0, 41.0, 52.0, 53.0, 63.0, 83.0, 56.0, 43.0, 46.0, 28.0, 33.0, 25.0, 29.0, 21.0, 19.0, 17.0, 15.0, 15.0, 19.0, 7.0, 10.0, 6.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6356878280639648, -0.6174606680870056, -0.5992335081100464, -0.5810063481330872, -0.5627791881561279, -0.5445520281791687, -0.5263248682022095, -0.508097767829895, -0.4898705780506134, -0.4716434180736542, -0.45341625809669495, -0.4351890981197357, -0.4169619679450989, -0.39873480796813965, -0.3805076479911804, -0.3622804880142212, -0.34405332803726196, -0.32582616806030273, -0.3075990080833435, -0.2893718481063843, -0.27114468812942505, -0.2529175281524658, -0.23469039797782898, -0.21646323800086975, -0.19823607802391052, -0.1800089180469513, -0.16178175806999207, -0.14355461299419403, -0.1253274530172348, -0.10710029304027557, -0.08887314051389694, -0.07064598798751831, -0.05241888761520386, -0.03419173136353493, -0.015964575111865997, 0.0022625811398029327, 0.020489737391471863, 0.03871689736843109, 0.05694404989480972, 0.07517120242118835, 0.09339836239814758, 0.11162552237510681, 0.12985268235206604, 0.14807982742786407, 0.1663069874048233, 0.18453414738178253, 0.20276129245758057, 0.2209884524345398, 0.23921561241149902, 0.25744277238845825, 0.2756699323654175, 0.2938970923423767, 0.31212425231933594, 0.33035141229629517, 0.348578542470932, 0.36680570244789124, 0.38503286242485046, 0.4032600224018097, 0.4214871823787689, 0.43971434235572815, 0.457941472530365, 0.4761686325073242, 0.49439579248428345, 0.5126229524612427, 0.5308501124382019]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 6.0, 8.0, 11.0, 27.0, 32.0, 45.0, 101.0, 179.0, 530.0, 2168.0, 12124.0, 153921.0, 3790330.0, 217393.0, 13875.0, 2404.0, 592.0, 249.0, 118.0, 67.0, 28.0, 30.0, 18.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14794921875, -0.14325904846191406, -0.13856887817382812, -0.1338787078857422, -0.12918853759765625, -0.12449836730957031, -0.11980819702148438, -0.11511802673339844, -0.1104278564453125, -0.10573768615722656, -0.10104751586914062, -0.09635734558105469, -0.09166717529296875, -0.08697700500488281, -0.08228683471679688, -0.07759666442871094, -0.072906494140625, -0.06821632385253906, -0.06352615356445312, -0.05883598327636719, -0.05414581298828125, -0.04945564270019531, -0.044765472412109375, -0.04007530212402344, -0.0353851318359375, -0.030694961547851562, -0.026004791259765625, -0.021314620971679688, -0.01662445068359375, -0.011934280395507812, -0.007244110107421875, -0.0025539398193359375, 0.00213623046875, 0.0068264007568359375, 0.011516571044921875, 0.016206741333007812, 0.02089691162109375, 0.025587081909179688, 0.030277252197265625, 0.03496742248535156, 0.0396575927734375, 0.04434776306152344, 0.049037933349609375, 0.05372810363769531, 0.05841827392578125, 0.06310844421386719, 0.06779861450195312, 0.07248878479003906, 0.077178955078125, 0.08186912536621094, 0.08655929565429688, 0.09124946594238281, 0.09593963623046875, 0.10062980651855469, 0.10531997680664062, 0.11001014709472656, 0.1147003173828125, 0.11939048767089844, 0.12408065795898438, 0.1287708282470703, 0.13346099853515625, 0.1381511688232422, 0.14284133911132812, 0.14753150939941406, 0.1522216796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 11.0, 12.0, 7.0, 22.0, 18.0, 24.0, 40.0, 52.0, 44.0, 54.0, 60.0, 58.0, 67.0, 65.0, 63.0, 68.0, 60.0, 43.0, 53.0, 40.0, 34.0, 31.0, 16.0, 17.0, 10.0, 11.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03546142578125, -0.033939361572265625, -0.03241729736328125, -0.030895233154296875, -0.0293731689453125, -0.027851104736328125, -0.02632904052734375, -0.024806976318359375, -0.023284912109375, -0.021762847900390625, -0.02024078369140625, -0.018718719482421875, -0.0171966552734375, -0.015674591064453125, -0.01415252685546875, -0.012630462646484375, -0.0111083984375, -0.009586334228515625, -0.00806427001953125, -0.006542205810546875, -0.0050201416015625, -0.003498077392578125, -0.00197601318359375, -0.000453948974609375, 0.001068115234375, 0.002590179443359375, 0.00411224365234375, 0.005634307861328125, 0.0071563720703125, 0.008678436279296875, 0.01020050048828125, 0.011722564697265625, 0.01324462890625, 0.014766693115234375, 0.01628875732421875, 0.017810821533203125, 0.0193328857421875, 0.020854949951171875, 0.02237701416015625, 0.023899078369140625, 0.025421142578125, 0.026943206787109375, 0.02846527099609375, 0.029987335205078125, 0.0315093994140625, 0.033031463623046875, 0.03455352783203125, 0.036075592041015625, 0.03759765625, 0.039119720458984375, 0.04064178466796875, 0.042163848876953125, 0.0436859130859375, 0.045207977294921875, 0.04673004150390625, 0.048252105712890625, 0.049774169921875, 0.051296234130859375, 0.05281829833984375, 0.054340362548828125, 0.0558624267578125, 0.057384490966796875, 0.05890655517578125, 0.060428619384765625, 0.06195068359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 6.0, 11.0, 15.0, 22.0, 34.0, 56.0, 80.0, 130.0, 177.0, 409.0, 3219.0, 3991095.0, 196867.0, 1435.0, 331.0, 127.0, 99.0, 57.0, 42.0, 20.0, 12.0, 15.0, 14.0, 8.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8486328125, -0.8297119140625, -0.810791015625, -0.7918701171875, -0.77294921875, -0.7540283203125, -0.735107421875, -0.7161865234375, -0.697265625, -0.6783447265625, -0.659423828125, -0.6405029296875, -0.62158203125, -0.6026611328125, -0.583740234375, -0.5648193359375, -0.5458984375, -0.5269775390625, -0.508056640625, -0.4891357421875, -0.47021484375, -0.4512939453125, -0.432373046875, -0.4134521484375, -0.39453125, -0.3756103515625, -0.356689453125, -0.3377685546875, -0.31884765625, -0.2999267578125, -0.281005859375, -0.2620849609375, -0.2431640625, -0.2242431640625, -0.205322265625, -0.1864013671875, -0.16748046875, -0.1485595703125, -0.129638671875, -0.1107177734375, -0.091796875, -0.0728759765625, -0.053955078125, -0.0350341796875, -0.01611328125, 0.0028076171875, 0.021728515625, 0.0406494140625, 0.0595703125, 0.0784912109375, 0.097412109375, 0.1163330078125, 0.13525390625, 0.1541748046875, 0.173095703125, 0.1920166015625, 0.2109375, 0.2298583984375, 0.248779296875, 0.2677001953125, 0.28662109375, 0.3055419921875, 0.324462890625, 0.3433837890625, 0.3623046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 15.0, 12.0, 20.0, 39.0, 53.0, 118.0, 324.0, 1002.0, 1500.0, 603.0, 198.0, 88.0, 49.0, 21.0, 12.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2618217468261719, -0.25460052490234375, -0.24737930297851562, -0.2401580810546875, -0.23293685913085938, -0.22571563720703125, -0.21849441528320312, -0.211273193359375, -0.20405197143554688, -0.19683074951171875, -0.18960952758789062, -0.1823883056640625, -0.17516708374023438, -0.16794586181640625, -0.16072463989257812, -0.15350341796875, -0.14628219604492188, -0.13906097412109375, -0.13183975219726562, -0.1246185302734375, -0.11739730834960938, -0.11017608642578125, -0.10295486450195312, -0.095733642578125, -0.08851242065429688, -0.08129119873046875, -0.07406997680664062, -0.0668487548828125, -0.059627532958984375, -0.05240631103515625, -0.045185089111328125, -0.0379638671875, -0.030742645263671875, -0.02352142333984375, -0.016300201416015625, -0.0090789794921875, -0.001857757568359375, 0.00536346435546875, 0.012584686279296875, 0.019805908203125, 0.027027130126953125, 0.03424835205078125, 0.041469573974609375, 0.0486907958984375, 0.055912017822265625, 0.06313323974609375, 0.07035446166992188, 0.07757568359375, 0.08479690551757812, 0.09201812744140625, 0.09923934936523438, 0.1064605712890625, 0.11368179321289062, 0.12090301513671875, 0.12812423706054688, 0.135345458984375, 0.14256668090820312, 0.14978790283203125, 0.15700912475585938, 0.1642303466796875, 0.17145156860351562, 0.17867279052734375, 0.18589401245117188, 0.193115234375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 0.0, 4.0, 3.0, 12.0, 11.0, 35.0, 58.0, 124.0, 270.0, 229.0, 128.0, 57.0, 28.0, 19.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9270200729370117, -2.847770929336548, -2.768522024154663, -2.689272880554199, -2.6100239753723145, -2.5307748317718506, -2.451525926589966, -2.372276782989502, -2.293027877807617, -2.2137787342071533, -2.1345298290252686, -2.0552806854248047, -1.97603178024292, -1.896782636642456, -1.8175336122512817, -1.7382845878601074, -1.6590354442596436, -1.5797864198684692, -1.500537395477295, -1.4212883710861206, -1.3420393466949463, -1.2627902030944824, -1.183541178703308, -1.1042921543121338, -1.0250431299209595, -0.9457941055297852, -0.8665450811386108, -0.7872959971427917, -0.7080469727516174, -0.6287979483604431, -0.549548864364624, -0.4702998399734497, -0.3910505771636963, -0.311801552772522, -0.23255249857902527, -0.15330345928668976, -0.07405441999435425, 0.005194604396820068, 0.08444365859031677, 0.16369271278381348, 0.2429417371749878, 0.3221907615661621, 0.4014398157596588, 0.4806888699531555, 0.5599378943443298, 0.6391869187355042, 0.7184360027313232, 0.7976850271224976, 0.8769340515136719, 0.9561830759048462, 1.0354321002960205, 1.1146811246871948, 1.1939301490783691, 1.273179292678833, 1.3524283170700073, 1.4316773414611816, 1.510926365852356, 1.5901753902435303, 1.6694244146347046, 1.748673439025879, 1.8279225826263428, 1.9071714878082275, 1.9864206314086914, 2.065669536590576, 2.14491868019104]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 14.0, 11.0, 11.0, 16.0, 18.0, 34.0, 24.0, 34.0, 51.0, 40.0, 48.0, 53.0, 67.0, 60.0, 74.0, 57.0, 48.0, 54.0, 46.0, 34.0, 28.0, 32.0, 29.0, 21.0, 20.0, 15.0, 12.0, 14.0, 11.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.825846791267395, -0.8045121431350708, -0.7831775546073914, -0.7618429660797119, -0.7405083179473877, -0.7191736698150635, -0.697839081287384, -0.6765044927597046, -0.6551698446273804, -0.6338351964950562, -0.6125006079673767, -0.5911660194396973, -0.569831371307373, -0.5484967231750488, -0.5271621346473694, -0.5058275461196899, -0.4844928979873657, -0.4631582796573639, -0.44182366132736206, -0.42048904299736023, -0.3991544246673584, -0.37781980633735657, -0.35648518800735474, -0.3351505696773529, -0.3138159513473511, -0.29248133301734924, -0.2711467146873474, -0.24981209635734558, -0.22847747802734375, -0.20714285969734192, -0.1858082413673401, -0.16447362303733826, -0.14313894510269165, -0.12180432677268982, -0.10046970844268799, -0.07913509011268616, -0.057800471782684326, -0.036465853452682495, -0.015131235122680664, 0.006203383207321167, 0.027538001537322998, 0.04887261986732483, 0.07020723819732666, 0.09154185652732849, 0.11287647485733032, 0.13421109318733215, 0.15554571151733398, 0.17688032984733582, 0.19821494817733765, 0.21954956650733948, 0.2408841848373413, 0.26221880316734314, 0.28355342149734497, 0.3048880398273468, 0.32622265815734863, 0.34755727648735046, 0.3688918948173523, 0.3902265131473541, 0.41156113147735596, 0.4328957498073578, 0.4542303681373596, 0.47556498646736145, 0.4968996047973633, 0.5182342529296875, 0.5395688414573669]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 11.0, 19.0, 19.0, 35.0, 62.0, 93.0, 158.0, 274.0, 507.0, 906.0, 1842.0, 4013.0, 10192.0, 30113.0, 116864.0, 465563.0, 314492.0, 69768.0, 20106.0, 7275.0, 3088.0, 1420.0, 747.0, 383.0, 232.0, 130.0, 91.0, 48.0, 20.0, 24.0, 19.0, 9.0, 3.0, 7.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.1763629913330078, -0.17157363891601562, -0.16678428649902344, -0.16199493408203125, -0.15720558166503906, -0.15241622924804688, -0.1476268768310547, -0.1428375244140625, -0.1380481719970703, -0.13325881958007812, -0.12846946716308594, -0.12368011474609375, -0.11889076232910156, -0.11410140991210938, -0.10931205749511719, -0.104522705078125, -0.09973335266113281, -0.09494400024414062, -0.09015464782714844, -0.08536529541015625, -0.08057594299316406, -0.07578659057617188, -0.07099723815917969, -0.0662078857421875, -0.06141853332519531, -0.056629180908203125, -0.05183982849121094, -0.04705047607421875, -0.04226112365722656, -0.037471771240234375, -0.03268241882324219, -0.02789306640625, -0.023103713989257812, -0.018314361572265625, -0.013525009155273438, -0.00873565673828125, -0.0039463043212890625, 0.000843048095703125, 0.0056324005126953125, 0.0104217529296875, 0.015211105346679688, 0.020000457763671875, 0.024789810180664062, 0.02957916259765625, 0.03436851501464844, 0.039157867431640625, 0.04394721984863281, 0.048736572265625, 0.05352592468261719, 0.058315277099609375, 0.06310462951660156, 0.06789398193359375, 0.07268333435058594, 0.07747268676757812, 0.08226203918457031, 0.0870513916015625, 0.09184074401855469, 0.09663009643554688, 0.10141944885253906, 0.10620880126953125, 0.11099815368652344, 0.11578750610351562, 0.12057685852050781, 0.1253662109375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 2.0, 3.0, 3.0, 9.0, 7.0, 14.0, 8.0, 17.0, 26.0, 22.0, 34.0, 23.0, 37.0, 41.0, 51.0, 49.0, 48.0, 51.0, 59.0, 44.0, 54.0, 52.0, 48.0, 34.0, 47.0, 38.0, 30.0, 32.0, 31.0, 26.0, 16.0, 6.0, 13.0, 5.0, 5.0, 7.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0462646484375, -0.044857025146484375, -0.04344940185546875, -0.042041778564453125, -0.0406341552734375, -0.039226531982421875, -0.03781890869140625, -0.036411285400390625, -0.035003662109375, -0.033596038818359375, -0.03218841552734375, -0.030780792236328125, -0.0293731689453125, -0.027965545654296875, -0.02655792236328125, -0.025150299072265625, -0.02374267578125, -0.022335052490234375, -0.02092742919921875, -0.019519805908203125, -0.0181121826171875, -0.016704559326171875, -0.01529693603515625, -0.013889312744140625, -0.012481689453125, -0.011074066162109375, -0.00966644287109375, -0.008258819580078125, -0.0068511962890625, -0.005443572998046875, -0.00403594970703125, -0.002628326416015625, -0.001220703125, 0.000186920166015625, 0.00159454345703125, 0.003002166748046875, 0.0044097900390625, 0.005817413330078125, 0.00722503662109375, 0.008632659912109375, 0.010040283203125, 0.011447906494140625, 0.01285552978515625, 0.014263153076171875, 0.0156707763671875, 0.017078399658203125, 0.01848602294921875, 0.019893646240234375, 0.02130126953125, 0.022708892822265625, 0.02411651611328125, 0.025524139404296875, 0.0269317626953125, 0.028339385986328125, 0.02974700927734375, 0.031154632568359375, 0.032562255859375, 0.033969879150390625, 0.03537750244140625, 0.036785125732421875, 0.0381927490234375, 0.039600372314453125, 0.04100799560546875, 0.042415618896484375, 0.0438232421875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 11.0, 12.0, 18.0, 34.0, 35.0, 48.0, 66.0, 100.0, 115.0, 181.0, 311.0, 532.0, 952.0, 2114.0, 5090.0, 19104.0, 163321.0, 776954.0, 61544.0, 10951.0, 3550.0, 1467.0, 711.0, 441.0, 263.0, 179.0, 138.0, 95.0, 57.0, 48.0, 22.0, 13.0, 18.0, 9.0, 9.0, 6.0, 10.0, 1.0, 6.0, 2.0, 4.0, 1.0, 5.0], "bins": [-0.3642578125, -0.3547496795654297, -0.3452415466308594, -0.33573341369628906, -0.32622528076171875, -0.31671714782714844, -0.3072090148925781, -0.2977008819580078, -0.2881927490234375, -0.2786846160888672, -0.2691764831542969, -0.25966835021972656, -0.25016021728515625, -0.24065208435058594, -0.23114395141601562, -0.2216358184814453, -0.212127685546875, -0.2026195526123047, -0.19311141967773438, -0.18360328674316406, -0.17409515380859375, -0.16458702087402344, -0.15507888793945312, -0.1455707550048828, -0.1360626220703125, -0.1265544891357422, -0.11704635620117188, -0.10753822326660156, -0.09803009033203125, -0.08852195739746094, -0.07901382446289062, -0.06950569152832031, -0.05999755859375, -0.05048942565917969, -0.040981292724609375, -0.03147315979003906, -0.02196502685546875, -0.012456893920898438, -0.002948760986328125, 0.0065593719482421875, 0.0160675048828125, 0.025575637817382812, 0.035083770751953125, 0.04459190368652344, 0.05410003662109375, 0.06360816955566406, 0.07311630249023438, 0.08262443542480469, 0.092132568359375, 0.10164070129394531, 0.11114883422851562, 0.12065696716308594, 0.13016510009765625, 0.13967323303222656, 0.14918136596679688, 0.1586894989013672, 0.1681976318359375, 0.1777057647705078, 0.18721389770507812, 0.19672203063964844, 0.20623016357421875, 0.21573829650878906, 0.22524642944335938, 0.2347545623779297, 0.2442626953125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 6.0, 5.0, 1.0, 9.0, 10.0, 19.0, 36.0, 29.0, 25.0, 31.0, 38.0, 50.0, 60.0, 47.0, 52.0, 53.0, 57.0, 59.0, 48.0, 53.0, 47.0, 36.0, 40.0, 39.0, 24.0, 23.0, 21.0, 12.0, 13.0, 8.0, 13.0, 6.0, 4.0, 4.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.181640625, -0.17567062377929688, -0.16970062255859375, -0.16373062133789062, -0.1577606201171875, -0.15179061889648438, -0.14582061767578125, -0.13985061645507812, -0.133880615234375, -0.12791061401367188, -0.12194061279296875, -0.11597061157226562, -0.1100006103515625, -0.10403060913085938, -0.09806060791015625, -0.09209060668945312, -0.08612060546875, -0.08015060424804688, -0.07418060302734375, -0.06821060180664062, -0.0622406005859375, -0.056270599365234375, -0.05030059814453125, -0.044330596923828125, -0.038360595703125, -0.032390594482421875, -0.02642059326171875, -0.020450592041015625, -0.0144805908203125, -0.008510589599609375, -0.00254058837890625, 0.003429412841796875, 0.0093994140625, 0.015369415283203125, 0.02133941650390625, 0.027309417724609375, 0.0332794189453125, 0.039249420166015625, 0.04521942138671875, 0.051189422607421875, 0.057159423828125, 0.06312942504882812, 0.06909942626953125, 0.07506942749023438, 0.0810394287109375, 0.08700942993164062, 0.09297943115234375, 0.09894943237304688, 0.10491943359375, 0.11088943481445312, 0.11685943603515625, 0.12282943725585938, 0.1287994384765625, 0.13476943969726562, 0.14073944091796875, 0.14670944213867188, 0.152679443359375, 0.15864944458007812, 0.16461944580078125, 0.17058944702148438, 0.1765594482421875, 0.18252944946289062, 0.18849945068359375, 0.19446945190429688, 0.200439453125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 6.0, 10.0, 7.0, 12.0, 22.0, 21.0, 43.0, 64.0, 88.0, 150.0, 228.0, 413.0, 691.0, 1288.0, 2611.0, 5174.0, 11707.0, 28869.0, 113345.0, 709760.0, 121437.0, 29549.0, 11894.0, 5370.0, 2645.0, 1361.0, 705.0, 391.0, 238.0, 148.0, 102.0, 62.0, 41.0, 27.0, 16.0, 14.0, 15.0, 6.0, 9.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0972900390625, -0.09420299530029297, -0.09111595153808594, -0.0880289077758789, -0.08494186401367188, -0.08185482025146484, -0.07876777648925781, -0.07568073272705078, -0.07259368896484375, -0.06950664520263672, -0.06641960144042969, -0.06333255767822266, -0.060245513916015625, -0.057158470153808594, -0.05407142639160156, -0.05098438262939453, -0.0478973388671875, -0.04481029510498047, -0.04172325134277344, -0.038636207580566406, -0.035549163818359375, -0.032462120056152344, -0.029375076293945312, -0.02628803253173828, -0.02320098876953125, -0.02011394500732422, -0.017026901245117188, -0.013939857482910156, -0.010852813720703125, -0.007765769958496094, -0.0046787261962890625, -0.0015916824340820312, 0.001495361328125, 0.004582405090332031, 0.0076694488525390625, 0.010756492614746094, 0.013843536376953125, 0.016930580139160156, 0.020017623901367188, 0.02310466766357422, 0.02619171142578125, 0.02927875518798828, 0.03236579895019531, 0.035452842712402344, 0.038539886474609375, 0.041626930236816406, 0.04471397399902344, 0.04780101776123047, 0.0508880615234375, 0.05397510528564453, 0.05706214904785156, 0.060149192810058594, 0.06323623657226562, 0.06632328033447266, 0.06941032409667969, 0.07249736785888672, 0.07558441162109375, 0.07867145538330078, 0.08175849914550781, 0.08484554290771484, 0.08793258666992188, 0.0910196304321289, 0.09410667419433594, 0.09719371795654297, 0.10028076171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 1.0, 9.0, 18.0, 18.0, 34.0, 68.0, 109.0, 228.0, 241.0, 118.0, 42.0, 23.0, 19.0, 13.0, 9.0, 13.0, 6.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.577108383178711e-05, -8.356571197509766e-05, -8.13603401184082e-05, -7.915496826171875e-05, -7.69495964050293e-05, -7.474422454833984e-05, -7.253885269165039e-05, -7.033348083496094e-05, -6.812810897827148e-05, -6.592273712158203e-05, -6.371736526489258e-05, -6.151199340820312e-05, -5.930662155151367e-05, -5.710124969482422e-05, -5.4895877838134766e-05, -5.269050598144531e-05, -5.048513412475586e-05, -4.8279762268066406e-05, -4.607439041137695e-05, -4.38690185546875e-05, -4.166364669799805e-05, -3.9458274841308594e-05, -3.725290298461914e-05, -3.504753112792969e-05, -3.2842159271240234e-05, -3.063678741455078e-05, -2.8431415557861328e-05, -2.6226043701171875e-05, -2.4020671844482422e-05, -2.181529998779297e-05, -1.9609928131103516e-05, -1.7404556274414062e-05, -1.519918441772461e-05, -1.2993812561035156e-05, -1.0788440704345703e-05, -8.58306884765625e-06, -6.377696990966797e-06, -4.172325134277344e-06, -1.9669532775878906e-06, 2.384185791015625e-07, 2.4437904357910156e-06, 4.649162292480469e-06, 6.854534149169922e-06, 9.059906005859375e-06, 1.1265277862548828e-05, 1.3470649719238281e-05, 1.5676021575927734e-05, 1.7881393432617188e-05, 2.008676528930664e-05, 2.2292137145996094e-05, 2.4497509002685547e-05, 2.6702880859375e-05, 2.8908252716064453e-05, 3.1113624572753906e-05, 3.331899642944336e-05, 3.552436828613281e-05, 3.7729740142822266e-05, 3.993511199951172e-05, 4.214048385620117e-05, 4.4345855712890625e-05, 4.655122756958008e-05, 4.875659942626953e-05, 5.0961971282958984e-05, 5.316734313964844e-05, 5.537271499633789e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 3.0, 7.0, 17.0, 19.0, 31.0, 53.0, 70.0, 118.0, 205.0, 415.0, 898.0, 2310.0, 9063.0, 55014.0, 844621.0, 116374.0, 13827.0, 3255.0, 1173.0, 454.0, 267.0, 117.0, 78.0, 47.0, 34.0, 21.0, 16.0, 15.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.208984375, -0.2034320831298828, -0.19787979125976562, -0.19232749938964844, -0.18677520751953125, -0.18122291564941406, -0.17567062377929688, -0.1701183319091797, -0.1645660400390625, -0.1590137481689453, -0.15346145629882812, -0.14790916442871094, -0.14235687255859375, -0.13680458068847656, -0.13125228881835938, -0.1256999969482422, -0.120147705078125, -0.11459541320800781, -0.10904312133789062, -0.10349082946777344, -0.09793853759765625, -0.09238624572753906, -0.08683395385742188, -0.08128166198730469, -0.0757293701171875, -0.07017707824707031, -0.06462478637695312, -0.05907249450683594, -0.05352020263671875, -0.04796791076660156, -0.042415618896484375, -0.03686332702636719, -0.03131103515625, -0.025758743286132812, -0.020206451416015625, -0.014654159545898438, -0.00910186767578125, -0.0035495758056640625, 0.002002716064453125, 0.0075550079345703125, 0.0131072998046875, 0.018659591674804688, 0.024211883544921875, 0.029764175415039062, 0.03531646728515625, 0.04086875915527344, 0.046421051025390625, 0.05197334289550781, 0.057525634765625, 0.06307792663574219, 0.06863021850585938, 0.07418251037597656, 0.07973480224609375, 0.08528709411621094, 0.09083938598632812, 0.09639167785644531, 0.1019439697265625, 0.10749626159667969, 0.11304855346679688, 0.11860084533691406, 0.12415313720703125, 0.12970542907714844, 0.13525772094726562, 0.1408100128173828, 0.1463623046875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 4.0, 3.0, 9.0, 11.0, 15.0, 16.0, 19.0, 39.0, 64.0, 71.0, 85.0, 111.0, 120.0, 124.0, 74.0, 66.0, 41.0, 32.0, 27.0, 13.0, 8.0, 5.0, 5.0, 4.0, 5.0, 4.0, 7.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1446533203125, -0.1409778594970703, -0.13730239868164062, -0.13362693786621094, -0.12995147705078125, -0.12627601623535156, -0.12260055541992188, -0.11892509460449219, -0.1152496337890625, -0.11157417297363281, -0.10789871215820312, -0.10422325134277344, -0.10054779052734375, -0.09687232971191406, -0.09319686889648438, -0.08952140808105469, -0.085845947265625, -0.08217048645019531, -0.07849502563476562, -0.07481956481933594, -0.07114410400390625, -0.06746864318847656, -0.06379318237304688, -0.06011772155761719, -0.0564422607421875, -0.05276679992675781, -0.049091339111328125, -0.04541587829589844, -0.04174041748046875, -0.03806495666503906, -0.034389495849609375, -0.030714035034179688, -0.02703857421875, -0.023363113403320312, -0.019687652587890625, -0.016012191772460938, -0.01233673095703125, -0.008661270141601562, -0.004985809326171875, -0.0013103485107421875, 0.0023651123046875, 0.0060405731201171875, 0.009716033935546875, 0.013391494750976562, 0.01706695556640625, 0.020742416381835938, 0.024417877197265625, 0.028093338012695312, 0.031768798828125, 0.03544425964355469, 0.039119720458984375, 0.04279518127441406, 0.04647064208984375, 0.05014610290527344, 0.053821563720703125, 0.05749702453613281, 0.0611724853515625, 0.06484794616699219, 0.06852340698242188, 0.07219886779785156, 0.07587432861328125, 0.07954978942871094, 0.08322525024414062, 0.08690071105957031, 0.090576171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 10.0, 11.0, 37.0, 48.0, 97.0, 157.0, 279.0, 169.0, 81.0, 55.0, 15.0, 12.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.213435411453247, -3.1317873001098633, -3.0501394271850586, -2.968491554260254, -2.88684344291687, -2.8051953315734863, -2.7235474586486816, -2.641899585723877, -2.560251474380493, -2.4786033630371094, -2.3969554901123047, -2.3153076171875, -2.233659505844116, -2.1520113945007324, -2.0703635215759277, -1.9887155294418335, -1.9070675373077393, -1.825419545173645, -1.7437715530395508, -1.6621235609054565, -1.5804755687713623, -1.498827576637268, -1.4171795845031738, -1.3355315923690796, -1.2538836002349854, -1.1722356081008911, -1.0905876159667969, -1.0089396238327026, -0.9272916316986084, -0.8456436395645142, -0.7639956474304199, -0.6823476552963257, -0.6006996631622314, -0.5190516710281372, -0.43740367889404297, -0.35575568675994873, -0.2741076946258545, -0.19245970249176025, -0.11081171035766602, -0.029163718223571777, 0.05248427391052246, 0.1341322660446167, 0.21578025817871094, 0.2974282503128052, 0.3790762424468994, 0.46072423458099365, 0.5423722267150879, 0.6240202188491821, 0.7056682109832764, 0.7873162031173706, 0.8689641952514648, 0.9506121873855591, 1.0322601795196533, 1.1139081716537476, 1.1955561637878418, 1.277204155921936, 1.3588521480560303, 1.4405001401901245, 1.5221481323242188, 1.603796124458313, 1.6854441165924072, 1.7670921087265015, 1.8487401008605957, 1.93038809299469, 2.012036085128784]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 11.0, 8.0, 12.0, 9.0, 11.0, 19.0, 21.0, 25.0, 22.0, 24.0, 36.0, 27.0, 38.0, 32.0, 42.0, 47.0, 83.0, 73.0, 68.0, 53.0, 43.0, 34.0, 37.0, 35.0, 22.0, 25.0, 13.0, 24.0, 23.0, 15.0, 14.0, 13.0, 11.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.842074990272522, -0.815356969833374, -0.7886389493942261, -0.7619209289550781, -0.7352029085159302, -0.7084848880767822, -0.681766927242279, -0.6550489068031311, -0.6283308863639832, -0.6016128659248352, -0.5748948454856873, -0.5481768250465393, -0.5214588642120361, -0.4947408139705658, -0.46802282333374023, -0.4413048028945923, -0.41458678245544434, -0.3878687620162964, -0.36115074157714844, -0.3344327509403229, -0.3077147305011749, -0.280996710062027, -0.2542787194252014, -0.22756069898605347, -0.20084267854690552, -0.17412465810775757, -0.1474066525697708, -0.12068863958120346, -0.09397062659263611, -0.06725260615348816, -0.040534600615501404, -0.013816595077514648, 0.0129014253616333, 0.03961943835020065, 0.066337451338768, 0.09305546432733536, 0.11977347731590271, 0.14649149775505066, 0.17320950329303741, 0.19992750883102417, 0.22664552927017212, 0.25336354970932007, 0.280081570148468, 0.3067995607852936, 0.33351758122444153, 0.3602356016635895, 0.38695359230041504, 0.413671612739563, 0.44038963317871094, 0.4671076536178589, 0.49382567405700684, 0.5205436944961548, 0.5472617149353027, 0.5739797353744507, 0.6006976962089539, 0.6274157166481018, 0.6541337370872498, 0.6808517575263977, 0.7075697779655457, 0.7342877984046936, 0.7610057592391968, 0.7877237796783447, 0.8144418001174927, 0.8411598205566406, 0.8678778409957886]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 13.0, 17.0, 14.0, 19.0, 41.0, 50.0, 106.0, 217.0, 444.0, 1107.0, 2742.0, 8980.0, 38793.0, 516059.0, 3335825.0, 252320.0, 27072.0, 6658.0, 2210.0, 791.0, 361.0, 181.0, 98.0, 56.0, 38.0, 12.0, 10.0, 12.0, 8.0, 6.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12491798400878906, -0.12080764770507812, -0.11669731140136719, -0.11258697509765625, -0.10847663879394531, -0.10436630249023438, -0.10025596618652344, -0.0961456298828125, -0.09203529357910156, -0.08792495727539062, -0.08381462097167969, -0.07970428466796875, -0.07559394836425781, -0.07148361206054688, -0.06737327575683594, -0.063262939453125, -0.05915260314941406, -0.055042266845703125, -0.05093193054199219, -0.04682159423828125, -0.04271125793457031, -0.038600921630859375, -0.03449058532714844, -0.0303802490234375, -0.026269912719726562, -0.022159576416015625, -0.018049240112304688, -0.01393890380859375, -0.009828567504882812, -0.005718231201171875, -0.0016078948974609375, 0.00250244140625, 0.0066127777099609375, 0.010723114013671875, 0.014833450317382812, 0.01894378662109375, 0.023054122924804688, 0.027164459228515625, 0.03127479553222656, 0.0353851318359375, 0.03949546813964844, 0.043605804443359375, 0.04771614074707031, 0.05182647705078125, 0.05593681335449219, 0.060047149658203125, 0.06415748596191406, 0.068267822265625, 0.07237815856933594, 0.07648849487304688, 0.08059883117675781, 0.08470916748046875, 0.08881950378417969, 0.09292984008789062, 0.09704017639160156, 0.1011505126953125, 0.10526084899902344, 0.10937118530273438, 0.11348152160644531, 0.11759185791015625, 0.12170219421386719, 0.12581253051757812, 0.12992286682128906, 0.134033203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 6.0, 1.0, 5.0, 8.0, 7.0, 6.0, 15.0, 15.0, 23.0, 15.0, 22.0, 31.0, 36.0, 36.0, 36.0, 53.0, 39.0, 59.0, 59.0, 44.0, 54.0, 49.0, 48.0, 52.0, 54.0, 39.0, 33.0, 37.0, 16.0, 27.0, 15.0, 12.0, 4.0, 18.0, 6.0, 9.0, 2.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049591064453125, -0.047965049743652344, -0.04633903503417969, -0.04471302032470703, -0.043087005615234375, -0.04146099090576172, -0.03983497619628906, -0.038208961486816406, -0.03658294677734375, -0.034956932067871094, -0.03333091735839844, -0.03170490264892578, -0.030078887939453125, -0.02845287322998047, -0.026826858520507812, -0.025200843811035156, -0.0235748291015625, -0.021948814392089844, -0.020322799682617188, -0.01869678497314453, -0.017070770263671875, -0.015444755554199219, -0.013818740844726562, -0.012192726135253906, -0.01056671142578125, -0.008940696716308594, -0.0073146820068359375, -0.005688667297363281, -0.004062652587890625, -0.0024366378784179688, -0.0008106231689453125, 0.0008153915405273438, 0.00244140625, 0.004067420959472656, 0.0056934356689453125, 0.007319450378417969, 0.008945465087890625, 0.010571479797363281, 0.012197494506835938, 0.013823509216308594, 0.01544952392578125, 0.017075538635253906, 0.018701553344726562, 0.02032756805419922, 0.021953582763671875, 0.02357959747314453, 0.025205612182617188, 0.026831626892089844, 0.0284576416015625, 0.030083656311035156, 0.03170967102050781, 0.03333568572998047, 0.034961700439453125, 0.03658771514892578, 0.03821372985839844, 0.039839744567871094, 0.04146575927734375, 0.043091773986816406, 0.04471778869628906, 0.04634380340576172, 0.047969818115234375, 0.04959583282470703, 0.05122184753417969, 0.052847862243652344, 0.054473876953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 11.0, 13.0, 22.0, 31.0, 53.0, 48.0, 76.0, 126.0, 173.0, 221.0, 383.0, 567.0, 1092.0, 8399.0, 3517375.0, 658562.0, 5105.0, 832.0, 369.0, 216.0, 183.0, 114.0, 87.0, 56.0, 43.0, 30.0, 24.0, 19.0, 7.0, 12.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5094223022460938, -0.4939422607421875, -0.47846221923828125, -0.462982177734375, -0.44750213623046875, -0.4320220947265625, -0.41654205322265625, -0.40106201171875, -0.38558197021484375, -0.3701019287109375, -0.35462188720703125, -0.339141845703125, -0.32366180419921875, -0.3081817626953125, -0.29270172119140625, -0.2772216796875, -0.26174163818359375, -0.2462615966796875, -0.23078155517578125, -0.215301513671875, -0.19982147216796875, -0.1843414306640625, -0.16886138916015625, -0.15338134765625, -0.13790130615234375, -0.1224212646484375, -0.10694122314453125, -0.091461181640625, -0.07598114013671875, -0.0605010986328125, -0.04502105712890625, -0.029541015625, -0.01406097412109375, 0.0014190673828125, 0.01689910888671875, 0.032379150390625, 0.04785919189453125, 0.0633392333984375, 0.07881927490234375, 0.09429931640625, 0.10977935791015625, 0.1252593994140625, 0.14073944091796875, 0.156219482421875, 0.17169952392578125, 0.1871795654296875, 0.20265960693359375, 0.2181396484375, 0.23361968994140625, 0.2490997314453125, 0.26457977294921875, 0.280059814453125, 0.29553985595703125, 0.3110198974609375, 0.32649993896484375, 0.34197998046875, 0.35746002197265625, 0.3729400634765625, 0.38842010498046875, 0.403900146484375, 0.41938018798828125, 0.4348602294921875, 0.45034027099609375, 0.4658203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 7.0, 8.0, 17.0, 38.0, 99.0, 207.0, 773.0, 1764.0, 775.0, 229.0, 79.0, 44.0, 20.0, 15.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.56005859375, -0.5493927001953125, -0.538726806640625, -0.5280609130859375, -0.51739501953125, -0.5067291259765625, -0.496063232421875, -0.4853973388671875, -0.4747314453125, -0.4640655517578125, -0.453399658203125, -0.4427337646484375, -0.43206787109375, -0.4214019775390625, -0.410736083984375, -0.4000701904296875, -0.389404296875, -0.3787384033203125, -0.368072509765625, -0.3574066162109375, -0.34674072265625, -0.3360748291015625, -0.325408935546875, -0.3147430419921875, -0.3040771484375, -0.2934112548828125, -0.282745361328125, -0.2720794677734375, -0.26141357421875, -0.2507476806640625, -0.240081787109375, -0.2294158935546875, -0.21875, -0.2080841064453125, -0.197418212890625, -0.1867523193359375, -0.17608642578125, -0.1654205322265625, -0.154754638671875, -0.1440887451171875, -0.1334228515625, -0.1227569580078125, -0.112091064453125, -0.1014251708984375, -0.09075927734375, -0.0800933837890625, -0.069427490234375, -0.0587615966796875, -0.048095703125, -0.0374298095703125, -0.026763916015625, -0.0160980224609375, -0.00543212890625, 0.0052337646484375, 0.015899658203125, 0.0265655517578125, 0.0372314453125, 0.0478973388671875, 0.058563232421875, 0.0692291259765625, 0.07989501953125, 0.0905609130859375, 0.101226806640625, 0.1118927001953125, 0.12255859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 14.0, 19.0, 60.0, 109.0, 208.0, 281.0, 152.0, 70.0, 36.0, 13.0, 4.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.8337228298187256, -3.740873336791992, -3.6480236053466797, -3.5551741123199463, -3.462324380874634, -3.3694748878479004, -3.276625156402588, -3.1837756633758545, -3.090926170349121, -2.9980766773223877, -2.905226945877075, -2.812377452850342, -2.7195277214050293, -2.626678228378296, -2.5338287353515625, -2.44097900390625, -2.3481292724609375, -2.255279779434204, -2.1624300479888916, -2.069580554962158, -1.9767308235168457, -1.8838813304901123, -1.7910317182540894, -1.6981821060180664, -1.6053324937820435, -1.5124828815460205, -1.4196332693099976, -1.3267836570739746, -1.2339341640472412, -1.1410844326019287, -1.0482349395751953, -0.9553853273391724, -0.8625359535217285, -0.7696863412857056, -0.6768367290496826, -0.5839871764183044, -0.4911375641822815, -0.39828795194625854, -0.30543839931488037, -0.21258878707885742, -0.11973917484283447, -0.026889577507972717, 0.06596001982688904, 0.1588096022605896, 0.25165921449661255, 0.3445088267326355, 0.43735837936401367, 0.5302079916000366, 0.6230576038360596, 0.7159072160720825, 0.8087568283081055, 0.9016063809394836, 0.9944559931755066, 1.0873055458068848, 1.1801551580429077, 1.2730047702789307, 1.3658543825149536, 1.4587039947509766, 1.5515536069869995, 1.6444032192230225, 1.7372527122497559, 1.8301024436950684, 1.9229519367218018, 2.015801429748535, 2.1086511611938477]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 2.0, 8.0, 6.0, 7.0, 8.0, 12.0, 10.0, 15.0, 16.0, 13.0, 33.0, 29.0, 37.0, 44.0, 40.0, 48.0, 49.0, 50.0, 54.0, 55.0, 65.0, 51.0, 56.0, 54.0, 34.0, 42.0, 33.0, 21.0, 24.0, 14.0, 13.0, 17.0, 13.0, 4.0, 3.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8276990056037903, -0.7997447848320007, -0.771790623664856, -0.7438364028930664, -0.7158821821212769, -0.6879280209541321, -0.6599738001823425, -0.6320196390151978, -0.6040654182434082, -0.5761111974716187, -0.5481570363044739, -0.5202028155326843, -0.49224862456321716, -0.46429443359375, -0.43634021282196045, -0.4083860218524933, -0.38043180108070374, -0.3524776101112366, -0.324523389339447, -0.29656919836997986, -0.2686150074005127, -0.24066080152988434, -0.21270659565925598, -0.18475240468978882, -0.15679819881916046, -0.1288439929485321, -0.10088980197906494, -0.07293559610843658, -0.044981397688388824, -0.017027199268341064, 0.010927006602287292, 0.038881197571754456, 0.06683540344238281, 0.09478960186243057, 0.12274380028247833, 0.1506980061531067, 0.17865219712257385, 0.2066064029932022, 0.23456060886383057, 0.26251479983329773, 0.2904689908027649, 0.31842318177223206, 0.3463774025440216, 0.37433159351348877, 0.40228578448295593, 0.4302399754524231, 0.45819419622421265, 0.4861483871936798, 0.514102578163147, 0.5420567989349365, 0.5700109601020813, 0.5979651808738708, 0.6259194016456604, 0.6538735628128052, 0.6818277835845947, 0.7097820043563843, 0.7377362251281738, 0.7656904458999634, 0.7936446070671082, 0.8215988278388977, 0.8495530486106873, 0.877507209777832, 0.9054614305496216, 0.9334156513214111, 0.9613698124885559]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 12.0, 19.0, 28.0, 36.0, 62.0, 85.0, 95.0, 200.0, 281.0, 454.0, 759.0, 1222.0, 2119.0, 3838.0, 7430.0, 15614.0, 35329.0, 88117.0, 213508.0, 324440.0, 206284.0, 83619.0, 33793.0, 14790.0, 7232.0, 3842.0, 2145.0, 1180.0, 741.0, 403.0, 286.0, 195.0, 125.0, 89.0, 55.0, 34.0, 30.0, 12.0, 17.0, 11.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.119873046875, -0.11658668518066406, -0.11330032348632812, -0.11001396179199219, -0.10672760009765625, -0.10344123840332031, -0.10015487670898438, -0.09686851501464844, -0.0935821533203125, -0.09029579162597656, -0.08700942993164062, -0.08372306823730469, -0.08043670654296875, -0.07715034484863281, -0.07386398315429688, -0.07057762145996094, -0.067291259765625, -0.06400489807128906, -0.060718536376953125, -0.05743217468261719, -0.05414581298828125, -0.05085945129394531, -0.047573089599609375, -0.04428672790527344, -0.0410003662109375, -0.03771400451660156, -0.034427642822265625, -0.031141281127929688, -0.02785491943359375, -0.024568557739257812, -0.021282196044921875, -0.017995834350585938, -0.01470947265625, -0.011423110961914062, -0.008136749267578125, -0.0048503875732421875, -0.00156402587890625, 0.0017223358154296875, 0.005008697509765625, 0.008295059204101562, 0.0115814208984375, 0.014867782592773438, 0.018154144287109375, 0.021440505981445312, 0.02472686767578125, 0.028013229370117188, 0.031299591064453125, 0.03458595275878906, 0.037872314453125, 0.04115867614746094, 0.044445037841796875, 0.04773139953613281, 0.05101776123046875, 0.05430412292480469, 0.057590484619140625, 0.06087684631347656, 0.0641632080078125, 0.06744956970214844, 0.07073593139648438, 0.07402229309082031, 0.07730865478515625, 0.08059501647949219, 0.08388137817382812, 0.08716773986816406, 0.0904541015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 6.0, 1.0, 9.0, 7.0, 7.0, 9.0, 14.0, 19.0, 25.0, 29.0, 21.0, 29.0, 30.0, 34.0, 45.0, 39.0, 49.0, 45.0, 46.0, 45.0, 53.0, 53.0, 42.0, 35.0, 45.0, 44.0, 34.0, 26.0, 32.0, 23.0, 24.0, 15.0, 15.0, 13.0, 4.0, 6.0, 11.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06085205078125, -0.05908536911010742, -0.057318687438964844, -0.055552005767822266, -0.05378532409667969, -0.05201864242553711, -0.05025196075439453, -0.04848527908325195, -0.046718597412109375, -0.0449519157409668, -0.04318523406982422, -0.04141855239868164, -0.03965187072753906, -0.037885189056396484, -0.036118507385253906, -0.03435182571411133, -0.03258514404296875, -0.030818462371826172, -0.029051780700683594, -0.027285099029541016, -0.025518417358398438, -0.02375173568725586, -0.02198505401611328, -0.020218372344970703, -0.018451690673828125, -0.016685009002685547, -0.014918327331542969, -0.01315164566040039, -0.011384963989257812, -0.009618282318115234, -0.007851600646972656, -0.006084918975830078, -0.0043182373046875, -0.002551555633544922, -0.0007848739624023438, 0.0009818077087402344, 0.0027484893798828125, 0.004515171051025391, 0.006281852722167969, 0.008048534393310547, 0.009815216064453125, 0.011581897735595703, 0.013348579406738281, 0.01511526107788086, 0.016881942749023438, 0.018648624420166016, 0.020415306091308594, 0.022181987762451172, 0.02394866943359375, 0.025715351104736328, 0.027482032775878906, 0.029248714447021484, 0.031015396118164062, 0.03278207778930664, 0.03454875946044922, 0.0363154411315918, 0.038082122802734375, 0.03984880447387695, 0.04161548614501953, 0.04338216781616211, 0.04514884948730469, 0.046915531158447266, 0.048682212829589844, 0.05044889450073242, 0.052215576171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 3.0, 9.0, 11.0, 14.0, 27.0, 35.0, 48.0, 63.0, 126.0, 166.0, 268.0, 455.0, 734.0, 1298.0, 2474.0, 5249.0, 13944.0, 52381.0, 266137.0, 576600.0, 92616.0, 21410.0, 7311.0, 3159.0, 1639.0, 936.0, 526.0, 339.0, 199.0, 123.0, 79.0, 56.0, 34.0, 31.0, 13.0, 14.0, 17.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1768798828125, -0.17037200927734375, -0.1638641357421875, -0.15735626220703125, -0.150848388671875, -0.14434051513671875, -0.1378326416015625, -0.13132476806640625, -0.12481689453125, -0.11830902099609375, -0.1118011474609375, -0.10529327392578125, -0.098785400390625, -0.09227752685546875, -0.0857696533203125, -0.07926177978515625, -0.07275390625, -0.06624603271484375, -0.0597381591796875, -0.05323028564453125, -0.046722412109375, -0.04021453857421875, -0.0337066650390625, -0.02719879150390625, -0.02069091796875, -0.01418304443359375, -0.0076751708984375, -0.00116729736328125, 0.005340576171875, 0.01184844970703125, 0.0183563232421875, 0.02486419677734375, 0.0313720703125, 0.03787994384765625, 0.0443878173828125, 0.05089569091796875, 0.057403564453125, 0.06391143798828125, 0.0704193115234375, 0.07692718505859375, 0.08343505859375, 0.08994293212890625, 0.0964508056640625, 0.10295867919921875, 0.109466552734375, 0.11597442626953125, 0.1224822998046875, 0.12899017333984375, 0.135498046875, 0.14200592041015625, 0.1485137939453125, 0.15502166748046875, 0.161529541015625, 0.16803741455078125, 0.1745452880859375, 0.18105316162109375, 0.18756103515625, 0.19406890869140625, 0.2005767822265625, 0.20708465576171875, 0.213592529296875, 0.22010040283203125, 0.2266082763671875, 0.23311614990234375, 0.2396240234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 4.0, 8.0, 7.0, 16.0, 12.0, 16.0, 17.0, 26.0, 29.0, 29.0, 41.0, 38.0, 51.0, 57.0, 53.0, 50.0, 55.0, 60.0, 58.0, 46.0, 43.0, 38.0, 37.0, 37.0, 33.0, 25.0, 22.0, 14.0, 18.0, 10.0, 10.0, 5.0, 8.0, 4.0, 9.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2279052734375, -0.22035789489746094, -0.21281051635742188, -0.2052631378173828, -0.19771575927734375, -0.1901683807373047, -0.18262100219726562, -0.17507362365722656, -0.1675262451171875, -0.15997886657714844, -0.15243148803710938, -0.1448841094970703, -0.13733673095703125, -0.1297893524169922, -0.12224197387695312, -0.11469459533691406, -0.107147216796875, -0.09959983825683594, -0.09205245971679688, -0.08450508117675781, -0.07695770263671875, -0.06941032409667969, -0.061862945556640625, -0.05431556701660156, -0.0467681884765625, -0.03922080993652344, -0.031673431396484375, -0.024126052856445312, -0.01657867431640625, -0.009031295776367188, -0.001483917236328125, 0.0060634613037109375, 0.01361083984375, 0.021158218383789062, 0.028705596923828125, 0.03625297546386719, 0.04380035400390625, 0.05134773254394531, 0.058895111083984375, 0.06644248962402344, 0.0739898681640625, 0.08153724670410156, 0.08908462524414062, 0.09663200378417969, 0.10417938232421875, 0.11172676086425781, 0.11927413940429688, 0.12682151794433594, 0.134368896484375, 0.14191627502441406, 0.14946365356445312, 0.1570110321044922, 0.16455841064453125, 0.1721057891845703, 0.17965316772460938, 0.18720054626464844, 0.1947479248046875, 0.20229530334472656, 0.20984268188476562, 0.2173900604248047, 0.22493743896484375, 0.2324848175048828, 0.24003219604492188, 0.24757957458496094, 0.255126953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 9.0, 15.0, 20.0, 38.0, 54.0, 93.0, 117.0, 248.0, 357.0, 666.0, 1179.0, 2244.0, 4692.0, 11792.0, 38305.0, 198985.0, 666714.0, 86519.0, 21704.0, 7617.0, 3452.0, 1675.0, 834.0, 494.0, 289.0, 151.0, 98.0, 70.0, 38.0, 21.0, 26.0, 12.0, 7.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.104248046875, -0.10042572021484375, -0.0966033935546875, -0.09278106689453125, -0.088958740234375, -0.08513641357421875, -0.0813140869140625, -0.07749176025390625, -0.07366943359375, -0.06984710693359375, -0.0660247802734375, -0.06220245361328125, -0.058380126953125, -0.05455780029296875, -0.0507354736328125, -0.04691314697265625, -0.0430908203125, -0.03926849365234375, -0.0354461669921875, -0.03162384033203125, -0.027801513671875, -0.02397918701171875, -0.0201568603515625, -0.01633453369140625, -0.01251220703125, -0.00868988037109375, -0.0048675537109375, -0.00104522705078125, 0.002777099609375, 0.00659942626953125, 0.0104217529296875, 0.01424407958984375, 0.01806640625, 0.02188873291015625, 0.0257110595703125, 0.02953338623046875, 0.033355712890625, 0.03717803955078125, 0.0410003662109375, 0.04482269287109375, 0.04864501953125, 0.05246734619140625, 0.0562896728515625, 0.06011199951171875, 0.063934326171875, 0.06775665283203125, 0.0715789794921875, 0.07540130615234375, 0.0792236328125, 0.08304595947265625, 0.0868682861328125, 0.09069061279296875, 0.094512939453125, 0.09833526611328125, 0.1021575927734375, 0.10597991943359375, 0.10980224609375, 0.11362457275390625, 0.1174468994140625, 0.12126922607421875, 0.125091552734375, 0.12891387939453125, 0.1327362060546875, 0.13655853271484375, 0.140380859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 2.0, 7.0, 7.0, 11.0, 19.0, 37.0, 60.0, 166.0, 287.0, 209.0, 91.0, 34.0, 19.0, 14.0, 8.0, 5.0, 2.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.291006088256836e-05, -7.980596274137497e-05, -7.670186460018158e-05, -7.359776645898819e-05, -7.04936683177948e-05, -6.738957017660141e-05, -6.428547203540802e-05, -6.118137389421463e-05, -5.807727575302124e-05, -5.497317761182785e-05, -5.186907947063446e-05, -4.876498132944107e-05, -4.566088318824768e-05, -4.255678504705429e-05, -3.94526869058609e-05, -3.634858876466751e-05, -3.324449062347412e-05, -3.014039248228073e-05, -2.703629434108734e-05, -2.393219619989395e-05, -2.082809805870056e-05, -1.772399991750717e-05, -1.4619901776313782e-05, -1.1515803635120392e-05, -8.411705493927002e-06, -5.307607352733612e-06, -2.203509211540222e-06, 9.005889296531677e-07, 4.004687070846558e-06, 7.1087852120399475e-06, 1.0212883353233337e-05, 1.3316981494426727e-05, 1.6421079635620117e-05, 1.9525177776813507e-05, 2.2629275918006897e-05, 2.5733374059200287e-05, 2.8837472200393677e-05, 3.194157034158707e-05, 3.5045668482780457e-05, 3.8149766623973846e-05, 4.1253864765167236e-05, 4.4357962906360626e-05, 4.7462061047554016e-05, 5.0566159188747406e-05, 5.3670257329940796e-05, 5.6774355471134186e-05, 5.9878453612327576e-05, 6.298255175352097e-05, 6.608664989471436e-05, 6.919074803590775e-05, 7.229484617710114e-05, 7.539894431829453e-05, 7.850304245948792e-05, 8.16071406006813e-05, 8.47112387418747e-05, 8.781533688306808e-05, 9.091943502426147e-05, 9.402353316545486e-05, 9.712763130664825e-05, 0.00010023172944784164, 0.00010333582758903503, 0.00010643992573022842, 0.00010954402387142181, 0.0001126481220126152, 0.0001157522201538086]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 8.0, 2.0, 7.0, 8.0, 7.0, 8.0, 24.0, 31.0, 59.0, 66.0, 113.0, 156.0, 265.0, 367.0, 622.0, 1125.0, 2009.0, 3795.0, 7869.0, 18409.0, 51454.0, 189934.0, 579821.0, 126804.0, 37647.0, 14242.0, 6403.0, 3139.0, 1688.0, 952.0, 569.0, 310.0, 197.0, 131.0, 97.0, 71.0, 37.0, 29.0, 19.0, 22.0, 9.0, 9.0, 11.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08349609375, -0.08074569702148438, -0.07799530029296875, -0.07524490356445312, -0.0724945068359375, -0.06974411010742188, -0.06699371337890625, -0.06424331665039062, -0.061492919921875, -0.058742523193359375, -0.05599212646484375, -0.053241729736328125, -0.0504913330078125, -0.047740936279296875, -0.04499053955078125, -0.042240142822265625, -0.03948974609375, -0.036739349365234375, -0.03398895263671875, -0.031238555908203125, -0.0284881591796875, -0.025737762451171875, -0.02298736572265625, -0.020236968994140625, -0.017486572265625, -0.014736175537109375, -0.01198577880859375, -0.009235382080078125, -0.0064849853515625, -0.003734588623046875, -0.00098419189453125, 0.001766204833984375, 0.0045166015625, 0.007266998291015625, 0.01001739501953125, 0.012767791748046875, 0.0155181884765625, 0.018268585205078125, 0.02101898193359375, 0.023769378662109375, 0.026519775390625, 0.029270172119140625, 0.03202056884765625, 0.034770965576171875, 0.0375213623046875, 0.040271759033203125, 0.04302215576171875, 0.045772552490234375, 0.04852294921875, 0.051273345947265625, 0.05402374267578125, 0.056774139404296875, 0.0595245361328125, 0.062274932861328125, 0.06502532958984375, 0.06777572631835938, 0.070526123046875, 0.07327651977539062, 0.07602691650390625, 0.07877731323242188, 0.0815277099609375, 0.08427810668945312, 0.08702850341796875, 0.08977890014648438, 0.092529296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 5.0, 10.0, 11.0, 12.0, 19.0, 18.0, 45.0, 43.0, 53.0, 71.0, 89.0, 110.0, 101.0, 84.0, 50.0, 55.0, 52.0, 30.0, 32.0, 24.0, 13.0, 12.0, 8.0, 8.0, 4.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10272216796875, -0.09951496124267578, -0.09630775451660156, -0.09310054779052734, -0.08989334106445312, -0.0866861343383789, -0.08347892761230469, -0.08027172088623047, -0.07706451416015625, -0.07385730743408203, -0.07065010070800781, -0.0674428939819336, -0.06423568725585938, -0.061028480529785156, -0.05782127380371094, -0.05461406707763672, -0.0514068603515625, -0.04819965362548828, -0.04499244689941406, -0.041785240173339844, -0.038578033447265625, -0.035370826721191406, -0.03216361999511719, -0.02895641326904297, -0.02574920654296875, -0.02254199981689453, -0.019334793090820312, -0.016127586364746094, -0.012920379638671875, -0.009713172912597656, -0.0065059661865234375, -0.0032987594604492188, -9.1552734375e-05, 0.0031156539916992188, 0.0063228607177734375, 0.009530067443847656, 0.012737274169921875, 0.015944480895996094, 0.019151687622070312, 0.02235889434814453, 0.02556610107421875, 0.02877330780029297, 0.03198051452636719, 0.035187721252441406, 0.038394927978515625, 0.041602134704589844, 0.04480934143066406, 0.04801654815673828, 0.0512237548828125, 0.05443096160888672, 0.05763816833496094, 0.060845375061035156, 0.06405258178710938, 0.0672597885131836, 0.07046699523925781, 0.07367420196533203, 0.07688140869140625, 0.08008861541748047, 0.08329582214355469, 0.0865030288696289, 0.08971023559570312, 0.09291744232177734, 0.09612464904785156, 0.09933185577392578, 0.1025390625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 8.0, 15.0, 34.0, 72.0, 131.0, 254.0, 219.0, 127.0, 60.0, 30.0, 18.0, 10.0, 8.0, 4.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3953869342803955, -1.3076300621032715, -1.219873309135437, -1.132116436958313, -1.0443596839904785, -0.9566028118133545, -0.8688459396362305, -0.7810891270637512, -0.693332314491272, -0.6055755019187927, -0.5178186893463135, -0.43006181716918945, -0.3423050045967102, -0.25454819202423096, -0.16679131984710693, -0.07903450727462769, 0.008722305297851562, 0.096479132771492, 0.18423596024513245, 0.2719928026199341, 0.35974961519241333, 0.4475064277648926, 0.5352632999420166, 0.6230201125144958, 0.7107769250869751, 0.7985337376594543, 0.8862905502319336, 0.9740474224090576, 1.0618042945861816, 1.1495610475540161, 1.2373179197311401, 1.3250746726989746, 1.4128313064575195, 1.5005881786346436, 1.588344931602478, 1.676101803779602, 1.7638585567474365, 1.8516154289245605, 1.9393723011016846, 2.0271291732788086, 2.1148858070373535, 2.2026426792144775, 2.2903995513916016, 2.3781561851501465, 2.4659130573272705, 2.5536699295043945, 2.6414268016815186, 2.7291836738586426, 2.8169405460357666, 2.9046974182128906, 2.9924542903900146, 3.0802111625671387, 3.1679677963256836, 3.2557246685028076, 3.3434815406799316, 3.4312384128570557, 3.5189952850341797, 3.6067521572113037, 3.6945090293884277, 3.7822656631469727, 3.8700225353240967, 3.9577794075012207, 4.045536041259766, 4.133293151855469, 4.221049785614014]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 5.0, 3.0, 7.0, 8.0, 5.0, 11.0, 18.0, 15.0, 18.0, 31.0, 22.0, 18.0, 29.0, 30.0, 31.0, 43.0, 42.0, 68.0, 72.0, 81.0, 74.0, 64.0, 38.0, 43.0, 27.0, 34.0, 22.0, 22.0, 18.0, 11.0, 14.0, 14.0, 15.0, 12.0, 9.0, 8.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7888940572738647, -0.758541464805603, -0.7281888127326965, -0.6978362202644348, -0.6674835681915283, -0.6371309757232666, -0.6067783236503601, -0.5764257311820984, -0.5460730791091919, -0.5157204866409302, -0.4853678345680237, -0.4550152122974396, -0.42466259002685547, -0.39430999755859375, -0.36395734548568726, -0.33360475301742554, -0.30325213074684143, -0.2728995084762573, -0.24254688620567322, -0.2121942639350891, -0.181841641664505, -0.1514890342950821, -0.12113641202449799, -0.09078378975391388, -0.06043116748332977, -0.030078547075390816, 0.0002740733325481415, 0.03062669187784195, 0.060979314148426056, 0.09133192896842957, 0.12168455123901367, 0.15203717350959778, 0.18238979578018188, 0.212742418050766, 0.2430950403213501, 0.2734476625919342, 0.3038002848625183, 0.33415287733078003, 0.3645055294036865, 0.39485812187194824, 0.42521077394485474, 0.45556339621543884, 0.48591601848602295, 0.5162686109542847, 0.5466212630271912, 0.5769738554954529, 0.6073265075683594, 0.6376791000366211, 0.6680316925048828, 0.6983842849731445, 0.728736937046051, 0.7590895295143127, 0.7894421815872192, 0.819794774055481, 0.8501474261283875, 0.8805000185966492, 0.9108526706695557, 0.9412052631378174, 0.9715579152107239, 1.0019105672836304, 1.032263159751892, 1.0626157522201538, 1.0929683446884155, 1.1233210563659668, 1.1536736488342285]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 9.0, 7.0, 5.0, 18.0, 22.0, 45.0, 68.0, 89.0, 177.0, 282.0, 505.0, 963.0, 1865.0, 3908.0, 8919.0, 24775.0, 103256.0, 1156368.0, 2586996.0, 241684.0, 40259.0, 13123.0, 5500.0, 2502.0, 1302.0, 673.0, 363.0, 218.0, 135.0, 90.0, 61.0, 36.0, 20.0, 14.0, 11.0, 11.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.157958984375, -0.15402984619140625, -0.1501007080078125, -0.14617156982421875, -0.142242431640625, -0.13831329345703125, -0.1343841552734375, -0.13045501708984375, -0.12652587890625, -0.12259674072265625, -0.1186676025390625, -0.11473846435546875, -0.110809326171875, -0.10688018798828125, -0.1029510498046875, -0.09902191162109375, -0.0950927734375, -0.09116363525390625, -0.0872344970703125, -0.08330535888671875, -0.079376220703125, -0.07544708251953125, -0.0715179443359375, -0.06758880615234375, -0.06365966796875, -0.05973052978515625, -0.0558013916015625, -0.05187225341796875, -0.047943115234375, -0.04401397705078125, -0.0400848388671875, -0.03615570068359375, -0.0322265625, -0.02829742431640625, -0.0243682861328125, -0.02043914794921875, -0.016510009765625, -0.01258087158203125, -0.0086517333984375, -0.00472259521484375, -0.00079345703125, 0.00313568115234375, 0.0070648193359375, 0.01099395751953125, 0.014923095703125, 0.01885223388671875, 0.0227813720703125, 0.02671051025390625, 0.0306396484375, 0.03456878662109375, 0.0384979248046875, 0.04242706298828125, 0.046356201171875, 0.05028533935546875, 0.0542144775390625, 0.05814361572265625, 0.06207275390625, 0.06600189208984375, 0.0699310302734375, 0.07386016845703125, 0.077789306640625, 0.08171844482421875, 0.0856475830078125, 0.08957672119140625, 0.093505859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 7.0, 3.0, 5.0, 5.0, 7.0, 16.0, 7.0, 17.0, 17.0, 15.0, 16.0, 19.0, 25.0, 25.0, 39.0, 37.0, 41.0, 40.0, 47.0, 48.0, 43.0, 48.0, 45.0, 37.0, 49.0, 49.0, 31.0, 37.0, 29.0, 31.0, 26.0, 16.0, 25.0, 20.0, 12.0, 15.0, 12.0, 11.0, 7.0, 10.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0452880859375, -0.043634891510009766, -0.04198169708251953, -0.0403285026550293, -0.03867530822753906, -0.03702211380004883, -0.035368919372558594, -0.03371572494506836, -0.032062530517578125, -0.03040933609008789, -0.028756141662597656, -0.027102947235107422, -0.025449752807617188, -0.023796558380126953, -0.02214336395263672, -0.020490169525146484, -0.01883697509765625, -0.017183780670166016, -0.015530586242675781, -0.013877391815185547, -0.012224197387695312, -0.010571002960205078, -0.008917808532714844, -0.007264614105224609, -0.005611419677734375, -0.003958225250244141, -0.0023050308227539062, -0.0006518363952636719, 0.0010013580322265625, 0.002654552459716797, 0.004307746887207031, 0.005960941314697266, 0.0076141357421875, 0.009267330169677734, 0.010920524597167969, 0.012573719024658203, 0.014226913452148438, 0.015880107879638672, 0.017533302307128906, 0.01918649673461914, 0.020839691162109375, 0.02249288558959961, 0.024146080017089844, 0.025799274444580078, 0.027452468872070312, 0.029105663299560547, 0.03075885772705078, 0.032412052154541016, 0.03406524658203125, 0.035718441009521484, 0.03737163543701172, 0.03902482986450195, 0.04067802429199219, 0.04233121871948242, 0.043984413146972656, 0.04563760757446289, 0.047290802001953125, 0.04894399642944336, 0.050597190856933594, 0.05225038528442383, 0.05390357971191406, 0.0555567741394043, 0.05720996856689453, 0.058863162994384766, 0.060516357421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 17.0, 16.0, 53.0, 101.0, 197.0, 530.0, 2944.0, 157564.0, 4022277.0, 9054.0, 991.0, 336.0, 113.0, 48.0, 24.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.919921875, -0.8930282592773438, -0.8661346435546875, -0.8392410278320312, -0.812347412109375, -0.7854537963867188, -0.7585601806640625, -0.7316665649414062, -0.70477294921875, -0.6778793334960938, -0.6509857177734375, -0.6240921020507812, -0.597198486328125, -0.5703048706054688, -0.5434112548828125, -0.5165176391601562, -0.4896240234375, -0.46273040771484375, -0.4358367919921875, -0.40894317626953125, -0.382049560546875, -0.35515594482421875, -0.3282623291015625, -0.30136871337890625, -0.27447509765625, -0.24758148193359375, -0.2206878662109375, -0.19379425048828125, -0.166900634765625, -0.14000701904296875, -0.1131134033203125, -0.08621978759765625, -0.059326171875, -0.03243255615234375, -0.0055389404296875, 0.02135467529296875, 0.048248291015625, 0.07514190673828125, 0.1020355224609375, 0.12892913818359375, 0.15582275390625, 0.18271636962890625, 0.2096099853515625, 0.23650360107421875, 0.263397216796875, 0.29029083251953125, 0.3171844482421875, 0.34407806396484375, 0.3709716796875, 0.39786529541015625, 0.4247589111328125, 0.45165252685546875, 0.478546142578125, 0.5054397583007812, 0.5323333740234375, 0.5592269897460938, 0.58612060546875, 0.6130142211914062, 0.6399078369140625, 0.6668014526367188, 0.693695068359375, 0.7205886840820312, 0.7474822998046875, 0.7743759155273438, 0.80126953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 19.0, 16.0, 50.0, 90.0, 168.0, 614.0, 1790.0, 891.0, 241.0, 92.0, 41.0, 27.0, 10.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.619140625, -0.604949951171875, -0.59075927734375, -0.576568603515625, -0.5623779296875, -0.548187255859375, -0.53399658203125, -0.519805908203125, -0.505615234375, -0.491424560546875, -0.47723388671875, -0.463043212890625, -0.4488525390625, -0.434661865234375, -0.42047119140625, -0.406280517578125, -0.39208984375, -0.377899169921875, -0.36370849609375, -0.349517822265625, -0.3353271484375, -0.321136474609375, -0.30694580078125, -0.292755126953125, -0.278564453125, -0.264373779296875, -0.25018310546875, -0.235992431640625, -0.2218017578125, -0.207611083984375, -0.19342041015625, -0.179229736328125, -0.1650390625, -0.150848388671875, -0.13665771484375, -0.122467041015625, -0.1082763671875, -0.094085693359375, -0.07989501953125, -0.065704345703125, -0.051513671875, -0.037322998046875, -0.02313232421875, -0.008941650390625, 0.0052490234375, 0.019439697265625, 0.03363037109375, 0.047821044921875, 0.06201171875, 0.076202392578125, 0.09039306640625, 0.104583740234375, 0.1187744140625, 0.132965087890625, 0.14715576171875, 0.161346435546875, 0.175537109375, 0.189727783203125, 0.20391845703125, 0.218109130859375, 0.2322998046875, 0.246490478515625, 0.26068115234375, 0.274871826171875, 0.2890625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 8.0, 12.0, 39.0, 77.0, 189.0, 279.0, 235.0, 114.0, 39.0, 9.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.800698757171631, -3.680863857269287, -3.5610289573669434, -3.4411942958831787, -3.321359395980835, -3.201524496078491, -3.0816895961761475, -2.961854934692383, -2.842020034790039, -2.7221851348876953, -2.6023502349853516, -2.482515573501587, -2.362680673599243, -2.2428457736968994, -2.1230108737945557, -2.003176212310791, -1.8833411931991577, -1.763506293296814, -1.6436715126037598, -1.523836612701416, -1.4040018320083618, -1.284166932106018, -1.1643321514129639, -1.0444972515106201, -0.9246624112129211, -0.8048275709152222, -0.6849927306175232, -0.5651578903198242, -0.44532302021980286, -0.3254881501197815, -0.20565330982208252, -0.08581846952438354, 0.03401637077331543, 0.1538512110710144, 0.2736860513687134, 0.39352092146873474, 0.5133557319641113, 0.6331906318664551, 0.753025472164154, 0.872860312461853, 0.992695152759552, 1.112529993057251, 1.2323648929595947, 1.352199673652649, 1.4720345735549927, 1.5918693542480469, 1.7117042541503906, 1.8315391540527344, 1.9513739347457886, 2.0712087154388428, 2.1910436153411865, 2.3108785152435303, 2.430713415145874, 2.5505480766296387, 2.6703829765319824, 2.790217876434326, 2.91005277633667, 3.0298876762390137, 3.1497225761413574, 3.269557237625122, 3.389392137527466, 3.5092270374298096, 3.6290619373321533, 3.748896598815918, 3.8687314987182617]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 3.0, 7.0, 13.0, 13.0, 11.0, 15.0, 17.0, 13.0, 31.0, 25.0, 30.0, 36.0, 30.0, 35.0, 35.0, 39.0, 40.0, 35.0, 43.0, 38.0, 52.0, 40.0, 42.0, 33.0, 39.0, 47.0, 42.0, 47.0, 33.0, 25.0, 18.0, 15.0, 13.0, 11.0, 8.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9181565642356873, -0.8884775638580322, -0.8587985038757324, -0.8291195034980774, -0.7994405031204224, -0.7697615027427673, -0.7400825023651123, -0.7104034423828125, -0.6807244420051575, -0.6510454416275024, -0.6213663816452026, -0.5916873812675476, -0.5620083808898926, -0.5323293805122375, -0.5026503801345825, -0.4729713201522827, -0.4432923197746277, -0.41361331939697266, -0.38393428921699524, -0.3542552590370178, -0.3245762586593628, -0.29489725828170776, -0.26521822810173035, -0.23553921282291412, -0.2058601975440979, -0.17618118226528168, -0.14650216698646545, -0.11682315170764923, -0.08714413642883301, -0.057465121150016785, -0.02778610587120056, 0.0018929094076156616, 0.031571924686431885, 0.06125093996524811, 0.09092995524406433, 0.12060897052288055, 0.15028798580169678, 0.179967001080513, 0.20964601635932922, 0.23932503163814545, 0.26900404691696167, 0.2986830472946167, 0.3283620774745941, 0.35804110765457153, 0.38772010803222656, 0.4173991084098816, 0.447078138589859, 0.4767571687698364, 0.5064361691474915, 0.5361151695251465, 0.5657942295074463, 0.5954732298851013, 0.6251522302627563, 0.6548312306404114, 0.6845102310180664, 0.7141892910003662, 0.7438682913780212, 0.7735472917556763, 0.8032263517379761, 0.8329053521156311, 0.8625843524932861, 0.8922633528709412, 0.9219423532485962, 0.951621413230896, 0.981300413608551]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 8.0, 18.0, 22.0, 28.0, 42.0, 57.0, 97.0, 133.0, 212.0, 341.0, 541.0, 928.0, 1583.0, 2812.0, 5125.0, 9798.0, 19228.0, 39308.0, 82220.0, 165743.0, 266266.0, 222115.0, 117732.0, 56631.0, 27395.0, 13949.0, 7195.0, 3761.0, 2113.0, 1226.0, 667.0, 448.0, 273.0, 152.0, 116.0, 83.0, 65.0, 32.0, 24.0, 14.0, 15.0, 11.0, 7.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07794189453125, -0.0751333236694336, -0.07232475280761719, -0.06951618194580078, -0.06670761108398438, -0.06389904022216797, -0.06109046936035156, -0.058281898498535156, -0.05547332763671875, -0.052664756774902344, -0.04985618591308594, -0.04704761505126953, -0.044239044189453125, -0.04143047332763672, -0.03862190246582031, -0.035813331604003906, -0.0330047607421875, -0.030196189880371094, -0.027387619018554688, -0.02457904815673828, -0.021770477294921875, -0.01896190643310547, -0.016153335571289062, -0.013344764709472656, -0.01053619384765625, -0.007727622985839844, -0.0049190521240234375, -0.0021104812622070312, 0.000698089599609375, 0.0035066604614257812, 0.0063152313232421875, 0.009123802185058594, 0.011932373046875, 0.014740943908691406, 0.017549514770507812, 0.02035808563232422, 0.023166656494140625, 0.02597522735595703, 0.028783798217773438, 0.031592369079589844, 0.03440093994140625, 0.037209510803222656, 0.04001808166503906, 0.04282665252685547, 0.045635223388671875, 0.04844379425048828, 0.05125236511230469, 0.054060935974121094, 0.0568695068359375, 0.059678077697753906, 0.06248664855957031, 0.06529521942138672, 0.06810379028320312, 0.07091236114501953, 0.07372093200683594, 0.07652950286865234, 0.07933807373046875, 0.08214664459228516, 0.08495521545410156, 0.08776378631591797, 0.09057235717773438, 0.09338092803955078, 0.09618949890136719, 0.0989980697631836, 0.101806640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 8.0, 2.0, 12.0, 11.0, 13.0, 16.0, 24.0, 21.0, 19.0, 30.0, 29.0, 44.0, 41.0, 24.0, 49.0, 41.0, 50.0, 54.0, 38.0, 40.0, 43.0, 53.0, 42.0, 37.0, 30.0, 34.0, 27.0, 32.0, 27.0, 18.0, 10.0, 18.0, 18.0, 4.0, 4.0, 11.0, 4.0, 5.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062744140625, -0.06068611145019531, -0.058628082275390625, -0.05657005310058594, -0.05451202392578125, -0.05245399475097656, -0.050395965576171875, -0.04833793640136719, -0.0462799072265625, -0.04422187805175781, -0.042163848876953125, -0.04010581970214844, -0.03804779052734375, -0.03598976135253906, -0.033931732177734375, -0.03187370300292969, -0.029815673828125, -0.027757644653320312, -0.025699615478515625, -0.023641586303710938, -0.02158355712890625, -0.019525527954101562, -0.017467498779296875, -0.015409469604492188, -0.0133514404296875, -0.011293411254882812, -0.009235382080078125, -0.0071773529052734375, -0.00511932373046875, -0.0030612945556640625, -0.001003265380859375, 0.0010547637939453125, 0.00311279296875, 0.0051708221435546875, 0.007228851318359375, 0.009286880493164062, 0.01134490966796875, 0.013402938842773438, 0.015460968017578125, 0.017518997192382812, 0.0195770263671875, 0.021635055541992188, 0.023693084716796875, 0.025751113891601562, 0.02780914306640625, 0.029867172241210938, 0.031925201416015625, 0.03398323059082031, 0.036041259765625, 0.03809928894042969, 0.040157318115234375, 0.04221534729003906, 0.04427337646484375, 0.04633140563964844, 0.048389434814453125, 0.05044746398925781, 0.0525054931640625, 0.05456352233886719, 0.056621551513671875, 0.05867958068847656, 0.06073760986328125, 0.06279563903808594, 0.06485366821289062, 0.06691169738769531, 0.0689697265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 5.0, 6.0, 5.0, 12.0, 23.0, 26.0, 58.0, 74.0, 102.0, 198.0, 317.0, 719.0, 1867.0, 7497.0, 59019.0, 778637.0, 178345.0, 16403.0, 3179.0, 1030.0, 431.0, 248.0, 122.0, 94.0, 36.0, 24.0, 29.0, 16.0, 9.0, 4.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.365234375, -0.3540687561035156, -0.34290313720703125, -0.3317375183105469, -0.3205718994140625, -0.3094062805175781, -0.29824066162109375, -0.2870750427246094, -0.275909423828125, -0.2647438049316406, -0.25357818603515625, -0.24241256713867188, -0.2312469482421875, -0.22008132934570312, -0.20891571044921875, -0.19775009155273438, -0.18658447265625, -0.17541885375976562, -0.16425323486328125, -0.15308761596679688, -0.1419219970703125, -0.13075637817382812, -0.11959075927734375, -0.10842514038085938, -0.097259521484375, -0.08609390258789062, -0.07492828369140625, -0.06376266479492188, -0.0525970458984375, -0.041431427001953125, -0.03026580810546875, -0.019100189208984375, -0.0079345703125, 0.003231048583984375, 0.01439666748046875, 0.025562286376953125, 0.0367279052734375, 0.047893524169921875, 0.05905914306640625, 0.07022476196289062, 0.081390380859375, 0.09255599975585938, 0.10372161865234375, 0.11488723754882812, 0.1260528564453125, 0.13721847534179688, 0.14838409423828125, 0.15954971313476562, 0.17071533203125, 0.18188095092773438, 0.19304656982421875, 0.20421218872070312, 0.2153778076171875, 0.22654342651367188, 0.23770904541015625, 0.24887466430664062, 0.260040283203125, 0.2712059020996094, 0.28237152099609375, 0.2935371398925781, 0.3047027587890625, 0.3158683776855469, 0.32703399658203125, 0.3381996154785156, 0.349365234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 4.0, 6.0, 6.0, 7.0, 8.0, 5.0, 12.0, 13.0, 17.0, 24.0, 26.0, 36.0, 29.0, 46.0, 44.0, 51.0, 50.0, 56.0, 73.0, 54.0, 62.0, 51.0, 53.0, 47.0, 33.0, 35.0, 28.0, 32.0, 25.0, 15.0, 11.0, 9.0, 7.0, 9.0, 6.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33837890625, -0.32871246337890625, -0.3190460205078125, -0.30937957763671875, -0.299713134765625, -0.29004669189453125, -0.2803802490234375, -0.27071380615234375, -0.26104736328125, -0.25138092041015625, -0.2417144775390625, -0.23204803466796875, -0.222381591796875, -0.21271514892578125, -0.2030487060546875, -0.19338226318359375, -0.1837158203125, -0.17404937744140625, -0.1643829345703125, -0.15471649169921875, -0.145050048828125, -0.13538360595703125, -0.1257171630859375, -0.11605072021484375, -0.10638427734375, -0.09671783447265625, -0.0870513916015625, -0.07738494873046875, -0.067718505859375, -0.05805206298828125, -0.0483856201171875, -0.03871917724609375, -0.029052734375, -0.01938629150390625, -0.0097198486328125, -5.340576171875e-05, 0.009613037109375, 0.01927947998046875, 0.0289459228515625, 0.03861236572265625, 0.04827880859375, 0.05794525146484375, 0.0676116943359375, 0.07727813720703125, 0.086944580078125, 0.09661102294921875, 0.1062774658203125, 0.11594390869140625, 0.1256103515625, 0.13527679443359375, 0.1449432373046875, 0.15460968017578125, 0.164276123046875, 0.17394256591796875, 0.1836090087890625, 0.19327545166015625, 0.20294189453125, 0.21260833740234375, 0.2222747802734375, 0.23194122314453125, 0.241607666015625, 0.25127410888671875, 0.2609405517578125, 0.27060699462890625, 0.2802734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 8.0, 10.0, 21.0, 29.0, 58.0, 61.0, 110.0, 210.0, 427.0, 948.0, 2295.0, 6790.0, 25452.0, 133371.0, 750442.0, 98857.0, 20155.0, 5587.0, 1975.0, 880.0, 368.0, 197.0, 100.0, 65.0, 37.0, 32.0, 19.0, 10.0, 6.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10821533203125, -0.10465812683105469, -0.10110092163085938, -0.09754371643066406, -0.09398651123046875, -0.09042930603027344, -0.08687210083007812, -0.08331489562988281, -0.0797576904296875, -0.07620048522949219, -0.07264328002929688, -0.06908607482910156, -0.06552886962890625, -0.06197166442871094, -0.058414459228515625, -0.05485725402832031, -0.051300048828125, -0.04774284362792969, -0.044185638427734375, -0.04062843322753906, -0.03707122802734375, -0.03351402282714844, -0.029956817626953125, -0.026399612426757812, -0.0228424072265625, -0.019285202026367188, -0.015727996826171875, -0.012170791625976562, -0.00861358642578125, -0.0050563812255859375, -0.001499176025390625, 0.0020580291748046875, 0.005615234375, 0.009172439575195312, 0.012729644775390625, 0.016286849975585938, 0.01984405517578125, 0.023401260375976562, 0.026958465576171875, 0.030515670776367188, 0.0340728759765625, 0.03763008117675781, 0.041187286376953125, 0.04474449157714844, 0.04830169677734375, 0.05185890197753906, 0.055416107177734375, 0.05897331237792969, 0.062530517578125, 0.06608772277832031, 0.06964492797851562, 0.07320213317871094, 0.07675933837890625, 0.08031654357910156, 0.08387374877929688, 0.08743095397949219, 0.0909881591796875, 0.09454536437988281, 0.09810256958007812, 0.10165977478027344, 0.10521697998046875, 0.10877418518066406, 0.11233139038085938, 0.11588859558105469, 0.11944580078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 6.0, 11.0, 9.0, 18.0, 25.0, 26.0, 30.0, 61.0, 72.0, 106.0, 140.0, 152.0, 92.0, 54.0, 41.0, 33.0, 24.0, 30.0, 18.0, 9.0, 10.0, 0.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2557716369628906e-05, -4.125572741031647e-05, -3.995373845100403e-05, -3.865174949169159e-05, -3.734976053237915e-05, -3.604777157306671e-05, -3.474578261375427e-05, -3.3443793654441833e-05, -3.2141804695129395e-05, -3.0839815735816956e-05, -2.9537826776504517e-05, -2.8235837817192078e-05, -2.693384885787964e-05, -2.56318598985672e-05, -2.432987093925476e-05, -2.3027881979942322e-05, -2.1725893020629883e-05, -2.0423904061317444e-05, -1.9121915102005005e-05, -1.7819926142692566e-05, -1.6517937183380127e-05, -1.5215948224067688e-05, -1.3913959264755249e-05, -1.261197030544281e-05, -1.1309981346130371e-05, -1.0007992386817932e-05, -8.706003427505493e-06, -7.404014468193054e-06, -6.102025508880615e-06, -4.800036549568176e-06, -3.4980475902557373e-06, -2.1960586309432983e-06, -8.940696716308594e-07, 4.079192876815796e-07, 1.7099082469940186e-06, 3.0118972063064575e-06, 4.3138861656188965e-06, 5.6158751249313354e-06, 6.917864084243774e-06, 8.219853043556213e-06, 9.521842002868652e-06, 1.0823830962181091e-05, 1.212581992149353e-05, 1.342780888080597e-05, 1.4729797840118408e-05, 1.6031786799430847e-05, 1.7333775758743286e-05, 1.8635764718055725e-05, 1.9937753677368164e-05, 2.1239742636680603e-05, 2.2541731595993042e-05, 2.384372055530548e-05, 2.514570951461792e-05, 2.644769847393036e-05, 2.7749687433242798e-05, 2.9051676392555237e-05, 3.0353665351867676e-05, 3.1655654311180115e-05, 3.2957643270492554e-05, 3.425963222980499e-05, 3.556162118911743e-05, 3.686361014842987e-05, 3.816559910774231e-05, 3.946758806705475e-05, 4.076957702636719e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 17.0, 15.0, 25.0, 41.0, 66.0, 135.0, 187.0, 343.0, 787.0, 1876.0, 5693.0, 24251.0, 150789.0, 755152.0, 86111.0, 15987.0, 4263.0, 1479.0, 597.0, 277.0, 193.0, 94.0, 50.0, 38.0, 24.0, 11.0, 10.0, 13.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1187744140625, -0.11498737335205078, -0.11120033264160156, -0.10741329193115234, -0.10362625122070312, -0.0998392105102539, -0.09605216979980469, -0.09226512908935547, -0.08847808837890625, -0.08469104766845703, -0.08090400695800781, -0.0771169662475586, -0.07332992553710938, -0.06954288482666016, -0.06575584411621094, -0.06196880340576172, -0.0581817626953125, -0.05439472198486328, -0.05060768127441406, -0.046820640563964844, -0.043033599853515625, -0.039246559143066406, -0.03545951843261719, -0.03167247772216797, -0.02788543701171875, -0.02409839630126953, -0.020311355590820312, -0.016524314880371094, -0.012737274169921875, -0.008950233459472656, -0.0051631927490234375, -0.0013761520385742188, 0.002410888671875, 0.006197929382324219, 0.009984970092773438, 0.013772010803222656, 0.017559051513671875, 0.021346092224121094, 0.025133132934570312, 0.02892017364501953, 0.03270721435546875, 0.03649425506591797, 0.04028129577636719, 0.044068336486816406, 0.047855377197265625, 0.051642417907714844, 0.05542945861816406, 0.05921649932861328, 0.0630035400390625, 0.06679058074951172, 0.07057762145996094, 0.07436466217041016, 0.07815170288085938, 0.0819387435913086, 0.08572578430175781, 0.08951282501220703, 0.09329986572265625, 0.09708690643310547, 0.10087394714355469, 0.1046609878540039, 0.10844802856445312, 0.11223506927490234, 0.11602210998535156, 0.11980915069580078, 0.12359619140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 11.0, 14.0, 13.0, 23.0, 23.0, 29.0, 46.0, 58.0, 89.0, 106.0, 149.0, 94.0, 89.0, 55.0, 51.0, 24.0, 19.0, 20.0, 29.0, 8.0, 6.0, 11.0, 3.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09405517578125, -0.09085750579833984, -0.08765983581542969, -0.08446216583251953, -0.08126449584960938, -0.07806682586669922, -0.07486915588378906, -0.0716714859008789, -0.06847381591796875, -0.0652761459350586, -0.06207847595214844, -0.05888080596923828, -0.055683135986328125, -0.05248546600341797, -0.04928779602050781, -0.046090126037597656, -0.0428924560546875, -0.039694786071777344, -0.03649711608886719, -0.03329944610595703, -0.030101776123046875, -0.02690410614013672, -0.023706436157226562, -0.020508766174316406, -0.01731109619140625, -0.014113426208496094, -0.010915756225585938, -0.007718086242675781, -0.004520416259765625, -0.0013227462768554688, 0.0018749237060546875, 0.005072593688964844, 0.008270263671875, 0.011467933654785156, 0.014665603637695312, 0.01786327362060547, 0.021060943603515625, 0.02425861358642578, 0.027456283569335938, 0.030653953552246094, 0.03385162353515625, 0.037049293518066406, 0.04024696350097656, 0.04344463348388672, 0.046642303466796875, 0.04983997344970703, 0.05303764343261719, 0.056235313415527344, 0.0594329833984375, 0.06263065338134766, 0.06582832336425781, 0.06902599334716797, 0.07222366333007812, 0.07542133331298828, 0.07861900329589844, 0.0818166732788086, 0.08501434326171875, 0.0882120132446289, 0.09140968322753906, 0.09460735321044922, 0.09780502319335938, 0.10100269317626953, 0.10420036315917969, 0.10739803314208984, 0.110595703125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 19.0, 26.0, 46.0, 84.0, 129.0, 279.0, 169.0, 82.0, 49.0, 42.0, 28.0, 8.0, 14.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.6796164512634277, -2.6152126789093018, -2.550808906555176, -2.486405372619629, -2.422001600265503, -2.357597827911377, -2.29319429397583, -2.228790521621704, -2.164386749267578, -2.099982976913452, -2.035579204559326, -1.9711756706237793, -1.9067718982696533, -1.8423681259155273, -1.777964472770691, -1.7135608196258545, -1.6491570472717285, -1.5847532749176025, -1.5203496217727661, -1.4559459686279297, -1.3915421962738037, -1.3271384239196777, -1.2627347707748413, -1.1983311176300049, -1.133927345275879, -1.069523572921753, -1.0051199197769165, -0.9407162070274353, -0.8763124942779541, -0.8119087815284729, -0.7475050687789917, -0.6831013560295105, -0.6186974048614502, -0.554293692111969, -0.4898899793624878, -0.4254862666130066, -0.3610825538635254, -0.2966788411140442, -0.232275128364563, -0.1678714156150818, -0.10346770286560059, -0.039063990116119385, 0.025339722633361816, 0.08974343538284302, 0.15414714813232422, 0.21855086088180542, 0.2829545736312866, 0.3473582863807678, 0.411761999130249, 0.4761657118797302, 0.5405694246292114, 0.6049731373786926, 0.6693768501281738, 0.733780562877655, 0.7981842756271362, 0.8625879883766174, 0.9269917011260986, 0.9913954138755798, 1.055799126625061, 1.1202027797698975, 1.1846065521240234, 1.2490103244781494, 1.3134139776229858, 1.3778176307678223, 1.4422214031219482]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 8.0, 4.0, 6.0, 8.0, 11.0, 12.0, 8.0, 11.0, 19.0, 22.0, 14.0, 41.0, 30.0, 28.0, 31.0, 44.0, 58.0, 99.0, 117.0, 81.0, 51.0, 42.0, 36.0, 28.0, 30.0, 25.0, 19.0, 20.0, 20.0, 14.0, 16.0, 8.0, 11.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1332073211669922, -1.094657063484192, -1.0561068058013916, -1.0175564289093018, -0.9790061712265015, -0.9404559135437012, -0.9019056558609009, -0.8633553385734558, -0.8248050212860107, -0.7862547636032104, -0.7477044463157654, -0.7091541886329651, -0.67060387134552, -0.6320536136627197, -0.5935033559799194, -0.5549530386924744, -0.5164027810096741, -0.4778524935245514, -0.4393022060394287, -0.4007519483566284, -0.36220163106918335, -0.32365137338638306, -0.2851010859012604, -0.2465507984161377, -0.20800051093101501, -0.16945022344589233, -0.13089993596076965, -0.09234966337680817, -0.053799375891685486, -0.015249088406562805, 0.02330118417739868, 0.06185147166252136, 0.10040175914764404, 0.13895204663276672, 0.1775023341178894, 0.2160526067018509, 0.25460290908813477, 0.29315316677093506, 0.33170345425605774, 0.3702537417411804, 0.4088040292263031, 0.4473543167114258, 0.48590460419654846, 0.5244548916816711, 0.5630051493644714, 0.6015554666519165, 0.6401057243347168, 0.6786559820175171, 0.7172062993049622, 0.7557565569877625, 0.7943068742752075, 0.8328571319580078, 0.8714074492454529, 0.9099577069282532, 0.9485080242156982, 0.9870582818984985, 1.0256085395812988, 1.0641587972640991, 1.1027090549468994, 1.1412594318389893, 1.1798096895217896, 1.2183599472045898, 1.2569102048873901, 1.2954604625701904, 1.3340108394622803]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 10.0, 16.0, 11.0, 17.0, 37.0, 42.0, 65.0, 99.0, 126.0, 188.0, 279.0, 391.0, 635.0, 992.0, 1771.0, 3037.0, 6260.0, 13300.0, 33629.0, 114620.0, 605622.0, 2258371.0, 920676.0, 160181.0, 42379.0, 15770.0, 7012.0, 3555.0, 2007.0, 1056.0, 663.0, 444.0, 276.0, 198.0, 162.0, 108.0, 71.0, 56.0, 47.0, 23.0, 15.0, 16.0, 13.0, 7.0, 7.0, 3.0, 1.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.09637451171875, -0.09322643280029297, -0.09007835388183594, -0.0869302749633789, -0.08378219604492188, -0.08063411712646484, -0.07748603820800781, -0.07433795928955078, -0.07118988037109375, -0.06804180145263672, -0.06489372253417969, -0.061745643615722656, -0.058597564697265625, -0.055449485778808594, -0.05230140686035156, -0.04915332794189453, -0.0460052490234375, -0.04285717010498047, -0.03970909118652344, -0.036561012268066406, -0.033412933349609375, -0.030264854431152344, -0.027116775512695312, -0.02396869659423828, -0.02082061767578125, -0.01767253875732422, -0.014524459838867188, -0.011376380920410156, -0.008228302001953125, -0.005080223083496094, -0.0019321441650390625, 0.0012159347534179688, 0.004364013671875, 0.007512092590332031, 0.010660171508789062, 0.013808250427246094, 0.016956329345703125, 0.020104408264160156, 0.023252487182617188, 0.02640056610107422, 0.02954864501953125, 0.03269672393798828, 0.03584480285644531, 0.038992881774902344, 0.042140960693359375, 0.045289039611816406, 0.04843711853027344, 0.05158519744873047, 0.0547332763671875, 0.05788135528564453, 0.06102943420410156, 0.0641775131225586, 0.06732559204101562, 0.07047367095947266, 0.07362174987792969, 0.07676982879638672, 0.07991790771484375, 0.08306598663330078, 0.08621406555175781, 0.08936214447021484, 0.09251022338867188, 0.0956583023071289, 0.09880638122558594, 0.10195446014404297, 0.1051025390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 6.0, 5.0, 4.0, 9.0, 12.0, 14.0, 21.0, 27.0, 21.0, 37.0, 46.0, 49.0, 51.0, 42.0, 55.0, 49.0, 62.0, 52.0, 48.0, 45.0, 53.0, 39.0, 54.0, 28.0, 20.0, 38.0, 28.0, 16.0, 19.0, 8.0, 13.0, 10.0, 6.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0714111328125, -0.06895732879638672, -0.06650352478027344, -0.06404972076416016, -0.061595916748046875, -0.059142112731933594, -0.05668830871582031, -0.05423450469970703, -0.05178070068359375, -0.04932689666748047, -0.04687309265136719, -0.044419288635253906, -0.041965484619140625, -0.039511680603027344, -0.03705787658691406, -0.03460407257080078, -0.0321502685546875, -0.02969646453857422, -0.027242660522460938, -0.024788856506347656, -0.022335052490234375, -0.019881248474121094, -0.017427444458007812, -0.014973640441894531, -0.01251983642578125, -0.010066032409667969, -0.0076122283935546875, -0.005158424377441406, -0.002704620361328125, -0.00025081634521484375, 0.0022029876708984375, 0.004656791687011719, 0.007110595703125, 0.009564399719238281, 0.012018203735351562, 0.014472007751464844, 0.016925811767578125, 0.019379615783691406, 0.021833419799804688, 0.02428722381591797, 0.02674102783203125, 0.02919483184814453, 0.03164863586425781, 0.034102439880371094, 0.036556243896484375, 0.039010047912597656, 0.04146385192871094, 0.04391765594482422, 0.0463714599609375, 0.04882526397705078, 0.05127906799316406, 0.053732872009277344, 0.056186676025390625, 0.058640480041503906, 0.06109428405761719, 0.06354808807373047, 0.06600189208984375, 0.06845569610595703, 0.07090950012207031, 0.0733633041381836, 0.07581710815429688, 0.07827091217041016, 0.08072471618652344, 0.08317852020263672, 0.08563232421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 12.0, 34.0, 50.0, 116.0, 267.0, 673.0, 2393.0, 28141.0, 3988967.0, 166303.0, 5389.0, 1101.0, 429.0, 216.0, 87.0, 40.0, 25.0, 12.0, 7.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5498046875, -0.5299606323242188, -0.5101165771484375, -0.49027252197265625, -0.470428466796875, -0.45058441162109375, -0.4307403564453125, -0.41089630126953125, -0.39105224609375, -0.37120819091796875, -0.3513641357421875, -0.33152008056640625, -0.311676025390625, -0.29183197021484375, -0.2719879150390625, -0.25214385986328125, -0.2322998046875, -0.21245574951171875, -0.1926116943359375, -0.17276763916015625, -0.152923583984375, -0.13307952880859375, -0.1132354736328125, -0.09339141845703125, -0.07354736328125, -0.05370330810546875, -0.0338592529296875, -0.01401519775390625, 0.005828857421875, 0.02567291259765625, 0.0455169677734375, 0.06536102294921875, 0.085205078125, 0.10504913330078125, 0.1248931884765625, 0.14473724365234375, 0.164581298828125, 0.18442535400390625, 0.2042694091796875, 0.22411346435546875, 0.24395751953125, 0.26380157470703125, 0.2836456298828125, 0.30348968505859375, 0.323333740234375, 0.34317779541015625, 0.3630218505859375, 0.38286590576171875, 0.4027099609375, 0.42255401611328125, 0.4423980712890625, 0.46224212646484375, 0.482086181640625, 0.5019302368164062, 0.5217742919921875, 0.5416183471679688, 0.56146240234375, 0.5813064575195312, 0.6011505126953125, 0.6209945678710938, 0.640838623046875, 0.6606826782226562, 0.6805267333984375, 0.7003707885742188, 0.72021484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 10.0, 20.0, 31.0, 37.0, 50.0, 61.0, 143.0, 311.0, 714.0, 1136.0, 805.0, 349.0, 138.0, 81.0, 55.0, 43.0, 19.0, 18.0, 16.0, 6.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2352294921875, -0.22481346130371094, -0.21439743041992188, -0.2039813995361328, -0.19356536865234375, -0.1831493377685547, -0.17273330688476562, -0.16231727600097656, -0.1519012451171875, -0.14148521423339844, -0.13106918334960938, -0.12065315246582031, -0.11023712158203125, -0.09982109069824219, -0.08940505981445312, -0.07898902893066406, -0.068572998046875, -0.05815696716308594, -0.047740936279296875, -0.03732490539550781, -0.02690887451171875, -0.016492843627929688, -0.006076812744140625, 0.0043392181396484375, 0.0147552490234375, 0.025171279907226562, 0.035587310791015625, 0.04600334167480469, 0.05641937255859375, 0.06683540344238281, 0.07725143432617188, 0.08766746520996094, 0.09808349609375, 0.10849952697753906, 0.11891555786132812, 0.1293315887451172, 0.13974761962890625, 0.1501636505126953, 0.16057968139648438, 0.17099571228027344, 0.1814117431640625, 0.19182777404785156, 0.20224380493164062, 0.2126598358154297, 0.22307586669921875, 0.2334918975830078, 0.24390792846679688, 0.25432395935058594, 0.264739990234375, 0.27515602111816406, 0.2855720520019531, 0.2959880828857422, 0.30640411376953125, 0.3168201446533203, 0.3272361755371094, 0.33765220642089844, 0.3480682373046875, 0.35848426818847656, 0.3689002990722656, 0.3793163299560547, 0.38973236083984375, 0.4001483917236328, 0.4105644226074219, 0.42098045349121094, 0.431396484375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 9.0, 14.0, 42.0, 87.0, 195.0, 236.0, 194.0, 122.0, 41.0, 26.0, 15.0, 6.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4318771362304688, -1.3266048431396484, -1.2213325500488281, -1.1160601377487183, -1.010787844657898, -0.9055155515670776, -0.8002431988716125, -0.6949708461761475, -0.5896985530853271, -0.48442623019218445, -0.37915390729904175, -0.27388158440589905, -0.16860926151275635, -0.06333696842193604, 0.04193538427352905, 0.14720773696899414, 0.25248003005981445, 0.35775235295295715, 0.46302467584609985, 0.5682970285415649, 0.6735693216323853, 0.7788416147232056, 0.8841139674186707, 0.9893863201141357, 1.094658613204956, 1.1999309062957764, 1.3052031993865967, 1.4104756116867065, 1.5157479047775269, 1.6210201978683472, 1.726292610168457, 1.8315649032592773, 1.9368371963500977, 2.042109489440918, 2.1473817825317383, 2.2526540756225586, 2.357926368713379, 2.463198661804199, 2.5684711933135986, 2.673743486404419, 2.7790157794952393, 2.8842880725860596, 2.98956036567688, 3.0948326587677, 3.2001051902770996, 3.30537748336792, 3.4106497764587402, 3.5159220695495605, 3.621194362640381, 3.726466655731201, 3.8317389488220215, 3.937011241912842, 4.042283535003662, 4.147555828094482, 4.252828121185303, 4.358100891113281, 4.463373184204102, 4.568645477294922, 4.673917770385742, 4.7791900634765625, 4.884462356567383, 4.989734649658203, 5.095006942749023, 5.200279235839844, 5.305551528930664]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 1.0, 12.0, 11.0, 16.0, 16.0, 16.0, 21.0, 22.0, 26.0, 24.0, 31.0, 45.0, 47.0, 40.0, 45.0, 56.0, 41.0, 49.0, 62.0, 52.0, 48.0, 53.0, 37.0, 41.0, 31.0, 24.0, 23.0, 18.0, 15.0, 12.0, 14.0, 12.0, 7.0, 2.0, 10.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1538000106811523, -1.118662714958191, -1.0835254192352295, -1.0483882427215576, -1.0132509469985962, -0.9781136512756348, -0.9429763555526733, -0.9078390598297119, -0.8727017641067505, -0.8375644683837891, -0.8024272322654724, -0.767289936542511, -0.7321526408195496, -0.6970154047012329, -0.6618781089782715, -0.6267408132553101, -0.5916035771369934, -0.556466281414032, -0.5213290452957153, -0.4861917495727539, -0.4510544538497925, -0.41591718792915344, -0.3807799220085144, -0.345642626285553, -0.31050536036491394, -0.2753680944442749, -0.24023079872131348, -0.20509353280067444, -0.1699562519788742, -0.13481897115707397, -0.09968170523643494, -0.0645444244146347, -0.029407143592834473, 0.005730133503675461, 0.040867410600185394, 0.07600468397140503, 0.11114196479320526, 0.1462792456150055, 0.18141651153564453, 0.21655379235744476, 0.251691073179245, 0.28682833909988403, 0.32196563482284546, 0.3571029007434845, 0.39224016666412354, 0.42737746238708496, 0.462514728307724, 0.49765199422836304, 0.5327892899513245, 0.5679265856742859, 0.6030638217926025, 0.638201117515564, 0.6733384132385254, 0.7084757089614868, 0.7436129450798035, 0.7787502408027649, 0.8138874769210815, 0.849024772644043, 0.8841620087623596, 0.919299304485321, 0.9544366002082825, 0.9895738363265991, 1.0247111320495605, 1.059848427772522, 1.0949857234954834]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 6.0, 6.0, 14.0, 19.0, 22.0, 37.0, 52.0, 73.0, 107.0, 172.0, 262.0, 381.0, 604.0, 999.0, 1421.0, 2365.0, 3993.0, 6915.0, 12196.0, 22638.0, 44768.0, 94507.0, 198685.0, 290635.0, 188409.0, 87520.0, 42205.0, 21192.0, 11500.0, 6581.0, 3725.0, 2354.0, 1458.0, 933.0, 595.0, 410.0, 270.0, 173.0, 94.0, 97.0, 51.0, 31.0, 28.0, 20.0, 9.0, 10.0, 5.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11199951171875, -0.1083221435546875, -0.104644775390625, -0.1009674072265625, -0.0972900390625, -0.0936126708984375, -0.089935302734375, -0.0862579345703125, -0.08258056640625, -0.0789031982421875, -0.075225830078125, -0.0715484619140625, -0.06787109375, -0.0641937255859375, -0.060516357421875, -0.0568389892578125, -0.05316162109375, -0.0494842529296875, -0.045806884765625, -0.0421295166015625, -0.0384521484375, -0.0347747802734375, -0.031097412109375, -0.0274200439453125, -0.02374267578125, -0.0200653076171875, -0.016387939453125, -0.0127105712890625, -0.009033203125, -0.0053558349609375, -0.001678466796875, 0.0019989013671875, 0.00567626953125, 0.0093536376953125, 0.013031005859375, 0.0167083740234375, 0.0203857421875, 0.0240631103515625, 0.027740478515625, 0.0314178466796875, 0.03509521484375, 0.0387725830078125, 0.042449951171875, 0.0461273193359375, 0.0498046875, 0.0534820556640625, 0.057159423828125, 0.0608367919921875, 0.06451416015625, 0.0681915283203125, 0.071868896484375, 0.0755462646484375, 0.0792236328125, 0.0829010009765625, 0.086578369140625, 0.0902557373046875, 0.09393310546875, 0.0976104736328125, 0.101287841796875, 0.1049652099609375, 0.108642578125, 0.1123199462890625, 0.115997314453125, 0.1196746826171875, 0.12335205078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 9.0, 10.0, 10.0, 10.0, 14.0, 14.0, 22.0, 18.0, 26.0, 40.0, 31.0, 41.0, 45.0, 49.0, 77.0, 64.0, 60.0, 56.0, 67.0, 42.0, 51.0, 35.0, 33.0, 32.0, 24.0, 28.0, 31.0, 14.0, 10.0, 7.0, 9.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10540771484375, -0.10215282440185547, -0.09889793395996094, -0.0956430435180664, -0.09238815307617188, -0.08913326263427734, -0.08587837219238281, -0.08262348175048828, -0.07936859130859375, -0.07611370086669922, -0.07285881042480469, -0.06960391998291016, -0.06634902954101562, -0.0630941390991211, -0.05983924865722656, -0.05658435821533203, -0.0533294677734375, -0.05007457733154297, -0.04681968688964844, -0.043564796447753906, -0.040309906005859375, -0.037055015563964844, -0.03380012512207031, -0.03054523468017578, -0.02729034423828125, -0.02403545379638672, -0.020780563354492188, -0.017525672912597656, -0.014270782470703125, -0.011015892028808594, -0.0077610015869140625, -0.004506111145019531, -0.001251220703125, 0.0020036697387695312, 0.0052585601806640625, 0.008513450622558594, 0.011768341064453125, 0.015023231506347656, 0.018278121948242188, 0.02153301239013672, 0.02478790283203125, 0.02804279327392578, 0.03129768371582031, 0.034552574157714844, 0.037807464599609375, 0.041062355041503906, 0.04431724548339844, 0.04757213592529297, 0.0508270263671875, 0.05408191680908203, 0.05733680725097656, 0.060591697692871094, 0.06384658813476562, 0.06710147857666016, 0.07035636901855469, 0.07361125946044922, 0.07686614990234375, 0.08012104034423828, 0.08337593078613281, 0.08663082122802734, 0.08988571166992188, 0.0931406021118164, 0.09639549255371094, 0.09965038299560547, 0.1029052734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 10.0, 10.0, 13.0, 31.0, 46.0, 62.0, 79.0, 131.0, 171.0, 292.0, 551.0, 1187.0, 3115.0, 15314.0, 248316.0, 744917.0, 26994.0, 4209.0, 1435.0, 671.0, 346.0, 220.0, 134.0, 87.0, 46.0, 33.0, 27.0, 25.0, 19.0, 14.0, 6.0, 11.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.4873046875, -0.4721336364746094, -0.45696258544921875, -0.4417915344238281, -0.4266204833984375, -0.4114494323730469, -0.39627838134765625, -0.3811073303222656, -0.365936279296875, -0.3507652282714844, -0.33559417724609375, -0.3204231262207031, -0.3052520751953125, -0.2900810241699219, -0.27490997314453125, -0.2597389221191406, -0.24456787109375, -0.22939682006835938, -0.21422576904296875, -0.19905471801757812, -0.1838836669921875, -0.16871261596679688, -0.15354156494140625, -0.13837051391601562, -0.123199462890625, -0.10802841186523438, -0.09285736083984375, -0.07768630981445312, -0.0625152587890625, -0.047344207763671875, -0.03217315673828125, -0.017002105712890625, -0.0018310546875, 0.013339996337890625, 0.02851104736328125, 0.043682098388671875, 0.0588531494140625, 0.07402420043945312, 0.08919525146484375, 0.10436630249023438, 0.119537353515625, 0.13470840454101562, 0.14987945556640625, 0.16505050659179688, 0.1802215576171875, 0.19539260864257812, 0.21056365966796875, 0.22573471069335938, 0.24090576171875, 0.2560768127441406, 0.27124786376953125, 0.2864189147949219, 0.3015899658203125, 0.3167610168457031, 0.33193206787109375, 0.3471031188964844, 0.362274169921875, 0.3774452209472656, 0.39261627197265625, 0.4077873229980469, 0.4229583740234375, 0.4381294250488281, 0.45330047607421875, 0.4684715270996094, 0.483642578125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 4.0, 5.0, 4.0, 3.0, 6.0, 7.0, 4.0, 9.0, 12.0, 11.0, 21.0, 15.0, 31.0, 31.0, 39.0, 36.0, 35.0, 43.0, 47.0, 67.0, 49.0, 47.0, 67.0, 45.0, 50.0, 60.0, 37.0, 33.0, 28.0, 22.0, 20.0, 18.0, 13.0, 15.0, 7.0, 12.0, 9.0, 8.0, 7.0, 4.0, 9.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.357177734375, -0.34479522705078125, -0.3324127197265625, -0.32003021240234375, -0.307647705078125, -0.29526519775390625, -0.2828826904296875, -0.27050018310546875, -0.25811767578125, -0.24573516845703125, -0.2333526611328125, -0.22097015380859375, -0.208587646484375, -0.19620513916015625, -0.1838226318359375, -0.17144012451171875, -0.1590576171875, -0.14667510986328125, -0.1342926025390625, -0.12191009521484375, -0.109527587890625, -0.09714508056640625, -0.0847625732421875, -0.07238006591796875, -0.05999755859375, -0.04761505126953125, -0.0352325439453125, -0.02285003662109375, -0.010467529296875, 0.00191497802734375, 0.0142974853515625, 0.02667999267578125, 0.0390625, 0.05144500732421875, 0.0638275146484375, 0.07621002197265625, 0.088592529296875, 0.10097503662109375, 0.1133575439453125, 0.12574005126953125, 0.13812255859375, 0.15050506591796875, 0.1628875732421875, 0.17527008056640625, 0.187652587890625, 0.20003509521484375, 0.2124176025390625, 0.22480010986328125, 0.2371826171875, 0.24956512451171875, 0.2619476318359375, 0.27433013916015625, 0.286712646484375, 0.29909515380859375, 0.3114776611328125, 0.32386016845703125, 0.33624267578125, 0.34862518310546875, 0.3610076904296875, 0.37339019775390625, 0.385772705078125, 0.39815521240234375, 0.4105377197265625, 0.42292022705078125, 0.435302734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 6.0, 3.0, 7.0, 4.0, 10.0, 13.0, 8.0, 17.0, 22.0, 40.0, 55.0, 102.0, 163.0, 343.0, 726.0, 1998.0, 6135.0, 30579.0, 632014.0, 338642.0, 28525.0, 5856.0, 1802.0, 719.0, 351.0, 174.0, 82.0, 51.0, 29.0, 22.0, 14.0, 12.0, 8.0, 6.0, 1.0, 5.0, 3.0, 3.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11309814453125, -0.10874462127685547, -0.10439109802246094, -0.1000375747680664, -0.09568405151367188, -0.09133052825927734, -0.08697700500488281, -0.08262348175048828, -0.07826995849609375, -0.07391643524169922, -0.06956291198730469, -0.06520938873291016, -0.060855865478515625, -0.056502342224121094, -0.05214881896972656, -0.04779529571533203, -0.0434417724609375, -0.03908824920654297, -0.03473472595214844, -0.030381202697753906, -0.026027679443359375, -0.021674156188964844, -0.017320632934570312, -0.012967109680175781, -0.00861358642578125, -0.004260063171386719, 9.34600830078125e-05, 0.004446983337402344, 0.008800506591796875, 0.013154029846191406, 0.017507553100585938, 0.02186107635498047, 0.026214599609375, 0.03056812286376953, 0.03492164611816406, 0.039275169372558594, 0.043628692626953125, 0.047982215881347656, 0.05233573913574219, 0.05668926239013672, 0.06104278564453125, 0.06539630889892578, 0.06974983215332031, 0.07410335540771484, 0.07845687866210938, 0.0828104019165039, 0.08716392517089844, 0.09151744842529297, 0.0958709716796875, 0.10022449493408203, 0.10457801818847656, 0.1089315414428711, 0.11328506469726562, 0.11763858795166016, 0.12199211120605469, 0.12634563446044922, 0.13069915771484375, 0.13505268096923828, 0.1394062042236328, 0.14375972747802734, 0.14811325073242188, 0.1524667739868164, 0.15682029724121094, 0.16117382049560547, 0.16552734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 3.0, 4.0, 4.0, 13.0, 9.0, 19.0, 28.0, 28.0, 58.0, 76.0, 137.0, 164.0, 136.0, 109.0, 70.0, 38.0, 30.0, 18.0, 19.0, 10.0, 6.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7550926208496094e-05, -3.588385879993439e-05, -3.421679139137268e-05, -3.2549723982810974e-05, -3.088265657424927e-05, -2.921558916568756e-05, -2.7548521757125854e-05, -2.5881454348564148e-05, -2.421438694000244e-05, -2.2547319531440735e-05, -2.088025212287903e-05, -1.9213184714317322e-05, -1.7546117305755615e-05, -1.587904989719391e-05, -1.4211982488632202e-05, -1.2544915080070496e-05, -1.0877847671508789e-05, -9.210780262947083e-06, -7.543712854385376e-06, -5.8766454458236694e-06, -4.209578037261963e-06, -2.5425106287002563e-06, -8.754432201385498e-07, 7.916241884231567e-07, 2.4586915969848633e-06, 4.12575900554657e-06, 5.792826414108276e-06, 7.459893822669983e-06, 9.12696123123169e-06, 1.0794028639793396e-05, 1.2461096048355103e-05, 1.4128163456916809e-05, 1.5795230865478516e-05, 1.7462298274040222e-05, 1.912936568260193e-05, 2.0796433091163635e-05, 2.2463500499725342e-05, 2.413056790828705e-05, 2.5797635316848755e-05, 2.746470272541046e-05, 2.9131770133972168e-05, 3.0798837542533875e-05, 3.246590495109558e-05, 3.413297235965729e-05, 3.5800039768218994e-05, 3.74671071767807e-05, 3.913417458534241e-05, 4.0801241993904114e-05, 4.246830940246582e-05, 4.413537681102753e-05, 4.5802444219589233e-05, 4.746951162815094e-05, 4.9136579036712646e-05, 5.080364644527435e-05, 5.247071385383606e-05, 5.4137781262397766e-05, 5.580484867095947e-05, 5.747191607952118e-05, 5.9138983488082886e-05, 6.080605089664459e-05, 6.24731183052063e-05, 6.4140185713768e-05, 6.580725312232971e-05, 6.747432053089142e-05, 6.914138793945312e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 11.0, 14.0, 16.0, 24.0, 32.0, 68.0, 111.0, 194.0, 408.0, 1079.0, 3199.0, 18781.0, 342937.0, 655161.0, 20990.0, 3531.0, 1074.0, 425.0, 191.0, 103.0, 57.0, 46.0, 27.0, 15.0, 6.0, 10.0, 6.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1590576171875, -0.15409088134765625, -0.1491241455078125, -0.14415740966796875, -0.139190673828125, -0.13422393798828125, -0.1292572021484375, -0.12429046630859375, -0.11932373046875, -0.11435699462890625, -0.1093902587890625, -0.10442352294921875, -0.099456787109375, -0.09449005126953125, -0.0895233154296875, -0.08455657958984375, -0.07958984375, -0.07462310791015625, -0.0696563720703125, -0.06468963623046875, -0.059722900390625, -0.05475616455078125, -0.0497894287109375, -0.04482269287109375, -0.03985595703125, -0.03488922119140625, -0.0299224853515625, -0.02495574951171875, -0.019989013671875, -0.01502227783203125, -0.0100555419921875, -0.00508880615234375, -0.0001220703125, 0.00484466552734375, 0.0098114013671875, 0.01477813720703125, 0.019744873046875, 0.02471160888671875, 0.0296783447265625, 0.03464508056640625, 0.03961181640625, 0.04457855224609375, 0.0495452880859375, 0.05451202392578125, 0.059478759765625, 0.06444549560546875, 0.0694122314453125, 0.07437896728515625, 0.079345703125, 0.08431243896484375, 0.0892791748046875, 0.09424591064453125, 0.099212646484375, 0.10417938232421875, 0.1091461181640625, 0.11411285400390625, 0.11907958984375, 0.12404632568359375, 0.1290130615234375, 0.13397979736328125, 0.138946533203125, 0.14391326904296875, 0.1488800048828125, 0.15384674072265625, 0.1588134765625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 5.0, 6.0, 6.0, 14.0, 21.0, 27.0, 37.0, 47.0, 56.0, 80.0, 109.0, 107.0, 130.0, 87.0, 74.0, 38.0, 36.0, 27.0, 24.0, 19.0, 15.0, 10.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10970115661621094, -0.10624313354492188, -0.10278511047363281, -0.09932708740234375, -0.09586906433105469, -0.09241104125976562, -0.08895301818847656, -0.0854949951171875, -0.08203697204589844, -0.07857894897460938, -0.07512092590332031, -0.07166290283203125, -0.06820487976074219, -0.06474685668945312, -0.06128883361816406, -0.057830810546875, -0.05437278747558594, -0.050914764404296875, -0.04745674133300781, -0.04399871826171875, -0.04054069519042969, -0.037082672119140625, -0.03362464904785156, -0.0301666259765625, -0.026708602905273438, -0.023250579833984375, -0.019792556762695312, -0.01633453369140625, -0.012876510620117188, -0.009418487548828125, -0.0059604644775390625, -0.00250244140625, 0.0009555816650390625, 0.004413604736328125, 0.007871627807617188, 0.01132965087890625, 0.014787673950195312, 0.018245697021484375, 0.021703720092773438, 0.0251617431640625, 0.028619766235351562, 0.032077789306640625, 0.03553581237792969, 0.03899383544921875, 0.04245185852050781, 0.045909881591796875, 0.04936790466308594, 0.052825927734375, 0.05628395080566406, 0.059741973876953125, 0.06319999694824219, 0.06665802001953125, 0.07011604309082031, 0.07357406616210938, 0.07703208923339844, 0.0804901123046875, 0.08394813537597656, 0.08740615844726562, 0.09086418151855469, 0.09432220458984375, 0.09778022766113281, 0.10123825073242188, 0.10469627380371094, 0.108154296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 8.0, 29.0, 72.0, 140.0, 413.0, 162.0, 88.0, 48.0, 25.0, 11.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.424959659576416, -4.306817054748535, -4.188673973083496, -4.070531368255615, -3.952388286590576, -3.8342456817626953, -3.7161028385162354, -3.5979599952697754, -3.4798171520233154, -3.3616743087768555, -3.2435314655303955, -3.1253886222839355, -3.0072460174560547, -2.8891029357910156, -2.7709603309631348, -2.652817487716675, -2.534674644470215, -2.416531801223755, -2.298388957977295, -2.180246114730835, -2.062103271484375, -1.9439605474472046, -1.8258178234100342, -1.7076749801635742, -1.5895321369171143, -1.4713892936706543, -1.3532464504241943, -1.235103726387024, -1.116960883140564, -0.998818039894104, -0.8806752562522888, -0.7625324726104736, -0.6443893909454346, -0.5262465476989746, -0.4081037640571594, -0.28996095061302185, -0.17181813716888428, -0.053675293922424316, 0.06446748971939087, 0.18261027336120605, 0.300753116607666, 0.4188959300518036, 0.5370387434959412, 0.6551815271377563, 0.7733243703842163, 0.8914672136306763, 1.0096099376678467, 1.1277527809143066, 1.2458956241607666, 1.3640384674072266, 1.4821813106536865, 1.600324034690857, 1.718466877937317, 1.8366097211837769, 1.9547524452209473, 2.0728952884674072, 2.191038131713867, 2.309180974960327, 2.427323818206787, 2.545466661453247, 2.663609504699707, 2.781752109527588, 2.899894952774048, 3.018037796020508, 3.1361806392669678]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 0.0, 6.0, 5.0, 7.0, 3.0, 12.0, 10.0, 9.0, 10.0, 18.0, 21.0, 19.0, 30.0, 26.0, 36.0, 29.0, 43.0, 68.0, 145.0, 133.0, 50.0, 42.0, 38.0, 31.0, 30.0, 15.0, 25.0, 27.0, 20.0, 11.0, 17.0, 13.0, 10.0, 6.0, 7.0, 5.0, 5.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6545605659484863, -1.5974253416061401, -1.540290117263794, -1.4831547737121582, -1.426019549369812, -1.3688843250274658, -1.3117491006851196, -1.2546138763427734, -1.1974785327911377, -1.1403433084487915, -1.0832080841064453, -1.0260727405548096, -0.9689375162124634, -0.9118022918701172, -0.854667067527771, -0.7975318431854248, -0.7403966188430786, -0.6832613945007324, -0.6261261105537415, -0.5689908862113953, -0.5118556022644043, -0.4547203779220581, -0.3975851535797119, -0.34044989943504333, -0.28331464529037476, -0.22617939114570618, -0.1690441519021988, -0.1119089126586914, -0.05477365851402283, 0.002361595630645752, 0.05949681997299194, 0.11663207411766052, 0.1737673282623291, 0.23090258240699768, 0.28803783655166626, 0.34517306089401245, 0.40230831503868103, 0.4594435691833496, 0.5165787935256958, 0.573714017868042, 0.630849301815033, 0.6879845261573792, 0.7451198101043701, 0.8022550344467163, 0.8593902587890625, 0.9165255427360535, 0.9736607670783997, 1.0307960510253906, 1.0879312753677368, 1.145066499710083, 1.2022017240524292, 1.2593369483947754, 1.3164722919464111, 1.3736075162887573, 1.4307427406311035, 1.4878779649734497, 1.545013189315796, 1.602148413658142, 1.6592836380004883, 1.716418981552124, 1.7735542058944702, 1.8306894302368164, 1.8878246545791626, 1.9449598789215088, 2.0020952224731445]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 6.0, 14.0, 10.0, 16.0, 34.0, 38.0, 51.0, 87.0, 115.0, 177.0, 206.0, 333.0, 459.0, 684.0, 1070.0, 1531.0, 2489.0, 4311.0, 7532.0, 14723.0, 32870.0, 86379.0, 277120.0, 929483.0, 1689972.0, 776975.0, 232024.0, 75202.0, 29348.0, 13515.0, 6914.0, 3881.0, 2269.0, 1403.0, 935.0, 647.0, 442.0, 279.0, 208.0, 155.0, 88.0, 79.0, 64.0, 36.0, 27.0, 22.0, 11.0, 16.0, 10.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.10675048828125, -0.10335350036621094, -0.09995651245117188, -0.09655952453613281, -0.09316253662109375, -0.08976554870605469, -0.08636856079101562, -0.08297157287597656, -0.0795745849609375, -0.07617759704589844, -0.07278060913085938, -0.06938362121582031, -0.06598663330078125, -0.06258964538574219, -0.059192657470703125, -0.05579566955566406, -0.052398681640625, -0.04900169372558594, -0.045604705810546875, -0.04220771789550781, -0.03881072998046875, -0.03541374206542969, -0.032016754150390625, -0.028619766235351562, -0.0252227783203125, -0.021825790405273438, -0.018428802490234375, -0.015031814575195312, -0.01163482666015625, -0.008237838745117188, -0.004840850830078125, -0.0014438629150390625, 0.001953125, 0.0053501129150390625, 0.008747100830078125, 0.012144088745117188, 0.01554107666015625, 0.018938064575195312, 0.022335052490234375, 0.025732040405273438, 0.0291290283203125, 0.03252601623535156, 0.035923004150390625, 0.03931999206542969, 0.04271697998046875, 0.04611396789550781, 0.049510955810546875, 0.05290794372558594, 0.056304931640625, 0.05970191955566406, 0.06309890747070312, 0.06649589538574219, 0.06989288330078125, 0.07328987121582031, 0.07668685913085938, 0.08008384704589844, 0.0834808349609375, 0.08687782287597656, 0.09027481079101562, 0.09367179870605469, 0.09706878662109375, 0.10046577453613281, 0.10386276245117188, 0.10725975036621094, 0.11065673828125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 2.0, 4.0, 7.0, 6.0, 12.0, 6.0, 13.0, 19.0, 14.0, 33.0, 24.0, 30.0, 30.0, 40.0, 38.0, 45.0, 50.0, 50.0, 46.0, 50.0, 42.0, 66.0, 50.0, 38.0, 35.0, 36.0, 30.0, 23.0, 24.0, 29.0, 19.0, 23.0, 15.0, 14.0, 14.0, 7.0, 1.0, 3.0, 2.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0924072265625, -0.0897989273071289, -0.08719062805175781, -0.08458232879638672, -0.08197402954101562, -0.07936573028564453, -0.07675743103027344, -0.07414913177490234, -0.07154083251953125, -0.06893253326416016, -0.06632423400878906, -0.06371593475341797, -0.061107635498046875, -0.05849933624267578, -0.05589103698730469, -0.053282737731933594, -0.0506744384765625, -0.048066139221191406, -0.04545783996582031, -0.04284954071044922, -0.040241241455078125, -0.03763294219970703, -0.03502464294433594, -0.032416343688964844, -0.02980804443359375, -0.027199745178222656, -0.024591445922851562, -0.02198314666748047, -0.019374847412109375, -0.01676654815673828, -0.014158248901367188, -0.011549949645996094, -0.008941650390625, -0.006333351135253906, -0.0037250518798828125, -0.0011167526245117188, 0.001491546630859375, 0.004099845886230469, 0.0067081451416015625, 0.009316444396972656, 0.01192474365234375, 0.014533042907714844, 0.017141342163085938, 0.01974964141845703, 0.022357940673828125, 0.02496623992919922, 0.027574539184570312, 0.030182838439941406, 0.0327911376953125, 0.035399436950683594, 0.03800773620605469, 0.04061603546142578, 0.043224334716796875, 0.04583263397216797, 0.04844093322753906, 0.051049232482910156, 0.05365753173828125, 0.056265830993652344, 0.05887413024902344, 0.06148242950439453, 0.06409072875976562, 0.06669902801513672, 0.06930732727050781, 0.0719156265258789, 0.07452392578125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 12.0, 13.0, 47.0, 139.0, 324.0, 1069.0, 7272.0, 4134218.0, 48358.0, 2018.0, 510.0, 176.0, 62.0, 28.0, 11.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3505859375, -1.30352783203125, -1.2564697265625, -1.20941162109375, -1.162353515625, -1.11529541015625, -1.0682373046875, -1.02117919921875, -0.97412109375, -0.92706298828125, -0.8800048828125, -0.83294677734375, -0.785888671875, -0.73883056640625, -0.6917724609375, -0.64471435546875, -0.59765625, -0.55059814453125, -0.5035400390625, -0.45648193359375, -0.409423828125, -0.36236572265625, -0.3153076171875, -0.26824951171875, -0.22119140625, -0.17413330078125, -0.1270751953125, -0.08001708984375, -0.032958984375, 0.01409912109375, 0.0611572265625, 0.10821533203125, 0.1552734375, 0.20233154296875, 0.2493896484375, 0.29644775390625, 0.343505859375, 0.39056396484375, 0.4376220703125, 0.48468017578125, 0.53173828125, 0.57879638671875, 0.6258544921875, 0.67291259765625, 0.719970703125, 0.76702880859375, 0.8140869140625, 0.86114501953125, 0.908203125, 0.95526123046875, 1.0023193359375, 1.04937744140625, 1.096435546875, 1.14349365234375, 1.1905517578125, 1.23760986328125, 1.28466796875, 1.33172607421875, 1.3787841796875, 1.42584228515625, 1.472900390625, 1.51995849609375, 1.5670166015625, 1.61407470703125, 1.6611328125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 2.0, 13.0, 16.0, 27.0, 60.0, 89.0, 151.0, 296.0, 562.0, 902.0, 889.0, 475.0, 248.0, 160.0, 78.0, 51.0, 25.0, 12.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.344482421875, -0.3280143737792969, -0.31154632568359375, -0.2950782775878906, -0.2786102294921875, -0.2621421813964844, -0.24567413330078125, -0.22920608520507812, -0.212738037109375, -0.19626998901367188, -0.17980194091796875, -0.16333389282226562, -0.1468658447265625, -0.13039779663085938, -0.11392974853515625, -0.09746170043945312, -0.08099365234375, -0.06452560424804688, -0.04805755615234375, -0.031589508056640625, -0.0151214599609375, 0.001346588134765625, 0.01781463623046875, 0.034282684326171875, 0.050750732421875, 0.06721878051757812, 0.08368682861328125, 0.10015487670898438, 0.1166229248046875, 0.13309097290039062, 0.14955902099609375, 0.16602706909179688, 0.1824951171875, 0.19896316528320312, 0.21543121337890625, 0.23189926147460938, 0.2483673095703125, 0.2648353576660156, 0.28130340576171875, 0.2977714538574219, 0.314239501953125, 0.3307075500488281, 0.34717559814453125, 0.3636436462402344, 0.3801116943359375, 0.3965797424316406, 0.41304779052734375, 0.4295158386230469, 0.44598388671875, 0.4624519348144531, 0.47891998291015625, 0.4953880310058594, 0.5118560791015625, 0.5283241271972656, 0.5447921752929688, 0.5612602233886719, 0.577728271484375, 0.5941963195800781, 0.6106643676757812, 0.6271324157714844, 0.6436004638671875, 0.6600685119628906, 0.6765365600585938, 0.6930046081542969, 0.70947265625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 2.0, 8.0, 15.0, 56.0, 149.0, 303.0, 298.0, 89.0, 37.0, 20.0, 12.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.405509948730469, -9.157914161682129, -8.910319328308105, -8.662723541259766, -8.415127754211426, -8.167531967163086, -7.9199371337890625, -7.672341346740723, -7.424746036529541, -7.177150726318359, -6.9295549392700195, -6.681959629058838, -6.434364318847656, -6.186768531799316, -5.939173221588135, -5.691577911376953, -5.443982124328613, -5.196386814117432, -4.948791027069092, -4.70119571685791, -4.45359992980957, -4.206004619598389, -3.958409309387207, -3.7108137607574463, -3.4632182121276855, -3.215622663497925, -2.968027114868164, -2.7204318046569824, -2.4728362560272217, -2.225240707397461, -1.9776452779769897, -1.7300498485565186, -1.4824542999267578, -1.234858751296997, -0.9872633218765259, -0.7396678328514099, -0.49207234382629395, -0.2444767951965332, 0.0031186342239379883, 0.2507140636444092, 0.4983096122741699, 0.7459051012992859, 0.9935005903244019, 1.241096019744873, 1.4886915683746338, 1.7362871170043945, 1.9838825464248657, 2.231477975845337, 2.4790735244750977, 2.7266690731048584, 2.974264621734619, 3.221859931945801, 3.4694554805755615, 3.7170510292053223, 3.964646339416504, 4.212242126464844, 4.459837436676025, 4.707432746887207, 4.955028533935547, 5.2026238441467285, 5.45021915435791, 5.69781494140625, 5.945410251617432, 6.193005561828613, 6.440601348876953]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 4.0, 7.0, 8.0, 3.0, 12.0, 14.0, 17.0, 20.0, 24.0, 32.0, 43.0, 44.0, 36.0, 59.0, 41.0, 71.0, 68.0, 72.0, 64.0, 51.0, 39.0, 49.0, 30.0, 30.0, 28.0, 27.0, 23.0, 12.0, 13.0, 11.0, 13.0, 8.0, 2.0, 4.0, 3.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9496837854385376, -1.887587308883667, -1.8254908323287964, -1.7633943557739258, -1.7012978792190552, -1.6392014026641846, -1.5771050453186035, -1.5150084495544434, -1.4529120922088623, -1.3908156156539917, -1.328719139099121, -1.2666226625442505, -1.2045261859893799, -1.1424297094345093, -1.0803332328796387, -1.0182368755340576, -0.9561402797698975, -0.8940438032150269, -0.8319473266601562, -0.7698508501052856, -0.707754373550415, -0.6456578969955444, -0.5835614800453186, -0.521465003490448, -0.4593685269355774, -0.3972720503807068, -0.3351755738258362, -0.27307912707328796, -0.21098265051841736, -0.14888617396354675, -0.08678972721099854, -0.02469325065612793, 0.037403106689453125, 0.09949957579374313, 0.16159604489803314, 0.22369250655174255, 0.28578898310661316, 0.34788545966148376, 0.409981906414032, 0.4720783829689026, 0.5341748595237732, 0.5962713360786438, 0.6583678126335144, 0.7204642295837402, 0.7825607061386108, 0.8446571826934814, 0.906753659248352, 0.9688501358032227, 1.0309466123580933, 1.0930430889129639, 1.1551395654678345, 1.217236042022705, 1.2793325185775757, 1.3414289951324463, 1.4035253524780273, 1.4656219482421875, 1.5277183055877686, 1.5898147821426392, 1.6519112586975098, 1.7140077352523804, 1.776104211807251, 1.8382006883621216, 1.9002971649169922, 1.9623935222625732, 2.0244901180267334]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 9.0, 21.0, 13.0, 19.0, 31.0, 46.0, 59.0, 103.0, 132.0, 185.0, 328.0, 489.0, 857.0, 1554.0, 2757.0, 5591.0, 12532.0, 31001.0, 90701.0, 373254.0, 380840.0, 91588.0, 31424.0, 12652.0, 5622.0, 2919.0, 1474.0, 877.0, 552.0, 329.0, 198.0, 124.0, 91.0, 51.0, 35.0, 27.0, 24.0, 13.0, 6.0, 7.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1712646484375, -0.165740966796875, -0.16021728515625, -0.154693603515625, -0.149169921875, -0.143646240234375, -0.13812255859375, -0.132598876953125, -0.1270751953125, -0.121551513671875, -0.11602783203125, -0.110504150390625, -0.10498046875, -0.099456787109375, -0.09393310546875, -0.088409423828125, -0.0828857421875, -0.077362060546875, -0.07183837890625, -0.066314697265625, -0.060791015625, -0.055267333984375, -0.04974365234375, -0.044219970703125, -0.0386962890625, -0.033172607421875, -0.02764892578125, -0.022125244140625, -0.0166015625, -0.011077880859375, -0.00555419921875, -3.0517578125e-05, 0.0054931640625, 0.011016845703125, 0.01654052734375, 0.022064208984375, 0.027587890625, 0.033111572265625, 0.03863525390625, 0.044158935546875, 0.0496826171875, 0.055206298828125, 0.06072998046875, 0.066253662109375, 0.07177734375, 0.077301025390625, 0.08282470703125, 0.088348388671875, 0.0938720703125, 0.099395751953125, 0.10491943359375, 0.110443115234375, 0.115966796875, 0.121490478515625, 0.12701416015625, 0.132537841796875, 0.1380615234375, 0.143585205078125, 0.14910888671875, 0.154632568359375, 0.16015625, 0.165679931640625, 0.17120361328125, 0.176727294921875, 0.1822509765625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 11.0, 14.0, 16.0, 28.0, 34.0, 39.0, 42.0, 60.0, 46.0, 68.0, 80.0, 76.0, 75.0, 65.0, 63.0, 58.0, 49.0, 38.0, 31.0, 22.0, 10.0, 13.0, 12.0, 11.0, 5.0, 9.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10882568359375, -0.10399150848388672, -0.09915733337402344, -0.09432315826416016, -0.08948898315429688, -0.0846548080444336, -0.07982063293457031, -0.07498645782470703, -0.07015228271484375, -0.06531810760498047, -0.06048393249511719, -0.055649757385253906, -0.050815582275390625, -0.045981407165527344, -0.04114723205566406, -0.03631305694580078, -0.0314788818359375, -0.02664470672607422, -0.021810531616210938, -0.016976356506347656, -0.012142181396484375, -0.007308006286621094, -0.0024738311767578125, 0.0023603439331054688, 0.00719451904296875, 0.012028694152832031, 0.016862869262695312, 0.021697044372558594, 0.026531219482421875, 0.031365394592285156, 0.03619956970214844, 0.04103374481201172, 0.045867919921875, 0.05070209503173828, 0.05553627014160156, 0.060370445251464844, 0.06520462036132812, 0.0700387954711914, 0.07487297058105469, 0.07970714569091797, 0.08454132080078125, 0.08937549591064453, 0.09420967102050781, 0.0990438461303711, 0.10387802124023438, 0.10871219635009766, 0.11354637145996094, 0.11838054656982422, 0.1232147216796875, 0.12804889678955078, 0.13288307189941406, 0.13771724700927734, 0.14255142211914062, 0.1473855972290039, 0.1522197723388672, 0.15705394744873047, 0.16188812255859375, 0.16672229766845703, 0.1715564727783203, 0.1763906478881836, 0.18122482299804688, 0.18605899810791016, 0.19089317321777344, 0.19572734832763672, 0.2005615234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 8.0, 11.0, 11.0, 28.0, 35.0, 44.0, 66.0, 93.0, 177.0, 286.0, 542.0, 1253.0, 4206.0, 28075.0, 877660.0, 121342.0, 10632.0, 2219.0, 855.0, 406.0, 197.0, 131.0, 75.0, 55.0, 40.0, 26.0, 17.0, 15.0, 7.0, 10.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379638671875, -0.36730194091796875, -0.3549652099609375, -0.34262847900390625, -0.330291748046875, -0.31795501708984375, -0.3056182861328125, -0.29328155517578125, -0.28094482421875, -0.26860809326171875, -0.2562713623046875, -0.24393463134765625, -0.231597900390625, -0.21926116943359375, -0.2069244384765625, -0.19458770751953125, -0.1822509765625, -0.16991424560546875, -0.1575775146484375, -0.14524078369140625, -0.132904052734375, -0.12056732177734375, -0.1082305908203125, -0.09589385986328125, -0.08355712890625, -0.07122039794921875, -0.0588836669921875, -0.04654693603515625, -0.034210205078125, -0.02187347412109375, -0.0095367431640625, 0.00279998779296875, 0.01513671875, 0.02747344970703125, 0.0398101806640625, 0.05214691162109375, 0.064483642578125, 0.07682037353515625, 0.0891571044921875, 0.10149383544921875, 0.11383056640625, 0.12616729736328125, 0.1385040283203125, 0.15084075927734375, 0.163177490234375, 0.17551422119140625, 0.1878509521484375, 0.20018768310546875, 0.2125244140625, 0.22486114501953125, 0.2371978759765625, 0.24953460693359375, 0.261871337890625, 0.27420806884765625, 0.2865447998046875, 0.29888153076171875, 0.31121826171875, 0.32355499267578125, 0.3358917236328125, 0.34822845458984375, 0.360565185546875, 0.37290191650390625, 0.3852386474609375, 0.39757537841796875, 0.409912109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 1.0, 8.0, 8.0, 5.0, 18.0, 20.0, 15.0, 14.0, 19.0, 39.0, 45.0, 54.0, 78.0, 99.0, 104.0, 98.0, 89.0, 67.0, 42.0, 32.0, 37.0, 25.0, 22.0, 13.0, 13.0, 9.0, 3.0, 5.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.755859375, -0.7347488403320312, -0.7136383056640625, -0.6925277709960938, -0.671417236328125, -0.6503067016601562, -0.6291961669921875, -0.6080856323242188, -0.58697509765625, -0.5658645629882812, -0.5447540283203125, -0.5236434936523438, -0.502532958984375, -0.48142242431640625, -0.4603118896484375, -0.43920135498046875, -0.4180908203125, -0.39698028564453125, -0.3758697509765625, -0.35475921630859375, -0.333648681640625, -0.31253814697265625, -0.2914276123046875, -0.27031707763671875, -0.24920654296875, -0.22809600830078125, -0.2069854736328125, -0.18587493896484375, -0.164764404296875, -0.14365386962890625, -0.1225433349609375, -0.10143280029296875, -0.080322265625, -0.05921173095703125, -0.0381011962890625, -0.01699066162109375, 0.004119873046875, 0.02523040771484375, 0.0463409423828125, 0.06745147705078125, 0.08856201171875, 0.10967254638671875, 0.1307830810546875, 0.15189361572265625, 0.173004150390625, 0.19411468505859375, 0.2152252197265625, 0.23633575439453125, 0.2574462890625, 0.27855682373046875, 0.2996673583984375, 0.32077789306640625, 0.341888427734375, 0.36299896240234375, 0.3841094970703125, 0.40522003173828125, 0.42633056640625, 0.44744110107421875, 0.4685516357421875, 0.48966217041015625, 0.510772705078125, 0.5318832397460938, 0.5529937744140625, 0.5741043090820312, 0.59521484375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 8.0, 9.0, 10.0, 14.0, 14.0, 31.0, 31.0, 47.0, 52.0, 85.0, 120.0, 192.0, 409.0, 669.0, 1555.0, 3934.0, 12979.0, 74305.0, 892542.0, 45857.0, 9621.0, 3229.0, 1257.0, 644.0, 330.0, 192.0, 116.0, 64.0, 50.0, 37.0, 29.0, 22.0, 10.0, 16.0, 13.0, 8.0, 7.0, 8.0, 3.0, 2.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0833740234375, -0.08080005645751953, -0.07822608947753906, -0.0756521224975586, -0.07307815551757812, -0.07050418853759766, -0.06793022155761719, -0.06535625457763672, -0.06278228759765625, -0.06020832061767578, -0.05763435363769531, -0.055060386657714844, -0.052486419677734375, -0.049912452697753906, -0.04733848571777344, -0.04476451873779297, -0.0421905517578125, -0.03961658477783203, -0.03704261779785156, -0.034468650817871094, -0.031894683837890625, -0.029320716857910156, -0.026746749877929688, -0.02417278289794922, -0.02159881591796875, -0.01902484893798828, -0.016450881958007812, -0.013876914978027344, -0.011302947998046875, -0.008728981018066406, -0.0061550140380859375, -0.0035810470581054688, -0.001007080078125, 0.0015668869018554688, 0.0041408538818359375, 0.006714820861816406, 0.009288787841796875, 0.011862754821777344, 0.014436721801757812, 0.01701068878173828, 0.01958465576171875, 0.02215862274169922, 0.024732589721679688, 0.027306556701660156, 0.029880523681640625, 0.032454490661621094, 0.03502845764160156, 0.03760242462158203, 0.0401763916015625, 0.04275035858154297, 0.04532432556152344, 0.047898292541503906, 0.050472259521484375, 0.053046226501464844, 0.05562019348144531, 0.05819416046142578, 0.06076812744140625, 0.06334209442138672, 0.06591606140136719, 0.06849002838134766, 0.07106399536132812, 0.0736379623413086, 0.07621192932128906, 0.07878589630126953, 0.08135986328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 6.0, 1.0, 6.0, 5.0, 8.0, 7.0, 14.0, 15.0, 17.0, 25.0, 44.0, 70.0, 95.0, 131.0, 148.0, 124.0, 74.0, 55.0, 26.0, 23.0, 17.0, 9.0, 15.0, 10.0, 7.0, 12.0, 2.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.039836883544922e-05, -2.945028245449066e-05, -2.8502196073532104e-05, -2.7554109692573547e-05, -2.660602331161499e-05, -2.5657936930656433e-05, -2.4709850549697876e-05, -2.376176416873932e-05, -2.2813677787780762e-05, -2.1865591406822205e-05, -2.0917505025863647e-05, -1.996941864490509e-05, -1.9021332263946533e-05, -1.8073245882987976e-05, -1.712515950202942e-05, -1.6177073121070862e-05, -1.5228986740112305e-05, -1.4280900359153748e-05, -1.333281397819519e-05, -1.2384727597236633e-05, -1.1436641216278076e-05, -1.0488554835319519e-05, -9.540468454360962e-06, -8.592382073402405e-06, -7.644295692443848e-06, -6.6962093114852905e-06, -5.748122930526733e-06, -4.800036549568176e-06, -3.851950168609619e-06, -2.903863787651062e-06, -1.955777406692505e-06, -1.0076910257339478e-06, -5.960464477539063e-08, 8.884817361831665e-07, 1.8365681171417236e-06, 2.7846544981002808e-06, 3.732740879058838e-06, 4.680827260017395e-06, 5.628913640975952e-06, 6.577000021934509e-06, 7.525086402893066e-06, 8.473172783851624e-06, 9.42125916481018e-06, 1.0369345545768738e-05, 1.1317431926727295e-05, 1.2265518307685852e-05, 1.321360468864441e-05, 1.4161691069602966e-05, 1.5109777450561523e-05, 1.605786383152008e-05, 1.7005950212478638e-05, 1.7954036593437195e-05, 1.8902122974395752e-05, 1.985020935535431e-05, 2.0798295736312866e-05, 2.1746382117271423e-05, 2.269446849822998e-05, 2.3642554879188538e-05, 2.4590641260147095e-05, 2.5538727641105652e-05, 2.648681402206421e-05, 2.7434900403022766e-05, 2.8382986783981323e-05, 2.933107316493988e-05, 3.0279159545898438e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 12.0, 12.0, 12.0, 13.0, 19.0, 32.0, 45.0, 72.0, 111.0, 145.0, 280.0, 446.0, 836.0, 1553.0, 3568.0, 9228.0, 31148.0, 702123.0, 254174.0, 29189.0, 8792.0, 3310.0, 1487.0, 779.0, 429.0, 251.0, 166.0, 87.0, 81.0, 40.0, 27.0, 29.0, 15.0, 10.0, 10.0, 4.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.053558349609375, -0.05164384841918945, -0.049729347229003906, -0.04781484603881836, -0.04590034484863281, -0.043985843658447266, -0.04207134246826172, -0.04015684127807617, -0.038242340087890625, -0.03632783889770508, -0.03441333770751953, -0.032498836517333984, -0.030584335327148438, -0.02866983413696289, -0.026755332946777344, -0.024840831756591797, -0.02292633056640625, -0.021011829376220703, -0.019097328186035156, -0.01718282699584961, -0.015268325805664062, -0.013353824615478516, -0.011439323425292969, -0.009524822235107422, -0.007610321044921875, -0.005695819854736328, -0.0037813186645507812, -0.0018668174743652344, 4.76837158203125e-05, 0.0019621849060058594, 0.0038766860961914062, 0.005791187286376953, 0.0077056884765625, 0.009620189666748047, 0.011534690856933594, 0.01344919204711914, 0.015363693237304688, 0.017278194427490234, 0.01919269561767578, 0.021107196807861328, 0.023021697998046875, 0.024936199188232422, 0.02685070037841797, 0.028765201568603516, 0.030679702758789062, 0.03259420394897461, 0.034508705139160156, 0.0364232063293457, 0.03833770751953125, 0.0402522087097168, 0.042166709899902344, 0.04408121109008789, 0.04599571228027344, 0.047910213470458984, 0.04982471466064453, 0.05173921585083008, 0.053653717041015625, 0.05556821823120117, 0.05748271942138672, 0.059397220611572266, 0.06131172180175781, 0.06322622299194336, 0.0651407241821289, 0.06705522537231445, 0.0689697265625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 2.0, 8.0, 9.0, 13.0, 10.0, 15.0, 22.0, 29.0, 47.0, 64.0, 95.0, 116.0, 145.0, 132.0, 78.0, 58.0, 36.0, 30.0, 15.0, 13.0, 8.0, 7.0, 15.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06439208984375, -0.061844825744628906, -0.05929756164550781, -0.05675029754638672, -0.054203033447265625, -0.05165576934814453, -0.04910850524902344, -0.046561241149902344, -0.04401397705078125, -0.041466712951660156, -0.03891944885253906, -0.03637218475341797, -0.033824920654296875, -0.03127765655517578, -0.028730392456054688, -0.026183128356933594, -0.0236358642578125, -0.021088600158691406, -0.018541336059570312, -0.01599407196044922, -0.013446807861328125, -0.010899543762207031, -0.008352279663085938, -0.005805015563964844, -0.00325775146484375, -0.0007104873657226562, 0.0018367767333984375, 0.004384040832519531, 0.006931304931640625, 0.009478569030761719, 0.012025833129882812, 0.014573097229003906, 0.017120361328125, 0.019667625427246094, 0.022214889526367188, 0.02476215362548828, 0.027309417724609375, 0.02985668182373047, 0.03240394592285156, 0.034951210021972656, 0.03749847412109375, 0.040045738220214844, 0.04259300231933594, 0.04514026641845703, 0.047687530517578125, 0.05023479461669922, 0.05278205871582031, 0.055329322814941406, 0.0578765869140625, 0.060423851013183594, 0.06297111511230469, 0.06551837921142578, 0.06806564331054688, 0.07061290740966797, 0.07316017150878906, 0.07570743560791016, 0.07825469970703125, 0.08080196380615234, 0.08334922790527344, 0.08589649200439453, 0.08844375610351562, 0.09099102020263672, 0.09353828430175781, 0.0960855484008789, 0.0986328125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 9.0, 8.0, 21.0, 45.0, 118.0, 533.0, 152.0, 64.0, 29.0, 7.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.787998199462891, -4.685794353485107, -4.583590507507324, -4.481386661529541, -4.379182815551758, -4.276978492736816, -4.174775123596191, -4.07257080078125, -3.970366954803467, -3.8681631088256836, -3.7659592628479004, -3.663755416870117, -3.561551332473755, -3.4593474864959717, -3.3571436405181885, -3.2549397945404053, -3.152735948562622, -3.050532102584839, -2.9483282566070557, -2.8461241722106934, -2.74392032623291, -2.641716480255127, -2.5395126342773438, -2.4373087882995605, -2.3351049423217773, -2.232901096343994, -2.130697250366211, -2.0284934043884277, -1.9262893199920654, -1.8240854740142822, -1.721881628036499, -1.6196777820587158, -1.5174739360809326, -1.4152700901031494, -1.3130661249160767, -1.2108622789382935, -1.1086583137512207, -1.0064544677734375, -0.9042506217956543, -0.8020467162132263, -0.6998428106307983, -0.5976389050483704, -0.49543502926826477, -0.3932311534881592, -0.2910272479057312, -0.18882334232330322, -0.08661949634552002, 0.015584409236907959, 0.11778831481933594, 0.21999220550060272, 0.3221960961818695, 0.4243999719619751, 0.5266038775444031, 0.628807783126831, 0.7310116291046143, 0.8332155346870422, 0.9354194402694702, 1.0376232862472534, 1.1398272514343262, 1.2420310974121094, 1.3442349433898926, 1.4464389085769653, 1.5486427545547485, 1.6508467197418213, 1.7530505657196045]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 6.0, 12.0, 14.0, 20.0, 13.0, 16.0, 24.0, 23.0, 25.0, 23.0, 19.0, 42.0, 86.0, 337.0, 99.0, 35.0, 23.0, 30.0, 25.0, 17.0, 12.0, 13.0, 20.0, 8.0, 7.0, 8.0, 5.0, 2.0, 7.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5396223068237305, -1.4949918985366821, -1.4503616094589233, -1.405731201171875, -1.3611007928848267, -1.3164703845977783, -1.2718400955200195, -1.2272096872329712, -1.1825792789459229, -1.1379488706588745, -1.0933185815811157, -1.0486881732940674, -1.004057765007019, -0.9594274163246155, -0.9147970676422119, -0.8701666593551636, -0.82553631067276, -0.7809059619903564, -0.7362755537033081, -0.6916452050209045, -0.6470147967338562, -0.6023844480514526, -0.5577540397644043, -0.5131236910820007, -0.4684933125972748, -0.42386293411254883, -0.3792325556278229, -0.3346021771430969, -0.28997182846069336, -0.2453414350748062, -0.20071107149124146, -0.1560806930065155, -0.11145031452178955, -0.0668199360370636, -0.022189565002918243, 0.022440806031227112, 0.06707118451595306, 0.11170156300067902, 0.15633192658424377, 0.20096230506896973, 0.24559268355369568, 0.29022306203842163, 0.3348534405231476, 0.37948381900787354, 0.4241141676902771, 0.46874457597732544, 0.513374924659729, 0.5580053329467773, 0.6026356816291809, 0.6472660303115845, 0.6918964385986328, 0.7365267872810364, 0.7811571955680847, 0.8257875442504883, 0.8704179525375366, 0.9150483012199402, 0.9596786499023438, 1.004309058189392, 1.0489393472671509, 1.0935697555541992, 1.1382001638412476, 1.182830572128296, 1.2274608612060547, 1.272091269493103, 1.3167216777801514]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 9.0, 7.0, 10.0, 7.0, 10.0, 19.0, 22.0, 18.0, 29.0, 38.0, 37.0, 41.0, 73.0, 223.0, 172.0, 54.0, 46.0, 36.0, 33.0, 33.0, 14.0, 13.0, 14.0, 13.0, 8.0, 6.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1805419921875, -0.17601585388183594, -0.17148971557617188, -0.1669635772705078, -0.16243743896484375, -0.1579113006591797, -0.15338516235351562, -0.14885902404785156, -0.1443328857421875, -0.13980674743652344, -0.13528060913085938, -0.1307544708251953, -0.12622833251953125, -0.12170219421386719, -0.11717605590820312, -0.11264991760253906, -0.108123779296875, -0.10359764099121094, -0.09907150268554688, -0.09454536437988281, -0.09001922607421875, -0.08549308776855469, -0.08096694946289062, -0.07644081115722656, -0.0719146728515625, -0.06738853454589844, -0.06286239624023438, -0.05833625793457031, -0.05381011962890625, -0.04928398132324219, -0.044757843017578125, -0.04023170471191406, -0.03570556640625, -0.031179428100585938, -0.026653289794921875, -0.022127151489257812, -0.01760101318359375, -0.013074874877929688, -0.008548736572265625, -0.0040225982666015625, 0.0005035400390625, 0.0050296783447265625, 0.009555816650390625, 0.014081954956054688, 0.01860809326171875, 0.023134231567382812, 0.027660369873046875, 0.03218650817871094, 0.036712646484375, 0.04123878479003906, 0.045764923095703125, 0.05029106140136719, 0.05481719970703125, 0.05934333801269531, 0.06386947631835938, 0.06839561462402344, 0.0729217529296875, 0.07744789123535156, 0.08197402954101562, 0.08650016784667969, 0.09102630615234375, 0.09555244445800781, 0.10007858276367188, 0.10460472106933594, 0.109130859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 17.0, 21.0, 18.0, 30.0, 34.0, 60.0, 88.0, 144.0, 343.0, 835.0, 2603.0, 14902.0, 8345028.0, 19539.0, 3127.0, 913.0, 303.0, 187.0, 98.0, 79.0, 65.0, 41.0, 24.0, 10.0, 9.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 1.0, 4.0, 4.0, 4.0], "bins": [-1.41782546043396, -1.3767873048782349, -1.3357492685317993, -1.2947111129760742, -1.2536730766296387, -1.2126349210739136, -1.171596884727478, -1.130558729171753, -1.0895206928253174, -1.0484825372695923, -1.0074445009231567, -0.9664064049720764, -0.9253683090209961, -0.8843302130699158, -0.8432921171188354, -0.8022539615631104, -0.76121586561203, -0.7201777696609497, -0.6791396737098694, -0.6381015777587891, -0.5970634818077087, -0.5560253858566284, -0.5149872303009033, -0.4739491641521454, -0.43291106820106506, -0.39187297224998474, -0.3508348762989044, -0.3097967505455017, -0.2687586545944214, -0.22772057354450226, -0.18668246269226074, -0.14564436674118042, -0.1046062707901001, -0.06356817483901978, -0.022530071437358856, 0.018508031964302063, 0.059546127915382385, 0.10058422386646271, 0.14162233471870422, 0.18266043066978455, 0.22369852662086487, 0.2647366225719452, 0.3057747185230255, 0.3468128442764282, 0.38785094022750854, 0.42888903617858887, 0.4699271321296692, 0.5109652280807495, 0.5520033240318298, 0.5930414199829102, 0.6340795159339905, 0.6751176118850708, 0.7161557078361511, 0.7571938037872314, 0.7982319593429565, 0.8392699956893921, 0.8803081512451172, 0.9213462471961975, 0.9623843431472778, 1.003422498703003, 1.0444605350494385, 1.0854986906051636, 1.1265367269515991, 1.1675748825073242, 1.2086129188537598]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 5.0, 8.0, 2.0, 3.0, 4.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.2325770854949951, -1.19754159450531, -1.1625059843063354, -1.1274704933166504, -1.0924350023269653, -1.0573995113372803, -1.0223639011383057, -0.9873284101486206, -0.9522928595542908, -0.9172573089599609, -0.8822218179702759, -0.847186267375946, -0.8121507167816162, -0.7771152257919312, -0.7420796751976013, -0.7070441246032715, -0.6720086336135864, -0.6369730830192566, -0.6019375920295715, -0.5669020414352417, -0.5318665504455566, -0.4968309998512268, -0.461795449256897, -0.4267599284648895, -0.3917244076728821, -0.35668888688087463, -0.3216533660888672, -0.28661781549453735, -0.2515822947025299, -0.21654677391052246, -0.18151123821735382, -0.14647570252418518, -0.11144006252288818, -0.07640453428030014, -0.0413690060377121, -0.006333477795124054, 0.02870205044746399, 0.06373757123947144, 0.09877310693264008, 0.13380864262580872, 0.16884416341781616, 0.2038796842098236, 0.23891521990299225, 0.2739507555961609, 0.30898627638816833, 0.3440217971801758, 0.3790573477745056, 0.41409286856651306, 0.4491283893585205, 0.48416391015052795, 0.5191994309425354, 0.5542349815368652, 0.5892704725265503, 0.6243060231208801, 0.65934157371521, 0.694377064704895, 0.7294126152992249, 0.7644481658935547, 0.7994836568832397, 0.8345192074775696, 0.8695547580718994, 0.9045902490615845, 0.9396257996559143, 0.9746613502502441, 1.0096968412399292]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 10.0, 18.0, 25.0, 48.0, 99.0, 245.0, 655.0, 2208.0, 12565.0, 129552.0, 336393.0, 35423.0, 5177.0, 1136.0, 376.0, 148.0, 77.0, 43.0, 20.0, 21.0, 7.0, 3.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.697265625, -2.6207275390625, -2.544189453125, -2.4676513671875, -2.39111328125, -2.3145751953125, -2.238037109375, -2.1614990234375, -2.0849609375, -2.0084228515625, -1.931884765625, -1.8553466796875, -1.77880859375, -1.7022705078125, -1.625732421875, -1.5491943359375, -1.47265625, -1.3961181640625, -1.319580078125, -1.2430419921875, -1.16650390625, -1.0899658203125, -1.013427734375, -0.9368896484375, -0.8603515625, -0.7838134765625, -0.707275390625, -0.6307373046875, -0.55419921875, -0.4776611328125, -0.401123046875, -0.3245849609375, -0.248046875, -0.1715087890625, -0.094970703125, -0.0184326171875, 0.05810546875, 0.1346435546875, 0.211181640625, 0.2877197265625, 0.3642578125, 0.4407958984375, 0.517333984375, 0.5938720703125, 0.67041015625, 0.7469482421875, 0.823486328125, 0.9000244140625, 0.9765625, 1.0531005859375, 1.129638671875, 1.2061767578125, 1.28271484375, 1.3592529296875, 1.435791015625, 1.5123291015625, 1.5888671875, 1.6654052734375, 1.741943359375, 1.8184814453125, 1.89501953125, 1.9715576171875, 2.048095703125, 2.1246337890625, 2.201171875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 6.0, 19.0, 19.0, 22.0, 40.0, 42.0, 43.0, 50.0, 92.0, 109.0, 100.0, 83.0, 78.0, 66.0, 60.0, 42.0, 24.0, 16.0, 25.0, 20.0, 7.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11834716796875, -0.1128225326538086, -0.10729789733886719, -0.10177326202392578, -0.09624862670898438, -0.09072399139404297, -0.08519935607910156, -0.07967472076416016, -0.07415008544921875, -0.06862545013427734, -0.06310081481933594, -0.05757617950439453, -0.052051544189453125, -0.04652690887451172, -0.04100227355957031, -0.035477638244628906, -0.0299530029296875, -0.024428367614746094, -0.018903732299804688, -0.013379096984863281, -0.007854461669921875, -0.0023298263549804688, 0.0031948089599609375, 0.008719444274902344, 0.01424407958984375, 0.019768714904785156, 0.025293350219726562, 0.03081798553466797, 0.036342620849609375, 0.04186725616455078, 0.04739189147949219, 0.052916526794433594, 0.058441162109375, 0.0639657974243164, 0.06949043273925781, 0.07501506805419922, 0.08053970336914062, 0.08606433868408203, 0.09158897399902344, 0.09711360931396484, 0.10263824462890625, 0.10816287994384766, 0.11368751525878906, 0.11921215057373047, 0.12473678588867188, 0.13026142120361328, 0.1357860565185547, 0.1413106918334961, 0.1468353271484375, 0.1523599624633789, 0.1578845977783203, 0.16340923309326172, 0.16893386840820312, 0.17445850372314453, 0.17998313903808594, 0.18550777435302734, 0.19103240966796875, 0.19655704498291016, 0.20208168029785156, 0.20760631561279297, 0.21313095092773438, 0.21865558624267578, 0.2241802215576172, 0.2297048568725586, 0.2352294921875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 12.0, 21.0, 39.0, 56.0, 78.0, 91.0, 55.0, 41.0, 26.0, 16.0, 4.0, 10.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0994012355804443, -1.0622732639312744, -1.025145411491394, -0.9880174398422241, -0.9508894681930542, -0.913761556148529, -0.8766336441040039, -0.839505672454834, -0.8023777008056641, -0.7652497887611389, -0.728121817111969, -0.6909939050674438, -0.6538659334182739, -0.6167380213737488, -0.5796101093292236, -0.5424821376800537, -0.5053542256355286, -0.46822628378868103, -0.4310983419418335, -0.39397042989730835, -0.3568424582481384, -0.3197145462036133, -0.28258660435676575, -0.2454586625099182, -0.20833072066307068, -0.17120277881622314, -0.1340748369693756, -0.09694691002368927, -0.059818968176841736, -0.0226910263299942, 0.014436900615692139, 0.05156484246253967, 0.08869278430938721, 0.12582072615623474, 0.16294866800308228, 0.20007659494876862, 0.23720453679561615, 0.2743324637413025, 0.31146040558815, 0.34858834743499756, 0.3857162892818451, 0.4228442311286926, 0.45997217297554016, 0.4971001148223877, 0.5342280268669128, 0.5713559985160828, 0.6084839105606079, 0.6456118822097778, 0.682739794254303, 0.7198677062988281, 0.756995677947998, 0.7941235899925232, 0.8312515616416931, 0.8683794736862183, 0.9055074453353882, 0.9426353573799133, 0.9797632694244385, 1.0168912410736084, 1.0540190935134888, 1.0911470651626587, 1.1282750368118286, 1.1654030084609985, 1.202530860900879, 1.2396588325500488, 1.2767868041992188]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 1.0, 4.0, 7.0, 7.0, 13.0, 22.0, 37.0, 69.0, 73.0, 74.0, 52.0, 24.0, 24.0, 12.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.6544191241264343, -0.6343851089477539, -0.6143510341644287, -0.5943170189857483, -0.5742830038070679, -0.5542489886283875, -0.534214973449707, -0.5141808986663818, -0.4941468834877014, -0.474112868309021, -0.4540788233280182, -0.4340447783470154, -0.41401076316833496, -0.39397674798965454, -0.37394270300865173, -0.3539086580276489, -0.3338746428489685, -0.3138406276702881, -0.2938065826892853, -0.27377253770828247, -0.25373852252960205, -0.23370449244976044, -0.21367046236991882, -0.1936364322900772, -0.1736024022102356, -0.15356837213039398, -0.13353434205055237, -0.11350031197071075, -0.09346628189086914, -0.07343225181102753, -0.05339822173118591, -0.0333641916513443, -0.013330221176147461, 0.006703808903694153, 0.026737838983535767, 0.04677186906337738, 0.066805899143219, 0.08683992922306061, 0.10687395930290222, 0.12690798938274384, 0.14694201946258545, 0.16697604954242706, 0.18701007962226868, 0.2070441097021103, 0.2270781397819519, 0.24711216986179352, 0.26714619994163513, 0.28718024492263794, 0.30721426010131836, 0.3272482752799988, 0.3472823202610016, 0.3673163652420044, 0.3873503804206848, 0.40738439559936523, 0.42741844058036804, 0.44745248556137085, 0.46748650074005127, 0.4875205159187317, 0.5075545310974121, 0.5275886058807373, 0.5476226210594177, 0.5676566362380981, 0.5876907110214233, 0.6077247262001038, 0.6277587413787842]}, "_wandb": {"runtime": 4160}} \ No newline at end of file