diff --git "a/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" "b/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" --- "a/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" +++ "b/wandb/run-20220303_033953-1eigbhyo/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.2487, "train/learning_rate": 5.102040816326531e-06, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 7749, "_timestamp": 1646286542, "_step": 894, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 51.0, 788.0, 154.0, 11.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-157.27684020996094, -143.8236541748047, -130.37045288085938, -116.91726684570312, -103.46407318115234, -90.01087951660156, -76.55769348144531, -63.10449981689453, -49.65130615234375, -36.19811248779297, -22.744922637939453, -9.291732788085938, 4.161460876464844, 17.614654541015625, 31.067840576171875, 44.521034240722656, 57.97422790527344, 71.42742156982422, 84.880615234375, 98.33380126953125, 111.78699493408203, 125.24018859863281, 138.69337463378906, 152.14657592773438, 165.59976196289062, 179.05294799804688, 192.5061492919922, 205.95933532714844, 219.41253662109375, 232.86572265625, 246.31890869140625, 259.7720947265625, 273.22528076171875, 286.678466796875, 300.13165283203125, 313.5848388671875, 327.0380554199219, 340.4912414550781, 353.9444274902344, 367.3976135253906, 380.850830078125, 394.30401611328125, 407.7572021484375, 421.21038818359375, 434.6636047363281, 448.1167907714844, 461.5699768066406, 475.0231628417969, 488.4763488769531, 501.9295349121094, 515.3827514648438, 528.8359375, 542.2891235351562, 555.7423095703125, 569.1954956054688, 582.648681640625, 596.1018676757812, 609.5550537109375, 623.0082397460938, 636.46142578125, 649.9146118164062, 663.3677978515625, 676.821044921875, 690.2742309570312, 703.7274169921875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 0.0, 3.0, 9.0, 7.0, 7.0, 16.0, 23.0, 39.0, 34.0, 65.0, 107.0, 155.0, 167.0, 125.0, 93.0, 52.0, 31.0, 23.0, 12.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-367.9178161621094, -358.02044677734375, -348.12310791015625, -338.2257385253906, -328.3283996582031, -318.4310302734375, -308.53369140625, -298.6363220214844, -288.73895263671875, -278.8415832519531, -268.9442443847656, -259.046875, -249.14952087402344, -239.25216674804688, -229.3548126220703, -219.45745849609375, -209.5601043701172, -199.66275024414062, -189.76539611816406, -179.8680419921875, -169.97067260742188, -160.0733184814453, -150.17596435546875, -140.27859497070312, -130.38125610351562, -120.48390197753906, -110.58654022216797, -100.6891860961914, -90.79182434082031, -80.89447021484375, -70.99711608886719, -61.099754333496094, -51.202392578125, -41.30503463745117, -31.407678604125977, -21.51032257080078, -11.612964630126953, -1.715606689453125, 8.181747436523438, 18.07910919189453, 27.976463317871094, 37.87382125854492, 47.77117919921875, 57.66853332519531, 67.56588745117188, 77.46324920654297, 87.36060333251953, 97.25796508789062, 107.15531921386719, 117.05267333984375, 126.95003509521484, 136.84738159179688, 146.7447509765625, 156.64210510253906, 166.53945922851562, 176.43682861328125, 186.33416748046875, 196.2315216064453, 206.12887573242188, 216.0262451171875, 225.92359924316406, 235.82095336914062, 245.7183074951172, 255.61566162109375, 265.5130310058594]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 9.0, 7.0, 11.0, 17.0, 25.0, 38.0, 30.0, 72.0, 96.0, 131.0, 152.0, 130.0, 93.0, 59.0, 45.0, 28.0, 17.0, 8.0, 11.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4296875, -5.28729248046875, -5.1448974609375, -5.00250244140625, -4.860107421875, -4.71771240234375, -4.5753173828125, -4.43292236328125, -4.29052734375, -4.14813232421875, -4.0057373046875, -3.86334228515625, -3.720947265625, -3.57855224609375, -3.4361572265625, -3.29376220703125, -3.1513671875, -3.00897216796875, -2.8665771484375, -2.72418212890625, -2.581787109375, -2.43939208984375, -2.2969970703125, -2.15460205078125, -2.01220703125, -1.86981201171875, -1.7274169921875, -1.58502197265625, -1.442626953125, -1.30023193359375, -1.1578369140625, -1.01544189453125, -0.873046875, -0.73065185546875, -0.5882568359375, -0.44586181640625, -0.303466796875, -0.16107177734375, -0.0186767578125, 0.12371826171875, 0.26611328125, 0.40850830078125, 0.5509033203125, 0.69329833984375, 0.835693359375, 0.97808837890625, 1.1204833984375, 1.26287841796875, 1.4052734375, 1.54766845703125, 1.6900634765625, 1.83245849609375, 1.974853515625, 2.11724853515625, 2.2596435546875, 2.40203857421875, 2.54443359375, 2.68682861328125, 2.8292236328125, 2.97161865234375, 3.114013671875, 3.25640869140625, 3.3988037109375, 3.54119873046875, 3.68359375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 17.0, 23.0, 17.0, 19.0, 36.0, 71.0, 92.0, 125.0, 210.0, 343.0, 642.0, 1381.0, 3303.0, 14395.0, 4000953.0, 161666.0, 7076.0, 2043.0, 852.0, 372.0, 248.0, 113.0, 84.0, 59.0, 28.0, 23.0, 25.0, 13.0, 6.0, 6.0, 8.0, 8.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-46.40625, -45.1787109375, -43.951171875, -42.7236328125, -41.49609375, -40.2685546875, -39.041015625, -37.8134765625, -36.5859375, -35.3583984375, -34.130859375, -32.9033203125, -31.67578125, -30.4482421875, -29.220703125, -27.9931640625, -26.765625, -25.5380859375, -24.310546875, -23.0830078125, -21.85546875, -20.6279296875, -19.400390625, -18.1728515625, -16.9453125, -15.7177734375, -14.490234375, -13.2626953125, -12.03515625, -10.8076171875, -9.580078125, -8.3525390625, -7.125, -5.8974609375, -4.669921875, -3.4423828125, -2.21484375, -0.9873046875, 0.240234375, 1.4677734375, 2.6953125, 3.9228515625, 5.150390625, 6.3779296875, 7.60546875, 8.8330078125, 10.060546875, 11.2880859375, 12.515625, 13.7431640625, 14.970703125, 16.1982421875, 17.42578125, 18.6533203125, 19.880859375, 21.1083984375, 22.3359375, 23.5634765625, 24.791015625, 26.0185546875, 27.24609375, 28.4736328125, 29.701171875, 30.9287109375, 32.15625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 14.0, 14.0, 16.0, 29.0, 28.0, 35.0, 65.0, 97.0, 169.0, 298.0, 640.0, 1029.0, 687.0, 371.0, 194.0, 111.0, 72.0, 54.0, 38.0, 27.0, 17.0, 12.0, 14.0, 9.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.387939453125, -9.03369140625, -8.679443359375, -8.3251953125, -7.970947265625, -7.61669921875, -7.262451171875, -6.908203125, -6.553955078125, -6.19970703125, -5.845458984375, -5.4912109375, -5.136962890625, -4.78271484375, -4.428466796875, -4.07421875, -3.719970703125, -3.36572265625, -3.011474609375, -2.6572265625, -2.302978515625, -1.94873046875, -1.594482421875, -1.240234375, -0.885986328125, -0.53173828125, -0.177490234375, 0.1767578125, 0.531005859375, 0.88525390625, 1.239501953125, 1.59375, 1.947998046875, 2.30224609375, 2.656494140625, 3.0107421875, 3.364990234375, 3.71923828125, 4.073486328125, 4.427734375, 4.781982421875, 5.13623046875, 5.490478515625, 5.8447265625, 6.198974609375, 6.55322265625, 6.907470703125, 7.26171875, 7.615966796875, 7.97021484375, 8.324462890625, 8.6787109375, 9.032958984375, 9.38720703125, 9.741455078125, 10.095703125, 10.449951171875, 10.80419921875, 11.158447265625, 11.5126953125, 11.866943359375, 12.22119140625, 12.575439453125, 12.9296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 21.0, 19.0, 25.0, 42.0, 61.0, 81.0, 121.0, 177.0, 320.0, 1004.0, 6191.0, 151149.0, 3984397.0, 45848.0, 3317.0, 701.0, 284.0, 157.0, 97.0, 57.0, 66.0, 38.0, 25.0, 20.0, 15.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.53125, -35.5263671875, -34.521484375, -33.5166015625, -32.51171875, -31.5068359375, -30.501953125, -29.4970703125, -28.4921875, -27.4873046875, -26.482421875, -25.4775390625, -24.47265625, -23.4677734375, -22.462890625, -21.4580078125, -20.453125, -19.4482421875, -18.443359375, -17.4384765625, -16.43359375, -15.4287109375, -14.423828125, -13.4189453125, -12.4140625, -11.4091796875, -10.404296875, -9.3994140625, -8.39453125, -7.3896484375, -6.384765625, -5.3798828125, -4.375, -3.3701171875, -2.365234375, -1.3603515625, -0.35546875, 0.6494140625, 1.654296875, 2.6591796875, 3.6640625, 4.6689453125, 5.673828125, 6.6787109375, 7.68359375, 8.6884765625, 9.693359375, 10.6982421875, 11.703125, 12.7080078125, 13.712890625, 14.7177734375, 15.72265625, 16.7275390625, 17.732421875, 18.7373046875, 19.7421875, 20.7470703125, 21.751953125, 22.7568359375, 23.76171875, 24.7666015625, 25.771484375, 26.7763671875, 27.78125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 52.0, 218.0, 463.0, 201.0, 59.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.93682098388672, -117.5113754272461, -115.0859375, -112.66049194335938, -110.23505401611328, -107.80960845947266, -105.38417053222656, -102.95872497558594, -100.53327941894531, -98.10783386230469, -95.6823959350586, -93.25695037841797, -90.83151245117188, -88.40606689453125, -85.98062133789062, -83.55518341064453, -81.12974548339844, -78.70429992675781, -76.27886199951172, -73.8534164428711, -71.427978515625, -69.00253295898438, -66.57708740234375, -64.15164947509766, -61.72620391845703, -59.30076217651367, -56.87532043457031, -54.44987487792969, -52.02443313598633, -49.59899139404297, -47.17354965209961, -44.74810791015625, -42.32265853881836, -39.897216796875, -37.47177505493164, -35.04633331298828, -32.620887756347656, -30.195446014404297, -27.770004272460938, -25.344560623168945, -22.919118881225586, -20.493677139282227, -18.068233489990234, -15.642791748046875, -13.2173490524292, -10.791906356811523, -8.366464614868164, -5.941020965576172, -3.5155792236328125, -1.0901367664337158, 1.3353056907653809, 3.7607479095458984, 6.186190605163574, 8.61163330078125, 11.03707504272461, 13.462518692016602, 15.887960433959961, 18.31340217590332, 20.738845825195312, 23.164287567138672, 25.58972930908203, 28.015172958374023, 30.440614700317383, 32.866058349609375, 35.291500091552734]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 12.0, 9.0, 17.0, 13.0, 19.0, 21.0, 30.0, 21.0, 32.0, 32.0, 33.0, 46.0, 40.0, 42.0, 40.0, 49.0, 42.0, 44.0, 41.0, 39.0, 47.0, 38.0, 38.0, 40.0, 26.0, 25.0, 32.0, 23.0, 16.0, 15.0, 12.0, 14.0, 8.0, 5.0, 3.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.84715270996094, -32.708274841308594, -31.56939697265625, -30.430519104003906, -29.291641235351562, -28.15276336669922, -27.013885498046875, -25.87500762939453, -24.736129760742188, -23.597251892089844, -22.4583740234375, -21.319496154785156, -20.180618286132812, -19.04174041748047, -17.902862548828125, -16.76398468017578, -15.625104904174805, -14.486227035522461, -13.347349166870117, -12.208471298217773, -11.06959342956543, -9.930715560913086, -8.791836738586426, -7.652958869934082, -6.514081001281738, -5.3752031326293945, -4.236325263977051, -3.097446918487549, -1.958569049835205, -0.8196911811828613, 0.3191871643066406, 1.4580650329589844, 2.596942901611328, 3.735820770263672, 4.874698638916016, 6.013576984405518, 7.152454853057861, 8.291332244873047, 9.430211067199707, 10.56908893585205, 11.707966804504395, 12.846844673156738, 13.985722541809082, 15.124601364135742, 16.263479232788086, 17.40235710144043, 18.541234970092773, 19.680112838745117, 20.81899070739746, 21.957868576049805, 23.09674644470215, 24.235624313354492, 25.374502182006836, 26.51338005065918, 27.652259826660156, 28.7911376953125, 29.930015563964844, 31.068893432617188, 32.20777130126953, 33.346649169921875, 34.48552703857422, 35.62440490722656, 36.763282775878906, 37.90216064453125, 39.041038513183594]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 14.0, 10.0, 28.0, 29.0, 42.0, 50.0, 83.0, 106.0, 125.0, 157.0, 104.0, 76.0, 56.0, 36.0, 27.0, 13.0, 10.0, 7.0, 1.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.91290283203125, -4.7789306640625, -4.64495849609375, -4.510986328125, -4.37701416015625, -4.2430419921875, -4.10906982421875, -3.97509765625, -3.84112548828125, -3.7071533203125, -3.57318115234375, -3.439208984375, -3.30523681640625, -3.1712646484375, -3.03729248046875, -2.9033203125, -2.76934814453125, -2.6353759765625, -2.50140380859375, -2.367431640625, -2.23345947265625, -2.0994873046875, -1.96551513671875, -1.83154296875, -1.69757080078125, -1.5635986328125, -1.42962646484375, -1.295654296875, -1.16168212890625, -1.0277099609375, -0.89373779296875, -0.759765625, -0.62579345703125, -0.4918212890625, -0.35784912109375, -0.223876953125, -0.08990478515625, 0.0440673828125, 0.17803955078125, 0.31201171875, 0.44598388671875, 0.5799560546875, 0.71392822265625, 0.847900390625, 0.98187255859375, 1.1158447265625, 1.24981689453125, 1.3837890625, 1.51776123046875, 1.6517333984375, 1.78570556640625, 1.919677734375, 2.05364990234375, 2.1876220703125, 2.32159423828125, 2.45556640625, 2.58953857421875, 2.7235107421875, 2.85748291015625, 2.991455078125, 3.12542724609375, 3.2593994140625, 3.39337158203125, 3.52734375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 11.0, 5.0, 12.0, 10.0, 17.0, 19.0, 30.0, 37.0, 57.0, 77.0, 121.0, 180.0, 262.0, 416.0, 633.0, 993.0, 1474.0, 2513.0, 4484.0, 8982.0, 21978.0, 71196.0, 434702.0, 391400.0, 68229.0, 20756.0, 9021.0, 4418.0, 2397.0, 1447.0, 944.0, 583.0, 373.0, 238.0, 151.0, 125.0, 70.0, 58.0, 36.0, 30.0, 20.0, 11.0, 15.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2352294921875, -0.22763633728027344, -0.22004318237304688, -0.2124500274658203, -0.20485687255859375, -0.1972637176513672, -0.18967056274414062, -0.18207740783691406, -0.1744842529296875, -0.16689109802246094, -0.15929794311523438, -0.1517047882080078, -0.14411163330078125, -0.1365184783935547, -0.12892532348632812, -0.12133216857910156, -0.113739013671875, -0.10614585876464844, -0.09855270385742188, -0.09095954895019531, -0.08336639404296875, -0.07577323913574219, -0.06818008422851562, -0.06058692932128906, -0.0529937744140625, -0.04540061950683594, -0.037807464599609375, -0.030214309692382812, -0.02262115478515625, -0.015027999877929688, -0.007434844970703125, 0.0001583099365234375, 0.00775146484375, 0.015344619750976562, 0.022937774658203125, 0.030530929565429688, 0.03812408447265625, 0.04571723937988281, 0.053310394287109375, 0.06090354919433594, 0.0684967041015625, 0.07608985900878906, 0.08368301391601562, 0.09127616882324219, 0.09886932373046875, 0.10646247863769531, 0.11405563354492188, 0.12164878845214844, 0.129241943359375, 0.13683509826660156, 0.14442825317382812, 0.1520214080810547, 0.15961456298828125, 0.1672077178955078, 0.17480087280273438, 0.18239402770996094, 0.1899871826171875, 0.19758033752441406, 0.20517349243164062, 0.2127666473388672, 0.22035980224609375, 0.2279529571533203, 0.23554611206054688, 0.24313926696777344, 0.250732421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 4.0, 8.0, 12.0, 16.0, 24.0, 24.0, 28.0, 25.0, 33.0, 33.0, 27.0, 29.0, 39.0, 50.0, 44.0, 50.0, 1064.0, 62.0, 48.0, 59.0, 36.0, 49.0, 38.0, 34.0, 24.0, 27.0, 23.0, 18.0, 25.0, 16.0, 10.0, 14.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0546875, -2.952239990234375, -2.84979248046875, -2.747344970703125, -2.6448974609375, -2.542449951171875, -2.44000244140625, -2.337554931640625, -2.235107421875, -2.132659912109375, -2.03021240234375, -1.927764892578125, -1.8253173828125, -1.722869873046875, -1.62042236328125, -1.517974853515625, -1.41552734375, -1.313079833984375, -1.21063232421875, -1.108184814453125, -1.0057373046875, -0.903289794921875, -0.80084228515625, -0.698394775390625, -0.595947265625, -0.493499755859375, -0.39105224609375, -0.288604736328125, -0.1861572265625, -0.083709716796875, 0.01873779296875, 0.121185302734375, 0.2236328125, 0.326080322265625, 0.42852783203125, 0.530975341796875, 0.6334228515625, 0.735870361328125, 0.83831787109375, 0.940765380859375, 1.043212890625, 1.145660400390625, 1.24810791015625, 1.350555419921875, 1.4530029296875, 1.555450439453125, 1.65789794921875, 1.760345458984375, 1.86279296875, 1.965240478515625, 2.06768798828125, 2.170135498046875, 2.2725830078125, 2.375030517578125, 2.47747802734375, 2.579925537109375, 2.682373046875, 2.784820556640625, 2.88726806640625, 2.989715576171875, 3.0921630859375, 3.194610595703125, 3.29705810546875, 3.399505615234375, 3.501953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 10.0, 10.0, 12.0, 31.0, 32.0, 44.0, 77.0, 125.0, 156.0, 244.0, 444.0, 616.0, 1009.0, 1529.0, 2345.0, 3568.0, 5616.0, 8782.0, 14055.0, 22371.0, 36501.0, 61429.0, 111638.0, 1282345.0, 290438.0, 103776.0, 57655.0, 34439.0, 21122.0, 13204.0, 8499.0, 5444.0, 3410.0, 2157.0, 1433.0, 869.0, 593.0, 387.0, 269.0, 149.0, 105.0, 80.0, 39.0, 31.0, 14.0, 13.0, 7.0, 4.0, 7.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.08544921875, -0.082855224609375, -0.08026123046875, -0.077667236328125, -0.0750732421875, -0.072479248046875, -0.06988525390625, -0.067291259765625, -0.064697265625, -0.062103271484375, -0.05950927734375, -0.056915283203125, -0.0543212890625, -0.051727294921875, -0.04913330078125, -0.046539306640625, -0.0439453125, -0.041351318359375, -0.03875732421875, -0.036163330078125, -0.0335693359375, -0.030975341796875, -0.02838134765625, -0.025787353515625, -0.023193359375, -0.020599365234375, -0.01800537109375, -0.015411376953125, -0.0128173828125, -0.010223388671875, -0.00762939453125, -0.005035400390625, -0.00244140625, 0.000152587890625, 0.00274658203125, 0.005340576171875, 0.0079345703125, 0.010528564453125, 0.01312255859375, 0.015716552734375, 0.018310546875, 0.020904541015625, 0.02349853515625, 0.026092529296875, 0.0286865234375, 0.031280517578125, 0.03387451171875, 0.036468505859375, 0.0390625, 0.041656494140625, 0.04425048828125, 0.046844482421875, 0.0494384765625, 0.052032470703125, 0.05462646484375, 0.057220458984375, 0.059814453125, 0.062408447265625, 0.06500244140625, 0.067596435546875, 0.0701904296875, 0.072784423828125, 0.07537841796875, 0.077972412109375, 0.08056640625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 4.0, 9.0, 15.0, 14.0, 12.0, 14.0, 30.0, 30.0, 29.0, 47.0, 38.0, 49.0, 65.0, 74.0, 79.0, 85.0, 49.0, 59.0, 35.0, 40.0, 32.0, 31.0, 38.0, 15.0, 25.0, 17.0, 10.0, 11.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006933212280273438, -0.0006714761257171631, -0.0006496310234069824, -0.0006277859210968018, -0.0006059408187866211, -0.0005840957164764404, -0.0005622506141662598, -0.0005404055118560791, -0.0005185604095458984, -0.0004967153072357178, -0.0004748702049255371, -0.00045302510261535645, -0.0004311800003051758, -0.0004093348979949951, -0.00038748979568481445, -0.0003656446933746338, -0.0003437995910644531, -0.00032195448875427246, -0.0003001093864440918, -0.00027826428413391113, -0.00025641918182373047, -0.0002345740795135498, -0.00021272897720336914, -0.00019088387489318848, -0.0001690387725830078, -0.00014719367027282715, -0.00012534856796264648, -0.00010350346565246582, -8.165836334228516e-05, -5.981326103210449e-05, -3.796815872192383e-05, -1.6123056411743164e-05, 5.7220458984375e-06, 2.7567148208618164e-05, 4.941225051879883e-05, 7.125735282897949e-05, 9.310245513916016e-05, 0.00011494755744934082, 0.00013679265975952148, 0.00015863776206970215, 0.0001804828643798828, 0.00020232796669006348, 0.00022417306900024414, 0.0002460181713104248, 0.00026786327362060547, 0.00028970837593078613, 0.0003115534782409668, 0.00033339858055114746, 0.0003552436828613281, 0.0003770887851715088, 0.00039893388748168945, 0.0004207789897918701, 0.0004426240921020508, 0.00046446919441223145, 0.0004863142967224121, 0.0005081593990325928, 0.0005300045013427734, 0.0005518496036529541, 0.0005736947059631348, 0.0005955398082733154, 0.0006173849105834961, 0.0006392300128936768, 0.0006610751152038574, 0.0006829202175140381, 0.0007047653198242188]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 8.0, 11.0, 11.0, 15.0, 16.0, 24.0, 34.0, 50.0, 62.0, 72.0, 88.0, 127.0, 133.0, 217.0, 227.0, 366.0, 27533.0, 1017823.0, 448.0, 309.0, 193.0, 151.0, 156.0, 98.0, 94.0, 73.0, 40.0, 37.0, 34.0, 25.0, 15.0, 12.0, 14.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0141448974609375, -0.013705253601074219, -0.013265609741210938, -0.012825965881347656, -0.012386322021484375, -0.011946678161621094, -0.011507034301757812, -0.011067390441894531, -0.01062774658203125, -0.010188102722167969, -0.009748458862304688, -0.009308815002441406, -0.008869171142578125, -0.008429527282714844, -0.007989883422851562, -0.007550239562988281, -0.007110595703125, -0.006670951843261719, -0.0062313079833984375, -0.005791664123535156, -0.005352020263671875, -0.004912376403808594, -0.0044727325439453125, -0.004033088684082031, -0.00359344482421875, -0.0031538009643554688, -0.0027141571044921875, -0.0022745132446289062, -0.001834869384765625, -0.0013952255249023438, -0.0009555816650390625, -0.0005159378051757812, -7.62939453125e-05, 0.00036334991455078125, 0.0008029937744140625, 0.0012426376342773438, 0.001682281494140625, 0.0021219253540039062, 0.0025615692138671875, 0.0030012130737304688, 0.00344085693359375, 0.0038805007934570312, 0.0043201446533203125, 0.004759788513183594, 0.005199432373046875, 0.005639076232910156, 0.0060787200927734375, 0.006518363952636719, 0.0069580078125, 0.007397651672363281, 0.007837295532226562, 0.008276939392089844, 0.008716583251953125, 0.009156227111816406, 0.009595870971679688, 0.010035514831542969, 0.01047515869140625, 0.010914802551269531, 0.011354446411132812, 0.011794090270996094, 0.012233734130859375, 0.012673377990722656, 0.013113021850585938, 0.013552665710449219, 0.0139923095703125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1010.0, 4.0], "bins": [-0.01571698673069477, -0.015465534292161465, -0.015214082784950733, -0.014962630346417427, -0.014711177907884121, -0.014459725469350815, -0.014208273962140083, -0.013956821523606777, -0.013705369085073471, -0.013453916646540165, -0.013202465139329433, -0.012951012700796127, -0.012699560262262821, -0.012448107823729515, -0.012196656316518784, -0.011945203877985477, -0.011693752370774746, -0.01144229993224144, -0.011190848425030708, -0.010939395986497402, -0.010687943547964096, -0.010436492040753365, -0.010185039602220058, -0.009933587163686752, -0.00968213565647602, -0.009430683217942715, -0.009179231710731983, -0.008927779272198677, -0.008676326833665371, -0.008424874395132065, -0.008173422887921333, -0.007921970449388027, -0.0076705170795321465, -0.007419065106660128, -0.0071676126681268215, -0.006916160695254803, -0.006664708256721497, -0.006413256283849478, -0.006161804310977459, -0.005910351872444153, -0.005658899899572134, -0.005407447926700115, -0.005155995488166809, -0.00490454351529479, -0.0046530915424227715, -0.004401639103889465, -0.0041501871310174465, -0.003898734925314784, -0.0036472827196121216, -0.003395830513909459, -0.0031443783082067966, -0.002892926335334778, -0.0026414741296321154, -0.002390021923929453, -0.002138569951057434, -0.0018871177453547716, -0.001635665656067431, -0.0013842135667800903, -0.0011327613610774279, -0.0008813092135824263, -0.0006298570660874248, -0.0003784048603847623, -0.00012695277109742165, 0.000124499318189919, 0.0003759515529964119]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 19.0, 17.0, 21.0, 24.0, 33.0, 25.0, 36.0, 58.0, 48.0, 53.0, 68.0, 67.0, 60.0, 60.0, 61.0, 56.0, 43.0, 46.0, 44.0, 29.0, 35.0, 24.0, 14.0, 19.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006846189498901367, -0.0006620734930038452, -0.0006395280361175537, -0.0006169825792312622, -0.0005944371223449707, -0.0005718916654586792, -0.0005493462085723877, -0.0005268007516860962, -0.0005042552947998047, -0.0004817098379135132, -0.0004591643810272217, -0.0004366189241409302, -0.00041407346725463867, -0.00039152801036834717, -0.00036898255348205566, -0.00034643709659576416, -0.00032389163970947266, -0.00030134618282318115, -0.00027880072593688965, -0.00025625526905059814, -0.00023370981216430664, -0.00021116435527801514, -0.00018861889839172363, -0.00016607344150543213, -0.00014352798461914062, -0.00012098252773284912, -9.843707084655762e-05, -7.589161396026611e-05, -5.334615707397461e-05, -3.0800700187683105e-05, -8.255243301391602e-06, 1.4290213584899902e-05, 3.6835670471191406e-05, 5.938112735748291e-05, 8.192658424377441e-05, 0.00010447204113006592, 0.00012701749801635742, 0.00014956295490264893, 0.00017210841178894043, 0.00019465386867523193, 0.00021719932556152344, 0.00023974478244781494, 0.00026229023933410645, 0.00028483569622039795, 0.00030738115310668945, 0.00032992660999298096, 0.00035247206687927246, 0.00037501752376556396, 0.00039756298065185547, 0.00042010843753814697, 0.0004426538944244385, 0.00046519935131073, 0.0004877448081970215, 0.000510290265083313, 0.0005328357219696045, 0.000555381178855896, 0.0005779266357421875, 0.000600472092628479, 0.0006230175495147705, 0.000645563006401062, 0.0006681084632873535, 0.000690653920173645, 0.0007131993770599365, 0.000735744833946228, 0.0007582902908325195]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 14.0, 10.0, 28.0, 29.0, 42.0, 50.0, 83.0, 106.0, 125.0, 157.0, 104.0, 76.0, 56.0, 36.0, 27.0, 13.0, 10.0, 7.0, 1.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.91290283203125, -4.7789306640625, -4.64495849609375, -4.510986328125, -4.37701416015625, -4.2430419921875, -4.10906982421875, -3.97509765625, -3.84112548828125, -3.7071533203125, -3.57318115234375, -3.439208984375, -3.30523681640625, -3.1712646484375, -3.03729248046875, -2.9033203125, -2.76934814453125, -2.6353759765625, -2.50140380859375, -2.367431640625, -2.23345947265625, -2.0994873046875, -1.96551513671875, -1.83154296875, -1.69757080078125, -1.5635986328125, -1.42962646484375, -1.295654296875, -1.16168212890625, -1.0277099609375, -0.89373779296875, -0.759765625, -0.62579345703125, -0.4918212890625, -0.35784912109375, -0.223876953125, -0.08990478515625, 0.0440673828125, 0.17803955078125, 0.31201171875, 0.44598388671875, 0.5799560546875, 0.71392822265625, 0.847900390625, 0.98187255859375, 1.1158447265625, 1.24981689453125, 1.3837890625, 1.51776123046875, 1.6517333984375, 1.78570556640625, 1.919677734375, 2.05364990234375, 2.1876220703125, 2.32159423828125, 2.45556640625, 2.58953857421875, 2.7235107421875, 2.85748291015625, 2.991455078125, 3.12542724609375, 3.2593994140625, 3.39337158203125, 3.52734375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 11.0, 16.0, 29.0, 32.0, 56.0, 89.0, 94.0, 165.0, 250.0, 486.0, 955.0, 1974.0, 5367.0, 28971.0, 923839.0, 73186.0, 7823.0, 2549.0, 1160.0, 610.0, 312.0, 184.0, 114.0, 79.0, 51.0, 50.0, 28.0, 12.0, 11.0, 9.0, 12.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.328125, -26.515869140625, -25.70361328125, -24.891357421875, -24.0791015625, -23.266845703125, -22.45458984375, -21.642333984375, -20.830078125, -20.017822265625, -19.20556640625, -18.393310546875, -17.5810546875, -16.768798828125, -15.95654296875, -15.144287109375, -14.33203125, -13.519775390625, -12.70751953125, -11.895263671875, -11.0830078125, -10.270751953125, -9.45849609375, -8.646240234375, -7.833984375, -7.021728515625, -6.20947265625, -5.397216796875, -4.5849609375, -3.772705078125, -2.96044921875, -2.148193359375, -1.3359375, -0.523681640625, 0.28857421875, 1.100830078125, 1.9130859375, 2.725341796875, 3.53759765625, 4.349853515625, 5.162109375, 5.974365234375, 6.78662109375, 7.598876953125, 8.4111328125, 9.223388671875, 10.03564453125, 10.847900390625, 11.66015625, 12.472412109375, 13.28466796875, 14.096923828125, 14.9091796875, 15.721435546875, 16.53369140625, 17.345947265625, 18.158203125, 18.970458984375, 19.78271484375, 20.594970703125, 21.4072265625, 22.219482421875, 23.03173828125, 23.843994140625, 24.65625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 8.0, 7.0, 12.0, 11.0, 18.0, 19.0, 14.0, 28.0, 26.0, 18.0, 37.0, 33.0, 39.0, 51.0, 55.0, 59.0, 96.0, 192.0, 1520.0, 226.0, 100.0, 87.0, 63.0, 28.0, 43.0, 39.0, 24.0, 25.0, 29.0, 21.0, 18.0, 16.0, 11.0, 11.0, 12.0, 7.0, 12.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69921875, -6.47332763671875, -6.2474365234375, -6.02154541015625, -5.795654296875, -5.56976318359375, -5.3438720703125, -5.11798095703125, -4.89208984375, -4.66619873046875, -4.4403076171875, -4.21441650390625, -3.988525390625, -3.76263427734375, -3.5367431640625, -3.31085205078125, -3.0849609375, -2.85906982421875, -2.6331787109375, -2.40728759765625, -2.181396484375, -1.95550537109375, -1.7296142578125, -1.50372314453125, -1.27783203125, -1.05194091796875, -0.8260498046875, -0.60015869140625, -0.374267578125, -0.14837646484375, 0.0775146484375, 0.30340576171875, 0.529296875, 0.75518798828125, 0.9810791015625, 1.20697021484375, 1.432861328125, 1.65875244140625, 1.8846435546875, 2.11053466796875, 2.33642578125, 2.56231689453125, 2.7882080078125, 3.01409912109375, 3.239990234375, 3.46588134765625, 3.6917724609375, 3.91766357421875, 4.1435546875, 4.36944580078125, 4.5953369140625, 4.82122802734375, 5.047119140625, 5.27301025390625, 5.4989013671875, 5.72479248046875, 5.95068359375, 6.17657470703125, 6.4024658203125, 6.62835693359375, 6.854248046875, 7.08013916015625, 7.3060302734375, 7.53192138671875, 7.7578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 10.0, 6.0, 12.0, 16.0, 11.0, 22.0, 28.0, 23.0, 32.0, 42.0, 50.0, 81.0, 166.0, 335.0, 1262.0, 24451.0, 3090122.0, 26731.0, 1307.0, 384.0, 164.0, 95.0, 59.0, 45.0, 40.0, 25.0, 27.0, 21.0, 18.0, 23.0, 16.0, 6.0, 11.0, 12.0, 5.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.25, -29.319580078125, -28.38916015625, -27.458740234375, -26.5283203125, -25.597900390625, -24.66748046875, -23.737060546875, -22.806640625, -21.876220703125, -20.94580078125, -20.015380859375, -19.0849609375, -18.154541015625, -17.22412109375, -16.293701171875, -15.36328125, -14.432861328125, -13.50244140625, -12.572021484375, -11.6416015625, -10.711181640625, -9.78076171875, -8.850341796875, -7.919921875, -6.989501953125, -6.05908203125, -5.128662109375, -4.1982421875, -3.267822265625, -2.33740234375, -1.406982421875, -0.4765625, 0.453857421875, 1.38427734375, 2.314697265625, 3.2451171875, 4.175537109375, 5.10595703125, 6.036376953125, 6.966796875, 7.897216796875, 8.82763671875, 9.758056640625, 10.6884765625, 11.618896484375, 12.54931640625, 13.479736328125, 14.41015625, 15.340576171875, 16.27099609375, 17.201416015625, 18.1318359375, 19.062255859375, 19.99267578125, 20.923095703125, 21.853515625, 22.783935546875, 23.71435546875, 24.644775390625, 25.5751953125, 26.505615234375, 27.43603515625, 28.366455078125, 29.296875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 15.0, 219.0, 633.0, 135.0, 15.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.684745788574219, -5.3429388999938965, -3.001132011413574, -0.659325122833252, 1.6824817657470703, 4.024288177490234, 6.366095542907715, 8.707902908325195, 11.04970932006836, 13.391515731811523, 15.733323097229004, 18.075130462646484, 20.41693687438965, 22.758743286132812, 25.10055160522461, 27.442358016967773, 29.784164428710938, 32.125972747802734, 34.467777252197266, 36.80958557128906, 39.151390075683594, 41.49319839477539, 43.83500671386719, 46.17681121826172, 48.518619537353516, 50.86042785644531, 53.202232360839844, 55.54404067993164, 57.88584899902344, 60.22765350341797, 62.569461822509766, 64.91127014160156, 67.25308227539062, 69.59488677978516, 71.93669891357422, 74.27850341796875, 76.62030792236328, 78.96211242675781, 81.30392456054688, 83.6457290649414, 85.98753356933594, 88.32933807373047, 90.67115020751953, 93.01295471191406, 95.3547592163086, 97.69656372070312, 100.03837585449219, 102.38018035888672, 104.72199249267578, 107.06379699707031, 109.40560913085938, 111.7474136352539, 114.08921813964844, 116.4310302734375, 118.77283477783203, 121.11463928222656, 123.45645141601562, 125.79825592041016, 128.1400604248047, 130.48187255859375, 132.8236846923828, 135.1654815673828, 137.50729370117188, 139.84910583496094, 142.19090270996094]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 5.0, 8.0, 5.0, 14.0, 26.0, 16.0, 16.0, 21.0, 23.0, 30.0, 31.0, 37.0, 44.0, 23.0, 37.0, 48.0, 32.0, 48.0, 37.0, 48.0, 35.0, 38.0, 47.0, 42.0, 29.0, 37.0, 28.0, 28.0, 29.0, 24.0, 22.0, 9.0, 11.0, 14.0, 12.0, 5.0, 4.0, 10.0, 14.0, 6.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-27.12782096862793, -26.352937698364258, -25.578054428100586, -24.80316925048828, -24.02828598022461, -23.253402709960938, -22.478519439697266, -21.703636169433594, -20.928752899169922, -20.15386962890625, -19.378986358642578, -18.604103088378906, -17.8292179107666, -17.05433464050293, -16.279451370239258, -15.504568099975586, -14.729682922363281, -13.95479965209961, -13.179915428161621, -12.40503215789795, -11.630147933959961, -10.855264663696289, -10.080381393432617, -9.305498123168945, -8.530613899230957, -7.755730152130127, -6.980846405029297, -6.205963134765625, -5.431079387664795, -4.656195640563965, -3.881312370300293, -3.106428623199463, -2.3315467834472656, -1.556663155555725, -0.7817795276641846, -0.006896018981933594, 0.7679877281188965, 1.5428714752197266, 2.3177547454833984, 3.0926384925842285, 3.8675222396850586, 4.642405986785889, 5.417289733886719, 6.192173004150391, 6.967056751251221, 7.741940498352051, 8.516823768615723, 9.291707992553711, 10.066591262817383, 10.841474533081055, 11.616358757019043, 12.391242027282715, 13.166126251220703, 13.941009521484375, 14.715892791748047, 15.490776062011719, 16.26565933227539, 17.040542602539062, 17.815425872802734, 18.590309143066406, 19.36519432067871, 20.140077590942383, 20.914960861206055, 21.689844131469727, 22.46472930908203]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 2.0, 8.0, 14.0, 11.0, 28.0, 36.0, 40.0, 58.0, 91.0, 113.0, 116.0, 138.0, 102.0, 79.0, 57.0, 34.0, 22.0, 18.0, 10.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.10546875, -4.969482421875, -4.83349609375, -4.697509765625, -4.5615234375, -4.425537109375, -4.28955078125, -4.153564453125, -4.017578125, -3.881591796875, -3.74560546875, -3.609619140625, -3.4736328125, -3.337646484375, -3.20166015625, -3.065673828125, -2.9296875, -2.793701171875, -2.65771484375, -2.521728515625, -2.3857421875, -2.249755859375, -2.11376953125, -1.977783203125, -1.841796875, -1.705810546875, -1.56982421875, -1.433837890625, -1.2978515625, -1.161865234375, -1.02587890625, -0.889892578125, -0.75390625, -0.617919921875, -0.48193359375, -0.345947265625, -0.2099609375, -0.073974609375, 0.06201171875, 0.197998046875, 0.333984375, 0.469970703125, 0.60595703125, 0.741943359375, 0.8779296875, 1.013916015625, 1.14990234375, 1.285888671875, 1.421875, 1.557861328125, 1.69384765625, 1.829833984375, 1.9658203125, 2.101806640625, 2.23779296875, 2.373779296875, 2.509765625, 2.645751953125, 2.78173828125, 2.917724609375, 3.0537109375, 3.189697265625, 3.32568359375, 3.461669921875, 3.59765625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 11.0, 9.0, 12.0, 27.0, 28.0, 59.0, 92.0, 158.0, 212.0, 540.0, 1289.0, 4332.0, 61982.0, 4104052.0, 17378.0, 2580.0, 780.0, 328.0, 160.0, 89.0, 53.0, 37.0, 18.0, 9.0, 14.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.75, -41.60498046875, -40.4599609375, -39.31494140625, -38.169921875, -37.02490234375, -35.8798828125, -34.73486328125, -33.58984375, -32.44482421875, -31.2998046875, -30.15478515625, -29.009765625, -27.86474609375, -26.7197265625, -25.57470703125, -24.4296875, -23.28466796875, -22.1396484375, -20.99462890625, -19.849609375, -18.70458984375, -17.5595703125, -16.41455078125, -15.26953125, -14.12451171875, -12.9794921875, -11.83447265625, -10.689453125, -9.54443359375, -8.3994140625, -7.25439453125, -6.109375, -4.96435546875, -3.8193359375, -2.67431640625, -1.529296875, -0.38427734375, 0.7607421875, 1.90576171875, 3.05078125, 4.19580078125, 5.3408203125, 6.48583984375, 7.630859375, 8.77587890625, 9.9208984375, 11.06591796875, 12.2109375, 13.35595703125, 14.5009765625, 15.64599609375, 16.791015625, 17.93603515625, 19.0810546875, 20.22607421875, 21.37109375, 22.51611328125, 23.6611328125, 24.80615234375, 25.951171875, 27.09619140625, 28.2412109375, 29.38623046875, 30.53125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 13.0, 8.0, 15.0, 19.0, 25.0, 32.0, 48.0, 98.0, 107.0, 210.0, 304.0, 550.0, 799.0, 665.0, 399.0, 251.0, 162.0, 105.0, 60.0, 46.0, 30.0, 24.0, 18.0, 7.0, 12.0, 8.0, 7.0, 10.0, 3.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.890625, -7.6336669921875, -7.376708984375, -7.1197509765625, -6.86279296875, -6.6058349609375, -6.348876953125, -6.0919189453125, -5.8349609375, -5.5780029296875, -5.321044921875, -5.0640869140625, -4.80712890625, -4.5501708984375, -4.293212890625, -4.0362548828125, -3.779296875, -3.5223388671875, -3.265380859375, -3.0084228515625, -2.75146484375, -2.4945068359375, -2.237548828125, -1.9805908203125, -1.7236328125, -1.4666748046875, -1.209716796875, -0.9527587890625, -0.69580078125, -0.4388427734375, -0.181884765625, 0.0750732421875, 0.33203125, 0.5889892578125, 0.845947265625, 1.1029052734375, 1.35986328125, 1.6168212890625, 1.873779296875, 2.1307373046875, 2.3876953125, 2.6446533203125, 2.901611328125, 3.1585693359375, 3.41552734375, 3.6724853515625, 3.929443359375, 4.1864013671875, 4.443359375, 4.7003173828125, 4.957275390625, 5.2142333984375, 5.47119140625, 5.7281494140625, 5.985107421875, 6.2420654296875, 6.4990234375, 6.7559814453125, 7.012939453125, 7.2698974609375, 7.52685546875, 7.7838134765625, 8.040771484375, 8.2977294921875, 8.5546875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 6.0, 15.0, 17.0, 18.0, 56.0, 74.0, 113.0, 178.0, 335.0, 525.0, 942.0, 1678.0, 3245.0, 6484.0, 14236.0, 38563.0, 151931.0, 1371988.0, 2287519.0, 232318.0, 50384.0, 17758.0, 7684.0, 3695.0, 1892.0, 1073.0, 614.0, 354.0, 224.0, 119.0, 92.0, 42.0, 31.0, 22.0, 17.0, 16.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5859375, -11.236083984375, -10.88623046875, -10.536376953125, -10.1865234375, -9.836669921875, -9.48681640625, -9.136962890625, -8.787109375, -8.437255859375, -8.08740234375, -7.737548828125, -7.3876953125, -7.037841796875, -6.68798828125, -6.338134765625, -5.98828125, -5.638427734375, -5.28857421875, -4.938720703125, -4.5888671875, -4.239013671875, -3.88916015625, -3.539306640625, -3.189453125, -2.839599609375, -2.48974609375, -2.139892578125, -1.7900390625, -1.440185546875, -1.09033203125, -0.740478515625, -0.390625, -0.040771484375, 0.30908203125, 0.658935546875, 1.0087890625, 1.358642578125, 1.70849609375, 2.058349609375, 2.408203125, 2.758056640625, 3.10791015625, 3.457763671875, 3.8076171875, 4.157470703125, 4.50732421875, 4.857177734375, 5.20703125, 5.556884765625, 5.90673828125, 6.256591796875, 6.6064453125, 6.956298828125, 7.30615234375, 7.656005859375, 8.005859375, 8.355712890625, 8.70556640625, 9.055419921875, 9.4052734375, 9.755126953125, 10.10498046875, 10.454833984375, 10.8046875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 22.0, 74.0, 284.0, 400.0, 175.0, 45.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34567642211914, -32.80447769165039, -29.263277053833008, -25.722076416015625, -22.180877685546875, -18.639678955078125, -15.098478317260742, -11.55727767944336, -8.01607894897461, -4.474879264831543, -0.9336795806884766, 2.60752010345459, 6.148719787597656, 9.689918518066406, 13.231119155883789, 16.772319793701172, 20.313518524169922, 23.854717254638672, 27.395917892456055, 30.937118530273438, 34.47831726074219, 38.01951599121094, 41.56071472167969, 45.1019172668457, 48.64311599731445, 52.1843147277832, 55.72551727294922, 59.26671600341797, 62.80791473388672, 66.34911346435547, 69.89031219482422, 73.4315185546875, 76.97271728515625, 80.513916015625, 84.05511474609375, 87.5963134765625, 91.13751220703125, 94.6787109375, 98.21991729736328, 101.76111602783203, 105.30231475830078, 108.84351348876953, 112.38471221923828, 115.92591094970703, 119.46711730957031, 123.00831604003906, 126.54951477050781, 130.09071350097656, 133.6319122314453, 137.17311096191406, 140.7143096923828, 144.25550842285156, 147.7967071533203, 151.33790588378906, 154.8791046142578, 158.42031860351562, 161.96151733398438, 165.50271606445312, 169.04391479492188, 172.58511352539062, 176.12631225585938, 179.66751098632812, 183.20870971679688, 186.74990844726562, 190.29110717773438]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 3.0, 6.0, 3.0, 12.0, 13.0, 12.0, 14.0, 18.0, 17.0, 31.0, 26.0, 28.0, 31.0, 24.0, 28.0, 39.0, 27.0, 36.0, 43.0, 30.0, 38.0, 47.0, 35.0, 39.0, 32.0, 35.0, 36.0, 28.0, 28.0, 27.0, 22.0, 23.0, 24.0, 15.0, 22.0, 14.0, 23.0, 13.0, 8.0, 15.0, 8.0, 2.0, 6.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0], "bins": [-26.044818878173828, -25.298988342285156, -24.553159713745117, -23.807329177856445, -23.061498641967773, -22.315670013427734, -21.569839477539062, -20.82400894165039, -20.07818031311035, -19.33234977722168, -18.58652114868164, -17.84069061279297, -17.094860076904297, -16.349031448364258, -15.603200912475586, -14.85737133026123, -14.111540794372559, -13.365711212158203, -12.619880676269531, -11.874051094055176, -11.12822151184082, -10.382390975952148, -9.636561393737793, -8.890731811523438, -8.144901275634766, -7.399071216583252, -6.6532416343688965, -5.907411575317383, -5.161581993103027, -4.415751934051514, -3.669921875, -2.9240922927856445, -2.178262710571289, -1.4324328899383545, -0.6866029500961304, 0.05922698974609375, 0.8050568103790283, 1.550886631011963, 2.2967166900634766, 3.042546272277832, 3.7883763313293457, 4.534206390380859, 5.280035972595215, 6.0258660316467285, 6.771696090698242, 7.517525672912598, 8.263355255126953, 9.009185791015625, 9.75501537322998, 10.500844955444336, 11.246675491333008, 11.992505073547363, 12.738334655761719, 13.48416519165039, 14.229994773864746, 14.975824356079102, 15.721654891967773, 16.467485427856445, 17.213314056396484, 17.959144592285156, 18.704975128173828, 19.450803756713867, 20.19663429260254, 20.942462921142578, 21.68829345703125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 8.0, 20.0, 22.0, 22.0, 39.0, 62.0, 83.0, 88.0, 123.0, 103.0, 115.0, 90.0, 57.0, 66.0, 29.0, 25.0, 12.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8046875, -4.675201416015625, -4.54571533203125, -4.416229248046875, -4.2867431640625, -4.157257080078125, -4.02777099609375, -3.898284912109375, -3.768798828125, -3.639312744140625, -3.50982666015625, -3.380340576171875, -3.2508544921875, -3.121368408203125, -2.99188232421875, -2.862396240234375, -2.73291015625, -2.603424072265625, -2.47393798828125, -2.344451904296875, -2.2149658203125, -2.085479736328125, -1.95599365234375, -1.826507568359375, -1.697021484375, -1.567535400390625, -1.43804931640625, -1.308563232421875, -1.1790771484375, -1.049591064453125, -0.92010498046875, -0.790618896484375, -0.6611328125, -0.531646728515625, -0.40216064453125, -0.272674560546875, -0.1431884765625, -0.013702392578125, 0.11578369140625, 0.245269775390625, 0.374755859375, 0.504241943359375, 0.63372802734375, 0.763214111328125, 0.8927001953125, 1.022186279296875, 1.15167236328125, 1.281158447265625, 1.41064453125, 1.540130615234375, 1.66961669921875, 1.799102783203125, 1.9285888671875, 2.058074951171875, 2.18756103515625, 2.317047119140625, 2.446533203125, 2.576019287109375, 2.70550537109375, 2.834991455078125, 2.9644775390625, 3.093963623046875, 3.22344970703125, 3.352935791015625, 3.482421875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 15.0, 9.0, 32.0, 42.0, 51.0, 52.0, 82.0, 103.0, 151.0, 267.0, 367.0, 525.0, 797.0, 1349.0, 2198.0, 3827.0, 7414.0, 16832.0, 46359.0, 181476.0, 588692.0, 131660.0, 36997.0, 13984.0, 6540.0, 3306.0, 1903.0, 1133.0, 780.0, 534.0, 324.0, 199.0, 143.0, 103.0, 68.0, 62.0, 35.0, 30.0, 24.0, 14.0, 14.0, 13.0, 9.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2049560546875, -0.1982135772705078, -0.19147109985351562, -0.18472862243652344, -0.17798614501953125, -0.17124366760253906, -0.16450119018554688, -0.1577587127685547, -0.1510162353515625, -0.1442737579345703, -0.13753128051757812, -0.13078880310058594, -0.12404632568359375, -0.11730384826660156, -0.11056137084960938, -0.10381889343261719, -0.097076416015625, -0.09033393859863281, -0.08359146118164062, -0.07684898376464844, -0.07010650634765625, -0.06336402893066406, -0.056621551513671875, -0.04987907409667969, -0.0431365966796875, -0.03639411926269531, -0.029651641845703125, -0.022909164428710938, -0.01616668701171875, -0.009424209594726562, -0.002681732177734375, 0.0040607452392578125, 0.01080322265625, 0.017545700073242188, 0.024288177490234375, 0.031030654907226562, 0.03777313232421875, 0.04451560974121094, 0.051258087158203125, 0.05800056457519531, 0.0647430419921875, 0.07148551940917969, 0.07822799682617188, 0.08497047424316406, 0.09171295166015625, 0.09845542907714844, 0.10519790649414062, 0.11194038391113281, 0.118682861328125, 0.1254253387451172, 0.13216781616210938, 0.13891029357910156, 0.14565277099609375, 0.15239524841308594, 0.15913772583007812, 0.1658802032470703, 0.1726226806640625, 0.1793651580810547, 0.18610763549804688, 0.19285011291503906, 0.19959259033203125, 0.20633506774902344, 0.21307754516601562, 0.2198200225830078, 0.2265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 13.0, 12.0, 12.0, 18.0, 20.0, 20.0, 26.0, 22.0, 20.0, 35.0, 31.0, 32.0, 37.0, 37.0, 39.0, 38.0, 32.0, 1060.0, 32.0, 32.0, 35.0, 33.0, 27.0, 38.0, 44.0, 34.0, 37.0, 20.0, 20.0, 27.0, 18.0, 22.0, 18.0, 9.0, 12.0, 9.0, 10.0, 5.0, 7.0, 3.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.376953125, -2.306732177734375, -2.23651123046875, -2.166290283203125, -2.0960693359375, -2.025848388671875, -1.95562744140625, -1.885406494140625, -1.815185546875, -1.744964599609375, -1.67474365234375, -1.604522705078125, -1.5343017578125, -1.464080810546875, -1.39385986328125, -1.323638916015625, -1.25341796875, -1.183197021484375, -1.11297607421875, -1.042755126953125, -0.9725341796875, -0.902313232421875, -0.83209228515625, -0.761871337890625, -0.691650390625, -0.621429443359375, -0.55120849609375, -0.480987548828125, -0.4107666015625, -0.340545654296875, -0.27032470703125, -0.200103759765625, -0.1298828125, -0.059661865234375, 0.01055908203125, 0.080780029296875, 0.1510009765625, 0.221221923828125, 0.29144287109375, 0.361663818359375, 0.431884765625, 0.502105712890625, 0.57232666015625, 0.642547607421875, 0.7127685546875, 0.782989501953125, 0.85321044921875, 0.923431396484375, 0.99365234375, 1.063873291015625, 1.13409423828125, 1.204315185546875, 1.2745361328125, 1.344757080078125, 1.41497802734375, 1.485198974609375, 1.555419921875, 1.625640869140625, 1.69586181640625, 1.766082763671875, 1.8363037109375, 1.906524658203125, 1.97674560546875, 2.046966552734375, 2.1171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 13.0, 10.0, 10.0, 21.0, 43.0, 41.0, 62.0, 109.0, 139.0, 199.0, 345.0, 461.0, 657.0, 936.0, 1271.0, 1833.0, 2761.0, 3935.0, 5677.0, 8311.0, 12076.0, 18168.0, 27051.0, 41447.0, 65742.0, 110464.0, 1106326.0, 395159.0, 107412.0, 64158.0, 40583.0, 26325.0, 17551.0, 11885.0, 8118.0, 5376.0, 3782.0, 2649.0, 1794.0, 1311.0, 882.0, 623.0, 402.0, 307.0, 214.0, 156.0, 104.0, 80.0, 52.0, 28.0, 34.0, 20.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.057098388671875, -0.05525493621826172, -0.05341148376464844, -0.051568031311035156, -0.049724578857421875, -0.047881126403808594, -0.04603767395019531, -0.04419422149658203, -0.04235076904296875, -0.04050731658935547, -0.03866386413574219, -0.036820411682128906, -0.034976959228515625, -0.033133506774902344, -0.03129005432128906, -0.02944660186767578, -0.0276031494140625, -0.02575969696044922, -0.023916244506835938, -0.022072792053222656, -0.020229339599609375, -0.018385887145996094, -0.016542434692382812, -0.014698982238769531, -0.01285552978515625, -0.011012077331542969, -0.009168624877929688, -0.007325172424316406, -0.005481719970703125, -0.0036382675170898438, -0.0017948150634765625, 4.863739013671875e-05, 0.00189208984375, 0.0037355422973632812, 0.0055789947509765625, 0.007422447204589844, 0.009265899658203125, 0.011109352111816406, 0.012952804565429688, 0.014796257019042969, 0.01663970947265625, 0.01848316192626953, 0.020326614379882812, 0.022170066833496094, 0.024013519287109375, 0.025856971740722656, 0.027700424194335938, 0.02954387664794922, 0.0313873291015625, 0.03323078155517578, 0.03507423400878906, 0.036917686462402344, 0.038761138916015625, 0.040604591369628906, 0.04244804382324219, 0.04429149627685547, 0.04613494873046875, 0.04797840118408203, 0.04982185363769531, 0.051665306091308594, 0.053508758544921875, 0.055352210998535156, 0.05719566345214844, 0.05903911590576172, 0.060882568359375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 9.0, 4.0, 9.0, 13.0, 15.0, 6.0, 18.0, 21.0, 24.0, 28.0, 29.0, 38.0, 42.0, 56.0, 60.0, 57.0, 66.0, 51.0, 59.0, 48.0, 50.0, 53.0, 46.0, 34.0, 29.0, 25.0, 14.0, 20.0, 12.0, 12.0, 8.0, 13.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003948211669921875, -0.0003816261887550354, -0.0003684312105178833, -0.0003552362322807312, -0.0003420412540435791, -0.000328846275806427, -0.0003156512975692749, -0.0003024563193321228, -0.0002892613410949707, -0.0002760663628578186, -0.0002628713846206665, -0.0002496764063835144, -0.0002364814281463623, -0.0002232864499092102, -0.0002100914716720581, -0.000196896493434906, -0.0001837015151977539, -0.0001705065369606018, -0.0001573115587234497, -0.0001441165804862976, -0.0001309216022491455, -0.00011772662401199341, -0.00010453164577484131, -9.133666753768921e-05, -7.814168930053711e-05, -6.494671106338501e-05, -5.175173282623291e-05, -3.855675458908081e-05, -2.536177635192871e-05, -1.2166798114776611e-05, 1.0281801223754883e-06, 1.4223158359527588e-05, 2.7418136596679688e-05, 4.061311483383179e-05, 5.380809307098389e-05, 6.700307130813599e-05, 8.019804954528809e-05, 9.339302778244019e-05, 0.00010658800601959229, 0.00011978298425674438, 0.00013297796249389648, 0.00014617294073104858, 0.00015936791896820068, 0.00017256289720535278, 0.00018575787544250488, 0.00019895285367965698, 0.00021214783191680908, 0.00022534281015396118, 0.00023853778839111328, 0.0002517327666282654, 0.0002649277448654175, 0.0002781227231025696, 0.0002913177013397217, 0.0003045126795768738, 0.0003177076578140259, 0.000330902636051178, 0.0003440976142883301, 0.0003572925925254822, 0.0003704875707626343, 0.0003836825489997864, 0.0003968775272369385, 0.0004100725054740906, 0.0004232674837112427, 0.0004364624619483948, 0.0004496574401855469]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 3.0, 3.0, 5.0, 7.0, 13.0, 14.0, 22.0, 22.0, 29.0, 37.0, 44.0, 42.0, 46.0, 80.0, 91.0, 97.0, 120.0, 149.0, 168.0, 417.0, 8932.0, 842230.0, 191900.0, 2847.0, 244.0, 193.0, 144.0, 124.0, 91.0, 82.0, 59.0, 52.0, 47.0, 37.0, 38.0, 27.0, 16.0, 27.0, 13.0, 9.0, 5.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006885528564453125, -0.006669342517852783, -0.006453156471252441, -0.0062369704246521, -0.006020784378051758, -0.005804598331451416, -0.005588412284851074, -0.005372226238250732, -0.005156040191650391, -0.004939854145050049, -0.004723668098449707, -0.004507482051849365, -0.0042912960052490234, -0.004075109958648682, -0.00385892391204834, -0.003642737865447998, -0.0034265518188476562, -0.0032103657722473145, -0.0029941797256469727, -0.002777993679046631, -0.002561807632446289, -0.0023456215858459473, -0.0021294355392456055, -0.0019132494926452637, -0.0016970634460449219, -0.00148087739944458, -0.0012646913528442383, -0.0010485053062438965, -0.0008323192596435547, -0.0006161332130432129, -0.0003999471664428711, -0.0001837611198425293, 3.24249267578125e-05, 0.0002486109733581543, 0.0004647970199584961, 0.0006809830665588379, 0.0008971691131591797, 0.0011133551597595215, 0.0013295412063598633, 0.001545727252960205, 0.0017619132995605469, 0.0019780993461608887, 0.0021942853927612305, 0.0024104714393615723, 0.002626657485961914, 0.002842843532562256, 0.0030590295791625977, 0.0032752156257629395, 0.0034914016723632812, 0.003707587718963623, 0.003923773765563965, 0.004139959812164307, 0.0043561458587646484, 0.00457233190536499, 0.004788517951965332, 0.005004703998565674, 0.005220890045166016, 0.005437076091766357, 0.005653262138366699, 0.005869448184967041, 0.006085634231567383, 0.006301820278167725, 0.006518006324768066, 0.006734192371368408, 0.00695037841796875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 96.0, 858.0, 56.0, 2.0, 0.0, 1.0], "bins": [-0.007806016132235527, -0.007674674037843943, -0.007543331943452358, -0.007411989849060774, -0.0072806477546691895, -0.007149305660277605, -0.007017963565886021, -0.006886621471494436, -0.006755279377102852, -0.0066239372827112675, -0.006492595188319683, -0.006361253093928099, -0.006229910999536514, -0.00609856890514493, -0.0059672268107533455, -0.005835884716361761, -0.005704542621970177, -0.005573200527578592, -0.005441858433187008, -0.0053105163387954235, -0.005179174244403839, -0.005047832150012255, -0.00491649005562067, -0.004785147961229086, -0.004653806332498789, -0.0045224642381072044, -0.00439112214371562, -0.004259780049324036, -0.004128437954932451, -0.003997095860540867, -0.0038657537661492825, -0.003734411671757698, -0.0036030698101967573, -0.003471727715805173, -0.0033403856214135885, -0.003209043527022004, -0.0030777014326304197, -0.0029463593382388353, -0.0028150174766778946, -0.00268367538228631, -0.002552333287894726, -0.0024209911935031414, -0.002289649099111557, -0.0021583070047199726, -0.002026964910328388, -0.0018956228159368038, -0.0017642808379605412, -0.0016329387435689569, -0.0015015965327620506, -0.0013702544383704662, -0.0012389123439788818, -0.0011075702495872974, -0.000976228213403374, -0.0008448861190117896, -0.0007135440828278661, -0.0005822019884362817, -0.0004508599522523582, -0.0003195178578607738, -0.00018817579257301986, -5.683372728526592e-05, 7.450836710631847e-05, 0.00020585046149790287, 0.00033719249768182635, 0.00046853459207341075, 0.0005998766864649951]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 5.0, 8.0, 16.0, 11.0, 17.0, 22.0, 29.0, 36.0, 29.0, 43.0, 30.0, 45.0, 43.0, 58.0, 41.0, 47.0, 49.0, 56.0, 53.0, 50.0, 38.0, 43.0, 32.0, 32.0, 30.0, 23.0, 20.0, 20.0, 18.0, 12.0, 6.0, 8.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0004892349243164062, -0.0004763184115290642, -0.0004634018987417221, -0.00045048538595438004, -0.00043756887316703796, -0.0004246523603796959, -0.0004117358475923538, -0.00039881933480501175, -0.0003859028220176697, -0.0003729863092303276, -0.00036006979644298553, -0.00034715328365564346, -0.0003342367708683014, -0.0003213202580809593, -0.00030840374529361725, -0.0002954872325062752, -0.0002825707197189331, -0.00026965420693159103, -0.00025673769414424896, -0.0002438211813569069, -0.00023090466856956482, -0.00021798815578222275, -0.00020507164299488068, -0.0001921551302075386, -0.00017923861742019653, -0.00016632210463285446, -0.0001534055918455124, -0.00014048907905817032, -0.00012757256627082825, -0.00011465605348348618, -0.0001017395406961441, -8.882302790880203e-05, -7.590651512145996e-05, -6.299000233411789e-05, -5.007348954677582e-05, -3.7156976759433746e-05, -2.4240463972091675e-05, -1.1323951184749603e-05, 1.5925616025924683e-06, 1.450907438993454e-05, 2.742558717727661e-05, 4.034209996461868e-05, 5.3258612751960754e-05, 6.617512553930283e-05, 7.90916383266449e-05, 9.200815111398697e-05, 0.00010492466390132904, 0.00011784117668867111, 0.00013075768947601318, 0.00014367420226335526, 0.00015659071505069733, 0.0001695072278380394, 0.00018242374062538147, 0.00019534025341272354, 0.0002082567662000656, 0.00022117327898740768, 0.00023408979177474976, 0.00024700630456209183, 0.0002599228173494339, 0.00027283933013677597, 0.00028575584292411804, 0.0002986723557114601, 0.0003115888684988022, 0.00032450538128614426, 0.00033742189407348633]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 8.0, 20.0, 22.0, 22.0, 39.0, 62.0, 83.0, 88.0, 123.0, 103.0, 115.0, 90.0, 57.0, 66.0, 29.0, 25.0, 12.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8046875, -4.675201416015625, -4.54571533203125, -4.416229248046875, -4.2867431640625, -4.157257080078125, -4.02777099609375, -3.898284912109375, -3.768798828125, -3.639312744140625, -3.50982666015625, -3.380340576171875, -3.2508544921875, -3.121368408203125, -2.99188232421875, -2.862396240234375, -2.73291015625, -2.603424072265625, -2.47393798828125, -2.344451904296875, -2.2149658203125, -2.085479736328125, -1.95599365234375, -1.826507568359375, -1.697021484375, -1.567535400390625, -1.43804931640625, -1.308563232421875, -1.1790771484375, -1.049591064453125, -0.92010498046875, -0.790618896484375, -0.6611328125, -0.531646728515625, -0.40216064453125, -0.272674560546875, -0.1431884765625, -0.013702392578125, 0.11578369140625, 0.245269775390625, 0.374755859375, 0.504241943359375, 0.63372802734375, 0.763214111328125, 0.8927001953125, 1.022186279296875, 1.15167236328125, 1.281158447265625, 1.41064453125, 1.540130615234375, 1.66961669921875, 1.799102783203125, 1.9285888671875, 2.058074951171875, 2.18756103515625, 2.317047119140625, 2.446533203125, 2.576019287109375, 2.70550537109375, 2.834991455078125, 2.9644775390625, 3.093963623046875, 3.22344970703125, 3.352935791015625, 3.482421875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 7.0, 8.0, 11.0, 11.0, 11.0, 45.0, 61.0, 61.0, 125.0, 196.0, 331.0, 654.0, 1557.0, 4678.0, 19406.0, 111546.0, 588540.0, 267183.0, 40857.0, 8664.0, 2588.0, 955.0, 444.0, 209.0, 130.0, 79.0, 53.0, 36.0, 25.0, 23.0, 13.0, 8.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.1328125, -4.9891357421875, -4.845458984375, -4.7017822265625, -4.55810546875, -4.4144287109375, -4.270751953125, -4.1270751953125, -3.9833984375, -3.8397216796875, -3.696044921875, -3.5523681640625, -3.40869140625, -3.2650146484375, -3.121337890625, -2.9776611328125, -2.833984375, -2.6903076171875, -2.546630859375, -2.4029541015625, -2.25927734375, -2.1156005859375, -1.971923828125, -1.8282470703125, -1.6845703125, -1.5408935546875, -1.397216796875, -1.2535400390625, -1.10986328125, -0.9661865234375, -0.822509765625, -0.6788330078125, -0.53515625, -0.3914794921875, -0.247802734375, -0.1041259765625, 0.03955078125, 0.1832275390625, 0.326904296875, 0.4705810546875, 0.6142578125, 0.7579345703125, 0.901611328125, 1.0452880859375, 1.18896484375, 1.3326416015625, 1.476318359375, 1.6199951171875, 1.763671875, 1.9073486328125, 2.051025390625, 2.1947021484375, 2.33837890625, 2.4820556640625, 2.625732421875, 2.7694091796875, 2.9130859375, 3.0567626953125, 3.200439453125, 3.3441162109375, 3.48779296875, 3.6314697265625, 3.775146484375, 3.9188232421875, 4.0625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 9.0, 12.0, 23.0, 19.0, 20.0, 23.0, 20.0, 29.0, 28.0, 33.0, 30.0, 34.0, 48.0, 48.0, 99.0, 239.0, 1621.0, 217.0, 71.0, 53.0, 46.0, 43.0, 36.0, 25.0, 32.0, 37.0, 22.0, 16.0, 26.0, 16.0, 19.0, 11.0, 8.0, 6.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.7109375, -8.4652099609375, -8.219482421875, -7.9737548828125, -7.72802734375, -7.4822998046875, -7.236572265625, -6.9908447265625, -6.7451171875, -6.4993896484375, -6.253662109375, -6.0079345703125, -5.76220703125, -5.5164794921875, -5.270751953125, -5.0250244140625, -4.779296875, -4.5335693359375, -4.287841796875, -4.0421142578125, -3.79638671875, -3.5506591796875, -3.304931640625, -3.0592041015625, -2.8134765625, -2.5677490234375, -2.322021484375, -2.0762939453125, -1.83056640625, -1.5848388671875, -1.339111328125, -1.0933837890625, -0.84765625, -0.6019287109375, -0.356201171875, -0.1104736328125, 0.13525390625, 0.3809814453125, 0.626708984375, 0.8724365234375, 1.1181640625, 1.3638916015625, 1.609619140625, 1.8553466796875, 2.10107421875, 2.3468017578125, 2.592529296875, 2.8382568359375, 3.083984375, 3.3297119140625, 3.575439453125, 3.8211669921875, 4.06689453125, 4.3126220703125, 4.558349609375, 4.8040771484375, 5.0498046875, 5.2955322265625, 5.541259765625, 5.7869873046875, 6.03271484375, 6.2784423828125, 6.524169921875, 6.7698974609375, 7.015625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 7.0, 9.0, 11.0, 18.0, 20.0, 10.0, 25.0, 31.0, 30.0, 46.0, 35.0, 64.0, 92.0, 155.0, 321.0, 925.0, 17596.0, 3073751.0, 50268.0, 1298.0, 371.0, 184.0, 94.0, 79.0, 46.0, 33.0, 27.0, 28.0, 22.0, 21.0, 20.0, 15.0, 15.0, 13.0, 9.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.8797607421875, -13.376708984375, -12.8736572265625, -12.37060546875, -11.8675537109375, -11.364501953125, -10.8614501953125, -10.3583984375, -9.8553466796875, -9.352294921875, -8.8492431640625, -8.34619140625, -7.8431396484375, -7.340087890625, -6.8370361328125, -6.333984375, -5.8309326171875, -5.327880859375, -4.8248291015625, -4.32177734375, -3.8187255859375, -3.315673828125, -2.8126220703125, -2.3095703125, -1.8065185546875, -1.303466796875, -0.8004150390625, -0.29736328125, 0.2056884765625, 0.708740234375, 1.2117919921875, 1.71484375, 2.2178955078125, 2.720947265625, 3.2239990234375, 3.72705078125, 4.2301025390625, 4.733154296875, 5.2362060546875, 5.7392578125, 6.2423095703125, 6.745361328125, 7.2484130859375, 7.75146484375, 8.2545166015625, 8.757568359375, 9.2606201171875, 9.763671875, 10.2667236328125, 10.769775390625, 11.2728271484375, 11.77587890625, 12.2789306640625, 12.781982421875, 13.2850341796875, 13.7880859375, 14.2911376953125, 14.794189453125, 15.2972412109375, 15.80029296875, 16.3033447265625, 16.806396484375, 17.3094482421875, 17.8125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 8.0, 1004.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.908605575561523, -8.04853630065918, -2.1884679794311523, 3.671600341796875, 9.531669616699219, 15.391738891601562, 21.251806259155273, 27.111875534057617, 32.971946716308594, 38.83201599121094, 44.69208526611328, 50.552154541015625, 56.41222381591797, 62.27229309082031, 68.13235473632812, 73.992431640625, 79.85249328613281, 85.71256256103516, 91.5726318359375, 97.43270111083984, 103.29277038574219, 109.15283966064453, 115.01290893554688, 120.87297058105469, 126.73304748535156, 132.59310913085938, 138.45318603515625, 144.31324768066406, 150.17332458496094, 156.03338623046875, 161.89346313476562, 167.75352478027344, 173.6136016845703, 179.47366333007812, 185.333740234375, 191.1938018798828, 197.0538787841797, 202.9139404296875, 208.77401733398438, 214.6340789794922, 220.49415588378906, 226.35421752929688, 232.21429443359375, 238.07435607910156, 243.93443298339844, 249.79449462890625, 255.65457153320312, 261.5146484375, 267.37469482421875, 273.2347717285156, 279.0948181152344, 284.95489501953125, 290.8149719238281, 296.675048828125, 302.53509521484375, 308.3951721191406, 314.2552490234375, 320.1153259277344, 325.9753723144531, 331.83544921875, 337.6955261230469, 343.55560302734375, 349.4156494140625, 355.2757263183594, 361.13580322265625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 3.0, 9.0, 16.0, 16.0, 20.0, 22.0, 27.0, 37.0, 36.0, 34.0, 38.0, 27.0, 32.0, 51.0, 35.0, 49.0, 53.0, 45.0, 45.0, 38.0, 39.0, 38.0, 35.0, 46.0, 30.0, 25.0, 19.0, 21.0, 18.0, 19.0, 11.0, 12.0, 6.0, 5.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-28.132755279541016, -27.32994842529297, -26.527141571044922, -25.724334716796875, -24.921525955200195, -24.11871910095215, -23.3159122467041, -22.513105392456055, -21.710298538208008, -20.90749168395996, -20.104684829711914, -19.301876068115234, -18.499069213867188, -17.69626235961914, -16.893455505371094, -16.090648651123047, -15.287840843200684, -14.485033988952637, -13.682226181030273, -12.879419326782227, -12.07661247253418, -11.273805618286133, -10.47099781036377, -9.668190956115723, -8.86538314819336, -8.062576293945312, -7.259768962860107, -6.456961631774902, -5.6541547775268555, -4.85134744644165, -4.048540115356445, -3.2457332611083984, -2.4429264068603516, -1.6401193141937256, -0.8373121023178101, -0.03450489044189453, 0.7683022022247314, 1.5711092948913574, 2.3739166259765625, 3.1767234802246094, 3.9795308113098145, 4.7823381423950195, 5.585144996643066, 6.3879523277282715, 7.190759658813477, 7.993566513061523, 8.79637336730957, 9.599180221557617, 10.40198802947998, 11.204794883728027, 12.00760269165039, 12.810409545898438, 13.613216400146484, 14.416023254394531, 15.218831062316895, 16.021636962890625, 16.824445724487305, 17.62725257873535, 18.4300594329834, 19.232868194580078, 20.035675048828125, 20.838481903076172, 21.64128875732422, 22.444095611572266, 23.246902465820312]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 4.0, 11.0, 16.0, 25.0, 26.0, 43.0, 63.0, 77.0, 87.0, 123.0, 99.0, 114.0, 94.0, 59.0, 60.0, 34.0, 19.0, 15.0, 11.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8125, -4.682647705078125, -4.55279541015625, -4.422943115234375, -4.2930908203125, -4.163238525390625, -4.03338623046875, -3.903533935546875, -3.773681640625, -3.643829345703125, -3.51397705078125, -3.384124755859375, -3.2542724609375, -3.124420166015625, -2.99456787109375, -2.864715576171875, -2.73486328125, -2.605010986328125, -2.47515869140625, -2.345306396484375, -2.2154541015625, -2.085601806640625, -1.95574951171875, -1.825897216796875, -1.696044921875, -1.566192626953125, -1.43634033203125, -1.306488037109375, -1.1766357421875, -1.046783447265625, -0.91693115234375, -0.787078857421875, -0.6572265625, -0.527374267578125, -0.39752197265625, -0.267669677734375, -0.1378173828125, -0.007965087890625, 0.12188720703125, 0.251739501953125, 0.381591796875, 0.511444091796875, 0.64129638671875, 0.771148681640625, 0.9010009765625, 1.030853271484375, 1.16070556640625, 1.290557861328125, 1.42041015625, 1.550262451171875, 1.68011474609375, 1.809967041015625, 1.9398193359375, 2.069671630859375, 2.19952392578125, 2.329376220703125, 2.459228515625, 2.589080810546875, 2.71893310546875, 2.848785400390625, 2.9786376953125, 3.108489990234375, 3.23834228515625, 3.368194580078125, 3.498046875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 10.0, 20.0, 13.0, 29.0, 35.0, 80.0, 107.0, 159.0, 347.0, 645.0, 1277.0, 3636.0, 18283.0, 2704388.0, 1444805.0, 15338.0, 3023.0, 1042.0, 471.0, 221.0, 150.0, 73.0, 35.0, 31.0, 23.0, 13.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.875, -24.201904296875, -23.52880859375, -22.855712890625, -22.1826171875, -21.509521484375, -20.83642578125, -20.163330078125, -19.490234375, -18.817138671875, -18.14404296875, -17.470947265625, -16.7978515625, -16.124755859375, -15.45166015625, -14.778564453125, -14.10546875, -13.432373046875, -12.75927734375, -12.086181640625, -11.4130859375, -10.739990234375, -10.06689453125, -9.393798828125, -8.720703125, -8.047607421875, -7.37451171875, -6.701416015625, -6.0283203125, -5.355224609375, -4.68212890625, -4.009033203125, -3.3359375, -2.662841796875, -1.98974609375, -1.316650390625, -0.6435546875, 0.029541015625, 0.70263671875, 1.375732421875, 2.048828125, 2.721923828125, 3.39501953125, 4.068115234375, 4.7412109375, 5.414306640625, 6.08740234375, 6.760498046875, 7.43359375, 8.106689453125, 8.77978515625, 9.452880859375, 10.1259765625, 10.799072265625, 11.47216796875, 12.145263671875, 12.818359375, 13.491455078125, 14.16455078125, 14.837646484375, 15.5107421875, 16.183837890625, 16.85693359375, 17.530029296875, 18.203125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 14.0, 2.0, 16.0, 19.0, 11.0, 33.0, 39.0, 70.0, 71.0, 137.0, 223.0, 339.0, 498.0, 715.0, 627.0, 420.0, 288.0, 170.0, 116.0, 68.0, 54.0, 33.0, 26.0, 16.0, 14.0, 9.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1015625, -6.8629150390625, -6.624267578125, -6.3856201171875, -6.14697265625, -5.9083251953125, -5.669677734375, -5.4310302734375, -5.1923828125, -4.9537353515625, -4.715087890625, -4.4764404296875, -4.23779296875, -3.9991455078125, -3.760498046875, -3.5218505859375, -3.283203125, -3.0445556640625, -2.805908203125, -2.5672607421875, -2.32861328125, -2.0899658203125, -1.851318359375, -1.6126708984375, -1.3740234375, -1.1353759765625, -0.896728515625, -0.6580810546875, -0.41943359375, -0.1807861328125, 0.057861328125, 0.2965087890625, 0.53515625, 0.7738037109375, 1.012451171875, 1.2510986328125, 1.48974609375, 1.7283935546875, 1.967041015625, 2.2056884765625, 2.4443359375, 2.6829833984375, 2.921630859375, 3.1602783203125, 3.39892578125, 3.6375732421875, 3.876220703125, 4.1148681640625, 4.353515625, 4.5921630859375, 4.830810546875, 5.0694580078125, 5.30810546875, 5.5467529296875, 5.785400390625, 6.0240478515625, 6.2626953125, 6.5013427734375, 6.739990234375, 6.9786376953125, 7.21728515625, 7.4559326171875, 7.694580078125, 7.9332275390625, 8.171875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 5.0, 12.0, 26.0, 31.0, 41.0, 57.0, 86.0, 153.0, 287.0, 448.0, 851.0, 1699.0, 3508.0, 8250.0, 22829.0, 82200.0, 555135.0, 2847407.0, 550748.0, 82273.0, 22762.0, 8288.0, 3512.0, 1684.0, 832.0, 438.0, 258.0, 161.0, 86.0, 83.0, 43.0, 29.0, 22.0, 9.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.3125, -11.9449462890625, -11.577392578125, -11.2098388671875, -10.84228515625, -10.4747314453125, -10.107177734375, -9.7396240234375, -9.3720703125, -9.0045166015625, -8.636962890625, -8.2694091796875, -7.90185546875, -7.5343017578125, -7.166748046875, -6.7991943359375, -6.431640625, -6.0640869140625, -5.696533203125, -5.3289794921875, -4.96142578125, -4.5938720703125, -4.226318359375, -3.8587646484375, -3.4912109375, -3.1236572265625, -2.756103515625, -2.3885498046875, -2.02099609375, -1.6534423828125, -1.285888671875, -0.9183349609375, -0.55078125, -0.1832275390625, 0.184326171875, 0.5518798828125, 0.91943359375, 1.2869873046875, 1.654541015625, 2.0220947265625, 2.3896484375, 2.7572021484375, 3.124755859375, 3.4923095703125, 3.85986328125, 4.2274169921875, 4.594970703125, 4.9625244140625, 5.330078125, 5.6976318359375, 6.065185546875, 6.4327392578125, 6.80029296875, 7.1678466796875, 7.535400390625, 7.9029541015625, 8.2705078125, 8.6380615234375, 9.005615234375, 9.3731689453125, 9.74072265625, 10.1082763671875, 10.475830078125, 10.8433837890625, 11.2109375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 25.0, 59.0, 145.0, 269.0, 278.0, 140.0, 67.0, 16.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.68810272216797, -21.9373779296875, -19.18665313720703, -16.43592643737793, -13.685201644897461, -10.934476852416992, -8.18375015258789, -5.433025360107422, -2.682300567626953, 0.06842470169067383, 2.819149971008301, 5.569875717163086, 8.320600509643555, 11.071325302124023, 13.822052001953125, 16.572776794433594, 19.323501586914062, 22.07422637939453, 24.824951171875, 27.5756778717041, 30.32640266418457, 33.077125549316406, 35.82785415649414, 38.57857894897461, 41.32930374145508, 44.08002853393555, 46.830753326416016, 49.58148193359375, 52.33220672607422, 55.08293151855469, 57.833656311035156, 60.584381103515625, 63.33509826660156, 66.08582305908203, 68.8365478515625, 71.58727264404297, 74.33799743652344, 77.0887222290039, 79.83944702148438, 82.59017944335938, 85.34089660644531, 88.09162139892578, 90.84234619140625, 93.59307098388672, 96.34379577636719, 99.09452056884766, 101.84524536132812, 104.59597778320312, 107.3467025756836, 110.09742736816406, 112.84815216064453, 115.598876953125, 118.34960174560547, 121.10032653808594, 123.85105895996094, 126.60177612304688, 129.35250854492188, 132.10324096679688, 134.8539581298828, 137.6046905517578, 140.35540771484375, 143.10614013671875, 145.8568572998047, 148.6075897216797, 151.35830688476562]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 4.0, 4.0, 10.0, 5.0, 4.0, 13.0, 15.0, 17.0, 18.0, 23.0, 26.0, 28.0, 34.0, 26.0, 29.0, 39.0, 38.0, 38.0, 40.0, 54.0, 34.0, 53.0, 47.0, 37.0, 43.0, 34.0, 38.0, 34.0, 34.0, 34.0, 19.0, 13.0, 28.0, 18.0, 14.0, 10.0, 14.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.430870056152344, -23.666580200195312, -22.90228843688965, -22.137998580932617, -21.373706817626953, -20.609416961669922, -19.84512710571289, -19.080835342407227, -18.316545486450195, -17.552255630493164, -16.7879638671875, -16.02367401123047, -15.259383201599121, -14.495092391967773, -13.730801582336426, -12.966510772705078, -12.20221996307373, -11.437929153442383, -10.673638343811035, -9.909347534179688, -9.145057678222656, -8.380766868591309, -7.616476058959961, -6.8521857261657715, -6.087894916534424, -5.323604106903076, -4.559313774108887, -3.795022964477539, -3.0307323932647705, -2.266441822052002, -1.5021510124206543, -0.7378606796264648, 0.026430130004882812, 0.7907207608222961, 1.5550113916397095, 2.3193020820617676, 3.083592653274536, 3.8478832244873047, 4.612174034118652, 5.376464366912842, 6.1407551765441895, 6.905045986175537, 7.669336318969727, 8.433627128601074, 9.197917938232422, 9.962207794189453, 10.726499557495117, 11.490789413452148, 12.255080223083496, 13.019371032714844, 13.783661842346191, 14.547952651977539, 15.31224250793457, 16.076534271240234, 16.840824127197266, 17.605113983154297, 18.36940574645996, 19.133695602416992, 19.897987365722656, 20.662277221679688, 21.42656898498535, 22.190858840942383, 22.955150604248047, 23.719440460205078, 24.48373031616211]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 27.0, 18.0, 45.0, 58.0, 53.0, 82.0, 88.0, 82.0, 114.0, 94.0, 81.0, 60.0, 55.0, 41.0, 22.0, 15.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.475860595703125, -4.35406494140625, -4.232269287109375, -4.1104736328125, -3.988677978515625, -3.86688232421875, -3.745086669921875, -3.623291015625, -3.501495361328125, -3.37969970703125, -3.257904052734375, -3.1361083984375, -3.014312744140625, -2.89251708984375, -2.770721435546875, -2.64892578125, -2.527130126953125, -2.40533447265625, -2.283538818359375, -2.1617431640625, -2.039947509765625, -1.91815185546875, -1.796356201171875, -1.674560546875, -1.552764892578125, -1.43096923828125, -1.309173583984375, -1.1873779296875, -1.065582275390625, -0.94378662109375, -0.821990966796875, -0.7001953125, -0.578399658203125, -0.45660400390625, -0.334808349609375, -0.2130126953125, -0.091217041015625, 0.03057861328125, 0.152374267578125, 0.274169921875, 0.395965576171875, 0.51776123046875, 0.639556884765625, 0.7613525390625, 0.883148193359375, 1.00494384765625, 1.126739501953125, 1.24853515625, 1.370330810546875, 1.49212646484375, 1.613922119140625, 1.7357177734375, 1.857513427734375, 1.97930908203125, 2.101104736328125, 2.222900390625, 2.344696044921875, 2.46649169921875, 2.588287353515625, 2.7100830078125, 2.831878662109375, 2.95367431640625, 3.075469970703125, 3.197265625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 5.0, 4.0, 15.0, 16.0, 27.0, 29.0, 42.0, 39.0, 67.0, 85.0, 149.0, 222.0, 292.0, 477.0, 731.0, 1197.0, 2001.0, 3578.0, 6876.0, 14968.0, 39481.0, 127508.0, 562265.0, 195822.0, 54302.0, 19796.0, 8379.0, 4176.0, 2291.0, 1286.0, 846.0, 498.0, 337.0, 236.0, 149.0, 97.0, 69.0, 55.0, 34.0, 25.0, 21.0, 20.0, 14.0, 5.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.215087890625, -0.20806884765625, -0.2010498046875, -0.19403076171875, -0.18701171875, -0.17999267578125, -0.1729736328125, -0.16595458984375, -0.158935546875, -0.15191650390625, -0.1448974609375, -0.13787841796875, -0.130859375, -0.12384033203125, -0.1168212890625, -0.10980224609375, -0.102783203125, -0.09576416015625, -0.0887451171875, -0.08172607421875, -0.07470703125, -0.06768798828125, -0.0606689453125, -0.05364990234375, -0.046630859375, -0.03961181640625, -0.0325927734375, -0.02557373046875, -0.0185546875, -0.01153564453125, -0.0045166015625, 0.00250244140625, 0.009521484375, 0.01654052734375, 0.0235595703125, 0.03057861328125, 0.03759765625, 0.04461669921875, 0.0516357421875, 0.05865478515625, 0.065673828125, 0.07269287109375, 0.0797119140625, 0.08673095703125, 0.09375, 0.10076904296875, 0.1077880859375, 0.11480712890625, 0.121826171875, 0.12884521484375, 0.1358642578125, 0.14288330078125, 0.14990234375, 0.15692138671875, 0.1639404296875, 0.17095947265625, 0.177978515625, 0.18499755859375, 0.1920166015625, 0.19903564453125, 0.2060546875, 0.21307373046875, 0.2200927734375, 0.22711181640625, 0.234130859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 3.0, 10.0, 8.0, 8.0, 15.0, 16.0, 17.0, 23.0, 25.0, 34.0, 24.0, 23.0, 35.0, 44.0, 36.0, 48.0, 39.0, 59.0, 1070.0, 34.0, 42.0, 26.0, 45.0, 45.0, 36.0, 36.0, 27.0, 32.0, 25.0, 26.0, 20.0, 21.0, 16.0, 17.0, 9.0, 6.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.875, -2.797149658203125, -2.71929931640625, -2.641448974609375, -2.5635986328125, -2.485748291015625, -2.40789794921875, -2.330047607421875, -2.252197265625, -2.174346923828125, -2.09649658203125, -2.018646240234375, -1.9407958984375, -1.862945556640625, -1.78509521484375, -1.707244873046875, -1.62939453125, -1.551544189453125, -1.47369384765625, -1.395843505859375, -1.3179931640625, -1.240142822265625, -1.16229248046875, -1.084442138671875, -1.006591796875, -0.928741455078125, -0.85089111328125, -0.773040771484375, -0.6951904296875, -0.617340087890625, -0.53948974609375, -0.461639404296875, -0.3837890625, -0.305938720703125, -0.22808837890625, -0.150238037109375, -0.0723876953125, 0.005462646484375, 0.08331298828125, 0.161163330078125, 0.239013671875, 0.316864013671875, 0.39471435546875, 0.472564697265625, 0.5504150390625, 0.628265380859375, 0.70611572265625, 0.783966064453125, 0.86181640625, 0.939666748046875, 1.01751708984375, 1.095367431640625, 1.1732177734375, 1.251068115234375, 1.32891845703125, 1.406768798828125, 1.484619140625, 1.562469482421875, 1.64031982421875, 1.718170166015625, 1.7960205078125, 1.873870849609375, 1.95172119140625, 2.029571533203125, 2.107421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 11.0, 27.0, 32.0, 53.0, 82.0, 170.0, 213.0, 347.0, 576.0, 900.0, 1385.0, 2148.0, 3448.0, 5425.0, 8555.0, 13523.0, 21553.0, 35825.0, 60720.0, 111932.0, 1036662.0, 530396.0, 109881.0, 60367.0, 34968.0, 21682.0, 13417.0, 8378.0, 5206.0, 3355.0, 2162.0, 1371.0, 843.0, 542.0, 354.0, 220.0, 119.0, 102.0, 70.0, 38.0, 15.0, 25.0, 6.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06503105163574219, -0.06286239624023438, -0.06069374084472656, -0.05852508544921875, -0.05635643005371094, -0.054187774658203125, -0.05201911926269531, -0.0498504638671875, -0.04768180847167969, -0.045513153076171875, -0.04334449768066406, -0.04117584228515625, -0.03900718688964844, -0.036838531494140625, -0.03466987609863281, -0.032501220703125, -0.030332565307617188, -0.028163909912109375, -0.025995254516601562, -0.02382659912109375, -0.021657943725585938, -0.019489288330078125, -0.017320632934570312, -0.0151519775390625, -0.012983322143554688, -0.010814666748046875, -0.008646011352539062, -0.00647735595703125, -0.0043087005615234375, -0.002140045166015625, 2.86102294921875e-05, 0.002197265625, 0.0043659210205078125, 0.006534576416015625, 0.008703231811523438, 0.01087188720703125, 0.013040542602539062, 0.015209197998046875, 0.017377853393554688, 0.0195465087890625, 0.021715164184570312, 0.023883819580078125, 0.026052474975585938, 0.02822113037109375, 0.030389785766601562, 0.032558441162109375, 0.03472709655761719, 0.036895751953125, 0.03906440734863281, 0.041233062744140625, 0.04340171813964844, 0.04557037353515625, 0.04773902893066406, 0.049907684326171875, 0.05207633972167969, 0.0542449951171875, 0.05641365051269531, 0.058582305908203125, 0.06075096130371094, 0.06291961669921875, 0.06508827209472656, 0.06725692749023438, 0.06942558288574219, 0.07159423828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 7.0, 9.0, 2.0, 11.0, 8.0, 17.0, 14.0, 34.0, 36.0, 34.0, 64.0, 46.0, 79.0, 73.0, 91.0, 81.0, 69.0, 59.0, 69.0, 37.0, 34.0, 21.0, 24.0, 15.0, 22.0, 6.0, 13.0, 9.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007200241088867188, -0.0007008612155914307, -0.0006816983222961426, -0.0006625354290008545, -0.0006433725357055664, -0.0006242096424102783, -0.0006050467491149902, -0.0005858838558197021, -0.0005667209625244141, -0.000547558069229126, -0.0005283951759338379, -0.0005092322826385498, -0.0004900693893432617, -0.00047090649604797363, -0.00045174360275268555, -0.00043258070945739746, -0.0004134178161621094, -0.0003942549228668213, -0.0003750920295715332, -0.0003559291362762451, -0.00033676624298095703, -0.00031760334968566895, -0.00029844045639038086, -0.0002792775630950928, -0.0002601146697998047, -0.0002409517765045166, -0.00022178888320922852, -0.00020262598991394043, -0.00018346309661865234, -0.00016430020332336426, -0.00014513731002807617, -0.00012597441673278809, -0.0001068115234375, -8.764863014221191e-05, -6.848573684692383e-05, -4.932284355163574e-05, -3.0159950256347656e-05, -1.099705696105957e-05, 8.165836334228516e-06, 2.73287296295166e-05, 4.649162292480469e-05, 6.565451622009277e-05, 8.481740951538086e-05, 0.00010398030281066895, 0.00012314319610595703, 0.00014230608940124512, 0.0001614689826965332, 0.0001806318759918213, 0.00019979476928710938, 0.00021895766258239746, 0.00023812055587768555, 0.00025728344917297363, 0.0002764463424682617, 0.0002956092357635498, 0.0003147721290588379, 0.000333935022354126, 0.00035309791564941406, 0.00037226080894470215, 0.00039142370223999023, 0.0004105865955352783, 0.0004297494888305664, 0.0004489123821258545, 0.0004680752754211426, 0.00048723816871643066, 0.0005064010620117188]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 11.0, 16.0, 22.0, 19.0, 40.0, 40.0, 48.0, 67.0, 91.0, 131.0, 207.0, 361.0, 2757.0, 116888.0, 910897.0, 15287.0, 811.0, 252.0, 146.0, 112.0, 83.0, 71.0, 48.0, 38.0, 23.0, 20.0, 13.0, 10.0, 11.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00897979736328125, -0.008672833442687988, -0.008365869522094727, -0.008058905601501465, -0.007751941680908203, -0.007444977760314941, -0.00713801383972168, -0.006831049919128418, -0.006524085998535156, -0.0062171220779418945, -0.005910158157348633, -0.005603194236755371, -0.005296230316162109, -0.004989266395568848, -0.004682302474975586, -0.004375338554382324, -0.0040683746337890625, -0.0037614107131958008, -0.003454446792602539, -0.0031474828720092773, -0.0028405189514160156, -0.002533555030822754, -0.002226591110229492, -0.0019196271896362305, -0.0016126632690429688, -0.001305699348449707, -0.0009987354278564453, -0.0006917715072631836, -0.0003848075866699219, -7.784366607666016e-05, 0.00022912025451660156, 0.0005360841751098633, 0.000843048095703125, 0.0011500120162963867, 0.0014569759368896484, 0.0017639398574829102, 0.002070903778076172, 0.0023778676986694336, 0.0026848316192626953, 0.002991795539855957, 0.0032987594604492188, 0.0036057233810424805, 0.003912687301635742, 0.004219651222229004, 0.004526615142822266, 0.004833579063415527, 0.005140542984008789, 0.005447506904602051, 0.0057544708251953125, 0.006061434745788574, 0.006368398666381836, 0.006675362586975098, 0.006982326507568359, 0.007289290428161621, 0.007596254348754883, 0.007903218269348145, 0.008210182189941406, 0.008517146110534668, 0.00882411003112793, 0.009131073951721191, 0.009438037872314453, 0.009745001792907715, 0.010051965713500977, 0.010358929634094238, 0.0106658935546875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 25.0, 124.0, 718.0, 132.0, 17.0, 2.0], "bins": [-0.009489239193499088, -0.00933240819722414, -0.009175577200949192, -0.009018746204674244, -0.008861915208399296, -0.008705084212124348, -0.0085482532158494, -0.008391422219574451, -0.008234591223299503, -0.008077760227024555, -0.007920929230749607, -0.007764098234474659, -0.007607267238199711, -0.007450436241924763, -0.007293605245649815, -0.0071367742493748665, -0.006979943253099918, -0.00682311225682497, -0.006666281260550022, -0.006509450264275074, -0.006352619268000126, -0.006195788271725178, -0.00603895727545023, -0.0058821262791752815, -0.005725294817239046, -0.005568463820964098, -0.00541163282468915, -0.005254801828414202, -0.005097970832139254, -0.0049411398358643055, -0.004784308839589357, -0.004627477843314409, -0.004470646381378174, -0.004313815385103226, -0.004156984388828278, -0.0040001533925533295, -0.0038433223962783813, -0.0036864914000034332, -0.003529660403728485, -0.003372829407453537, -0.003215998411178589, -0.0030591674149036407, -0.0029023364186286926, -0.0027455054223537445, -0.0025886744260787964, -0.0024318434298038483, -0.0022750124335289, -0.002118181437253952, -0.001961350440979004, -0.0018045194447040558, -0.0016476884484291077, -0.0014908574521541595, -0.0013340264558792114, -0.0011771954596042633, -0.0010203643469139934, -0.0008635333506390452, -0.0007067023543640971, -0.000549871358089149, -0.0003930403327103704, -0.00023620930733159184, -7.937831105664372e-05, 7.74526852183044e-05, 0.00023428373970091343, 0.00039111473597586155, 0.0005479457322508097]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 9.0, 8.0, 14.0, 13.0, 26.0, 22.0, 32.0, 35.0, 41.0, 47.0, 47.0, 39.0, 44.0, 54.0, 73.0, 45.0, 37.0, 49.0, 49.0, 50.0, 42.0, 39.0, 33.0, 35.0, 20.0, 18.0, 20.0, 11.0, 11.0, 11.0, 10.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0007194876670837402, -0.0007006833329796791, -0.000681878998875618, -0.0006630746647715569, -0.0006442703306674957, -0.0006254659965634346, -0.0006066616624593735, -0.0005878573283553123, -0.0005690529942512512, -0.0005502486601471901, -0.000531444326043129, -0.0005126399919390678, -0.0004938356578350067, -0.0004750313237309456, -0.00045622698962688446, -0.00043742265552282333, -0.0004186183214187622, -0.0003998139873147011, -0.00038100965321063995, -0.0003622053191065788, -0.0003434009850025177, -0.0003245966508984566, -0.00030579231679439545, -0.0002869879826903343, -0.0002681836485862732, -0.00024937931448221207, -0.00023057498037815094, -0.0002117706462740898, -0.0001929663121700287, -0.00017416197806596756, -0.00015535764396190643, -0.0001365533098578453, -0.00011774897575378418, -9.894464164972305e-05, -8.014030754566193e-05, -6.13359734416008e-05, -4.253163933753967e-05, -2.3727305233478546e-05, -4.9229711294174194e-06, 1.3881362974643707e-05, 3.2685697078704834e-05, 5.149003118276596e-05, 7.029436528682709e-05, 8.909869939088821e-05, 0.00010790303349494934, 0.00012670736759901047, 0.0001455117017030716, 0.00016431603580713272, 0.00018312036991119385, 0.00020192470401525497, 0.0002207290381193161, 0.00023953337222337723, 0.00025833770632743835, 0.0002771420404314995, 0.0002959463745355606, 0.00031475070863962173, 0.00033355504274368286, 0.000352359376847744, 0.0003711637109518051, 0.00038996804505586624, 0.00040877237915992737, 0.0004275767132639885, 0.0004463810473680496, 0.00046518538147211075, 0.0004839897155761719]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 27.0, 18.0, 45.0, 58.0, 53.0, 82.0, 88.0, 82.0, 114.0, 93.0, 82.0, 60.0, 55.0, 41.0, 22.0, 15.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.475860595703125, -4.35406494140625, -4.232269287109375, -4.1104736328125, -3.988677978515625, -3.86688232421875, -3.745086669921875, -3.623291015625, -3.501495361328125, -3.37969970703125, -3.257904052734375, -3.1361083984375, -3.014312744140625, -2.89251708984375, -2.770721435546875, -2.64892578125, -2.527130126953125, -2.40533447265625, -2.283538818359375, -2.1617431640625, -2.039947509765625, -1.91815185546875, -1.796356201171875, -1.674560546875, -1.552764892578125, -1.43096923828125, -1.309173583984375, -1.1873779296875, -1.065582275390625, -0.94378662109375, -0.821990966796875, -0.7001953125, -0.578399658203125, -0.45660400390625, -0.334808349609375, -0.2130126953125, -0.091217041015625, 0.03057861328125, 0.152374267578125, 0.274169921875, 0.395965576171875, 0.51776123046875, 0.639556884765625, 0.7613525390625, 0.883148193359375, 1.00494384765625, 1.126739501953125, 1.24853515625, 1.370330810546875, 1.49212646484375, 1.613922119140625, 1.7357177734375, 1.857513427734375, 1.97930908203125, 2.101104736328125, 2.222900390625, 2.344696044921875, 2.46649169921875, 2.588287353515625, 2.7100830078125, 2.831878662109375, 2.95367431640625, 3.075469970703125, 3.197265625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 7.0, 10.0, 16.0, 20.0, 29.0, 39.0, 61.0, 67.0, 118.0, 193.0, 337.0, 631.0, 1442.0, 4534.0, 30392.0, 963706.0, 38597.0, 5169.0, 1607.0, 677.0, 311.0, 209.0, 121.0, 74.0, 65.0, 34.0, 21.0, 16.0, 13.0, 15.0, 2.0, 7.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.3125, -19.66845703125, -19.0244140625, -18.38037109375, -17.736328125, -17.09228515625, -16.4482421875, -15.80419921875, -15.16015625, -14.51611328125, -13.8720703125, -13.22802734375, -12.583984375, -11.93994140625, -11.2958984375, -10.65185546875, -10.0078125, -9.36376953125, -8.7197265625, -8.07568359375, -7.431640625, -6.78759765625, -6.1435546875, -5.49951171875, -4.85546875, -4.21142578125, -3.5673828125, -2.92333984375, -2.279296875, -1.63525390625, -0.9912109375, -0.34716796875, 0.296875, 0.94091796875, 1.5849609375, 2.22900390625, 2.873046875, 3.51708984375, 4.1611328125, 4.80517578125, 5.44921875, 6.09326171875, 6.7373046875, 7.38134765625, 8.025390625, 8.66943359375, 9.3134765625, 9.95751953125, 10.6015625, 11.24560546875, 11.8896484375, 12.53369140625, 13.177734375, 13.82177734375, 14.4658203125, 15.10986328125, 15.75390625, 16.39794921875, 17.0419921875, 17.68603515625, 18.330078125, 18.97412109375, 19.6181640625, 20.26220703125, 20.90625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 11.0, 15.0, 19.0, 24.0, 27.0, 32.0, 39.0, 39.0, 40.0, 55.0, 53.0, 68.0, 115.0, 1525.0, 428.0, 94.0, 73.0, 53.0, 43.0, 31.0, 38.0, 32.0, 37.0, 29.0, 31.0, 17.0, 15.0, 6.0, 9.0, 6.0, 4.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.263916015625, -7.95751953125, -7.651123046875, -7.3447265625, -7.038330078125, -6.73193359375, -6.425537109375, -6.119140625, -5.812744140625, -5.50634765625, -5.199951171875, -4.8935546875, -4.587158203125, -4.28076171875, -3.974365234375, -3.66796875, -3.361572265625, -3.05517578125, -2.748779296875, -2.4423828125, -2.135986328125, -1.82958984375, -1.523193359375, -1.216796875, -0.910400390625, -0.60400390625, -0.297607421875, 0.0087890625, 0.315185546875, 0.62158203125, 0.927978515625, 1.234375, 1.540771484375, 1.84716796875, 2.153564453125, 2.4599609375, 2.766357421875, 3.07275390625, 3.379150390625, 3.685546875, 3.991943359375, 4.29833984375, 4.604736328125, 4.9111328125, 5.217529296875, 5.52392578125, 5.830322265625, 6.13671875, 6.443115234375, 6.74951171875, 7.055908203125, 7.3623046875, 7.668701171875, 7.97509765625, 8.281494140625, 8.587890625, 8.894287109375, 9.20068359375, 9.507080078125, 9.8134765625, 10.119873046875, 10.42626953125, 10.732666015625, 11.0390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 9.0, 15.0, 29.0, 25.0, 38.0, 51.0, 95.0, 114.0, 152.0, 227.0, 322.0, 481.0, 793.0, 1115.0, 1794.0, 3169.0, 5695.0, 11830.0, 34838.0, 1505155.0, 1519298.0, 34436.0, 12048.0, 5615.0, 3086.0, 1868.0, 1133.0, 743.0, 476.0, 325.0, 214.0, 143.0, 102.0, 86.0, 41.0, 28.0, 27.0, 20.0, 15.0, 17.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.7109375, -14.2205810546875, -13.730224609375, -13.2398681640625, -12.74951171875, -12.2591552734375, -11.768798828125, -11.2784423828125, -10.7880859375, -10.2977294921875, -9.807373046875, -9.3170166015625, -8.82666015625, -8.3363037109375, -7.845947265625, -7.3555908203125, -6.865234375, -6.3748779296875, -5.884521484375, -5.3941650390625, -4.90380859375, -4.4134521484375, -3.923095703125, -3.4327392578125, -2.9423828125, -2.4520263671875, -1.961669921875, -1.4713134765625, -0.98095703125, -0.4906005859375, -0.000244140625, 0.4901123046875, 0.98046875, 1.4708251953125, 1.961181640625, 2.4515380859375, 2.94189453125, 3.4322509765625, 3.922607421875, 4.4129638671875, 4.9033203125, 5.3936767578125, 5.884033203125, 6.3743896484375, 6.86474609375, 7.3551025390625, 7.845458984375, 8.3358154296875, 8.826171875, 9.3165283203125, 9.806884765625, 10.2972412109375, 10.78759765625, 11.2779541015625, 11.768310546875, 12.2586669921875, 12.7490234375, 13.2393798828125, 13.729736328125, 14.2200927734375, 14.71044921875, 15.2008056640625, 15.691162109375, 16.1815185546875, 16.671875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 11.0, 19.0, 31.0, 42.0, 80.0, 133.0, 134.0, 154.0, 144.0, 96.0, 64.0, 43.0, 17.0, 11.0, 12.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.64273452758789, -54.412296295166016, -53.18185806274414, -51.951419830322266, -50.72098159790039, -49.490543365478516, -48.26010513305664, -47.0296630859375, -45.799224853515625, -44.56878662109375, -43.338348388671875, -42.10791015625, -40.877471923828125, -39.64703369140625, -38.416595458984375, -37.1861572265625, -35.955718994140625, -34.72528076171875, -33.494842529296875, -32.264404296875, -31.033966064453125, -29.80352783203125, -28.573087692260742, -27.342649459838867, -26.112211227416992, -24.881772994995117, -23.651334762573242, -22.420896530151367, -21.19045639038086, -19.960018157958984, -18.72957992553711, -17.499141693115234, -16.268707275390625, -15.03826904296875, -13.807830810546875, -12.577391624450684, -11.346953392028809, -10.116515159606934, -8.886075973510742, -7.655637741088867, -6.425199508666992, -5.194761276245117, -3.964322566986084, -2.73388409614563, -1.5034456253051758, -0.2730073928833008, 0.9574313163757324, 2.1878700256347656, 3.4183082580566406, 4.648746490478516, 5.879185199737549, 7.109623908996582, 8.340062141418457, 9.570500373840332, 10.800939559936523, 12.031377792358398, 13.261816024780273, 14.492254257202148, 15.722692489624023, 16.9531307220459, 18.183570861816406, 19.41400909423828, 20.644447326660156, 21.87488555908203, 23.105323791503906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 13.0, 15.0, 13.0, 16.0, 17.0, 26.0, 21.0, 26.0, 33.0, 27.0, 39.0, 41.0, 51.0, 48.0, 43.0, 46.0, 51.0, 41.0, 46.0, 42.0, 41.0, 41.0, 40.0, 31.0, 25.0, 28.0, 26.0, 18.0, 17.0, 13.0, 7.0, 10.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.903656005859375, -33.89384078979492, -32.88402557373047, -31.874210357666016, -30.864395141601562, -29.85457992553711, -28.844764709472656, -27.834949493408203, -26.82513427734375, -25.815319061279297, -24.805503845214844, -23.79568862915039, -22.785873413085938, -21.776058197021484, -20.76624298095703, -19.756427764892578, -18.746612548828125, -17.736797332763672, -16.72698211669922, -15.717166900634766, -14.707351684570312, -13.69753646850586, -12.687721252441406, -11.677906036376953, -10.6680908203125, -9.658275604248047, -8.648460388183594, -7.638645172119141, -6.6288299560546875, -5.619014739990234, -4.609199523925781, -3.599384307861328, -2.5895729064941406, -1.5797576904296875, -0.5699424743652344, 0.43987274169921875, 1.4496879577636719, 2.459503173828125, 3.469318389892578, 4.479133605957031, 5.488948822021484, 6.4987640380859375, 7.508579254150391, 8.518394470214844, 9.528209686279297, 10.53802490234375, 11.547840118408203, 12.557655334472656, 13.56747055053711, 14.577285766601562, 15.587100982666016, 16.59691619873047, 17.606731414794922, 18.616546630859375, 19.626361846923828, 20.63617706298828, 21.645992279052734, 22.655807495117188, 23.66562271118164, 24.675437927246094, 25.685253143310547, 26.695068359375, 27.704883575439453, 28.714698791503906, 29.72451400756836]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 2.0, 4.0, 3.0, 14.0, 15.0, 16.0, 25.0, 39.0, 61.0, 65.0, 66.0, 76.0, 93.0, 95.0, 105.0, 78.0, 57.0, 57.0, 43.0, 32.0, 22.0, 13.0, 4.0, 10.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.69921875, -4.575408935546875, -4.45159912109375, -4.327789306640625, -4.2039794921875, -4.080169677734375, -3.95635986328125, -3.832550048828125, -3.708740234375, -3.584930419921875, -3.46112060546875, -3.337310791015625, -3.2135009765625, -3.089691162109375, -2.96588134765625, -2.842071533203125, -2.71826171875, -2.594451904296875, -2.47064208984375, -2.346832275390625, -2.2230224609375, -2.099212646484375, -1.97540283203125, -1.851593017578125, -1.727783203125, -1.603973388671875, -1.48016357421875, -1.356353759765625, -1.2325439453125, -1.108734130859375, -0.98492431640625, -0.861114501953125, -0.7373046875, -0.613494873046875, -0.48968505859375, -0.365875244140625, -0.2420654296875, -0.118255615234375, 0.00555419921875, 0.129364013671875, 0.253173828125, 0.376983642578125, 0.50079345703125, 0.624603271484375, 0.7484130859375, 0.872222900390625, 0.99603271484375, 1.119842529296875, 1.24365234375, 1.367462158203125, 1.49127197265625, 1.615081787109375, 1.7388916015625, 1.862701416015625, 1.98651123046875, 2.110321044921875, 2.234130859375, 2.357940673828125, 2.48175048828125, 2.605560302734375, 2.7293701171875, 2.853179931640625, 2.97698974609375, 3.100799560546875, 3.224609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 7.0, 7.0, 14.0, 13.0, 17.0, 37.0, 61.0, 83.0, 159.0, 299.0, 699.0, 1837.0, 6508.0, 96907.0, 4005432.0, 74292.0, 5363.0, 1507.0, 524.0, 249.0, 117.0, 47.0, 28.0, 24.0, 12.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.90625, -24.241455078125, -23.57666015625, -22.911865234375, -22.2470703125, -21.582275390625, -20.91748046875, -20.252685546875, -19.587890625, -18.923095703125, -18.25830078125, -17.593505859375, -16.9287109375, -16.263916015625, -15.59912109375, -14.934326171875, -14.26953125, -13.604736328125, -12.93994140625, -12.275146484375, -11.6103515625, -10.945556640625, -10.28076171875, -9.615966796875, -8.951171875, -8.286376953125, -7.62158203125, -6.956787109375, -6.2919921875, -5.627197265625, -4.96240234375, -4.297607421875, -3.6328125, -2.968017578125, -2.30322265625, -1.638427734375, -0.9736328125, -0.308837890625, 0.35595703125, 1.020751953125, 1.685546875, 2.350341796875, 3.01513671875, 3.679931640625, 4.3447265625, 5.009521484375, 5.67431640625, 6.339111328125, 7.00390625, 7.668701171875, 8.33349609375, 8.998291015625, 9.6630859375, 10.327880859375, 10.99267578125, 11.657470703125, 12.322265625, 12.987060546875, 13.65185546875, 14.316650390625, 14.9814453125, 15.646240234375, 16.31103515625, 16.975830078125, 17.640625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 10.0, 7.0, 14.0, 25.0, 33.0, 55.0, 85.0, 135.0, 247.0, 431.0, 693.0, 856.0, 612.0, 347.0, 170.0, 133.0, 59.0, 42.0, 28.0, 26.0, 12.0, 13.0, 9.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.8828125, -10.5828857421875, -10.282958984375, -9.9830322265625, -9.68310546875, -9.3831787109375, -9.083251953125, -8.7833251953125, -8.4833984375, -8.1834716796875, -7.883544921875, -7.5836181640625, -7.28369140625, -6.9837646484375, -6.683837890625, -6.3839111328125, -6.083984375, -5.7840576171875, -5.484130859375, -5.1842041015625, -4.88427734375, -4.5843505859375, -4.284423828125, -3.9844970703125, -3.6845703125, -3.3846435546875, -3.084716796875, -2.7847900390625, -2.48486328125, -2.1849365234375, -1.885009765625, -1.5850830078125, -1.28515625, -0.9852294921875, -0.685302734375, -0.3853759765625, -0.08544921875, 0.2144775390625, 0.514404296875, 0.8143310546875, 1.1142578125, 1.4141845703125, 1.714111328125, 2.0140380859375, 2.31396484375, 2.6138916015625, 2.913818359375, 3.2137451171875, 3.513671875, 3.8135986328125, 4.113525390625, 4.4134521484375, 4.71337890625, 5.0133056640625, 5.313232421875, 5.6131591796875, 5.9130859375, 6.2130126953125, 6.512939453125, 6.8128662109375, 7.11279296875, 7.4127197265625, 7.712646484375, 8.0125732421875, 8.3125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 18.0, 38.0, 51.0, 107.0, 183.0, 437.0, 1020.0, 3145.0, 13224.0, 94850.0, 3195490.0, 835558.0, 39554.0, 7246.0, 1990.0, 740.0, 286.0, 163.0, 71.0, 44.0, 19.0, 14.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.88330078125, -19.1416015625, -18.39990234375, -17.658203125, -16.91650390625, -16.1748046875, -15.43310546875, -14.69140625, -13.94970703125, -13.2080078125, -12.46630859375, -11.724609375, -10.98291015625, -10.2412109375, -9.49951171875, -8.7578125, -8.01611328125, -7.2744140625, -6.53271484375, -5.791015625, -5.04931640625, -4.3076171875, -3.56591796875, -2.82421875, -2.08251953125, -1.3408203125, -0.59912109375, 0.142578125, 0.88427734375, 1.6259765625, 2.36767578125, 3.109375, 3.85107421875, 4.5927734375, 5.33447265625, 6.076171875, 6.81787109375, 7.5595703125, 8.30126953125, 9.04296875, 9.78466796875, 10.5263671875, 11.26806640625, 12.009765625, 12.75146484375, 13.4931640625, 14.23486328125, 14.9765625, 15.71826171875, 16.4599609375, 17.20166015625, 17.943359375, 18.68505859375, 19.4267578125, 20.16845703125, 20.91015625, 21.65185546875, 22.3935546875, 23.13525390625, 23.876953125, 24.61865234375, 25.3603515625, 26.10205078125, 26.84375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 13.0, 13.0, 30.0, 58.0, 76.0, 124.0, 184.0, 156.0, 114.0, 94.0, 61.0, 34.0, 23.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-84.50379943847656, -82.74308776855469, -80.98237609863281, -79.22166442871094, -77.46095275878906, -75.70024108886719, -73.93952941894531, -72.17881774902344, -70.41810607910156, -68.65739440917969, -66.89668273925781, -65.13597106933594, -63.37525939941406, -61.61454772949219, -59.85383605957031, -58.09312438964844, -56.33241653442383, -54.57170486450195, -52.81099319458008, -51.0502815246582, -49.28956985473633, -47.52885818481445, -45.768150329589844, -44.00743865966797, -42.246726989746094, -40.48601531982422, -38.725303649902344, -36.96459197998047, -35.203880310058594, -33.44316864013672, -31.682458877563477, -29.9217472076416, -28.16103744506836, -26.400325775146484, -24.63961410522461, -22.878902435302734, -21.11819076538086, -19.357479095458984, -17.596769332885742, -15.836057662963867, -14.075345993041992, -12.314634323120117, -10.553922653198242, -8.793211936950684, -7.032500267028809, -5.271788597106934, -3.511077880859375, -1.7503662109375, 0.010345458984375, 1.771056890487671, 3.531768321990967, 5.292479515075684, 7.053191184997559, 8.813902854919434, 10.574613571166992, 12.335325241088867, 14.096036911010742, 15.856748580932617, 17.617460250854492, 19.378170013427734, 21.13888168334961, 22.899593353271484, 24.66030502319336, 26.421016693115234, 28.18172836303711]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 7.0, 4.0, 14.0, 7.0, 11.0, 6.0, 18.0, 22.0, 15.0, 20.0, 29.0, 22.0, 26.0, 27.0, 32.0, 37.0, 41.0, 38.0, 27.0, 43.0, 35.0, 40.0, 43.0, 37.0, 34.0, 34.0, 29.0, 31.0, 33.0, 25.0, 27.0, 24.0, 24.0, 26.0, 14.0, 15.0, 13.0, 11.0, 7.0, 7.0, 4.0, 3.0, 5.0, 5.0, 6.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.42793083190918, -20.758066177368164, -20.08820343017578, -19.418338775634766, -18.74847412109375, -18.078609466552734, -17.40874481201172, -16.738882064819336, -16.06901741027832, -15.399152755737305, -14.729289054870605, -14.059425354003906, -13.38956069946289, -12.719696044921875, -12.049832344055176, -11.379968643188477, -10.710103988647461, -10.040239334106445, -9.370375633239746, -8.700511932373047, -8.030647277832031, -7.360783100128174, -6.690918922424316, -6.021054744720459, -5.351190567016602, -4.681326389312744, -4.011462211608887, -3.3415980339050293, -2.671733856201172, -2.0018696784973145, -1.332005500793457, -0.6621413230895996, 0.007724761962890625, 0.677588939666748, 1.3474531173706055, 2.017317295074463, 2.6871814727783203, 3.3570456504821777, 4.026909828186035, 4.696774005889893, 5.36663818359375, 6.036502361297607, 6.706366539001465, 7.376230716705322, 8.04609489440918, 8.715959548950195, 9.385823249816895, 10.055686950683594, 10.72555160522461, 11.395416259765625, 12.065279960632324, 12.735143661499023, 13.405008316040039, 14.074872970581055, 14.744736671447754, 15.414600372314453, 16.08446502685547, 16.754329681396484, 17.4241943359375, 18.094057083129883, 18.7639217376709, 19.433786392211914, 20.103649139404297, 20.773513793945312, 21.443378448486328]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 7.0, 15.0, 24.0, 24.0, 32.0, 40.0, 58.0, 72.0, 59.0, 76.0, 90.0, 94.0, 97.0, 83.0, 46.0, 46.0, 40.0, 39.0, 17.0, 18.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.411529541015625, -4.28790283203125, -4.164276123046875, -4.0406494140625, -3.917022705078125, -3.79339599609375, -3.669769287109375, -3.546142578125, -3.422515869140625, -3.29888916015625, -3.175262451171875, -3.0516357421875, -2.928009033203125, -2.80438232421875, -2.680755615234375, -2.55712890625, -2.433502197265625, -2.30987548828125, -2.186248779296875, -2.0626220703125, -1.938995361328125, -1.81536865234375, -1.691741943359375, -1.568115234375, -1.444488525390625, -1.32086181640625, -1.197235107421875, -1.0736083984375, -0.949981689453125, -0.82635498046875, -0.702728271484375, -0.5791015625, -0.455474853515625, -0.33184814453125, -0.208221435546875, -0.0845947265625, 0.039031982421875, 0.16265869140625, 0.286285400390625, 0.409912109375, 0.533538818359375, 0.65716552734375, 0.780792236328125, 0.9044189453125, 1.028045654296875, 1.15167236328125, 1.275299072265625, 1.39892578125, 1.522552490234375, 1.64617919921875, 1.769805908203125, 1.8934326171875, 2.017059326171875, 2.14068603515625, 2.264312744140625, 2.387939453125, 2.511566162109375, 2.63519287109375, 2.758819580078125, 2.8824462890625, 3.006072998046875, 3.12969970703125, 3.253326416015625, 3.376953125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 3.0, 10.0, 20.0, 21.0, 25.0, 29.0, 57.0, 53.0, 88.0, 124.0, 179.0, 279.0, 403.0, 671.0, 1225.0, 2010.0, 3796.0, 7847.0, 17281.0, 44677.0, 138797.0, 525159.0, 203253.0, 59786.0, 22540.0, 9532.0, 4663.0, 2418.0, 1393.0, 772.0, 495.0, 290.0, 182.0, 139.0, 89.0, 64.0, 40.0, 36.0, 23.0, 18.0, 13.0, 14.0, 9.0, 4.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.240478515625, -0.23332977294921875, -0.2261810302734375, -0.21903228759765625, -0.211883544921875, -0.20473480224609375, -0.1975860595703125, -0.19043731689453125, -0.18328857421875, -0.17613983154296875, -0.1689910888671875, -0.16184234619140625, -0.154693603515625, -0.14754486083984375, -0.1403961181640625, -0.13324737548828125, -0.1260986328125, -0.11894989013671875, -0.1118011474609375, -0.10465240478515625, -0.097503662109375, -0.09035491943359375, -0.0832061767578125, -0.07605743408203125, -0.06890869140625, -0.06175994873046875, -0.0546112060546875, -0.04746246337890625, -0.040313720703125, -0.03316497802734375, -0.0260162353515625, -0.01886749267578125, -0.01171875, -0.00457000732421875, 0.0025787353515625, 0.00972747802734375, 0.016876220703125, 0.02402496337890625, 0.0311737060546875, 0.03832244873046875, 0.04547119140625, 0.05261993408203125, 0.0597686767578125, 0.06691741943359375, 0.074066162109375, 0.08121490478515625, 0.0883636474609375, 0.09551239013671875, 0.1026611328125, 0.10980987548828125, 0.1169586181640625, 0.12410736083984375, 0.131256103515625, 0.13840484619140625, 0.1455535888671875, 0.15270233154296875, 0.15985107421875, 0.16699981689453125, 0.1741485595703125, 0.18129730224609375, 0.188446044921875, 0.19559478759765625, 0.2027435302734375, 0.20989227294921875, 0.217041015625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 6.0, 7.0, 5.0, 12.0, 12.0, 10.0, 15.0, 20.0, 29.0, 17.0, 21.0, 25.0, 33.0, 31.0, 43.0, 39.0, 30.0, 44.0, 37.0, 37.0, 1065.0, 43.0, 36.0, 27.0, 41.0, 29.0, 33.0, 26.0, 37.0, 30.0, 31.0, 20.0, 14.0, 14.0, 12.0, 16.0, 19.0, 8.0, 11.0, 7.0, 8.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 3.0], "bins": [-2.37109375, -2.306365966796875, -2.24163818359375, -2.176910400390625, -2.1121826171875, -2.047454833984375, -1.98272705078125, -1.917999267578125, -1.853271484375, -1.788543701171875, -1.72381591796875, -1.659088134765625, -1.5943603515625, -1.529632568359375, -1.46490478515625, -1.400177001953125, -1.33544921875, -1.270721435546875, -1.20599365234375, -1.141265869140625, -1.0765380859375, -1.011810302734375, -0.94708251953125, -0.882354736328125, -0.817626953125, -0.752899169921875, -0.68817138671875, -0.623443603515625, -0.5587158203125, -0.493988037109375, -0.42926025390625, -0.364532470703125, -0.2998046875, -0.235076904296875, -0.17034912109375, -0.105621337890625, -0.0408935546875, 0.023834228515625, 0.08856201171875, 0.153289794921875, 0.218017578125, 0.282745361328125, 0.34747314453125, 0.412200927734375, 0.4769287109375, 0.541656494140625, 0.60638427734375, 0.671112060546875, 0.73583984375, 0.800567626953125, 0.86529541015625, 0.930023193359375, 0.9947509765625, 1.059478759765625, 1.12420654296875, 1.188934326171875, 1.253662109375, 1.318389892578125, 1.38311767578125, 1.447845458984375, 1.5125732421875, 1.577301025390625, 1.64202880859375, 1.706756591796875, 1.771484375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 21.0, 26.0, 46.0, 62.0, 86.0, 154.0, 187.0, 273.0, 386.0, 636.0, 856.0, 1265.0, 1759.0, 2592.0, 3679.0, 5478.0, 7793.0, 11582.0, 17032.0, 25270.0, 38769.0, 61189.0, 106291.0, 500531.0, 1020267.0, 108500.0, 62384.0, 39418.0, 25781.0, 17375.0, 11576.0, 8016.0, 5388.0, 3788.0, 2669.0, 1837.0, 1277.0, 905.0, 613.0, 433.0, 275.0, 220.0, 131.0, 112.0, 69.0, 48.0, 32.0, 17.0, 10.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04815673828125, -0.046604156494140625, -0.04505157470703125, -0.043498992919921875, -0.0419464111328125, -0.040393829345703125, -0.03884124755859375, -0.037288665771484375, -0.035736083984375, -0.034183502197265625, -0.03263092041015625, -0.031078338623046875, -0.0295257568359375, -0.027973175048828125, -0.02642059326171875, -0.024868011474609375, -0.0233154296875, -0.021762847900390625, -0.02021026611328125, -0.018657684326171875, -0.0171051025390625, -0.015552520751953125, -0.01399993896484375, -0.012447357177734375, -0.010894775390625, -0.009342193603515625, -0.00778961181640625, -0.006237030029296875, -0.0046844482421875, -0.003131866455078125, -0.00157928466796875, -2.6702880859375e-05, 0.00152587890625, 0.003078460693359375, 0.00463104248046875, 0.006183624267578125, 0.0077362060546875, 0.009288787841796875, 0.01084136962890625, 0.012393951416015625, 0.013946533203125, 0.015499114990234375, 0.01705169677734375, 0.018604278564453125, 0.0201568603515625, 0.021709442138671875, 0.02326202392578125, 0.024814605712890625, 0.0263671875, 0.027919769287109375, 0.02947235107421875, 0.031024932861328125, 0.0325775146484375, 0.034130096435546875, 0.03568267822265625, 0.037235260009765625, 0.038787841796875, 0.040340423583984375, 0.04189300537109375, 0.043445587158203125, 0.0449981689453125, 0.046550750732421875, 0.04810333251953125, 0.049655914306640625, 0.05120849609375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 6.0, 6.0, 14.0, 13.0, 18.0, 14.0, 19.0, 27.0, 42.0, 51.0, 47.0, 64.0, 73.0, 104.0, 91.0, 72.0, 50.0, 40.0, 32.0, 25.0, 19.0, 22.0, 17.0, 12.0, 12.0, 6.0, 8.0, 9.0, 9.0, 3.0, 2.0, 8.0, 4.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002772808074951172, -0.00026794523000717163, -0.0002586096525192261, -0.0002492740750312805, -0.00023993849754333496, -0.0002306029200553894, -0.00022126734256744385, -0.0002119317650794983, -0.00020259618759155273, -0.00019326061010360718, -0.00018392503261566162, -0.00017458945512771606, -0.0001652538776397705, -0.00015591830015182495, -0.0001465827226638794, -0.00013724714517593384, -0.00012791156768798828, -0.00011857599020004272, -0.00010924041271209717, -9.990483522415161e-05, -9.056925773620605e-05, -8.12336802482605e-05, -7.189810276031494e-05, -6.256252527236938e-05, -5.322694778442383e-05, -4.389137029647827e-05, -3.4555792808532715e-05, -2.5220215320587158e-05, -1.58846378326416e-05, -6.549060344696045e-06, 2.7865171432495117e-06, 1.2122094631195068e-05, 2.1457672119140625e-05, 3.079324960708618e-05, 4.012882709503174e-05, 4.9464404582977295e-05, 5.879998207092285e-05, 6.813555955886841e-05, 7.747113704681396e-05, 8.680671453475952e-05, 9.614229202270508e-05, 0.00010547786951065063, 0.00011481344699859619, 0.00012414902448654175, 0.0001334846019744873, 0.00014282017946243286, 0.00015215575695037842, 0.00016149133443832397, 0.00017082691192626953, 0.0001801624894142151, 0.00018949806690216064, 0.0001988336443901062, 0.00020816922187805176, 0.00021750479936599731, 0.00022684037685394287, 0.00023617595434188843, 0.000245511531829834, 0.00025484710931777954, 0.0002641826868057251, 0.00027351826429367065, 0.0002828538417816162, 0.00029218941926956177, 0.0003015249967575073, 0.0003108605742454529, 0.00032019615173339844]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 8.0, 4.0, 4.0, 10.0, 3.0, 11.0, 9.0, 13.0, 18.0, 26.0, 23.0, 27.0, 30.0, 59.0, 58.0, 83.0, 139.0, 451.0, 2049.0, 12369.0, 102900.0, 801416.0, 112272.0, 13293.0, 2185.0, 511.0, 163.0, 95.0, 62.0, 42.0, 37.0, 34.0, 31.0, 23.0, 20.0, 14.0, 14.0, 12.0, 6.0, 7.0, 7.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.005462646484375, -0.005304396152496338, -0.005146145820617676, -0.004987895488739014, -0.0048296451568603516, -0.0046713948249816895, -0.004513144493103027, -0.004354894161224365, -0.004196643829345703, -0.004038393497467041, -0.003880143165588379, -0.003721892833709717, -0.0035636425018310547, -0.0034053921699523926, -0.0032471418380737305, -0.0030888915061950684, -0.0029306411743164062, -0.002772390842437744, -0.002614140510559082, -0.00245589017868042, -0.002297639846801758, -0.0021393895149230957, -0.0019811391830444336, -0.0018228888511657715, -0.0016646385192871094, -0.0015063881874084473, -0.0013481378555297852, -0.001189887523651123, -0.001031637191772461, -0.0008733868598937988, -0.0007151365280151367, -0.0005568861961364746, -0.0003986358642578125, -0.0002403855323791504, -8.213520050048828e-05, 7.611513137817383e-05, 0.00023436546325683594, 0.00039261579513549805, 0.0005508661270141602, 0.0007091164588928223, 0.0008673667907714844, 0.0010256171226501465, 0.0011838674545288086, 0.0013421177864074707, 0.0015003681182861328, 0.001658618450164795, 0.001816868782043457, 0.001975119113922119, 0.0021333694458007812, 0.0022916197776794434, 0.0024498701095581055, 0.0026081204414367676, 0.0027663707733154297, 0.002924621105194092, 0.003082871437072754, 0.003241121768951416, 0.003399372100830078, 0.0035576224327087402, 0.0037158727645874023, 0.0038741230964660645, 0.0040323734283447266, 0.004190623760223389, 0.004348874092102051, 0.004507124423980713, 0.004665374755859375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 22.0, 95.0, 614.0, 234.0, 36.0, 9.0], "bins": [-0.008506637066602707, -0.008366578258574009, -0.008226520381867886, -0.008086461573839188, -0.00794640276581049, -0.007806344889104366, -0.007666286081075668, -0.007526227738708258, -0.007386169396340847, -0.007246111053973436, -0.007106052245944738, -0.006965993903577328, -0.006825935561209917, -0.006685877218842506, -0.0065458184108138084, -0.006405760068446398, -0.006265701726078987, -0.0061256433837115765, -0.0059855845756828785, -0.005845526233315468, -0.005705467890948057, -0.0055654095485806465, -0.0054253507405519485, -0.005285292398184538, -0.00514523359015584, -0.005005175247788429, -0.004865116439759731, -0.004725058097392321, -0.00458499975502491, -0.004444941412657499, -0.004304882604628801, -0.004164824262261391, -0.004024765454232693, -0.0038847068790346384, -0.0037446485366672277, -0.0036045899614691734, -0.0034645316191017628, -0.0033244730439037085, -0.003184414468705654, -0.0030443561263382435, -0.002904297783970833, -0.0027642392087727785, -0.002624180866405368, -0.0024841222912073135, -0.002344063948839903, -0.0022040053736418486, -0.0020639467984437943, -0.0019238884560763836, -0.001783830113708973, -0.0016437716549262404, -0.001503713196143508, -0.0013636546209454536, -0.001223596278578043, -0.0010835377033799887, -0.0009434792445972562, -0.0008034207858145237, -0.0006633622688241303, -0.0005233038100413978, -0.00038324532215483487, -0.00024318683426827192, -0.00010312837548553944, 3.693008329719305e-05, 0.00017698860028758645, 0.00031704705907031894, 0.0004571055178530514]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 7.0, 11.0, 9.0, 11.0, 17.0, 23.0, 30.0, 31.0, 39.0, 40.0, 53.0, 39.0, 57.0, 60.0, 59.0, 47.0, 60.0, 47.0, 51.0, 51.0, 40.0, 34.0, 38.0, 33.0, 24.0, 17.0, 17.0, 11.0, 11.0, 10.0, 6.0, 4.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042742490768432617, -0.00041339173913002014, -0.0003993585705757141, -0.0003853254020214081, -0.00037129223346710205, -0.000357259064912796, -0.00034322589635849, -0.00032919272780418396, -0.00031515955924987793, -0.0003011263906955719, -0.00028709322214126587, -0.00027306005358695984, -0.0002590268850326538, -0.0002449937164783478, -0.00023096054792404175, -0.00021692737936973572, -0.0002028942108154297, -0.00018886104226112366, -0.00017482787370681763, -0.0001607947051525116, -0.00014676153659820557, -0.00013272836804389954, -0.0001186951994895935, -0.00010466203093528748, -9.062886238098145e-05, -7.659569382667542e-05, -6.256252527236938e-05, -4.8529356718063354e-05, -3.4496188163757324e-05, -2.0463019609451294e-05, -6.429851055145264e-06, 7.603317499160767e-06, 2.1636486053466797e-05, 3.566965460777283e-05, 4.970282316207886e-05, 6.373599171638489e-05, 7.776916027069092e-05, 9.180232882499695e-05, 0.00010583549737930298, 0.00011986866593360901, 0.00013390183448791504, 0.00014793500304222107, 0.0001619681715965271, 0.00017600134015083313, 0.00019003450870513916, 0.0002040676772594452, 0.00021810084581375122, 0.00023213401436805725, 0.0002461671829223633, 0.0002602003514766693, 0.00027423352003097534, 0.00028826668858528137, 0.0003022998571395874, 0.00031633302569389343, 0.00033036619424819946, 0.0003443993628025055, 0.0003584325313568115, 0.00037246569991111755, 0.0003864988684654236, 0.0004005320370197296, 0.00041456520557403564, 0.0004285983741283417, 0.0004426315426826477, 0.00045666471123695374, 0.00047069787979125977]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 7.0, 15.0, 24.0, 24.0, 32.0, 40.0, 58.0, 72.0, 59.0, 76.0, 90.0, 94.0, 96.0, 84.0, 46.0, 46.0, 40.0, 39.0, 17.0, 18.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.411529541015625, -4.28790283203125, -4.164276123046875, -4.0406494140625, -3.917022705078125, -3.79339599609375, -3.669769287109375, -3.546142578125, -3.422515869140625, -3.29888916015625, -3.175262451171875, -3.0516357421875, -2.928009033203125, -2.80438232421875, -2.680755615234375, -2.55712890625, -2.433502197265625, -2.30987548828125, -2.186248779296875, -2.0626220703125, -1.938995361328125, -1.81536865234375, -1.691741943359375, -1.568115234375, -1.444488525390625, -1.32086181640625, -1.197235107421875, -1.0736083984375, -0.949981689453125, -0.82635498046875, -0.702728271484375, -0.5791015625, -0.455474853515625, -0.33184814453125, -0.208221435546875, -0.0845947265625, 0.039031982421875, 0.16265869140625, 0.286285400390625, 0.409912109375, 0.533538818359375, 0.65716552734375, 0.780792236328125, 0.9044189453125, 1.028045654296875, 1.15167236328125, 1.275299072265625, 1.39892578125, 1.522552490234375, 1.64617919921875, 1.769805908203125, 1.8934326171875, 2.017059326171875, 2.14068603515625, 2.264312744140625, 2.387939453125, 2.511566162109375, 2.63519287109375, 2.758819580078125, 2.8824462890625, 3.006072998046875, 3.12969970703125, 3.253326416015625, 3.376953125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 7.0, 15.0, 21.0, 32.0, 54.0, 85.0, 179.0, 295.0, 718.0, 1860.0, 5351.0, 17245.0, 62183.0, 316640.0, 513875.0, 93705.0, 24646.0, 7389.0, 2457.0, 916.0, 392.0, 206.0, 105.0, 54.0, 37.0, 24.0, 15.0, 13.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.83734130859375, -3.7215576171875, -3.60577392578125, -3.489990234375, -3.37420654296875, -3.2584228515625, -3.14263916015625, -3.02685546875, -2.91107177734375, -2.7952880859375, -2.67950439453125, -2.563720703125, -2.44793701171875, -2.3321533203125, -2.21636962890625, -2.1005859375, -1.98480224609375, -1.8690185546875, -1.75323486328125, -1.637451171875, -1.52166748046875, -1.4058837890625, -1.29010009765625, -1.17431640625, -1.05853271484375, -0.9427490234375, -0.82696533203125, -0.711181640625, -0.59539794921875, -0.4796142578125, -0.36383056640625, -0.248046875, -0.13226318359375, -0.0164794921875, 0.09930419921875, 0.215087890625, 0.33087158203125, 0.4466552734375, 0.56243896484375, 0.67822265625, 0.79400634765625, 0.9097900390625, 1.02557373046875, 1.141357421875, 1.25714111328125, 1.3729248046875, 1.48870849609375, 1.6044921875, 1.72027587890625, 1.8360595703125, 1.95184326171875, 2.067626953125, 2.18341064453125, 2.2991943359375, 2.41497802734375, 2.53076171875, 2.64654541015625, 2.7623291015625, 2.87811279296875, 2.993896484375, 3.10968017578125, 3.2254638671875, 3.34124755859375, 3.45703125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 4.0, 9.0, 15.0, 15.0, 13.0, 18.0, 20.0, 14.0, 29.0, 30.0, 30.0, 33.0, 42.0, 34.0, 51.0, 64.0, 74.0, 183.0, 1624.0, 203.0, 108.0, 60.0, 56.0, 35.0, 32.0, 48.0, 28.0, 25.0, 25.0, 23.0, 20.0, 13.0, 14.0, 17.0, 5.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.238525390625, -7.96923828125, -7.699951171875, -7.4306640625, -7.161376953125, -6.89208984375, -6.622802734375, -6.353515625, -6.084228515625, -5.81494140625, -5.545654296875, -5.2763671875, -5.007080078125, -4.73779296875, -4.468505859375, -4.19921875, -3.929931640625, -3.66064453125, -3.391357421875, -3.1220703125, -2.852783203125, -2.58349609375, -2.314208984375, -2.044921875, -1.775634765625, -1.50634765625, -1.237060546875, -0.9677734375, -0.698486328125, -0.42919921875, -0.159912109375, 0.109375, 0.378662109375, 0.64794921875, 0.917236328125, 1.1865234375, 1.455810546875, 1.72509765625, 1.994384765625, 2.263671875, 2.532958984375, 2.80224609375, 3.071533203125, 3.3408203125, 3.610107421875, 3.87939453125, 4.148681640625, 4.41796875, 4.687255859375, 4.95654296875, 5.225830078125, 5.4951171875, 5.764404296875, 6.03369140625, 6.302978515625, 6.572265625, 6.841552734375, 7.11083984375, 7.380126953125, 7.6494140625, 7.918701171875, 8.18798828125, 8.457275390625, 8.7265625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 12.0, 18.0, 20.0, 30.0, 27.0, 27.0, 41.0, 63.0, 103.0, 236.0, 503.0, 1141.0, 3422.0, 19290.0, 520523.0, 2549225.0, 42533.0, 5497.0, 1652.0, 585.0, 244.0, 146.0, 81.0, 53.0, 43.0, 28.0, 21.0, 19.0, 21.0, 15.0, 16.0, 11.0, 12.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.6343994140625, -11.260986328125, -10.8875732421875, -10.51416015625, -10.1407470703125, -9.767333984375, -9.3939208984375, -9.0205078125, -8.6470947265625, -8.273681640625, -7.9002685546875, -7.52685546875, -7.1534423828125, -6.780029296875, -6.4066162109375, -6.033203125, -5.6597900390625, -5.286376953125, -4.9129638671875, -4.53955078125, -4.1661376953125, -3.792724609375, -3.4193115234375, -3.0458984375, -2.6724853515625, -2.299072265625, -1.9256591796875, -1.55224609375, -1.1788330078125, -0.805419921875, -0.4320068359375, -0.05859375, 0.3148193359375, 0.688232421875, 1.0616455078125, 1.43505859375, 1.8084716796875, 2.181884765625, 2.5552978515625, 2.9287109375, 3.3021240234375, 3.675537109375, 4.0489501953125, 4.42236328125, 4.7957763671875, 5.169189453125, 5.5426025390625, 5.916015625, 6.2894287109375, 6.662841796875, 7.0362548828125, 7.40966796875, 7.7830810546875, 8.156494140625, 8.5299072265625, 8.9033203125, 9.2767333984375, 9.650146484375, 10.0235595703125, 10.39697265625, 10.7703857421875, 11.143798828125, 11.5172119140625, 11.890625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 16.0, 38.0, 78.0, 155.0, 170.0, 205.0, 147.0, 108.0, 58.0, 20.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.738855361938477, -27.924104690551758, -27.10935401916504, -26.29460334777832, -25.4798526763916, -24.665102005004883, -23.85034942626953, -23.035598754882812, -22.220848083496094, -21.406097412109375, -20.591346740722656, -19.776596069335938, -18.96184539794922, -18.1470947265625, -17.33234405517578, -16.517593383789062, -15.702842712402344, -14.888092041015625, -14.073341369628906, -13.258590698242188, -12.443840026855469, -11.62908935546875, -10.814337730407715, -9.999587059020996, -9.184836387634277, -8.370085716247559, -7.55533504486084, -6.740583896636963, -5.925833225250244, -5.111082553863525, -4.296331405639648, -3.4815807342529297, -2.6668319702148438, -1.8520811796188354, -1.0373303890228271, -0.2225794792175293, 0.5921711921691895, 1.4069218635559082, 2.221673011779785, 3.036423683166504, 3.8511743545532227, 4.665925025939941, 5.48067569732666, 6.295426845550537, 7.110177516937256, 7.924928188323975, 8.739679336547852, 9.55443000793457, 10.369180679321289, 11.183931350708008, 11.998682022094727, 12.813432693481445, 13.628183364868164, 14.442934036254883, 15.257685661315918, 16.072437286376953, 16.887187957763672, 17.70193862915039, 18.51668930053711, 19.331439971923828, 20.146190643310547, 20.960941314697266, 21.775691986083984, 22.590442657470703, 23.405193328857422]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 6.0, 12.0, 8.0, 13.0, 14.0, 18.0, 22.0, 22.0, 19.0, 20.0, 33.0, 29.0, 36.0, 38.0, 44.0, 35.0, 27.0, 35.0, 26.0, 36.0, 27.0, 31.0, 37.0, 42.0, 37.0, 37.0, 39.0, 35.0, 22.0, 22.0, 15.0, 20.0, 21.0, 21.0, 13.0, 9.0, 15.0, 8.0, 13.0, 4.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-29.035263061523438, -28.222087860107422, -27.408910751342773, -26.595735549926758, -25.78255844116211, -24.969383239746094, -24.156208038330078, -23.34303092956543, -22.52985382080078, -21.716678619384766, -20.903501510620117, -20.0903263092041, -19.277149200439453, -18.463973999023438, -17.650798797607422, -16.837621688842773, -16.024446487426758, -15.211270332336426, -14.398094177246094, -13.584918975830078, -12.77174186706543, -11.958566665649414, -11.145390510559082, -10.33221435546875, -9.519038200378418, -8.705862045288086, -7.892685890197754, -7.07951021194458, -6.266334056854248, -5.453157901763916, -4.639982223510742, -3.82680606842041, -3.013629913330078, -2.200453758239746, -1.3872778415679932, -0.5741019248962402, 0.2390742301940918, 1.0522503852844238, 1.8654260635375977, 2.6786022186279297, 3.4917783737182617, 4.304954528808594, 5.118130683898926, 5.9313063621521, 6.744482517242432, 7.557658672332764, 8.370834350585938, 9.18401050567627, 9.997186660766602, 10.810362815856934, 11.623538970947266, 12.436714172363281, 13.24989128112793, 14.063066482543945, 14.876242637634277, 15.68941879272461, 16.502593994140625, 17.31576919555664, 18.12894630432129, 18.942121505737305, 19.755298614501953, 20.56847381591797, 21.381649017333984, 22.194826126098633, 23.00800323486328]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 1.0, 2.0, 3.0, 16.0, 13.0, 30.0, 21.0, 38.0, 53.0, 59.0, 62.0, 65.0, 78.0, 93.0, 100.0, 77.0, 71.0, 48.0, 45.0, 36.0, 41.0, 21.0, 11.0, 7.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.3154296875, -4.193359375, -4.0712890625, -3.94921875, -3.8271484375, -3.705078125, -3.5830078125, -3.4609375, -3.3388671875, -3.216796875, -3.0947265625, -2.97265625, -2.8505859375, -2.728515625, -2.6064453125, -2.484375, -2.3623046875, -2.240234375, -2.1181640625, -1.99609375, -1.8740234375, -1.751953125, -1.6298828125, -1.5078125, -1.3857421875, -1.263671875, -1.1416015625, -1.01953125, -0.8974609375, -0.775390625, -0.6533203125, -0.53125, -0.4091796875, -0.287109375, -0.1650390625, -0.04296875, 0.0791015625, 0.201171875, 0.3232421875, 0.4453125, 0.5673828125, 0.689453125, 0.8115234375, 0.93359375, 1.0556640625, 1.177734375, 1.2998046875, 1.421875, 1.5439453125, 1.666015625, 1.7880859375, 1.91015625, 2.0322265625, 2.154296875, 2.2763671875, 2.3984375, 2.5205078125, 2.642578125, 2.7646484375, 2.88671875, 3.0087890625, 3.130859375, 3.2529296875, 3.375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 18.0, 14.0, 36.0, 35.0, 62.0, 88.0, 163.0, 310.0, 680.0, 1563.0, 5208.0, 39891.0, 3849853.0, 282621.0, 9928.0, 2313.0, 776.0, 351.0, 140.0, 78.0, 38.0, 37.0, 17.0, 10.0, 7.0, 6.0, 9.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -24.306640625, -23.64453125, -22.982421875, -22.3203125, -21.658203125, -20.99609375, -20.333984375, -19.671875, -19.009765625, -18.34765625, -17.685546875, -17.0234375, -16.361328125, -15.69921875, -15.037109375, -14.375, -13.712890625, -13.05078125, -12.388671875, -11.7265625, -11.064453125, -10.40234375, -9.740234375, -9.078125, -8.416015625, -7.75390625, -7.091796875, -6.4296875, -5.767578125, -5.10546875, -4.443359375, -3.78125, -3.119140625, -2.45703125, -1.794921875, -1.1328125, -0.470703125, 0.19140625, 0.853515625, 1.515625, 2.177734375, 2.83984375, 3.501953125, 4.1640625, 4.826171875, 5.48828125, 6.150390625, 6.8125, 7.474609375, 8.13671875, 8.798828125, 9.4609375, 10.123046875, 10.78515625, 11.447265625, 12.109375, 12.771484375, 13.43359375, 14.095703125, 14.7578125, 15.419921875, 16.08203125, 16.744140625, 17.40625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 7.0, 5.0, 5.0, 10.0, 18.0, 15.0, 34.0, 50.0, 46.0, 96.0, 117.0, 237.0, 334.0, 473.0, 627.0, 629.0, 455.0, 342.0, 185.0, 109.0, 63.0, 46.0, 42.0, 26.0, 24.0, 22.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.51953125, -7.290283203125, -7.06103515625, -6.831787109375, -6.6025390625, -6.373291015625, -6.14404296875, -5.914794921875, -5.685546875, -5.456298828125, -5.22705078125, -4.997802734375, -4.7685546875, -4.539306640625, -4.31005859375, -4.080810546875, -3.8515625, -3.622314453125, -3.39306640625, -3.163818359375, -2.9345703125, -2.705322265625, -2.47607421875, -2.246826171875, -2.017578125, -1.788330078125, -1.55908203125, -1.329833984375, -1.1005859375, -0.871337890625, -0.64208984375, -0.412841796875, -0.18359375, 0.045654296875, 0.27490234375, 0.504150390625, 0.7333984375, 0.962646484375, 1.19189453125, 1.421142578125, 1.650390625, 1.879638671875, 2.10888671875, 2.338134765625, 2.5673828125, 2.796630859375, 3.02587890625, 3.255126953125, 3.484375, 3.713623046875, 3.94287109375, 4.172119140625, 4.4013671875, 4.630615234375, 4.85986328125, 5.089111328125, 5.318359375, 5.547607421875, 5.77685546875, 6.006103515625, 6.2353515625, 6.464599609375, 6.69384765625, 6.923095703125, 7.15234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 13.0, 18.0, 21.0, 42.0, 64.0, 107.0, 198.0, 276.0, 520.0, 995.0, 1585.0, 2913.0, 5787.0, 12732.0, 34248.0, 138317.0, 1094385.0, 2462918.0, 340120.0, 62008.0, 19850.0, 8273.0, 3974.0, 2024.0, 1181.0, 673.0, 421.0, 229.0, 145.0, 99.0, 53.0, 29.0, 22.0, 12.0, 7.0, 10.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.875, -10.52685546875, -10.1787109375, -9.83056640625, -9.482421875, -9.13427734375, -8.7861328125, -8.43798828125, -8.08984375, -7.74169921875, -7.3935546875, -7.04541015625, -6.697265625, -6.34912109375, -6.0009765625, -5.65283203125, -5.3046875, -4.95654296875, -4.6083984375, -4.26025390625, -3.912109375, -3.56396484375, -3.2158203125, -2.86767578125, -2.51953125, -2.17138671875, -1.8232421875, -1.47509765625, -1.126953125, -0.77880859375, -0.4306640625, -0.08251953125, 0.265625, 0.61376953125, 0.9619140625, 1.31005859375, 1.658203125, 2.00634765625, 2.3544921875, 2.70263671875, 3.05078125, 3.39892578125, 3.7470703125, 4.09521484375, 4.443359375, 4.79150390625, 5.1396484375, 5.48779296875, 5.8359375, 6.18408203125, 6.5322265625, 6.88037109375, 7.228515625, 7.57666015625, 7.9248046875, 8.27294921875, 8.62109375, 8.96923828125, 9.3173828125, 9.66552734375, 10.013671875, 10.36181640625, 10.7099609375, 11.05810546875, 11.40625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 23.0, 27.0, 60.0, 86.0, 121.0, 162.0, 128.0, 139.0, 91.0, 60.0, 41.0, 27.0, 14.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.423763275146484, -59.6796760559082, -57.93558883666992, -56.19150161743164, -54.447410583496094, -52.70332336425781, -50.95923614501953, -49.21514892578125, -47.47106170654297, -45.72697448730469, -43.982887268066406, -42.238800048828125, -40.494712829589844, -38.75062561035156, -37.006534576416016, -35.262447357177734, -33.51836013793945, -31.774272918701172, -30.03018569946289, -28.286096572875977, -26.542009353637695, -24.797922134399414, -23.0538330078125, -21.30974578857422, -19.565658569335938, -17.821571350097656, -16.077484130859375, -14.333395004272461, -12.58930778503418, -10.845220565795898, -9.1011323928833, -7.357044219970703, -5.612953186035156, -3.868865489959717, -2.1247777938842773, -0.3806900978088379, 1.3633975982666016, 3.107484817504883, 4.8515729904174805, 6.595661163330078, 8.33974838256836, 10.08383560180664, 11.827923774719238, 13.572011947631836, 15.316099166870117, 17.0601863861084, 18.804275512695312, 20.548362731933594, 22.292449951171875, 24.036537170410156, 25.780624389648438, 27.52471351623535, 29.268800735473633, 31.012887954711914, 32.75697708129883, 34.50106430053711, 36.24515151977539, 37.98923873901367, 39.73332595825195, 41.477413177490234, 43.22150421142578, 44.96559143066406, 46.709678649902344, 48.453765869140625, 50.197853088378906]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 8.0, 0.0, 5.0, 6.0, 5.0, 13.0, 6.0, 13.0, 18.0, 15.0, 24.0, 20.0, 16.0, 19.0, 30.0, 31.0, 20.0, 41.0, 39.0, 39.0, 40.0, 37.0, 30.0, 53.0, 36.0, 37.0, 24.0, 53.0, 35.0, 33.0, 36.0, 31.0, 34.0, 22.0, 17.0, 18.0, 14.0, 13.0, 11.0, 12.0, 7.0, 8.0, 11.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.55889129638672, -18.92671775817871, -18.294546127319336, -17.662372589111328, -17.03019905090332, -16.398025512695312, -15.765853881835938, -15.13368034362793, -14.501507759094238, -13.869335174560547, -13.237161636352539, -12.604989051818848, -11.972816467285156, -11.340642929077148, -10.708470344543457, -10.076297760009766, -9.444124221801758, -8.811951637268066, -8.179778099060059, -7.547605514526367, -6.915432453155518, -6.283259391784668, -5.651086807250977, -5.018913745880127, -4.386740684509277, -3.7545676231384277, -3.1223948001861572, -2.4902219772338867, -1.858048915863037, -1.2258758544921875, -0.593703031539917, 0.038469791412353516, 0.6706409454345703, 1.3028138875961304, 1.9349868297576904, 2.567159652709961, 3.1993327140808105, 3.83150577545166, 4.463678359985352, 5.095851421356201, 5.728024482727051, 6.3601975440979, 6.99237060546875, 7.624543190002441, 8.256715774536133, 8.88888931274414, 9.521061897277832, 10.153234481811523, 10.785408020019531, 11.417580604553223, 12.04975414276123, 12.681926727294922, 13.31410026550293, 13.946272850036621, 14.578445434570312, 15.21061897277832, 15.842791557312012, 16.474964141845703, 17.10713768005371, 17.73931121826172, 18.371482849121094, 19.0036563873291, 19.63582992553711, 20.268001556396484, 20.900175094604492]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 11.0, 9.0, 16.0, 23.0, 31.0, 39.0, 49.0, 51.0, 49.0, 67.0, 73.0, 83.0, 82.0, 77.0, 78.0, 64.0, 47.0, 39.0, 29.0, 23.0, 22.0, 13.0, 10.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.18353271484375, -4.0662841796875, -3.94903564453125, -3.831787109375, -3.71453857421875, -3.5972900390625, -3.48004150390625, -3.36279296875, -3.24554443359375, -3.1282958984375, -3.01104736328125, -2.893798828125, -2.77655029296875, -2.6593017578125, -2.54205322265625, -2.4248046875, -2.30755615234375, -2.1903076171875, -2.07305908203125, -1.955810546875, -1.83856201171875, -1.7213134765625, -1.60406494140625, -1.48681640625, -1.36956787109375, -1.2523193359375, -1.13507080078125, -1.017822265625, -0.90057373046875, -0.7833251953125, -0.66607666015625, -0.548828125, -0.43157958984375, -0.3143310546875, -0.19708251953125, -0.079833984375, 0.03741455078125, 0.1546630859375, 0.27191162109375, 0.38916015625, 0.50640869140625, 0.6236572265625, 0.74090576171875, 0.858154296875, 0.97540283203125, 1.0926513671875, 1.20989990234375, 1.3271484375, 1.44439697265625, 1.5616455078125, 1.67889404296875, 1.796142578125, 1.91339111328125, 2.0306396484375, 2.14788818359375, 2.26513671875, 2.38238525390625, 2.4996337890625, 2.61688232421875, 2.734130859375, 2.85137939453125, 2.9686279296875, 3.08587646484375, 3.203125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 8.0, 15.0, 23.0, 22.0, 53.0, 43.0, 64.0, 111.0, 141.0, 231.0, 354.0, 592.0, 1121.0, 1933.0, 3581.0, 6898.0, 13938.0, 32444.0, 83191.0, 281711.0, 430056.0, 113770.0, 42163.0, 18028.0, 8326.0, 4300.0, 2235.0, 1268.0, 661.0, 397.0, 278.0, 186.0, 118.0, 77.0, 57.0, 46.0, 31.0, 20.0, 19.0, 7.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.220703125, -0.21361732482910156, -0.20653152465820312, -0.1994457244873047, -0.19235992431640625, -0.1852741241455078, -0.17818832397460938, -0.17110252380371094, -0.1640167236328125, -0.15693092346191406, -0.14984512329101562, -0.1427593231201172, -0.13567352294921875, -0.1285877227783203, -0.12150192260742188, -0.11441612243652344, -0.107330322265625, -0.10024452209472656, -0.09315872192382812, -0.08607292175292969, -0.07898712158203125, -0.07190132141113281, -0.06481552124023438, -0.05772972106933594, -0.0506439208984375, -0.04355812072753906, -0.036472320556640625, -0.029386520385742188, -0.02230072021484375, -0.015214920043945312, -0.008129119873046875, -0.0010433197021484375, 0.00604248046875, 0.013128280639648438, 0.020214080810546875, 0.027299880981445312, 0.03438568115234375, 0.04147148132324219, 0.048557281494140625, 0.05564308166503906, 0.0627288818359375, 0.06981468200683594, 0.07690048217773438, 0.08398628234863281, 0.09107208251953125, 0.09815788269042969, 0.10524368286132812, 0.11232948303222656, 0.119415283203125, 0.12650108337402344, 0.13358688354492188, 0.1406726837158203, 0.14775848388671875, 0.1548442840576172, 0.16193008422851562, 0.16901588439941406, 0.1761016845703125, 0.18318748474121094, 0.19027328491210938, 0.1973590850830078, 0.20444488525390625, 0.2115306854248047, 0.21861648559570312, 0.22570228576660156, 0.2327880859375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 3.0, 3.0, 12.0, 5.0, 10.0, 13.0, 20.0, 25.0, 18.0, 23.0, 22.0, 23.0, 28.0, 27.0, 33.0, 26.0, 35.0, 32.0, 35.0, 49.0, 46.0, 1064.0, 41.0, 26.0, 40.0, 26.0, 36.0, 45.0, 25.0, 27.0, 30.0, 20.0, 19.0, 15.0, 22.0, 16.0, 12.0, 13.0, 6.0, 8.0, 11.0, 8.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.75390625, -1.6923828125, -1.630859375, -1.5693359375, -1.5078125, -1.4462890625, -1.384765625, -1.3232421875, -1.26171875, -1.2001953125, -1.138671875, -1.0771484375, -1.015625, -0.9541015625, -0.892578125, -0.8310546875, -0.76953125, -0.7080078125, -0.646484375, -0.5849609375, -0.5234375, -0.4619140625, -0.400390625, -0.3388671875, -0.27734375, -0.2158203125, -0.154296875, -0.0927734375, -0.03125, 0.0302734375, 0.091796875, 0.1533203125, 0.21484375, 0.2763671875, 0.337890625, 0.3994140625, 0.4609375, 0.5224609375, 0.583984375, 0.6455078125, 0.70703125, 0.7685546875, 0.830078125, 0.8916015625, 0.953125, 1.0146484375, 1.076171875, 1.1376953125, 1.19921875, 1.2607421875, 1.322265625, 1.3837890625, 1.4453125, 1.5068359375, 1.568359375, 1.6298828125, 1.69140625, 1.7529296875, 1.814453125, 1.8759765625, 1.9375, 1.9990234375, 2.060546875, 2.1220703125, 2.18359375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 6.0, 5.0, 8.0, 17.0, 20.0, 23.0, 26.0, 62.0, 61.0, 102.0, 148.0, 197.0, 267.0, 378.0, 563.0, 667.0, 927.0, 1296.0, 1818.0, 2533.0, 3623.0, 5171.0, 7089.0, 10240.0, 14920.0, 21567.0, 32635.0, 49898.0, 81573.0, 152216.0, 1317566.0, 154009.0, 81820.0, 50179.0, 32756.0, 21974.0, 15061.0, 10414.0, 7319.0, 5150.0, 3673.0, 2563.0, 1957.0, 1348.0, 968.0, 687.0, 444.0, 368.0, 223.0, 182.0, 115.0, 89.0, 60.0, 50.0, 30.0, 33.0, 18.0, 9.0, 11.0, 7.0, 4.0, 4.0], "bins": [-0.043121337890625, -0.041794776916503906, -0.04046821594238281, -0.03914165496826172, -0.037815093994140625, -0.03648853302001953, -0.03516197204589844, -0.033835411071777344, -0.03250885009765625, -0.031182289123535156, -0.029855728149414062, -0.02852916717529297, -0.027202606201171875, -0.02587604522705078, -0.024549484252929688, -0.023222923278808594, -0.0218963623046875, -0.020569801330566406, -0.019243240356445312, -0.01791667938232422, -0.016590118408203125, -0.015263557434082031, -0.013936996459960938, -0.012610435485839844, -0.01128387451171875, -0.009957313537597656, -0.008630752563476562, -0.007304191589355469, -0.005977630615234375, -0.004651069641113281, -0.0033245086669921875, -0.0019979476928710938, -0.00067138671875, 0.0006551742553710938, 0.0019817352294921875, 0.0033082962036132812, 0.004634857177734375, 0.005961418151855469, 0.0072879791259765625, 0.008614540100097656, 0.00994110107421875, 0.011267662048339844, 0.012594223022460938, 0.013920783996582031, 0.015247344970703125, 0.01657390594482422, 0.017900466918945312, 0.019227027893066406, 0.0205535888671875, 0.021880149841308594, 0.023206710815429688, 0.02453327178955078, 0.025859832763671875, 0.02718639373779297, 0.028512954711914062, 0.029839515686035156, 0.03116607666015625, 0.032492637634277344, 0.03381919860839844, 0.03514575958251953, 0.036472320556640625, 0.03779888153076172, 0.03912544250488281, 0.040452003479003906, 0.041778564453125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 8.0, 15.0, 14.0, 17.0, 16.0, 14.0, 17.0, 24.0, 42.0, 32.0, 50.0, 77.0, 103.0, 111.0, 100.0, 88.0, 48.0, 40.0, 31.0, 31.0, 22.0, 15.0, 20.0, 5.0, 12.0, 4.0, 10.0, 4.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005235671997070312, -0.0005052238702774048, -0.0004868805408477783, -0.00046853721141815186, -0.0004501938819885254, -0.0004318505525588989, -0.00041350722312927246, -0.000395163893699646, -0.00037682056427001953, -0.00035847723484039307, -0.0003401339054107666, -0.00032179057598114014, -0.00030344724655151367, -0.0002851039171218872, -0.00026676058769226074, -0.0002484172582626343, -0.0002300739288330078, -0.00021173059940338135, -0.00019338726997375488, -0.00017504394054412842, -0.00015670061111450195, -0.0001383572816848755, -0.00012001395225524902, -0.00010167062282562256, -8.33272933959961e-05, -6.498396396636963e-05, -4.6640634536743164e-05, -2.82973051071167e-05, -9.953975677490234e-06, 8.38935375213623e-06, 2.6732683181762695e-05, 4.507601261138916e-05, 6.341934204101562e-05, 8.176267147064209e-05, 0.00010010600090026855, 0.00011844933032989502, 0.00013679265975952148, 0.00015513598918914795, 0.00017347931861877441, 0.00019182264804840088, 0.00021016597747802734, 0.0002285093069076538, 0.0002468526363372803, 0.00026519596576690674, 0.0002835392951965332, 0.00030188262462615967, 0.00032022595405578613, 0.0003385692834854126, 0.00035691261291503906, 0.00037525594234466553, 0.000393599271774292, 0.00041194260120391846, 0.0004302859306335449, 0.0004486292600631714, 0.00046697258949279785, 0.0004853159189224243, 0.0005036592483520508, 0.0005220025777816772, 0.0005403459072113037, 0.0005586892366409302, 0.0005770325660705566, 0.0005953758955001831, 0.0006137192249298096, 0.000632062554359436, 0.0006504058837890625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 7.0, 9.0, 13.0, 21.0, 21.0, 29.0, 57.0, 67.0, 96.0, 126.0, 210.0, 886.0, 8087.0, 155497.0, 844419.0, 35458.0, 2582.0, 418.0, 177.0, 99.0, 64.0, 35.0, 38.0, 31.0, 24.0, 18.0, 12.0, 9.0, 13.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01025390625, -0.009963154792785645, -0.009672403335571289, -0.009381651878356934, -0.009090900421142578, -0.008800148963928223, -0.008509397506713867, -0.008218646049499512, -0.007927894592285156, -0.007637143135070801, -0.007346391677856445, -0.00705564022064209, -0.006764888763427734, -0.006474137306213379, -0.0061833858489990234, -0.005892634391784668, -0.0056018829345703125, -0.005311131477355957, -0.0050203800201416016, -0.004729628562927246, -0.004438877105712891, -0.004148125648498535, -0.0038573741912841797, -0.0035666227340698242, -0.0032758712768554688, -0.0029851198196411133, -0.002694368362426758, -0.0024036169052124023, -0.002112865447998047, -0.0018221139907836914, -0.001531362533569336, -0.0012406110763549805, -0.000949859619140625, -0.0006591081619262695, -0.00036835670471191406, -7.76052474975586e-05, 0.00021314620971679688, 0.0005038976669311523, 0.0007946491241455078, 0.0010854005813598633, 0.0013761520385742188, 0.0016669034957885742, 0.0019576549530029297, 0.002248406410217285, 0.0025391578674316406, 0.002829909324645996, 0.0031206607818603516, 0.003411412239074707, 0.0037021636962890625, 0.003992915153503418, 0.0042836666107177734, 0.004574418067932129, 0.004865169525146484, 0.00515592098236084, 0.005446672439575195, 0.005737423896789551, 0.006028175354003906, 0.006318926811218262, 0.006609678268432617, 0.006900429725646973, 0.007191181182861328, 0.007481932640075684, 0.007772684097290039, 0.008063435554504395, 0.00835418701171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 11.0, 51.0, 607.0, 323.0, 24.0], "bins": [-0.013291134499013424, -0.013076398521661758, -0.012861662544310093, -0.012646926566958427, -0.012432190589606762, -0.012217454612255096, -0.012002719566226006, -0.01178798358887434, -0.011573247611522675, -0.011358511634171009, -0.011143775656819344, -0.010929039679467678, -0.010714303702116013, -0.010499568656086922, -0.010284831747412682, -0.01007009670138359, -0.00985535979270935, -0.009640623815357685, -0.00942588783800602, -0.009211151860654354, -0.008996415883302689, -0.008781680837273598, -0.008566943928599358, -0.008352208882570267, -0.008137472905218601, -0.007922736927866936, -0.00770800095051527, -0.007493264973163605, -0.0072785294614732265, -0.007063793484121561, -0.0068490575067698956, -0.00663432152941823, -0.0064195855520665646, -0.006204849574714899, -0.0059901135973632336, -0.005775378085672855, -0.00556064210832119, -0.005345906130969524, -0.005131170153617859, -0.004916434176266193, -0.004701698198914528, -0.004486962221562862, -0.004272226244211197, -0.004057490266859531, -0.003842754755169153, -0.0036280187778174877, -0.0034132828004658222, -0.0031985468231141567, -0.0029838113114237785, -0.002769075334072113, -0.002554339589551091, -0.0023396036121994257, -0.002124867867678404, -0.0019101318903267384, -0.0016953959129750729, -0.0014806600520387292, -0.0012659241911023855, -0.0010511883301660419, -0.0008364524110220373, -0.0006217164918780327, -0.000406980630941689, -0.00019224477000534534, 2.2491207346320152e-05, 0.00023722706828266382, 0.0004519629292190075]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 14.0, 15.0, 21.0, 36.0, 26.0, 46.0, 43.0, 48.0, 64.0, 55.0, 64.0, 59.0, 70.0, 61.0, 62.0, 53.0, 52.0, 42.0, 31.0, 26.0, 25.0, 21.0, 19.0, 13.0, 6.0, 12.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005148649215698242, -0.0004944652318954468, -0.00047406554222106934, -0.0004536658525466919, -0.00043326616287231445, -0.000412866473197937, -0.00039246678352355957, -0.00037206709384918213, -0.0003516674041748047, -0.00033126771450042725, -0.0003108680248260498, -0.00029046833515167236, -0.0002700686454772949, -0.0002496689558029175, -0.00022926926612854004, -0.0002088695764541626, -0.00018846988677978516, -0.00016807019710540771, -0.00014767050743103027, -0.00012727081775665283, -0.00010687112808227539, -8.647143840789795e-05, -6.607174873352051e-05, -4.5672059059143066e-05, -2.5272369384765625e-05, -4.872679710388184e-06, 1.5527009963989258e-05, 3.59266996383667e-05, 5.632638931274414e-05, 7.672607898712158e-05, 9.712576866149902e-05, 0.00011752545833587646, 0.0001379251480102539, 0.00015832483768463135, 0.0001787245273590088, 0.00019912421703338623, 0.00021952390670776367, 0.0002399235963821411, 0.00026032328605651855, 0.000280722975730896, 0.00030112266540527344, 0.0003215223550796509, 0.0003419220447540283, 0.00036232173442840576, 0.0003827214241027832, 0.00040312111377716064, 0.0004235208034515381, 0.00044392049312591553, 0.00046432018280029297, 0.0004847198724746704, 0.0005051195621490479, 0.0005255192518234253, 0.0005459189414978027, 0.0005663186311721802, 0.0005867183208465576, 0.0006071180105209351, 0.0006275177001953125, 0.0006479173898696899, 0.0006683170795440674, 0.0006887167692184448, 0.0007091164588928223, 0.0007295161485671997, 0.0007499158382415771, 0.0007703155279159546, 0.000790715217590332]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 11.0, 9.0, 16.0, 23.0, 31.0, 39.0, 49.0, 51.0, 49.0, 67.0, 73.0, 83.0, 82.0, 77.0, 78.0, 64.0, 47.0, 39.0, 29.0, 23.0, 22.0, 13.0, 10.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.18353271484375, -4.0662841796875, -3.94903564453125, -3.831787109375, -3.71453857421875, -3.5972900390625, -3.48004150390625, -3.36279296875, -3.24554443359375, -3.1282958984375, -3.01104736328125, -2.893798828125, -2.77655029296875, -2.6593017578125, -2.54205322265625, -2.4248046875, -2.30755615234375, -2.1903076171875, -2.07305908203125, -1.955810546875, -1.83856201171875, -1.7213134765625, -1.60406494140625, -1.48681640625, -1.36956787109375, -1.2523193359375, -1.13507080078125, -1.017822265625, -0.90057373046875, -0.7833251953125, -0.66607666015625, -0.548828125, -0.43157958984375, -0.3143310546875, -0.19708251953125, -0.079833984375, 0.03741455078125, 0.1546630859375, 0.27191162109375, 0.38916015625, 0.50640869140625, 0.6236572265625, 0.74090576171875, 0.858154296875, 0.97540283203125, 1.0926513671875, 1.20989990234375, 1.3271484375, 1.44439697265625, 1.5616455078125, 1.67889404296875, 1.796142578125, 1.91339111328125, 2.0306396484375, 2.14788818359375, 2.26513671875, 2.38238525390625, 2.4996337890625, 2.61688232421875, 2.734130859375, 2.85137939453125, 2.9686279296875, 3.08587646484375, 3.203125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 8.0, 9.0, 11.0, 21.0, 21.0, 46.0, 73.0, 127.0, 209.0, 501.0, 1128.0, 3242.0, 13089.0, 91205.0, 814384.0, 104808.0, 13904.0, 3544.0, 1207.0, 488.0, 224.0, 120.0, 63.0, 44.0, 32.0, 15.0, 13.0, 12.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2578125, -10.9219970703125, -10.586181640625, -10.2503662109375, -9.91455078125, -9.5787353515625, -9.242919921875, -8.9071044921875, -8.5712890625, -8.2354736328125, -7.899658203125, -7.5638427734375, -7.22802734375, -6.8922119140625, -6.556396484375, -6.2205810546875, -5.884765625, -5.5489501953125, -5.213134765625, -4.8773193359375, -4.54150390625, -4.2056884765625, -3.869873046875, -3.5340576171875, -3.1982421875, -2.8624267578125, -2.526611328125, -2.1907958984375, -1.85498046875, -1.5191650390625, -1.183349609375, -0.8475341796875, -0.51171875, -0.1759033203125, 0.159912109375, 0.4957275390625, 0.83154296875, 1.1673583984375, 1.503173828125, 1.8389892578125, 2.1748046875, 2.5106201171875, 2.846435546875, 3.1822509765625, 3.51806640625, 3.8538818359375, 4.189697265625, 4.5255126953125, 4.861328125, 5.1971435546875, 5.532958984375, 5.8687744140625, 6.20458984375, 6.5404052734375, 6.876220703125, 7.2120361328125, 7.5478515625, 7.8836669921875, 8.219482421875, 8.5552978515625, 8.89111328125, 9.2269287109375, 9.562744140625, 9.8985595703125, 10.234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 10.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 15.0, 15.0, 25.0, 21.0, 24.0, 25.0, 23.0, 48.0, 33.0, 19.0, 39.0, 46.0, 58.0, 64.0, 110.0, 190.0, 1367.0, 236.0, 120.0, 52.0, 53.0, 43.0, 43.0, 43.0, 32.0, 26.0, 17.0, 34.0, 24.0, 20.0, 28.0, 18.0, 15.0, 13.0, 8.0, 11.0, 9.0, 10.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.86328125, -6.6466064453125, -6.429931640625, -6.2132568359375, -5.99658203125, -5.7799072265625, -5.563232421875, -5.3465576171875, -5.1298828125, -4.9132080078125, -4.696533203125, -4.4798583984375, -4.26318359375, -4.0465087890625, -3.829833984375, -3.6131591796875, -3.396484375, -3.1798095703125, -2.963134765625, -2.7464599609375, -2.52978515625, -2.3131103515625, -2.096435546875, -1.8797607421875, -1.6630859375, -1.4464111328125, -1.229736328125, -1.0130615234375, -0.79638671875, -0.5797119140625, -0.363037109375, -0.1463623046875, 0.0703125, 0.2869873046875, 0.503662109375, 0.7203369140625, 0.93701171875, 1.1536865234375, 1.370361328125, 1.5870361328125, 1.8037109375, 2.0203857421875, 2.237060546875, 2.4537353515625, 2.67041015625, 2.8870849609375, 3.103759765625, 3.3204345703125, 3.537109375, 3.7537841796875, 3.970458984375, 4.1871337890625, 4.40380859375, 4.6204833984375, 4.837158203125, 5.0538330078125, 5.2705078125, 5.4871826171875, 5.703857421875, 5.9205322265625, 6.13720703125, 6.3538818359375, 6.570556640625, 6.7872314453125, 7.00390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 12.0, 21.0, 12.0, 14.0, 17.0, 28.0, 42.0, 53.0, 59.0, 124.0, 173.0, 227.0, 423.0, 740.0, 1421.0, 2856.0, 6097.0, 14951.0, 46549.0, 355342.0, 2486689.0, 174935.0, 33365.0, 11538.0, 4935.0, 2216.0, 1134.0, 636.0, 341.0, 232.0, 136.0, 85.0, 75.0, 47.0, 42.0, 20.0, 24.0, 14.0, 13.0, 8.0, 13.0, 8.0, 4.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-10.9765625, -10.637451171875, -10.29833984375, -9.959228515625, -9.6201171875, -9.281005859375, -8.94189453125, -8.602783203125, -8.263671875, -7.924560546875, -7.58544921875, -7.246337890625, -6.9072265625, -6.568115234375, -6.22900390625, -5.889892578125, -5.55078125, -5.211669921875, -4.87255859375, -4.533447265625, -4.1943359375, -3.855224609375, -3.51611328125, -3.177001953125, -2.837890625, -2.498779296875, -2.15966796875, -1.820556640625, -1.4814453125, -1.142333984375, -0.80322265625, -0.464111328125, -0.125, 0.214111328125, 0.55322265625, 0.892333984375, 1.2314453125, 1.570556640625, 1.90966796875, 2.248779296875, 2.587890625, 2.927001953125, 3.26611328125, 3.605224609375, 3.9443359375, 4.283447265625, 4.62255859375, 4.961669921875, 5.30078125, 5.639892578125, 5.97900390625, 6.318115234375, 6.6572265625, 6.996337890625, 7.33544921875, 7.674560546875, 8.013671875, 8.352783203125, 8.69189453125, 9.031005859375, 9.3701171875, 9.709228515625, 10.04833984375, 10.387451171875, 10.7265625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [4.0, 140.0, 809.0, 65.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.585744857788086, -10.903063774108887, -3.2203826904296875, 4.462297439575195, 12.144979476928711, 19.827661514282227, 27.510339736938477, 35.193023681640625, 42.875701904296875, 50.55838394165039, 58.241065979003906, 65.92374420166016, 73.60643005371094, 81.28910827636719, 88.97178649902344, 96.65446472167969, 104.33715057373047, 112.01982879638672, 119.7025146484375, 127.38519287109375, 135.06787109375, 142.75054931640625, 150.4332275390625, 158.1159210205078, 165.79859924316406, 173.4812774658203, 181.16395568847656, 188.84664916992188, 196.52932739257812, 204.21200561523438, 211.89468383789062, 219.57736206054688, 227.26004028320312, 234.94271850585938, 242.62539672851562, 250.30807495117188, 257.9907531738281, 265.6734619140625, 273.35614013671875, 281.038818359375, 288.72149658203125, 296.4041748046875, 304.08685302734375, 311.76953125, 319.45220947265625, 327.1348876953125, 334.81756591796875, 342.5002746582031, 350.18292236328125, 357.8656005859375, 365.54827880859375, 373.23095703125, 380.91363525390625, 388.5963134765625, 396.27899169921875, 403.9617004394531, 411.6443786621094, 419.3270568847656, 427.0097351074219, 434.6924133300781, 442.3750915527344, 450.05780029296875, 457.740478515625, 465.42315673828125, 473.1058349609375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 5.0, 12.0, 8.0, 15.0, 22.0, 19.0, 20.0, 25.0, 18.0, 34.0, 30.0, 28.0, 27.0, 33.0, 56.0, 37.0, 35.0, 33.0, 36.0, 35.0, 45.0, 49.0, 34.0, 40.0, 38.0, 38.0, 28.0, 17.0, 21.0, 24.0, 16.0, 20.0, 18.0, 17.0, 8.0, 8.0, 4.0, 7.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.87702751159668, -28.988431930541992, -28.099836349487305, -27.211238861083984, -26.322643280029297, -25.43404769897461, -24.545452117919922, -23.656856536865234, -22.768260955810547, -21.87966537475586, -20.991069793701172, -20.102474212646484, -19.213876724243164, -18.325281143188477, -17.43668556213379, -16.5480899810791, -15.659492492675781, -14.770896911621094, -13.88230037689209, -12.993704795837402, -12.105108261108398, -11.216512680053711, -10.327917098999023, -9.439321517944336, -8.550724983215332, -7.662128925323486, -6.773532867431641, -5.884937286376953, -4.996341228485107, -4.107745170593262, -3.219149589538574, -2.3305535316467285, -1.4419574737548828, -0.5533615350723267, 0.3352344036102295, 1.223830223083496, 2.112426280975342, 3.0010223388671875, 3.889617919921875, 4.778213977813721, 5.666810035705566, 6.555406093597412, 7.444002151489258, 8.332597732543945, 9.221193313598633, 10.109789848327637, 10.998385429382324, 11.886981964111328, 12.775577545166016, 13.664173126220703, 14.552769660949707, 15.441365242004395, 16.3299617767334, 17.218557357788086, 18.107152938842773, 18.99574851989746, 19.88434600830078, 20.77294158935547, 21.661537170410156, 22.550132751464844, 23.438730239868164, 24.32732582092285, 25.21592140197754, 26.104516983032227, 26.993112564086914]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 14.0, 10.0, 16.0, 37.0, 31.0, 34.0, 46.0, 53.0, 42.0, 59.0, 63.0, 86.0, 83.0, 58.0, 77.0, 67.0, 37.0, 46.0, 35.0, 24.0, 25.0, 19.0, 12.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1171875, -4.005035400390625, -3.89288330078125, -3.780731201171875, -3.6685791015625, -3.556427001953125, -3.44427490234375, -3.332122802734375, -3.219970703125, -3.107818603515625, -2.99566650390625, -2.883514404296875, -2.7713623046875, -2.659210205078125, -2.54705810546875, -2.434906005859375, -2.32275390625, -2.210601806640625, -2.09844970703125, -1.986297607421875, -1.8741455078125, -1.761993408203125, -1.64984130859375, -1.537689208984375, -1.425537109375, -1.313385009765625, -1.20123291015625, -1.089080810546875, -0.9769287109375, -0.864776611328125, -0.75262451171875, -0.640472412109375, -0.5283203125, -0.416168212890625, -0.30401611328125, -0.191864013671875, -0.0797119140625, 0.032440185546875, 0.14459228515625, 0.256744384765625, 0.368896484375, 0.481048583984375, 0.59320068359375, 0.705352783203125, 0.8175048828125, 0.929656982421875, 1.04180908203125, 1.153961181640625, 1.26611328125, 1.378265380859375, 1.49041748046875, 1.602569580078125, 1.7147216796875, 1.826873779296875, 1.93902587890625, 2.051177978515625, 2.163330078125, 2.275482177734375, 2.38763427734375, 2.499786376953125, 2.6119384765625, 2.724090576171875, 2.83624267578125, 2.948394775390625, 3.060546875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 12.0, 12.0, 23.0, 23.0, 20.0, 48.0, 45.0, 102.0, 163.0, 273.0, 494.0, 918.0, 1918.0, 5519.0, 21902.0, 458838.0, 3565933.0, 119277.0, 12673.0, 3553.0, 1277.0, 566.0, 284.0, 150.0, 99.0, 66.0, 28.0, 12.0, 13.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.374755859375, -16.92138671875, -16.468017578125, -16.0146484375, -15.561279296875, -15.10791015625, -14.654541015625, -14.201171875, -13.747802734375, -13.29443359375, -12.841064453125, -12.3876953125, -11.934326171875, -11.48095703125, -11.027587890625, -10.57421875, -10.120849609375, -9.66748046875, -9.214111328125, -8.7607421875, -8.307373046875, -7.85400390625, -7.400634765625, -6.947265625, -6.493896484375, -6.04052734375, -5.587158203125, -5.1337890625, -4.680419921875, -4.22705078125, -3.773681640625, -3.3203125, -2.866943359375, -2.41357421875, -1.960205078125, -1.5068359375, -1.053466796875, -0.60009765625, -0.146728515625, 0.306640625, 0.760009765625, 1.21337890625, 1.666748046875, 2.1201171875, 2.573486328125, 3.02685546875, 3.480224609375, 3.93359375, 4.386962890625, 4.84033203125, 5.293701171875, 5.7470703125, 6.200439453125, 6.65380859375, 7.107177734375, 7.560546875, 8.013916015625, 8.46728515625, 8.920654296875, 9.3740234375, 9.827392578125, 10.28076171875, 10.734130859375, 11.1875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 10.0, 16.0, 15.0, 19.0, 44.0, 73.0, 93.0, 144.0, 274.0, 439.0, 654.0, 779.0, 582.0, 364.0, 202.0, 111.0, 97.0, 52.0, 25.0, 18.0, 15.0, 8.0, 11.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.3380126953125, -8.043212890625, -7.7484130859375, -7.45361328125, -7.1588134765625, -6.864013671875, -6.5692138671875, -6.2744140625, -5.9796142578125, -5.684814453125, -5.3900146484375, -5.09521484375, -4.8004150390625, -4.505615234375, -4.2108154296875, -3.916015625, -3.6212158203125, -3.326416015625, -3.0316162109375, -2.73681640625, -2.4420166015625, -2.147216796875, -1.8524169921875, -1.5576171875, -1.2628173828125, -0.968017578125, -0.6732177734375, -0.37841796875, -0.0836181640625, 0.211181640625, 0.5059814453125, 0.80078125, 1.0955810546875, 1.390380859375, 1.6851806640625, 1.97998046875, 2.2747802734375, 2.569580078125, 2.8643798828125, 3.1591796875, 3.4539794921875, 3.748779296875, 4.0435791015625, 4.33837890625, 4.6331787109375, 4.927978515625, 5.2227783203125, 5.517578125, 5.8123779296875, 6.107177734375, 6.4019775390625, 6.69677734375, 6.9915771484375, 7.286376953125, 7.5811767578125, 7.8759765625, 8.1707763671875, 8.465576171875, 8.7603759765625, 9.05517578125, 9.3499755859375, 9.644775390625, 9.9395751953125, 10.234375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 14.0, 32.0, 37.0, 65.0, 127.0, 234.0, 454.0, 811.0, 1663.0, 3733.0, 9589.0, 31475.0, 162612.0, 1705515.0, 2030701.0, 193676.0, 35183.0, 10605.0, 4009.0, 1839.0, 881.0, 459.0, 243.0, 152.0, 77.0, 46.0, 19.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.5205078125, -13.111328125, -12.7021484375, -12.29296875, -11.8837890625, -11.474609375, -11.0654296875, -10.65625, -10.2470703125, -9.837890625, -9.4287109375, -9.01953125, -8.6103515625, -8.201171875, -7.7919921875, -7.3828125, -6.9736328125, -6.564453125, -6.1552734375, -5.74609375, -5.3369140625, -4.927734375, -4.5185546875, -4.109375, -3.7001953125, -3.291015625, -2.8818359375, -2.47265625, -2.0634765625, -1.654296875, -1.2451171875, -0.8359375, -0.4267578125, -0.017578125, 0.3916015625, 0.80078125, 1.2099609375, 1.619140625, 2.0283203125, 2.4375, 2.8466796875, 3.255859375, 3.6650390625, 4.07421875, 4.4833984375, 4.892578125, 5.3017578125, 5.7109375, 6.1201171875, 6.529296875, 6.9384765625, 7.34765625, 7.7568359375, 8.166015625, 8.5751953125, 8.984375, 9.3935546875, 9.802734375, 10.2119140625, 10.62109375, 11.0302734375, 11.439453125, 11.8486328125, 12.2578125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 8.0, 39.0, 61.0, 114.0, 191.0, 186.0, 163.0, 99.0, 85.0, 27.0, 20.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-100.6738510131836, -98.3565444946289, -96.03923797607422, -93.72193145751953, -91.40461730957031, -89.08731079101562, -86.77000427246094, -84.45269775390625, -82.13539123535156, -79.81808471679688, -77.50077819824219, -75.1834716796875, -72.86616516113281, -70.5488510131836, -68.2315444946289, -65.91423797607422, -63.59693145751953, -61.279624938964844, -58.962318420410156, -56.6450080871582, -54.327701568603516, -52.01039505004883, -49.693084716796875, -47.37577819824219, -45.0584716796875, -42.74116516113281, -40.423858642578125, -38.10654830932617, -35.789241790771484, -33.4719352722168, -31.154626846313477, -28.837318420410156, -26.520004272460938, -24.20269775390625, -21.88538932800293, -19.56808090209961, -17.250774383544922, -14.933466911315918, -12.616159439086914, -10.298851013183594, -7.981544494628906, -5.664237022399902, -3.3469295501708984, -1.0296220779418945, 1.2876853942871094, 3.6049928665161133, 5.922300338745117, 8.239608764648438, 10.556915283203125, 12.874222755432129, 15.191530227661133, 17.508838653564453, 19.82614517211914, 22.143451690673828, 24.46076011657715, 26.77806854248047, 29.095375061035156, 31.412681579589844, 33.72998809814453, 36.047298431396484, 38.36460494995117, 40.68191146850586, 42.99922180175781, 45.3165283203125, 47.63383483886719]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 4.0, 5.0, 9.0, 12.0, 12.0, 12.0, 17.0, 32.0, 27.0, 35.0, 31.0, 46.0, 30.0, 36.0, 50.0, 46.0, 34.0, 41.0, 43.0, 62.0, 45.0, 42.0, 41.0, 32.0, 47.0, 27.0, 21.0, 27.0, 20.0, 22.0, 19.0, 10.0, 12.0, 8.0, 7.0, 7.0, 5.0, 10.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.952232360839844, -20.172441482543945, -19.392650604248047, -18.61285972595215, -17.83306884765625, -17.053279876708984, -16.273487091064453, -15.493698120117188, -14.713907241821289, -13.93411636352539, -13.154325485229492, -12.374534606933594, -11.594744682312012, -10.814953804016113, -10.035162925720215, -9.255373001098633, -8.475581169128418, -7.6957902908325195, -6.915999889373779, -6.136209011077881, -5.356418609619141, -4.576627731323242, -3.7968368530273438, -3.0170464515686035, -2.237255573272705, -1.4574649333953857, -0.6776741743087769, 0.10211658477783203, 0.8819072246551514, 1.6616978645324707, 2.441488742828369, 3.2212791442871094, 4.001070022583008, 4.780860900878906, 5.5606513023376465, 6.340442180633545, 7.120232582092285, 7.900023460388184, 8.679814338684082, 9.459604263305664, 10.239395141601562, 11.019186019897461, 11.79897689819336, 12.578767776489258, 13.35855770111084, 14.138348579406738, 14.918139457702637, 15.697929382324219, 16.47772216796875, 17.25751304626465, 18.037303924560547, 18.817094802856445, 19.596885681152344, 20.37667465209961, 21.15646743774414, 21.936256408691406, 22.716047286987305, 23.495838165283203, 24.2756290435791, 25.055419921875, 25.8352108001709, 26.615001678466797, 27.394790649414062, 28.17458152770996, 28.95437240600586]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 9.0, 18.0, 15.0, 23.0, 32.0, 41.0, 37.0, 32.0, 45.0, 68.0, 67.0, 73.0, 67.0, 67.0, 59.0, 64.0, 49.0, 35.0, 46.0, 30.0, 30.0, 17.0, 19.0, 15.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.76171875, -3.657684326171875, -3.55364990234375, -3.449615478515625, -3.3455810546875, -3.241546630859375, -3.13751220703125, -3.033477783203125, -2.929443359375, -2.825408935546875, -2.72137451171875, -2.617340087890625, -2.5133056640625, -2.409271240234375, -2.30523681640625, -2.201202392578125, -2.09716796875, -1.993133544921875, -1.88909912109375, -1.785064697265625, -1.6810302734375, -1.576995849609375, -1.47296142578125, -1.368927001953125, -1.264892578125, -1.160858154296875, -1.05682373046875, -0.952789306640625, -0.8487548828125, -0.744720458984375, -0.64068603515625, -0.536651611328125, -0.4326171875, -0.328582763671875, -0.22454833984375, -0.120513916015625, -0.0164794921875, 0.087554931640625, 0.19158935546875, 0.295623779296875, 0.399658203125, 0.503692626953125, 0.60772705078125, 0.711761474609375, 0.8157958984375, 0.919830322265625, 1.02386474609375, 1.127899169921875, 1.23193359375, 1.335968017578125, 1.44000244140625, 1.544036865234375, 1.6480712890625, 1.752105712890625, 1.85614013671875, 1.960174560546875, 2.064208984375, 2.168243408203125, 2.27227783203125, 2.376312255859375, 2.4803466796875, 2.584381103515625, 2.68841552734375, 2.792449951171875, 2.896484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 14.0, 7.0, 23.0, 33.0, 33.0, 46.0, 55.0, 93.0, 130.0, 188.0, 302.0, 452.0, 733.0, 1250.0, 2136.0, 3787.0, 6835.0, 13023.0, 24878.0, 50062.0, 111770.0, 359635.0, 284134.0, 96445.0, 44268.0, 21939.0, 11440.0, 6279.0, 3438.0, 1953.0, 1146.0, 666.0, 450.0, 293.0, 185.0, 110.0, 90.0, 60.0, 53.0, 30.0, 18.0, 13.0, 17.0, 11.0, 13.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0], "bins": [-0.1978759765625, -0.19204139709472656, -0.18620681762695312, -0.1803722381591797, -0.17453765869140625, -0.1687030792236328, -0.16286849975585938, -0.15703392028808594, -0.1511993408203125, -0.14536476135253906, -0.13953018188476562, -0.1336956024169922, -0.12786102294921875, -0.12202644348144531, -0.11619186401367188, -0.11035728454589844, -0.104522705078125, -0.09868812561035156, -0.09285354614257812, -0.08701896667480469, -0.08118438720703125, -0.07534980773925781, -0.06951522827148438, -0.06368064880371094, -0.0578460693359375, -0.05201148986816406, -0.046176910400390625, -0.04034233093261719, -0.03450775146484375, -0.028673171997070312, -0.022838592529296875, -0.017004013061523438, -0.01116943359375, -0.0053348541259765625, 0.000499725341796875, 0.0063343048095703125, 0.01216888427734375, 0.018003463745117188, 0.023838043212890625, 0.029672622680664062, 0.0355072021484375, 0.04134178161621094, 0.047176361083984375, 0.05301094055175781, 0.05884552001953125, 0.06468009948730469, 0.07051467895507812, 0.07634925842285156, 0.082183837890625, 0.08801841735839844, 0.09385299682617188, 0.09968757629394531, 0.10552215576171875, 0.11135673522949219, 0.11719131469726562, 0.12302589416503906, 0.1288604736328125, 0.13469505310058594, 0.14052963256835938, 0.1463642120361328, 0.15219879150390625, 0.1580333709716797, 0.16386795043945312, 0.16970252990722656, 0.175537109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 9.0, 10.0, 7.0, 7.0, 8.0, 14.0, 6.0, 7.0, 20.0, 20.0, 24.0, 22.0, 22.0, 27.0, 24.0, 29.0, 45.0, 38.0, 32.0, 45.0, 48.0, 1059.0, 27.0, 42.0, 45.0, 38.0, 36.0, 36.0, 33.0, 39.0, 34.0, 26.0, 28.0, 20.0, 13.0, 10.0, 21.0, 4.0, 11.0, 13.0, 8.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9501953125, -1.8871002197265625, -1.824005126953125, -1.7609100341796875, -1.69781494140625, -1.6347198486328125, -1.571624755859375, -1.5085296630859375, -1.4454345703125, -1.3823394775390625, -1.319244384765625, -1.2561492919921875, -1.19305419921875, -1.1299591064453125, -1.066864013671875, -1.0037689208984375, -0.940673828125, -0.8775787353515625, -0.814483642578125, -0.7513885498046875, -0.68829345703125, -0.6251983642578125, -0.562103271484375, -0.4990081787109375, -0.4359130859375, -0.3728179931640625, -0.309722900390625, -0.2466278076171875, -0.18353271484375, -0.1204376220703125, -0.057342529296875, 0.0057525634765625, 0.06884765625, 0.1319427490234375, 0.195037841796875, 0.2581329345703125, 0.32122802734375, 0.3843231201171875, 0.447418212890625, 0.5105133056640625, 0.5736083984375, 0.6367034912109375, 0.699798583984375, 0.7628936767578125, 0.82598876953125, 0.8890838623046875, 0.952178955078125, 1.0152740478515625, 1.078369140625, 1.1414642333984375, 1.204559326171875, 1.2676544189453125, 1.33074951171875, 1.3938446044921875, 1.456939697265625, 1.5200347900390625, 1.5831298828125, 1.6462249755859375, 1.709320068359375, 1.7724151611328125, 1.83551025390625, 1.8986053466796875, 1.961700439453125, 2.0247955322265625, 2.087890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 8.0, 7.0, 13.0, 18.0, 31.0, 42.0, 57.0, 85.0, 127.0, 167.0, 223.0, 324.0, 475.0, 649.0, 886.0, 1265.0, 1787.0, 2500.0, 3505.0, 4984.0, 7190.0, 10328.0, 14731.0, 21608.0, 32597.0, 50173.0, 81698.0, 154147.0, 1314405.0, 155298.0, 82748.0, 50588.0, 32942.0, 22042.0, 14770.0, 10280.0, 7088.0, 4970.0, 3580.0, 2469.0, 1886.0, 1295.0, 915.0, 654.0, 475.0, 314.0, 237.0, 157.0, 125.0, 89.0, 62.0, 45.0, 25.0, 15.0, 17.0, 8.0, 10.0, 3.0, 2.0, 3.0], "bins": [-0.044769287109375, -0.043392181396484375, -0.04201507568359375, -0.040637969970703125, -0.0392608642578125, -0.037883758544921875, -0.03650665283203125, -0.035129547119140625, -0.03375244140625, -0.032375335693359375, -0.03099822998046875, -0.029621124267578125, -0.0282440185546875, -0.026866912841796875, -0.02548980712890625, -0.024112701416015625, -0.022735595703125, -0.021358489990234375, -0.01998138427734375, -0.018604278564453125, -0.0172271728515625, -0.015850067138671875, -0.01447296142578125, -0.013095855712890625, -0.01171875, -0.010341644287109375, -0.00896453857421875, -0.007587432861328125, -0.0062103271484375, -0.004833221435546875, -0.00345611572265625, -0.002079010009765625, -0.000701904296875, 0.000675201416015625, 0.00205230712890625, 0.003429412841796875, 0.0048065185546875, 0.006183624267578125, 0.00756072998046875, 0.008937835693359375, 0.01031494140625, 0.011692047119140625, 0.01306915283203125, 0.014446258544921875, 0.0158233642578125, 0.017200469970703125, 0.01857757568359375, 0.019954681396484375, 0.021331787109375, 0.022708892822265625, 0.02408599853515625, 0.025463104248046875, 0.0268402099609375, 0.028217315673828125, 0.02959442138671875, 0.030971527099609375, 0.0323486328125, 0.033725738525390625, 0.03510284423828125, 0.036479949951171875, 0.0378570556640625, 0.039234161376953125, 0.04061126708984375, 0.041988372802734375, 0.043365478515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 7.0, 16.0, 6.0, 12.0, 17.0, 34.0, 39.0, 37.0, 46.0, 53.0, 102.0, 116.0, 113.0, 73.0, 55.0, 52.0, 42.0, 31.0, 24.0, 20.0, 18.0, 11.0, 6.0, 11.0, 10.0, 4.0, 9.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004665851593017578, -0.00045050308108329773, -0.00043442100286483765, -0.00041833892464637756, -0.0004022568464279175, -0.0003861747682094574, -0.0003700926899909973, -0.00035401061177253723, -0.00033792853355407715, -0.00032184645533561707, -0.000305764377117157, -0.0002896822988986969, -0.0002736002206802368, -0.00025751814246177673, -0.00024143606424331665, -0.00022535398602485657, -0.00020927190780639648, -0.0001931898295879364, -0.00017710775136947632, -0.00016102567315101624, -0.00014494359493255615, -0.00012886151671409607, -0.00011277943849563599, -9.66973602771759e-05, -8.061528205871582e-05, -6.453320384025574e-05, -4.8451125621795654e-05, -3.236904740333557e-05, -1.6286969184875488e-05, -2.0489096641540527e-07, 1.5877187252044678e-05, 3.195926547050476e-05, 4.8041343688964844e-05, 6.412342190742493e-05, 8.020550012588501e-05, 9.628757834434509e-05, 0.00011236965656280518, 0.00012845173478126526, 0.00014453381299972534, 0.00016061589121818542, 0.0001766979694366455, 0.0001927800476551056, 0.00020886212587356567, 0.00022494420409202576, 0.00024102628231048584, 0.0002571083605289459, 0.000273190438747406, 0.0002892725169658661, 0.00030535459518432617, 0.00032143667340278625, 0.00033751875162124634, 0.0003536008298397064, 0.0003696829080581665, 0.0003857649862766266, 0.00040184706449508667, 0.00041792914271354675, 0.00043401122093200684, 0.0004500932991504669, 0.000466175377368927, 0.0004822574555873871, 0.0004983395338058472, 0.0005144216120243073, 0.0005305036902427673, 0.0005465857684612274, 0.0005626678466796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 1.0, 4.0, 7.0, 10.0, 15.0, 12.0, 19.0, 24.0, 25.0, 45.0, 67.0, 104.0, 194.0, 636.0, 3560.0, 31048.0, 657582.0, 330538.0, 20987.0, 2624.0, 524.0, 179.0, 99.0, 70.0, 43.0, 35.0, 23.0, 13.0, 15.0, 6.0, 14.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0091552734375, -0.008893072605133057, -0.008630871772766113, -0.00836867094039917, -0.008106470108032227, -0.007844269275665283, -0.00758206844329834, -0.0073198676109313965, -0.007057666778564453, -0.00679546594619751, -0.006533265113830566, -0.006271064281463623, -0.00600886344909668, -0.005746662616729736, -0.005484461784362793, -0.00522226095199585, -0.004960060119628906, -0.004697859287261963, -0.0044356584548950195, -0.004173457622528076, -0.003911256790161133, -0.0036490559577941895, -0.003386855125427246, -0.0031246542930603027, -0.0028624534606933594, -0.002600252628326416, -0.0023380517959594727, -0.0020758509635925293, -0.001813650131225586, -0.0015514492988586426, -0.0012892484664916992, -0.0010270476341247559, -0.0007648468017578125, -0.0005026459693908691, -0.00024044513702392578, 2.1755695343017578e-05, 0.00028395652770996094, 0.0005461573600769043, 0.0008083581924438477, 0.001070559024810791, 0.0013327598571777344, 0.0015949606895446777, 0.001857161521911621, 0.0021193623542785645, 0.002381563186645508, 0.002643764019012451, 0.0029059648513793945, 0.003168165683746338, 0.0034303665161132812, 0.0036925673484802246, 0.003954768180847168, 0.004216969013214111, 0.004479169845581055, 0.004741370677947998, 0.005003571510314941, 0.005265772342681885, 0.005527973175048828, 0.0057901740074157715, 0.006052374839782715, 0.006314575672149658, 0.0065767765045166016, 0.006838977336883545, 0.007101178169250488, 0.007363379001617432, 0.007625579833984375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 33.0, 377.0, 556.0, 37.0, 8.0], "bins": [-0.013181163929402828, -0.012965384870767593, -0.012749604880809784, -0.012533825822174549, -0.012318046763539314, -0.012102266773581505, -0.01188648771494627, -0.011670708656311035, -0.0114549295976758, -0.011239150539040565, -0.011023370549082756, -0.010807591490447521, -0.010591812431812286, -0.010376032441854477, -0.010160253383219242, -0.009944474324584007, -0.009728694334626198, -0.009512915275990963, -0.009297135286033154, -0.009081356227397919, -0.008865577168762684, -0.008649798110127449, -0.00843401812016964, -0.008218239061534405, -0.00800246000289917, -0.007786680478602648, -0.007570901419967413, -0.007355121895670891, -0.007139342837035656, -0.006923563312739134, -0.006707783788442612, -0.006492004729807377, -0.006276224739849567, -0.006060445215553045, -0.0058446661569178104, -0.005628886632621288, -0.0054131075739860535, -0.005197328049689531, -0.004981548525393009, -0.004765769466757774, -0.0045499904081225395, -0.004334210883826017, -0.0041184318251907825, -0.0039026523008942604, -0.003686873009428382, -0.0034710937179625034, -0.003255314426496625, -0.0030395351350307465, -0.0028237556107342243, -0.002607976319268346, -0.0023921970278024673, -0.002176417503505945, -0.0019606382120400667, -0.0017448589205741882, -0.0015290796291083097, -0.0013133002212271094, -0.001097520929761231, -0.0008817415800876915, -0.0006659622304141521, -0.00045018293894827366, -0.00023440358927473426, -1.862423960119486e-05, 0.00019715505186468363, 0.00041293445974588394, 0.0006287137512117624]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 12.0, 19.0, 17.0, 23.0, 25.0, 49.0, 46.0, 52.0, 70.0, 53.0, 60.0, 73.0, 73.0, 80.0, 50.0, 48.0, 45.0, 38.0, 47.0, 29.0, 25.0, 19.0, 10.0, 12.0, 12.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004439353942871094, -0.00042630359530448914, -0.0004086717963218689, -0.00039103999733924866, -0.0003734081983566284, -0.0003557763993740082, -0.00033814460039138794, -0.0003205128014087677, -0.00030288100242614746, -0.0002852492034435272, -0.000267617404460907, -0.00024998560547828674, -0.0002323538064956665, -0.00021472200751304626, -0.00019709020853042603, -0.00017945840954780579, -0.00016182661056518555, -0.0001441948115825653, -0.00012656301259994507, -0.00010893121361732483, -9.129941463470459e-05, -7.366761565208435e-05, -5.603581666946411e-05, -3.840401768684387e-05, -2.0772218704223633e-05, -3.1404197216033936e-06, 1.4491379261016846e-05, 3.2123178243637085e-05, 4.9754977226257324e-05, 6.738677620887756e-05, 8.50185751914978e-05, 0.00010265037417411804, 0.00012028217315673828, 0.00013791397213935852, 0.00015554577112197876, 0.000173177570104599, 0.00019080936908721924, 0.00020844116806983948, 0.00022607296705245972, 0.00024370476603507996, 0.0002613365650177002, 0.00027896836400032043, 0.0002966001629829407, 0.0003142319619655609, 0.00033186376094818115, 0.0003494955599308014, 0.00036712735891342163, 0.00038475915789604187, 0.0004023909568786621, 0.00042002275586128235, 0.0004376545548439026, 0.00045528635382652283, 0.00047291815280914307, 0.0004905499517917633, 0.0005081817507743835, 0.0005258135497570038, 0.000543445348739624, 0.0005610771477222443, 0.0005787089467048645, 0.0005963407456874847, 0.000613972544670105, 0.0006316043436527252, 0.0006492361426353455, 0.0006668679416179657, 0.0006844997406005859]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 9.0, 18.0, 14.0, 23.0, 33.0, 41.0, 37.0, 32.0, 45.0, 68.0, 66.0, 74.0, 66.0, 68.0, 59.0, 64.0, 49.0, 34.0, 47.0, 29.0, 31.0, 17.0, 19.0, 15.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.763671875, -3.65960693359375, -3.5555419921875, -3.45147705078125, -3.347412109375, -3.24334716796875, -3.1392822265625, -3.03521728515625, -2.93115234375, -2.82708740234375, -2.7230224609375, -2.61895751953125, -2.514892578125, -2.41082763671875, -2.3067626953125, -2.20269775390625, -2.0986328125, -1.99456787109375, -1.8905029296875, -1.78643798828125, -1.682373046875, -1.57830810546875, -1.4742431640625, -1.37017822265625, -1.26611328125, -1.16204833984375, -1.0579833984375, -0.95391845703125, -0.849853515625, -0.74578857421875, -0.6417236328125, -0.53765869140625, -0.43359375, -0.32952880859375, -0.2254638671875, -0.12139892578125, -0.017333984375, 0.08673095703125, 0.1907958984375, 0.29486083984375, 0.39892578125, 0.50299072265625, 0.6070556640625, 0.71112060546875, 0.815185546875, 0.91925048828125, 1.0233154296875, 1.12738037109375, 1.2314453125, 1.33551025390625, 1.4395751953125, 1.54364013671875, 1.647705078125, 1.75177001953125, 1.8558349609375, 1.95989990234375, 2.06396484375, 2.16802978515625, 2.2720947265625, 2.37615966796875, 2.480224609375, 2.58428955078125, 2.6883544921875, 2.79241943359375, 2.896484375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 13.0, 23.0, 38.0, 56.0, 105.0, 148.0, 300.0, 714.0, 1873.0, 5846.0, 26141.0, 622019.0, 362127.0, 21150.0, 4979.0, 1660.0, 649.0, 318.0, 163.0, 94.0, 43.0, 27.0, 11.0, 15.0, 8.0, 10.0, 11.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.1639404296875, -11.695068359375, -11.2261962890625, -10.75732421875, -10.2884521484375, -9.819580078125, -9.3507080078125, -8.8818359375, -8.4129638671875, -7.944091796875, -7.4752197265625, -7.00634765625, -6.5374755859375, -6.068603515625, -5.5997314453125, -5.130859375, -4.6619873046875, -4.193115234375, -3.7242431640625, -3.25537109375, -2.7864990234375, -2.317626953125, -1.8487548828125, -1.3798828125, -0.9110107421875, -0.442138671875, 0.0267333984375, 0.49560546875, 0.9644775390625, 1.433349609375, 1.9022216796875, 2.37109375, 2.8399658203125, 3.308837890625, 3.7777099609375, 4.24658203125, 4.7154541015625, 5.184326171875, 5.6531982421875, 6.1220703125, 6.5909423828125, 7.059814453125, 7.5286865234375, 7.99755859375, 8.4664306640625, 8.935302734375, 9.4041748046875, 9.873046875, 10.3419189453125, 10.810791015625, 11.2796630859375, 11.74853515625, 12.2174072265625, 12.686279296875, 13.1551513671875, 13.6240234375, 14.0928955078125, 14.561767578125, 15.0306396484375, 15.49951171875, 15.9683837890625, 16.437255859375, 16.9061279296875, 17.375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 7.0, 8.0, 15.0, 16.0, 12.0, 10.0, 21.0, 27.0, 26.0, 26.0, 29.0, 28.0, 39.0, 41.0, 43.0, 67.0, 86.0, 126.0, 244.0, 1408.0, 158.0, 94.0, 87.0, 58.0, 50.0, 43.0, 30.0, 31.0, 24.0, 25.0, 19.0, 20.0, 16.0, 15.0, 15.0, 17.0, 7.0, 8.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-7.125, -6.90362548828125, -6.6822509765625, -6.46087646484375, -6.239501953125, -6.01812744140625, -5.7967529296875, -5.57537841796875, -5.35400390625, -5.13262939453125, -4.9112548828125, -4.68988037109375, -4.468505859375, -4.24713134765625, -4.0257568359375, -3.80438232421875, -3.5830078125, -3.36163330078125, -3.1402587890625, -2.91888427734375, -2.697509765625, -2.47613525390625, -2.2547607421875, -2.03338623046875, -1.81201171875, -1.59063720703125, -1.3692626953125, -1.14788818359375, -0.926513671875, -0.70513916015625, -0.4837646484375, -0.26239013671875, -0.041015625, 0.18035888671875, 0.4017333984375, 0.62310791015625, 0.844482421875, 1.06585693359375, 1.2872314453125, 1.50860595703125, 1.72998046875, 1.95135498046875, 2.1727294921875, 2.39410400390625, 2.615478515625, 2.83685302734375, 3.0582275390625, 3.27960205078125, 3.5009765625, 3.72235107421875, 3.9437255859375, 4.16510009765625, 4.386474609375, 4.60784912109375, 4.8292236328125, 5.05059814453125, 5.27197265625, 5.49334716796875, 5.7147216796875, 5.93609619140625, 6.157470703125, 6.37884521484375, 6.6002197265625, 6.82159423828125, 7.04296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 7.0, 11.0, 10.0, 23.0, 23.0, 23.0, 28.0, 44.0, 59.0, 64.0, 153.0, 245.0, 479.0, 840.0, 2035.0, 5015.0, 15814.0, 105030.0, 2362323.0, 597527.0, 40466.0, 9261.0, 3223.0, 1389.0, 655.0, 323.0, 187.0, 115.0, 65.0, 69.0, 48.0, 17.0, 19.0, 17.0, 22.0, 14.0, 14.0, 8.0, 5.0, 10.0, 8.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.0859375, -10.7371826171875, -10.388427734375, -10.0396728515625, -9.69091796875, -9.3421630859375, -8.993408203125, -8.6446533203125, -8.2958984375, -7.9471435546875, -7.598388671875, -7.2496337890625, -6.90087890625, -6.5521240234375, -6.203369140625, -5.8546142578125, -5.505859375, -5.1571044921875, -4.808349609375, -4.4595947265625, -4.11083984375, -3.7620849609375, -3.413330078125, -3.0645751953125, -2.7158203125, -2.3670654296875, -2.018310546875, -1.6695556640625, -1.32080078125, -0.9720458984375, -0.623291015625, -0.2745361328125, 0.07421875, 0.4229736328125, 0.771728515625, 1.1204833984375, 1.46923828125, 1.8179931640625, 2.166748046875, 2.5155029296875, 2.8642578125, 3.2130126953125, 3.561767578125, 3.9105224609375, 4.25927734375, 4.6080322265625, 4.956787109375, 5.3055419921875, 5.654296875, 6.0030517578125, 6.351806640625, 6.7005615234375, 7.04931640625, 7.3980712890625, 7.746826171875, 8.0955810546875, 8.4443359375, 8.7930908203125, 9.141845703125, 9.4906005859375, 9.83935546875, 10.1881103515625, 10.536865234375, 10.8856201171875, 11.234375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 123.0, 610.0, 265.0, 17.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53078842163086, -25.123645782470703, -20.716503143310547, -16.309358596801758, -11.902215957641602, -7.495073318481445, -3.0879287719726562, 1.3192138671875, 5.726356506347656, 10.133499145507812, 14.540642738342285, 18.947786331176758, 23.354928970336914, 27.76207160949707, 32.16921615600586, 36.576358795166016, 40.98350143432617, 45.39064407348633, 49.797786712646484, 54.204933166503906, 58.61207580566406, 63.01921844482422, 67.42636108398438, 71.83350372314453, 76.24064636230469, 80.64778900146484, 85.054931640625, 89.46207427978516, 93.86921691894531, 98.27635955810547, 102.68350219726562, 107.09065246582031, 111.497802734375, 115.90494537353516, 120.31208801269531, 124.71923065185547, 129.12637329101562, 133.5335235595703, 137.94065856933594, 142.34780883789062, 146.75494384765625, 151.16209411621094, 155.56922912597656, 159.97637939453125, 164.38351440429688, 168.79066467285156, 173.1977996826172, 177.60494995117188, 182.0120849609375, 186.4192352294922, 190.8263702392578, 195.2335205078125, 199.64065551757812, 204.0478057861328, 208.45494079589844, 212.86209106445312, 217.2692413330078, 221.6763916015625, 226.08352661132812, 230.4906768798828, 234.89781188964844, 239.30496215820312, 243.71209716796875, 248.11924743652344, 252.52638244628906]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 5.0, 13.0, 4.0, 8.0, 16.0, 18.0, 18.0, 15.0, 25.0, 25.0, 32.0, 24.0, 32.0, 34.0, 26.0, 32.0, 39.0, 40.0, 47.0, 43.0, 41.0, 42.0, 38.0, 44.0, 41.0, 36.0, 34.0, 31.0, 40.0, 27.0, 26.0, 23.0, 20.0, 12.0, 9.0, 8.0, 10.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.002681732177734, -27.202951431274414, -26.403223037719727, -25.603492736816406, -24.803762435913086, -24.004032135009766, -23.204303741455078, -22.404573440551758, -21.604843139648438, -20.805112838745117, -20.00538444519043, -19.20565414428711, -18.40592384338379, -17.60619354248047, -16.80646514892578, -16.00673484802246, -15.207006454467773, -14.40727710723877, -13.60754680633545, -12.807817459106445, -12.008087158203125, -11.208357810974121, -10.408628463745117, -9.608898162841797, -8.809168815612793, -8.009439468383789, -7.209709167480469, -6.409979820251465, -5.610249996185303, -4.810520172119141, -4.010790824890137, -3.2110610008239746, -2.4113311767578125, -1.61160147190094, -0.8118717670440674, -0.012142181396484375, 0.7875876426696777, 1.5873174667358398, 2.3870468139648438, 3.186776638031006, 3.986506462097168, 4.78623628616333, 5.585966110229492, 6.385695457458496, 7.185425281524658, 7.98515510559082, 8.784884452819824, 9.584613800048828, 10.384344100952148, 11.184073448181152, 11.983803749084473, 12.783533096313477, 13.583263397216797, 14.3829927444458, 15.182722091674805, 15.982452392578125, 16.782180786132812, 17.581911087036133, 18.38163948059082, 19.18136978149414, 19.98110008239746, 20.78083038330078, 21.58055877685547, 22.38028907775879, 23.18001937866211]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 6.0, 11.0, 10.0, 10.0, 23.0, 15.0, 28.0, 38.0, 41.0, 37.0, 44.0, 49.0, 59.0, 69.0, 65.0, 64.0, 59.0, 62.0, 50.0, 55.0, 38.0, 42.0, 33.0, 24.0, 17.0, 21.0, 10.0, 8.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.744140625, -3.639495849609375, -3.53485107421875, -3.430206298828125, -3.3255615234375, -3.220916748046875, -3.11627197265625, -3.011627197265625, -2.906982421875, -2.802337646484375, -2.69769287109375, -2.593048095703125, -2.4884033203125, -2.383758544921875, -2.27911376953125, -2.174468994140625, -2.06982421875, -1.965179443359375, -1.86053466796875, -1.755889892578125, -1.6512451171875, -1.546600341796875, -1.44195556640625, -1.337310791015625, -1.232666015625, -1.128021240234375, -1.02337646484375, -0.918731689453125, -0.8140869140625, -0.709442138671875, -0.60479736328125, -0.500152587890625, -0.3955078125, -0.290863037109375, -0.18621826171875, -0.081573486328125, 0.0230712890625, 0.127716064453125, 0.23236083984375, 0.337005615234375, 0.441650390625, 0.546295166015625, 0.65093994140625, 0.755584716796875, 0.8602294921875, 0.964874267578125, 1.06951904296875, 1.174163818359375, 1.27880859375, 1.383453369140625, 1.48809814453125, 1.592742919921875, 1.6973876953125, 1.802032470703125, 1.90667724609375, 2.011322021484375, 2.115966796875, 2.220611572265625, 2.32525634765625, 2.429901123046875, 2.5345458984375, 2.639190673828125, 2.74383544921875, 2.848480224609375, 2.953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 14.0, 13.0, 18.0, 30.0, 23.0, 42.0, 58.0, 91.0, 146.0, 231.0, 337.0, 618.0, 1044.0, 2002.0, 4180.0, 10924.0, 43867.0, 447295.0, 3076650.0, 533544.0, 52369.0, 12286.0, 4413.0, 1958.0, 951.0, 450.0, 269.0, 149.0, 110.0, 57.0, 46.0, 29.0, 15.0, 10.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-10.96875, -10.6981201171875, -10.427490234375, -10.1568603515625, -9.88623046875, -9.6156005859375, -9.344970703125, -9.0743408203125, -8.8037109375, -8.5330810546875, -8.262451171875, -7.9918212890625, -7.72119140625, -7.4505615234375, -7.179931640625, -6.9093017578125, -6.638671875, -6.3680419921875, -6.097412109375, -5.8267822265625, -5.55615234375, -5.2855224609375, -5.014892578125, -4.7442626953125, -4.4736328125, -4.2030029296875, -3.932373046875, -3.6617431640625, -3.39111328125, -3.1204833984375, -2.849853515625, -2.5792236328125, -2.30859375, -2.0379638671875, -1.767333984375, -1.4967041015625, -1.22607421875, -0.9554443359375, -0.684814453125, -0.4141845703125, -0.1435546875, 0.1270751953125, 0.397705078125, 0.6683349609375, 0.93896484375, 1.2095947265625, 1.480224609375, 1.7508544921875, 2.021484375, 2.2921142578125, 2.562744140625, 2.8333740234375, 3.10400390625, 3.3746337890625, 3.645263671875, 3.9158935546875, 4.1865234375, 4.4571533203125, 4.727783203125, 4.9984130859375, 5.26904296875, 5.5396728515625, 5.810302734375, 6.0809326171875, 6.3515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 8.0, 15.0, 19.0, 23.0, 36.0, 61.0, 74.0, 108.0, 178.0, 284.0, 410.0, 557.0, 610.0, 520.0, 380.0, 249.0, 168.0, 96.0, 67.0, 40.0, 34.0, 29.0, 23.0, 20.0, 10.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.84375, -7.6151123046875, -7.386474609375, -7.1578369140625, -6.92919921875, -6.7005615234375, -6.471923828125, -6.2432861328125, -6.0146484375, -5.7860107421875, -5.557373046875, -5.3287353515625, -5.10009765625, -4.8714599609375, -4.642822265625, -4.4141845703125, -4.185546875, -3.9569091796875, -3.728271484375, -3.4996337890625, -3.27099609375, -3.0423583984375, -2.813720703125, -2.5850830078125, -2.3564453125, -2.1278076171875, -1.899169921875, -1.6705322265625, -1.44189453125, -1.2132568359375, -0.984619140625, -0.7559814453125, -0.52734375, -0.2987060546875, -0.070068359375, 0.1585693359375, 0.38720703125, 0.6158447265625, 0.844482421875, 1.0731201171875, 1.3017578125, 1.5303955078125, 1.759033203125, 1.9876708984375, 2.21630859375, 2.4449462890625, 2.673583984375, 2.9022216796875, 3.130859375, 3.3594970703125, 3.588134765625, 3.8167724609375, 4.04541015625, 4.2740478515625, 4.502685546875, 4.7313232421875, 4.9599609375, 5.1885986328125, 5.417236328125, 5.6458740234375, 5.87451171875, 6.1031494140625, 6.331787109375, 6.5604248046875, 6.7890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 12.0, 6.0, 16.0, 13.0, 22.0, 37.0, 53.0, 88.0, 142.0, 238.0, 350.0, 509.0, 991.0, 1620.0, 2960.0, 5593.0, 11994.0, 30629.0, 107764.0, 563199.0, 2313327.0, 920573.0, 162601.0, 41484.0, 15036.0, 6843.0, 3403.0, 1930.0, 1126.0, 631.0, 367.0, 230.0, 197.0, 103.0, 55.0, 49.0, 22.0, 13.0, 16.0, 12.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.59375, -8.313232421875, -8.03271484375, -7.752197265625, -7.4716796875, -7.191162109375, -6.91064453125, -6.630126953125, -6.349609375, -6.069091796875, -5.78857421875, -5.508056640625, -5.2275390625, -4.947021484375, -4.66650390625, -4.385986328125, -4.10546875, -3.824951171875, -3.54443359375, -3.263916015625, -2.9833984375, -2.702880859375, -2.42236328125, -2.141845703125, -1.861328125, -1.580810546875, -1.30029296875, -1.019775390625, -0.7392578125, -0.458740234375, -0.17822265625, 0.102294921875, 0.3828125, 0.663330078125, 0.94384765625, 1.224365234375, 1.5048828125, 1.785400390625, 2.06591796875, 2.346435546875, 2.626953125, 2.907470703125, 3.18798828125, 3.468505859375, 3.7490234375, 4.029541015625, 4.31005859375, 4.590576171875, 4.87109375, 5.151611328125, 5.43212890625, 5.712646484375, 5.9931640625, 6.273681640625, 6.55419921875, 6.834716796875, 7.115234375, 7.395751953125, 7.67626953125, 7.956787109375, 8.2373046875, 8.517822265625, 8.79833984375, 9.078857421875, 9.359375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 17.0, 22.0, 43.0, 62.0, 93.0, 117.0, 119.0, 137.0, 102.0, 105.0, 67.0, 36.0, 29.0, 16.0, 16.0, 5.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.916015625, -45.53499221801758, -44.153968811035156, -42.77294158935547, -41.39191818237305, -40.010894775390625, -38.6298713684082, -37.24884796142578, -35.867820739746094, -34.48679733276367, -33.10577392578125, -31.724748611450195, -30.34372329711914, -28.96269989013672, -27.581676483154297, -26.200653076171875, -24.819629669189453, -23.43860626220703, -22.057580947875977, -20.676557540893555, -19.2955322265625, -17.914508819580078, -16.533485412597656, -15.152461051940918, -13.77143669128418, -12.390412330627441, -11.009387969970703, -9.628364562988281, -8.247340202331543, -6.866315841674805, -5.485292434692383, -4.1042680740356445, -2.723247528076172, -1.3422234058380127, 0.038800716400146484, 1.4198246002197266, 2.800848960876465, 4.181873321533203, 5.562896728515625, 6.943921089172363, 8.324945449829102, 9.70596981048584, 11.086994171142578, 12.468017578125, 13.849041938781738, 15.230066299438477, 16.6110897064209, 17.992115020751953, 19.373138427734375, 20.754161834716797, 22.13518714904785, 23.516210556030273, 24.897235870361328, 26.27825927734375, 27.659282684326172, 29.040306091308594, 30.42133140563965, 31.80235481262207, 33.183380126953125, 34.56440353393555, 35.94542694091797, 37.326454162597656, 38.70747375488281, 40.0885009765625, 41.46952438354492]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 13.0, 5.0, 5.0, 8.0, 14.0, 16.0, 20.0, 15.0, 16.0, 22.0, 25.0, 22.0, 22.0, 25.0, 30.0, 36.0, 36.0, 44.0, 44.0, 33.0, 37.0, 34.0, 39.0, 44.0, 36.0, 40.0, 35.0, 46.0, 49.0, 27.0, 24.0, 25.0, 30.0, 11.0, 11.0, 14.0, 10.0, 10.0, 5.0, 7.0, 3.0, 7.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.16278839111328, -19.51471710205078, -18.86664581298828, -18.21857452392578, -17.57050323486328, -16.92243003845215, -16.27435874938965, -15.626287460327148, -14.978216171264648, -14.330144882202148, -13.682073593139648, -13.034001350402832, -12.385930061340332, -11.737858772277832, -11.089786529541016, -10.441715240478516, -9.793643951416016, -9.145572662353516, -8.497501373291016, -7.849429130554199, -7.201357841491699, -6.553286552429199, -5.905214786529541, -5.257143020629883, -4.609071731567383, -3.9610002040863037, -3.3129286766052246, -2.6648571491241455, -2.0167856216430664, -1.3687140941619873, -0.7206425666809082, -0.07257080078125, 0.57550048828125, 1.223572015762329, 1.8716435432434082, 2.5197150707244873, 3.1677865982055664, 3.8158581256866455, 4.463929653167725, 5.112001419067383, 5.760072708129883, 6.408143997192383, 7.056215763092041, 7.704287528991699, 8.3523588180542, 9.0004301071167, 9.648502349853516, 10.296573638916016, 10.944644927978516, 11.592716217041016, 12.240787506103516, 12.888859748840332, 13.536931037902832, 14.185002326965332, 14.833074569702148, 15.481145858764648, 16.12921714782715, 16.77728843688965, 17.42535972595215, 18.07343101501465, 18.72150421142578, 19.36957550048828, 20.01764678955078, 20.66571807861328, 21.31378936767578]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 9.0, 18.0, 23.0, 26.0, 32.0, 42.0, 38.0, 50.0, 44.0, 44.0, 70.0, 77.0, 50.0, 71.0, 54.0, 63.0, 48.0, 37.0, 34.0, 31.0, 29.0, 16.0, 14.0, 20.0, 12.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.46875, -3.366546630859375, -3.26434326171875, -3.162139892578125, -3.0599365234375, -2.957733154296875, -2.85552978515625, -2.753326416015625, -2.651123046875, -2.548919677734375, -2.44671630859375, -2.344512939453125, -2.2423095703125, -2.140106201171875, -2.03790283203125, -1.935699462890625, -1.83349609375, -1.731292724609375, -1.62908935546875, -1.526885986328125, -1.4246826171875, -1.322479248046875, -1.22027587890625, -1.118072509765625, -1.015869140625, -0.913665771484375, -0.81146240234375, -0.709259033203125, -0.6070556640625, -0.504852294921875, -0.40264892578125, -0.300445556640625, -0.1982421875, -0.096038818359375, 0.00616455078125, 0.108367919921875, 0.2105712890625, 0.312774658203125, 0.41497802734375, 0.517181396484375, 0.619384765625, 0.721588134765625, 0.82379150390625, 0.925994873046875, 1.0281982421875, 1.130401611328125, 1.23260498046875, 1.334808349609375, 1.43701171875, 1.539215087890625, 1.64141845703125, 1.743621826171875, 1.8458251953125, 1.948028564453125, 2.05023193359375, 2.152435302734375, 2.254638671875, 2.356842041015625, 2.45904541015625, 2.561248779296875, 2.6634521484375, 2.765655517578125, 2.86785888671875, 2.970062255859375, 3.072265625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 6.0, 8.0, 12.0, 8.0, 26.0, 31.0, 50.0, 64.0, 80.0, 116.0, 191.0, 283.0, 447.0, 752.0, 1123.0, 1870.0, 3150.0, 5411.0, 9506.0, 17487.0, 33640.0, 67951.0, 156767.0, 413716.0, 179595.0, 75082.0, 36941.0, 19340.0, 10426.0, 5838.0, 3354.0, 1949.0, 1209.0, 743.0, 445.0, 300.0, 204.0, 129.0, 98.0, 63.0, 53.0, 20.0, 19.0, 15.0, 15.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.200439453125, -0.1940898895263672, -0.18774032592773438, -0.18139076232910156, -0.17504119873046875, -0.16869163513183594, -0.16234207153320312, -0.1559925079345703, -0.1496429443359375, -0.1432933807373047, -0.13694381713867188, -0.13059425354003906, -0.12424468994140625, -0.11789512634277344, -0.11154556274414062, -0.10519599914550781, -0.098846435546875, -0.09249687194824219, -0.08614730834960938, -0.07979774475097656, -0.07344818115234375, -0.06709861755371094, -0.060749053955078125, -0.05439949035644531, -0.0480499267578125, -0.04170036315917969, -0.035350799560546875, -0.029001235961914062, -0.02265167236328125, -0.016302108764648438, -0.009952545166015625, -0.0036029815673828125, 0.00274658203125, 0.009096145629882812, 0.015445709228515625, 0.021795272827148438, 0.02814483642578125, 0.03449440002441406, 0.040843963623046875, 0.04719352722167969, 0.0535430908203125, 0.05989265441894531, 0.06624221801757812, 0.07259178161621094, 0.07894134521484375, 0.08529090881347656, 0.09164047241210938, 0.09799003601074219, 0.104339599609375, 0.11068916320800781, 0.11703872680664062, 0.12338829040527344, 0.12973785400390625, 0.13608741760253906, 0.14243698120117188, 0.1487865447998047, 0.1551361083984375, 0.1614856719970703, 0.16783523559570312, 0.17418479919433594, 0.18053436279296875, 0.18688392639160156, 0.19323348999023438, 0.1995830535888672, 0.2059326171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 5.0, 10.0, 8.0, 12.0, 10.0, 12.0, 15.0, 27.0, 23.0, 23.0, 22.0, 18.0, 37.0, 31.0, 36.0, 37.0, 46.0, 45.0, 37.0, 35.0, 1064.0, 48.0, 46.0, 37.0, 39.0, 29.0, 33.0, 30.0, 19.0, 31.0, 26.0, 21.0, 23.0, 19.0, 16.0, 10.0, 10.0, 14.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.404296875, -2.33380126953125, -2.2633056640625, -2.19281005859375, -2.122314453125, -2.05181884765625, -1.9813232421875, -1.91082763671875, -1.84033203125, -1.76983642578125, -1.6993408203125, -1.62884521484375, -1.558349609375, -1.48785400390625, -1.4173583984375, -1.34686279296875, -1.2763671875, -1.20587158203125, -1.1353759765625, -1.06488037109375, -0.994384765625, -0.92388916015625, -0.8533935546875, -0.78289794921875, -0.71240234375, -0.64190673828125, -0.5714111328125, -0.50091552734375, -0.430419921875, -0.35992431640625, -0.2894287109375, -0.21893310546875, -0.1484375, -0.07794189453125, -0.0074462890625, 0.06304931640625, 0.133544921875, 0.20404052734375, 0.2745361328125, 0.34503173828125, 0.41552734375, 0.48602294921875, 0.5565185546875, 0.62701416015625, 0.697509765625, 0.76800537109375, 0.8385009765625, 0.90899658203125, 0.9794921875, 1.04998779296875, 1.1204833984375, 1.19097900390625, 1.261474609375, 1.33197021484375, 1.4024658203125, 1.47296142578125, 1.54345703125, 1.61395263671875, 1.6844482421875, 1.75494384765625, 1.825439453125, 1.89593505859375, 1.9664306640625, 2.03692626953125, 2.107421875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 10.0, 18.0, 24.0, 32.0, 51.0, 77.0, 110.0, 149.0, 216.0, 324.0, 473.0, 671.0, 1032.0, 1545.0, 2330.0, 3279.0, 4763.0, 7101.0, 10474.0, 16130.0, 24501.0, 38090.0, 60583.0, 101898.0, 293096.0, 1226912.0, 115609.0, 66605.0, 41446.0, 26529.0, 17327.0, 11643.0, 7685.0, 5165.0, 3542.0, 2333.0, 1670.0, 1116.0, 773.0, 594.0, 387.0, 265.0, 176.0, 125.0, 85.0, 53.0, 44.0, 22.0, 15.0, 11.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.05377197265625, -0.05214738845825195, -0.050522804260253906, -0.04889822006225586, -0.04727363586425781, -0.045649051666259766, -0.04402446746826172, -0.04239988327026367, -0.040775299072265625, -0.03915071487426758, -0.03752613067626953, -0.035901546478271484, -0.03427696228027344, -0.03265237808227539, -0.031027793884277344, -0.029403209686279297, -0.02777862548828125, -0.026154041290283203, -0.024529457092285156, -0.02290487289428711, -0.021280288696289062, -0.019655704498291016, -0.01803112030029297, -0.016406536102294922, -0.014781951904296875, -0.013157367706298828, -0.011532783508300781, -0.009908199310302734, -0.008283615112304688, -0.006659030914306641, -0.005034446716308594, -0.003409862518310547, -0.0017852783203125, -0.00016069412231445312, 0.0014638900756835938, 0.0030884742736816406, 0.0047130584716796875, 0.006337642669677734, 0.007962226867675781, 0.009586811065673828, 0.011211395263671875, 0.012835979461669922, 0.014460563659667969, 0.016085147857666016, 0.017709732055664062, 0.01933431625366211, 0.020958900451660156, 0.022583484649658203, 0.02420806884765625, 0.025832653045654297, 0.027457237243652344, 0.02908182144165039, 0.030706405639648438, 0.032330989837646484, 0.03395557403564453, 0.03558015823364258, 0.037204742431640625, 0.03882932662963867, 0.04045391082763672, 0.042078495025634766, 0.04370307922363281, 0.04532766342163086, 0.046952247619628906, 0.04857683181762695, 0.050201416015625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 8.0, 7.0, 8.0, 22.0, 23.0, 30.0, 29.0, 33.0, 54.0, 62.0, 79.0, 103.0, 125.0, 96.0, 65.0, 45.0, 39.0, 31.0, 24.0, 18.0, 21.0, 14.0, 14.0, 8.0, 5.0, 3.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004258155822753906, -0.0004117041826248169, -0.00039759278297424316, -0.00038348138332366943, -0.0003693699836730957, -0.00035525858402252197, -0.00034114718437194824, -0.0003270357847213745, -0.0003129243850708008, -0.00029881298542022705, -0.0002847015857696533, -0.0002705901861190796, -0.00025647878646850586, -0.00024236738681793213, -0.0002282559871673584, -0.00021414458751678467, -0.00020003318786621094, -0.0001859217882156372, -0.00017181038856506348, -0.00015769898891448975, -0.00014358758926391602, -0.00012947618961334229, -0.00011536478996276855, -0.00010125339031219482, -8.71419906616211e-05, -7.303059101104736e-05, -5.891919136047363e-05, -4.48077917098999e-05, -3.069639205932617e-05, -1.658499240875244e-05, -2.473592758178711e-06, 1.163780689239502e-05, 2.574920654296875e-05, 3.986060619354248e-05, 5.397200584411621e-05, 6.808340549468994e-05, 8.219480514526367e-05, 9.63062047958374e-05, 0.00011041760444641113, 0.00012452900409698486, 0.0001386404037475586, 0.00015275180339813232, 0.00016686320304870605, 0.00018097460269927979, 0.00019508600234985352, 0.00020919740200042725, 0.00022330880165100098, 0.0002374202013015747, 0.00025153160095214844, 0.00026564300060272217, 0.0002797544002532959, 0.00029386579990386963, 0.00030797719955444336, 0.0003220885992050171, 0.0003361999988555908, 0.00035031139850616455, 0.0003644227981567383, 0.000378534197807312, 0.00039264559745788574, 0.00040675699710845947, 0.0004208683967590332, 0.00043497979640960693, 0.00044909119606018066, 0.0004632025957107544, 0.0004773139953613281]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 2.0, 13.0, 10.0, 22.0, 32.0, 47.0, 68.0, 127.0, 224.0, 502.0, 1012.0, 2730.0, 7495.0, 22073.0, 76060.0, 497217.0, 347652.0, 63470.0, 18871.0, 6555.0, 2432.0, 983.0, 411.0, 162.0, 117.0, 85.0, 56.0, 23.0, 27.0, 21.0, 11.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0084991455078125, -0.008248686790466309, -0.007998228073120117, -0.007747769355773926, -0.007497310638427734, -0.007246851921081543, -0.0069963932037353516, -0.00674593448638916, -0.006495475769042969, -0.006245017051696777, -0.005994558334350586, -0.0057440996170043945, -0.005493640899658203, -0.005243182182312012, -0.00499272346496582, -0.004742264747619629, -0.0044918060302734375, -0.004241347312927246, -0.003990888595581055, -0.0037404298782348633, -0.003489971160888672, -0.0032395124435424805, -0.002989053726196289, -0.0027385950088500977, -0.0024881362915039062, -0.002237677574157715, -0.0019872188568115234, -0.001736760139465332, -0.0014863014221191406, -0.0012358427047729492, -0.0009853839874267578, -0.0007349252700805664, -0.000484466552734375, -0.0002340078353881836, 1.6450881958007812e-05, 0.0002669095993041992, 0.0005173683166503906, 0.000767827033996582, 0.0010182857513427734, 0.0012687444686889648, 0.0015192031860351562, 0.0017696619033813477, 0.002020120620727539, 0.0022705793380737305, 0.002521038055419922, 0.0027714967727661133, 0.0030219554901123047, 0.003272414207458496, 0.0035228729248046875, 0.003773331642150879, 0.00402379035949707, 0.004274249076843262, 0.004524707794189453, 0.0047751665115356445, 0.005025625228881836, 0.005276083946228027, 0.005526542663574219, 0.00577700138092041, 0.0060274600982666016, 0.006277918815612793, 0.006528377532958984, 0.006778836250305176, 0.007029294967651367, 0.007279753684997559, 0.00753021240234375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 31.0, 94.0, 480.0, 283.0, 73.0, 19.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011955345049500465, -0.011669577099382877, -0.01138380914926529, -0.011098040267825127, -0.010812272317707539, -0.01052650436758995, -0.010240736417472363, -0.009954968467354774, -0.009669199585914612, -0.009383431635797024, -0.009097663685679436, -0.008811894804239273, -0.008526126854121685, -0.008240358904004097, -0.007954590953886509, -0.007668822538107634, -0.0073830545879900455, -0.0070972866378724575, -0.006811518222093582, -0.006525750271975994, -0.006239981856197119, -0.005954213906079531, -0.005668445490300655, -0.005382677540183067, -0.005096909590065479, -0.004811141639947891, -0.004525373224169016, -0.004239605274051428, -0.0039538368582725525, -0.0036680689081549644, -0.0033823007252067327, -0.003096532542258501, -0.0028107636608183384, -0.0025249954778701067, -0.002239227294921875, -0.001953459344804287, -0.0016676910454407334, -0.0013819228624925017, -0.0010961547959595919, -0.0008103866130113602, -0.0005246184300631285, -0.00023885027621872723, 4.691787762567401e-05, 0.0003326860023662448, 0.0006184541853144765, 0.0009042223682627082, 0.001189990434795618, 0.0014757586177438498, 0.0017615268006920815, 0.002047294983640313, 0.002333063166588545, 0.002618831116706133, 0.0029045995324850082, 0.0031903674826025963, 0.003476135665550828, 0.0037619038484990597, 0.004047672264277935, 0.004333440214395523, 0.004619208630174398, 0.0049049765802919865, 0.005190744996070862, 0.00547651294618845, 0.005762280896306038, 0.006048049312084913, 0.006333817262202501]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 5.0, 6.0, 3.0, 19.0, 20.0, 18.0, 25.0, 40.0, 36.0, 50.0, 54.0, 64.0, 49.0, 72.0, 82.0, 59.0, 59.0, 61.0, 62.0, 50.0, 37.0, 24.0, 27.0, 24.0, 14.0, 9.0, 10.0, 5.0, 7.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041168928146362305, -0.00039730407297611237, -0.0003829188644886017, -0.000368533656001091, -0.0003541484475135803, -0.00033976323902606964, -0.00032537803053855896, -0.0003109928220510483, -0.0002966076135635376, -0.0002822224050760269, -0.00026783719658851624, -0.00025345198810100555, -0.00023906677961349487, -0.0002246815711259842, -0.0002102963626384735, -0.00019591115415096283, -0.00018152594566345215, -0.00016714073717594147, -0.00015275552868843079, -0.0001383703202009201, -0.00012398511171340942, -0.00010959990322589874, -9.521469473838806e-05, -8.082948625087738e-05, -6.64442777633667e-05, -5.205906927585602e-05, -3.767386078834534e-05, -2.3288652300834656e-05, -8.903443813323975e-06, 5.4817646741867065e-06, 1.9866973161697388e-05, 3.425218164920807e-05, 4.863739013671875e-05, 6.302259862422943e-05, 7.740780711174011e-05, 9.17930155992508e-05, 0.00010617822408676147, 0.00012056343257427216, 0.00013494864106178284, 0.00014933384954929352, 0.0001637190580368042, 0.00017810426652431488, 0.00019248947501182556, 0.00020687468349933624, 0.00022125989198684692, 0.0002356451004743576, 0.0002500303089618683, 0.00026441551744937897, 0.00027880072593688965, 0.00029318593442440033, 0.000307571142911911, 0.0003219563513994217, 0.0003363415598869324, 0.00035072676837444305, 0.00036511197686195374, 0.0003794971853494644, 0.0003938823938369751, 0.0004082676023244858, 0.00042265281081199646, 0.00043703801929950714, 0.0004514232277870178, 0.0004658084362745285, 0.0004801936447620392, 0.0004945788532495499, 0.0005089640617370605]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 9.0, 18.0, 23.0, 26.0, 32.0, 41.0, 39.0, 50.0, 44.0, 44.0, 70.0, 77.0, 50.0, 71.0, 55.0, 62.0, 48.0, 37.0, 34.0, 31.0, 29.0, 16.0, 14.0, 20.0, 12.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.46875, -3.366546630859375, -3.26434326171875, -3.162139892578125, -3.0599365234375, -2.957733154296875, -2.85552978515625, -2.753326416015625, -2.651123046875, -2.548919677734375, -2.44671630859375, -2.344512939453125, -2.2423095703125, -2.140106201171875, -2.03790283203125, -1.935699462890625, -1.83349609375, -1.731292724609375, -1.62908935546875, -1.526885986328125, -1.4246826171875, -1.322479248046875, -1.22027587890625, -1.118072509765625, -1.015869140625, -0.913665771484375, -0.81146240234375, -0.709259033203125, -0.6070556640625, -0.504852294921875, -0.40264892578125, -0.300445556640625, -0.1982421875, -0.096038818359375, 0.00616455078125, 0.108367919921875, 0.2105712890625, 0.312774658203125, 0.41497802734375, 0.517181396484375, 0.619384765625, 0.721588134765625, 0.82379150390625, 0.925994873046875, 1.0281982421875, 1.130401611328125, 1.23260498046875, 1.334808349609375, 1.43701171875, 1.539215087890625, 1.64141845703125, 1.743621826171875, 1.8458251953125, 1.948028564453125, 2.05023193359375, 2.152435302734375, 2.254638671875, 2.356842041015625, 2.45904541015625, 2.561248779296875, 2.6634521484375, 2.765655517578125, 2.86785888671875, 2.970062255859375, 3.072265625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 12.0, 11.0, 17.0, 38.0, 47.0, 56.0, 119.0, 210.0, 359.0, 723.0, 1440.0, 3097.0, 7990.0, 29927.0, 213577.0, 681614.0, 83676.0, 16091.0, 5143.0, 2130.0, 1023.0, 536.0, 312.0, 153.0, 88.0, 56.0, 33.0, 28.0, 18.0, 7.0, 5.0, 3.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.34576416015625, -7.0860595703125, -6.82635498046875, -6.566650390625, -6.30694580078125, -6.0472412109375, -5.78753662109375, -5.52783203125, -5.26812744140625, -5.0084228515625, -4.74871826171875, -4.489013671875, -4.22930908203125, -3.9696044921875, -3.70989990234375, -3.4501953125, -3.19049072265625, -2.9307861328125, -2.67108154296875, -2.411376953125, -2.15167236328125, -1.8919677734375, -1.63226318359375, -1.37255859375, -1.11285400390625, -0.8531494140625, -0.59344482421875, -0.333740234375, -0.07403564453125, 0.1856689453125, 0.44537353515625, 0.705078125, 0.96478271484375, 1.2244873046875, 1.48419189453125, 1.743896484375, 2.00360107421875, 2.2633056640625, 2.52301025390625, 2.78271484375, 3.04241943359375, 3.3021240234375, 3.56182861328125, 3.821533203125, 4.08123779296875, 4.3409423828125, 4.60064697265625, 4.8603515625, 5.12005615234375, 5.3797607421875, 5.63946533203125, 5.899169921875, 6.15887451171875, 6.4185791015625, 6.67828369140625, 6.93798828125, 7.19769287109375, 7.4573974609375, 7.71710205078125, 7.976806640625, 8.23651123046875, 8.4962158203125, 8.75592041015625, 9.015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 3.0, 8.0, 11.0, 11.0, 8.0, 21.0, 17.0, 18.0, 19.0, 20.0, 26.0, 30.0, 34.0, 46.0, 53.0, 57.0, 80.0, 107.0, 215.0, 1438.0, 200.0, 129.0, 72.0, 60.0, 54.0, 53.0, 38.0, 36.0, 32.0, 22.0, 13.0, 26.0, 13.0, 7.0, 13.0, 13.0, 4.0, 9.0, 3.0, 3.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9375, -7.68505859375, -7.4326171875, -7.18017578125, -6.927734375, -6.67529296875, -6.4228515625, -6.17041015625, -5.91796875, -5.66552734375, -5.4130859375, -5.16064453125, -4.908203125, -4.65576171875, -4.4033203125, -4.15087890625, -3.8984375, -3.64599609375, -3.3935546875, -3.14111328125, -2.888671875, -2.63623046875, -2.3837890625, -2.13134765625, -1.87890625, -1.62646484375, -1.3740234375, -1.12158203125, -0.869140625, -0.61669921875, -0.3642578125, -0.11181640625, 0.140625, 0.39306640625, 0.6455078125, 0.89794921875, 1.150390625, 1.40283203125, 1.6552734375, 1.90771484375, 2.16015625, 2.41259765625, 2.6650390625, 2.91748046875, 3.169921875, 3.42236328125, 3.6748046875, 3.92724609375, 4.1796875, 4.43212890625, 4.6845703125, 4.93701171875, 5.189453125, 5.44189453125, 5.6943359375, 5.94677734375, 6.19921875, 6.45166015625, 6.7041015625, 6.95654296875, 7.208984375, 7.46142578125, 7.7138671875, 7.96630859375, 8.21875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 5.0, 8.0, 10.0, 13.0, 9.0, 16.0, 20.0, 30.0, 29.0, 38.0, 50.0, 73.0, 127.0, 212.0, 313.0, 702.0, 2246.0, 9510.0, 92946.0, 2484608.0, 521254.0, 26629.0, 4299.0, 1269.0, 498.0, 233.0, 135.0, 92.0, 78.0, 51.0, 29.0, 25.0, 26.0, 22.0, 10.0, 14.0, 15.0, 13.0, 10.0, 4.0, 3.0, 4.0, 6.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.375, -11.97265625, -11.5703125, -11.16796875, -10.765625, -10.36328125, -9.9609375, -9.55859375, -9.15625, -8.75390625, -8.3515625, -7.94921875, -7.546875, -7.14453125, -6.7421875, -6.33984375, -5.9375, -5.53515625, -5.1328125, -4.73046875, -4.328125, -3.92578125, -3.5234375, -3.12109375, -2.71875, -2.31640625, -1.9140625, -1.51171875, -1.109375, -0.70703125, -0.3046875, 0.09765625, 0.5, 0.90234375, 1.3046875, 1.70703125, 2.109375, 2.51171875, 2.9140625, 3.31640625, 3.71875, 4.12109375, 4.5234375, 4.92578125, 5.328125, 5.73046875, 6.1328125, 6.53515625, 6.9375, 7.33984375, 7.7421875, 8.14453125, 8.546875, 8.94921875, 9.3515625, 9.75390625, 10.15625, 10.55859375, 10.9609375, 11.36328125, 11.765625, 12.16796875, 12.5703125, 12.97265625, 13.375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 9.0, 11.0, 41.0, 67.0, 118.0, 157.0, 165.0, 187.0, 124.0, 60.0, 45.0, 15.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.619930267333984, -33.673526763916016, -32.72712707519531, -31.780723571777344, -30.834320068359375, -29.88791847229004, -28.941516876220703, -27.995113372802734, -27.0487117767334, -26.102310180664062, -25.155906677246094, -24.209505081176758, -23.26310157775879, -22.316699981689453, -21.370296478271484, -20.42389488220215, -19.477493286132812, -18.531091690063477, -17.584688186645508, -16.638286590576172, -15.69188404083252, -14.745481491088867, -13.799078941345215, -12.852676391601562, -11.906272888183594, -10.959870338439941, -10.013467788696289, -9.067066192626953, -8.1206636428833, -7.174261093139648, -6.227858543395996, -5.281456470489502, -4.335054397583008, -3.3886520862579346, -2.4422497749328613, -1.495847225189209, -0.5494449138641357, 0.3969573974609375, 1.3433599472045898, 2.289762020111084, 3.2361645698547363, 4.182567119598389, 5.128969192504883, 6.075371742248535, 7.0217742919921875, 7.968176364898682, 8.914579391479492, 9.860980987548828, 10.80738353729248, 11.753786087036133, 12.700188636779785, 13.646591186523438, 14.592992782592773, 15.539395332336426, 16.485797882080078, 17.432199478149414, 18.378602981567383, 19.32500457763672, 20.271408081054688, 21.217809677124023, 22.164213180541992, 23.110614776611328, 24.057018280029297, 25.003419876098633, 25.94982147216797]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 6.0, 12.0, 21.0, 16.0, 13.0, 19.0, 30.0, 26.0, 37.0, 35.0, 31.0, 34.0, 41.0, 48.0, 54.0, 53.0, 45.0, 48.0, 42.0, 44.0, 41.0, 67.0, 34.0, 34.0, 35.0, 18.0, 26.0, 21.0, 15.0, 18.0, 9.0, 5.0, 9.0, 1.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-33.14874267578125, -32.308895111083984, -31.469051361083984, -30.62920379638672, -29.789358139038086, -28.949512481689453, -28.109664916992188, -27.269819259643555, -26.429973602294922, -25.59012794494629, -24.750282287597656, -23.91043472290039, -23.070589065551758, -22.230743408203125, -21.39089584350586, -20.551050186157227, -19.711204528808594, -18.87135887145996, -18.031513214111328, -17.191665649414062, -16.35181999206543, -15.511974334716797, -14.672127723693848, -13.832281112670898, -12.992435455322266, -12.152589797973633, -11.312743186950684, -10.472896575927734, -9.633050918579102, -8.793205261230469, -7.9533586502075195, -7.1135125160217285, -6.27366828918457, -5.433822154998779, -4.593976020812988, -3.7541298866271973, -2.9142837524414062, -2.0744376182556152, -1.2345914840698242, -0.3947453498840332, 0.4451007843017578, 1.2849469184875488, 2.12479305267334, 2.964639186859131, 3.804485321044922, 4.644331455230713, 5.484177589416504, 6.324023723602295, 7.163869857788086, 8.003715515136719, 8.843562126159668, 9.683408737182617, 10.52325439453125, 11.363100051879883, 12.202946662902832, 13.042793273925781, 13.882638931274414, 14.722484588623047, 15.562331199645996, 16.402177810668945, 17.242023468017578, 18.08186912536621, 18.921714782714844, 19.76156234741211, 20.601408004760742]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 6.0, 6.0, 11.0, 10.0, 20.0, 23.0, 29.0, 34.0, 37.0, 40.0, 45.0, 50.0, 55.0, 51.0, 77.0, 48.0, 65.0, 59.0, 56.0, 45.0, 42.0, 30.0, 29.0, 38.0, 16.0, 16.0, 17.0, 15.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.439453125, -3.338043212890625, -3.23663330078125, -3.135223388671875, -3.0338134765625, -2.932403564453125, -2.83099365234375, -2.729583740234375, -2.628173828125, -2.526763916015625, -2.42535400390625, -2.323944091796875, -2.2225341796875, -2.121124267578125, -2.01971435546875, -1.918304443359375, -1.81689453125, -1.715484619140625, -1.61407470703125, -1.512664794921875, -1.4112548828125, -1.309844970703125, -1.20843505859375, -1.107025146484375, -1.005615234375, -0.904205322265625, -0.80279541015625, -0.701385498046875, -0.5999755859375, -0.498565673828125, -0.39715576171875, -0.295745849609375, -0.1943359375, -0.092926025390625, 0.00848388671875, 0.109893798828125, 0.2113037109375, 0.312713623046875, 0.41412353515625, 0.515533447265625, 0.616943359375, 0.718353271484375, 0.81976318359375, 0.921173095703125, 1.0225830078125, 1.123992919921875, 1.22540283203125, 1.326812744140625, 1.42822265625, 1.529632568359375, 1.63104248046875, 1.732452392578125, 1.8338623046875, 1.935272216796875, 2.03668212890625, 2.138092041015625, 2.239501953125, 2.340911865234375, 2.44232177734375, 2.543731689453125, 2.6451416015625, 2.746551513671875, 2.84796142578125, 2.949371337890625, 3.05078125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 1.0, 7.0, 6.0, 6.0, 7.0, 11.0, 10.0, 29.0, 22.0, 42.0, 76.0, 91.0, 149.0, 238.0, 352.0, 620.0, 1002.0, 1915.0, 3732.0, 9306.0, 33895.0, 306256.0, 2941836.0, 803864.0, 66576.0, 14207.0, 5083.0, 2302.0, 1095.0, 583.0, 365.0, 196.0, 135.0, 89.0, 60.0, 32.0, 29.0, 18.0, 10.0, 10.0, 4.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-10.4296875, -10.15283203125, -9.8759765625, -9.59912109375, -9.322265625, -9.04541015625, -8.7685546875, -8.49169921875, -8.21484375, -7.93798828125, -7.6611328125, -7.38427734375, -7.107421875, -6.83056640625, -6.5537109375, -6.27685546875, -6.0, -5.72314453125, -5.4462890625, -5.16943359375, -4.892578125, -4.61572265625, -4.3388671875, -4.06201171875, -3.78515625, -3.50830078125, -3.2314453125, -2.95458984375, -2.677734375, -2.40087890625, -2.1240234375, -1.84716796875, -1.5703125, -1.29345703125, -1.0166015625, -0.73974609375, -0.462890625, -0.18603515625, 0.0908203125, 0.36767578125, 0.64453125, 0.92138671875, 1.1982421875, 1.47509765625, 1.751953125, 2.02880859375, 2.3056640625, 2.58251953125, 2.859375, 3.13623046875, 3.4130859375, 3.68994140625, 3.966796875, 4.24365234375, 4.5205078125, 4.79736328125, 5.07421875, 5.35107421875, 5.6279296875, 5.90478515625, 6.181640625, 6.45849609375, 6.7353515625, 7.01220703125, 7.2890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 15.0, 12.0, 24.0, 50.0, 48.0, 103.0, 181.0, 265.0, 402.0, 669.0, 741.0, 593.0, 353.0, 215.0, 136.0, 84.0, 53.0, 37.0, 18.0, 18.0, 9.0, 8.0, 5.0, 6.0, 8.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4453125, -9.1614990234375, -8.877685546875, -8.5938720703125, -8.31005859375, -8.0262451171875, -7.742431640625, -7.4586181640625, -7.1748046875, -6.8909912109375, -6.607177734375, -6.3233642578125, -6.03955078125, -5.7557373046875, -5.471923828125, -5.1881103515625, -4.904296875, -4.6204833984375, -4.336669921875, -4.0528564453125, -3.76904296875, -3.4852294921875, -3.201416015625, -2.9176025390625, -2.6337890625, -2.3499755859375, -2.066162109375, -1.7823486328125, -1.49853515625, -1.2147216796875, -0.930908203125, -0.6470947265625, -0.36328125, -0.0794677734375, 0.204345703125, 0.4881591796875, 0.77197265625, 1.0557861328125, 1.339599609375, 1.6234130859375, 1.9072265625, 2.1910400390625, 2.474853515625, 2.7586669921875, 3.04248046875, 3.3262939453125, 3.610107421875, 3.8939208984375, 4.177734375, 4.4615478515625, 4.745361328125, 5.0291748046875, 5.31298828125, 5.5968017578125, 5.880615234375, 6.1644287109375, 6.4482421875, 6.7320556640625, 7.015869140625, 7.2996826171875, 7.58349609375, 7.8673095703125, 8.151123046875, 8.4349365234375, 8.71875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 3.0, 13.0, 9.0, 16.0, 27.0, 55.0, 84.0, 148.0, 321.0, 792.0, 2448.0, 10601.0, 93374.0, 3260176.0, 788317.0, 30016.0, 5358.0, 1477.0, 550.0, 224.0, 110.0, 73.0, 31.0, 19.0, 12.0, 10.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.134033203125, -20.42431640625, -19.714599609375, -19.0048828125, -18.295166015625, -17.58544921875, -16.875732421875, -16.166015625, -15.456298828125, -14.74658203125, -14.036865234375, -13.3271484375, -12.617431640625, -11.90771484375, -11.197998046875, -10.48828125, -9.778564453125, -9.06884765625, -8.359130859375, -7.6494140625, -6.939697265625, -6.22998046875, -5.520263671875, -4.810546875, -4.100830078125, -3.39111328125, -2.681396484375, -1.9716796875, -1.261962890625, -0.55224609375, 0.157470703125, 0.8671875, 1.576904296875, 2.28662109375, 2.996337890625, 3.7060546875, 4.415771484375, 5.12548828125, 5.835205078125, 6.544921875, 7.254638671875, 7.96435546875, 8.674072265625, 9.3837890625, 10.093505859375, 10.80322265625, 11.512939453125, 12.22265625, 12.932373046875, 13.64208984375, 14.351806640625, 15.0615234375, 15.771240234375, 16.48095703125, 17.190673828125, 17.900390625, 18.610107421875, 19.31982421875, 20.029541015625, 20.7392578125, 21.448974609375, 22.15869140625, 22.868408203125, 23.578125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 12.0, 29.0, 29.0, 50.0, 55.0, 98.0, 109.0, 110.0, 133.0, 108.0, 92.0, 63.0, 34.0, 38.0, 11.0, 15.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.41304016113281, -65.94137573242188, -64.46971130371094, -62.998046875, -61.52638244628906, -60.054718017578125, -58.58305358886719, -57.11138916015625, -55.63972473144531, -54.168060302734375, -52.69639587402344, -51.2247314453125, -49.75306701660156, -48.281402587890625, -46.80973815917969, -45.33807373046875, -43.86641311645508, -42.39474868774414, -40.9230842590332, -39.451419830322266, -37.97975540161133, -36.50809097290039, -35.03643035888672, -33.56476593017578, -32.093101501464844, -30.621437072753906, -29.14977264404297, -27.67810821533203, -26.206443786621094, -24.734779357910156, -23.26311683654785, -21.791452407836914, -20.319787979125977, -18.84812355041504, -17.3764591217041, -15.90479564666748, -14.433131217956543, -12.961466789245605, -11.489803314208984, -10.018138885498047, -8.54647445678711, -7.074810028076172, -5.603146076202393, -4.131482124328613, -2.659817695617676, -1.1881532669067383, 0.2835102081298828, 1.7551746368408203, 3.226839065551758, 4.698503494262695, 6.170167446136475, 7.641831398010254, 9.113495826721191, 10.585160255432129, 12.05682373046875, 13.528488159179688, 15.000152587890625, 16.471817016601562, 17.9434814453125, 19.415145874023438, 20.886810302734375, 22.358474731445312, 23.830137252807617, 25.301801681518555, 26.773466110229492]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 4.0, 3.0, 4.0, 6.0, 7.0, 13.0, 3.0, 8.0, 14.0, 17.0, 11.0, 22.0, 19.0, 20.0, 25.0, 29.0, 24.0, 29.0, 40.0, 37.0, 40.0, 38.0, 32.0, 36.0, 31.0, 41.0, 37.0, 36.0, 33.0, 32.0, 30.0, 28.0, 34.0, 35.0, 24.0, 24.0, 19.0, 13.0, 16.0, 20.0, 9.0, 10.0, 14.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.286697387695312, -19.62721061706543, -18.967721939086914, -18.30823516845703, -17.648746490478516, -16.989259719848633, -16.32977294921875, -15.670284271240234, -15.010797500610352, -14.351309776306152, -13.691822052001953, -13.03233528137207, -12.372847557067871, -11.713359832763672, -11.053872108459473, -10.394384384155273, -9.734896659851074, -9.075408935546875, -8.415921211242676, -7.756433963775635, -7.096946716308594, -6.4374589920043945, -5.777971267700195, -5.118484020233154, -4.458996295928955, -3.799508810043335, -3.140021324157715, -2.4805335998535156, -1.8210461139678955, -1.1615586280822754, -0.5020709037780762, 0.15741634368896484, 0.8169040679931641, 1.4763915538787842, 2.1358790397644043, 2.7953667640686035, 3.4548542499542236, 4.114341735839844, 4.773829460144043, 5.433316707611084, 6.092804431915283, 6.752292156219482, 7.411779403686523, 8.071267127990723, 8.730754852294922, 9.390241622924805, 10.04973030090332, 10.709217071533203, 11.368704795837402, 12.028192520141602, 12.6876802444458, 13.34716796875, 14.006654739379883, 14.666142463684082, 15.325630187988281, 15.985116958618164, 16.64460563659668, 17.304092407226562, 17.963581085205078, 18.62306785583496, 19.282556533813477, 19.94204330444336, 20.601531982421875, 21.261018753051758, 21.92050552368164]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 10.0, 13.0, 6.0, 12.0, 20.0, 15.0, 24.0, 28.0, 47.0, 33.0, 32.0, 53.0, 47.0, 59.0, 64.0, 48.0, 52.0, 56.0, 63.0, 49.0, 49.0, 27.0, 44.0, 34.0, 22.0, 19.0, 11.0, 14.0, 10.0, 14.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.3046875, -3.20623779296875, -3.1077880859375, -3.00933837890625, -2.910888671875, -2.81243896484375, -2.7139892578125, -2.61553955078125, -2.51708984375, -2.41864013671875, -2.3201904296875, -2.22174072265625, -2.123291015625, -2.02484130859375, -1.9263916015625, -1.82794189453125, -1.7294921875, -1.63104248046875, -1.5325927734375, -1.43414306640625, -1.335693359375, -1.23724365234375, -1.1387939453125, -1.04034423828125, -0.94189453125, -0.84344482421875, -0.7449951171875, -0.64654541015625, -0.548095703125, -0.44964599609375, -0.3511962890625, -0.25274658203125, -0.154296875, -0.05584716796875, 0.0426025390625, 0.14105224609375, 0.239501953125, 0.33795166015625, 0.4364013671875, 0.53485107421875, 0.63330078125, 0.73175048828125, 0.8302001953125, 0.92864990234375, 1.027099609375, 1.12554931640625, 1.2239990234375, 1.32244873046875, 1.4208984375, 1.51934814453125, 1.6177978515625, 1.71624755859375, 1.814697265625, 1.91314697265625, 2.0115966796875, 2.11004638671875, 2.20849609375, 2.30694580078125, 2.4053955078125, 2.50384521484375, 2.602294921875, 2.70074462890625, 2.7991943359375, 2.89764404296875, 2.99609375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 7.0, 7.0, 2.0, 15.0, 8.0, 19.0, 34.0, 33.0, 53.0, 76.0, 119.0, 177.0, 249.0, 379.0, 625.0, 968.0, 1508.0, 2437.0, 4030.0, 6729.0, 11533.0, 20448.0, 37486.0, 73295.0, 155196.0, 373173.0, 181514.0, 82641.0, 41850.0, 22304.0, 12552.0, 7411.0, 4412.0, 2672.0, 1632.0, 1037.0, 648.0, 414.0, 291.0, 165.0, 131.0, 89.0, 62.0, 37.0, 28.0, 19.0, 17.0, 12.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.15379905700683594, -0.14841842651367188, -0.1430377960205078, -0.13765716552734375, -0.1322765350341797, -0.12689590454101562, -0.12151527404785156, -0.1161346435546875, -0.11075401306152344, -0.10537338256835938, -0.09999275207519531, -0.09461212158203125, -0.08923149108886719, -0.08385086059570312, -0.07847023010253906, -0.073089599609375, -0.06770896911621094, -0.062328338623046875, -0.05694770812988281, -0.05156707763671875, -0.04618644714355469, -0.040805816650390625, -0.03542518615722656, -0.0300445556640625, -0.024663925170898438, -0.019283294677734375, -0.013902664184570312, -0.00852203369140625, -0.0031414031982421875, 0.002239227294921875, 0.0076198577880859375, 0.01300048828125, 0.018381118774414062, 0.023761749267578125, 0.029142379760742188, 0.03452301025390625, 0.03990364074707031, 0.045284271240234375, 0.05066490173339844, 0.0560455322265625, 0.06142616271972656, 0.06680679321289062, 0.07218742370605469, 0.07756805419921875, 0.08294868469238281, 0.08832931518554688, 0.09370994567871094, 0.099090576171875, 0.10447120666503906, 0.10985183715820312, 0.11523246765136719, 0.12061309814453125, 0.1259937286376953, 0.13137435913085938, 0.13675498962402344, 0.1421356201171875, 0.14751625061035156, 0.15289688110351562, 0.1582775115966797, 0.16365814208984375, 0.1690387725830078, 0.17441940307617188, 0.17980003356933594, 0.1851806640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 7.0, 7.0, 16.0, 17.0, 10.0, 14.0, 21.0, 24.0, 15.0, 24.0, 30.0, 49.0, 39.0, 29.0, 33.0, 38.0, 36.0, 43.0, 1056.0, 34.0, 53.0, 42.0, 34.0, 43.0, 36.0, 27.0, 34.0, 35.0, 23.0, 29.0, 20.0, 14.0, 18.0, 16.0, 8.0, 11.0, 8.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.37890625, -2.306121826171875, -2.23333740234375, -2.160552978515625, -2.0877685546875, -2.014984130859375, -1.94219970703125, -1.869415283203125, -1.796630859375, -1.723846435546875, -1.65106201171875, -1.578277587890625, -1.5054931640625, -1.432708740234375, -1.35992431640625, -1.287139892578125, -1.21435546875, -1.141571044921875, -1.06878662109375, -0.996002197265625, -0.9232177734375, -0.850433349609375, -0.77764892578125, -0.704864501953125, -0.632080078125, -0.559295654296875, -0.48651123046875, -0.413726806640625, -0.3409423828125, -0.268157958984375, -0.19537353515625, -0.122589111328125, -0.0498046875, 0.022979736328125, 0.09576416015625, 0.168548583984375, 0.2413330078125, 0.314117431640625, 0.38690185546875, 0.459686279296875, 0.532470703125, 0.605255126953125, 0.67803955078125, 0.750823974609375, 0.8236083984375, 0.896392822265625, 0.96917724609375, 1.041961669921875, 1.11474609375, 1.187530517578125, 1.26031494140625, 1.333099365234375, 1.4058837890625, 1.478668212890625, 1.55145263671875, 1.624237060546875, 1.697021484375, 1.769805908203125, 1.84259033203125, 1.915374755859375, 1.9881591796875, 2.060943603515625, 2.13372802734375, 2.206512451171875, 2.279296875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 3.0, 11.0, 19.0, 25.0, 37.0, 48.0, 59.0, 107.0, 146.0, 248.0, 372.0, 609.0, 928.0, 1504.0, 2485.0, 4064.0, 6667.0, 11110.0, 19128.0, 33240.0, 59091.0, 112393.0, 463412.0, 1120311.0, 116002.0, 61607.0, 34550.0, 19844.0, 11503.0, 6859.0, 4009.0, 2436.0, 1550.0, 958.0, 630.0, 402.0, 254.0, 182.0, 94.0, 88.0, 54.0, 29.0, 24.0, 13.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.06866455078125, -0.06658554077148438, -0.06450653076171875, -0.062427520751953125, -0.0603485107421875, -0.058269500732421875, -0.05619049072265625, -0.054111480712890625, -0.052032470703125, -0.049953460693359375, -0.04787445068359375, -0.045795440673828125, -0.0437164306640625, -0.041637420654296875, -0.03955841064453125, -0.037479400634765625, -0.035400390625, -0.033321380615234375, -0.03124237060546875, -0.029163360595703125, -0.0270843505859375, -0.025005340576171875, -0.02292633056640625, -0.020847320556640625, -0.018768310546875, -0.016689300537109375, -0.01461029052734375, -0.012531280517578125, -0.0104522705078125, -0.008373260498046875, -0.00629425048828125, -0.004215240478515625, -0.00213623046875, -5.7220458984375e-05, 0.00202178955078125, 0.004100799560546875, 0.0061798095703125, 0.008258819580078125, 0.01033782958984375, 0.012416839599609375, 0.014495849609375, 0.016574859619140625, 0.01865386962890625, 0.020732879638671875, 0.0228118896484375, 0.024890899658203125, 0.02696990966796875, 0.029048919677734375, 0.0311279296875, 0.033206939697265625, 0.03528594970703125, 0.037364959716796875, 0.0394439697265625, 0.041522979736328125, 0.04360198974609375, 0.045680999755859375, 0.047760009765625, 0.049839019775390625, 0.05191802978515625, 0.053997039794921875, 0.0560760498046875, 0.058155059814453125, 0.06023406982421875, 0.062313079833984375, 0.06439208984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 13.0, 8.0, 19.0, 27.0, 14.0, 25.0, 27.0, 33.0, 57.0, 98.0, 135.0, 141.0, 106.0, 64.0, 44.0, 33.0, 25.0, 20.0, 17.0, 13.0, 11.0, 12.0, 5.0, 9.0, 6.0, 13.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.0008792877197265625, -0.0008589327335357666, -0.0008385777473449707, -0.0008182227611541748, -0.0007978677749633789, -0.000777512788772583, -0.0007571578025817871, -0.0007368028163909912, -0.0007164478302001953, -0.0006960928440093994, -0.0006757378578186035, -0.0006553828716278076, -0.0006350278854370117, -0.0006146728992462158, -0.0005943179130554199, -0.000573962926864624, -0.0005536079406738281, -0.0005332529544830322, -0.0005128979682922363, -0.0004925429821014404, -0.00047218799591064453, -0.00045183300971984863, -0.00043147802352905273, -0.00041112303733825684, -0.00039076805114746094, -0.00037041306495666504, -0.00035005807876586914, -0.00032970309257507324, -0.00030934810638427734, -0.00028899312019348145, -0.00026863813400268555, -0.00024828314781188965, -0.00022792816162109375, -0.00020757317543029785, -0.00018721818923950195, -0.00016686320304870605, -0.00014650821685791016, -0.00012615323066711426, -0.00010579824447631836, -8.544325828552246e-05, -6.508827209472656e-05, -4.4733285903930664e-05, -2.4378299713134766e-05, -4.023313522338867e-06, 1.633167266845703e-05, 3.668665885925293e-05, 5.704164505004883e-05, 7.739663124084473e-05, 9.775161743164062e-05, 0.00011810660362243652, 0.00013846158981323242, 0.00015881657600402832, 0.00017917156219482422, 0.00019952654838562012, 0.00021988153457641602, 0.00024023652076721191, 0.0002605915069580078, 0.0002809464931488037, 0.0003013014793395996, 0.0003216564655303955, 0.0003420114517211914, 0.0003623664379119873, 0.0003827214241027832, 0.0004030764102935791, 0.000423431396484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 5.0, 5.0, 8.0, 19.0, 22.0, 39.0, 57.0, 77.0, 147.0, 395.0, 1437.0, 6725.0, 45574.0, 692586.0, 269826.0, 25807.0, 4216.0, 968.0, 294.0, 134.0, 78.0, 39.0, 21.0, 20.0, 16.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00806427001953125, -0.007739901542663574, -0.0074155330657958984, -0.007091164588928223, -0.006766796112060547, -0.006442427635192871, -0.006118059158325195, -0.0057936906814575195, -0.005469322204589844, -0.005144953727722168, -0.004820585250854492, -0.004496216773986816, -0.004171848297119141, -0.003847479820251465, -0.003523111343383789, -0.0031987428665161133, -0.0028743743896484375, -0.0025500059127807617, -0.002225637435913086, -0.0019012689590454102, -0.0015769004821777344, -0.0012525320053100586, -0.0009281635284423828, -0.000603795051574707, -0.00027942657470703125, 4.494190216064453e-05, 0.0003693103790283203, 0.0006936788558959961, 0.0010180473327636719, 0.0013424158096313477, 0.0016667842864990234, 0.0019911527633666992, 0.002315521240234375, 0.0026398897171020508, 0.0029642581939697266, 0.0032886266708374023, 0.003612995147705078, 0.003937363624572754, 0.00426173210144043, 0.0045861005783081055, 0.004910469055175781, 0.005234837532043457, 0.005559206008911133, 0.005883574485778809, 0.006207942962646484, 0.00653231143951416, 0.006856679916381836, 0.007181048393249512, 0.0075054168701171875, 0.007829785346984863, 0.008154153823852539, 0.008478522300720215, 0.00880289077758789, 0.009127259254455566, 0.009451627731323242, 0.009775996208190918, 0.010100364685058594, 0.01042473316192627, 0.010749101638793945, 0.011073470115661621, 0.011397838592529297, 0.011722207069396973, 0.012046575546264648, 0.012370944023132324, 0.0126953125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 11.0, 33.0, 86.0, 282.0, 413.0, 106.0, 49.0, 14.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004466247744858265, -0.004313251003623009, -0.0041602542623877525, -0.004007257521152496, -0.0038542605470865965, -0.0037012638058513403, -0.0035482668317854404, -0.0033952700905501842, -0.003242273349314928, -0.003089276608079672, -0.0029362798668444157, -0.002783282892778516, -0.0026302861515432596, -0.0024772894103080034, -0.0023242924362421036, -0.0021712956950068474, -0.002018298953771591, -0.001865302212536335, -0.001712305354885757, -0.001559308497235179, -0.0014063117559999228, -0.0012533150147646666, -0.0011003181571140885, -0.0009473212994635105, -0.0007943245582282543, -0.0006413277587853372, -0.0004883309593424201, -0.000335334159899503, -0.00018233736045658588, -2.9340561013668776e-05, 0.00012365623842924833, 0.00027665309607982635, 0.00042965030297636986, 0.000582647102419287, 0.0007356439018622041, 0.0008886407013051212, 0.0010416375007480383, 0.0011946342419832945, 0.0013476310996338725, 0.0015006279572844505, 0.0016536246985197067, 0.001806621439754963, 0.001959618180990219, 0.002112615155056119, 0.002265611896291375, 0.0024186086375266314, 0.002571605611592531, 0.0027246023528277874, 0.0028775990940630436, 0.0030305958352983, 0.003183592576533556, 0.003336589550599456, 0.003489586291834712, 0.0036425830330699682, 0.003795580007135868, 0.003948576748371124, 0.0041015734896063805, 0.004254570230841637, 0.004407566972076893, 0.004560563713312149, 0.004713560454547405, 0.004866557661443949, 0.005019554402679205, 0.005172551143914461, 0.005325547885149717]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 11.0, 9.0, 21.0, 16.0, 16.0, 38.0, 35.0, 34.0, 39.0, 43.0, 56.0, 54.0, 59.0, 55.0, 59.0, 55.0, 68.0, 59.0, 66.0, 34.0, 25.0, 39.0, 28.0, 20.0, 16.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005463361740112305, -0.0005301665514707565, -0.0005139969289302826, -0.0004978273063898087, -0.0004816576838493347, -0.0004654880613088608, -0.00044931843876838684, -0.0004331488162279129, -0.00041697919368743896, -0.000400809571146965, -0.0003846399486064911, -0.00036847032606601715, -0.0003523007035255432, -0.0003361310809850693, -0.00031996145844459534, -0.0003037918359041214, -0.00028762221336364746, -0.0002714525908231735, -0.0002552829682826996, -0.00023911334574222565, -0.0002229437232017517, -0.00020677410066127777, -0.00019060447812080383, -0.0001744348555803299, -0.00015826523303985596, -0.00014209561049938202, -0.00012592598795890808, -0.00010975636541843414, -9.35867428779602e-05, -7.741712033748627e-05, -6.124749779701233e-05, -4.507787525653839e-05, -2.8908252716064453e-05, -1.2738630175590515e-05, 3.430992364883423e-06, 1.960061490535736e-05, 3.57702374458313e-05, 5.193985998630524e-05, 6.810948252677917e-05, 8.427910506725311e-05, 0.00010044872760772705, 0.00011661835014820099, 0.00013278797268867493, 0.00014895759522914886, 0.0001651272177696228, 0.00018129684031009674, 0.00019746646285057068, 0.00021363608539104462, 0.00022980570793151855, 0.0002459753304719925, 0.00026214495301246643, 0.00027831457555294037, 0.0002944841980934143, 0.00031065382063388824, 0.0003268234431743622, 0.0003429930657148361, 0.00035916268825531006, 0.000375332310795784, 0.00039150193333625793, 0.00040767155587673187, 0.0004238411784172058, 0.00044001080095767975, 0.0004561804234981537, 0.0004723500460386276, 0.0004885196685791016]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 10.0, 13.0, 6.0, 12.0, 20.0, 15.0, 24.0, 28.0, 47.0, 33.0, 33.0, 52.0, 47.0, 59.0, 64.0, 47.0, 53.0, 56.0, 63.0, 49.0, 49.0, 27.0, 44.0, 34.0, 22.0, 19.0, 11.0, 14.0, 10.0, 14.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.3046875, -3.20623779296875, -3.1077880859375, -3.00933837890625, -2.910888671875, -2.81243896484375, -2.7139892578125, -2.61553955078125, -2.51708984375, -2.41864013671875, -2.3201904296875, -2.22174072265625, -2.123291015625, -2.02484130859375, -1.9263916015625, -1.82794189453125, -1.7294921875, -1.63104248046875, -1.5325927734375, -1.43414306640625, -1.335693359375, -1.23724365234375, -1.1387939453125, -1.04034423828125, -0.94189453125, -0.84344482421875, -0.7449951171875, -0.64654541015625, -0.548095703125, -0.44964599609375, -0.3511962890625, -0.25274658203125, -0.154296875, -0.05584716796875, 0.0426025390625, 0.14105224609375, 0.239501953125, 0.33795166015625, 0.4364013671875, 0.53485107421875, 0.63330078125, 0.73175048828125, 0.8302001953125, 0.92864990234375, 1.027099609375, 1.12554931640625, 1.2239990234375, 1.32244873046875, 1.4208984375, 1.51934814453125, 1.6177978515625, 1.71624755859375, 1.814697265625, 1.91314697265625, 2.0115966796875, 2.11004638671875, 2.20849609375, 2.30694580078125, 2.4053955078125, 2.50384521484375, 2.602294921875, 2.70074462890625, 2.7991943359375, 2.89764404296875, 2.99609375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 13.0, 35.0, 50.0, 69.0, 113.0, 160.0, 347.0, 595.0, 1296.0, 3053.0, 10474.0, 70561.0, 746907.0, 184006.0, 22405.0, 4790.0, 1797.0, 824.0, 453.0, 212.0, 147.0, 69.0, 53.0, 40.0, 17.0, 14.0, 12.0, 7.0, 4.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.279052734375, -10.88623046875, -10.493408203125, -10.1005859375, -9.707763671875, -9.31494140625, -8.922119140625, -8.529296875, -8.136474609375, -7.74365234375, -7.350830078125, -6.9580078125, -6.565185546875, -6.17236328125, -5.779541015625, -5.38671875, -4.993896484375, -4.60107421875, -4.208251953125, -3.8154296875, -3.422607421875, -3.02978515625, -2.636962890625, -2.244140625, -1.851318359375, -1.45849609375, -1.065673828125, -0.6728515625, -0.280029296875, 0.11279296875, 0.505615234375, 0.8984375, 1.291259765625, 1.68408203125, 2.076904296875, 2.4697265625, 2.862548828125, 3.25537109375, 3.648193359375, 4.041015625, 4.433837890625, 4.82666015625, 5.219482421875, 5.6123046875, 6.005126953125, 6.39794921875, 6.790771484375, 7.18359375, 7.576416015625, 7.96923828125, 8.362060546875, 8.7548828125, 9.147705078125, 9.54052734375, 9.933349609375, 10.326171875, 10.718994140625, 11.11181640625, 11.504638671875, 11.8974609375, 12.290283203125, 12.68310546875, 13.075927734375, 13.46875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 4.0, 10.0, 12.0, 8.0, 23.0, 26.0, 30.0, 22.0, 25.0, 34.0, 41.0, 35.0, 50.0, 71.0, 112.0, 175.0, 1374.0, 304.0, 136.0, 114.0, 79.0, 50.0, 53.0, 30.0, 34.0, 44.0, 32.0, 24.0, 19.0, 11.0, 7.0, 9.0, 1.0, 10.0, 6.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.265625, -9.97998046875, -9.6943359375, -9.40869140625, -9.123046875, -8.83740234375, -8.5517578125, -8.26611328125, -7.98046875, -7.69482421875, -7.4091796875, -7.12353515625, -6.837890625, -6.55224609375, -6.2666015625, -5.98095703125, -5.6953125, -5.40966796875, -5.1240234375, -4.83837890625, -4.552734375, -4.26708984375, -3.9814453125, -3.69580078125, -3.41015625, -3.12451171875, -2.8388671875, -2.55322265625, -2.267578125, -1.98193359375, -1.6962890625, -1.41064453125, -1.125, -0.83935546875, -0.5537109375, -0.26806640625, 0.017578125, 0.30322265625, 0.5888671875, 0.87451171875, 1.16015625, 1.44580078125, 1.7314453125, 2.01708984375, 2.302734375, 2.58837890625, 2.8740234375, 3.15966796875, 3.4453125, 3.73095703125, 4.0166015625, 4.30224609375, 4.587890625, 4.87353515625, 5.1591796875, 5.44482421875, 5.73046875, 6.01611328125, 6.3017578125, 6.58740234375, 6.873046875, 7.15869140625, 7.4443359375, 7.72998046875, 8.015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 16.0, 18.0, 25.0, 39.0, 49.0, 59.0, 112.0, 149.0, 283.0, 540.0, 1309.0, 3753.0, 15662.0, 153515.0, 2514400.0, 415897.0, 30652.0, 5751.0, 1806.0, 693.0, 333.0, 180.0, 120.0, 76.0, 53.0, 44.0, 33.0, 21.0, 24.0, 10.0, 7.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.46875, -12.0338134765625, -11.598876953125, -11.1639404296875, -10.72900390625, -10.2940673828125, -9.859130859375, -9.4241943359375, -8.9892578125, -8.5543212890625, -8.119384765625, -7.6844482421875, -7.24951171875, -6.8145751953125, -6.379638671875, -5.9447021484375, -5.509765625, -5.0748291015625, -4.639892578125, -4.2049560546875, -3.77001953125, -3.3350830078125, -2.900146484375, -2.4652099609375, -2.0302734375, -1.5953369140625, -1.160400390625, -0.7254638671875, -0.29052734375, 0.1444091796875, 0.579345703125, 1.0142822265625, 1.44921875, 1.8841552734375, 2.319091796875, 2.7540283203125, 3.18896484375, 3.6239013671875, 4.058837890625, 4.4937744140625, 4.9287109375, 5.3636474609375, 5.798583984375, 6.2335205078125, 6.66845703125, 7.1033935546875, 7.538330078125, 7.9732666015625, 8.408203125, 8.8431396484375, 9.278076171875, 9.7130126953125, 10.14794921875, 10.5828857421875, 11.017822265625, 11.4527587890625, 11.8876953125, 12.3226318359375, 12.757568359375, 13.1925048828125, 13.62744140625, 14.0623779296875, 14.497314453125, 14.9322509765625, 15.3671875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [4.0, 27.0, 181.0, 427.0, 304.0, 63.0, 9.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.46053695678711, -9.165708541870117, -5.870879173278809, -2.5760498046875, 0.7187786102294922, 4.013607025146484, 7.308437347412109, 10.603265762329102, 13.898094177246094, 17.192922592163086, 20.487751007080078, 23.782581329345703, 27.077409744262695, 30.372238159179688, 33.66706848144531, 36.96189880371094, 40.2567253112793, 43.55155563354492, 46.84638214111328, 50.141212463378906, 53.43604278564453, 56.73086929321289, 60.025699615478516, 63.320526123046875, 66.6153564453125, 69.91018676757812, 73.20501708984375, 76.49984741210938, 79.79467010498047, 83.0895004272461, 86.38433074951172, 89.67916107177734, 92.97398376464844, 96.26881408691406, 99.56364440917969, 102.85847473144531, 106.1532974243164, 109.44812774658203, 112.74295806884766, 116.03778839111328, 119.33261108398438, 122.62744140625, 125.92227172851562, 129.21710205078125, 132.51193237304688, 135.8067626953125, 139.10159301757812, 142.3964080810547, 145.69125366210938, 148.986083984375, 152.28091430664062, 155.57574462890625, 158.87057495117188, 162.1654052734375, 165.46023559570312, 168.7550506591797, 172.0498809814453, 175.34471130371094, 178.63954162597656, 181.9343719482422, 185.2292022705078, 188.52401733398438, 191.81884765625, 195.11367797851562, 198.40850830078125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 9.0, 6.0, 10.0, 7.0, 16.0, 20.0, 24.0, 22.0, 26.0, 17.0, 29.0, 31.0, 43.0, 50.0, 47.0, 44.0, 47.0, 40.0, 38.0, 46.0, 42.0, 34.0, 36.0, 36.0, 43.0, 30.0, 29.0, 35.0, 24.0, 18.0, 15.0, 17.0, 13.0, 18.0, 12.0, 8.0, 5.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.645442962646484, -30.732877731323242, -29.8203125, -28.907747268676758, -27.995182037353516, -27.082618713378906, -26.170053482055664, -25.257488250732422, -24.34492301940918, -23.432357788085938, -22.519792556762695, -21.607227325439453, -20.694664001464844, -19.78209686279297, -18.86953353881836, -17.956968307495117, -17.044403076171875, -16.131837844848633, -15.21927261352539, -14.306708335876465, -13.394143104553223, -12.48157787322998, -11.569013595581055, -10.656448364257812, -9.74388313293457, -8.831317901611328, -7.918753147125244, -7.00618839263916, -6.093623161315918, -5.181057929992676, -4.268493175506592, -3.355928421020508, -2.4433631896972656, -1.5307981967926025, -0.6182332038879395, 0.29433178901672363, 1.2068967819213867, 2.119462013244629, 3.032026767730713, 3.944591522216797, 4.857156753540039, 5.769721984863281, 6.682286739349365, 7.594851493835449, 8.507416725158691, 9.419981956481934, 10.33254623413086, 11.245111465454102, 12.157676696777344, 13.070241928100586, 13.982807159423828, 14.895371437072754, 15.807936668395996, 16.720500946044922, 17.633066177368164, 18.545631408691406, 19.45819664001465, 20.37076187133789, 21.283327102661133, 22.195892333984375, 23.108455657958984, 24.02102279663086, 24.93358612060547, 25.84615135192871, 26.758716583251953]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 8.0, 5.0, 8.0, 5.0, 11.0, 13.0, 18.0, 15.0, 14.0, 23.0, 32.0, 31.0, 39.0, 37.0, 49.0, 54.0, 54.0, 42.0, 44.0, 45.0, 54.0, 54.0, 47.0, 43.0, 44.0, 37.0, 33.0, 30.0, 22.0, 25.0, 12.0, 10.0, 9.0, 10.0, 10.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.158203125, -3.06463623046875, -2.9710693359375, -2.87750244140625, -2.783935546875, -2.69036865234375, -2.5968017578125, -2.50323486328125, -2.40966796875, -2.31610107421875, -2.2225341796875, -2.12896728515625, -2.035400390625, -1.94183349609375, -1.8482666015625, -1.75469970703125, -1.6611328125, -1.56756591796875, -1.4739990234375, -1.38043212890625, -1.286865234375, -1.19329833984375, -1.0997314453125, -1.00616455078125, -0.91259765625, -0.81903076171875, -0.7254638671875, -0.63189697265625, -0.538330078125, -0.44476318359375, -0.3511962890625, -0.25762939453125, -0.1640625, -0.07049560546875, 0.0230712890625, 0.11663818359375, 0.210205078125, 0.30377197265625, 0.3973388671875, 0.49090576171875, 0.58447265625, 0.67803955078125, 0.7716064453125, 0.86517333984375, 0.958740234375, 1.05230712890625, 1.1458740234375, 1.23944091796875, 1.3330078125, 1.42657470703125, 1.5201416015625, 1.61370849609375, 1.707275390625, 1.80084228515625, 1.8944091796875, 1.98797607421875, 2.08154296875, 2.17510986328125, 2.2686767578125, 2.36224365234375, 2.455810546875, 2.54937744140625, 2.6429443359375, 2.73651123046875, 2.830078125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 10.0, 12.0, 14.0, 17.0, 20.0, 44.0, 52.0, 72.0, 132.0, 202.0, 356.0, 673.0, 1202.0, 2249.0, 4815.0, 13016.0, 59945.0, 760413.0, 2964925.0, 333489.0, 35741.0, 9542.0, 3712.0, 1695.0, 868.0, 429.0, 229.0, 153.0, 68.0, 54.0, 52.0, 25.0, 21.0, 8.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.15625, -10.8653564453125, -10.574462890625, -10.2835693359375, -9.99267578125, -9.7017822265625, -9.410888671875, -9.1199951171875, -8.8291015625, -8.5382080078125, -8.247314453125, -7.9564208984375, -7.66552734375, -7.3746337890625, -7.083740234375, -6.7928466796875, -6.501953125, -6.2110595703125, -5.920166015625, -5.6292724609375, -5.33837890625, -5.0474853515625, -4.756591796875, -4.4656982421875, -4.1748046875, -3.8839111328125, -3.593017578125, -3.3021240234375, -3.01123046875, -2.7203369140625, -2.429443359375, -2.1385498046875, -1.84765625, -1.5567626953125, -1.265869140625, -0.9749755859375, -0.68408203125, -0.3931884765625, -0.102294921875, 0.1885986328125, 0.4794921875, 0.7703857421875, 1.061279296875, 1.3521728515625, 1.64306640625, 1.9339599609375, 2.224853515625, 2.5157470703125, 2.806640625, 3.0975341796875, 3.388427734375, 3.6793212890625, 3.97021484375, 4.2611083984375, 4.552001953125, 4.8428955078125, 5.1337890625, 5.4246826171875, 5.715576171875, 6.0064697265625, 6.29736328125, 6.5882568359375, 6.879150390625, 7.1700439453125, 7.4609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 9.0, 11.0, 11.0, 18.0, 26.0, 26.0, 38.0, 55.0, 78.0, 102.0, 157.0, 283.0, 364.0, 546.0, 593.0, 548.0, 377.0, 258.0, 165.0, 131.0, 74.0, 65.0, 37.0, 23.0, 13.0, 15.0, 14.0, 4.0, 6.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.4376220703125, -6.203369140625, -5.9691162109375, -5.73486328125, -5.5006103515625, -5.266357421875, -5.0321044921875, -4.7978515625, -4.5635986328125, -4.329345703125, -4.0950927734375, -3.86083984375, -3.6265869140625, -3.392333984375, -3.1580810546875, -2.923828125, -2.6895751953125, -2.455322265625, -2.2210693359375, -1.98681640625, -1.7525634765625, -1.518310546875, -1.2840576171875, -1.0498046875, -0.8155517578125, -0.581298828125, -0.3470458984375, -0.11279296875, 0.1214599609375, 0.355712890625, 0.5899658203125, 0.82421875, 1.0584716796875, 1.292724609375, 1.5269775390625, 1.76123046875, 1.9954833984375, 2.229736328125, 2.4639892578125, 2.6982421875, 2.9324951171875, 3.166748046875, 3.4010009765625, 3.63525390625, 3.8695068359375, 4.103759765625, 4.3380126953125, 4.572265625, 4.8065185546875, 5.040771484375, 5.2750244140625, 5.50927734375, 5.7435302734375, 5.977783203125, 6.2120361328125, 6.4462890625, 6.6805419921875, 6.914794921875, 7.1490478515625, 7.38330078125, 7.6175537109375, 7.851806640625, 8.0860595703125, 8.3203125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 13.0, 13.0, 20.0, 15.0, 19.0, 34.0, 48.0, 80.0, 166.0, 313.0, 687.0, 1563.0, 3959.0, 11786.0, 57401.0, 721762.0, 3055904.0, 294480.0, 32574.0, 8256.0, 2824.0, 1164.0, 557.0, 244.0, 139.0, 83.0, 47.0, 32.0, 26.0, 18.0, 20.0, 11.0, 7.0, 5.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.703125, -17.241455078125, -16.77978515625, -16.318115234375, -15.8564453125, -15.394775390625, -14.93310546875, -14.471435546875, -14.009765625, -13.548095703125, -13.08642578125, -12.624755859375, -12.1630859375, -11.701416015625, -11.23974609375, -10.778076171875, -10.31640625, -9.854736328125, -9.39306640625, -8.931396484375, -8.4697265625, -8.008056640625, -7.54638671875, -7.084716796875, -6.623046875, -6.161376953125, -5.69970703125, -5.238037109375, -4.7763671875, -4.314697265625, -3.85302734375, -3.391357421875, -2.9296875, -2.468017578125, -2.00634765625, -1.544677734375, -1.0830078125, -0.621337890625, -0.15966796875, 0.302001953125, 0.763671875, 1.225341796875, 1.68701171875, 2.148681640625, 2.6103515625, 3.072021484375, 3.53369140625, 3.995361328125, 4.45703125, 4.918701171875, 5.38037109375, 5.842041015625, 6.3037109375, 6.765380859375, 7.22705078125, 7.688720703125, 8.150390625, 8.612060546875, 9.07373046875, 9.535400390625, 9.9970703125, 10.458740234375, 10.92041015625, 11.382080078125, 11.84375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 7.0, 8.0, 15.0, 11.0, 18.0, 29.0, 20.0, 27.0, 28.0, 37.0, 47.0, 49.0, 53.0, 56.0, 60.0, 65.0, 59.0, 52.0, 61.0, 48.0, 41.0, 47.0, 27.0, 32.0, 17.0, 18.0, 14.0, 9.0, 15.0, 4.0, 7.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.93575096130371, -19.27741050720215, -18.619068145751953, -17.96072769165039, -17.302387237548828, -16.644046783447266, -15.985705375671387, -15.327363967895508, -14.669023513793945, -14.010683059692383, -13.352341651916504, -12.694000244140625, -12.035659790039062, -11.3773193359375, -10.718977928161621, -10.060636520385742, -9.40229606628418, -8.743955612182617, -8.085614204406738, -7.427273273468018, -6.768932342529297, -6.110591411590576, -5.4522504806518555, -4.793909549713135, -4.135568618774414, -3.4772276878356934, -2.8188867568969727, -2.160545825958252, -1.5022048950195312, -0.8438639640808105, -0.18552303314208984, 0.47281789779663086, 1.1311607360839844, 1.789501667022705, 2.447842597961426, 3.1061835289001465, 3.764524459838867, 4.422865390777588, 5.081206321716309, 5.739547252655029, 6.39788818359375, 7.056229114532471, 7.714570045471191, 8.37291145324707, 9.031251907348633, 9.689592361450195, 10.347933769226074, 11.006275177001953, 11.664615631103516, 12.322956085205078, 12.981297492980957, 13.639638900756836, 14.297979354858398, 14.956319808959961, 15.61466121673584, 16.27300262451172, 16.93134307861328, 17.589683532714844, 18.248023986816406, 18.9063663482666, 19.564706802368164, 20.223047256469727, 20.881389617919922, 21.539730072021484, 22.198070526123047]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 1.0, 5.0, 3.0, 9.0, 4.0, 10.0, 16.0, 14.0, 20.0, 21.0, 25.0, 27.0, 24.0, 32.0, 25.0, 27.0, 40.0, 37.0, 39.0, 31.0, 45.0, 41.0, 35.0, 36.0, 35.0, 47.0, 29.0, 44.0, 26.0, 24.0, 38.0, 27.0, 24.0, 22.0, 10.0, 16.0, 14.0, 16.0, 11.0, 9.0, 9.0, 8.0, 4.0, 7.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-21.031719207763672, -20.40998649597168, -19.788253784179688, -19.166521072387695, -18.544788360595703, -17.92305564880371, -17.30132293701172, -16.67959213256836, -16.057857513427734, -15.436124801635742, -14.81439208984375, -14.192659378051758, -13.570926666259766, -12.949193954467773, -12.327462196350098, -11.705729484558105, -11.08399772644043, -10.462265014648438, -9.840532302856445, -9.218799591064453, -8.597066879272461, -7.975334644317627, -7.353602409362793, -6.731869697570801, -6.110136985778809, -5.488404273986816, -4.866671562194824, -4.24493932723999, -3.623206615447998, -3.001473903656006, -2.3797414302825928, -1.7580089569091797, -1.1362743377685547, -0.514541745185852, 0.10719084739685059, 0.7289234399795532, 1.3506560325622559, 1.972388744354248, 2.594121217727661, 3.215853691101074, 3.8375864028930664, 4.459319114685059, 5.081051826477051, 5.702784061431885, 6.324516773223877, 6.946249485015869, 7.567981719970703, 8.189714431762695, 8.811447143554688, 9.43317985534668, 10.054912567138672, 10.676645278930664, 11.298377990722656, 11.920110702514648, 12.541842460632324, 13.163575172424316, 13.785307884216309, 14.4070405960083, 15.028773307800293, 15.650506019592285, 16.27223777770996, 16.893970489501953, 17.515703201293945, 18.137435913085938, 18.75916862487793]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 3.0, 6.0, 12.0, 6.0, 9.0, 13.0, 19.0, 19.0, 12.0, 25.0, 35.0, 23.0, 40.0, 49.0, 40.0, 41.0, 41.0, 50.0, 49.0, 53.0, 49.0, 42.0, 49.0, 55.0, 31.0, 47.0, 28.0, 29.0, 20.0, 16.0, 13.0, 20.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.95703125, -2.86669921875, -2.7763671875, -2.68603515625, -2.595703125, -2.50537109375, -2.4150390625, -2.32470703125, -2.234375, -2.14404296875, -2.0537109375, -1.96337890625, -1.873046875, -1.78271484375, -1.6923828125, -1.60205078125, -1.51171875, -1.42138671875, -1.3310546875, -1.24072265625, -1.150390625, -1.06005859375, -0.9697265625, -0.87939453125, -0.7890625, -0.69873046875, -0.6083984375, -0.51806640625, -0.427734375, -0.33740234375, -0.2470703125, -0.15673828125, -0.06640625, 0.02392578125, 0.1142578125, 0.20458984375, 0.294921875, 0.38525390625, 0.4755859375, 0.56591796875, 0.65625, 0.74658203125, 0.8369140625, 0.92724609375, 1.017578125, 1.10791015625, 1.1982421875, 1.28857421875, 1.37890625, 1.46923828125, 1.5595703125, 1.64990234375, 1.740234375, 1.83056640625, 1.9208984375, 2.01123046875, 2.1015625, 2.19189453125, 2.2822265625, 2.37255859375, 2.462890625, 2.55322265625, 2.6435546875, 2.73388671875, 2.82421875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 12.0, 7.0, 15.0, 17.0, 30.0, 49.0, 65.0, 101.0, 149.0, 229.0, 376.0, 557.0, 866.0, 1365.0, 2314.0, 3994.0, 6857.0, 11509.0, 19493.0, 33936.0, 61561.0, 124931.0, 333465.0, 232021.0, 96360.0, 50166.0, 28173.0, 16219.0, 9584.0, 5660.0, 3263.0, 1896.0, 1250.0, 742.0, 444.0, 313.0, 186.0, 131.0, 75.0, 60.0, 44.0, 19.0, 18.0, 11.0, 11.0, 3.0, 8.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1579723358154297, -0.15249252319335938, -0.14701271057128906, -0.14153289794921875, -0.13605308532714844, -0.13057327270507812, -0.1250934600830078, -0.1196136474609375, -0.11413383483886719, -0.10865402221679688, -0.10317420959472656, -0.09769439697265625, -0.09221458435058594, -0.08673477172851562, -0.08125495910644531, -0.075775146484375, -0.07029533386230469, -0.06481552124023438, -0.05933570861816406, -0.05385589599609375, -0.04837608337402344, -0.042896270751953125, -0.03741645812988281, -0.0319366455078125, -0.026456832885742188, -0.020977020263671875, -0.015497207641601562, -0.01001739501953125, -0.0045375823974609375, 0.000942230224609375, 0.0064220428466796875, 0.01190185546875, 0.017381668090820312, 0.022861480712890625, 0.028341293334960938, 0.03382110595703125, 0.03930091857910156, 0.044780731201171875, 0.05026054382324219, 0.0557403564453125, 0.06122016906738281, 0.06669998168945312, 0.07217979431152344, 0.07765960693359375, 0.08313941955566406, 0.08861923217773438, 0.09409904479980469, 0.099578857421875, 0.10505867004394531, 0.11053848266601562, 0.11601829528808594, 0.12149810791015625, 0.12697792053222656, 0.13245773315429688, 0.1379375457763672, 0.1434173583984375, 0.1488971710205078, 0.15437698364257812, 0.15985679626464844, 0.16533660888671875, 0.17081642150878906, 0.17629623413085938, 0.1817760467529297, 0.187255859375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 7.0, 4.0, 7.0, 10.0, 15.0, 15.0, 21.0, 16.0, 18.0, 28.0, 37.0, 29.0, 40.0, 38.0, 34.0, 42.0, 37.0, 42.0, 39.0, 1071.0, 41.0, 26.0, 42.0, 39.0, 41.0, 37.0, 33.0, 32.0, 39.0, 23.0, 20.0, 16.0, 16.0, 11.0, 4.0, 11.0, 7.0, 6.0, 11.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08203125, -2.00799560546875, -1.9339599609375, -1.85992431640625, -1.785888671875, -1.71185302734375, -1.6378173828125, -1.56378173828125, -1.48974609375, -1.41571044921875, -1.3416748046875, -1.26763916015625, -1.193603515625, -1.11956787109375, -1.0455322265625, -0.97149658203125, -0.8974609375, -0.82342529296875, -0.7493896484375, -0.67535400390625, -0.601318359375, -0.52728271484375, -0.4532470703125, -0.37921142578125, -0.30517578125, -0.23114013671875, -0.1571044921875, -0.08306884765625, -0.009033203125, 0.06500244140625, 0.1390380859375, 0.21307373046875, 0.287109375, 0.36114501953125, 0.4351806640625, 0.50921630859375, 0.583251953125, 0.65728759765625, 0.7313232421875, 0.80535888671875, 0.87939453125, 0.95343017578125, 1.0274658203125, 1.10150146484375, 1.175537109375, 1.24957275390625, 1.3236083984375, 1.39764404296875, 1.4716796875, 1.54571533203125, 1.6197509765625, 1.69378662109375, 1.767822265625, 1.84185791015625, 1.9158935546875, 1.98992919921875, 2.06396484375, 2.13800048828125, 2.2120361328125, 2.28607177734375, 2.360107421875, 2.43414306640625, 2.5081787109375, 2.58221435546875, 2.65625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 8.0, 10.0, 14.0, 16.0, 21.0, 56.0, 55.0, 89.0, 95.0, 170.0, 247.0, 325.0, 495.0, 669.0, 992.0, 1345.0, 1897.0, 2919.0, 4197.0, 6206.0, 9213.0, 13656.0, 21210.0, 32872.0, 52543.0, 89270.0, 176638.0, 1325719.0, 145373.0, 77093.0, 46556.0, 29290.0, 18946.0, 12559.0, 8279.0, 5605.0, 3774.0, 2583.0, 1900.0, 1265.0, 891.0, 598.0, 439.0, 291.0, 233.0, 164.0, 98.0, 79.0, 55.0, 39.0, 29.0, 15.0, 14.0, 6.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.0496826171875, -0.04809904098510742, -0.046515464782714844, -0.044931888580322266, -0.04334831237792969, -0.04176473617553711, -0.04018115997314453, -0.03859758377075195, -0.037014007568359375, -0.0354304313659668, -0.03384685516357422, -0.03226327896118164, -0.030679702758789062, -0.029096126556396484, -0.027512550354003906, -0.025928974151611328, -0.02434539794921875, -0.022761821746826172, -0.021178245544433594, -0.019594669342041016, -0.018011093139648438, -0.01642751693725586, -0.014843940734863281, -0.013260364532470703, -0.011676788330078125, -0.010093212127685547, -0.008509635925292969, -0.006926059722900391, -0.0053424835205078125, -0.0037589073181152344, -0.0021753311157226562, -0.0005917549133300781, 0.0009918212890625, 0.002575397491455078, 0.004158973693847656, 0.005742549896240234, 0.0073261260986328125, 0.00890970230102539, 0.010493278503417969, 0.012076854705810547, 0.013660430908203125, 0.015244007110595703, 0.01682758331298828, 0.01841115951538086, 0.019994735717773438, 0.021578311920166016, 0.023161888122558594, 0.024745464324951172, 0.02632904052734375, 0.027912616729736328, 0.029496192932128906, 0.031079769134521484, 0.03266334533691406, 0.03424692153930664, 0.03583049774169922, 0.0374140739440918, 0.038997650146484375, 0.04058122634887695, 0.04216480255126953, 0.04374837875366211, 0.04533195495605469, 0.046915531158447266, 0.048499107360839844, 0.05008268356323242, 0.051666259765625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 6.0, 11.0, 8.0, 10.0, 12.0, 16.0, 15.0, 29.0, 23.0, 28.0, 37.0, 45.0, 69.0, 85.0, 114.0, 101.0, 78.0, 54.0, 57.0, 42.0, 25.0, 30.0, 25.0, 17.0, 17.0, 6.0, 6.0, 4.0, 4.0, 10.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.000667572021484375, -0.0006489977240562439, -0.0006304234266281128, -0.0006118491291999817, -0.0005932748317718506, -0.0005747005343437195, -0.0005561262369155884, -0.0005375519394874573, -0.0005189776420593262, -0.0005004033446311951, -0.00048182904720306396, -0.00046325474977493286, -0.00044468045234680176, -0.00042610615491867065, -0.00040753185749053955, -0.00038895756006240845, -0.00037038326263427734, -0.00035180896520614624, -0.00033323466777801514, -0.00031466037034988403, -0.00029608607292175293, -0.0002775117754936218, -0.0002589374780654907, -0.00024036318063735962, -0.00022178888320922852, -0.0002032145857810974, -0.0001846402883529663, -0.0001660659909248352, -0.0001474916934967041, -0.000128917396068573, -0.0001103430986404419, -9.176880121231079e-05, -7.319450378417969e-05, -5.4620206356048584e-05, -3.604590892791748e-05, -1.7471611499786377e-05, 1.1026859283447266e-06, 1.967698335647583e-05, 3.8251280784606934e-05, 5.682557821273804e-05, 7.539987564086914e-05, 9.397417306900024e-05, 0.00011254847049713135, 0.00013112276792526245, 0.00014969706535339355, 0.00016827136278152466, 0.00018684566020965576, 0.00020541995763778687, 0.00022399425506591797, 0.00024256855249404907, 0.0002611428499221802, 0.0002797171473503113, 0.0002982914447784424, 0.0003168657422065735, 0.0003354400396347046, 0.0003540143370628357, 0.0003725886344909668, 0.0003911629319190979, 0.000409737229347229, 0.0004283115267753601, 0.0004468858242034912, 0.0004654601216316223, 0.0004840344190597534, 0.0005026087164878845, 0.0005211830139160156]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 8.0, 6.0, 8.0, 22.0, 33.0, 40.0, 94.0, 168.0, 528.0, 2030.0, 9373.0, 55418.0, 637948.0, 300296.0, 34427.0, 6069.0, 1368.0, 364.0, 134.0, 66.0, 42.0, 24.0, 18.0, 15.0, 8.0, 9.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00795745849609375, -0.007681846618652344, -0.0074062347412109375, -0.007130622863769531, -0.006855010986328125, -0.006579399108886719, -0.0063037872314453125, -0.006028175354003906, -0.0057525634765625, -0.005476951599121094, -0.0052013397216796875, -0.004925727844238281, -0.004650115966796875, -0.004374504089355469, -0.0040988922119140625, -0.0038232803344726562, -0.00354766845703125, -0.0032720565795898438, -0.0029964447021484375, -0.0027208328247070312, -0.002445220947265625, -0.0021696090698242188, -0.0018939971923828125, -0.0016183853149414062, -0.0013427734375, -0.0010671615600585938, -0.0007915496826171875, -0.0005159378051757812, -0.000240325927734375, 3.528594970703125e-05, 0.0003108978271484375, 0.0005865097045898438, 0.00086212158203125, 0.0011377334594726562, 0.0014133453369140625, 0.0016889572143554688, 0.001964569091796875, 0.0022401809692382812, 0.0025157928466796875, 0.0027914047241210938, 0.0030670166015625, 0.0033426284790039062, 0.0036182403564453125, 0.0038938522338867188, 0.004169464111328125, 0.004445075988769531, 0.0047206878662109375, 0.004996299743652344, 0.00527191162109375, 0.005547523498535156, 0.0058231353759765625, 0.006098747253417969, 0.006374359130859375, 0.006649971008300781, 0.0069255828857421875, 0.007201194763183594, 0.007476806640625, 0.007752418518066406, 0.008028030395507812, 0.008303642272949219, 0.008579254150390625, 0.008854866027832031, 0.009130477905273438, 0.009406089782714844, 0.00968170166015625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 12.0, 134.0, 750.0, 104.0, 13.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002684985753148794, -0.0023683321196585894, -0.0020516784861683846, -0.0017350249690935016, -0.0014183713356032968, -0.001101717702113092, -0.000785064185038209, -0.00046841055154800415, -0.00015175691805779934, 0.00016489668632857502, 0.00048155029071494937, 0.0007982038659974933, 0.001114857499487698, 0.0014315111329779029, 0.0017481646500527859, 0.0020648182835429907, 0.0023814719170331955, 0.0026981255505234003, 0.003014779184013605, 0.0033314325846731663, 0.0036480864509940147, 0.003964739851653576, 0.004281393252313137, 0.0045980471186339855, 0.004914700984954834, 0.005231354385614395, 0.005548008251935244, 0.005864661652594805, 0.006181315518915653, 0.006497968919575214, 0.0068146223202347755, 0.007131276186555624, 0.007447929121553898, 0.007764582522213459, 0.00808123592287302, 0.008397890254855156, 0.008714543655514717, 0.009031197056174278, 0.00934785045683384, 0.0096645038574934, 0.009981158189475536, 0.010297811590135098, 0.010614464990794659, 0.010931119322776794, 0.011247772723436356, 0.011564426124095917, 0.011881079524755478, 0.012197732925415039, 0.0125143863260746, 0.012831039726734161, 0.013147693127393723, 0.013464347459375858, 0.01378100086003542, 0.01409765426069498, 0.014414307661354542, 0.014730961993336678, 0.015047615393996239, 0.0153642687946558, 0.01568092219531536, 0.015997575595974922, 0.016314228996634483, 0.016630884259939194, 0.016947537660598755, 0.017264191061258316, 0.017580844461917877]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 5.0, 24.0, 30.0, 38.0, 67.0, 76.0, 93.0, 99.0, 89.0, 97.0, 86.0, 62.0, 80.0, 49.0, 46.0, 28.0, 12.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013107657432556152, -0.0012807315215468407, -0.001250697299838066, -0.0012206630781292915, -0.001190628856420517, -0.0011605946347117424, -0.0011305604130029678, -0.0011005261912941933, -0.0010704919695854187, -0.0010404577478766441, -0.0010104235261678696, -0.000980389304459095, -0.0009503550827503204, -0.0009203208610415459, -0.0008902866393327713, -0.0008602524176239967, -0.0008302181959152222, -0.0008001839742064476, -0.000770149752497673, -0.0007401155307888985, -0.0007100813090801239, -0.0006800470873713493, -0.0006500128656625748, -0.0006199786439538002, -0.0005899444222450256, -0.0005599102005362511, -0.0005298759788274765, -0.0004998417571187019, -0.00046980753540992737, -0.0004397733137011528, -0.00040973909199237823, -0.00037970487028360367, -0.0003496706485748291, -0.00031963642686605453, -0.00028960220515727997, -0.0002595679834485054, -0.00022953376173973083, -0.00019949954003095627, -0.0001694653183221817, -0.00013943109661340714, -0.00010939687490463257, -7.9362653195858e-05, -4.9328431487083435e-05, -1.929420977830887e-05, 1.0740011930465698e-05, 4.0774233639240265e-05, 7.080845534801483e-05, 0.0001008426770567894, 0.00013087689876556396, 0.00016091112047433853, 0.0001909453421831131, 0.00022097956389188766, 0.00025101378560066223, 0.0002810480073094368, 0.00031108222901821136, 0.00034111645072698593, 0.0003711506724357605, 0.00040118489414453506, 0.00043121911585330963, 0.0004612533375620842, 0.0004912875592708588, 0.0005213217809796333, 0.0005513560026884079, 0.0005813902243971825, 0.000611424446105957]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 3.0, 6.0, 12.0, 6.0, 9.0, 13.0, 19.0, 19.0, 12.0, 25.0, 35.0, 23.0, 40.0, 49.0, 40.0, 41.0, 41.0, 50.0, 49.0, 53.0, 49.0, 42.0, 49.0, 55.0, 31.0, 47.0, 28.0, 29.0, 20.0, 16.0, 13.0, 20.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.95703125, -2.86669921875, -2.7763671875, -2.68603515625, -2.595703125, -2.50537109375, -2.4150390625, -2.32470703125, -2.234375, -2.14404296875, -2.0537109375, -1.96337890625, -1.873046875, -1.78271484375, -1.6923828125, -1.60205078125, -1.51171875, -1.42138671875, -1.3310546875, -1.24072265625, -1.150390625, -1.06005859375, -0.9697265625, -0.87939453125, -0.7890625, -0.69873046875, -0.6083984375, -0.51806640625, -0.427734375, -0.33740234375, -0.2470703125, -0.15673828125, -0.06640625, 0.02392578125, 0.1142578125, 0.20458984375, 0.294921875, 0.38525390625, 0.4755859375, 0.56591796875, 0.65625, 0.74658203125, 0.8369140625, 0.92724609375, 1.017578125, 1.10791015625, 1.1982421875, 1.28857421875, 1.37890625, 1.46923828125, 1.5595703125, 1.64990234375, 1.740234375, 1.83056640625, 1.9208984375, 2.01123046875, 2.1015625, 2.19189453125, 2.2822265625, 2.37255859375, 2.462890625, 2.55322265625, 2.6435546875, 2.73388671875, 2.82421875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 19.0, 17.0, 28.0, 38.0, 63.0, 162.0, 249.0, 480.0, 899.0, 1973.0, 4716.0, 13274.0, 43096.0, 156933.0, 510335.0, 226207.0, 61059.0, 17963.0, 6265.0, 2467.0, 1052.0, 565.0, 296.0, 142.0, 92.0, 63.0, 23.0, 20.0, 14.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.578125, -7.37127685546875, -7.1644287109375, -6.95758056640625, -6.750732421875, -6.54388427734375, -6.3370361328125, -6.13018798828125, -5.92333984375, -5.71649169921875, -5.5096435546875, -5.30279541015625, -5.095947265625, -4.88909912109375, -4.6822509765625, -4.47540283203125, -4.2685546875, -4.06170654296875, -3.8548583984375, -3.64801025390625, -3.441162109375, -3.23431396484375, -3.0274658203125, -2.82061767578125, -2.61376953125, -2.40692138671875, -2.2000732421875, -1.99322509765625, -1.786376953125, -1.57952880859375, -1.3726806640625, -1.16583251953125, -0.958984375, -0.75213623046875, -0.5452880859375, -0.33843994140625, -0.131591796875, 0.07525634765625, 0.2821044921875, 0.48895263671875, 0.69580078125, 0.90264892578125, 1.1094970703125, 1.31634521484375, 1.523193359375, 1.73004150390625, 1.9368896484375, 2.14373779296875, 2.3505859375, 2.55743408203125, 2.7642822265625, 2.97113037109375, 3.177978515625, 3.38482666015625, 3.5916748046875, 3.79852294921875, 4.00537109375, 4.21221923828125, 4.4190673828125, 4.62591552734375, 4.832763671875, 5.03961181640625, 5.2464599609375, 5.45330810546875, 5.66015625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 1.0, 5.0, 6.0, 8.0, 4.0, 12.0, 10.0, 9.0, 27.0, 23.0, 23.0, 39.0, 28.0, 34.0, 43.0, 49.0, 60.0, 85.0, 127.0, 185.0, 1352.0, 230.0, 117.0, 100.0, 66.0, 57.0, 59.0, 31.0, 27.0, 45.0, 30.0, 23.0, 19.0, 22.0, 22.0, 13.0, 14.0, 12.0, 9.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.53125, -8.2431640625, -7.955078125, -7.6669921875, -7.37890625, -7.0908203125, -6.802734375, -6.5146484375, -6.2265625, -5.9384765625, -5.650390625, -5.3623046875, -5.07421875, -4.7861328125, -4.498046875, -4.2099609375, -3.921875, -3.6337890625, -3.345703125, -3.0576171875, -2.76953125, -2.4814453125, -2.193359375, -1.9052734375, -1.6171875, -1.3291015625, -1.041015625, -0.7529296875, -0.46484375, -0.1767578125, 0.111328125, 0.3994140625, 0.6875, 0.9755859375, 1.263671875, 1.5517578125, 1.83984375, 2.1279296875, 2.416015625, 2.7041015625, 2.9921875, 3.2802734375, 3.568359375, 3.8564453125, 4.14453125, 4.4326171875, 4.720703125, 5.0087890625, 5.296875, 5.5849609375, 5.873046875, 6.1611328125, 6.44921875, 6.7373046875, 7.025390625, 7.3134765625, 7.6015625, 7.8896484375, 8.177734375, 8.4658203125, 8.75390625, 9.0419921875, 9.330078125, 9.6181640625, 9.90625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 10.0, 10.0, 24.0, 28.0, 34.0, 61.0, 68.0, 95.0, 185.0, 258.0, 457.0, 884.0, 2135.0, 6456.0, 33891.0, 471554.0, 2475907.0, 131024.0, 15443.0, 3858.0, 1504.0, 753.0, 380.0, 217.0, 143.0, 98.0, 47.0, 42.0, 29.0, 16.0, 15.0, 17.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-18.515625, -17.990966796875, -17.46630859375, -16.941650390625, -16.4169921875, -15.892333984375, -15.36767578125, -14.843017578125, -14.318359375, -13.793701171875, -13.26904296875, -12.744384765625, -12.2197265625, -11.695068359375, -11.17041015625, -10.645751953125, -10.12109375, -9.596435546875, -9.07177734375, -8.547119140625, -8.0224609375, -7.497802734375, -6.97314453125, -6.448486328125, -5.923828125, -5.399169921875, -4.87451171875, -4.349853515625, -3.8251953125, -3.300537109375, -2.77587890625, -2.251220703125, -1.7265625, -1.201904296875, -0.67724609375, -0.152587890625, 0.3720703125, 0.896728515625, 1.42138671875, 1.946044921875, 2.470703125, 2.995361328125, 3.52001953125, 4.044677734375, 4.5693359375, 5.093994140625, 5.61865234375, 6.143310546875, 6.66796875, 7.192626953125, 7.71728515625, 8.241943359375, 8.7666015625, 9.291259765625, 9.81591796875, 10.340576171875, 10.865234375, 11.389892578125, 11.91455078125, 12.439208984375, 12.9638671875, 13.488525390625, 14.01318359375, 14.537841796875, 15.0625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 14.0, 45.0, 83.0, 262.0, 267.0, 217.0, 89.0, 19.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.848533630371094, -31.134279251098633, -28.420024871826172, -25.705772399902344, -22.991518020629883, -20.277263641357422, -17.563011169433594, -14.848756790161133, -12.134502410888672, -9.420248031616211, -6.705994606018066, -3.991741180419922, -1.277486801147461, 1.436767578125, 4.151020050048828, 6.865274429321289, 9.57952880859375, 12.293783187866211, 15.008036613464355, 17.7222900390625, 20.43654441833496, 23.150798797607422, 25.86505126953125, 28.57930564880371, 31.293560028076172, 34.0078125, 36.722068786621094, 39.43632125854492, 42.15057373046875, 44.864830017089844, 47.57908248901367, 50.2933349609375, 53.007598876953125, 55.72185134887695, 58.43610763549805, 61.150360107421875, 63.86461639404297, 66.57887268066406, 69.29312133789062, 72.00737762451172, 74.72163391113281, 77.4358901977539, 80.15013885498047, 82.86439514160156, 85.57865142822266, 88.29290771484375, 91.00715637207031, 93.7214126586914, 96.43566131591797, 99.14991760253906, 101.86416625976562, 104.57842254638672, 107.29267883300781, 110.00692749023438, 112.72118377685547, 115.43544006347656, 118.14968872070312, 120.86394500732422, 123.57819366455078, 126.29244995117188, 129.00669860839844, 131.72096252441406, 134.43521118164062, 137.1494598388672, 139.8637237548828]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 3.0, 6.0, 9.0, 9.0, 8.0, 15.0, 13.0, 19.0, 19.0, 23.0, 23.0, 25.0, 29.0, 32.0, 34.0, 31.0, 23.0, 40.0, 41.0, 48.0, 39.0, 37.0, 36.0, 38.0, 30.0, 36.0, 36.0, 20.0, 32.0, 26.0, 25.0, 19.0, 24.0, 21.0, 16.0, 17.0, 20.0, 7.0, 12.0, 11.0, 6.0, 3.0, 8.0, 7.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.35373306274414, -24.54157257080078, -23.72941017150879, -22.91724967956543, -22.105087280273438, -21.292926788330078, -20.48076629638672, -19.668603897094727, -18.856443405151367, -18.044282913208008, -17.232120513916016, -16.419960021972656, -15.60779857635498, -14.795637130737305, -13.983475685119629, -13.171314239501953, -12.359152793884277, -11.546991348266602, -10.734829902648926, -9.92266845703125, -9.11050796508789, -8.298346519470215, -7.486185073852539, -6.6740241050720215, -5.861862659454346, -5.04970121383667, -4.237540245056152, -3.4253787994384766, -2.61321759223938, -1.8010563850402832, -0.9888949394226074, -0.17673397064208984, 0.6354274749755859, 1.4475886821746826, 2.2597498893737793, 3.071911334991455, 3.8840725421905518, 4.696233749389648, 5.508395195007324, 6.320556163787842, 7.132717609405518, 7.944879055023193, 8.757040023803711, 9.569201469421387, 10.381362915039062, 11.193523406982422, 12.005685806274414, 12.817846298217773, 13.63000774383545, 14.442169189453125, 15.2543306350708, 16.066492080688477, 16.878652572631836, 17.690814971923828, 18.502975463867188, 19.315135955810547, 20.12729835510254, 20.9394588470459, 21.75162124633789, 22.56378173828125, 23.375944137573242, 24.1881046295166, 25.000267028808594, 25.812427520751953, 26.624588012695312]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 12.0, 12.0, 17.0, 16.0, 19.0, 30.0, 27.0, 27.0, 28.0, 44.0, 38.0, 45.0, 48.0, 49.0, 55.0, 44.0, 54.0, 47.0, 37.0, 41.0, 35.0, 35.0, 36.0, 30.0, 31.0, 20.0, 11.0, 18.0, 12.0, 11.0, 7.0, 11.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.138671875, -3.043243408203125, -2.94781494140625, -2.852386474609375, -2.7569580078125, -2.661529541015625, -2.56610107421875, -2.470672607421875, -2.375244140625, -2.279815673828125, -2.18438720703125, -2.088958740234375, -1.9935302734375, -1.898101806640625, -1.80267333984375, -1.707244873046875, -1.61181640625, -1.516387939453125, -1.42095947265625, -1.325531005859375, -1.2301025390625, -1.134674072265625, -1.03924560546875, -0.943817138671875, -0.848388671875, -0.752960205078125, -0.65753173828125, -0.562103271484375, -0.4666748046875, -0.371246337890625, -0.27581787109375, -0.180389404296875, -0.0849609375, 0.010467529296875, 0.10589599609375, 0.201324462890625, 0.2967529296875, 0.392181396484375, 0.48760986328125, 0.583038330078125, 0.678466796875, 0.773895263671875, 0.86932373046875, 0.964752197265625, 1.0601806640625, 1.155609130859375, 1.25103759765625, 1.346466064453125, 1.44189453125, 1.537322998046875, 1.63275146484375, 1.728179931640625, 1.8236083984375, 1.919036865234375, 2.01446533203125, 2.109893798828125, 2.205322265625, 2.300750732421875, 2.39617919921875, 2.491607666015625, 2.5870361328125, 2.682464599609375, 2.77789306640625, 2.873321533203125, 2.96875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 10.0, 25.0, 23.0, 26.0, 47.0, 95.0, 107.0, 167.0, 293.0, 417.0, 679.0, 1202.0, 2217.0, 4334.0, 9773.0, 27206.0, 139078.0, 1457781.0, 2247907.0, 241964.0, 38458.0, 12147.0, 5058.0, 2364.0, 1172.0, 674.0, 368.0, 236.0, 151.0, 90.0, 74.0, 31.0, 27.0, 17.0, 11.0, 11.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.2890625, -10.00421142578125, -9.7193603515625, -9.43450927734375, -9.149658203125, -8.86480712890625, -8.5799560546875, -8.29510498046875, -8.01025390625, -7.72540283203125, -7.4405517578125, -7.15570068359375, -6.870849609375, -6.58599853515625, -6.3011474609375, -6.01629638671875, -5.7314453125, -5.44659423828125, -5.1617431640625, -4.87689208984375, -4.592041015625, -4.30718994140625, -4.0223388671875, -3.73748779296875, -3.45263671875, -3.16778564453125, -2.8829345703125, -2.59808349609375, -2.313232421875, -2.02838134765625, -1.7435302734375, -1.45867919921875, -1.173828125, -0.88897705078125, -0.6041259765625, -0.31927490234375, -0.034423828125, 0.25042724609375, 0.5352783203125, 0.82012939453125, 1.10498046875, 1.38983154296875, 1.6746826171875, 1.95953369140625, 2.244384765625, 2.52923583984375, 2.8140869140625, 3.09893798828125, 3.3837890625, 3.66864013671875, 3.9534912109375, 4.23834228515625, 4.523193359375, 4.80804443359375, 5.0928955078125, 5.37774658203125, 5.66259765625, 5.94744873046875, 6.2322998046875, 6.51715087890625, 6.802001953125, 7.08685302734375, 7.3717041015625, 7.65655517578125, 7.94140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 9.0, 5.0, 16.0, 13.0, 22.0, 28.0, 35.0, 70.0, 112.0, 169.0, 242.0, 363.0, 493.0, 621.0, 538.0, 409.0, 303.0, 190.0, 135.0, 70.0, 63.0, 44.0, 26.0, 20.0, 14.0, 10.0, 11.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.2890625, -7.035400390625, -6.78173828125, -6.528076171875, -6.2744140625, -6.020751953125, -5.76708984375, -5.513427734375, -5.259765625, -5.006103515625, -4.75244140625, -4.498779296875, -4.2451171875, -3.991455078125, -3.73779296875, -3.484130859375, -3.23046875, -2.976806640625, -2.72314453125, -2.469482421875, -2.2158203125, -1.962158203125, -1.70849609375, -1.454833984375, -1.201171875, -0.947509765625, -0.69384765625, -0.440185546875, -0.1865234375, 0.067138671875, 0.32080078125, 0.574462890625, 0.828125, 1.081787109375, 1.33544921875, 1.589111328125, 1.8427734375, 2.096435546875, 2.35009765625, 2.603759765625, 2.857421875, 3.111083984375, 3.36474609375, 3.618408203125, 3.8720703125, 4.125732421875, 4.37939453125, 4.633056640625, 4.88671875, 5.140380859375, 5.39404296875, 5.647705078125, 5.9013671875, 6.155029296875, 6.40869140625, 6.662353515625, 6.916015625, 7.169677734375, 7.42333984375, 7.677001953125, 7.9306640625, 8.184326171875, 8.43798828125, 8.691650390625, 8.9453125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 6.0, 5.0, 13.0, 12.0, 13.0, 35.0, 48.0, 56.0, 95.0, 184.0, 342.0, 626.0, 1453.0, 3699.0, 11632.0, 60272.0, 994363.0, 2912691.0, 176357.0, 22148.0, 6103.0, 2173.0, 931.0, 428.0, 216.0, 131.0, 72.0, 43.0, 34.0, 31.0, 16.0, 14.0, 11.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.8704833984375, -18.319091796875, -17.7677001953125, -17.21630859375, -16.6649169921875, -16.113525390625, -15.5621337890625, -15.0107421875, -14.4593505859375, -13.907958984375, -13.3565673828125, -12.80517578125, -12.2537841796875, -11.702392578125, -11.1510009765625, -10.599609375, -10.0482177734375, -9.496826171875, -8.9454345703125, -8.39404296875, -7.8426513671875, -7.291259765625, -6.7398681640625, -6.1884765625, -5.6370849609375, -5.085693359375, -4.5343017578125, -3.98291015625, -3.4315185546875, -2.880126953125, -2.3287353515625, -1.77734375, -1.2259521484375, -0.674560546875, -0.1231689453125, 0.42822265625, 0.9796142578125, 1.531005859375, 2.0823974609375, 2.6337890625, 3.1851806640625, 3.736572265625, 4.2879638671875, 4.83935546875, 5.3907470703125, 5.942138671875, 6.4935302734375, 7.044921875, 7.5963134765625, 8.147705078125, 8.6990966796875, 9.25048828125, 9.8018798828125, 10.353271484375, 10.9046630859375, 11.4560546875, 12.0074462890625, 12.558837890625, 13.1102294921875, 13.66162109375, 14.2130126953125, 14.764404296875, 15.3157958984375, 15.8671875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 15.0, 10.0, 33.0, 43.0, 66.0, 78.0, 100.0, 103.0, 106.0, 114.0, 93.0, 65.0, 51.0, 45.0, 25.0, 17.0, 9.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.406036376953125, -48.03774642944336, -46.66946029663086, -45.301170349121094, -43.932884216308594, -42.56459426879883, -41.19630432128906, -39.82801818847656, -38.4597282409668, -37.09143829345703, -35.72315216064453, -34.354862213134766, -32.986572265625, -31.6182861328125, -30.249996185302734, -28.8817081451416, -27.51342010498047, -26.145132064819336, -24.776844024658203, -23.408554077148438, -22.040266036987305, -20.671977996826172, -19.303688049316406, -17.935400009155273, -16.56711196899414, -15.198823928833008, -13.830534934997559, -12.46224594116211, -11.093957901000977, -9.725669860839844, -8.357380867004395, -6.989091873168945, -5.620807647705078, -4.252519130706787, -2.884230613708496, -1.515942096710205, -0.14765357971191406, 1.220634937286377, 2.588923454284668, 3.957212448120117, 5.32550048828125, 6.693789005279541, 8.062077522277832, 9.430366516113281, 10.798654556274414, 12.166942596435547, 13.535231590270996, 14.903520584106445, 16.271808624267578, 17.64009666442871, 19.008384704589844, 20.37667465209961, 21.744962692260742, 23.113250732421875, 24.48154067993164, 25.849828720092773, 27.218116760253906, 28.58640480041504, 29.954692840576172, 31.322982788085938, 32.69126892089844, 34.0595588684082, 35.42784881591797, 36.79613494873047, 38.164424896240234]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 14.0, 10.0, 9.0, 17.0, 15.0, 18.0, 17.0, 15.0, 21.0, 24.0, 24.0, 33.0, 36.0, 29.0, 33.0, 43.0, 40.0, 32.0, 28.0, 35.0, 32.0, 37.0, 40.0, 37.0, 46.0, 32.0, 39.0, 29.0, 24.0, 28.0, 24.0, 20.0, 19.0, 10.0, 14.0, 9.0, 13.0, 16.0, 11.0, 9.0, 8.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.156085968017578, -25.404306411743164, -24.652524948120117, -23.900745391845703, -23.14896583557129, -22.397184371948242, -21.645404815673828, -20.89362335205078, -20.141843795776367, -19.390064239501953, -18.638282775878906, -17.886503219604492, -17.134723663330078, -16.38294219970703, -15.631162643432617, -14.879382133483887, -14.127602577209473, -13.375822067260742, -12.624042510986328, -11.872262001037598, -11.120481491088867, -10.368701934814453, -9.616921424865723, -8.865140914916992, -8.113361358642578, -7.361581325531006, -6.609800815582275, -5.858020782470703, -5.106240272521973, -4.3544602394104, -3.602680206298828, -2.8508996963500977, -2.099119186401367, -1.3473389148712158, -0.595558762550354, 0.1562213897705078, 0.9080016613006592, 1.6597819328308105, 2.411561965942383, 3.1633424758911133, 3.9151225090026855, 4.666902542114258, 5.418683052062988, 6.1704630851745605, 6.922243118286133, 7.674023628234863, 8.425804138183594, 9.177583694458008, 9.929364204406738, 10.681144714355469, 11.432924270629883, 12.184704780578613, 12.936485290527344, 13.688264846801758, 14.440045356750488, 15.191825866699219, 15.943605422973633, 16.695384979248047, 17.447166442871094, 18.198945999145508, 18.950725555419922, 19.70250701904297, 20.454286575317383, 21.206066131591797, 21.957847595214844]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0, 8.0, 5.0, 1.0, 5.0, 11.0, 14.0, 12.0, 19.0, 22.0, 23.0, 27.0, 31.0, 42.0, 29.0, 40.0, 43.0, 37.0, 60.0, 54.0, 46.0, 35.0, 42.0, 61.0, 36.0, 49.0, 32.0, 49.0, 25.0, 24.0, 20.0, 26.0, 11.0, 19.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.107421875, -3.0081787109375, -2.908935546875, -2.8096923828125, -2.71044921875, -2.6112060546875, -2.511962890625, -2.4127197265625, -2.3134765625, -2.2142333984375, -2.114990234375, -2.0157470703125, -1.91650390625, -1.8172607421875, -1.718017578125, -1.6187744140625, -1.51953125, -1.4202880859375, -1.321044921875, -1.2218017578125, -1.12255859375, -1.0233154296875, -0.924072265625, -0.8248291015625, -0.7255859375, -0.6263427734375, -0.527099609375, -0.4278564453125, -0.32861328125, -0.2293701171875, -0.130126953125, -0.0308837890625, 0.068359375, 0.1676025390625, 0.266845703125, 0.3660888671875, 0.46533203125, 0.5645751953125, 0.663818359375, 0.7630615234375, 0.8623046875, 0.9615478515625, 1.060791015625, 1.1600341796875, 1.25927734375, 1.3585205078125, 1.457763671875, 1.5570068359375, 1.65625, 1.7554931640625, 1.854736328125, 1.9539794921875, 2.05322265625, 2.1524658203125, 2.251708984375, 2.3509521484375, 2.4501953125, 2.5494384765625, 2.648681640625, 2.7479248046875, 2.84716796875, 2.9464111328125, 3.045654296875, 3.1448974609375, 3.244140625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 13.0, 19.0, 20.0, 52.0, 68.0, 93.0, 128.0, 208.0, 307.0, 483.0, 693.0, 1033.0, 1606.0, 2451.0, 3652.0, 5676.0, 8713.0, 13744.0, 21105.0, 33493.0, 56761.0, 101764.0, 241199.0, 279582.0, 113250.0, 61446.0, 36416.0, 22868.0, 14570.0, 9430.0, 6098.0, 3970.0, 2603.0, 1708.0, 1114.0, 718.0, 512.0, 320.0, 230.0, 142.0, 95.0, 71.0, 46.0, 24.0, 19.0, 14.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1541748046875, -0.14965057373046875, -0.1451263427734375, -0.14060211181640625, -0.136077880859375, -0.13155364990234375, -0.1270294189453125, -0.12250518798828125, -0.11798095703125, -0.11345672607421875, -0.1089324951171875, -0.10440826416015625, -0.099884033203125, -0.09535980224609375, -0.0908355712890625, -0.08631134033203125, -0.081787109375, -0.07726287841796875, -0.0727386474609375, -0.06821441650390625, -0.063690185546875, -0.05916595458984375, -0.0546417236328125, -0.05011749267578125, -0.04559326171875, -0.04106903076171875, -0.0365447998046875, -0.03202056884765625, -0.027496337890625, -0.02297210693359375, -0.0184478759765625, -0.01392364501953125, -0.0093994140625, -0.00487518310546875, -0.0003509521484375, 0.00417327880859375, 0.008697509765625, 0.01322174072265625, 0.0177459716796875, 0.02227020263671875, 0.02679443359375, 0.03131866455078125, 0.0358428955078125, 0.04036712646484375, 0.044891357421875, 0.04941558837890625, 0.0539398193359375, 0.05846405029296875, 0.06298828125, 0.06751251220703125, 0.0720367431640625, 0.07656097412109375, 0.081085205078125, 0.08560943603515625, 0.0901336669921875, 0.09465789794921875, 0.09918212890625, 0.10370635986328125, 0.1082305908203125, 0.11275482177734375, 0.117279052734375, 0.12180328369140625, 0.1263275146484375, 0.13085174560546875, 0.1353759765625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 8.0, 7.0, 11.0, 16.0, 15.0, 8.0, 16.0, 17.0, 32.0, 19.0, 26.0, 25.0, 40.0, 43.0, 29.0, 36.0, 43.0, 34.0, 37.0, 1066.0, 42.0, 38.0, 50.0, 41.0, 29.0, 40.0, 36.0, 39.0, 24.0, 22.0, 14.0, 21.0, 11.0, 12.0, 11.0, 15.0, 7.0, 7.0, 7.0, 4.0, 7.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.298828125, -2.22186279296875, -2.1448974609375, -2.06793212890625, -1.990966796875, -1.91400146484375, -1.8370361328125, -1.76007080078125, -1.68310546875, -1.60614013671875, -1.5291748046875, -1.45220947265625, -1.375244140625, -1.29827880859375, -1.2213134765625, -1.14434814453125, -1.0673828125, -0.99041748046875, -0.9134521484375, -0.83648681640625, -0.759521484375, -0.68255615234375, -0.6055908203125, -0.52862548828125, -0.45166015625, -0.37469482421875, -0.2977294921875, -0.22076416015625, -0.143798828125, -0.06683349609375, 0.0101318359375, 0.08709716796875, 0.1640625, 0.24102783203125, 0.3179931640625, 0.39495849609375, 0.471923828125, 0.54888916015625, 0.6258544921875, 0.70281982421875, 0.77978515625, 0.85675048828125, 0.9337158203125, 1.01068115234375, 1.087646484375, 1.16461181640625, 1.2415771484375, 1.31854248046875, 1.3955078125, 1.47247314453125, 1.5494384765625, 1.62640380859375, 1.703369140625, 1.78033447265625, 1.8572998046875, 1.93426513671875, 2.01123046875, 2.08819580078125, 2.1651611328125, 2.24212646484375, 2.319091796875, 2.39605712890625, 2.4730224609375, 2.54998779296875, 2.626953125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 10.0, 22.0, 18.0, 19.0, 25.0, 53.0, 60.0, 103.0, 142.0, 147.0, 235.0, 322.0, 464.0, 619.0, 923.0, 1232.0, 1923.0, 2685.0, 3877.0, 5452.0, 7873.0, 12008.0, 17751.0, 26737.0, 40833.0, 65781.0, 116257.0, 1170532.0, 334786.0, 107504.0, 61664.0, 38815.0, 25357.0, 16509.0, 11107.0, 7859.0, 5189.0, 3595.0, 2455.0, 1743.0, 1256.0, 896.0, 686.0, 469.0, 327.0, 254.0, 149.0, 125.0, 90.0, 55.0, 32.0, 35.0, 26.0, 14.0, 10.0, 9.0, 9.0, 7.0, 4.0], "bins": [-0.05206298828125, -0.05048227310180664, -0.04890155792236328, -0.04732084274291992, -0.04574012756347656, -0.0441594123840332, -0.042578697204589844, -0.040997982025146484, -0.039417266845703125, -0.037836551666259766, -0.036255836486816406, -0.03467512130737305, -0.03309440612792969, -0.03151369094848633, -0.02993297576904297, -0.02835226058959961, -0.02677154541015625, -0.02519083023071289, -0.02361011505126953, -0.022029399871826172, -0.020448684692382812, -0.018867969512939453, -0.017287254333496094, -0.015706539154052734, -0.014125823974609375, -0.012545108795166016, -0.010964393615722656, -0.009383678436279297, -0.0078029632568359375, -0.006222248077392578, -0.004641532897949219, -0.0030608177185058594, -0.0014801025390625, 0.00010061264038085938, 0.0016813278198242188, 0.003262042999267578, 0.0048427581787109375, 0.006423473358154297, 0.008004188537597656, 0.009584903717041016, 0.011165618896484375, 0.012746334075927734, 0.014327049255371094, 0.015907764434814453, 0.017488479614257812, 0.019069194793701172, 0.02064990997314453, 0.02223062515258789, 0.02381134033203125, 0.02539205551147461, 0.02697277069091797, 0.028553485870361328, 0.030134201049804688, 0.03171491622924805, 0.033295631408691406, 0.034876346588134766, 0.036457061767578125, 0.038037776947021484, 0.039618492126464844, 0.0411992073059082, 0.04277992248535156, 0.04436063766479492, 0.04594135284423828, 0.04752206802368164, 0.049102783203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 13.0, 15.0, 7.0, 9.0, 27.0, 13.0, 27.0, 41.0, 42.0, 39.0, 46.0, 74.0, 118.0, 120.0, 73.0, 51.0, 37.0, 43.0, 35.0, 25.0, 23.0, 27.0, 22.0, 11.0, 12.0, 6.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00070953369140625, -0.000684201717376709, -0.000658869743347168, -0.000633537769317627, -0.0006082057952880859, -0.0005828738212585449, -0.0005575418472290039, -0.0005322098731994629, -0.0005068778991699219, -0.00048154592514038086, -0.00045621395111083984, -0.00043088197708129883, -0.0004055500030517578, -0.0003802180290222168, -0.0003548860549926758, -0.00032955408096313477, -0.00030422210693359375, -0.00027889013290405273, -0.0002535581588745117, -0.0002282261848449707, -0.0002028942108154297, -0.00017756223678588867, -0.00015223026275634766, -0.00012689828872680664, -0.00010156631469726562, -7.623434066772461e-05, -5.0902366638183594e-05, -2.5570392608642578e-05, -2.384185791015625e-07, 2.5093555450439453e-05, 5.042552947998047e-05, 7.575750350952148e-05, 0.0001010894775390625, 0.00012642145156860352, 0.00015175342559814453, 0.00017708539962768555, 0.00020241737365722656, 0.00022774934768676758, 0.0002530813217163086, 0.0002784132957458496, 0.0003037452697753906, 0.00032907724380493164, 0.00035440921783447266, 0.00037974119186401367, 0.0004050731658935547, 0.0004304051399230957, 0.0004557371139526367, 0.00048106908798217773, 0.0005064010620117188, 0.0005317330360412598, 0.0005570650100708008, 0.0005823969841003418, 0.0006077289581298828, 0.0006330609321594238, 0.0006583929061889648, 0.0006837248802185059, 0.0007090568542480469, 0.0007343888282775879, 0.0007597208023071289, 0.0007850527763366699, 0.0008103847503662109, 0.000835716724395752, 0.000861048698425293, 0.000886380672454834, 0.000911712646484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 8.0, 12.0, 5.0, 14.0, 20.0, 26.0, 32.0, 32.0, 57.0, 102.0, 175.0, 671.0, 8313.0, 449726.0, 578541.0, 9465.0, 793.0, 227.0, 100.0, 64.0, 43.0, 20.0, 25.0, 12.0, 12.0, 14.0, 10.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0154571533203125, -0.015027999877929688, -0.014598846435546875, -0.014169692993164062, -0.01374053955078125, -0.013311386108398438, -0.012882232666015625, -0.012453079223632812, -0.01202392578125, -0.011594772338867188, -0.011165618896484375, -0.010736465454101562, -0.01030731201171875, -0.009878158569335938, -0.009449005126953125, -0.009019851684570312, -0.0085906982421875, -0.008161544799804688, -0.007732391357421875, -0.0073032379150390625, -0.00687408447265625, -0.0064449310302734375, -0.006015777587890625, -0.0055866241455078125, -0.005157470703125, -0.0047283172607421875, -0.004299163818359375, -0.0038700103759765625, -0.00344085693359375, -0.0030117034912109375, -0.002582550048828125, -0.0021533966064453125, -0.0017242431640625, -0.0012950897216796875, -0.000865936279296875, -0.0004367828369140625, -7.62939453125e-06, 0.0004215240478515625, 0.000850677490234375, 0.0012798309326171875, 0.001708984375, 0.0021381378173828125, 0.002567291259765625, 0.0029964447021484375, 0.00342559814453125, 0.0038547515869140625, 0.004283905029296875, 0.0047130584716796875, 0.0051422119140625, 0.0055713653564453125, 0.006000518798828125, 0.0064296722412109375, 0.00685882568359375, 0.0072879791259765625, 0.007717132568359375, 0.008146286010742188, 0.008575439453125, 0.009004592895507812, 0.009433746337890625, 0.009862899780273438, 0.01029205322265625, 0.010721206665039062, 0.011150360107421875, 0.011579513549804688, 0.0120086669921875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 12.0, 485.0, 503.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022504893131554127, -0.001876032561995089, -0.0015015758108347654, -0.00112711894325912, -0.0007526621920987964, -0.00037820544093847275, -3.748573362827301e-06, 0.0003707080613821745, 0.0007451649289578199, 0.0011196216801181436, 0.0014940784312784672, 0.0018685352988541126, 0.002242992166429758, 0.00261744880117476, 0.0029919056687504053, 0.003366362303495407, 0.0037408191710710526, 0.004115276038646698, 0.0044897329062223434, 0.004864189773797989, 0.005238646175712347, 0.0056131030432879925, 0.005987559910863638, 0.006362016312777996, 0.0067364731803536415, 0.007110930047929287, 0.007485386915504932, 0.007859843783080578, 0.008234300650656223, 0.008608756586909294, 0.00898321345448494, 0.009357670322060585, 0.009732128120958805, 0.01010658498853445, 0.010481041856110096, 0.010855498723685741, 0.011229955591261387, 0.011604411527514458, 0.011978868395090103, 0.012353325262665749, 0.012727782130241394, 0.01310223899781704, 0.013476695865392685, 0.01385115273296833, 0.014225609600543976, 0.014600066468119621, 0.014974523335695267, 0.015348979271948338, 0.015723437070846558, 0.016097893938422203, 0.01647235080599785, 0.016846807673573494, 0.01722126454114914, 0.017595721408724785, 0.01797017827630043, 0.018344635143876076, 0.018719090148806572, 0.019093547016382217, 0.019468003883957863, 0.01984246075153351, 0.020216917619109154, 0.0205913744866848, 0.020965831354260445, 0.02134028822183609, 0.021714745089411736]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 5.0, 8.0, 9.0, 18.0, 19.0, 32.0, 38.0, 50.0, 47.0, 65.0, 65.0, 76.0, 59.0, 71.0, 78.0, 89.0, 61.0, 47.0, 42.0, 36.0, 18.0, 19.0, 19.0, 15.0, 6.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001292884349822998, -0.0012626098468899727, -0.0012323353439569473, -0.001202060841023922, -0.0011717863380908966, -0.0011415118351578712, -0.0011112373322248459, -0.0010809628292918205, -0.0010506883263587952, -0.0010204138234257698, -0.0009901393204927444, -0.0009598648175597191, -0.0009295903146266937, -0.0008993158116936684, -0.000869041308760643, -0.0008387668058276176, -0.0008084923028945923, -0.0007782177999615669, -0.0007479432970285416, -0.0007176687940955162, -0.0006873942911624908, -0.0006571197882294655, -0.0006268452852964401, -0.0005965707823634148, -0.0005662962794303894, -0.000536021776497364, -0.0005057472735643387, -0.0004754727706313133, -0.00044519826769828796, -0.0004149237647652626, -0.00038464926183223724, -0.0003543747588992119, -0.0003241002559661865, -0.00029382575303316116, -0.0002635512501001358, -0.00023327674716711044, -0.00020300224423408508, -0.00017272774130105972, -0.00014245323836803436, -0.000112178735435009, -8.190423250198364e-05, -5.162972956895828e-05, -2.1355226635932922e-05, 8.919276297092438e-06, 3.91937792301178e-05, 6.946828216314316e-05, 9.974278509616852e-05, 0.00013001728802919388, 0.00016029179096221924, 0.0001905662938952446, 0.00022084079682826996, 0.0002511152997612953, 0.0002813898026943207, 0.00031166430562734604, 0.0003419388085603714, 0.00037221331149339676, 0.0004024878144264221, 0.0004327623173594475, 0.00046303682029247284, 0.0004933113232254982, 0.0005235858261585236, 0.0005538603290915489, 0.0005841348320245743, 0.0006144093349575996, 0.000644683837890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0, 8.0, 5.0, 1.0, 5.0, 11.0, 14.0, 12.0, 19.0, 22.0, 24.0, 26.0, 31.0, 42.0, 29.0, 40.0, 43.0, 37.0, 60.0, 54.0, 46.0, 35.0, 42.0, 61.0, 36.0, 49.0, 32.0, 49.0, 25.0, 24.0, 20.0, 26.0, 11.0, 19.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.107421875, -3.0081787109375, -2.908935546875, -2.8096923828125, -2.71044921875, -2.6112060546875, -2.511962890625, -2.4127197265625, -2.3134765625, -2.2142333984375, -2.114990234375, -2.0157470703125, -1.91650390625, -1.8172607421875, -1.718017578125, -1.6187744140625, -1.51953125, -1.4202880859375, -1.321044921875, -1.2218017578125, -1.12255859375, -1.0233154296875, -0.924072265625, -0.8248291015625, -0.7255859375, -0.6263427734375, -0.527099609375, -0.4278564453125, -0.32861328125, -0.2293701171875, -0.130126953125, -0.0308837890625, 0.068359375, 0.1676025390625, 0.266845703125, 0.3660888671875, 0.46533203125, 0.5645751953125, 0.663818359375, 0.7630615234375, 0.8623046875, 0.9615478515625, 1.060791015625, 1.1600341796875, 1.25927734375, 1.3585205078125, 1.457763671875, 1.5570068359375, 1.65625, 1.7554931640625, 1.854736328125, 1.9539794921875, 2.05322265625, 2.1524658203125, 2.251708984375, 2.3509521484375, 2.4501953125, 2.5494384765625, 2.648681640625, 2.7479248046875, 2.84716796875, 2.9464111328125, 3.045654296875, 3.1448974609375, 3.244140625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 10.0, 11.0, 17.0, 39.0, 46.0, 81.0, 115.0, 202.0, 367.0, 691.0, 1319.0, 2844.0, 6723.0, 19350.0, 75653.0, 466056.0, 383934.0, 63006.0, 16792.0, 6000.0, 2576.0, 1236.0, 621.0, 321.0, 200.0, 121.0, 86.0, 32.0, 29.0, 19.0, 17.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.2568359375, -10.880859375, -10.5048828125, -10.12890625, -9.7529296875, -9.376953125, -9.0009765625, -8.625, -8.2490234375, -7.873046875, -7.4970703125, -7.12109375, -6.7451171875, -6.369140625, -5.9931640625, -5.6171875, -5.2412109375, -4.865234375, -4.4892578125, -4.11328125, -3.7373046875, -3.361328125, -2.9853515625, -2.609375, -2.2333984375, -1.857421875, -1.4814453125, -1.10546875, -0.7294921875, -0.353515625, 0.0224609375, 0.3984375, 0.7744140625, 1.150390625, 1.5263671875, 1.90234375, 2.2783203125, 2.654296875, 3.0302734375, 3.40625, 3.7822265625, 4.158203125, 4.5341796875, 4.91015625, 5.2861328125, 5.662109375, 6.0380859375, 6.4140625, 6.7900390625, 7.166015625, 7.5419921875, 7.91796875, 8.2939453125, 8.669921875, 9.0458984375, 9.421875, 9.7978515625, 10.173828125, 10.5498046875, 10.92578125, 11.3017578125, 11.677734375, 12.0537109375, 12.4296875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 13.0, 15.0, 13.0, 11.0, 22.0, 12.0, 33.0, 43.0, 32.0, 41.0, 45.0, 60.0, 101.0, 138.0, 208.0, 1313.0, 249.0, 177.0, 98.0, 74.0, 60.0, 40.0, 40.0, 34.0, 32.0, 23.0, 8.0, 19.0, 20.0, 10.0, 11.0, 13.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.20654296875, -8.8974609375, -8.58837890625, -8.279296875, -7.97021484375, -7.6611328125, -7.35205078125, -7.04296875, -6.73388671875, -6.4248046875, -6.11572265625, -5.806640625, -5.49755859375, -5.1884765625, -4.87939453125, -4.5703125, -4.26123046875, -3.9521484375, -3.64306640625, -3.333984375, -3.02490234375, -2.7158203125, -2.40673828125, -2.09765625, -1.78857421875, -1.4794921875, -1.17041015625, -0.861328125, -0.55224609375, -0.2431640625, 0.06591796875, 0.375, 0.68408203125, 0.9931640625, 1.30224609375, 1.611328125, 1.92041015625, 2.2294921875, 2.53857421875, 2.84765625, 3.15673828125, 3.4658203125, 3.77490234375, 4.083984375, 4.39306640625, 4.7021484375, 5.01123046875, 5.3203125, 5.62939453125, 5.9384765625, 6.24755859375, 6.556640625, 6.86572265625, 7.1748046875, 7.48388671875, 7.79296875, 8.10205078125, 8.4111328125, 8.72021484375, 9.029296875, 9.33837890625, 9.6474609375, 9.95654296875, 10.265625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 15.0, 8.0, 14.0, 13.0, 21.0, 29.0, 31.0, 41.0, 61.0, 101.0, 169.0, 293.0, 629.0, 1467.0, 4089.0, 13232.0, 74066.0, 1477895.0, 1478421.0, 74509.0, 13687.0, 4047.0, 1478.0, 605.0, 288.0, 132.0, 97.0, 62.0, 46.0, 33.0, 21.0, 13.0, 17.0, 11.0, 12.0, 9.0, 5.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.234375, -15.72705078125, -15.2197265625, -14.71240234375, -14.205078125, -13.69775390625, -13.1904296875, -12.68310546875, -12.17578125, -11.66845703125, -11.1611328125, -10.65380859375, -10.146484375, -9.63916015625, -9.1318359375, -8.62451171875, -8.1171875, -7.60986328125, -7.1025390625, -6.59521484375, -6.087890625, -5.58056640625, -5.0732421875, -4.56591796875, -4.05859375, -3.55126953125, -3.0439453125, -2.53662109375, -2.029296875, -1.52197265625, -1.0146484375, -0.50732421875, 0.0, 0.50732421875, 1.0146484375, 1.52197265625, 2.029296875, 2.53662109375, 3.0439453125, 3.55126953125, 4.05859375, 4.56591796875, 5.0732421875, 5.58056640625, 6.087890625, 6.59521484375, 7.1025390625, 7.60986328125, 8.1171875, 8.62451171875, 9.1318359375, 9.63916015625, 10.146484375, 10.65380859375, 11.1611328125, 11.66845703125, 12.17578125, 12.68310546875, 13.1904296875, 13.69775390625, 14.205078125, 14.71240234375, 15.2197265625, 15.72705078125, 16.234375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 15.0, 20.0, 40.0, 68.0, 100.0, 125.0, 147.0, 134.0, 132.0, 82.0, 54.0, 45.0, 19.0, 12.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.56389045715332, -15.25368881225586, -13.943486213684082, -12.633284568786621, -11.323081970214844, -10.012880325317383, -8.702678680419922, -7.3924760818481445, -6.082274436950684, -4.7720723152160645, -3.4618704319000244, -2.1516685485839844, -0.8414664268493652, 0.4687356948852539, 1.7789373397827148, 3.089139938354492, 4.399341583251953, 5.709543704986572, 7.019745826721191, 8.329947471618652, 9.64015007019043, 10.95035171508789, 12.260553359985352, 13.570755958557129, 14.88095760345459, 16.191160202026367, 17.501361846923828, 18.81156349182129, 20.12176513671875, 21.431968688964844, 22.742168426513672, 24.052371978759766, 25.36257553100586, 26.67277717590332, 27.98297882080078, 29.293182373046875, 30.603384017944336, 31.913585662841797, 33.223785400390625, 34.53398895263672, 35.84419250488281, 37.154396057128906, 38.464595794677734, 39.77479934692383, 41.084999084472656, 42.39520263671875, 43.705406188964844, 45.01560592651367, 46.3258056640625, 47.636009216308594, 48.94620895385742, 50.256412506103516, 51.566612243652344, 52.87681579589844, 54.18701934814453, 55.49721908569336, 56.80742263793945, 58.11762619018555, 59.427825927734375, 60.73802947998047, 62.0482292175293, 63.35843276977539, 64.66863250732422, 65.97883605957031, 67.2890396118164]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 9.0, 11.0, 17.0, 14.0, 14.0, 23.0, 27.0, 27.0, 25.0, 24.0, 26.0, 30.0, 37.0, 47.0, 47.0, 45.0, 46.0, 40.0, 43.0, 48.0, 36.0, 48.0, 30.0, 40.0, 32.0, 20.0, 31.0, 26.0, 18.0, 16.0, 13.0, 11.0, 9.0, 13.0, 8.0, 12.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.860036849975586, -28.899385452270508, -27.93873405456543, -26.97808074951172, -26.01742935180664, -25.056777954101562, -24.096126556396484, -23.135475158691406, -22.174823760986328, -21.21417236328125, -20.253520965576172, -19.292869567871094, -18.332216262817383, -17.371564865112305, -16.410913467407227, -15.450262069702148, -14.489608764648438, -13.52895736694336, -12.568305015563965, -11.607653617858887, -10.647001266479492, -9.686349868774414, -8.725698471069336, -7.7650465965271, -6.804394721984863, -5.843742847442627, -4.883090972900391, -3.9224395751953125, -2.961787700653076, -2.00113582611084, -1.0404844284057617, -0.07983255386352539, 0.8808174133300781, 1.841469168663025, 2.8021209239959717, 3.762772560119629, 4.723424434661865, 5.684076309204102, 6.64472770690918, 7.605379581451416, 8.566031455993652, 9.52668285369873, 10.487335205078125, 11.447986602783203, 12.408638000488281, 13.369290351867676, 14.329941749572754, 15.290594100952148, 16.251245498657227, 17.211896896362305, 18.172548294067383, 19.133201599121094, 20.093852996826172, 21.05450439453125, 22.015155792236328, 22.975807189941406, 23.936458587646484, 24.897109985351562, 25.85776138305664, 26.81841278076172, 27.77906608581543, 28.739717483520508, 29.700368881225586, 30.661020278930664, 31.621673583984375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 1.0, 6.0, 15.0, 23.0, 17.0, 19.0, 22.0, 22.0, 50.0, 21.0, 35.0, 32.0, 40.0, 38.0, 49.0, 53.0, 49.0, 38.0, 46.0, 37.0, 50.0, 48.0, 36.0, 39.0, 37.0, 30.0, 24.0, 20.0, 19.0, 7.0, 13.0, 9.0, 8.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.486328125, -3.382415771484375, -3.27850341796875, -3.174591064453125, -3.0706787109375, -2.966766357421875, -2.86285400390625, -2.758941650390625, -2.655029296875, -2.551116943359375, -2.44720458984375, -2.343292236328125, -2.2393798828125, -2.135467529296875, -2.03155517578125, -1.927642822265625, -1.82373046875, -1.719818115234375, -1.61590576171875, -1.511993408203125, -1.4080810546875, -1.304168701171875, -1.20025634765625, -1.096343994140625, -0.992431640625, -0.888519287109375, -0.78460693359375, -0.680694580078125, -0.5767822265625, -0.472869873046875, -0.36895751953125, -0.265045166015625, -0.1611328125, -0.057220458984375, 0.04669189453125, 0.150604248046875, 0.2545166015625, 0.358428955078125, 0.46234130859375, 0.566253662109375, 0.670166015625, 0.774078369140625, 0.87799072265625, 0.981903076171875, 1.0858154296875, 1.189727783203125, 1.29364013671875, 1.397552490234375, 1.50146484375, 1.605377197265625, 1.70928955078125, 1.813201904296875, 1.9171142578125, 2.021026611328125, 2.12493896484375, 2.228851318359375, 2.332763671875, 2.436676025390625, 2.54058837890625, 2.644500732421875, 2.7484130859375, 2.852325439453125, 2.95623779296875, 3.060150146484375, 3.1640625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 4.0, 9.0, 7.0, 25.0, 24.0, 40.0, 49.0, 108.0, 158.0, 272.0, 455.0, 771.0, 1500.0, 3344.0, 8105.0, 26570.0, 199498.0, 2623301.0, 1221508.0, 82779.0, 15952.0, 5244.0, 2146.0, 1069.0, 549.0, 311.0, 172.0, 114.0, 67.0, 42.0, 33.0, 14.0, 11.0, 13.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4921875, -11.1419677734375, -10.791748046875, -10.4415283203125, -10.09130859375, -9.7410888671875, -9.390869140625, -9.0406494140625, -8.6904296875, -8.3402099609375, -7.989990234375, -7.6397705078125, -7.28955078125, -6.9393310546875, -6.589111328125, -6.2388916015625, -5.888671875, -5.5384521484375, -5.188232421875, -4.8380126953125, -4.48779296875, -4.1375732421875, -3.787353515625, -3.4371337890625, -3.0869140625, -2.7366943359375, -2.386474609375, -2.0362548828125, -1.68603515625, -1.3358154296875, -0.985595703125, -0.6353759765625, -0.28515625, 0.0650634765625, 0.415283203125, 0.7655029296875, 1.11572265625, 1.4659423828125, 1.816162109375, 2.1663818359375, 2.5166015625, 2.8668212890625, 3.217041015625, 3.5672607421875, 3.91748046875, 4.2677001953125, 4.617919921875, 4.9681396484375, 5.318359375, 5.6685791015625, 6.018798828125, 6.3690185546875, 6.71923828125, 7.0694580078125, 7.419677734375, 7.7698974609375, 8.1201171875, 8.4703369140625, 8.820556640625, 9.1707763671875, 9.52099609375, 9.8712158203125, 10.221435546875, 10.5716552734375, 10.921875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 5.0, 2.0, 7.0, 9.0, 11.0, 12.0, 25.0, 25.0, 38.0, 52.0, 69.0, 96.0, 114.0, 155.0, 241.0, 302.0, 389.0, 458.0, 482.0, 428.0, 304.0, 220.0, 182.0, 134.0, 82.0, 47.0, 44.0, 33.0, 13.0, 16.0, 14.0, 15.0, 13.0, 4.0, 8.0, 3.0, 10.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.28125, -6.07208251953125, -5.8629150390625, -5.65374755859375, -5.444580078125, -5.23541259765625, -5.0262451171875, -4.81707763671875, -4.60791015625, -4.39874267578125, -4.1895751953125, -3.98040771484375, -3.771240234375, -3.56207275390625, -3.3529052734375, -3.14373779296875, -2.9345703125, -2.72540283203125, -2.5162353515625, -2.30706787109375, -2.097900390625, -1.88873291015625, -1.6795654296875, -1.47039794921875, -1.26123046875, -1.05206298828125, -0.8428955078125, -0.63372802734375, -0.424560546875, -0.21539306640625, -0.0062255859375, 0.20294189453125, 0.412109375, 0.62127685546875, 0.8304443359375, 1.03961181640625, 1.248779296875, 1.45794677734375, 1.6671142578125, 1.87628173828125, 2.08544921875, 2.29461669921875, 2.5037841796875, 2.71295166015625, 2.922119140625, 3.13128662109375, 3.3404541015625, 3.54962158203125, 3.7587890625, 3.96795654296875, 4.1771240234375, 4.38629150390625, 4.595458984375, 4.80462646484375, 5.0137939453125, 5.22296142578125, 5.43212890625, 5.64129638671875, 5.8504638671875, 6.05963134765625, 6.268798828125, 6.47796630859375, 6.6871337890625, 6.89630126953125, 7.10546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 13.0, 6.0, 18.0, 19.0, 23.0, 24.0, 32.0, 53.0, 88.0, 143.0, 270.0, 711.0, 1902.0, 7106.0, 56316.0, 2241944.0, 1828059.0, 47723.0, 6559.0, 1820.0, 634.0, 307.0, 159.0, 111.0, 66.0, 38.0, 28.0, 26.0, 15.0, 18.0, 4.0, 4.0, 10.0, 2.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.375, -22.666015625, -21.95703125, -21.248046875, -20.5390625, -19.830078125, -19.12109375, -18.412109375, -17.703125, -16.994140625, -16.28515625, -15.576171875, -14.8671875, -14.158203125, -13.44921875, -12.740234375, -12.03125, -11.322265625, -10.61328125, -9.904296875, -9.1953125, -8.486328125, -7.77734375, -7.068359375, -6.359375, -5.650390625, -4.94140625, -4.232421875, -3.5234375, -2.814453125, -2.10546875, -1.396484375, -0.6875, 0.021484375, 0.73046875, 1.439453125, 2.1484375, 2.857421875, 3.56640625, 4.275390625, 4.984375, 5.693359375, 6.40234375, 7.111328125, 7.8203125, 8.529296875, 9.23828125, 9.947265625, 10.65625, 11.365234375, 12.07421875, 12.783203125, 13.4921875, 14.201171875, 14.91015625, 15.619140625, 16.328125, 17.037109375, 17.74609375, 18.455078125, 19.1640625, 19.873046875, 20.58203125, 21.291015625, 22.0]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 16.0, 29.0, 86.0, 143.0, 184.0, 229.0, 151.0, 95.0, 46.0, 14.0, 9.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.230268478393555, -17.723499298095703, -15.216730117797852, -12.709961891174316, -10.203192710876465, -7.696423530578613, -5.189655303955078, -2.6828861236572266, -0.176116943359375, 2.3306519985198975, 4.83742094039917, 7.344189643859863, 9.850958824157715, 12.357728004455566, 14.864496231079102, 17.371265411376953, 19.878034591674805, 22.384803771972656, 24.891572952270508, 27.39834213256836, 29.905109405517578, 32.41188049316406, 34.91864776611328, 37.4254150390625, 39.932186126708984, 42.4389533996582, 44.94572448730469, 47.452491760253906, 49.95926284790039, 52.46603012084961, 54.972801208496094, 57.47956848144531, 59.98633575439453, 62.49310302734375, 64.99987030029297, 67.50664520263672, 70.01341247558594, 72.52017974853516, 75.02694702148438, 77.53372192382812, 80.04048919677734, 82.54725646972656, 85.05402374267578, 87.56079864501953, 90.06756591796875, 92.57433319091797, 95.08110046386719, 97.58787536621094, 100.09463500976562, 102.60140228271484, 105.10816955566406, 107.61494445800781, 110.12171173095703, 112.62847900390625, 115.13524627685547, 117.64201354980469, 120.14878845214844, 122.65555572509766, 125.16232299804688, 127.66909790039062, 130.1758575439453, 132.68263244628906, 135.1894073486328, 137.6961669921875, 140.20294189453125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 5.0, 10.0, 8.0, 11.0, 14.0, 18.0, 16.0, 21.0, 16.0, 37.0, 30.0, 38.0, 29.0, 33.0, 41.0, 44.0, 50.0, 39.0, 50.0, 49.0, 53.0, 44.0, 45.0, 36.0, 25.0, 21.0, 22.0, 31.0, 26.0, 19.0, 22.0, 18.0, 18.0, 12.0, 8.0, 6.0, 10.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.2144832611084, -24.47092628479004, -23.727367401123047, -22.983810424804688, -22.240253448486328, -21.49669647216797, -20.75313949584961, -20.009580612182617, -19.266023635864258, -18.5224666595459, -17.778907775878906, -17.035350799560547, -16.291793823242188, -15.548236846923828, -14.804678916931152, -14.061120986938477, -13.317564010620117, -12.574007034301758, -11.830449104309082, -11.086891174316406, -10.343334197998047, -9.599777221679688, -8.856219291687012, -8.112661361694336, -7.369104385375977, -6.625546932220459, -5.881989479064941, -5.138432025909424, -4.394874572753906, -3.6513171195983887, -2.907759666442871, -2.1642022132873535, -1.4206466674804688, -0.6770892143249512, 0.0664682388305664, 0.810025691986084, 1.5535831451416016, 2.297140598297119, 3.0406980514526367, 3.7842555046081543, 4.527812957763672, 5.2713704109191895, 6.014927864074707, 6.758485317230225, 7.502042770385742, 8.245599746704102, 8.989157676696777, 9.732715606689453, 10.476272583007812, 11.219829559326172, 11.963387489318848, 12.706945419311523, 13.450502395629883, 14.194059371948242, 14.937617301940918, 15.681175231933594, 16.424732208251953, 17.168289184570312, 17.911846160888672, 18.655405044555664, 19.398962020874023, 20.142518997192383, 20.886077880859375, 21.629634857177734, 22.373191833496094]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 6.0, 11.0, 10.0, 15.0, 14.0, 19.0, 30.0, 29.0, 30.0, 22.0, 28.0, 39.0, 53.0, 35.0, 44.0, 47.0, 42.0, 40.0, 50.0, 39.0, 45.0, 43.0, 37.0, 40.0, 42.0, 32.0, 27.0, 17.0, 18.0, 18.0, 12.0, 19.0, 8.0, 7.0, 6.0, 4.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.013580322265625, -2.90997314453125, -2.806365966796875, -2.7027587890625, -2.599151611328125, -2.49554443359375, -2.391937255859375, -2.288330078125, -2.184722900390625, -2.08111572265625, -1.977508544921875, -1.8739013671875, -1.770294189453125, -1.66668701171875, -1.563079833984375, -1.45947265625, -1.355865478515625, -1.25225830078125, -1.148651123046875, -1.0450439453125, -0.941436767578125, -0.83782958984375, -0.734222412109375, -0.630615234375, -0.527008056640625, -0.42340087890625, -0.319793701171875, -0.2161865234375, -0.112579345703125, -0.00897216796875, 0.094635009765625, 0.1982421875, 0.301849365234375, 0.40545654296875, 0.509063720703125, 0.6126708984375, 0.716278076171875, 0.81988525390625, 0.923492431640625, 1.027099609375, 1.130706787109375, 1.23431396484375, 1.337921142578125, 1.4415283203125, 1.545135498046875, 1.64874267578125, 1.752349853515625, 1.85595703125, 1.959564208984375, 2.06317138671875, 2.166778564453125, 2.2703857421875, 2.373992919921875, 2.47760009765625, 2.581207275390625, 2.684814453125, 2.788421630859375, 2.89202880859375, 2.995635986328125, 3.0992431640625, 3.202850341796875, 3.30645751953125, 3.410064697265625, 3.513671875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 18.0, 13.0, 21.0, 43.0, 59.0, 81.0, 149.0, 153.0, 291.0, 399.0, 654.0, 1037.0, 1585.0, 2429.0, 3767.0, 5756.0, 9417.0, 15253.0, 25505.0, 44359.0, 81679.0, 169423.0, 325170.0, 168612.0, 81923.0, 44404.0, 25564.0, 15045.0, 9259.0, 5881.0, 3776.0, 2366.0, 1475.0, 1020.0, 661.0, 433.0, 300.0, 195.0, 122.0, 92.0, 49.0, 37.0, 22.0, 21.0, 17.0, 10.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.16057205200195312, -0.15512847900390625, -0.14968490600585938, -0.1442413330078125, -0.13879776000976562, -0.13335418701171875, -0.12791061401367188, -0.122467041015625, -0.11702346801757812, -0.11157989501953125, -0.10613632202148438, -0.1006927490234375, -0.09524917602539062, -0.08980560302734375, -0.08436203002929688, -0.07891845703125, -0.07347488403320312, -0.06803131103515625, -0.06258773803710938, -0.0571441650390625, -0.051700592041015625, -0.04625701904296875, -0.040813446044921875, -0.035369873046875, -0.029926300048828125, -0.02448272705078125, -0.019039154052734375, -0.0135955810546875, -0.008152008056640625, -0.00270843505859375, 0.002735137939453125, 0.0081787109375, 0.013622283935546875, 0.01906585693359375, 0.024509429931640625, 0.0299530029296875, 0.035396575927734375, 0.04084014892578125, 0.046283721923828125, 0.051727294921875, 0.057170867919921875, 0.06261444091796875, 0.06805801391601562, 0.0735015869140625, 0.07894515991210938, 0.08438873291015625, 0.08983230590820312, 0.09527587890625, 0.10071945190429688, 0.10616302490234375, 0.11160659790039062, 0.1170501708984375, 0.12249374389648438, 0.12793731689453125, 0.13338088989257812, 0.138824462890625, 0.14426803588867188, 0.14971160888671875, 0.15515518188476562, 0.1605987548828125, 0.16604232788085938, 0.17148590087890625, 0.17692947387695312, 0.182373046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 12.0, 7.0, 12.0, 13.0, 16.0, 16.0, 21.0, 16.0, 17.0, 28.0, 26.0, 26.0, 26.0, 42.0, 35.0, 33.0, 44.0, 36.0, 38.0, 1064.0, 39.0, 36.0, 39.0, 38.0, 26.0, 36.0, 28.0, 31.0, 31.0, 33.0, 22.0, 18.0, 21.0, 12.0, 16.0, 11.0, 13.0, 7.0, 5.0, 6.0, 9.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.615234375, -2.535308837890625, -2.45538330078125, -2.375457763671875, -2.2955322265625, -2.215606689453125, -2.13568115234375, -2.055755615234375, -1.975830078125, -1.895904541015625, -1.81597900390625, -1.736053466796875, -1.6561279296875, -1.576202392578125, -1.49627685546875, -1.416351318359375, -1.33642578125, -1.256500244140625, -1.17657470703125, -1.096649169921875, -1.0167236328125, -0.936798095703125, -0.85687255859375, -0.776947021484375, -0.697021484375, -0.617095947265625, -0.53717041015625, -0.457244873046875, -0.3773193359375, -0.297393798828125, -0.21746826171875, -0.137542724609375, -0.0576171875, 0.022308349609375, 0.10223388671875, 0.182159423828125, 0.2620849609375, 0.342010498046875, 0.42193603515625, 0.501861572265625, 0.581787109375, 0.661712646484375, 0.74163818359375, 0.821563720703125, 0.9014892578125, 0.981414794921875, 1.06134033203125, 1.141265869140625, 1.22119140625, 1.301116943359375, 1.38104248046875, 1.460968017578125, 1.5408935546875, 1.620819091796875, 1.70074462890625, 1.780670166015625, 1.860595703125, 1.940521240234375, 2.02044677734375, 2.100372314453125, 2.1802978515625, 2.260223388671875, 2.34014892578125, 2.420074462890625, 2.5]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 7.0, 10.0, 17.0, 13.0, 31.0, 33.0, 45.0, 72.0, 87.0, 126.0, 181.0, 299.0, 385.0, 518.0, 712.0, 1051.0, 1457.0, 1978.0, 2709.0, 3980.0, 5565.0, 7791.0, 11214.0, 15667.0, 23360.0, 34812.0, 53961.0, 89851.0, 170040.0, 1300163.0, 141790.0, 78705.0, 48532.0, 31463.0, 20914.0, 14568.0, 10081.0, 7094.0, 5098.0, 3584.0, 2611.0, 1898.0, 1280.0, 967.0, 684.0, 477.0, 369.0, 258.0, 203.0, 127.0, 81.0, 70.0, 46.0, 40.0, 19.0, 21.0, 12.0, 11.0, 1.0, 5.0, 2.0, 1.0], "bins": [-0.050750732421875, -0.04913330078125, -0.047515869140625, -0.0458984375, -0.044281005859375, -0.04266357421875, -0.041046142578125, -0.0394287109375, -0.037811279296875, -0.03619384765625, -0.034576416015625, -0.032958984375, -0.031341552734375, -0.02972412109375, -0.028106689453125, -0.0264892578125, -0.024871826171875, -0.02325439453125, -0.021636962890625, -0.02001953125, -0.018402099609375, -0.01678466796875, -0.015167236328125, -0.0135498046875, -0.011932373046875, -0.01031494140625, -0.008697509765625, -0.007080078125, -0.005462646484375, -0.00384521484375, -0.002227783203125, -0.0006103515625, 0.001007080078125, 0.00262451171875, 0.004241943359375, 0.005859375, 0.007476806640625, 0.00909423828125, 0.010711669921875, 0.0123291015625, 0.013946533203125, 0.01556396484375, 0.017181396484375, 0.018798828125, 0.020416259765625, 0.02203369140625, 0.023651123046875, 0.0252685546875, 0.026885986328125, 0.02850341796875, 0.030120849609375, 0.03173828125, 0.033355712890625, 0.03497314453125, 0.036590576171875, 0.0382080078125, 0.039825439453125, 0.04144287109375, 0.043060302734375, 0.044677734375, 0.046295166015625, 0.04791259765625, 0.049530029296875, 0.0511474609375, 0.052764892578125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 1.0, 7.0, 7.0, 6.0, 8.0, 8.0, 7.0, 19.0, 24.0, 30.0, 27.0, 36.0, 54.0, 58.0, 73.0, 126.0, 125.0, 83.0, 47.0, 44.0, 31.0, 32.0, 27.0, 18.0, 11.0, 15.0, 5.0, 9.0, 12.0, 6.0, 7.0, 1.0, 5.0, 2.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009245872497558594, -0.0008936896920204163, -0.0008627921342849731, -0.00083189457654953, -0.0008009970188140869, -0.0007700994610786438, -0.0007392019033432007, -0.0007083043456077576, -0.0006774067878723145, -0.0006465092301368713, -0.0006156116724014282, -0.0005847141146659851, -0.000553816556930542, -0.0005229189991950989, -0.0004920214414596558, -0.00046112388372421265, -0.00043022632598876953, -0.0003993287682533264, -0.0003684312105178833, -0.0003375336527824402, -0.00030663609504699707, -0.00027573853731155396, -0.00024484097957611084, -0.00021394342184066772, -0.0001830458641052246, -0.0001521483063697815, -0.00012125074863433838, -9.035319089889526e-05, -5.945563316345215e-05, -2.8558075428009033e-05, 2.339482307434082e-06, 3.32370400428772e-05, 6.413459777832031e-05, 9.503215551376343e-05, 0.00012592971324920654, 0.00015682727098464966, 0.00018772482872009277, 0.0002186223864555359, 0.000249519944190979, 0.0002804175019264221, 0.00031131505966186523, 0.00034221261739730835, 0.00037311017513275146, 0.0004040077328681946, 0.0004349052906036377, 0.0004658028483390808, 0.0004967004060745239, 0.000527597963809967, 0.0005584955215454102, 0.0005893930792808533, 0.0006202906370162964, 0.0006511881947517395, 0.0006820857524871826, 0.0007129833102226257, 0.0007438808679580688, 0.000774778425693512, 0.0008056759834289551, 0.0008365735411643982, 0.0008674710988998413, 0.0008983686566352844, 0.0009292662143707275, 0.0009601637721061707, 0.0009910613298416138, 0.0010219588875770569, 0.0010528564453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 10.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 13.0, 5.0, 11.0, 15.0, 17.0, 35.0, 40.0, 72.0, 102.0, 283.0, 1278.0, 31318.0, 979370.0, 33975.0, 1363.0, 251.0, 116.0, 58.0, 51.0, 37.0, 27.0, 16.0, 9.0, 11.0, 7.0, 6.0, 6.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.019622802734375, -0.019054174423217773, -0.018485546112060547, -0.01791691780090332, -0.017348289489746094, -0.016779661178588867, -0.01621103286743164, -0.015642404556274414, -0.015073776245117188, -0.014505147933959961, -0.013936519622802734, -0.013367891311645508, -0.012799263000488281, -0.012230634689331055, -0.011662006378173828, -0.011093378067016602, -0.010524749755859375, -0.009956121444702148, -0.009387493133544922, -0.008818864822387695, -0.008250236511230469, -0.007681608200073242, -0.007112979888916016, -0.006544351577758789, -0.0059757232666015625, -0.005407094955444336, -0.004838466644287109, -0.004269838333129883, -0.0037012100219726562, -0.0031325817108154297, -0.002563953399658203, -0.0019953250885009766, -0.00142669677734375, -0.0008580684661865234, -0.0002894401550292969, 0.0002791881561279297, 0.0008478164672851562, 0.0014164447784423828, 0.0019850730895996094, 0.002553701400756836, 0.0031223297119140625, 0.003690958023071289, 0.004259586334228516, 0.004828214645385742, 0.005396842956542969, 0.005965471267700195, 0.006534099578857422, 0.0071027278900146484, 0.007671356201171875, 0.008239984512329102, 0.008808612823486328, 0.009377241134643555, 0.009945869445800781, 0.010514497756958008, 0.011083126068115234, 0.011651754379272461, 0.012220382690429688, 0.012789011001586914, 0.01335763931274414, 0.013926267623901367, 0.014494895935058594, 0.01506352424621582, 0.015632152557373047, 0.016200780868530273, 0.0167694091796875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 653.0, 359.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018341382965445518, -0.001212620292790234, -0.0005911022890359163, 3.0415714718401432e-05, 0.0006519337184727192, 0.0012734518386423588, 0.0018949697259813547, 0.0025164876133203506, 0.0031380057334899902, 0.00375952385365963, 0.004381041973829269, 0.005002559628337622, 0.005624077748507261, 0.006245595868676901, 0.006867113523185253, 0.007488631643354893, 0.008110149763524532, 0.008731667883694172, 0.009353186003863811, 0.009974704124033451, 0.010596221312880516, 0.011217739433050156, 0.011839257553219795, 0.012460775673389435, 0.013082293793559074, 0.013703811913728714, 0.014325330033898354, 0.014946848154067993, 0.015568366274237633, 0.016189884394407272, 0.016811402514576912, 0.01743292063474655, 0.018054436892271042, 0.01867595501244068, 0.01929747313261032, 0.01991899125277996, 0.0205405093729496, 0.02116202749311924, 0.02178354561328888, 0.02240506187081337, 0.02302658185362816, 0.023648099973797798, 0.024269618093967438, 0.024891136214137077, 0.025512654334306717, 0.026134172454476357, 0.026755690574645996, 0.027377206832170486, 0.027998724952340126, 0.028620243072509766, 0.029241761192679405, 0.029863279312849045, 0.030484797433018684, 0.031106315553188324, 0.031727831810712814, 0.0323493517935276, 0.032970868051052094, 0.033592384308576584, 0.03421390429139137, 0.03483542054891586, 0.03545694053173065, 0.03607845678925514, 0.03669997677206993, 0.03732149302959442, 0.03794301301240921]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 9.0, 7.0, 13.0, 29.0, 30.0, 30.0, 46.0, 55.0, 50.0, 84.0, 73.0, 79.0, 108.0, 66.0, 85.0, 63.0, 53.0, 42.0, 35.0, 24.0, 10.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.002049744129180908, -0.002006715163588524, -0.0019636861979961395, -0.0019206572324037552, -0.0018776282668113708, -0.0018345993012189865, -0.0017915703356266022, -0.0017485413700342178, -0.0017055124044418335, -0.0016624834388494492, -0.0016194544732570648, -0.0015764255076646805, -0.0015333965420722961, -0.0014903675764799118, -0.0014473386108875275, -0.0014043096452951431, -0.0013612806797027588, -0.0013182517141103745, -0.0012752227485179901, -0.0012321937829256058, -0.0011891648173332214, -0.001146135851740837, -0.0011031068861484528, -0.0010600779205560684, -0.001017048954963684, -0.0009740199893712997, -0.0009309910237789154, -0.0008879620581865311, -0.0008449330925941467, -0.0008019041270017624, -0.000758875161409378, -0.0007158461958169937, -0.0006728172302246094, -0.000629788264632225, -0.0005867592990398407, -0.0005437303334474564, -0.000500701367855072, -0.0004576724022626877, -0.00041464343667030334, -0.000371614471077919, -0.00032858550548553467, -0.00028555653989315033, -0.000242527574300766, -0.00019949860870838165, -0.00015646964311599731, -0.00011344067752361298, -7.041171193122864e-05, -2.73827463388443e-05, 1.564621925354004e-05, 5.867518484592438e-05, 0.00010170415043830872, 0.00014473311603069305, 0.0001877620816230774, 0.00023079104721546173, 0.00027382001280784607, 0.0003168489784002304, 0.00035987794399261475, 0.0004029069095849991, 0.0004459358751773834, 0.0004889648407697678, 0.0005319938063621521, 0.0005750227719545364, 0.0006180517375469208, 0.0006610807031393051, 0.0007041096687316895]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 6.0, 11.0, 10.0, 15.0, 14.0, 19.0, 30.0, 29.0, 30.0, 22.0, 28.0, 39.0, 53.0, 35.0, 44.0, 47.0, 42.0, 40.0, 50.0, 39.0, 45.0, 43.0, 37.0, 40.0, 42.0, 32.0, 27.0, 17.0, 18.0, 18.0, 12.0, 19.0, 8.0, 7.0, 6.0, 4.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.013580322265625, -2.90997314453125, -2.806365966796875, -2.7027587890625, -2.599151611328125, -2.49554443359375, -2.391937255859375, -2.288330078125, -2.184722900390625, -2.08111572265625, -1.977508544921875, -1.8739013671875, -1.770294189453125, -1.66668701171875, -1.563079833984375, -1.45947265625, -1.355865478515625, -1.25225830078125, -1.148651123046875, -1.0450439453125, -0.941436767578125, -0.83782958984375, -0.734222412109375, -0.630615234375, -0.527008056640625, -0.42340087890625, -0.319793701171875, -0.2161865234375, -0.112579345703125, -0.00897216796875, 0.094635009765625, 0.1982421875, 0.301849365234375, 0.40545654296875, 0.509063720703125, 0.6126708984375, 0.716278076171875, 0.81988525390625, 0.923492431640625, 1.027099609375, 1.130706787109375, 1.23431396484375, 1.337921142578125, 1.4415283203125, 1.545135498046875, 1.64874267578125, 1.752349853515625, 1.85595703125, 1.959564208984375, 2.06317138671875, 2.166778564453125, 2.2703857421875, 2.373992919921875, 2.47760009765625, 2.581207275390625, 2.684814453125, 2.788421630859375, 2.89202880859375, 2.995635986328125, 3.0992431640625, 3.202850341796875, 3.30645751953125, 3.410064697265625, 3.513671875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 8.0, 19.0, 21.0, 43.0, 61.0, 118.0, 154.0, 265.0, 454.0, 751.0, 1355.0, 2515.0, 4702.0, 9846.0, 22616.0, 57395.0, 176433.0, 428822.0, 223002.0, 69928.0, 26697.0, 11492.0, 5494.0, 2769.0, 1478.0, 782.0, 526.0, 282.0, 178.0, 116.0, 62.0, 56.0, 32.0, 22.0, 18.0, 9.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.91058349609375, -5.7235107421875, -5.53643798828125, -5.349365234375, -5.16229248046875, -4.9752197265625, -4.78814697265625, -4.60107421875, -4.41400146484375, -4.2269287109375, -4.03985595703125, -3.852783203125, -3.66571044921875, -3.4786376953125, -3.29156494140625, -3.1044921875, -2.91741943359375, -2.7303466796875, -2.54327392578125, -2.356201171875, -2.16912841796875, -1.9820556640625, -1.79498291015625, -1.60791015625, -1.42083740234375, -1.2337646484375, -1.04669189453125, -0.859619140625, -0.67254638671875, -0.4854736328125, -0.29840087890625, -0.111328125, 0.07574462890625, 0.2628173828125, 0.44989013671875, 0.636962890625, 0.82403564453125, 1.0111083984375, 1.19818115234375, 1.38525390625, 1.57232666015625, 1.7593994140625, 1.94647216796875, 2.133544921875, 2.32061767578125, 2.5076904296875, 2.69476318359375, 2.8818359375, 3.06890869140625, 3.2559814453125, 3.44305419921875, 3.630126953125, 3.81719970703125, 4.0042724609375, 4.19134521484375, 4.37841796875, 4.56549072265625, 4.7525634765625, 4.93963623046875, 5.126708984375, 5.31378173828125, 5.5008544921875, 5.68792724609375, 5.875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 8.0, 9.0, 15.0, 12.0, 13.0, 16.0, 24.0, 28.0, 23.0, 34.0, 43.0, 51.0, 52.0, 73.0, 119.0, 171.0, 1339.0, 330.0, 175.0, 111.0, 70.0, 61.0, 42.0, 41.0, 20.0, 32.0, 28.0, 18.0, 12.0, 20.0, 13.0, 7.0, 8.0, 8.0, 2.0, 6.0, 0.0, 2.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9466552734375, -10.604248046875, -10.2618408203125, -9.91943359375, -9.5770263671875, -9.234619140625, -8.8922119140625, -8.5498046875, -8.2073974609375, -7.864990234375, -7.5225830078125, -7.18017578125, -6.8377685546875, -6.495361328125, -6.1529541015625, -5.810546875, -5.4681396484375, -5.125732421875, -4.7833251953125, -4.44091796875, -4.0985107421875, -3.756103515625, -3.4136962890625, -3.0712890625, -2.7288818359375, -2.386474609375, -2.0440673828125, -1.70166015625, -1.3592529296875, -1.016845703125, -0.6744384765625, -0.33203125, 0.0103759765625, 0.352783203125, 0.6951904296875, 1.03759765625, 1.3800048828125, 1.722412109375, 2.0648193359375, 2.4072265625, 2.7496337890625, 3.092041015625, 3.4344482421875, 3.77685546875, 4.1192626953125, 4.461669921875, 4.8040771484375, 5.146484375, 5.4888916015625, 5.831298828125, 6.1737060546875, 6.51611328125, 6.8585205078125, 7.200927734375, 7.5433349609375, 7.8857421875, 8.2281494140625, 8.570556640625, 8.9129638671875, 9.25537109375, 9.5977783203125, 9.940185546875, 10.2825927734375, 10.625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 11.0, 11.0, 4.0, 14.0, 22.0, 28.0, 41.0, 38.0, 54.0, 71.0, 107.0, 165.0, 228.0, 463.0, 1219.0, 3885.0, 25041.0, 782205.0, 2262337.0, 60165.0, 6404.0, 1626.0, 618.0, 306.0, 183.0, 120.0, 73.0, 65.0, 44.0, 35.0, 19.0, 22.0, 21.0, 14.0, 13.0, 9.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.07373046875, -15.5224609375, -14.97119140625, -14.419921875, -13.86865234375, -13.3173828125, -12.76611328125, -12.21484375, -11.66357421875, -11.1123046875, -10.56103515625, -10.009765625, -9.45849609375, -8.9072265625, -8.35595703125, -7.8046875, -7.25341796875, -6.7021484375, -6.15087890625, -5.599609375, -5.04833984375, -4.4970703125, -3.94580078125, -3.39453125, -2.84326171875, -2.2919921875, -1.74072265625, -1.189453125, -0.63818359375, -0.0869140625, 0.46435546875, 1.015625, 1.56689453125, 2.1181640625, 2.66943359375, 3.220703125, 3.77197265625, 4.3232421875, 4.87451171875, 5.42578125, 5.97705078125, 6.5283203125, 7.07958984375, 7.630859375, 8.18212890625, 8.7333984375, 9.28466796875, 9.8359375, 10.38720703125, 10.9384765625, 11.48974609375, 12.041015625, 12.59228515625, 13.1435546875, 13.69482421875, 14.24609375, 14.79736328125, 15.3486328125, 15.89990234375, 16.451171875, 17.00244140625, 17.5537109375, 18.10498046875, 18.65625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 13.0, 325.0, 639.0, 42.0, 1.0], "bins": [-458.5304870605469, -451.0351867675781, -443.5398864746094, -436.0445556640625, -428.54925537109375, -421.053955078125, -413.55865478515625, -406.0633239746094, -398.5680236816406, -391.0727233886719, -383.5774230957031, -376.08209228515625, -368.5867919921875, -361.09149169921875, -353.59619140625, -346.1008605957031, -338.6055603027344, -331.1102600097656, -323.6149597167969, -316.11962890625, -308.62432861328125, -301.1290283203125, -293.63372802734375, -286.1383972167969, -278.6430969238281, -271.1477966308594, -263.6524963378906, -256.15716552734375, -248.661865234375, -241.16656494140625, -233.67124938964844, -226.1759490966797, -218.68063354492188, -211.18533325195312, -203.6900177001953, -196.19471740722656, -188.69940185546875, -181.2041015625, -173.7087860107422, -166.21348571777344, -158.7181854248047, -151.22288513183594, -143.72756958007812, -136.23226928710938, -128.73695373535156, -121.24165344238281, -113.746337890625, -106.25103759765625, -98.75572204589844, -91.26041412353516, -83.76510620117188, -76.2697982788086, -68.77449035644531, -61.2791862487793, -53.783878326416016, -46.288570404052734, -38.79326248168945, -31.297954559326172, -23.80264663696289, -16.307340621948242, -8.812032699584961, -1.3167266845703125, 6.178581237792969, 13.67388916015625, 21.16919708251953]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 5.0, 12.0, 18.0, 16.0, 17.0, 18.0, 20.0, 19.0, 33.0, 37.0, 38.0, 39.0, 45.0, 41.0, 58.0, 40.0, 45.0, 38.0, 39.0, 33.0, 51.0, 32.0, 32.0, 31.0, 30.0, 25.0, 27.0, 23.0, 32.0, 18.0, 12.0, 17.0, 11.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.43394470214844, -32.4145393371582, -31.395137786865234, -30.375734329223633, -29.35633087158203, -28.336925506591797, -27.317522048950195, -26.298118591308594, -25.278715133666992, -24.25931167602539, -23.23990821838379, -22.220504760742188, -21.201099395751953, -20.181697845458984, -19.16229248046875, -18.14288902282715, -17.123485565185547, -16.104082107543945, -15.084678649902344, -14.065274238586426, -13.045870780944824, -12.026467323303223, -11.007062911987305, -9.987659454345703, -8.968255996704102, -7.9488525390625, -6.92944860458374, -5.9100446701049805, -4.890641212463379, -3.8712377548217773, -2.8518338203430176, -1.8324298858642578, -0.8130302429199219, 0.2063734531402588, 1.2257771492004395, 2.24518084526062, 3.264584541320801, 4.283987998962402, 5.303391933441162, 6.322795867919922, 7.342199325561523, 8.361602783203125, 9.381006240844727, 10.400410652160645, 11.419814109802246, 12.439217567443848, 13.458621978759766, 14.478025436401367, 15.497428894042969, 16.51683235168457, 17.536235809326172, 18.555639266967773, 19.575042724609375, 20.59444808959961, 21.61385154724121, 22.633255004882812, 23.652658462524414, 24.672061920166016, 25.691465377807617, 26.71086883544922, 27.730274200439453, 28.749675750732422, 29.769081115722656, 30.788484573364258, 31.80788803100586]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 4.0, 9.0, 11.0, 6.0, 6.0, 15.0, 12.0, 20.0, 17.0, 22.0, 28.0, 27.0, 30.0, 38.0, 25.0, 40.0, 45.0, 44.0, 51.0, 45.0, 36.0, 39.0, 51.0, 46.0, 36.0, 35.0, 41.0, 38.0, 37.0, 26.0, 20.0, 18.0, 17.0, 13.0, 12.0, 10.0, 7.0, 6.0, 10.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.404296875, -3.298065185546875, -3.19183349609375, -3.085601806640625, -2.9793701171875, -2.873138427734375, -2.76690673828125, -2.660675048828125, -2.554443359375, -2.448211669921875, -2.34197998046875, -2.235748291015625, -2.1295166015625, -2.023284912109375, -1.91705322265625, -1.810821533203125, -1.70458984375, -1.598358154296875, -1.49212646484375, -1.385894775390625, -1.2796630859375, -1.173431396484375, -1.06719970703125, -0.960968017578125, -0.854736328125, -0.748504638671875, -0.64227294921875, -0.536041259765625, -0.4298095703125, -0.323577880859375, -0.21734619140625, -0.111114501953125, -0.0048828125, 0.101348876953125, 0.20758056640625, 0.313812255859375, 0.4200439453125, 0.526275634765625, 0.63250732421875, 0.738739013671875, 0.844970703125, 0.951202392578125, 1.05743408203125, 1.163665771484375, 1.2698974609375, 1.376129150390625, 1.48236083984375, 1.588592529296875, 1.69482421875, 1.801055908203125, 1.90728759765625, 2.013519287109375, 2.1197509765625, 2.225982666015625, 2.33221435546875, 2.438446044921875, 2.544677734375, 2.650909423828125, 2.75714111328125, 2.863372802734375, 2.9696044921875, 3.075836181640625, 3.18206787109375, 3.288299560546875, 3.39453125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 6.0, 9.0, 12.0, 24.0, 47.0, 56.0, 97.0, 169.0, 234.0, 452.0, 883.0, 1849.0, 3893.0, 10331.0, 37207.0, 369706.0, 2999431.0, 692840.0, 55603.0, 12653.0, 4565.0, 2034.0, 1001.0, 489.0, 259.0, 153.0, 95.0, 67.0, 29.0, 28.0, 17.0, 17.0, 5.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53125, -11.1776123046875, -10.823974609375, -10.4703369140625, -10.11669921875, -9.7630615234375, -9.409423828125, -9.0557861328125, -8.7021484375, -8.3485107421875, -7.994873046875, -7.6412353515625, -7.28759765625, -6.9339599609375, -6.580322265625, -6.2266845703125, -5.873046875, -5.5194091796875, -5.165771484375, -4.8121337890625, -4.45849609375, -4.1048583984375, -3.751220703125, -3.3975830078125, -3.0439453125, -2.6903076171875, -2.336669921875, -1.9830322265625, -1.62939453125, -1.2757568359375, -0.922119140625, -0.5684814453125, -0.21484375, 0.1387939453125, 0.492431640625, 0.8460693359375, 1.19970703125, 1.5533447265625, 1.906982421875, 2.2606201171875, 2.6142578125, 2.9678955078125, 3.321533203125, 3.6751708984375, 4.02880859375, 4.3824462890625, 4.736083984375, 5.0897216796875, 5.443359375, 5.7969970703125, 6.150634765625, 6.5042724609375, 6.85791015625, 7.2115478515625, 7.565185546875, 7.9188232421875, 8.2724609375, 8.6260986328125, 8.979736328125, 9.3333740234375, 9.68701171875, 10.0406494140625, 10.394287109375, 10.7479248046875, 11.1015625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 12.0, 20.0, 31.0, 40.0, 64.0, 123.0, 151.0, 277.0, 453.0, 713.0, 794.0, 557.0, 358.0, 201.0, 105.0, 63.0, 41.0, 17.0, 23.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.203125, -11.845703125, -11.48828125, -11.130859375, -10.7734375, -10.416015625, -10.05859375, -9.701171875, -9.34375, -8.986328125, -8.62890625, -8.271484375, -7.9140625, -7.556640625, -7.19921875, -6.841796875, -6.484375, -6.126953125, -5.76953125, -5.412109375, -5.0546875, -4.697265625, -4.33984375, -3.982421875, -3.625, -3.267578125, -2.91015625, -2.552734375, -2.1953125, -1.837890625, -1.48046875, -1.123046875, -0.765625, -0.408203125, -0.05078125, 0.306640625, 0.6640625, 1.021484375, 1.37890625, 1.736328125, 2.09375, 2.451171875, 2.80859375, 3.166015625, 3.5234375, 3.880859375, 4.23828125, 4.595703125, 4.953125, 5.310546875, 5.66796875, 6.025390625, 6.3828125, 6.740234375, 7.09765625, 7.455078125, 7.8125, 8.169921875, 8.52734375, 8.884765625, 9.2421875, 9.599609375, 9.95703125, 10.314453125, 10.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 20.0, 25.0, 38.0, 67.0, 159.0, 255.0, 792.0, 2887.0, 28037.0, 3335165.0, 811808.0, 12016.0, 1859.0, 553.0, 277.0, 126.0, 69.0, 45.0, 27.0, 13.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.9375, -31.7958984375, -30.654296875, -29.5126953125, -28.37109375, -27.2294921875, -26.087890625, -24.9462890625, -23.8046875, -22.6630859375, -21.521484375, -20.3798828125, -19.23828125, -18.0966796875, -16.955078125, -15.8134765625, -14.671875, -13.5302734375, -12.388671875, -11.2470703125, -10.10546875, -8.9638671875, -7.822265625, -6.6806640625, -5.5390625, -4.3974609375, -3.255859375, -2.1142578125, -0.97265625, 0.1689453125, 1.310546875, 2.4521484375, 3.59375, 4.7353515625, 5.876953125, 7.0185546875, 8.16015625, 9.3017578125, 10.443359375, 11.5849609375, 12.7265625, 13.8681640625, 15.009765625, 16.1513671875, 17.29296875, 18.4345703125, 19.576171875, 20.7177734375, 21.859375, 23.0009765625, 24.142578125, 25.2841796875, 26.42578125, 27.5673828125, 28.708984375, 29.8505859375, 30.9921875, 32.1337890625, 33.275390625, 34.4169921875, 35.55859375, 36.7001953125, 37.841796875, 38.9833984375, 40.125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 10.0, 16.0, 20.0, 25.0, 38.0, 54.0, 76.0, 95.0, 108.0, 113.0, 90.0, 90.0, 73.0, 61.0, 35.0, 34.0, 17.0, 13.0, 8.0, 13.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78776168823242, -36.51385498046875, -35.23994445800781, -33.96603775024414, -32.69213104248047, -31.418222427368164, -30.14431381225586, -28.870407104492188, -27.596500396728516, -26.32259178161621, -25.04868507385254, -23.774776458740234, -22.500869750976562, -21.226961135864258, -19.953052520751953, -18.67914581298828, -17.405237197875977, -16.131328582763672, -14.857421875, -13.583513259887695, -12.309606552124023, -11.035697937011719, -9.76179027557373, -8.487882614135742, -7.213974952697754, -5.940067291259766, -4.666159629821777, -3.392251491546631, -2.1183438301086426, -0.8444361686706543, 0.4294719696044922, 1.7033796310424805, 2.9772872924804688, 4.251194953918457, 5.525102615356445, 6.799010753631592, 8.072917938232422, 9.346826553344727, 10.620734214782715, 11.894641876220703, 13.168549537658691, 14.44245719909668, 15.716364860534668, 16.990272521972656, 18.26418113708496, 19.538087844848633, 20.811996459960938, 22.08590316772461, 23.359811782836914, 24.63372039794922, 25.90762710571289, 27.181535720825195, 28.455442428588867, 29.729351043701172, 31.003257751464844, 32.27716827392578, 33.55107498168945, 34.824981689453125, 36.09889221191406, 37.372798919677734, 38.646705627441406, 39.92061233520508, 41.194522857666016, 42.46842956542969, 43.74233627319336]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 5.0, 7.0, 15.0, 6.0, 15.0, 13.0, 22.0, 18.0, 28.0, 28.0, 21.0, 25.0, 28.0, 35.0, 25.0, 46.0, 35.0, 33.0, 33.0, 47.0, 39.0, 30.0, 34.0, 30.0, 32.0, 35.0, 37.0, 32.0, 31.0, 26.0, 28.0, 17.0, 22.0, 18.0, 13.0, 7.0, 18.0, 10.0, 13.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 6.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-20.617080688476562, -19.964778900146484, -19.312477111816406, -18.660175323486328, -18.00787353515625, -17.355571746826172, -16.703269958496094, -16.050968170166016, -15.398666381835938, -14.74636459350586, -14.094062805175781, -13.441761016845703, -12.789459228515625, -12.137157440185547, -11.484855651855469, -10.83255386352539, -10.180252075195312, -9.527950286865234, -8.875648498535156, -8.223346710205078, -7.571044921875, -6.918743133544922, -6.266441345214844, -5.614139556884766, -4.9618377685546875, -4.309535980224609, -3.6572341918945312, -3.004932403564453, -2.352630615234375, -1.7003288269042969, -1.0480270385742188, -0.3957252502441406, 0.2565765380859375, 0.9088783264160156, 1.5611801147460938, 2.213481903076172, 2.86578369140625, 3.518085479736328, 4.170387268066406, 4.822689056396484, 5.4749908447265625, 6.127292633056641, 6.779594421386719, 7.431896209716797, 8.084197998046875, 8.736499786376953, 9.388801574707031, 10.04110336303711, 10.693405151367188, 11.345706939697266, 11.998008728027344, 12.650310516357422, 13.3026123046875, 13.954914093017578, 14.607215881347656, 15.259517669677734, 15.911819458007812, 16.56412124633789, 17.21642303466797, 17.868724822998047, 18.521026611328125, 19.173328399658203, 19.82563018798828, 20.47793197631836, 21.130233764648438]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 5.0, 7.0, 3.0, 12.0, 5.0, 10.0, 9.0, 14.0, 14.0, 18.0, 18.0, 28.0, 26.0, 30.0, 30.0, 37.0, 37.0, 39.0, 38.0, 54.0, 38.0, 39.0, 44.0, 47.0, 38.0, 41.0, 38.0, 33.0, 36.0, 35.0, 28.0, 28.0, 23.0, 13.0, 15.0, 17.0, 13.0, 9.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.5078125, -3.403350830078125, -3.29888916015625, -3.194427490234375, -3.0899658203125, -2.985504150390625, -2.88104248046875, -2.776580810546875, -2.672119140625, -2.567657470703125, -2.46319580078125, -2.358734130859375, -2.2542724609375, -2.149810791015625, -2.04534912109375, -1.940887451171875, -1.83642578125, -1.731964111328125, -1.62750244140625, -1.523040771484375, -1.4185791015625, -1.314117431640625, -1.20965576171875, -1.105194091796875, -1.000732421875, -0.896270751953125, -0.79180908203125, -0.687347412109375, -0.5828857421875, -0.478424072265625, -0.37396240234375, -0.269500732421875, -0.1650390625, -0.060577392578125, 0.04388427734375, 0.148345947265625, 0.2528076171875, 0.357269287109375, 0.46173095703125, 0.566192626953125, 0.670654296875, 0.775115966796875, 0.87957763671875, 0.984039306640625, 1.0885009765625, 1.192962646484375, 1.29742431640625, 1.401885986328125, 1.50634765625, 1.610809326171875, 1.71527099609375, 1.819732666015625, 1.9241943359375, 2.028656005859375, 2.13311767578125, 2.237579345703125, 2.342041015625, 2.446502685546875, 2.55096435546875, 2.655426025390625, 2.7598876953125, 2.864349365234375, 2.96881103515625, 3.073272705078125, 3.177734375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 12.0, 16.0, 37.0, 44.0, 65.0, 65.0, 139.0, 199.0, 267.0, 428.0, 615.0, 857.0, 1327.0, 2132.0, 3340.0, 5147.0, 8506.0, 13864.0, 23269.0, 40812.0, 74616.0, 159974.0, 372954.0, 162192.0, 75524.0, 41149.0, 23777.0, 13865.0, 8476.0, 5177.0, 3396.0, 2109.0, 1424.0, 939.0, 560.0, 405.0, 310.0, 178.0, 105.0, 100.0, 63.0, 34.0, 34.0, 19.0, 14.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19729995727539062, -0.19123077392578125, -0.18516159057617188, -0.1790924072265625, -0.17302322387695312, -0.16695404052734375, -0.16088485717773438, -0.154815673828125, -0.14874649047851562, -0.14267730712890625, -0.13660812377929688, -0.1305389404296875, -0.12446975708007812, -0.11840057373046875, -0.11233139038085938, -0.10626220703125, -0.10019302368164062, -0.09412384033203125, -0.08805465698242188, -0.0819854736328125, -0.07591629028320312, -0.06984710693359375, -0.06377792358398438, -0.057708740234375, -0.051639556884765625, -0.04557037353515625, -0.039501190185546875, -0.0334320068359375, -0.027362823486328125, -0.02129364013671875, -0.015224456787109375, -0.0091552734375, -0.003086090087890625, 0.00298309326171875, 0.009052276611328125, 0.0151214599609375, 0.021190643310546875, 0.02725982666015625, 0.033329010009765625, 0.039398193359375, 0.045467376708984375, 0.05153656005859375, 0.057605743408203125, 0.0636749267578125, 0.06974411010742188, 0.07581329345703125, 0.08188247680664062, 0.08795166015625, 0.09402084350585938, 0.10009002685546875, 0.10615921020507812, 0.1122283935546875, 0.11829757690429688, 0.12436676025390625, 0.13043594360351562, 0.136505126953125, 0.14257431030273438, 0.14864349365234375, 0.15471267700195312, 0.1607818603515625, 0.16685104370117188, 0.17292022705078125, 0.17898941040039062, 0.18505859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 10.0, 4.0, 11.0, 7.0, 19.0, 16.0, 23.0, 27.0, 20.0, 22.0, 31.0, 30.0, 28.0, 33.0, 32.0, 31.0, 44.0, 31.0, 39.0, 1070.0, 44.0, 51.0, 33.0, 43.0, 40.0, 35.0, 29.0, 30.0, 34.0, 27.0, 19.0, 15.0, 15.0, 14.0, 9.0, 15.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.811279296875, -2.72412109375, -2.636962890625, -2.5498046875, -2.462646484375, -2.37548828125, -2.288330078125, -2.201171875, -2.114013671875, -2.02685546875, -1.939697265625, -1.8525390625, -1.765380859375, -1.67822265625, -1.591064453125, -1.50390625, -1.416748046875, -1.32958984375, -1.242431640625, -1.1552734375, -1.068115234375, -0.98095703125, -0.893798828125, -0.806640625, -0.719482421875, -0.63232421875, -0.545166015625, -0.4580078125, -0.370849609375, -0.28369140625, -0.196533203125, -0.109375, -0.022216796875, 0.06494140625, 0.152099609375, 0.2392578125, 0.326416015625, 0.41357421875, 0.500732421875, 0.587890625, 0.675048828125, 0.76220703125, 0.849365234375, 0.9365234375, 1.023681640625, 1.11083984375, 1.197998046875, 1.28515625, 1.372314453125, 1.45947265625, 1.546630859375, 1.6337890625, 1.720947265625, 1.80810546875, 1.895263671875, 1.982421875, 2.069580078125, 2.15673828125, 2.243896484375, 2.3310546875, 2.418212890625, 2.50537109375, 2.592529296875, 2.6796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 2.0, 10.0, 6.0, 14.0, 20.0, 36.0, 46.0, 58.0, 92.0, 107.0, 200.0, 283.0, 372.0, 569.0, 801.0, 1213.0, 1775.0, 2722.0, 4082.0, 6403.0, 9795.0, 15047.0, 23948.0, 37636.0, 62233.0, 113683.0, 520384.0, 1008119.0, 116570.0, 63608.0, 38210.0, 24113.0, 15651.0, 9924.0, 6619.0, 4262.0, 2808.0, 1921.0, 1191.0, 820.0, 547.0, 394.0, 261.0, 184.0, 124.0, 85.0, 64.0, 29.0, 30.0, 20.0, 19.0, 9.0, 10.0, 3.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.06573486328125, -0.06374406814575195, -0.061753273010253906, -0.05976247787475586, -0.05777168273925781, -0.055780887603759766, -0.05379009246826172, -0.05179929733276367, -0.049808502197265625, -0.04781770706176758, -0.04582691192626953, -0.043836116790771484, -0.04184532165527344, -0.03985452651977539, -0.037863731384277344, -0.0358729362487793, -0.03388214111328125, -0.0318913459777832, -0.029900550842285156, -0.02790975570678711, -0.025918960571289062, -0.023928165435791016, -0.02193737030029297, -0.019946575164794922, -0.017955780029296875, -0.015964984893798828, -0.013974189758300781, -0.011983394622802734, -0.009992599487304688, -0.00800180435180664, -0.006011009216308594, -0.004020214080810547, -0.0020294189453125, -3.8623809814453125e-05, 0.0019521713256835938, 0.003942966461181641, 0.0059337615966796875, 0.007924556732177734, 0.009915351867675781, 0.011906147003173828, 0.013896942138671875, 0.015887737274169922, 0.01787853240966797, 0.019869327545166016, 0.021860122680664062, 0.02385091781616211, 0.025841712951660156, 0.027832508087158203, 0.02982330322265625, 0.0318140983581543, 0.033804893493652344, 0.03579568862915039, 0.03778648376464844, 0.039777278900146484, 0.04176807403564453, 0.04375886917114258, 0.045749664306640625, 0.04774045944213867, 0.04973125457763672, 0.051722049713134766, 0.05371284484863281, 0.05570363998413086, 0.057694435119628906, 0.05968523025512695, 0.061676025390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 6.0, 8.0, 18.0, 15.0, 19.0, 24.0, 19.0, 32.0, 30.0, 59.0, 29.0, 50.0, 66.0, 106.0, 79.0, 65.0, 50.0, 43.0, 44.0, 36.0, 34.0, 26.0, 22.0, 20.0, 12.0, 9.0, 12.0, 3.0, 7.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007395744323730469, -0.0007162019610404968, -0.0006928294897079468, -0.0006694570183753967, -0.0006460845470428467, -0.0006227120757102966, -0.0005993396043777466, -0.0005759671330451965, -0.0005525946617126465, -0.0005292221903800964, -0.0005058497190475464, -0.00048247724771499634, -0.0004591047763824463, -0.00043573230504989624, -0.0004123598337173462, -0.00038898736238479614, -0.0003656148910522461, -0.00034224241971969604, -0.000318869948387146, -0.00029549747705459595, -0.0002721250057220459, -0.00024875253438949585, -0.0002253800630569458, -0.00020200759172439575, -0.0001786351203918457, -0.00015526264905929565, -0.0001318901777267456, -0.00010851770639419556, -8.514523506164551e-05, -6.177276372909546e-05, -3.840029239654541e-05, -1.5027821063995361e-05, 8.344650268554688e-06, 3.1717121601104736e-05, 5.5089592933654785e-05, 7.846206426620483e-05, 0.00010183453559875488, 0.00012520700693130493, 0.00014857947826385498, 0.00017195194959640503, 0.00019532442092895508, 0.00021869689226150513, 0.00024206936359405518, 0.0002654418349266052, 0.0002888143062591553, 0.0003121867775917053, 0.00033555924892425537, 0.0003589317202568054, 0.00038230419158935547, 0.0004056766629219055, 0.00042904913425445557, 0.0004524216055870056, 0.00047579407691955566, 0.0004991665482521057, 0.0005225390195846558, 0.0005459114909172058, 0.0005692839622497559, 0.0005926564335823059, 0.000616028904914856, 0.000639401376247406, 0.0006627738475799561, 0.0006861463189125061, 0.0007095187902450562, 0.0007328912615776062, 0.0007562637329101562]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 9.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 10.0, 12.0, 29.0, 33.0, 39.0, 49.0, 74.0, 105.0, 185.0, 581.0, 4876.0, 102722.0, 905777.0, 31211.0, 2026.0, 346.0, 146.0, 75.0, 62.0, 40.0, 28.0, 20.0, 16.0, 11.0, 10.0, 4.0, 12.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.0151519775390625, -0.014683246612548828, -0.014214515686035156, -0.013745784759521484, -0.013277053833007812, -0.01280832290649414, -0.012339591979980469, -0.011870861053466797, -0.011402130126953125, -0.010933399200439453, -0.010464668273925781, -0.00999593734741211, -0.009527206420898438, -0.009058475494384766, -0.008589744567871094, -0.008121013641357422, -0.00765228271484375, -0.007183551788330078, -0.006714820861816406, -0.006246089935302734, -0.0057773590087890625, -0.005308628082275391, -0.004839897155761719, -0.004371166229248047, -0.003902435302734375, -0.003433704376220703, -0.0029649734497070312, -0.0024962425231933594, -0.0020275115966796875, -0.0015587806701660156, -0.0010900497436523438, -0.0006213188171386719, -0.000152587890625, 0.0003161430358886719, 0.0007848739624023438, 0.0012536048889160156, 0.0017223358154296875, 0.0021910667419433594, 0.0026597976684570312, 0.003128528594970703, 0.003597259521484375, 0.004065990447998047, 0.004534721374511719, 0.005003452301025391, 0.0054721832275390625, 0.005940914154052734, 0.006409645080566406, 0.006878376007080078, 0.00734710693359375, 0.007815837860107422, 0.008284568786621094, 0.008753299713134766, 0.009222030639648438, 0.00969076156616211, 0.010159492492675781, 0.010628223419189453, 0.011096954345703125, 0.011565685272216797, 0.012034416198730469, 0.01250314712524414, 0.012971878051757812, 0.013440608978271484, 0.013909339904785156, 0.014378070831298828, 0.0148468017578125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 58.0, 937.0, 21.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020125017035752535, -0.0014199453871697187, -0.0008273891871795058, -0.0002348329871892929, 0.00035772332921624184, 0.0009502796456217766, 0.0015428357291966677, 0.0021353920456022024, 0.002727948362007737, 0.003320504678413272, 0.003913060761988163, 0.004505617078393698, 0.0050981733947992325, 0.005690729711204767, 0.006283286027610302, 0.006875841878354549, 0.0074683986604213715, 0.008060954511165619, 0.008653511293232441, 0.009246067143976688, 0.00983862392604351, 0.010431179776787758, 0.011023735627532005, 0.011616292409598827, 0.012208848260343075, 0.012801404111087322, 0.013393960893154144, 0.013986516743898392, 0.014579073525965214, 0.015171629376709461, 0.015764186158776283, 0.01635674200952053, 0.016949297860264778, 0.017541853711009026, 0.018134409561753273, 0.01872696727514267, 0.019319523125886917, 0.019912078976631165, 0.020504634827375412, 0.02109719067811966, 0.021689748391509056, 0.022282304242253304, 0.02287486009299755, 0.023467417806386948, 0.024059973657131195, 0.024652529507875443, 0.02524508535861969, 0.025837641209363937, 0.026430197060108185, 0.027022752910852432, 0.02761530876159668, 0.028207866474986076, 0.028800422325730324, 0.02939297817647457, 0.02998553402721882, 0.030578091740608215, 0.031170647591352463, 0.03176320344209671, 0.03235575929284096, 0.032948315143585205, 0.03354087099432945, 0.034133430570364, 0.034725986421108246, 0.03531854227185249, 0.03591109812259674]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 11.0, 22.0, 25.0, 40.0, 59.0, 79.0, 65.0, 105.0, 103.0, 84.0, 94.0, 88.0, 64.0, 49.0, 52.0, 21.0, 15.0, 7.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018720626831054688, -0.0018301485106348991, -0.0017882343381643295, -0.00174632016569376, -0.0017044059932231903, -0.0016624918207526207, -0.001620577648282051, -0.0015786634758114815, -0.0015367493033409119, -0.0014948351308703423, -0.0014529209583997726, -0.001411006785929203, -0.0013690926134586334, -0.0013271784409880638, -0.0012852642685174942, -0.0012433500960469246, -0.001201435923576355, -0.0011595217511057854, -0.0011176075786352158, -0.0010756934061646461, -0.0010337792336940765, -0.000991865061223507, -0.0009499508887529373, -0.0009080367162823677, -0.0008661225438117981, -0.0008242083713412285, -0.0007822941988706589, -0.0007403800264000893, -0.0006984658539295197, -0.00065655168145895, -0.0006146375089883804, -0.0005727233365178108, -0.0005308091640472412, -0.0004888949915766716, -0.000446980819106102, -0.0004050666466355324, -0.00036315247416496277, -0.00032123830169439316, -0.00027932412922382355, -0.00023740995675325394, -0.00019549578428268433, -0.00015358161181211472, -0.0001116674393415451, -6.97532668709755e-05, -2.7839094400405884e-05, 1.4075078070163727e-05, 5.598925054073334e-05, 9.790342301130295e-05, 0.00013981759548187256, 0.00018173176795244217, 0.00022364594042301178, 0.0002655601128935814, 0.000307474285364151, 0.0003493884578347206, 0.0003913026303052902, 0.00043321680277585983, 0.00047513097524642944, 0.000517045147716999, 0.0005589593201875687, 0.0006008734926581383, 0.0006427876651287079, 0.0006847018375992775, 0.0007266160100698471, 0.0007685301825404167, 0.0008104443550109863]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 5.0, 7.0, 4.0, 11.0, 5.0, 10.0, 9.0, 14.0, 14.0, 18.0, 18.0, 28.0, 26.0, 30.0, 30.0, 37.0, 37.0, 39.0, 38.0, 54.0, 38.0, 39.0, 44.0, 47.0, 38.0, 41.0, 38.0, 33.0, 36.0, 35.0, 28.0, 28.0, 23.0, 13.0, 15.0, 17.0, 13.0, 9.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.5078125, -3.403350830078125, -3.29888916015625, -3.194427490234375, -3.0899658203125, -2.985504150390625, -2.88104248046875, -2.776580810546875, -2.672119140625, -2.567657470703125, -2.46319580078125, -2.358734130859375, -2.2542724609375, -2.149810791015625, -2.04534912109375, -1.940887451171875, -1.83642578125, -1.731964111328125, -1.62750244140625, -1.523040771484375, -1.4185791015625, -1.314117431640625, -1.20965576171875, -1.105194091796875, -1.000732421875, -0.896270751953125, -0.79180908203125, -0.687347412109375, -0.5828857421875, -0.478424072265625, -0.37396240234375, -0.269500732421875, -0.1650390625, -0.060577392578125, 0.04388427734375, 0.148345947265625, 0.2528076171875, 0.357269287109375, 0.46173095703125, 0.566192626953125, 0.670654296875, 0.775115966796875, 0.87957763671875, 0.984039306640625, 1.0885009765625, 1.192962646484375, 1.29742431640625, 1.401885986328125, 1.50634765625, 1.610809326171875, 1.71527099609375, 1.819732666015625, 1.9241943359375, 2.028656005859375, 2.13311767578125, 2.237579345703125, 2.342041015625, 2.446502685546875, 2.55096435546875, 2.655426025390625, 2.7598876953125, 2.864349365234375, 2.96881103515625, 3.073272705078125, 3.177734375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 13.0, 10.0, 15.0, 25.0, 27.0, 56.0, 80.0, 112.0, 186.0, 278.0, 418.0, 680.0, 1120.0, 1896.0, 3546.0, 6606.0, 14382.0, 34509.0, 93444.0, 308098.0, 389377.0, 117773.0, 41652.0, 16943.0, 7741.0, 3997.0, 2230.0, 1212.0, 776.0, 471.0, 304.0, 183.0, 121.0, 90.0, 61.0, 40.0, 30.0, 15.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.84765625, -6.62750244140625, -6.4073486328125, -6.18719482421875, -5.967041015625, -5.74688720703125, -5.5267333984375, -5.30657958984375, -5.08642578125, -4.86627197265625, -4.6461181640625, -4.42596435546875, -4.205810546875, -3.98565673828125, -3.7655029296875, -3.54534912109375, -3.3251953125, -3.10504150390625, -2.8848876953125, -2.66473388671875, -2.444580078125, -2.22442626953125, -2.0042724609375, -1.78411865234375, -1.56396484375, -1.34381103515625, -1.1236572265625, -0.90350341796875, -0.683349609375, -0.46319580078125, -0.2430419921875, -0.02288818359375, 0.197265625, 0.41741943359375, 0.6375732421875, 0.85772705078125, 1.077880859375, 1.29803466796875, 1.5181884765625, 1.73834228515625, 1.95849609375, 2.17864990234375, 2.3988037109375, 2.61895751953125, 2.839111328125, 3.05926513671875, 3.2794189453125, 3.49957275390625, 3.7197265625, 3.93988037109375, 4.1600341796875, 4.38018798828125, 4.600341796875, 4.82049560546875, 5.0406494140625, 5.26080322265625, 5.48095703125, 5.70111083984375, 5.9212646484375, 6.14141845703125, 6.361572265625, 6.58172607421875, 6.8018798828125, 7.02203369140625, 7.2421875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 7.0, 10.0, 6.0, 9.0, 8.0, 14.0, 17.0, 12.0, 24.0, 22.0, 29.0, 37.0, 20.0, 45.0, 41.0, 52.0, 61.0, 98.0, 135.0, 200.0, 1294.0, 218.0, 152.0, 94.0, 72.0, 55.0, 49.0, 41.0, 40.0, 30.0, 26.0, 29.0, 23.0, 16.0, 12.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-11.1796875, -10.85693359375, -10.5341796875, -10.21142578125, -9.888671875, -9.56591796875, -9.2431640625, -8.92041015625, -8.59765625, -8.27490234375, -7.9521484375, -7.62939453125, -7.306640625, -6.98388671875, -6.6611328125, -6.33837890625, -6.015625, -5.69287109375, -5.3701171875, -5.04736328125, -4.724609375, -4.40185546875, -4.0791015625, -3.75634765625, -3.43359375, -3.11083984375, -2.7880859375, -2.46533203125, -2.142578125, -1.81982421875, -1.4970703125, -1.17431640625, -0.8515625, -0.52880859375, -0.2060546875, 0.11669921875, 0.439453125, 0.76220703125, 1.0849609375, 1.40771484375, 1.73046875, 2.05322265625, 2.3759765625, 2.69873046875, 3.021484375, 3.34423828125, 3.6669921875, 3.98974609375, 4.3125, 4.63525390625, 4.9580078125, 5.28076171875, 5.603515625, 5.92626953125, 6.2490234375, 6.57177734375, 6.89453125, 7.21728515625, 7.5400390625, 7.86279296875, 8.185546875, 8.50830078125, 8.8310546875, 9.15380859375, 9.4765625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 4.0, 8.0, 9.0, 7.0, 4.0, 11.0, 17.0, 20.0, 23.0, 40.0, 56.0, 78.0, 102.0, 142.0, 233.0, 433.0, 933.0, 2373.0, 7585.0, 43016.0, 724148.0, 2235220.0, 110875.0, 13990.0, 3539.0, 1356.0, 566.0, 278.0, 183.0, 103.0, 82.0, 67.0, 44.0, 39.0, 25.0, 19.0, 20.0, 11.0, 9.0, 6.0, 10.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.115966796875, -15.54443359375, -14.972900390625, -14.4013671875, -13.829833984375, -13.25830078125, -12.686767578125, -12.115234375, -11.543701171875, -10.97216796875, -10.400634765625, -9.8291015625, -9.257568359375, -8.68603515625, -8.114501953125, -7.54296875, -6.971435546875, -6.39990234375, -5.828369140625, -5.2568359375, -4.685302734375, -4.11376953125, -3.542236328125, -2.970703125, -2.399169921875, -1.82763671875, -1.256103515625, -0.6845703125, -0.113037109375, 0.45849609375, 1.030029296875, 1.6015625, 2.173095703125, 2.74462890625, 3.316162109375, 3.8876953125, 4.459228515625, 5.03076171875, 5.602294921875, 6.173828125, 6.745361328125, 7.31689453125, 7.888427734375, 8.4599609375, 9.031494140625, 9.60302734375, 10.174560546875, 10.74609375, 11.317626953125, 11.88916015625, 12.460693359375, 13.0322265625, 13.603759765625, 14.17529296875, 14.746826171875, 15.318359375, 15.889892578125, 16.46142578125, 17.032958984375, 17.6044921875, 18.176025390625, 18.74755859375, 19.319091796875, 19.890625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 12.0, 34.0, 75.0, 212.0, 287.0, 246.0, 97.0, 34.0, 16.0, 3.0, 3.0], "bins": [-139.24452209472656, -136.82455444335938, -134.40460205078125, -131.98464965820312, -129.56468200683594, -127.14472198486328, -124.72476196289062, -122.30480194091797, -119.88484191894531, -117.46488189697266, -115.044921875, -112.62496185302734, -110.20500183105469, -107.78504180908203, -105.36508178710938, -102.94512176513672, -100.52516174316406, -98.1052017211914, -95.68524169921875, -93.2652816772461, -90.84532165527344, -88.42536163330078, -86.00540161132812, -83.58544158935547, -81.16548156738281, -78.74552154541016, -76.3255615234375, -73.90560150146484, -71.48564147949219, -69.06568145751953, -66.64572143554688, -64.22576141357422, -61.80579376220703, -59.385833740234375, -56.96587371826172, -54.54591369628906, -52.125953674316406, -49.70599365234375, -47.286033630371094, -44.86607360839844, -42.44611358642578, -40.026153564453125, -37.60619354248047, -35.18623352050781, -32.766273498535156, -30.3463134765625, -27.926353454589844, -25.506393432617188, -23.086435317993164, -20.666475296020508, -18.24651527404785, -15.826555252075195, -13.406595230102539, -10.986635208129883, -8.566675186157227, -6.14671516418457, -3.726755142211914, -1.3067951202392578, 1.1131649017333984, 3.5331249237060547, 5.953084945678711, 8.373044967651367, 10.793004989624023, 13.21296501159668, 15.632925033569336]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 4.0, 13.0, 13.0, 22.0, 20.0, 23.0, 22.0, 31.0, 23.0, 29.0, 30.0, 37.0, 44.0, 48.0, 50.0, 39.0, 39.0, 48.0, 42.0, 35.0, 37.0, 34.0, 43.0, 36.0, 31.0, 25.0, 28.0, 15.0, 22.0, 17.0, 19.0, 17.0, 14.0, 5.0, 7.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.509851455688477, -27.478479385375977, -26.447107315063477, -25.415735244750977, -24.384363174438477, -23.352991104125977, -22.321619033813477, -21.290246963500977, -20.258874893188477, -19.227502822875977, -18.196130752563477, -17.164758682250977, -16.133386611938477, -15.102014541625977, -14.070642471313477, -13.039270401000977, -12.007898330688477, -10.976526260375977, -9.945154190063477, -8.913782119750977, -7.882410049438477, -6.851037979125977, -5.819665908813477, -4.788293838500977, -3.7569217681884766, -2.7255496978759766, -1.6941776275634766, -0.6628055572509766, 0.36856651306152344, 1.3999385833740234, 2.4313106536865234, 3.4626827239990234, 4.494052886962891, 5.525424957275391, 6.556797027587891, 7.588169097900391, 8.61954116821289, 9.65091323852539, 10.68228530883789, 11.71365737915039, 12.74502944946289, 13.77640151977539, 14.80777359008789, 15.83914566040039, 16.87051773071289, 17.90188980102539, 18.93326187133789, 19.96463394165039, 20.99600601196289, 22.02737808227539, 23.05875015258789, 24.09012222290039, 25.12149429321289, 26.15286636352539, 27.18423843383789, 28.21561050415039, 29.24698257446289, 30.27835464477539, 31.30972671508789, 32.34109878540039, 33.37247085571289, 34.40384292602539, 35.43521499633789, 36.46658706665039, 37.49795913696289]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 5.0, 10.0, 6.0, 13.0, 18.0, 17.0, 17.0, 21.0, 22.0, 32.0, 33.0, 27.0, 32.0, 28.0, 44.0, 47.0, 44.0, 34.0, 46.0, 49.0, 39.0, 39.0, 44.0, 49.0, 31.0, 28.0, 28.0, 25.0, 28.0, 17.0, 25.0, 9.0, 9.0, 12.0, 18.0, 2.0, 9.0, 4.0, 3.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5546875, -3.44476318359375, -3.3348388671875, -3.22491455078125, -3.114990234375, -3.00506591796875, -2.8951416015625, -2.78521728515625, -2.67529296875, -2.56536865234375, -2.4554443359375, -2.34552001953125, -2.235595703125, -2.12567138671875, -2.0157470703125, -1.90582275390625, -1.7958984375, -1.68597412109375, -1.5760498046875, -1.46612548828125, -1.356201171875, -1.24627685546875, -1.1363525390625, -1.02642822265625, -0.91650390625, -0.80657958984375, -0.6966552734375, -0.58673095703125, -0.476806640625, -0.36688232421875, -0.2569580078125, -0.14703369140625, -0.037109375, 0.07281494140625, 0.1827392578125, 0.29266357421875, 0.402587890625, 0.51251220703125, 0.6224365234375, 0.73236083984375, 0.84228515625, 0.95220947265625, 1.0621337890625, 1.17205810546875, 1.281982421875, 1.39190673828125, 1.5018310546875, 1.61175537109375, 1.7216796875, 1.83160400390625, 1.9415283203125, 2.05145263671875, 2.161376953125, 2.27130126953125, 2.3812255859375, 2.49114990234375, 2.60107421875, 2.71099853515625, 2.8209228515625, 2.93084716796875, 3.040771484375, 3.15069580078125, 3.2606201171875, 3.37054443359375, 3.48046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 16.0, 24.0, 42.0, 70.0, 90.0, 144.0, 246.0, 448.0, 914.0, 1681.0, 3807.0, 9888.0, 37363.0, 320521.0, 2743810.0, 967320.0, 80734.0, 16426.0, 5712.0, 2459.0, 1115.0, 587.0, 292.0, 205.0, 105.0, 77.0, 54.0, 43.0, 20.0, 17.0, 10.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.3394775390625, -9.991455078125, -9.6434326171875, -9.29541015625, -8.9473876953125, -8.599365234375, -8.2513427734375, -7.9033203125, -7.5552978515625, -7.207275390625, -6.8592529296875, -6.51123046875, -6.1632080078125, -5.815185546875, -5.4671630859375, -5.119140625, -4.7711181640625, -4.423095703125, -4.0750732421875, -3.72705078125, -3.3790283203125, -3.031005859375, -2.6829833984375, -2.3349609375, -1.9869384765625, -1.638916015625, -1.2908935546875, -0.94287109375, -0.5948486328125, -0.246826171875, 0.1011962890625, 0.44921875, 0.7972412109375, 1.145263671875, 1.4932861328125, 1.84130859375, 2.1893310546875, 2.537353515625, 2.8853759765625, 3.2333984375, 3.5814208984375, 3.929443359375, 4.2774658203125, 4.62548828125, 4.9735107421875, 5.321533203125, 5.6695556640625, 6.017578125, 6.3656005859375, 6.713623046875, 7.0616455078125, 7.40966796875, 7.7576904296875, 8.105712890625, 8.4537353515625, 8.8017578125, 9.1497802734375, 9.497802734375, 9.8458251953125, 10.19384765625, 10.5418701171875, 10.889892578125, 11.2379150390625, 11.5859375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 9.0, 10.0, 5.0, 18.0, 23.0, 11.0, 30.0, 33.0, 49.0, 72.0, 98.0, 147.0, 220.0, 312.0, 453.0, 544.0, 564.0, 417.0, 343.0, 228.0, 145.0, 94.0, 74.0, 43.0, 37.0, 24.0, 18.0, 12.0, 12.0, 4.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.6796875, -8.416259765625, -8.15283203125, -7.889404296875, -7.6259765625, -7.362548828125, -7.09912109375, -6.835693359375, -6.572265625, -6.308837890625, -6.04541015625, -5.781982421875, -5.5185546875, -5.255126953125, -4.99169921875, -4.728271484375, -4.46484375, -4.201416015625, -3.93798828125, -3.674560546875, -3.4111328125, -3.147705078125, -2.88427734375, -2.620849609375, -2.357421875, -2.093994140625, -1.83056640625, -1.567138671875, -1.3037109375, -1.040283203125, -0.77685546875, -0.513427734375, -0.25, 0.013427734375, 0.27685546875, 0.540283203125, 0.8037109375, 1.067138671875, 1.33056640625, 1.593994140625, 1.857421875, 2.120849609375, 2.38427734375, 2.647705078125, 2.9111328125, 3.174560546875, 3.43798828125, 3.701416015625, 3.96484375, 4.228271484375, 4.49169921875, 4.755126953125, 5.0185546875, 5.281982421875, 5.54541015625, 5.808837890625, 6.072265625, 6.335693359375, 6.59912109375, 6.862548828125, 7.1259765625, 7.389404296875, 7.65283203125, 7.916259765625, 8.1796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 12.0, 14.0, 20.0, 27.0, 45.0, 42.0, 97.0, 143.0, 252.0, 604.0, 2460.0, 26530.0, 3408415.0, 742719.0, 10380.0, 1415.0, 462.0, 204.0, 121.0, 79.0, 56.0, 36.0, 26.0, 18.0, 23.0, 17.0, 6.0, 6.0, 12.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.75, -36.564453125, -35.37890625, -34.193359375, -33.0078125, -31.822265625, -30.63671875, -29.451171875, -28.265625, -27.080078125, -25.89453125, -24.708984375, -23.5234375, -22.337890625, -21.15234375, -19.966796875, -18.78125, -17.595703125, -16.41015625, -15.224609375, -14.0390625, -12.853515625, -11.66796875, -10.482421875, -9.296875, -8.111328125, -6.92578125, -5.740234375, -4.5546875, -3.369140625, -2.18359375, -0.998046875, 0.1875, 1.373046875, 2.55859375, 3.744140625, 4.9296875, 6.115234375, 7.30078125, 8.486328125, 9.671875, 10.857421875, 12.04296875, 13.228515625, 14.4140625, 15.599609375, 16.78515625, 17.970703125, 19.15625, 20.341796875, 21.52734375, 22.712890625, 23.8984375, 25.083984375, 26.26953125, 27.455078125, 28.640625, 29.826171875, 31.01171875, 32.197265625, 33.3828125, 34.568359375, 35.75390625, 36.939453125, 38.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 2.0, 6.0, 16.0, 21.0, 23.0, 36.0, 58.0, 53.0, 68.0, 73.0, 78.0, 89.0, 99.0, 85.0, 77.0, 54.0, 39.0, 28.0, 30.0, 20.0, 12.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.624752044677734, -40.56349182128906, -39.502227783203125, -38.44096755981445, -37.37970733642578, -36.31844711303711, -35.25718307495117, -34.1959228515625, -33.13466262817383, -32.073402404785156, -31.01214027404785, -29.950878143310547, -28.889617919921875, -27.82835578918457, -26.767093658447266, -25.705833435058594, -24.64457130432129, -23.583309173583984, -22.522048950195312, -21.460786819458008, -20.399526596069336, -19.33826446533203, -18.27700424194336, -17.215742111206055, -16.15447998046875, -15.093218803405762, -14.031957626342773, -12.970695495605469, -11.909435272216797, -10.848173141479492, -9.786911964416504, -8.725650787353516, -7.664388656616211, -6.603127479553223, -5.541866302490234, -4.480604648590088, -3.4193434715270996, -2.3580822944641113, -1.2968206405639648, -0.23555946350097656, 0.8257017135620117, 1.8869630098342896, 2.9482243061065674, 4.009485721588135, 5.070746898651123, 6.132008075714111, 7.193269729614258, 8.254530906677246, 9.315792083740234, 10.377053260803223, 11.438314437866211, 12.499576568603516, 13.560836791992188, 14.622098922729492, 15.68336009979248, 16.74462127685547, 17.80588150024414, 18.867143630981445, 19.928403854370117, 20.989665985107422, 22.050926208496094, 23.1121883392334, 24.173450469970703, 25.234710693359375, 26.29597282409668]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 0.0, 6.0, 6.0, 8.0, 7.0, 12.0, 10.0, 9.0, 21.0, 20.0, 35.0, 17.0, 29.0, 27.0, 39.0, 40.0, 39.0, 47.0, 35.0, 38.0, 30.0, 39.0, 41.0, 41.0, 44.0, 40.0, 40.0, 34.0, 27.0, 28.0, 29.0, 28.0, 32.0, 23.0, 11.0, 17.0, 10.0, 7.0, 5.0, 12.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.379417419433594, -28.551237106323242, -27.723058700561523, -26.894878387451172, -26.066699981689453, -25.2385196685791, -24.41033935546875, -23.58216094970703, -22.75398063659668, -21.925800323486328, -21.09762191772461, -20.269441604614258, -19.441261291503906, -18.613082885742188, -17.784902572631836, -16.956722259521484, -16.128543853759766, -15.30036449432373, -14.472185134887695, -13.644004821777344, -12.815825462341309, -11.987646102905273, -11.159465789794922, -10.331286430358887, -9.503107070922852, -8.674927711486816, -7.846747875213623, -7.01856803894043, -6.1903886795043945, -5.362209320068359, -4.534029483795166, -3.7058496475219727, -2.8776721954345703, -2.049492597579956, -1.2213129997253418, -0.39313340187072754, 0.4350461959838867, 1.2632255554199219, 2.0914053916931152, 2.9195852279663086, 3.7477645874023438, 4.575943946838379, 5.404123783111572, 6.232303619384766, 7.060482978820801, 7.888662338256836, 8.716842651367188, 9.545022010803223, 10.373201370239258, 11.201380729675293, 12.029560089111328, 12.85774040222168, 13.685919761657715, 14.51409912109375, 15.342279434204102, 16.170459747314453, 16.998638153076172, 17.826818466186523, 18.654996871948242, 19.483177185058594, 20.311355590820312, 21.139535903930664, 21.967716217041016, 22.795894622802734, 23.624074935913086]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 7.0, 9.0, 12.0, 12.0, 13.0, 19.0, 21.0, 23.0, 19.0, 25.0, 29.0, 29.0, 37.0, 33.0, 36.0, 42.0, 41.0, 53.0, 38.0, 49.0, 46.0, 43.0, 49.0, 32.0, 27.0, 25.0, 29.0, 28.0, 23.0, 22.0, 21.0, 13.0, 12.0, 14.0, 10.0, 14.0, 3.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.30078125, -3.192108154296875, -3.08343505859375, -2.974761962890625, -2.8660888671875, -2.757415771484375, -2.64874267578125, -2.540069580078125, -2.431396484375, -2.322723388671875, -2.21405029296875, -2.105377197265625, -1.9967041015625, -1.888031005859375, -1.77935791015625, -1.670684814453125, -1.56201171875, -1.453338623046875, -1.34466552734375, -1.235992431640625, -1.1273193359375, -1.018646240234375, -0.90997314453125, -0.801300048828125, -0.692626953125, -0.583953857421875, -0.47528076171875, -0.366607666015625, -0.2579345703125, -0.149261474609375, -0.04058837890625, 0.068084716796875, 0.1767578125, 0.285430908203125, 0.39410400390625, 0.502777099609375, 0.6114501953125, 0.720123291015625, 0.82879638671875, 0.937469482421875, 1.046142578125, 1.154815673828125, 1.26348876953125, 1.372161865234375, 1.4808349609375, 1.589508056640625, 1.69818115234375, 1.806854248046875, 1.91552734375, 2.024200439453125, 2.13287353515625, 2.241546630859375, 2.3502197265625, 2.458892822265625, 2.56756591796875, 2.676239013671875, 2.784912109375, 2.893585205078125, 3.00225830078125, 3.110931396484375, 3.2196044921875, 3.328277587890625, 3.43695068359375, 3.545623779296875, 3.654296875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 15.0, 29.0, 33.0, 53.0, 83.0, 120.0, 162.0, 228.0, 338.0, 503.0, 715.0, 1068.0, 1619.0, 2398.0, 3720.0, 5652.0, 8930.0, 14046.0, 22945.0, 38002.0, 66224.0, 122581.0, 314410.0, 212692.0, 94900.0, 53442.0, 31328.0, 18958.0, 11664.0, 7432.0, 4784.0, 3113.0, 2068.0, 1376.0, 927.0, 584.0, 429.0, 323.0, 212.0, 135.0, 84.0, 76.0, 54.0, 30.0, 18.0, 14.0, 10.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1890869140625, -0.18294906616210938, -0.17681121826171875, -0.17067337036132812, -0.1645355224609375, -0.15839767456054688, -0.15225982666015625, -0.14612197875976562, -0.139984130859375, -0.13384628295898438, -0.12770843505859375, -0.12157058715820312, -0.1154327392578125, -0.10929489135742188, -0.10315704345703125, -0.09701919555664062, -0.09088134765625, -0.08474349975585938, -0.07860565185546875, -0.07246780395507812, -0.0663299560546875, -0.060192108154296875, -0.05405426025390625, -0.047916412353515625, -0.041778564453125, -0.035640716552734375, -0.02950286865234375, -0.023365020751953125, -0.0172271728515625, -0.011089324951171875, -0.00495147705078125, 0.001186370849609375, 0.00732421875, 0.013462066650390625, 0.01959991455078125, 0.025737762451171875, 0.0318756103515625, 0.038013458251953125, 0.04415130615234375, 0.050289154052734375, 0.056427001953125, 0.06256484985351562, 0.06870269775390625, 0.07484054565429688, 0.0809783935546875, 0.08711624145507812, 0.09325408935546875, 0.09939193725585938, 0.10552978515625, 0.11166763305664062, 0.11780548095703125, 0.12394332885742188, 0.1300811767578125, 0.13621902465820312, 0.14235687255859375, 0.14849472045898438, 0.154632568359375, 0.16077041625976562, 0.16690826416015625, 0.17304611206054688, 0.1791839599609375, 0.18532180786132812, 0.19145965576171875, 0.19759750366210938, 0.2037353515625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 6.0, 5.0, 10.0, 8.0, 9.0, 11.0, 19.0, 17.0, 15.0, 9.0, 19.0, 24.0, 28.0, 32.0, 32.0, 30.0, 41.0, 39.0, 33.0, 44.0, 31.0, 44.0, 1056.0, 33.0, 31.0, 40.0, 43.0, 31.0, 33.0, 30.0, 33.0, 27.0, 18.0, 26.0, 17.0, 15.0, 12.0, 12.0, 10.0, 8.0, 9.0, 8.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.90234375, -2.815399169921875, -2.72845458984375, -2.641510009765625, -2.5545654296875, -2.467620849609375, -2.38067626953125, -2.293731689453125, -2.206787109375, -2.119842529296875, -2.03289794921875, -1.945953369140625, -1.8590087890625, -1.772064208984375, -1.68511962890625, -1.598175048828125, -1.51123046875, -1.424285888671875, -1.33734130859375, -1.250396728515625, -1.1634521484375, -1.076507568359375, -0.98956298828125, -0.902618408203125, -0.815673828125, -0.728729248046875, -0.64178466796875, -0.554840087890625, -0.4678955078125, -0.380950927734375, -0.29400634765625, -0.207061767578125, -0.1201171875, -0.033172607421875, 0.05377197265625, 0.140716552734375, 0.2276611328125, 0.314605712890625, 0.40155029296875, 0.488494873046875, 0.575439453125, 0.662384033203125, 0.74932861328125, 0.836273193359375, 0.9232177734375, 1.010162353515625, 1.09710693359375, 1.184051513671875, 1.27099609375, 1.357940673828125, 1.44488525390625, 1.531829833984375, 1.6187744140625, 1.705718994140625, 1.79266357421875, 1.879608154296875, 1.966552734375, 2.053497314453125, 2.14044189453125, 2.227386474609375, 2.3143310546875, 2.401275634765625, 2.48822021484375, 2.575164794921875, 2.662109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 17.0, 20.0, 40.0, 44.0, 69.0, 97.0, 166.0, 212.0, 330.0, 484.0, 728.0, 1118.0, 1618.0, 2386.0, 3736.0, 5950.0, 9205.0, 14501.0, 23140.0, 38395.0, 63919.0, 120484.0, 1282399.0, 273595.0, 104591.0, 56894.0, 34110.0, 21072.0, 13216.0, 8484.0, 5481.0, 3542.0, 2297.0, 1486.0, 1039.0, 670.0, 495.0, 313.0, 224.0, 161.0, 110.0, 93.0, 51.0, 45.0, 28.0, 12.0, 13.0, 13.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0692138671875, -0.06697368621826172, -0.06473350524902344, -0.062493324279785156, -0.060253143310546875, -0.058012962341308594, -0.05577278137207031, -0.05353260040283203, -0.05129241943359375, -0.04905223846435547, -0.04681205749511719, -0.044571876525878906, -0.042331695556640625, -0.040091514587402344, -0.03785133361816406, -0.03561115264892578, -0.0333709716796875, -0.03113079071044922, -0.028890609741210938, -0.026650428771972656, -0.024410247802734375, -0.022170066833496094, -0.019929885864257812, -0.01768970489501953, -0.01544952392578125, -0.013209342956542969, -0.010969161987304688, -0.008728981018066406, -0.006488800048828125, -0.004248619079589844, -0.0020084381103515625, 0.00023174285888671875, 0.002471923828125, 0.004712104797363281, 0.0069522857666015625, 0.009192466735839844, 0.011432647705078125, 0.013672828674316406, 0.015913009643554688, 0.01815319061279297, 0.02039337158203125, 0.02263355255126953, 0.024873733520507812, 0.027113914489746094, 0.029354095458984375, 0.031594276428222656, 0.03383445739746094, 0.03607463836669922, 0.0383148193359375, 0.04055500030517578, 0.04279518127441406, 0.045035362243652344, 0.047275543212890625, 0.049515724182128906, 0.05175590515136719, 0.05399608612060547, 0.05623626708984375, 0.05847644805908203, 0.06071662902832031, 0.0629568099975586, 0.06519699096679688, 0.06743717193603516, 0.06967735290527344, 0.07191753387451172, 0.07415771484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 7.0, 14.0, 13.0, 17.0, 17.0, 14.0, 17.0, 24.0, 27.0, 38.0, 27.0, 39.0, 42.0, 51.0, 44.0, 62.0, 48.0, 72.0, 55.0, 50.0, 37.0, 43.0, 33.0, 35.0, 25.0, 25.0, 25.0, 15.0, 11.0, 14.0, 9.0, 15.0, 7.0, 4.0, 2.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0008521080017089844, -0.0008273199200630188, -0.0008025318384170532, -0.0007777437567710876, -0.0007529556751251221, -0.0007281675934791565, -0.0007033795118331909, -0.0006785914301872253, -0.0006538033485412598, -0.0006290152668952942, -0.0006042271852493286, -0.000579439103603363, -0.0005546510219573975, -0.0005298629403114319, -0.0005050748586654663, -0.00048028677701950073, -0.00045549869537353516, -0.0004307106137275696, -0.000405922532081604, -0.00038113445043563843, -0.00035634636878967285, -0.0003315582871437073, -0.0003067702054977417, -0.0002819821238517761, -0.00025719404220581055, -0.00023240596055984497, -0.0002076178789138794, -0.00018282979726791382, -0.00015804171562194824, -0.00013325363397598267, -0.00010846555233001709, -8.367747068405151e-05, -5.888938903808594e-05, -3.410130739212036e-05, -9.313225746154785e-06, 1.547485589981079e-05, 4.026293754577637e-05, 6.505101919174194e-05, 8.983910083770752e-05, 0.0001146271824836731, 0.00013941526412963867, 0.00016420334577560425, 0.00018899142742156982, 0.0002137795090675354, 0.00023856759071350098, 0.00026335567235946655, 0.00028814375400543213, 0.0003129318356513977, 0.0003377199172973633, 0.00036250799894332886, 0.00038729608058929443, 0.00041208416223526, 0.0004368722438812256, 0.00046166032552719116, 0.00048644840717315674, 0.0005112364888191223, 0.0005360245704650879, 0.0005608126521110535, 0.000585600733757019, 0.0006103888154029846, 0.0006351768970489502, 0.0006599649786949158, 0.0006847530603408813, 0.0007095411419868469, 0.0007343292236328125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 5.0, 11.0, 10.0, 8.0, 8.0, 15.0, 21.0, 23.0, 27.0, 33.0, 39.0, 42.0, 92.0, 138.0, 386.0, 2134.0, 34680.0, 934023.0, 72376.0, 3417.0, 523.0, 165.0, 98.0, 52.0, 49.0, 28.0, 31.0, 14.0, 16.0, 15.0, 13.0, 18.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01458740234375, -0.01409459114074707, -0.01360177993774414, -0.013108968734741211, -0.012616157531738281, -0.012123346328735352, -0.011630535125732422, -0.011137723922729492, -0.010644912719726562, -0.010152101516723633, -0.009659290313720703, -0.009166479110717773, -0.008673667907714844, -0.008180856704711914, -0.007688045501708984, -0.007195234298706055, -0.006702423095703125, -0.006209611892700195, -0.005716800689697266, -0.005223989486694336, -0.004731178283691406, -0.0042383670806884766, -0.003745555877685547, -0.003252744674682617, -0.0027599334716796875, -0.002267122268676758, -0.0017743110656738281, -0.0012814998626708984, -0.0007886886596679688, -0.00029587745666503906, 0.00019693374633789062, 0.0006897449493408203, 0.00118255615234375, 0.0016753673553466797, 0.0021681785583496094, 0.002660989761352539, 0.0031538009643554688, 0.0036466121673583984, 0.004139423370361328, 0.004632234573364258, 0.0051250457763671875, 0.005617856979370117, 0.006110668182373047, 0.0066034793853759766, 0.007096290588378906, 0.007589101791381836, 0.008081912994384766, 0.008574724197387695, 0.009067535400390625, 0.009560346603393555, 0.010053157806396484, 0.010545969009399414, 0.011038780212402344, 0.011531591415405273, 0.012024402618408203, 0.012517213821411133, 0.013010025024414062, 0.013502836227416992, 0.013995647430419922, 0.014488458633422852, 0.014981269836425781, 0.015474081039428711, 0.01596689224243164, 0.01645970344543457, 0.0169525146484375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 861.0, 155.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002205475000664592, -0.001434606732800603, -0.0006637385813519359, 0.00010712957009673119, 0.0008779978379607201, 0.001648866105824709, 0.002419734140858054, 0.003190602408722043, 0.003961470909416676, 0.0047323391772806644, 0.005503207445144653, 0.006274075247347355, 0.007044943980872631, 0.007815811783075333, 0.008586680516600609, 0.00935754831880331, 0.010128416121006012, 0.010899283923208714, 0.01167015265673399, 0.012441020458936691, 0.013211889192461967, 0.013982756994664669, 0.01475362479686737, 0.015524493530392647, 0.016295362263917923, 0.0170662309974432, 0.017837097868323326, 0.018607966601848602, 0.01937883533537388, 0.020149704068899155, 0.02092057093977928, 0.021691439673304558, 0.022462306544184685, 0.02323317527770996, 0.024004042148590088, 0.024774910882115364, 0.02554577961564064, 0.026316648349165916, 0.027087515220046043, 0.02785838395357132, 0.028629252687096596, 0.029400121420621872, 0.030170988291502, 0.030941857025027275, 0.03171272575855255, 0.03248359262943268, 0.033254463225603104, 0.03402533009648323, 0.03479619696736336, 0.035567063838243484, 0.03633793443441391, 0.03710880130529404, 0.037879668176174164, 0.03865053877234459, 0.039421405643224716, 0.04019227623939514, 0.04096314311027527, 0.041734009981155396, 0.04250488057732582, 0.04327574744820595, 0.044046614319086075, 0.0448174849152565, 0.04558835178613663, 0.046359218657016754, 0.04713008925318718]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 19.0, 17.0, 36.0, 44.0, 71.0, 87.0, 99.0, 97.0, 75.0, 93.0, 77.0, 77.0, 50.0, 42.0, 49.0, 26.0, 14.0, 11.0, 7.0, 5.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.002314150333404541, -0.002266271971166134, -0.0022183936089277267, -0.0021705152466893196, -0.0021226368844509125, -0.0020747585222125053, -0.002026880159974098, -0.001979001797735691, -0.001931123435497284, -0.0018832450732588768, -0.0018353667110204697, -0.0017874883487820625, -0.0017396099865436554, -0.0016917316243052483, -0.0016438532620668411, -0.001595974899828434, -0.0015480965375900269, -0.0015002181753516197, -0.0014523398131132126, -0.0014044614508748055, -0.0013565830886363983, -0.0013087047263979912, -0.001260826364159584, -0.001212948001921177, -0.0011650696396827698, -0.0011171912774443626, -0.0010693129152059555, -0.0010214345529675484, -0.0009735561907291412, -0.0009256778284907341, -0.000877799466252327, -0.0008299211040139198, -0.0007820427417755127, -0.0007341643795371056, -0.0006862860172986984, -0.0006384076550602913, -0.0005905292928218842, -0.000542650930583477, -0.0004947725683450699, -0.00044689420610666275, -0.0003990158438682556, -0.0003511374816298485, -0.00030325911939144135, -0.0002553807571530342, -0.00020750239491462708, -0.00015962403267621994, -0.0001117456704378128, -6.386730819940567e-05, -1.5988945960998535e-05, 3.18894162774086e-05, 7.976777851581573e-05, 0.00012764614075422287, 0.00017552450299263, 0.00022340286523103714, 0.0002712812274694443, 0.0003191595897078514, 0.00036703795194625854, 0.0004149163141846657, 0.0004627946764230728, 0.00051067303866148, 0.0005585514008998871, 0.0006064297631382942, 0.0006543081253767014, 0.0007021864876151085, 0.0007500648498535156]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 7.0, 9.0, 12.0, 12.0, 13.0, 19.0, 22.0, 22.0, 19.0, 25.0, 29.0, 29.0, 37.0, 33.0, 36.0, 42.0, 41.0, 53.0, 38.0, 49.0, 46.0, 43.0, 49.0, 32.0, 27.0, 25.0, 29.0, 28.0, 23.0, 22.0, 21.0, 13.0, 12.0, 14.0, 10.0, 14.0, 3.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.30078125, -3.192108154296875, -3.08343505859375, -2.974761962890625, -2.8660888671875, -2.757415771484375, -2.64874267578125, -2.540069580078125, -2.431396484375, -2.322723388671875, -2.21405029296875, -2.105377197265625, -1.9967041015625, -1.888031005859375, -1.77935791015625, -1.670684814453125, -1.56201171875, -1.453338623046875, -1.34466552734375, -1.235992431640625, -1.1273193359375, -1.018646240234375, -0.90997314453125, -0.801300048828125, -0.692626953125, -0.583953857421875, -0.47528076171875, -0.366607666015625, -0.2579345703125, -0.149261474609375, -0.04058837890625, 0.068084716796875, 0.1767578125, 0.285430908203125, 0.39410400390625, 0.502777099609375, 0.6114501953125, 0.720123291015625, 0.82879638671875, 0.937469482421875, 1.046142578125, 1.154815673828125, 1.26348876953125, 1.372161865234375, 1.4808349609375, 1.589508056640625, 1.69818115234375, 1.806854248046875, 1.91552734375, 2.024200439453125, 2.13287353515625, 2.241546630859375, 2.3502197265625, 2.458892822265625, 2.56756591796875, 2.676239013671875, 2.784912109375, 2.893585205078125, 3.00225830078125, 3.110931396484375, 3.2196044921875, 3.328277587890625, 3.43695068359375, 3.545623779296875, 3.654296875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 10.0, 13.0, 18.0, 22.0, 38.0, 55.0, 80.0, 117.0, 190.0, 296.0, 441.0, 690.0, 1100.0, 1864.0, 3358.0, 6333.0, 12422.0, 25297.0, 64792.0, 317007.0, 460345.0, 90875.0, 31388.0, 14630.0, 7494.0, 3979.0, 2188.0, 1258.0, 808.0, 491.0, 309.0, 216.0, 145.0, 81.0, 63.0, 36.0, 32.0, 16.0, 15.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.078125, -7.83428955078125, -7.5904541015625, -7.34661865234375, -7.102783203125, -6.85894775390625, -6.6151123046875, -6.37127685546875, -6.12744140625, -5.88360595703125, -5.6397705078125, -5.39593505859375, -5.152099609375, -4.90826416015625, -4.6644287109375, -4.42059326171875, -4.1767578125, -3.93292236328125, -3.6890869140625, -3.44525146484375, -3.201416015625, -2.95758056640625, -2.7137451171875, -2.46990966796875, -2.22607421875, -1.98223876953125, -1.7384033203125, -1.49456787109375, -1.250732421875, -1.00689697265625, -0.7630615234375, -0.51922607421875, -0.275390625, -0.03155517578125, 0.2122802734375, 0.45611572265625, 0.699951171875, 0.94378662109375, 1.1876220703125, 1.43145751953125, 1.67529296875, 1.91912841796875, 2.1629638671875, 2.40679931640625, 2.650634765625, 2.89447021484375, 3.1383056640625, 3.38214111328125, 3.6259765625, 3.86981201171875, 4.1136474609375, 4.35748291015625, 4.601318359375, 4.84515380859375, 5.0889892578125, 5.33282470703125, 5.57666015625, 5.82049560546875, 6.0643310546875, 6.30816650390625, 6.552001953125, 6.79583740234375, 7.0396728515625, 7.28350830078125, 7.52734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 8.0, 10.0, 9.0, 21.0, 17.0, 10.0, 14.0, 21.0, 21.0, 29.0, 38.0, 37.0, 62.0, 53.0, 84.0, 111.0, 237.0, 1437.0, 229.0, 131.0, 84.0, 60.0, 47.0, 49.0, 43.0, 33.0, 35.0, 28.0, 18.0, 18.0, 14.0, 4.0, 7.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.8046875, -11.390625, -10.9765625, -10.5625, -10.1484375, -9.734375, -9.3203125, -8.90625, -8.4921875, -8.078125, -7.6640625, -7.25, -6.8359375, -6.421875, -6.0078125, -5.59375, -5.1796875, -4.765625, -4.3515625, -3.9375, -3.5234375, -3.109375, -2.6953125, -2.28125, -1.8671875, -1.453125, -1.0390625, -0.625, -0.2109375, 0.203125, 0.6171875, 1.03125, 1.4453125, 1.859375, 2.2734375, 2.6875, 3.1015625, 3.515625, 3.9296875, 4.34375, 4.7578125, 5.171875, 5.5859375, 6.0, 6.4140625, 6.828125, 7.2421875, 7.65625, 8.0703125, 8.484375, 8.8984375, 9.3125, 9.7265625, 10.140625, 10.5546875, 10.96875, 11.3828125, 11.796875, 12.2109375, 12.625, 13.0390625, 13.453125, 13.8671875, 14.28125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 7.0, 7.0, 8.0, 12.0, 15.0, 23.0, 29.0, 50.0, 46.0, 65.0, 90.0, 158.0, 287.0, 767.0, 4076.0, 43965.0, 2597837.0, 479536.0, 15562.0, 1952.0, 507.0, 208.0, 130.0, 89.0, 64.0, 48.0, 40.0, 27.0, 19.0, 16.0, 16.0, 14.0, 9.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.25, -27.4384765625, -26.626953125, -25.8154296875, -25.00390625, -24.1923828125, -23.380859375, -22.5693359375, -21.7578125, -20.9462890625, -20.134765625, -19.3232421875, -18.51171875, -17.7001953125, -16.888671875, -16.0771484375, -15.265625, -14.4541015625, -13.642578125, -12.8310546875, -12.01953125, -11.2080078125, -10.396484375, -9.5849609375, -8.7734375, -7.9619140625, -7.150390625, -6.3388671875, -5.52734375, -4.7158203125, -3.904296875, -3.0927734375, -2.28125, -1.4697265625, -0.658203125, 0.1533203125, 0.96484375, 1.7763671875, 2.587890625, 3.3994140625, 4.2109375, 5.0224609375, 5.833984375, 6.6455078125, 7.45703125, 8.2685546875, 9.080078125, 9.8916015625, 10.703125, 11.5146484375, 12.326171875, 13.1376953125, 13.94921875, 14.7607421875, 15.572265625, 16.3837890625, 17.1953125, 18.0068359375, 18.818359375, 19.6298828125, 20.44140625, 21.2529296875, 22.064453125, 22.8759765625, 23.6875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 62.0, 412.0, 460.0, 79.0, 4.0, 1.0, 1.0], "bins": [-264.3245544433594, -259.8451232910156, -255.3656768798828, -250.88624572753906, -246.40679931640625, -241.9273681640625, -237.44793701171875, -232.96849060058594, -228.4890594482422, -224.00962829589844, -219.53018188476562, -215.05075073242188, -210.57130432128906, -206.0918731689453, -201.6124267578125, -197.13299560546875, -192.653564453125, -188.17413330078125, -183.69468688964844, -179.2152557373047, -174.73580932617188, -170.25637817382812, -165.77694702148438, -161.29750061035156, -156.81805419921875, -152.338623046875, -147.8591766357422, -143.37974548339844, -138.90029907226562, -134.42086791992188, -129.94143676757812, -125.46199035644531, -120.98255920410156, -116.50312042236328, -112.023681640625, -107.54425048828125, -103.06481170654297, -98.58537292480469, -94.1059341430664, -89.62649536132812, -85.14705657958984, -80.66761779785156, -76.18817901611328, -71.708740234375, -67.22930908203125, -62.74987030029297, -58.27043151855469, -53.790992736816406, -49.31155776977539, -44.83211898803711, -40.352684020996094, -35.87324523925781, -31.393808364868164, -26.914371490478516, -22.434932708740234, -17.955495834350586, -13.476058959960938, -8.996622085571289, -4.517184257507324, -0.037746429443359375, 4.441690444946289, 8.921127319335938, 13.400566101074219, 17.880002975463867, 22.359439849853516]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 7.0, 5.0, 10.0, 11.0, 8.0, 10.0, 18.0, 19.0, 17.0, 18.0, 33.0, 36.0, 39.0, 33.0, 32.0, 39.0, 44.0, 39.0, 36.0, 40.0, 46.0, 37.0, 40.0, 31.0, 29.0, 32.0, 28.0, 27.0, 30.0, 30.0, 18.0, 21.0, 15.0, 10.0, 13.0, 12.0, 13.0, 8.0, 12.0, 9.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.69312858581543, -27.771778106689453, -26.850425720214844, -25.929075241088867, -25.00772476196289, -24.08637237548828, -23.165021896362305, -22.243671417236328, -21.32231903076172, -20.400968551635742, -19.479616165161133, -18.558265686035156, -17.636913299560547, -16.71556282043457, -15.794212341308594, -14.8728609085083, -13.951509475708008, -13.030158042907715, -12.108806610107422, -11.187456130981445, -10.266104698181152, -9.34475326538086, -8.423402786254883, -7.50205135345459, -6.580699920654297, -5.659348487854004, -4.737997531890869, -3.8166463375091553, -2.8952951431274414, -1.9739437103271484, -1.0525927543640137, -0.1312417984008789, 0.7901096343994141, 1.711460828781128, 2.632812023162842, 3.5541632175445557, 4.4755144119262695, 5.3968658447265625, 6.318216800689697, 7.239567756652832, 8.160919189453125, 9.082270622253418, 10.003622055053711, 10.924972534179688, 11.84632396697998, 12.767675399780273, 13.68902587890625, 14.610377311706543, 15.531728744506836, 16.453079223632812, 17.374431610107422, 18.2957820892334, 19.217132568359375, 20.138484954833984, 21.05983543395996, 21.981185913085938, 22.902538299560547, 23.823888778686523, 24.745241165161133, 25.66659164428711, 26.58794403076172, 27.509294509887695, 28.430644989013672, 29.35199737548828, 30.273347854614258]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 6.0, 8.0, 5.0, 12.0, 17.0, 10.0, 13.0, 22.0, 21.0, 31.0, 26.0, 28.0, 26.0, 41.0, 36.0, 32.0, 50.0, 52.0, 51.0, 46.0, 56.0, 52.0, 44.0, 39.0, 27.0, 33.0, 29.0, 27.0, 14.0, 24.0, 27.0, 17.0, 14.0, 14.0, 7.0, 13.0, 4.0, 1.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.619140625, -3.498321533203125, -3.37750244140625, -3.256683349609375, -3.1358642578125, -3.015045166015625, -2.89422607421875, -2.773406982421875, -2.652587890625, -2.531768798828125, -2.41094970703125, -2.290130615234375, -2.1693115234375, -2.048492431640625, -1.92767333984375, -1.806854248046875, -1.68603515625, -1.565216064453125, -1.44439697265625, -1.323577880859375, -1.2027587890625, -1.081939697265625, -0.96112060546875, -0.840301513671875, -0.719482421875, -0.598663330078125, -0.47784423828125, -0.357025146484375, -0.2362060546875, -0.115386962890625, 0.00543212890625, 0.126251220703125, 0.2470703125, 0.367889404296875, 0.48870849609375, 0.609527587890625, 0.7303466796875, 0.851165771484375, 0.97198486328125, 1.092803955078125, 1.213623046875, 1.334442138671875, 1.45526123046875, 1.576080322265625, 1.6968994140625, 1.817718505859375, 1.93853759765625, 2.059356689453125, 2.18017578125, 2.300994873046875, 2.42181396484375, 2.542633056640625, 2.6634521484375, 2.784271240234375, 2.90509033203125, 3.025909423828125, 3.146728515625, 3.267547607421875, 3.38836669921875, 3.509185791015625, 3.6300048828125, 3.750823974609375, 3.87164306640625, 3.992462158203125, 4.11328125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 8.0, 11.0, 12.0, 21.0, 29.0, 37.0, 56.0, 108.0, 163.0, 334.0, 885.0, 2570.0, 12295.0, 195303.0, 3681141.0, 281830.0, 14652.0, 2955.0, 942.0, 403.0, 198.0, 112.0, 55.0, 39.0, 36.0, 15.0, 18.0, 14.0, 9.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.494873046875, -15.89599609375, -15.297119140625, -14.6982421875, -14.099365234375, -13.50048828125, -12.901611328125, -12.302734375, -11.703857421875, -11.10498046875, -10.506103515625, -9.9072265625, -9.308349609375, -8.70947265625, -8.110595703125, -7.51171875, -6.912841796875, -6.31396484375, -5.715087890625, -5.1162109375, -4.517333984375, -3.91845703125, -3.319580078125, -2.720703125, -2.121826171875, -1.52294921875, -0.924072265625, -0.3251953125, 0.273681640625, 0.87255859375, 1.471435546875, 2.0703125, 2.669189453125, 3.26806640625, 3.866943359375, 4.4658203125, 5.064697265625, 5.66357421875, 6.262451171875, 6.861328125, 7.460205078125, 8.05908203125, 8.657958984375, 9.2568359375, 9.855712890625, 10.45458984375, 11.053466796875, 11.65234375, 12.251220703125, 12.85009765625, 13.448974609375, 14.0478515625, 14.646728515625, 15.24560546875, 15.844482421875, 16.443359375, 17.042236328125, 17.64111328125, 18.239990234375, 18.8388671875, 19.437744140625, 20.03662109375, 20.635498046875, 21.234375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 12.0, 12.0, 15.0, 22.0, 27.0, 69.0, 101.0, 142.0, 222.0, 393.0, 543.0, 784.0, 669.0, 425.0, 234.0, 161.0, 95.0, 50.0, 33.0, 16.0, 12.0, 11.0, 12.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.669677734375, -8.33154296875, -7.993408203125, -7.6552734375, -7.317138671875, -6.97900390625, -6.640869140625, -6.302734375, -5.964599609375, -5.62646484375, -5.288330078125, -4.9501953125, -4.612060546875, -4.27392578125, -3.935791015625, -3.59765625, -3.259521484375, -2.92138671875, -2.583251953125, -2.2451171875, -1.906982421875, -1.56884765625, -1.230712890625, -0.892578125, -0.554443359375, -0.21630859375, 0.121826171875, 0.4599609375, 0.798095703125, 1.13623046875, 1.474365234375, 1.8125, 2.150634765625, 2.48876953125, 2.826904296875, 3.1650390625, 3.503173828125, 3.84130859375, 4.179443359375, 4.517578125, 4.855712890625, 5.19384765625, 5.531982421875, 5.8701171875, 6.208251953125, 6.54638671875, 6.884521484375, 7.22265625, 7.560791015625, 7.89892578125, 8.237060546875, 8.5751953125, 8.913330078125, 9.25146484375, 9.589599609375, 9.927734375, 10.265869140625, 10.60400390625, 10.942138671875, 11.2802734375, 11.618408203125, 11.95654296875, 12.294677734375, 12.6328125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 12.0, 6.0, 19.0, 12.0, 28.0, 41.0, 80.0, 172.0, 308.0, 966.0, 12364.0, 3949046.0, 227451.0, 2637.0, 547.0, 258.0, 117.0, 89.0, 43.0, 26.0, 18.0, 10.0, 17.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.8125, -60.17529296875, -58.5380859375, -56.90087890625, -55.263671875, -53.62646484375, -51.9892578125, -50.35205078125, -48.71484375, -47.07763671875, -45.4404296875, -43.80322265625, -42.166015625, -40.52880859375, -38.8916015625, -37.25439453125, -35.6171875, -33.97998046875, -32.3427734375, -30.70556640625, -29.068359375, -27.43115234375, -25.7939453125, -24.15673828125, -22.51953125, -20.88232421875, -19.2451171875, -17.60791015625, -15.970703125, -14.33349609375, -12.6962890625, -11.05908203125, -9.421875, -7.78466796875, -6.1474609375, -4.51025390625, -2.873046875, -1.23583984375, 0.4013671875, 2.03857421875, 3.67578125, 5.31298828125, 6.9501953125, 8.58740234375, 10.224609375, 11.86181640625, 13.4990234375, 15.13623046875, 16.7734375, 18.41064453125, 20.0478515625, 21.68505859375, 23.322265625, 24.95947265625, 26.5966796875, 28.23388671875, 29.87109375, 31.50830078125, 33.1455078125, 34.78271484375, 36.419921875, 38.05712890625, 39.6943359375, 41.33154296875, 42.96875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 16.0, 20.0, 24.0, 39.0, 52.0, 78.0, 80.0, 106.0, 116.0, 98.0, 93.0, 75.0, 59.0, 39.0, 36.0, 30.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.172107696533203, -19.05388069152832, -17.935653686523438, -16.817428588867188, -15.699201583862305, -14.580974578857422, -13.462747573852539, -12.344520568847656, -11.22629451751709, -10.108067512512207, -8.98984146118164, -7.871614456176758, -6.753387928009033, -5.635161399841309, -4.516934394836426, -3.398707866668701, -2.2804813385009766, -1.1622546911239624, -0.04402804374694824, 1.0741987228393555, 2.19242525100708, 3.3106517791748047, 4.4288787841796875, 5.547105312347412, 6.665331840515137, 7.783558368682861, 8.901784896850586, 10.020011901855469, 11.138238906860352, 12.256464958190918, 13.3746919631958, 14.492918014526367, 15.61114501953125, 16.729372024536133, 17.847599029541016, 18.965824127197266, 20.08405113220215, 21.20227813720703, 22.320505142211914, 23.438732147216797, 24.556957244873047, 25.67518424987793, 26.793411254882812, 27.911636352539062, 29.029863357543945, 30.148090362548828, 31.26631736755371, 32.384544372558594, 33.502769470214844, 34.620994567871094, 35.73922348022461, 36.85744857788086, 37.975677490234375, 39.093902587890625, 40.212127685546875, 41.33035659790039, 42.448585510253906, 43.566810607910156, 44.68503952026367, 45.80326461791992, 46.92149353027344, 48.03971862792969, 49.15794372558594, 50.27617263793945, 51.3943977355957]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 7.0, 5.0, 13.0, 11.0, 11.0, 15.0, 21.0, 20.0, 23.0, 25.0, 25.0, 33.0, 38.0, 45.0, 30.0, 47.0, 45.0, 47.0, 53.0, 45.0, 44.0, 46.0, 50.0, 40.0, 39.0, 34.0, 25.0, 27.0, 24.0, 28.0, 14.0, 19.0, 15.0, 10.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-31.912277221679688, -31.053913116455078, -30.19554901123047, -29.337182998657227, -28.478818893432617, -27.620454788208008, -26.762088775634766, -25.903724670410156, -25.045360565185547, -24.186996459960938, -23.328632354736328, -22.470266342163086, -21.611902236938477, -20.753538131713867, -19.895172119140625, -19.036808013916016, -18.178443908691406, -17.320079803466797, -16.461715698242188, -15.603349685668945, -14.744985580444336, -13.886621475219727, -13.0282564163208, -12.169891357421875, -11.311527252197266, -10.453163146972656, -9.59479808807373, -8.736433029174805, -7.878068923950195, -7.019704341888428, -6.16133975982666, -5.302975177764893, -4.444612503051758, -3.5862479209899902, -2.7278833389282227, -1.869518756866455, -1.0111541748046875, -0.15278959274291992, 0.7055749893188477, 1.5639395713806152, 2.422304153442383, 3.2806687355041504, 4.139033317565918, 4.9973978996276855, 5.855762481689453, 6.714127063751221, 7.572491645812988, 8.430856704711914, 9.289220809936523, 10.147584915161133, 11.005949974060059, 11.864315032958984, 12.722679138183594, 13.581043243408203, 14.439408302307129, 15.297773361206055, 16.156137466430664, 17.014501571655273, 17.872867584228516, 18.731231689453125, 19.589595794677734, 20.447959899902344, 21.306324005126953, 22.164690017700195, 23.023054122924805]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 4.0, 9.0, 2.0, 10.0, 12.0, 10.0, 23.0, 14.0, 24.0, 18.0, 31.0, 24.0, 19.0, 34.0, 39.0, 34.0, 34.0, 43.0, 46.0, 50.0, 41.0, 54.0, 51.0, 44.0, 34.0, 33.0, 33.0, 24.0, 28.0, 16.0, 25.0, 28.0, 20.0, 21.0, 11.0, 13.0, 8.0, 11.0, 1.0, 9.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.405242919921875, -3.28900146484375, -3.172760009765625, -3.0565185546875, -2.940277099609375, -2.82403564453125, -2.707794189453125, -2.591552734375, -2.475311279296875, -2.35906982421875, -2.242828369140625, -2.1265869140625, -2.010345458984375, -1.89410400390625, -1.777862548828125, -1.66162109375, -1.545379638671875, -1.42913818359375, -1.312896728515625, -1.1966552734375, -1.080413818359375, -0.96417236328125, -0.847930908203125, -0.731689453125, -0.615447998046875, -0.49920654296875, -0.382965087890625, -0.2667236328125, -0.150482177734375, -0.03424072265625, 0.082000732421875, 0.1982421875, 0.314483642578125, 0.43072509765625, 0.546966552734375, 0.6632080078125, 0.779449462890625, 0.89569091796875, 1.011932373046875, 1.128173828125, 1.244415283203125, 1.36065673828125, 1.476898193359375, 1.5931396484375, 1.709381103515625, 1.82562255859375, 1.941864013671875, 2.05810546875, 2.174346923828125, 2.29058837890625, 2.406829833984375, 2.5230712890625, 2.639312744140625, 2.75555419921875, 2.871795654296875, 2.988037109375, 3.104278564453125, 3.22052001953125, 3.336761474609375, 3.4530029296875, 3.569244384765625, 3.68548583984375, 3.801727294921875, 3.91796875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 11.0, 5.0, 20.0, 18.0, 25.0, 22.0, 45.0, 59.0, 90.0, 112.0, 114.0, 212.0, 342.0, 492.0, 571.0, 933.0, 1289.0, 1713.0, 2590.0, 3689.0, 5434.0, 7995.0, 12017.0, 17903.0, 26344.0, 40451.0, 64383.0, 114507.0, 261002.0, 217331.0, 98990.0, 57762.0, 36982.0, 24292.0, 16013.0, 10706.0, 7558.0, 5167.0, 3380.0, 2418.0, 1659.0, 1108.0, 791.0, 615.0, 364.0, 286.0, 221.0, 153.0, 112.0, 69.0, 46.0, 51.0, 28.0, 30.0, 14.0, 10.0, 8.0, 8.0, 4.0, 5.0], "bins": [-0.1783447265625, -0.17292213439941406, -0.16749954223632812, -0.1620769500732422, -0.15665435791015625, -0.1512317657470703, -0.14580917358398438, -0.14038658142089844, -0.1349639892578125, -0.12954139709472656, -0.12411880493164062, -0.11869621276855469, -0.11327362060546875, -0.10785102844238281, -0.10242843627929688, -0.09700584411621094, -0.091583251953125, -0.08616065979003906, -0.08073806762695312, -0.07531547546386719, -0.06989288330078125, -0.06447029113769531, -0.059047698974609375, -0.05362510681152344, -0.0482025146484375, -0.04277992248535156, -0.037357330322265625, -0.03193473815917969, -0.02651214599609375, -0.021089553833007812, -0.015666961669921875, -0.010244369506835938, -0.00482177734375, 0.0006008148193359375, 0.006023406982421875, 0.011445999145507812, 0.01686859130859375, 0.022291183471679688, 0.027713775634765625, 0.03313636779785156, 0.0385589599609375, 0.04398155212402344, 0.049404144287109375, 0.05482673645019531, 0.06024932861328125, 0.06567192077636719, 0.07109451293945312, 0.07651710510253906, 0.081939697265625, 0.08736228942871094, 0.09278488159179688, 0.09820747375488281, 0.10363006591796875, 0.10905265808105469, 0.11447525024414062, 0.11989784240722656, 0.1253204345703125, 0.13074302673339844, 0.13616561889648438, 0.1415882110595703, 0.14701080322265625, 0.1524333953857422, 0.15785598754882812, 0.16327857971191406, 0.168701171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 6.0, 5.0, 12.0, 10.0, 14.0, 17.0, 14.0, 21.0, 23.0, 24.0, 25.0, 26.0, 43.0, 32.0, 40.0, 41.0, 33.0, 35.0, 53.0, 1070.0, 55.0, 56.0, 49.0, 32.0, 40.0, 39.0, 33.0, 34.0, 33.0, 23.0, 16.0, 21.0, 9.0, 9.0, 11.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.462890625, -3.35888671875, -3.2548828125, -3.15087890625, -3.046875, -2.94287109375, -2.8388671875, -2.73486328125, -2.630859375, -2.52685546875, -2.4228515625, -2.31884765625, -2.21484375, -2.11083984375, -2.0068359375, -1.90283203125, -1.798828125, -1.69482421875, -1.5908203125, -1.48681640625, -1.3828125, -1.27880859375, -1.1748046875, -1.07080078125, -0.966796875, -0.86279296875, -0.7587890625, -0.65478515625, -0.55078125, -0.44677734375, -0.3427734375, -0.23876953125, -0.134765625, -0.03076171875, 0.0732421875, 0.17724609375, 0.28125, 0.38525390625, 0.4892578125, 0.59326171875, 0.697265625, 0.80126953125, 0.9052734375, 1.00927734375, 1.11328125, 1.21728515625, 1.3212890625, 1.42529296875, 1.529296875, 1.63330078125, 1.7373046875, 1.84130859375, 1.9453125, 2.04931640625, 2.1533203125, 2.25732421875, 2.361328125, 2.46533203125, 2.5693359375, 2.67333984375, 2.77734375, 2.88134765625, 2.9853515625, 3.08935546875, 3.193359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 11.0, 8.0, 12.0, 16.0, 24.0, 45.0, 51.0, 86.0, 115.0, 175.0, 236.0, 365.0, 500.0, 711.0, 1105.0, 1582.0, 2295.0, 3457.0, 4911.0, 6964.0, 10494.0, 15649.0, 23735.0, 36908.0, 60520.0, 107590.0, 301436.0, 1208540.0, 122648.0, 67216.0, 40913.0, 26180.0, 16784.0, 11308.0, 7702.0, 5199.0, 3534.0, 2515.0, 1664.0, 1224.0, 830.0, 579.0, 399.0, 313.0, 183.0, 145.0, 75.0, 63.0, 37.0, 30.0, 20.0, 17.0, 4.0, 8.0, 5.0, 2.0, 5.0, 1.0], "bins": [-0.05926513671875, -0.057474613189697266, -0.05568408966064453, -0.0538935661315918, -0.05210304260253906, -0.05031251907348633, -0.048521995544433594, -0.04673147201538086, -0.044940948486328125, -0.04315042495727539, -0.041359901428222656, -0.03956937789916992, -0.03777885437011719, -0.03598833084106445, -0.03419780731201172, -0.032407283782958984, -0.03061676025390625, -0.028826236724853516, -0.02703571319580078, -0.025245189666748047, -0.023454666137695312, -0.021664142608642578, -0.019873619079589844, -0.01808309555053711, -0.016292572021484375, -0.01450204849243164, -0.012711524963378906, -0.010921001434326172, -0.009130477905273438, -0.007339954376220703, -0.005549430847167969, -0.0037589073181152344, -0.0019683837890625, -0.00017786026000976562, 0.0016126632690429688, 0.003403186798095703, 0.0051937103271484375, 0.006984233856201172, 0.008774757385253906, 0.01056528091430664, 0.012355804443359375, 0.01414632797241211, 0.015936851501464844, 0.017727375030517578, 0.019517898559570312, 0.021308422088623047, 0.02309894561767578, 0.024889469146728516, 0.02667999267578125, 0.028470516204833984, 0.03026103973388672, 0.03205156326293945, 0.03384208679199219, 0.03563261032104492, 0.037423133850097656, 0.03921365737915039, 0.041004180908203125, 0.04279470443725586, 0.044585227966308594, 0.04637575149536133, 0.04816627502441406, 0.0499567985534668, 0.05174732208251953, 0.053537845611572266, 0.055328369140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 4.0, 6.0, 11.0, 17.0, 17.0, 25.0, 32.0, 32.0, 41.0, 60.0, 74.0, 73.0, 80.0, 90.0, 73.0, 68.0, 49.0, 45.0, 36.0, 29.0, 21.0, 22.0, 18.0, 16.0, 11.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014886856079101562, -0.0014462918043136597, -0.001403898000717163, -0.0013615041971206665, -0.00131911039352417, -0.0012767165899276733, -0.0012343227863311768, -0.0011919289827346802, -0.0011495351791381836, -0.001107141375541687, -0.0010647475719451904, -0.0010223537683486938, -0.0009799599647521973, -0.0009375661611557007, -0.0008951723575592041, -0.0008527785539627075, -0.0008103847503662109, -0.0007679909467697144, -0.0007255971431732178, -0.0006832033395767212, -0.0006408095359802246, -0.000598415732383728, -0.0005560219287872314, -0.0005136281251907349, -0.0004712343215942383, -0.0004288405179977417, -0.0003864467144012451, -0.00034405291080474854, -0.00030165910720825195, -0.00025926530361175537, -0.0002168715000152588, -0.0001744776964187622, -0.00013208389282226562, -8.969008922576904e-05, -4.729628562927246e-05, -4.902482032775879e-06, 3.74913215637207e-05, 7.988512516021729e-05, 0.00012227892875671387, 0.00016467273235321045, 0.00020706653594970703, 0.0002494603395462036, 0.0002918541431427002, 0.0003342479467391968, 0.00037664175033569336, 0.00041903555393218994, 0.0004614293575286865, 0.0005038231611251831, 0.0005462169647216797, 0.0005886107683181763, 0.0006310045719146729, 0.0006733983755111694, 0.000715792179107666, 0.0007581859827041626, 0.0008005797863006592, 0.0008429735898971558, 0.0008853673934936523, 0.0009277611970901489, 0.0009701550006866455, 0.001012548804283142, 0.0010549426078796387, 0.0010973364114761353, 0.0011397302150726318, 0.0011821240186691284, 0.001224517822265625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 3.0, 7.0, 2.0, 9.0, 9.0, 20.0, 18.0, 23.0, 25.0, 29.0, 43.0, 68.0, 120.0, 342.0, 3412.0, 882491.0, 160013.0, 1301.0, 261.0, 112.0, 57.0, 38.0, 40.0, 26.0, 17.0, 16.0, 10.0, 7.0, 4.0, 11.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026042938232421875, -0.02510833740234375, -0.024173736572265625, -0.0232391357421875, -0.022304534912109375, -0.02136993408203125, -0.020435333251953125, -0.019500732421875, -0.018566131591796875, -0.01763153076171875, -0.016696929931640625, -0.0157623291015625, -0.014827728271484375, -0.01389312744140625, -0.012958526611328125, -0.01202392578125, -0.011089324951171875, -0.01015472412109375, -0.009220123291015625, -0.0082855224609375, -0.007350921630859375, -0.00641632080078125, -0.005481719970703125, -0.004547119140625, -0.003612518310546875, -0.00267791748046875, -0.001743316650390625, -0.0008087158203125, 0.000125885009765625, 0.00106048583984375, 0.001995086669921875, 0.0029296875, 0.003864288330078125, 0.00479888916015625, 0.005733489990234375, 0.0066680908203125, 0.007602691650390625, 0.00853729248046875, 0.009471893310546875, 0.010406494140625, 0.011341094970703125, 0.01227569580078125, 0.013210296630859375, 0.0141448974609375, 0.015079498291015625, 0.01601409912109375, 0.016948699951171875, 0.01788330078125, 0.018817901611328125, 0.01975250244140625, 0.020687103271484375, 0.0216217041015625, 0.022556304931640625, 0.02349090576171875, 0.024425506591796875, 0.025360107421875, 0.026294708251953125, 0.02722930908203125, 0.028163909912109375, 0.0290985107421875, 0.030033111572265625, 0.03096771240234375, 0.031902313232421875, 0.0328369140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 61.0, 951.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002530066529288888, -0.001415963633917272, -0.0003018607385456562, 0.0008122420404106379, 0.0019263450521975756, 0.0030404480639845133, 0.004154550842940807, 0.005268653854727745, 0.006382756866514683, 0.0074968598783016205, 0.008610962890088558, 0.009725065901875496, 0.010839167982339859, 0.011953271925449371, 0.013067374005913734, 0.014181477017700672, 0.01529558002948761, 0.016409682109951973, 0.017523786053061485, 0.01863788813352585, 0.01975199207663536, 0.020866094157099724, 0.021980196237564087, 0.0230943001806736, 0.024208402261137962, 0.025322504341602325, 0.026436608284711838, 0.0275507103651762, 0.028664814308285713, 0.029778916388750076, 0.03089302033185959, 0.0320071205496788, 0.033121224492788315, 0.03423532843589783, 0.03534942865371704, 0.03646353259682655, 0.037577636539936066, 0.03869174048304558, 0.03980584070086479, 0.040919944643974304, 0.042034048587083817, 0.04314815253019333, 0.04426225274801254, 0.045376356691122055, 0.04649046063423157, 0.04760456457734108, 0.048718664795160294, 0.049832768738269806, 0.05094686895608902, 0.05206097289919853, 0.053175073117017746, 0.05428917706012726, 0.05540328100323677, 0.05651738494634628, 0.0576314851641655, 0.05874558910727501, 0.05985969305038452, 0.060973796993494034, 0.06208789721131325, 0.06320200115442276, 0.06431610137224197, 0.06543020904064178, 0.066544309258461, 0.06765840947628021, 0.06877251714468002]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 20.0, 21.0, 26.0, 54.0, 69.0, 76.0, 80.0, 93.0, 102.0, 97.0, 84.0, 80.0, 49.0, 41.0, 32.0, 27.0, 18.0, 12.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0030908584594726562, -0.00302241463214159, -0.002953970804810524, -0.002885526977479458, -0.0028170831501483917, -0.0027486393228173256, -0.0026801954954862595, -0.0026117516681551933, -0.002543307840824127, -0.002474864013493061, -0.002406420186161995, -0.002337976358830929, -0.0022695325314998627, -0.0022010887041687965, -0.0021326448768377304, -0.0020642010495066643, -0.001995757222175598, -0.001927313394844532, -0.0018588695675134659, -0.0017904257401823997, -0.0017219819128513336, -0.0016535380855202675, -0.0015850942581892014, -0.0015166504308581352, -0.001448206603527069, -0.001379762776196003, -0.0013113189488649368, -0.0012428751215338707, -0.0011744312942028046, -0.0011059874668717384, -0.0010375436395406723, -0.0009690998122096062, -0.00090065598487854, -0.0008322121575474739, -0.0007637683302164078, -0.0006953245028853416, -0.0006268806755542755, -0.0005584368482232094, -0.0004899930208921432, -0.0004215491935610771, -0.000353105366230011, -0.00028466153889894485, -0.00021621771156787872, -0.0001477738842368126, -7.933005690574646e-05, -1.0886229574680328e-05, 5.75575977563858e-05, 0.00012600142508745193, 0.00019444525241851807, 0.0002628890797495842, 0.00033133290708065033, 0.00039977673441171646, 0.0004682205617427826, 0.0005366643890738487, 0.0006051082164049149, 0.000673552043735981, 0.0007419958710670471, 0.0008104396983981133, 0.0008788835257291794, 0.0009473273530602455, 0.0010157711803913116, 0.0010842150077223778, 0.001152658835053444, 0.00122110266238451, 0.0012895464897155762]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 4.0, 9.0, 2.0, 10.0, 12.0, 10.0, 23.0, 14.0, 24.0, 18.0, 31.0, 24.0, 19.0, 34.0, 39.0, 34.0, 34.0, 43.0, 46.0, 50.0, 41.0, 54.0, 51.0, 44.0, 34.0, 33.0, 33.0, 24.0, 28.0, 16.0, 25.0, 28.0, 20.0, 21.0, 11.0, 13.0, 8.0, 11.0, 1.0, 9.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.405242919921875, -3.28900146484375, -3.172760009765625, -3.0565185546875, -2.940277099609375, -2.82403564453125, -2.707794189453125, -2.591552734375, -2.475311279296875, -2.35906982421875, -2.242828369140625, -2.1265869140625, -2.010345458984375, -1.89410400390625, -1.777862548828125, -1.66162109375, -1.545379638671875, -1.42913818359375, -1.312896728515625, -1.1966552734375, -1.080413818359375, -0.96417236328125, -0.847930908203125, -0.731689453125, -0.615447998046875, -0.49920654296875, -0.382965087890625, -0.2667236328125, -0.150482177734375, -0.03424072265625, 0.082000732421875, 0.1982421875, 0.314483642578125, 0.43072509765625, 0.546966552734375, 0.6632080078125, 0.779449462890625, 0.89569091796875, 1.011932373046875, 1.128173828125, 1.244415283203125, 1.36065673828125, 1.476898193359375, 1.5931396484375, 1.709381103515625, 1.82562255859375, 1.941864013671875, 2.05810546875, 2.174346923828125, 2.29058837890625, 2.406829833984375, 2.5230712890625, 2.639312744140625, 2.75555419921875, 2.871795654296875, 2.988037109375, 3.104278564453125, 3.22052001953125, 3.336761474609375, 3.4530029296875, 3.569244384765625, 3.68548583984375, 3.801727294921875, 3.91796875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 3.0, 11.0, 9.0, 24.0, 24.0, 50.0, 63.0, 95.0, 182.0, 273.0, 403.0, 672.0, 1102.0, 1981.0, 3472.0, 6392.0, 12736.0, 25439.0, 58949.0, 178297.0, 448747.0, 192822.0, 61508.0, 26591.0, 12959.0, 6892.0, 3745.0, 2097.0, 1171.0, 721.0, 396.0, 241.0, 151.0, 112.0, 62.0, 45.0, 32.0, 31.0, 22.0, 9.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.2109375, -6.9892578125, -6.767578125, -6.5458984375, -6.32421875, -6.1025390625, -5.880859375, -5.6591796875, -5.4375, -5.2158203125, -4.994140625, -4.7724609375, -4.55078125, -4.3291015625, -4.107421875, -3.8857421875, -3.6640625, -3.4423828125, -3.220703125, -2.9990234375, -2.77734375, -2.5556640625, -2.333984375, -2.1123046875, -1.890625, -1.6689453125, -1.447265625, -1.2255859375, -1.00390625, -0.7822265625, -0.560546875, -0.3388671875, -0.1171875, 0.1044921875, 0.326171875, 0.5478515625, 0.76953125, 0.9912109375, 1.212890625, 1.4345703125, 1.65625, 1.8779296875, 2.099609375, 2.3212890625, 2.54296875, 2.7646484375, 2.986328125, 3.2080078125, 3.4296875, 3.6513671875, 3.873046875, 4.0947265625, 4.31640625, 4.5380859375, 4.759765625, 4.9814453125, 5.203125, 5.4248046875, 5.646484375, 5.8681640625, 6.08984375, 6.3115234375, 6.533203125, 6.7548828125, 6.9765625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 5.0, 8.0, 6.0, 5.0, 21.0, 15.0, 18.0, 18.0, 20.0, 20.0, 26.0, 27.0, 37.0, 43.0, 44.0, 59.0, 75.0, 126.0, 196.0, 1320.0, 261.0, 152.0, 112.0, 75.0, 64.0, 37.0, 30.0, 26.0, 28.0, 33.0, 23.0, 26.0, 15.0, 9.0, 12.0, 9.0, 11.0, 11.0, 11.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.540771484375, -9.19873046875, -8.856689453125, -8.5146484375, -8.172607421875, -7.83056640625, -7.488525390625, -7.146484375, -6.804443359375, -6.46240234375, -6.120361328125, -5.7783203125, -5.436279296875, -5.09423828125, -4.752197265625, -4.41015625, -4.068115234375, -3.72607421875, -3.384033203125, -3.0419921875, -2.699951171875, -2.35791015625, -2.015869140625, -1.673828125, -1.331787109375, -0.98974609375, -0.647705078125, -0.3056640625, 0.036376953125, 0.37841796875, 0.720458984375, 1.0625, 1.404541015625, 1.74658203125, 2.088623046875, 2.4306640625, 2.772705078125, 3.11474609375, 3.456787109375, 3.798828125, 4.140869140625, 4.48291015625, 4.824951171875, 5.1669921875, 5.509033203125, 5.85107421875, 6.193115234375, 6.53515625, 6.877197265625, 7.21923828125, 7.561279296875, 7.9033203125, 8.245361328125, 8.58740234375, 8.929443359375, 9.271484375, 9.613525390625, 9.95556640625, 10.297607421875, 10.6396484375, 10.981689453125, 11.32373046875, 11.665771484375, 12.0078125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 3.0, 9.0, 10.0, 26.0, 17.0, 24.0, 38.0, 57.0, 82.0, 125.0, 177.0, 378.0, 867.0, 2956.0, 17889.0, 363015.0, 2652274.0, 95966.0, 8586.0, 1828.0, 611.0, 293.0, 141.0, 87.0, 54.0, 52.0, 45.0, 22.0, 17.0, 13.0, 4.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.953125, -22.30322265625, -21.6533203125, -21.00341796875, -20.353515625, -19.70361328125, -19.0537109375, -18.40380859375, -17.75390625, -17.10400390625, -16.4541015625, -15.80419921875, -15.154296875, -14.50439453125, -13.8544921875, -13.20458984375, -12.5546875, -11.90478515625, -11.2548828125, -10.60498046875, -9.955078125, -9.30517578125, -8.6552734375, -8.00537109375, -7.35546875, -6.70556640625, -6.0556640625, -5.40576171875, -4.755859375, -4.10595703125, -3.4560546875, -2.80615234375, -2.15625, -1.50634765625, -0.8564453125, -0.20654296875, 0.443359375, 1.09326171875, 1.7431640625, 2.39306640625, 3.04296875, 3.69287109375, 4.3427734375, 4.99267578125, 5.642578125, 6.29248046875, 6.9423828125, 7.59228515625, 8.2421875, 8.89208984375, 9.5419921875, 10.19189453125, 10.841796875, 11.49169921875, 12.1416015625, 12.79150390625, 13.44140625, 14.09130859375, 14.7412109375, 15.39111328125, 16.041015625, 16.69091796875, 17.3408203125, 17.99072265625, 18.640625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 12.0, 22.0, 50.0, 85.0, 115.0, 139.0, 150.0, 147.0, 110.0, 72.0, 50.0, 31.0, 18.0, 7.0, 3.0], "bins": [-60.706565856933594, -59.61306381225586, -58.51956558227539, -57.426063537597656, -56.33256530761719, -55.23906326293945, -54.14556121826172, -53.05206298828125, -51.958560943603516, -50.86505889892578, -49.77156066894531, -48.67805862426758, -47.584556579589844, -46.491058349609375, -45.39755630493164, -44.30405807495117, -43.21055603027344, -42.1170539855957, -41.023555755615234, -39.9300537109375, -38.83655548095703, -37.7430534362793, -36.64955139160156, -35.556053161621094, -34.46255111694336, -33.369049072265625, -32.275550842285156, -31.182048797607422, -30.08854866027832, -28.99504852294922, -27.901546478271484, -26.808046340942383, -25.714550018310547, -24.621049880981445, -23.527549743652344, -22.43404769897461, -21.340547561645508, -20.247047424316406, -19.153545379638672, -18.06004524230957, -16.96654510498047, -15.873044967651367, -14.77954387664795, -13.686042785644531, -12.59254264831543, -11.499042510986328, -10.40554141998291, -9.312040328979492, -8.21854019165039, -7.125039577484131, -6.031538963317871, -4.938038349151611, -3.8445377349853516, -2.751037120819092, -1.657536506652832, -0.5640358924865723, 0.5294647216796875, 1.6229653358459473, 2.716465950012207, 3.809966564178467, 4.903467178344727, 5.996967792510986, 7.090468406677246, 8.183969497680664, 9.277469635009766]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 8.0, 9.0, 11.0, 13.0, 21.0, 16.0, 24.0, 31.0, 29.0, 31.0, 27.0, 28.0, 37.0, 41.0, 47.0, 46.0, 28.0, 50.0, 54.0, 47.0, 50.0, 33.0, 39.0, 33.0, 44.0, 22.0, 20.0, 21.0, 18.0, 19.0, 19.0, 7.0, 8.0, 21.0, 6.0, 11.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.46092987060547, -33.44132995605469, -32.421730041503906, -31.402130126953125, -30.382530212402344, -29.362930297851562, -28.34332847595215, -27.323728561401367, -26.304128646850586, -25.284528732299805, -24.264928817749023, -23.245328903198242, -22.225727081298828, -21.206127166748047, -20.186527252197266, -19.166927337646484, -18.147327423095703, -17.127727508544922, -16.10812759399414, -15.088526725769043, -14.068926811218262, -13.04932689666748, -12.029726028442383, -11.010126113891602, -9.99052619934082, -8.970926284790039, -7.9513258934021, -6.93172550201416, -5.912125587463379, -4.892525672912598, -3.872925281524658, -2.8533248901367188, -1.8337249755859375, -0.8141248226165771, 0.2054753303527832, 1.2250754833221436, 2.244675636291504, 3.264275550842285, 4.283875942230225, 5.303476333618164, 6.323076248168945, 7.342676162719727, 8.362276077270508, 9.381876945495605, 10.401476860046387, 11.421076774597168, 12.440677642822266, 13.460277557373047, 14.479877471923828, 15.49947738647461, 16.51907730102539, 17.538677215576172, 18.558277130126953, 19.577877044677734, 20.59747886657715, 21.61707878112793, 22.63667869567871, 23.656278610229492, 24.675878524780273, 25.695478439331055, 26.71508026123047, 27.73468017578125, 28.75428009033203, 29.773880004882812, 30.793479919433594]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 11.0, 18.0, 12.0, 8.0, 17.0, 17.0, 21.0, 29.0, 20.0, 25.0, 36.0, 34.0, 42.0, 40.0, 53.0, 37.0, 51.0, 58.0, 49.0, 48.0, 29.0, 34.0, 27.0, 33.0, 29.0, 28.0, 30.0, 18.0, 27.0, 17.0, 13.0, 10.0, 22.0, 9.0, 8.0, 6.0, 6.0, 4.0, 7.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.035614013671875, -3.91107177734375, -3.786529541015625, -3.6619873046875, -3.537445068359375, -3.41290283203125, -3.288360595703125, -3.163818359375, -3.039276123046875, -2.91473388671875, -2.790191650390625, -2.6656494140625, -2.541107177734375, -2.41656494140625, -2.292022705078125, -2.16748046875, -2.042938232421875, -1.91839599609375, -1.793853759765625, -1.6693115234375, -1.544769287109375, -1.42022705078125, -1.295684814453125, -1.171142578125, -1.046600341796875, -0.92205810546875, -0.797515869140625, -0.6729736328125, -0.548431396484375, -0.42388916015625, -0.299346923828125, -0.1748046875, -0.050262451171875, 0.07427978515625, 0.198822021484375, 0.3233642578125, 0.447906494140625, 0.57244873046875, 0.696990966796875, 0.821533203125, 0.946075439453125, 1.07061767578125, 1.195159912109375, 1.3197021484375, 1.444244384765625, 1.56878662109375, 1.693328857421875, 1.81787109375, 1.942413330078125, 2.06695556640625, 2.191497802734375, 2.3160400390625, 2.440582275390625, 2.56512451171875, 2.689666748046875, 2.814208984375, 2.938751220703125, 3.06329345703125, 3.187835693359375, 3.3123779296875, 3.436920166015625, 3.56146240234375, 3.686004638671875, 3.810546875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 17.0, 15.0, 9.0, 19.0, 22.0, 30.0, 45.0, 53.0, 75.0, 142.0, 212.0, 361.0, 748.0, 1482.0, 3365.0, 8978.0, 31787.0, 191536.0, 1580116.0, 2048505.0, 267471.0, 40742.0, 10886.0, 3931.0, 1745.0, 839.0, 408.0, 229.0, 146.0, 87.0, 83.0, 38.0, 33.0, 29.0, 24.0, 24.0, 13.0, 5.0, 10.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6875, -8.398681640625, -8.10986328125, -7.821044921875, -7.5322265625, -7.243408203125, -6.95458984375, -6.665771484375, -6.376953125, -6.088134765625, -5.79931640625, -5.510498046875, -5.2216796875, -4.932861328125, -4.64404296875, -4.355224609375, -4.06640625, -3.777587890625, -3.48876953125, -3.199951171875, -2.9111328125, -2.622314453125, -2.33349609375, -2.044677734375, -1.755859375, -1.467041015625, -1.17822265625, -0.889404296875, -0.6005859375, -0.311767578125, -0.02294921875, 0.265869140625, 0.5546875, 0.843505859375, 1.13232421875, 1.421142578125, 1.7099609375, 1.998779296875, 2.28759765625, 2.576416015625, 2.865234375, 3.154052734375, 3.44287109375, 3.731689453125, 4.0205078125, 4.309326171875, 4.59814453125, 4.886962890625, 5.17578125, 5.464599609375, 5.75341796875, 6.042236328125, 6.3310546875, 6.619873046875, 6.90869140625, 7.197509765625, 7.486328125, 7.775146484375, 8.06396484375, 8.352783203125, 8.6416015625, 8.930419921875, 9.21923828125, 9.508056640625, 9.796875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 5.0, 16.0, 12.0, 26.0, 27.0, 45.0, 55.0, 78.0, 93.0, 141.0, 215.0, 279.0, 397.0, 524.0, 573.0, 446.0, 319.0, 247.0, 148.0, 129.0, 72.0, 62.0, 40.0, 35.0, 15.0, 15.0, 14.0, 10.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.23828125, -7.006591796875, -6.77490234375, -6.543212890625, -6.3115234375, -6.079833984375, -5.84814453125, -5.616455078125, -5.384765625, -5.153076171875, -4.92138671875, -4.689697265625, -4.4580078125, -4.226318359375, -3.99462890625, -3.762939453125, -3.53125, -3.299560546875, -3.06787109375, -2.836181640625, -2.6044921875, -2.372802734375, -2.14111328125, -1.909423828125, -1.677734375, -1.446044921875, -1.21435546875, -0.982666015625, -0.7509765625, -0.519287109375, -0.28759765625, -0.055908203125, 0.17578125, 0.407470703125, 0.63916015625, 0.870849609375, 1.1025390625, 1.334228515625, 1.56591796875, 1.797607421875, 2.029296875, 2.260986328125, 2.49267578125, 2.724365234375, 2.9560546875, 3.187744140625, 3.41943359375, 3.651123046875, 3.8828125, 4.114501953125, 4.34619140625, 4.577880859375, 4.8095703125, 5.041259765625, 5.27294921875, 5.504638671875, 5.736328125, 5.968017578125, 6.19970703125, 6.431396484375, 6.6630859375, 6.894775390625, 7.12646484375, 7.358154296875, 7.58984375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 12.0, 14.0, 10.0, 12.0, 16.0, 25.0, 28.0, 48.0, 65.0, 87.0, 164.0, 218.0, 431.0, 1856.0, 53715.0, 4043571.0, 90323.0, 2389.0, 473.0, 288.0, 156.0, 101.0, 84.0, 60.0, 35.0, 28.0, 17.0, 19.0, 10.0, 9.0, 3.0, 5.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-45.125, -43.81884765625, -42.5126953125, -41.20654296875, -39.900390625, -38.59423828125, -37.2880859375, -35.98193359375, -34.67578125, -33.36962890625, -32.0634765625, -30.75732421875, -29.451171875, -28.14501953125, -26.8388671875, -25.53271484375, -24.2265625, -22.92041015625, -21.6142578125, -20.30810546875, -19.001953125, -17.69580078125, -16.3896484375, -15.08349609375, -13.77734375, -12.47119140625, -11.1650390625, -9.85888671875, -8.552734375, -7.24658203125, -5.9404296875, -4.63427734375, -3.328125, -2.02197265625, -0.7158203125, 0.59033203125, 1.896484375, 3.20263671875, 4.5087890625, 5.81494140625, 7.12109375, 8.42724609375, 9.7333984375, 11.03955078125, 12.345703125, 13.65185546875, 14.9580078125, 16.26416015625, 17.5703125, 18.87646484375, 20.1826171875, 21.48876953125, 22.794921875, 24.10107421875, 25.4072265625, 26.71337890625, 28.01953125, 29.32568359375, 30.6318359375, 31.93798828125, 33.244140625, 34.55029296875, 35.8564453125, 37.16259765625, 38.46875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 20.0, 53.0, 92.0, 138.0, 177.0, 168.0, 149.0, 105.0, 55.0, 24.0, 13.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.600791931152344, -17.844432830810547, -16.08807373046875, -14.33171558380127, -12.575357437133789, -10.818998336791992, -9.062639236450195, -7.306281089782715, -5.549921989440918, -3.7935633659362793, -2.0372045040130615, -0.28084564208984375, 1.475512981414795, 3.2318716049194336, 4.9882307052612305, 6.744588851928711, 8.500947952270508, 10.257307052612305, 12.013665199279785, 13.770024299621582, 15.526382446289062, 17.28274154663086, 19.039100646972656, 20.795459747314453, 22.55181884765625, 24.308177947998047, 26.064537048339844, 27.82089614868164, 29.577253341674805, 31.3336124420166, 33.08997344970703, 34.84632873535156, 36.60268783569336, 38.359046936035156, 40.11540603637695, 41.87176513671875, 43.62812423706055, 45.384483337402344, 47.140838623046875, 48.89719772338867, 50.65355682373047, 52.409915924072266, 54.16627502441406, 55.92263412475586, 57.678993225097656, 59.43534851074219, 61.19171142578125, 62.94806671142578, 64.70442962646484, 66.46078491210938, 68.21714782714844, 69.97350311279297, 71.72986602783203, 73.48622131347656, 75.24258422851562, 76.99893951416016, 78.75529479980469, 80.51165008544922, 82.26801300048828, 84.02436828613281, 85.78073120117188, 87.5370864868164, 89.29344940185547, 91.0498046875, 92.80616760253906]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 10.0, 4.0, 7.0, 9.0, 8.0, 13.0, 24.0, 15.0, 23.0, 30.0, 28.0, 27.0, 28.0, 42.0, 38.0, 27.0, 35.0, 32.0, 33.0, 31.0, 32.0, 37.0, 35.0, 39.0, 41.0, 39.0, 29.0, 42.0, 25.0, 37.0, 25.0, 21.0, 17.0, 14.0, 12.0, 13.0, 13.0, 10.0, 10.0, 6.0, 12.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 5.0, 1.0], "bins": [-22.695520401000977, -22.04084587097168, -21.386171340942383, -20.73149871826172, -20.076824188232422, -19.422149658203125, -18.767475128173828, -18.11280059814453, -17.458126068115234, -16.803451538085938, -16.14877700805664, -15.49410343170166, -14.83942985534668, -14.184755325317383, -13.530080795288086, -12.875406265258789, -12.220733642578125, -11.566059112548828, -10.911385536193848, -10.25671100616455, -9.60203742980957, -8.947362899780273, -8.292688369750977, -7.638014316558838, -6.983340263366699, -6.3286662101745605, -5.673992156982422, -5.019317626953125, -4.364643573760986, -3.7099695205688477, -3.05529522895813, -2.400620937347412, -1.7459487915039062, -1.091274619102478, -0.4366004467010498, 0.21807372570037842, 0.8727478981018066, 1.5274219512939453, 2.182096242904663, 2.836770534515381, 3.4914445877075195, 4.146118640899658, 4.800792694091797, 5.455467224121094, 6.110141277313232, 6.764815330505371, 7.419489860534668, 8.074163436889648, 8.728837966918945, 9.383512496948242, 10.038186073303223, 10.69286060333252, 11.3475341796875, 12.002208709716797, 12.656883239746094, 13.31155776977539, 13.966231346130371, 14.620905876159668, 15.275579452514648, 15.930253982543945, 16.584928512573242, 17.239601135253906, 17.894275665283203, 18.5489501953125, 19.203624725341797]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 8.0, 2.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 12.0, 11.0, 19.0, 26.0, 24.0, 19.0, 38.0, 23.0, 38.0, 44.0, 39.0, 53.0, 38.0, 38.0, 37.0, 42.0, 45.0, 33.0, 45.0, 29.0, 33.0, 28.0, 24.0, 23.0, 25.0, 25.0, 13.0, 17.0, 17.0, 22.0, 17.0, 15.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.939453125, -3.82269287109375, -3.7059326171875, -3.58917236328125, -3.472412109375, -3.35565185546875, -3.2388916015625, -3.12213134765625, -3.00537109375, -2.88861083984375, -2.7718505859375, -2.65509033203125, -2.538330078125, -2.42156982421875, -2.3048095703125, -2.18804931640625, -2.0712890625, -1.95452880859375, -1.8377685546875, -1.72100830078125, -1.604248046875, -1.48748779296875, -1.3707275390625, -1.25396728515625, -1.13720703125, -1.02044677734375, -0.9036865234375, -0.78692626953125, -0.670166015625, -0.55340576171875, -0.4366455078125, -0.31988525390625, -0.203125, -0.08636474609375, 0.0303955078125, 0.14715576171875, 0.263916015625, 0.38067626953125, 0.4974365234375, 0.61419677734375, 0.73095703125, 0.84771728515625, 0.9644775390625, 1.08123779296875, 1.197998046875, 1.31475830078125, 1.4315185546875, 1.54827880859375, 1.6650390625, 1.78179931640625, 1.8985595703125, 2.01531982421875, 2.132080078125, 2.24884033203125, 2.3656005859375, 2.48236083984375, 2.59912109375, 2.71588134765625, 2.8326416015625, 2.94940185546875, 3.066162109375, 3.18292236328125, 3.2996826171875, 3.41644287109375, 3.533203125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 8.0, 12.0, 12.0, 15.0, 32.0, 41.0, 70.0, 122.0, 168.0, 209.0, 354.0, 515.0, 822.0, 1201.0, 1686.0, 2515.0, 3845.0, 5872.0, 8390.0, 12648.0, 19356.0, 30151.0, 49108.0, 85605.0, 177136.0, 305986.0, 144983.0, 74906.0, 43469.0, 27036.0, 17387.0, 11355.0, 7623.0, 5209.0, 3494.0, 2367.0, 1602.0, 1083.0, 707.0, 486.0, 334.0, 209.0, 134.0, 95.0, 64.0, 57.0, 27.0, 21.0, 13.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.170654296875, -0.1650371551513672, -0.15942001342773438, -0.15380287170410156, -0.14818572998046875, -0.14256858825683594, -0.13695144653320312, -0.1313343048095703, -0.1257171630859375, -0.12010002136230469, -0.11448287963867188, -0.10886573791503906, -0.10324859619140625, -0.09763145446777344, -0.09201431274414062, -0.08639717102050781, -0.080780029296875, -0.07516288757324219, -0.06954574584960938, -0.06392860412597656, -0.05831146240234375, -0.05269432067871094, -0.047077178955078125, -0.04146003723144531, -0.0358428955078125, -0.030225753784179688, -0.024608612060546875, -0.018991470336914062, -0.01337432861328125, -0.0077571868896484375, -0.002140045166015625, 0.0034770965576171875, 0.00909423828125, 0.014711380004882812, 0.020328521728515625, 0.025945663452148438, 0.03156280517578125, 0.03717994689941406, 0.042797088623046875, 0.04841423034667969, 0.0540313720703125, 0.05964851379394531, 0.06526565551757812, 0.07088279724121094, 0.07649993896484375, 0.08211708068847656, 0.08773422241210938, 0.09335136413574219, 0.098968505859375, 0.10458564758300781, 0.11020278930664062, 0.11581993103027344, 0.12143707275390625, 0.12705421447753906, 0.13267135620117188, 0.1382884979248047, 0.1439056396484375, 0.1495227813720703, 0.15513992309570312, 0.16075706481933594, 0.16637420654296875, 0.17199134826660156, 0.17760848999023438, 0.1832256317138672, 0.1888427734375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 5.0, 9.0, 8.0, 10.0, 15.0, 15.0, 14.0, 19.0, 19.0, 26.0, 25.0, 23.0, 33.0, 37.0, 31.0, 33.0, 33.0, 36.0, 40.0, 40.0, 1061.0, 34.0, 30.0, 42.0, 56.0, 34.0, 30.0, 24.0, 26.0, 20.0, 21.0, 32.0, 18.0, 16.0, 13.0, 17.0, 10.0, 7.0, 6.0, 6.0, 10.0, 4.0, 5.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.822265625, -2.72857666015625, -2.6348876953125, -2.54119873046875, -2.447509765625, -2.35382080078125, -2.2601318359375, -2.16644287109375, -2.07275390625, -1.97906494140625, -1.8853759765625, -1.79168701171875, -1.697998046875, -1.60430908203125, -1.5106201171875, -1.41693115234375, -1.3232421875, -1.22955322265625, -1.1358642578125, -1.04217529296875, -0.948486328125, -0.85479736328125, -0.7611083984375, -0.66741943359375, -0.57373046875, -0.48004150390625, -0.3863525390625, -0.29266357421875, -0.198974609375, -0.10528564453125, -0.0115966796875, 0.08209228515625, 0.17578125, 0.26947021484375, 0.3631591796875, 0.45684814453125, 0.550537109375, 0.64422607421875, 0.7379150390625, 0.83160400390625, 0.92529296875, 1.01898193359375, 1.1126708984375, 1.20635986328125, 1.300048828125, 1.39373779296875, 1.4874267578125, 1.58111572265625, 1.6748046875, 1.76849365234375, 1.8621826171875, 1.95587158203125, 2.049560546875, 2.14324951171875, 2.2369384765625, 2.33062744140625, 2.42431640625, 2.51800537109375, 2.6116943359375, 2.70538330078125, 2.799072265625, 2.89276123046875, 2.9864501953125, 3.08013916015625, 3.173828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 1.0, 6.0, 7.0, 12.0, 22.0, 13.0, 36.0, 48.0, 67.0, 95.0, 156.0, 211.0, 342.0, 475.0, 698.0, 965.0, 1561.0, 2176.0, 3274.0, 4992.0, 7461.0, 11118.0, 17063.0, 26337.0, 41901.0, 68749.0, 123315.0, 1250471.0, 259724.0, 107324.0, 61036.0, 37490.0, 23842.0, 15728.0, 9995.0, 6704.0, 4494.0, 2921.0, 1995.0, 1435.0, 904.0, 624.0, 402.0, 300.0, 188.0, 137.0, 95.0, 73.0, 52.0, 29.0, 22.0, 26.0, 7.0, 9.0, 3.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.060638427734375, -0.058675289154052734, -0.05671215057373047, -0.0547490119934082, -0.05278587341308594, -0.05082273483276367, -0.048859596252441406, -0.04689645767211914, -0.044933319091796875, -0.04297018051147461, -0.041007041931152344, -0.03904390335083008, -0.03708076477050781, -0.03511762619018555, -0.03315448760986328, -0.031191349029541016, -0.02922821044921875, -0.027265071868896484, -0.02530193328857422, -0.023338794708251953, -0.021375656127929688, -0.019412517547607422, -0.017449378967285156, -0.01548624038696289, -0.013523101806640625, -0.01155996322631836, -0.009596824645996094, -0.007633686065673828, -0.0056705474853515625, -0.003707408905029297, -0.0017442703247070312, 0.00021886825561523438, 0.0021820068359375, 0.004145145416259766, 0.006108283996582031, 0.008071422576904297, 0.010034561157226562, 0.011997699737548828, 0.013960838317871094, 0.01592397689819336, 0.017887115478515625, 0.01985025405883789, 0.021813392639160156, 0.023776531219482422, 0.025739669799804688, 0.027702808380126953, 0.02966594696044922, 0.031629085540771484, 0.03359222412109375, 0.035555362701416016, 0.03751850128173828, 0.03948163986206055, 0.04144477844238281, 0.04340791702270508, 0.045371055603027344, 0.04733419418334961, 0.049297332763671875, 0.05126047134399414, 0.053223609924316406, 0.05518674850463867, 0.05714988708496094, 0.0591130256652832, 0.06107616424560547, 0.06303930282592773, 0.06500244140625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 9.0, 6.0, 4.0, 5.0, 10.0, 9.0, 17.0, 18.0, 27.0, 21.0, 29.0, 29.0, 49.0, 47.0, 56.0, 57.0, 76.0, 92.0, 70.0, 62.0, 43.0, 44.0, 38.0, 26.0, 29.0, 24.0, 15.0, 16.0, 9.0, 10.0, 13.0, 8.0, 7.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0008101463317871094, -0.0007843151688575745, -0.0007584840059280396, -0.0007326528429985046, -0.0007068216800689697, -0.0006809905171394348, -0.0006551593542098999, -0.000629328191280365, -0.0006034970283508301, -0.0005776658654212952, -0.0005518347024917603, -0.0005260035395622253, -0.0005001723766326904, -0.0004743412137031555, -0.0004485100507736206, -0.0004226788878440857, -0.0003968477249145508, -0.00037101656198501587, -0.00034518539905548096, -0.00031935423612594604, -0.00029352307319641113, -0.0002676919102668762, -0.0002418607473373413, -0.0002160295844078064, -0.00019019842147827148, -0.00016436725854873657, -0.00013853609561920166, -0.00011270493268966675, -8.687376976013184e-05, -6.104260683059692e-05, -3.521144390106201e-05, -9.3802809715271e-06, 1.6450881958007812e-05, 4.2282044887542725e-05, 6.811320781707764e-05, 9.394437074661255e-05, 0.00011977553367614746, 0.00014560669660568237, 0.00017143785953521729, 0.0001972690224647522, 0.0002231001853942871, 0.000248931348323822, 0.00027476251125335693, 0.00030059367418289185, 0.00032642483711242676, 0.00035225600004196167, 0.0003780871629714966, 0.0004039183259010315, 0.0004297494888305664, 0.0004555806517601013, 0.00048141181468963623, 0.0005072429776191711, 0.0005330741405487061, 0.000558905303478241, 0.0005847364664077759, 0.0006105676293373108, 0.0006363987922668457, 0.0006622299551963806, 0.0006880611181259155, 0.0007138922810554504, 0.0007397234439849854, 0.0007655546069145203, 0.0007913857698440552, 0.0008172169327735901, 0.000843048095703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 3.0, 5.0, 6.0, 15.0, 8.0, 7.0, 20.0, 13.0, 24.0, 33.0, 29.0, 41.0, 70.0, 129.0, 275.0, 2429.0, 931986.0, 112052.0, 814.0, 181.0, 109.0, 74.0, 38.0, 32.0, 30.0, 26.0, 16.0, 21.0, 14.0, 6.0, 4.0, 4.0, 7.0, 8.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0198822021484375, -0.01927661895751953, -0.018671035766601562, -0.018065452575683594, -0.017459869384765625, -0.016854286193847656, -0.016248703002929688, -0.01564311981201172, -0.01503753662109375, -0.014431953430175781, -0.013826370239257812, -0.013220787048339844, -0.012615203857421875, -0.012009620666503906, -0.011404037475585938, -0.010798454284667969, -0.01019287109375, -0.009587287902832031, -0.008981704711914062, -0.008376121520996094, -0.007770538330078125, -0.007164955139160156, -0.0065593719482421875, -0.005953788757324219, -0.00534820556640625, -0.004742622375488281, -0.0041370391845703125, -0.0035314559936523438, -0.002925872802734375, -0.0023202896118164062, -0.0017147064208984375, -0.0011091232299804688, -0.0005035400390625, 0.00010204315185546875, 0.0007076263427734375, 0.0013132095336914062, 0.001918792724609375, 0.0025243759155273438, 0.0031299591064453125, 0.0037355422973632812, 0.00434112548828125, 0.004946708679199219, 0.0055522918701171875, 0.006157875061035156, 0.006763458251953125, 0.007369041442871094, 0.007974624633789062, 0.008580207824707031, 0.009185791015625, 0.009791374206542969, 0.010396957397460938, 0.011002540588378906, 0.011608123779296875, 0.012213706970214844, 0.012819290161132812, 0.013424873352050781, 0.01403045654296875, 0.014636039733886719, 0.015241622924804688, 0.015847206115722656, 0.016452789306640625, 0.017058372497558594, 0.017663955688476562, 0.01826953887939453, 0.0188751220703125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 940.0, 67.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034326589666306973, -0.003038111375644803, -0.002643563784658909, -0.002249015960842371, -0.0018544683698564768, -0.0014599207788705826, -0.0010653729550540447, -0.0006708253640681505, -0.0002762777730822563, 0.0001182698761112988, 0.0005128175253048539, 0.00090736523270607, 0.0013019128236919641, 0.0016964604146778584, 0.002091008238494396, 0.0024855558294802904, 0.0028801034204661846, 0.003274651011452079, 0.003669198602437973, 0.004063746426254511, 0.004458294250071049, 0.004852841608226299, 0.005247389432042837, 0.005641937255859375, 0.0060364846140146255, 0.006431032437831163, 0.006825579795986414, 0.007220127619802952, 0.007614674977958202, 0.008009223267436028, 0.008403770625591278, 0.008798317983746529, 0.00919286534190178, 0.00958741270005703, 0.009981960989534855, 0.010376508347690105, 0.010771055705845356, 0.011165603995323181, 0.011560151353478432, 0.011954698711633682, 0.012349246069788933, 0.012743793427944183, 0.013138341717422009, 0.013532889075577259, 0.01392743643373251, 0.014321984723210335, 0.014716532081365585, 0.015111079439520836, 0.015505627728998661, 0.015900176018476486, 0.016294723376631737, 0.016689270734786987, 0.017083818092942238, 0.01747836545109749, 0.017872914671897888, 0.01826746203005314, 0.01866200938820839, 0.01905655674636364, 0.01945110410451889, 0.01984565332531929, 0.02024020068347454, 0.02063474804162979, 0.021029295399785042, 0.021423842757940292, 0.021818390116095543]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 7.0, 5.0, 2.0, 8.0, 5.0, 2.0, 8.0, 13.0, 24.0, 21.0, 25.0, 26.0, 24.0, 27.0, 42.0, 40.0, 43.0, 44.0, 54.0, 49.0, 50.0, 42.0, 66.0, 68.0, 50.0, 42.0, 42.0, 30.0, 23.0, 32.0, 20.0, 19.0, 19.0, 12.0, 9.0, 3.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009229183197021484, -0.0008987244218587875, -0.0008745305240154266, -0.0008503366261720657, -0.0008261427283287048, -0.0008019488304853439, -0.000777754932641983, -0.0007535610347986221, -0.0007293671369552612, -0.0007051732391119003, -0.0006809793412685394, -0.0006567854434251785, -0.0006325915455818176, -0.0006083976477384567, -0.0005842037498950958, -0.0005600098520517349, -0.000535815954208374, -0.0005116220563650131, -0.0004874281585216522, -0.0004632342606782913, -0.0004390403628349304, -0.0004148464649915695, -0.0003906525671482086, -0.0003664586693048477, -0.0003422647714614868, -0.0003180708736181259, -0.000293876975774765, -0.0002696830779314041, -0.0002454891800880432, -0.0002212952822446823, -0.0001971013844013214, -0.0001729074865579605, -0.0001487135887145996, -0.0001245196908712387, -0.00010032579302787781, -7.61318951845169e-05, -5.1937997341156006e-05, -2.7744099497795105e-05, -3.550201654434204e-06, 2.0643696188926697e-05, 4.48375940322876e-05, 6.90314918756485e-05, 9.32253897190094e-05, 0.0001174192875623703, 0.0001416131854057312, 0.0001658070832490921, 0.000190000981092453, 0.0002141948789358139, 0.0002383887767791748, 0.0002625826746225357, 0.0002867765724658966, 0.0003109704703092575, 0.0003351643681526184, 0.0003593582659959793, 0.0003835521638393402, 0.0004077460616827011, 0.000431939959526062, 0.0004561338573694229, 0.0004803277552127838, 0.0005045216530561447, 0.0005287155508995056, 0.0005529094487428665, 0.0005771033465862274, 0.0006012972444295883, 0.0006254911422729492]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 8.0, 2.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 12.0, 11.0, 19.0, 26.0, 24.0, 19.0, 38.0, 23.0, 38.0, 44.0, 39.0, 53.0, 38.0, 38.0, 37.0, 42.0, 45.0, 33.0, 45.0, 29.0, 33.0, 28.0, 24.0, 23.0, 25.0, 25.0, 13.0, 17.0, 17.0, 22.0, 17.0, 15.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.939453125, -3.82269287109375, -3.7059326171875, -3.58917236328125, -3.472412109375, -3.35565185546875, -3.2388916015625, -3.12213134765625, -3.00537109375, -2.88861083984375, -2.7718505859375, -2.65509033203125, -2.538330078125, -2.42156982421875, -2.3048095703125, -2.18804931640625, -2.0712890625, -1.95452880859375, -1.8377685546875, -1.72100830078125, -1.604248046875, -1.48748779296875, -1.3707275390625, -1.25396728515625, -1.13720703125, -1.02044677734375, -0.9036865234375, -0.78692626953125, -0.670166015625, -0.55340576171875, -0.4366455078125, -0.31988525390625, -0.203125, -0.08636474609375, 0.0303955078125, 0.14715576171875, 0.263916015625, 0.38067626953125, 0.4974365234375, 0.61419677734375, 0.73095703125, 0.84771728515625, 0.9644775390625, 1.08123779296875, 1.197998046875, 1.31475830078125, 1.4315185546875, 1.54827880859375, 1.6650390625, 1.78179931640625, 1.8985595703125, 2.01531982421875, 2.132080078125, 2.24884033203125, 2.3656005859375, 2.48236083984375, 2.59912109375, 2.71588134765625, 2.8326416015625, 2.94940185546875, 3.066162109375, 3.18292236328125, 3.2996826171875, 3.41644287109375, 3.533203125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 11.0, 12.0, 19.0, 32.0, 37.0, 62.0, 91.0, 128.0, 232.0, 442.0, 682.0, 1142.0, 1971.0, 3624.0, 7217.0, 15408.0, 35202.0, 93157.0, 350008.0, 372525.0, 97460.0, 36383.0, 16312.0, 7617.0, 3892.0, 2030.0, 1125.0, 645.0, 388.0, 228.0, 175.0, 103.0, 62.0, 50.0, 31.0, 20.0, 8.0, 9.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.39300537109375, -6.1727294921875, -5.95245361328125, -5.732177734375, -5.51190185546875, -5.2916259765625, -5.07135009765625, -4.85107421875, -4.63079833984375, -4.4105224609375, -4.19024658203125, -3.969970703125, -3.74969482421875, -3.5294189453125, -3.30914306640625, -3.0888671875, -2.86859130859375, -2.6483154296875, -2.42803955078125, -2.207763671875, -1.98748779296875, -1.7672119140625, -1.54693603515625, -1.32666015625, -1.10638427734375, -0.8861083984375, -0.66583251953125, -0.445556640625, -0.22528076171875, -0.0050048828125, 0.21527099609375, 0.435546875, 0.65582275390625, 0.8760986328125, 1.09637451171875, 1.316650390625, 1.53692626953125, 1.7572021484375, 1.97747802734375, 2.19775390625, 2.41802978515625, 2.6383056640625, 2.85858154296875, 3.078857421875, 3.29913330078125, 3.5194091796875, 3.73968505859375, 3.9599609375, 4.18023681640625, 4.4005126953125, 4.62078857421875, 4.841064453125, 5.06134033203125, 5.2816162109375, 5.50189208984375, 5.72216796875, 5.94244384765625, 6.1627197265625, 6.38299560546875, 6.603271484375, 6.82354736328125, 7.0438232421875, 7.26409912109375, 7.484375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 12.0, 10.0, 9.0, 8.0, 16.0, 11.0, 22.0, 18.0, 34.0, 37.0, 30.0, 36.0, 42.0, 43.0, 58.0, 55.0, 113.0, 191.0, 1405.0, 262.0, 126.0, 78.0, 66.0, 54.0, 38.0, 27.0, 46.0, 24.0, 28.0, 29.0, 21.0, 17.0, 13.0, 17.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.5703125, -12.1861572265625, -11.802001953125, -11.4178466796875, -11.03369140625, -10.6495361328125, -10.265380859375, -9.8812255859375, -9.4970703125, -9.1129150390625, -8.728759765625, -8.3446044921875, -7.96044921875, -7.5762939453125, -7.192138671875, -6.8079833984375, -6.423828125, -6.0396728515625, -5.655517578125, -5.2713623046875, -4.88720703125, -4.5030517578125, -4.118896484375, -3.7347412109375, -3.3505859375, -2.9664306640625, -2.582275390625, -2.1981201171875, -1.81396484375, -1.4298095703125, -1.045654296875, -0.6614990234375, -0.27734375, 0.1068115234375, 0.490966796875, 0.8751220703125, 1.25927734375, 1.6434326171875, 2.027587890625, 2.4117431640625, 2.7958984375, 3.1800537109375, 3.564208984375, 3.9483642578125, 4.33251953125, 4.7166748046875, 5.100830078125, 5.4849853515625, 5.869140625, 6.2532958984375, 6.637451171875, 7.0216064453125, 7.40576171875, 7.7899169921875, 8.174072265625, 8.5582275390625, 8.9423828125, 9.3265380859375, 9.710693359375, 10.0948486328125, 10.47900390625, 10.8631591796875, 11.247314453125, 11.6314697265625, 12.015625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 10.0, 9.0, 25.0, 22.0, 27.0, 26.0, 45.0, 44.0, 70.0, 102.0, 159.0, 357.0, 775.0, 2267.0, 8140.0, 57964.0, 1946268.0, 1076769.0, 42504.0, 6701.0, 1889.0, 690.0, 278.0, 159.0, 94.0, 65.0, 50.0, 37.0, 33.0, 23.0, 18.0, 16.0, 10.0, 10.0, 8.0, 7.0, 3.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.921875, -19.27783203125, -18.6337890625, -17.98974609375, -17.345703125, -16.70166015625, -16.0576171875, -15.41357421875, -14.76953125, -14.12548828125, -13.4814453125, -12.83740234375, -12.193359375, -11.54931640625, -10.9052734375, -10.26123046875, -9.6171875, -8.97314453125, -8.3291015625, -7.68505859375, -7.041015625, -6.39697265625, -5.7529296875, -5.10888671875, -4.46484375, -3.82080078125, -3.1767578125, -2.53271484375, -1.888671875, -1.24462890625, -0.6005859375, 0.04345703125, 0.6875, 1.33154296875, 1.9755859375, 2.61962890625, 3.263671875, 3.90771484375, 4.5517578125, 5.19580078125, 5.83984375, 6.48388671875, 7.1279296875, 7.77197265625, 8.416015625, 9.06005859375, 9.7041015625, 10.34814453125, 10.9921875, 11.63623046875, 12.2802734375, 12.92431640625, 13.568359375, 14.21240234375, 14.8564453125, 15.50048828125, 16.14453125, 16.78857421875, 17.4326171875, 18.07666015625, 18.720703125, 19.36474609375, 20.0087890625, 20.65283203125, 21.296875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [4.0, 41.0, 190.0, 412.0, 294.0, 71.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.550666809082031, -8.441230773925781, -5.331793785095215, -2.2223567962646484, 0.8870792388916016, 3.9965152740478516, 7.105953216552734, 10.215389251708984, 13.324825286865234, 16.434261322021484, 19.543697357177734, 22.653135299682617, 25.762571334838867, 28.872007369995117, 31.9814453125, 35.09088134765625, 38.2003173828125, 41.30975341796875, 44.419189453125, 47.52862548828125, 50.6380615234375, 53.74749755859375, 56.856937408447266, 59.966373443603516, 63.075809478759766, 66.18524932861328, 69.29468536376953, 72.40412139892578, 75.51355743408203, 78.62299346923828, 81.73242950439453, 84.84186553955078, 87.9512939453125, 91.06072998046875, 94.170166015625, 97.27960205078125, 100.3890380859375, 103.49847412109375, 106.60791015625, 109.71734619140625, 112.8267822265625, 115.93621826171875, 119.045654296875, 122.15509033203125, 125.2645263671875, 128.37396240234375, 131.4833984375, 134.59283447265625, 137.7022705078125, 140.81170654296875, 143.921142578125, 147.03057861328125, 150.1400146484375, 153.24945068359375, 156.35888671875, 159.46832275390625, 162.57777404785156, 165.6872100830078, 168.79664611816406, 171.9060821533203, 175.01551818847656, 178.1249542236328, 181.23439025878906, 184.3438262939453, 187.45326232910156]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 8.0, 4.0, 4.0, 15.0, 12.0, 17.0, 12.0, 16.0, 16.0, 20.0, 27.0, 30.0, 31.0, 28.0, 25.0, 50.0, 46.0, 41.0, 40.0, 46.0, 48.0, 41.0, 38.0, 45.0, 33.0, 38.0, 35.0, 22.0, 23.0, 25.0, 30.0, 18.0, 22.0, 10.0, 19.0, 13.0, 15.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.978919982910156, -37.775390625, -36.571861267089844, -35.36833572387695, -34.1648063659668, -32.96127700805664, -31.757749557495117, -30.554222106933594, -29.350692749023438, -28.14716339111328, -26.943635940551758, -25.740108489990234, -24.536579132080078, -23.333049774169922, -22.1295223236084, -20.925994873046875, -19.72246551513672, -18.518936157226562, -17.31540870666504, -16.111881256103516, -14.90835189819336, -13.70482349395752, -12.50129508972168, -11.29776668548584, -10.09423828125, -8.89070987701416, -7.68718147277832, -6.4836530685424805, -5.280124664306641, -4.076596260070801, -2.873067855834961, -1.669539451599121, -0.4660148620605469, 0.737513542175293, 1.9410419464111328, 3.1445703506469727, 4.3480987548828125, 5.551627159118652, 6.755155563354492, 7.958683967590332, 9.162212371826172, 10.365740776062012, 11.569269180297852, 12.772797584533691, 13.976325988769531, 15.179854393005371, 16.38338279724121, 17.586910247802734, 18.79043960571289, 19.993968963623047, 21.19749641418457, 22.401023864746094, 23.60455322265625, 24.808082580566406, 26.01161003112793, 27.215137481689453, 28.41866683959961, 29.622196197509766, 30.82572364807129, 32.02925109863281, 33.23278045654297, 34.436309814453125, 35.63983917236328, 36.84336471557617, 38.04689407348633]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 8.0, 7.0, 8.0, 9.0, 5.0, 10.0, 15.0, 25.0, 15.0, 15.0, 26.0, 32.0, 33.0, 33.0, 34.0, 30.0, 45.0, 45.0, 55.0, 41.0, 39.0, 50.0, 24.0, 48.0, 36.0, 22.0, 20.0, 32.0, 24.0, 30.0, 25.0, 18.0, 16.0, 22.0, 23.0, 16.0, 11.0, 8.0, 13.0, 5.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.3359375, -4.212860107421875, -4.08978271484375, -3.966705322265625, -3.8436279296875, -3.720550537109375, -3.59747314453125, -3.474395751953125, -3.351318359375, -3.228240966796875, -3.10516357421875, -2.982086181640625, -2.8590087890625, -2.735931396484375, -2.61285400390625, -2.489776611328125, -2.36669921875, -2.243621826171875, -2.12054443359375, -1.997467041015625, -1.8743896484375, -1.751312255859375, -1.62823486328125, -1.505157470703125, -1.382080078125, -1.259002685546875, -1.13592529296875, -1.012847900390625, -0.8897705078125, -0.766693115234375, -0.64361572265625, -0.520538330078125, -0.3974609375, -0.274383544921875, -0.15130615234375, -0.028228759765625, 0.0948486328125, 0.217926025390625, 0.34100341796875, 0.464080810546875, 0.587158203125, 0.710235595703125, 0.83331298828125, 0.956390380859375, 1.0794677734375, 1.202545166015625, 1.32562255859375, 1.448699951171875, 1.57177734375, 1.694854736328125, 1.81793212890625, 1.941009521484375, 2.0640869140625, 2.187164306640625, 2.31024169921875, 2.433319091796875, 2.556396484375, 2.679473876953125, 2.80255126953125, 2.925628662109375, 3.0487060546875, 3.171783447265625, 3.29486083984375, 3.417938232421875, 3.541015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 11.0, 13.0, 11.0, 26.0, 29.0, 30.0, 61.0, 76.0, 139.0, 227.0, 503.0, 1390.0, 4773.0, 28063.0, 527902.0, 3220112.0, 381677.0, 22859.0, 4111.0, 1179.0, 440.0, 222.0, 129.0, 93.0, 46.0, 40.0, 31.0, 20.0, 19.0, 7.0, 12.0, 6.0, 3.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.26416015625, -11.8173828125, -11.37060546875, -10.923828125, -10.47705078125, -10.0302734375, -9.58349609375, -9.13671875, -8.68994140625, -8.2431640625, -7.79638671875, -7.349609375, -6.90283203125, -6.4560546875, -6.00927734375, -5.5625, -5.11572265625, -4.6689453125, -4.22216796875, -3.775390625, -3.32861328125, -2.8818359375, -2.43505859375, -1.98828125, -1.54150390625, -1.0947265625, -0.64794921875, -0.201171875, 0.24560546875, 0.6923828125, 1.13916015625, 1.5859375, 2.03271484375, 2.4794921875, 2.92626953125, 3.373046875, 3.81982421875, 4.2666015625, 4.71337890625, 5.16015625, 5.60693359375, 6.0537109375, 6.50048828125, 6.947265625, 7.39404296875, 7.8408203125, 8.28759765625, 8.734375, 9.18115234375, 9.6279296875, 10.07470703125, 10.521484375, 10.96826171875, 11.4150390625, 11.86181640625, 12.30859375, 12.75537109375, 13.2021484375, 13.64892578125, 14.095703125, 14.54248046875, 14.9892578125, 15.43603515625, 15.8828125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 11.0, 12.0, 20.0, 32.0, 42.0, 30.0, 71.0, 113.0, 174.0, 243.0, 352.0, 535.0, 668.0, 515.0, 403.0, 248.0, 180.0, 130.0, 90.0, 62.0, 44.0, 25.0, 31.0, 12.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.515625, -10.2432861328125, -9.970947265625, -9.6986083984375, -9.42626953125, -9.1539306640625, -8.881591796875, -8.6092529296875, -8.3369140625, -8.0645751953125, -7.792236328125, -7.5198974609375, -7.24755859375, -6.9752197265625, -6.702880859375, -6.4305419921875, -6.158203125, -5.8858642578125, -5.613525390625, -5.3411865234375, -5.06884765625, -4.7965087890625, -4.524169921875, -4.2518310546875, -3.9794921875, -3.7071533203125, -3.434814453125, -3.1624755859375, -2.89013671875, -2.6177978515625, -2.345458984375, -2.0731201171875, -1.80078125, -1.5284423828125, -1.256103515625, -0.9837646484375, -0.71142578125, -0.4390869140625, -0.166748046875, 0.1055908203125, 0.3779296875, 0.6502685546875, 0.922607421875, 1.1949462890625, 1.46728515625, 1.7396240234375, 2.011962890625, 2.2843017578125, 2.556640625, 2.8289794921875, 3.101318359375, 3.3736572265625, 3.64599609375, 3.9183349609375, 4.190673828125, 4.4630126953125, 4.7353515625, 5.0076904296875, 5.280029296875, 5.5523681640625, 5.82470703125, 6.0970458984375, 6.369384765625, 6.6417236328125, 6.9140625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 2.0, 7.0, 16.0, 33.0, 34.0, 59.0, 97.0, 143.0, 260.0, 524.0, 1540.0, 15132.0, 3219881.0, 947011.0, 7383.0, 1176.0, 435.0, 211.0, 112.0, 64.0, 45.0, 43.0, 20.0, 15.0, 10.0, 5.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.734375, -28.585693359375, -27.43701171875, -26.288330078125, -25.1396484375, -23.990966796875, -22.84228515625, -21.693603515625, -20.544921875, -19.396240234375, -18.24755859375, -17.098876953125, -15.9501953125, -14.801513671875, -13.65283203125, -12.504150390625, -11.35546875, -10.206787109375, -9.05810546875, -7.909423828125, -6.7607421875, -5.612060546875, -4.46337890625, -3.314697265625, -2.166015625, -1.017333984375, 0.13134765625, 1.280029296875, 2.4287109375, 3.577392578125, 4.72607421875, 5.874755859375, 7.0234375, 8.172119140625, 9.32080078125, 10.469482421875, 11.6181640625, 12.766845703125, 13.91552734375, 15.064208984375, 16.212890625, 17.361572265625, 18.51025390625, 19.658935546875, 20.8076171875, 21.956298828125, 23.10498046875, 24.253662109375, 25.40234375, 26.551025390625, 27.69970703125, 28.848388671875, 29.9970703125, 31.145751953125, 32.29443359375, 33.443115234375, 34.591796875, 35.740478515625, 36.88916015625, 38.037841796875, 39.1865234375, 40.335205078125, 41.48388671875, 42.632568359375, 43.78125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 65.0, 224.0, 365.0, 250.0, 84.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75772476196289, -38.14714431762695, -34.53656005859375, -30.925979614257812, -27.315399169921875, -23.704818725585938, -20.094236373901367, -16.483654022216797, -12.87307357788086, -9.262492179870605, -5.651910781860352, -2.0413293838500977, 1.5692520141601562, 5.179832458496094, 8.790414810180664, 12.400997161865234, 16.011577606201172, 19.62215805053711, 23.23274040222168, 26.84332275390625, 30.453903198242188, 34.064483642578125, 37.67506408691406, 41.285648345947266, 44.8962287902832, 48.50680923461914, 52.117393493652344, 55.72797393798828, 59.33855438232422, 62.949134826660156, 66.5597152709961, 70.17030334472656, 73.7808837890625, 77.39146423339844, 81.00204467773438, 84.61262512207031, 88.22320556640625, 91.83378601074219, 95.44437408447266, 99.0549545288086, 102.66553497314453, 106.27611541748047, 109.8866958618164, 113.49727630615234, 117.10786437988281, 120.71844482421875, 124.32902526855469, 127.93960571289062, 131.55018615722656, 135.1607666015625, 138.77134704589844, 142.38192749023438, 145.9925079345703, 149.60308837890625, 153.2136688232422, 156.82424926757812, 160.43484497070312, 164.04542541503906, 167.656005859375, 171.26658630371094, 174.87716674804688, 178.4877471923828, 182.09832763671875, 185.70892333984375, 189.31948852539062]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 7.0, 6.0, 8.0, 10.0, 14.0, 12.0, 18.0, 12.0, 16.0, 24.0, 34.0, 30.0, 21.0, 35.0, 37.0, 31.0, 42.0, 47.0, 46.0, 43.0, 35.0, 35.0, 36.0, 42.0, 34.0, 32.0, 35.0, 27.0, 38.0, 33.0, 23.0, 23.0, 8.0, 17.0, 23.0, 10.0, 10.0, 14.0, 9.0, 2.0, 5.0, 3.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.64120101928711, -23.8935489654541, -23.145896911621094, -22.39824676513672, -21.65059471130371, -20.902942657470703, -20.155290603637695, -19.407638549804688, -18.659988403320312, -17.912336349487305, -17.164684295654297, -16.417034149169922, -15.669382095336914, -14.921730041503906, -14.174077987670898, -13.426426887512207, -12.6787748336792, -11.931122779846191, -11.1834716796875, -10.435819625854492, -9.6881685256958, -8.940516471862793, -8.192865371704102, -7.445213317871094, -6.697561740875244, -5.9499101638793945, -5.202258586883545, -4.454607009887695, -3.7069551944732666, -2.959303617477417, -2.2116518020629883, -1.4640002250671387, -0.7163486480712891, 0.03130298852920532, 0.7789546251296997, 1.5266063213348389, 2.2742578983306885, 3.021909475326538, 3.769561290740967, 4.517212867736816, 5.264864444732666, 6.012516021728516, 6.760167598724365, 7.507819175720215, 8.255471229553223, 9.003122329711914, 9.750774383544922, 10.49842643737793, 11.246077537536621, 11.993729591369629, 12.74138069152832, 13.489032745361328, 14.23668384552002, 14.984335899353027, 15.731986999511719, 16.479639053344727, 17.227291107177734, 17.974943161010742, 18.72259521484375, 19.470245361328125, 20.217897415161133, 20.96554946899414, 21.71320152282715, 22.460853576660156, 23.20850372314453]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 8.0, 8.0, 2.0, 8.0, 15.0, 19.0, 19.0, 18.0, 28.0, 28.0, 28.0, 31.0, 39.0, 46.0, 48.0, 31.0, 45.0, 42.0, 46.0, 45.0, 38.0, 42.0, 33.0, 35.0, 32.0, 33.0, 36.0, 27.0, 22.0, 15.0, 23.0, 13.0, 20.0, 19.0, 6.0, 13.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44921875, -4.320526123046875, -4.19183349609375, -4.063140869140625, -3.9344482421875, -3.805755615234375, -3.67706298828125, -3.548370361328125, -3.419677734375, -3.290985107421875, -3.16229248046875, -3.033599853515625, -2.9049072265625, -2.776214599609375, -2.64752197265625, -2.518829345703125, -2.39013671875, -2.261444091796875, -2.13275146484375, -2.004058837890625, -1.8753662109375, -1.746673583984375, -1.61798095703125, -1.489288330078125, -1.360595703125, -1.231903076171875, -1.10321044921875, -0.974517822265625, -0.8458251953125, -0.717132568359375, -0.58843994140625, -0.459747314453125, -0.3310546875, -0.202362060546875, -0.07366943359375, 0.055023193359375, 0.1837158203125, 0.312408447265625, 0.44110107421875, 0.569793701171875, 0.698486328125, 0.827178955078125, 0.95587158203125, 1.084564208984375, 1.2132568359375, 1.341949462890625, 1.47064208984375, 1.599334716796875, 1.72802734375, 1.856719970703125, 1.98541259765625, 2.114105224609375, 2.2427978515625, 2.371490478515625, 2.50018310546875, 2.628875732421875, 2.757568359375, 2.886260986328125, 3.01495361328125, 3.143646240234375, 3.2723388671875, 3.401031494140625, 3.52972412109375, 3.658416748046875, 3.787109375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 14.0, 10.0, 16.0, 28.0, 45.0, 59.0, 110.0, 117.0, 210.0, 298.0, 475.0, 714.0, 1012.0, 1613.0, 2412.0, 3592.0, 5607.0, 8718.0, 13382.0, 20489.0, 33493.0, 56108.0, 101231.0, 208453.0, 277830.0, 131057.0, 70448.0, 40382.0, 25410.0, 15671.0, 10186.0, 6549.0, 4367.0, 2937.0, 1857.0, 1234.0, 783.0, 525.0, 362.0, 239.0, 170.0, 116.0, 71.0, 41.0, 40.0, 22.0, 18.0, 11.0, 6.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.1827392578125, -0.17723464965820312, -0.17173004150390625, -0.16622543334960938, -0.1607208251953125, -0.15521621704101562, -0.14971160888671875, -0.14420700073242188, -0.138702392578125, -0.13319778442382812, -0.12769317626953125, -0.12218856811523438, -0.1166839599609375, -0.11117935180664062, -0.10567474365234375, -0.10017013549804688, -0.09466552734375, -0.08916091918945312, -0.08365631103515625, -0.07815170288085938, -0.0726470947265625, -0.06714248657226562, -0.06163787841796875, -0.056133270263671875, -0.050628662109375, -0.045124053955078125, -0.03961944580078125, -0.034114837646484375, -0.0286102294921875, -0.023105621337890625, -0.01760101318359375, -0.012096405029296875, -0.006591796875, -0.001087188720703125, 0.00441741943359375, 0.009922027587890625, 0.0154266357421875, 0.020931243896484375, 0.02643585205078125, 0.031940460205078125, 0.037445068359375, 0.042949676513671875, 0.04845428466796875, 0.053958892822265625, 0.0594635009765625, 0.06496810913085938, 0.07047271728515625, 0.07597732543945312, 0.08148193359375, 0.08698654174804688, 0.09249114990234375, 0.09799575805664062, 0.1035003662109375, 0.10900497436523438, 0.11450958251953125, 0.12001419067382812, 0.125518798828125, 0.13102340698242188, 0.13652801513671875, 0.14203262329101562, 0.1475372314453125, 0.15304183959960938, 0.15854644775390625, 0.16405105590820312, 0.1695556640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 4.0, 8.0, 5.0, 8.0, 10.0, 8.0, 16.0, 18.0, 16.0, 12.0, 22.0, 22.0, 25.0, 29.0, 36.0, 45.0, 26.0, 39.0, 48.0, 43.0, 27.0, 30.0, 1062.0, 34.0, 42.0, 38.0, 34.0, 34.0, 42.0, 30.0, 33.0, 29.0, 20.0, 24.0, 23.0, 13.0, 13.0, 8.0, 13.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.4722900390625, -3.356689453125, -3.2410888671875, -3.12548828125, -3.0098876953125, -2.894287109375, -2.7786865234375, -2.6630859375, -2.5474853515625, -2.431884765625, -2.3162841796875, -2.20068359375, -2.0850830078125, -1.969482421875, -1.8538818359375, -1.73828125, -1.6226806640625, -1.507080078125, -1.3914794921875, -1.27587890625, -1.1602783203125, -1.044677734375, -0.9290771484375, -0.8134765625, -0.6978759765625, -0.582275390625, -0.4666748046875, -0.35107421875, -0.2354736328125, -0.119873046875, -0.0042724609375, 0.111328125, 0.2269287109375, 0.342529296875, 0.4581298828125, 0.57373046875, 0.6893310546875, 0.804931640625, 0.9205322265625, 1.0361328125, 1.1517333984375, 1.267333984375, 1.3829345703125, 1.49853515625, 1.6141357421875, 1.729736328125, 1.8453369140625, 1.9609375, 2.0765380859375, 2.192138671875, 2.3077392578125, 2.42333984375, 2.5389404296875, 2.654541015625, 2.7701416015625, 2.8857421875, 3.0013427734375, 3.116943359375, 3.2325439453125, 3.34814453125, 3.4637451171875, 3.579345703125, 3.6949462890625, 3.810546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 10.0, 11.0, 10.0, 18.0, 31.0, 63.0, 79.0, 100.0, 141.0, 217.0, 283.0, 394.0, 632.0, 851.0, 1354.0, 1786.0, 2623.0, 3815.0, 5628.0, 8140.0, 11710.0, 17467.0, 26299.0, 40533.0, 64305.0, 111075.0, 248333.0, 1223109.0, 123900.0, 71448.0, 44280.0, 28608.0, 18970.0, 12884.0, 8700.0, 5894.0, 4047.0, 2885.0, 1987.0, 1372.0, 969.0, 659.0, 465.0, 321.0, 221.0, 162.0, 94.0, 78.0, 56.0, 33.0, 26.0, 20.0, 9.0, 5.0, 7.0, 6.0, 5.0, 4.0], "bins": [-0.06500244140625, -0.06303834915161133, -0.061074256896972656, -0.059110164642333984, -0.05714607238769531, -0.05518198013305664, -0.05321788787841797, -0.0512537956237793, -0.049289703369140625, -0.04732561111450195, -0.04536151885986328, -0.04339742660522461, -0.04143333435058594, -0.039469242095947266, -0.037505149841308594, -0.03554105758666992, -0.03357696533203125, -0.03161287307739258, -0.029648780822753906, -0.027684688568115234, -0.025720596313476562, -0.02375650405883789, -0.02179241180419922, -0.019828319549560547, -0.017864227294921875, -0.015900135040283203, -0.013936042785644531, -0.01197195053100586, -0.010007858276367188, -0.008043766021728516, -0.006079673767089844, -0.004115581512451172, -0.0021514892578125, -0.00018739700317382812, 0.0017766952514648438, 0.0037407875061035156, 0.0057048797607421875, 0.007668972015380859, 0.009633064270019531, 0.011597156524658203, 0.013561248779296875, 0.015525341033935547, 0.01748943328857422, 0.01945352554321289, 0.021417617797851562, 0.023381710052490234, 0.025345802307128906, 0.027309894561767578, 0.02927398681640625, 0.031238079071044922, 0.033202171325683594, 0.035166263580322266, 0.03713035583496094, 0.03909444808959961, 0.04105854034423828, 0.04302263259887695, 0.044986724853515625, 0.0469508171081543, 0.04891490936279297, 0.05087900161743164, 0.05284309387207031, 0.054807186126708984, 0.056771278381347656, 0.05873537063598633, 0.060699462890625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 4.0, 4.0, 4.0, 5.0, 6.0, 15.0, 9.0, 8.0, 17.0, 17.0, 21.0, 38.0, 52.0, 66.0, 88.0, 127.0, 124.0, 85.0, 70.0, 44.0, 40.0, 25.0, 19.0, 15.0, 16.0, 12.0, 13.0, 10.0, 6.0, 5.0, 7.0, 7.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.00091552734375, -0.0008915364742279053, -0.0008675456047058105, -0.0008435547351837158, -0.0008195638656616211, -0.0007955729961395264, -0.0007715821266174316, -0.0007475912570953369, -0.0007236003875732422, -0.0006996095180511475, -0.0006756186485290527, -0.000651627779006958, -0.0006276369094848633, -0.0006036460399627686, -0.0005796551704406738, -0.0005556643009185791, -0.0005316734313964844, -0.0005076825618743896, -0.0004836916923522949, -0.0004597008228302002, -0.00043570995330810547, -0.00041171908378601074, -0.000387728214263916, -0.0003637373447418213, -0.00033974647521972656, -0.00031575560569763184, -0.0002917647361755371, -0.0002677738666534424, -0.00024378299713134766, -0.00021979212760925293, -0.0001958012580871582, -0.00017181038856506348, -0.00014781951904296875, -0.00012382864952087402, -9.98377799987793e-05, -7.584691047668457e-05, -5.1856040954589844e-05, -2.7865171432495117e-05, -3.874301910400391e-06, 2.0116567611694336e-05, 4.410743713378906e-05, 6.809830665588379e-05, 9.208917617797852e-05, 0.00011608004570007324, 0.00014007091522216797, 0.0001640617847442627, 0.00018805265426635742, 0.00021204352378845215, 0.00023603439331054688, 0.0002600252628326416, 0.00028401613235473633, 0.00030800700187683105, 0.0003319978713989258, 0.0003559887409210205, 0.00037997961044311523, 0.00040397047996520996, 0.0004279613494873047, 0.0004519522190093994, 0.00047594308853149414, 0.0004999339580535889, 0.0005239248275756836, 0.0005479156970977783, 0.000571906566619873, 0.0005958974361419678, 0.0006198883056640625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 8.0, 5.0, 6.0, 5.0, 12.0, 12.0, 14.0, 16.0, 15.0, 22.0, 36.0, 61.0, 69.0, 197.0, 943.0, 931711.0, 114467.0, 512.0, 157.0, 85.0, 49.0, 37.0, 20.0, 15.0, 7.0, 12.0, 11.0, 8.0, 7.0, 3.0, 4.0, 5.0, 8.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015228271484375, -0.014639616012573242, -0.014050960540771484, -0.013462305068969727, -0.012873649597167969, -0.012284994125366211, -0.011696338653564453, -0.011107683181762695, -0.010519027709960938, -0.00993037223815918, -0.009341716766357422, -0.008753061294555664, -0.008164405822753906, -0.0075757503509521484, -0.006987094879150391, -0.006398439407348633, -0.005809783935546875, -0.005221128463745117, -0.004632472991943359, -0.0040438175201416016, -0.0034551620483398438, -0.002866506576538086, -0.002277851104736328, -0.0016891956329345703, -0.0011005401611328125, -0.0005118846893310547, 7.677078247070312e-05, 0.0006654262542724609, 0.0012540817260742188, 0.0018427371978759766, 0.0024313926696777344, 0.003020048141479492, 0.00360870361328125, 0.004197359085083008, 0.004786014556884766, 0.0053746700286865234, 0.005963325500488281, 0.006551980972290039, 0.007140636444091797, 0.007729291915893555, 0.008317947387695312, 0.00890660285949707, 0.009495258331298828, 0.010083913803100586, 0.010672569274902344, 0.011261224746704102, 0.01184988021850586, 0.012438535690307617, 0.013027191162109375, 0.013615846633911133, 0.01420450210571289, 0.014793157577514648, 0.015381813049316406, 0.015970468521118164, 0.016559123992919922, 0.01714777946472168, 0.017736434936523438, 0.018325090408325195, 0.018913745880126953, 0.01950240135192871, 0.02009105682373047, 0.020679712295532227, 0.021268367767333984, 0.021857023239135742, 0.0224456787109375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 72.0, 884.0, 61.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002409297041594982, -0.0022169805597513914, -0.002024663845077157, -0.0018323473632335663, -0.001640030648559332, -0.0014477141667157412, -0.0012553975684568286, -0.001063080970197916, -0.0008707643719390035, -0.0006784477736800909, -0.0004861312045250088, -0.0002938146353699267, -0.00010149803711101413, 9.081856114789844e-05, 0.0002831351011991501, 0.00047545169945806265, 0.0006677682977169752, 0.0008600848959758878, 0.0010524014942348003, 0.001244717976078391, 0.0014370346907526255, 0.0016293511725962162, 0.0018216677708551288, 0.0020139843691140413, 0.002206300850957632, 0.002398617332801223, 0.002590934047475457, 0.002783250529319048, 0.0029755672439932823, 0.003167883725836873, 0.003360200207680464, 0.003552516922354698, 0.0037448336370289326, 0.003937150351703167, 0.004129466600716114, 0.0043217833153903484, 0.004514100030064583, 0.004706416744738817, 0.004898732993751764, 0.005091049708425999, 0.005283366423100233, 0.0054756831377744675, 0.0056679993867874146, 0.005860316101461649, 0.006052632816135883, 0.006244949530810118, 0.006437265779823065, 0.006629582494497299, 0.006821898743510246, 0.007014215458184481, 0.007206531707197428, 0.007398848421871662, 0.0075911651365458965, 0.007783481851220131, 0.007975798100233078, 0.008168114349246025, 0.008360431529581547, 0.008552747778594494, 0.008745064958930016, 0.008937381207942963, 0.00912969745695591, 0.009322014637291431, 0.009514330886304379, 0.0097066480666399, 0.009898964315652847]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 10.0, 19.0, 15.0, 16.0, 23.0, 25.0, 25.0, 24.0, 32.0, 39.0, 39.0, 38.0, 38.0, 42.0, 45.0, 51.0, 46.0, 40.0, 39.0, 43.0, 37.0, 36.0, 35.0, 27.0, 35.0, 21.0, 23.0, 12.0, 10.0, 19.0, 15.0, 14.0, 10.0, 5.0, 9.0, 2.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004904270172119141, -0.0004765978083014488, -0.0004627685993909836, -0.00044893939048051834, -0.0004351101815700531, -0.00042128097265958786, -0.0004074517637491226, -0.0003936225548386574, -0.00037979334592819214, -0.0003659641370177269, -0.00035213492810726166, -0.0003383057191967964, -0.0003244765102863312, -0.00031064730137586594, -0.0002968180924654007, -0.00028298888355493546, -0.0002691596746444702, -0.000255330465734005, -0.00024150125682353973, -0.0002276720479130745, -0.00021384283900260925, -0.000200013630092144, -0.00018618442118167877, -0.00017235521227121353, -0.0001585260033607483, -0.00014469679445028305, -0.0001308675855398178, -0.00011703837662935257, -0.00010320916771888733, -8.937995880842209e-05, -7.555074989795685e-05, -6.172154098749161e-05, -4.789233207702637e-05, -3.406312316656113e-05, -2.0233914256095886e-05, -6.404705345630646e-06, 7.424503564834595e-06, 2.1253712475299835e-05, 3.5082921385765076e-05, 4.8912130296230316e-05, 6.274133920669556e-05, 7.65705481171608e-05, 9.039975702762604e-05, 0.00010422896593809128, 0.00011805817484855652, 0.00013188738375902176, 0.000145716592669487, 0.00015954580157995224, 0.00017337501049041748, 0.00018720421940088272, 0.00020103342831134796, 0.0002148626372218132, 0.00022869184613227844, 0.00024252105504274368, 0.0002563502639532089, 0.00027017947286367416, 0.0002840086817741394, 0.00029783789068460464, 0.0003116670995950699, 0.0003254963085055351, 0.00033932551741600037, 0.0003531547263264656, 0.00036698393523693085, 0.0003808131441473961, 0.00039464235305786133]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 8.0, 8.0, 2.0, 8.0, 15.0, 19.0, 19.0, 18.0, 28.0, 28.0, 28.0, 31.0, 39.0, 46.0, 48.0, 31.0, 45.0, 42.0, 46.0, 45.0, 38.0, 42.0, 33.0, 35.0, 32.0, 33.0, 36.0, 27.0, 22.0, 15.0, 23.0, 13.0, 20.0, 19.0, 6.0, 13.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44921875, -4.320526123046875, -4.19183349609375, -4.063140869140625, -3.9344482421875, -3.805755615234375, -3.67706298828125, -3.548370361328125, -3.419677734375, -3.290985107421875, -3.16229248046875, -3.033599853515625, -2.9049072265625, -2.776214599609375, -2.64752197265625, -2.518829345703125, -2.39013671875, -2.261444091796875, -2.13275146484375, -2.004058837890625, -1.8753662109375, -1.746673583984375, -1.61798095703125, -1.489288330078125, -1.360595703125, -1.231903076171875, -1.10321044921875, -0.974517822265625, -0.8458251953125, -0.717132568359375, -0.58843994140625, -0.459747314453125, -0.3310546875, -0.202362060546875, -0.07366943359375, 0.055023193359375, 0.1837158203125, 0.312408447265625, 0.44110107421875, 0.569793701171875, 0.698486328125, 0.827178955078125, 0.95587158203125, 1.084564208984375, 1.2132568359375, 1.341949462890625, 1.47064208984375, 1.599334716796875, 1.72802734375, 1.856719970703125, 1.98541259765625, 2.114105224609375, 2.2427978515625, 2.371490478515625, 2.50018310546875, 2.628875732421875, 2.757568359375, 2.886260986328125, 3.01495361328125, 3.143646240234375, 3.2723388671875, 3.401031494140625, 3.52972412109375, 3.658416748046875, 3.787109375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 10.0, 14.0, 27.0, 44.0, 57.0, 81.0, 140.0, 195.0, 290.0, 467.0, 694.0, 1078.0, 1615.0, 2686.0, 4119.0, 6863.0, 10796.0, 17771.0, 28542.0, 48818.0, 93650.0, 210939.0, 300369.0, 148193.0, 70398.0, 38848.0, 23248.0, 14204.0, 9056.0, 5638.0, 3548.0, 2202.0, 1398.0, 881.0, 536.0, 383.0, 255.0, 178.0, 114.0, 71.0, 46.0, 32.0, 21.0, 14.0, 7.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-4.828125, -4.68310546875, -4.5380859375, -4.39306640625, -4.248046875, -4.10302734375, -3.9580078125, -3.81298828125, -3.66796875, -3.52294921875, -3.3779296875, -3.23291015625, -3.087890625, -2.94287109375, -2.7978515625, -2.65283203125, -2.5078125, -2.36279296875, -2.2177734375, -2.07275390625, -1.927734375, -1.78271484375, -1.6376953125, -1.49267578125, -1.34765625, -1.20263671875, -1.0576171875, -0.91259765625, -0.767578125, -0.62255859375, -0.4775390625, -0.33251953125, -0.1875, -0.04248046875, 0.1025390625, 0.24755859375, 0.392578125, 0.53759765625, 0.6826171875, 0.82763671875, 0.97265625, 1.11767578125, 1.2626953125, 1.40771484375, 1.552734375, 1.69775390625, 1.8427734375, 1.98779296875, 2.1328125, 2.27783203125, 2.4228515625, 2.56787109375, 2.712890625, 2.85791015625, 3.0029296875, 3.14794921875, 3.29296875, 3.43798828125, 3.5830078125, 3.72802734375, 3.873046875, 4.01806640625, 4.1630859375, 4.30810546875, 4.453125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 4.0, 5.0, 6.0, 9.0, 5.0, 16.0, 13.0, 12.0, 9.0, 11.0, 26.0, 23.0, 32.0, 37.0, 29.0, 44.0, 38.0, 54.0, 67.0, 81.0, 147.0, 211.0, 1346.0, 197.0, 127.0, 63.0, 75.0, 56.0, 43.0, 41.0, 37.0, 29.0, 16.0, 18.0, 25.0, 11.0, 10.0, 14.0, 14.0, 13.0, 4.0, 5.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.5078125, -10.1380615234375, -9.768310546875, -9.3985595703125, -9.02880859375, -8.6590576171875, -8.289306640625, -7.9195556640625, -7.5498046875, -7.1800537109375, -6.810302734375, -6.4405517578125, -6.07080078125, -5.7010498046875, -5.331298828125, -4.9615478515625, -4.591796875, -4.2220458984375, -3.852294921875, -3.4825439453125, -3.11279296875, -2.7430419921875, -2.373291015625, -2.0035400390625, -1.6337890625, -1.2640380859375, -0.894287109375, -0.5245361328125, -0.15478515625, 0.2149658203125, 0.584716796875, 0.9544677734375, 1.32421875, 1.6939697265625, 2.063720703125, 2.4334716796875, 2.80322265625, 3.1729736328125, 3.542724609375, 3.9124755859375, 4.2822265625, 4.6519775390625, 5.021728515625, 5.3914794921875, 5.76123046875, 6.1309814453125, 6.500732421875, 6.8704833984375, 7.240234375, 7.6099853515625, 7.979736328125, 8.3494873046875, 8.71923828125, 9.0889892578125, 9.458740234375, 9.8284912109375, 10.1982421875, 10.5679931640625, 10.937744140625, 11.3074951171875, 11.67724609375, 12.0469970703125, 12.416748046875, 12.7864990234375, 13.15625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 5.0, 3.0, 4.0, 11.0, 5.0, 12.0, 7.0, 18.0, 15.0, 20.0, 33.0, 42.0, 51.0, 57.0, 93.0, 110.0, 186.0, 330.0, 644.0, 1719.0, 6042.0, 26518.0, 153274.0, 1776731.0, 1049072.0, 103653.0, 19510.0, 4646.0, 1391.0, 536.0, 274.0, 165.0, 143.0, 98.0, 67.0, 51.0, 29.0, 28.0, 23.0, 18.0, 13.0, 11.0, 11.0, 15.0, 6.0, 8.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.546875, -13.15869140625, -12.7705078125, -12.38232421875, -11.994140625, -11.60595703125, -11.2177734375, -10.82958984375, -10.44140625, -10.05322265625, -9.6650390625, -9.27685546875, -8.888671875, -8.50048828125, -8.1123046875, -7.72412109375, -7.3359375, -6.94775390625, -6.5595703125, -6.17138671875, -5.783203125, -5.39501953125, -5.0068359375, -4.61865234375, -4.23046875, -3.84228515625, -3.4541015625, -3.06591796875, -2.677734375, -2.28955078125, -1.9013671875, -1.51318359375, -1.125, -0.73681640625, -0.3486328125, 0.03955078125, 0.427734375, 0.81591796875, 1.2041015625, 1.59228515625, 1.98046875, 2.36865234375, 2.7568359375, 3.14501953125, 3.533203125, 3.92138671875, 4.3095703125, 4.69775390625, 5.0859375, 5.47412109375, 5.8623046875, 6.25048828125, 6.638671875, 7.02685546875, 7.4150390625, 7.80322265625, 8.19140625, 8.57958984375, 8.9677734375, 9.35595703125, 9.744140625, 10.13232421875, 10.5205078125, 10.90869140625, 11.296875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 10.0, 14.0, 34.0, 35.0, 58.0, 86.0, 103.0, 124.0, 113.0, 120.0, 93.0, 77.0, 58.0, 30.0, 23.0, 9.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.431642532348633, -19.52145767211914, -18.61127471923828, -17.70108985900879, -16.79090690612793, -15.880722045898438, -14.970538139343262, -14.060354232788086, -13.15017032623291, -12.239986419677734, -11.329802513122559, -10.419618606567383, -9.50943374633789, -8.599250793457031, -7.689065933227539, -6.778882026672363, -5.8686981201171875, -4.958514213562012, -4.048330307006836, -3.138145923614502, -2.227962017059326, -1.3177781105041504, -0.4075937271118164, 0.5025901794433594, 1.4127740859985352, 2.322957992553711, 3.233142137527466, 4.143326282501221, 5.0535101890563965, 5.963694095611572, 6.873878479003906, 7.784062385559082, 8.694244384765625, 9.6044282913208, 10.514612197875977, 11.424797058105469, 12.334980010986328, 13.24516487121582, 14.155348777770996, 15.065532684326172, 15.975716590881348, 16.885900497436523, 17.796085357666016, 18.706268310546875, 19.616453170776367, 20.526636123657227, 21.43682098388672, 22.347003936767578, 23.25718879699707, 24.167373657226562, 25.077556610107422, 25.987741470336914, 26.897924423217773, 27.808109283447266, 28.718292236328125, 29.628477096557617, 30.53866195678711, 31.4488468170166, 32.359031677246094, 33.26921463012695, 34.17939758300781, 35.08958053588867, 35.9997673034668, 36.909950256347656, 37.820133209228516]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 9.0, 9.0, 11.0, 11.0, 15.0, 17.0, 23.0, 23.0, 26.0, 23.0, 31.0, 31.0, 46.0, 45.0, 34.0, 37.0, 51.0, 51.0, 52.0, 44.0, 33.0, 43.0, 34.0, 43.0, 44.0, 25.0, 19.0, 30.0, 15.0, 27.0, 13.0, 16.0, 12.0, 14.0, 9.0, 2.0, 11.0, 6.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.04414367675781, -32.93817901611328, -31.832218170166016, -30.726255416870117, -29.62029266357422, -28.51432991027832, -27.408367156982422, -26.302404403686523, -25.196441650390625, -24.090478897094727, -22.984516143798828, -21.87855339050293, -20.77259063720703, -19.666627883911133, -18.560665130615234, -17.454702377319336, -16.348739624023438, -15.242776870727539, -14.13681411743164, -13.030851364135742, -11.924888610839844, -10.818925857543945, -9.712963104248047, -8.607000350952148, -7.50103759765625, -6.395074844360352, -5.289112091064453, -4.183149337768555, -3.0771865844726562, -1.9712238311767578, -0.8652610778808594, 0.24070167541503906, 1.3466682434082031, 2.4526309967041016, 3.55859375, 4.664556503295898, 5.770519256591797, 6.876482009887695, 7.982444763183594, 9.088407516479492, 10.19437026977539, 11.300333023071289, 12.406295776367188, 13.512258529663086, 14.618221282958984, 15.724184036254883, 16.83014678955078, 17.93610954284668, 19.042072296142578, 20.148035049438477, 21.253997802734375, 22.359960556030273, 23.465923309326172, 24.57188606262207, 25.67784881591797, 26.783811569213867, 27.889774322509766, 28.995737075805664, 30.101699829101562, 31.20766258239746, 32.31362533569336, 33.419586181640625, 34.525550842285156, 35.63151550292969, 36.73747634887695]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 5.0, 7.0, 16.0, 15.0, 13.0, 19.0, 19.0, 20.0, 18.0, 36.0, 46.0, 33.0, 38.0, 42.0, 42.0, 42.0, 40.0, 42.0, 38.0, 46.0, 35.0, 39.0, 35.0, 37.0, 28.0, 30.0, 22.0, 30.0, 24.0, 26.0, 13.0, 15.0, 14.0, 19.0, 7.0, 6.0, 4.0, 6.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-4.6953125, -4.564361572265625, -4.43341064453125, -4.302459716796875, -4.1715087890625, -4.040557861328125, -3.90960693359375, -3.778656005859375, -3.647705078125, -3.516754150390625, -3.38580322265625, -3.254852294921875, -3.1239013671875, -2.992950439453125, -2.86199951171875, -2.731048583984375, -2.60009765625, -2.469146728515625, -2.33819580078125, -2.207244873046875, -2.0762939453125, -1.945343017578125, -1.81439208984375, -1.683441162109375, -1.552490234375, -1.421539306640625, -1.29058837890625, -1.159637451171875, -1.0286865234375, -0.897735595703125, -0.76678466796875, -0.635833740234375, -0.5048828125, -0.373931884765625, -0.24298095703125, -0.112030029296875, 0.0189208984375, 0.149871826171875, 0.28082275390625, 0.411773681640625, 0.542724609375, 0.673675537109375, 0.80462646484375, 0.935577392578125, 1.0665283203125, 1.197479248046875, 1.32843017578125, 1.459381103515625, 1.59033203125, 1.721282958984375, 1.85223388671875, 1.983184814453125, 2.1141357421875, 2.245086669921875, 2.37603759765625, 2.506988525390625, 2.637939453125, 2.768890380859375, 2.89984130859375, 3.030792236328125, 3.1617431640625, 3.292694091796875, 3.42364501953125, 3.554595947265625, 3.685546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 11.0, 12.0, 14.0, 22.0, 33.0, 42.0, 65.0, 59.0, 127.0, 184.0, 289.0, 493.0, 964.0, 2076.0, 5440.0, 20010.0, 116945.0, 1016475.0, 2528107.0, 429394.0, 54856.0, 11300.0, 3715.0, 1589.0, 824.0, 445.0, 225.0, 145.0, 115.0, 78.0, 54.0, 43.0, 25.0, 14.0, 18.0, 17.0, 3.0, 7.0, 11.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-10.6875, -10.384765625, -10.08203125, -9.779296875, -9.4765625, -9.173828125, -8.87109375, -8.568359375, -8.265625, -7.962890625, -7.66015625, -7.357421875, -7.0546875, -6.751953125, -6.44921875, -6.146484375, -5.84375, -5.541015625, -5.23828125, -4.935546875, -4.6328125, -4.330078125, -4.02734375, -3.724609375, -3.421875, -3.119140625, -2.81640625, -2.513671875, -2.2109375, -1.908203125, -1.60546875, -1.302734375, -1.0, -0.697265625, -0.39453125, -0.091796875, 0.2109375, 0.513671875, 0.81640625, 1.119140625, 1.421875, 1.724609375, 2.02734375, 2.330078125, 2.6328125, 2.935546875, 3.23828125, 3.541015625, 3.84375, 4.146484375, 4.44921875, 4.751953125, 5.0546875, 5.357421875, 5.66015625, 5.962890625, 6.265625, 6.568359375, 6.87109375, 7.173828125, 7.4765625, 7.779296875, 8.08203125, 8.384765625, 8.6875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 14.0, 24.0, 18.0, 31.0, 45.0, 72.0, 117.0, 167.0, 253.0, 381.0, 519.0, 613.0, 545.0, 395.0, 292.0, 162.0, 127.0, 76.0, 62.0, 41.0, 28.0, 25.0, 19.0, 14.0, 7.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.953125, -8.6866455078125, -8.420166015625, -8.1536865234375, -7.88720703125, -7.6207275390625, -7.354248046875, -7.0877685546875, -6.8212890625, -6.5548095703125, -6.288330078125, -6.0218505859375, -5.75537109375, -5.4888916015625, -5.222412109375, -4.9559326171875, -4.689453125, -4.4229736328125, -4.156494140625, -3.8900146484375, -3.62353515625, -3.3570556640625, -3.090576171875, -2.8240966796875, -2.5576171875, -2.2911376953125, -2.024658203125, -1.7581787109375, -1.49169921875, -1.2252197265625, -0.958740234375, -0.6922607421875, -0.42578125, -0.1593017578125, 0.107177734375, 0.3736572265625, 0.64013671875, 0.9066162109375, 1.173095703125, 1.4395751953125, 1.7060546875, 1.9725341796875, 2.239013671875, 2.5054931640625, 2.77197265625, 3.0384521484375, 3.304931640625, 3.5714111328125, 3.837890625, 4.1043701171875, 4.370849609375, 4.6373291015625, 4.90380859375, 5.1702880859375, 5.436767578125, 5.7032470703125, 5.9697265625, 6.2362060546875, 6.502685546875, 6.7691650390625, 7.03564453125, 7.3021240234375, 7.568603515625, 7.8350830078125, 8.1015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 18.0, 13.0, 23.0, 41.0, 49.0, 74.0, 103.0, 228.0, 386.0, 1093.0, 7105.0, 302912.0, 3806578.0, 70754.0, 3380.0, 740.0, 345.0, 163.0, 105.0, 46.0, 30.0, 30.0, 16.0, 15.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.265625, -28.268310546875, -27.27099609375, -26.273681640625, -25.2763671875, -24.279052734375, -23.28173828125, -22.284423828125, -21.287109375, -20.289794921875, -19.29248046875, -18.295166015625, -17.2978515625, -16.300537109375, -15.30322265625, -14.305908203125, -13.30859375, -12.311279296875, -11.31396484375, -10.316650390625, -9.3193359375, -8.322021484375, -7.32470703125, -6.327392578125, -5.330078125, -4.332763671875, -3.33544921875, -2.338134765625, -1.3408203125, -0.343505859375, 0.65380859375, 1.651123046875, 2.6484375, 3.645751953125, 4.64306640625, 5.640380859375, 6.6376953125, 7.635009765625, 8.63232421875, 9.629638671875, 10.626953125, 11.624267578125, 12.62158203125, 13.618896484375, 14.6162109375, 15.613525390625, 16.61083984375, 17.608154296875, 18.60546875, 19.602783203125, 20.60009765625, 21.597412109375, 22.5947265625, 23.592041015625, 24.58935546875, 25.586669921875, 26.583984375, 27.581298828125, 28.57861328125, 29.575927734375, 30.5732421875, 31.570556640625, 32.56787109375, 33.565185546875, 34.5625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 18.0, 63.0, 159.0, 265.0, 251.0, 158.0, 68.0, 19.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.928932189941406, -38.51460266113281, -36.10027313232422, -33.685943603515625, -31.27161407470703, -28.857284545898438, -26.44295310974121, -24.028623580932617, -21.614294052124023, -19.19996452331543, -16.785634994506836, -14.371304512023926, -11.956974983215332, -9.542645454406738, -7.128314971923828, -4.713985443115234, -2.2996559143066406, 0.11467385292053223, 2.529003620147705, 4.943333625793457, 7.357663154602051, 9.771992683410645, 12.186323165893555, 14.600652694702148, 17.014982223510742, 19.429311752319336, 21.84364128112793, 24.257972717285156, 26.67230224609375, 29.086631774902344, 31.500961303710938, 33.91529083251953, 36.329620361328125, 38.74394989013672, 41.15827941894531, 43.572608947753906, 45.9869384765625, 48.401268005371094, 50.81559753417969, 53.22992706298828, 55.644256591796875, 58.05858612060547, 60.47291564941406, 62.887245178222656, 65.30157470703125, 67.71590423583984, 70.13023376464844, 72.54456329345703, 74.95889282226562, 77.37322235107422, 79.78755187988281, 82.2018814086914, 84.6162109375, 87.0305404663086, 89.44486999511719, 91.85919952392578, 94.2735366821289, 96.6878662109375, 99.1021957397461, 101.51652526855469, 103.93085479736328, 106.34518432617188, 108.75951385498047, 111.17384338378906, 113.58817291259766]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 7.0, 10.0, 12.0, 11.0, 15.0, 11.0, 15.0, 23.0, 25.0, 25.0, 29.0, 32.0, 30.0, 34.0, 39.0, 34.0, 28.0, 37.0, 54.0, 45.0, 41.0, 42.0, 38.0, 29.0, 40.0, 39.0, 34.0, 32.0, 36.0, 18.0, 16.0, 22.0, 18.0, 12.0, 13.0, 11.0, 12.0, 6.0, 4.0, 8.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.781631469726562, -21.092193603515625, -20.402755737304688, -19.71331787109375, -19.023880004882812, -18.334442138671875, -17.645004272460938, -16.95556640625, -16.266128540039062, -15.576690673828125, -14.887252807617188, -14.19781494140625, -13.508377075195312, -12.818939208984375, -12.129501342773438, -11.4400634765625, -10.750624656677246, -10.061186790466309, -9.371748924255371, -8.682311058044434, -7.992873191833496, -7.303435325622559, -6.613996982574463, -5.924559116363525, -5.235121250152588, -4.54568338394165, -3.856245517730713, -3.1668074131011963, -2.477369546890259, -1.7879316806793213, -1.0984935760498047, -0.4090557098388672, 0.2803821563720703, 0.9698200821876526, 1.6592580080032349, 2.348695993423462, 3.0381338596343994, 3.727571725845337, 4.4170098304748535, 5.106447696685791, 5.7958855628967285, 6.485323429107666, 7.1747612953186035, 7.864199638366699, 8.553637504577637, 9.243075370788574, 9.932513236999512, 10.62195110321045, 11.311388969421387, 12.000826835632324, 12.690264701843262, 13.3797025680542, 14.069140434265137, 14.758578300476074, 15.448017120361328, 16.137454986572266, 16.826892852783203, 17.51633071899414, 18.205768585205078, 18.895206451416016, 19.584644317626953, 20.27408218383789, 20.963520050048828, 21.652957916259766, 22.342395782470703]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 6.0, 7.0, 18.0, 16.0, 14.0, 12.0, 19.0, 24.0, 28.0, 22.0, 23.0, 34.0, 32.0, 44.0, 39.0, 33.0, 32.0, 33.0, 43.0, 45.0, 51.0, 30.0, 35.0, 42.0, 36.0, 30.0, 31.0, 28.0, 21.0, 24.0, 16.0, 19.0, 15.0, 12.0, 12.0, 14.0, 10.0, 11.0, 2.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.625, -4.498931884765625, -4.37286376953125, -4.246795654296875, -4.1207275390625, -3.994659423828125, -3.86859130859375, -3.742523193359375, -3.616455078125, -3.490386962890625, -3.36431884765625, -3.238250732421875, -3.1121826171875, -2.986114501953125, -2.86004638671875, -2.733978271484375, -2.60791015625, -2.481842041015625, -2.35577392578125, -2.229705810546875, -2.1036376953125, -1.977569580078125, -1.85150146484375, -1.725433349609375, -1.599365234375, -1.473297119140625, -1.34722900390625, -1.221160888671875, -1.0950927734375, -0.969024658203125, -0.84295654296875, -0.716888427734375, -0.5908203125, -0.464752197265625, -0.33868408203125, -0.212615966796875, -0.0865478515625, 0.039520263671875, 0.16558837890625, 0.291656494140625, 0.417724609375, 0.543792724609375, 0.66986083984375, 0.795928955078125, 0.9219970703125, 1.048065185546875, 1.17413330078125, 1.300201416015625, 1.42626953125, 1.552337646484375, 1.67840576171875, 1.804473876953125, 1.9305419921875, 2.056610107421875, 2.18267822265625, 2.308746337890625, 2.434814453125, 2.560882568359375, 2.68695068359375, 2.813018798828125, 2.9390869140625, 3.065155029296875, 3.19122314453125, 3.317291259765625, 3.443359375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 11.0, 17.0, 17.0, 24.0, 38.0, 59.0, 74.0, 130.0, 193.0, 255.0, 325.0, 540.0, 682.0, 1004.0, 1456.0, 2148.0, 3097.0, 4459.0, 6469.0, 9369.0, 13539.0, 19965.0, 29504.0, 43999.0, 71187.0, 129268.0, 256506.0, 189680.0, 94398.0, 56455.0, 36180.0, 24258.0, 16640.0, 11363.0, 7739.0, 5308.0, 3713.0, 2534.0, 1792.0, 1295.0, 866.0, 611.0, 415.0, 304.0, 199.0, 134.0, 104.0, 73.0, 61.0, 46.0, 25.0, 11.0, 6.0, 8.0, 3.0, 0.0, 0.0, 6.0], "bins": [-0.1502685546875, -0.14568138122558594, -0.14109420776367188, -0.1365070343017578, -0.13191986083984375, -0.1273326873779297, -0.12274551391601562, -0.11815834045410156, -0.1135711669921875, -0.10898399353027344, -0.10439682006835938, -0.09980964660644531, -0.09522247314453125, -0.09063529968261719, -0.08604812622070312, -0.08146095275878906, -0.076873779296875, -0.07228660583496094, -0.06769943237304688, -0.06311225891113281, -0.05852508544921875, -0.05393791198730469, -0.049350738525390625, -0.04476356506347656, -0.0401763916015625, -0.03558921813964844, -0.031002044677734375, -0.026414871215820312, -0.02182769775390625, -0.017240524291992188, -0.012653350830078125, -0.008066177368164062, -0.00347900390625, 0.0011081695556640625, 0.005695343017578125, 0.010282516479492188, 0.01486968994140625, 0.019456863403320312, 0.024044036865234375, 0.028631210327148438, 0.0332183837890625, 0.03780555725097656, 0.042392730712890625, 0.04697990417480469, 0.05156707763671875, 0.05615425109863281, 0.060741424560546875, 0.06532859802246094, 0.069915771484375, 0.07450294494628906, 0.07909011840820312, 0.08367729187011719, 0.08826446533203125, 0.09285163879394531, 0.09743881225585938, 0.10202598571777344, 0.1066131591796875, 0.11120033264160156, 0.11578750610351562, 0.12037467956542969, 0.12496185302734375, 0.1295490264892578, 0.13413619995117188, 0.13872337341308594, 0.143310546875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 5.0, 8.0, 9.0, 11.0, 15.0, 13.0, 15.0, 22.0, 24.0, 24.0, 26.0, 29.0, 21.0, 27.0, 37.0, 36.0, 46.0, 33.0, 1067.0, 52.0, 36.0, 42.0, 49.0, 45.0, 37.0, 30.0, 44.0, 30.0, 29.0, 25.0, 13.0, 16.0, 25.0, 14.0, 10.0, 7.0, 8.0, 7.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.787109375, -3.668365478515625, -3.54962158203125, -3.430877685546875, -3.3121337890625, -3.193389892578125, -3.07464599609375, -2.955902099609375, -2.837158203125, -2.718414306640625, -2.59967041015625, -2.480926513671875, -2.3621826171875, -2.243438720703125, -2.12469482421875, -2.005950927734375, -1.88720703125, -1.768463134765625, -1.64971923828125, -1.530975341796875, -1.4122314453125, -1.293487548828125, -1.17474365234375, -1.055999755859375, -0.937255859375, -0.818511962890625, -0.69976806640625, -0.581024169921875, -0.4622802734375, -0.343536376953125, -0.22479248046875, -0.106048583984375, 0.0126953125, 0.131439208984375, 0.25018310546875, 0.368927001953125, 0.4876708984375, 0.606414794921875, 0.72515869140625, 0.843902587890625, 0.962646484375, 1.081390380859375, 1.20013427734375, 1.318878173828125, 1.4376220703125, 1.556365966796875, 1.67510986328125, 1.793853759765625, 1.91259765625, 2.031341552734375, 2.15008544921875, 2.268829345703125, 2.3875732421875, 2.506317138671875, 2.62506103515625, 2.743804931640625, 2.862548828125, 2.981292724609375, 3.10003662109375, 3.218780517578125, 3.3375244140625, 3.456268310546875, 3.57501220703125, 3.693756103515625, 3.8125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 15.0, 14.0, 30.0, 35.0, 51.0, 82.0, 109.0, 147.0, 219.0, 321.0, 461.0, 659.0, 1046.0, 1497.0, 2162.0, 3214.0, 4618.0, 6749.0, 10223.0, 15669.0, 24027.0, 36993.0, 60929.0, 107170.0, 214845.0, 1285791.0, 127578.0, 71110.0, 42447.0, 26862.0, 17252.0, 11402.0, 7629.0, 5060.0, 3420.0, 2257.0, 1517.0, 1102.0, 737.0, 515.0, 371.0, 252.0, 167.0, 116.0, 81.0, 50.0, 45.0, 33.0, 18.0, 13.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.06304931640625, -0.06102466583251953, -0.05900001525878906, -0.056975364685058594, -0.054950714111328125, -0.052926063537597656, -0.05090141296386719, -0.04887676239013672, -0.04685211181640625, -0.04482746124267578, -0.04280281066894531, -0.040778160095214844, -0.038753509521484375, -0.036728858947753906, -0.03470420837402344, -0.03267955780029297, -0.0306549072265625, -0.02863025665283203, -0.026605606079101562, -0.024580955505371094, -0.022556304931640625, -0.020531654357910156, -0.018507003784179688, -0.01648235321044922, -0.01445770263671875, -0.012433052062988281, -0.010408401489257812, -0.008383750915527344, -0.006359100341796875, -0.004334449768066406, -0.0023097991943359375, -0.00028514862060546875, 0.001739501953125, 0.0037641525268554688, 0.0057888031005859375, 0.007813453674316406, 0.009838104248046875, 0.011862754821777344, 0.013887405395507812, 0.01591205596923828, 0.01793670654296875, 0.01996135711669922, 0.021986007690429688, 0.024010658264160156, 0.026035308837890625, 0.028059959411621094, 0.030084609985351562, 0.03210926055908203, 0.0341339111328125, 0.03615856170654297, 0.03818321228027344, 0.040207862854003906, 0.042232513427734375, 0.044257164001464844, 0.04628181457519531, 0.04830646514892578, 0.05033111572265625, 0.05235576629638672, 0.05438041687011719, 0.056405067443847656, 0.058429718017578125, 0.060454368591308594, 0.06247901916503906, 0.06450366973876953, 0.0665283203125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 11.0, 6.0, 7.0, 9.0, 8.0, 13.0, 13.0, 25.0, 18.0, 43.0, 28.0, 56.0, 67.0, 71.0, 86.0, 86.0, 82.0, 65.0, 51.0, 40.0, 30.0, 25.0, 26.0, 17.0, 20.0, 11.0, 18.0, 8.0, 11.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0002872943878173828, -0.00027855485677719116, -0.0002698153257369995, -0.00026107579469680786, -0.0002523362636566162, -0.00024359673261642456, -0.0002348572015762329, -0.00022611767053604126, -0.0002173781394958496, -0.00020863860845565796, -0.0001998990774154663, -0.00019115954637527466, -0.000182420015335083, -0.00017368048429489136, -0.0001649409532546997, -0.00015620142221450806, -0.0001474618911743164, -0.00013872236013412476, -0.0001299828290939331, -0.00012124329805374146, -0.0001125037670135498, -0.00010376423597335815, -9.50247049331665e-05, -8.628517389297485e-05, -7.75456428527832e-05, -6.880611181259155e-05, -6.00665807723999e-05, -5.132704973220825e-05, -4.25875186920166e-05, -3.384798765182495e-05, -2.51084566116333e-05, -1.636892557144165e-05, -7.62939453125e-06, 1.1101365089416504e-06, 9.8496675491333e-06, 1.858919858932495e-05, 2.73287296295166e-05, 3.606826066970825e-05, 4.48077917098999e-05, 5.354732275009155e-05, 6.22868537902832e-05, 7.102638483047485e-05, 7.97659158706665e-05, 8.850544691085815e-05, 9.72449779510498e-05, 0.00010598450899124146, 0.0001147240400314331, 0.00012346357107162476, 0.0001322031021118164, 0.00014094263315200806, 0.0001496821641921997, 0.00015842169523239136, 0.000167161226272583, 0.00017590075731277466, 0.0001846402883529663, 0.00019337981939315796, 0.0002021193504333496, 0.00021085888147354126, 0.0002195984125137329, 0.00022833794355392456, 0.0002370774745941162, 0.00024581700563430786, 0.0002545565366744995, 0.00026329606771469116, 0.0002720355987548828]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 7.0, 10.0, 12.0, 21.0, 19.0, 24.0, 26.0, 38.0, 40.0, 92.0, 165.0, 648.0, 7752.0, 257446.0, 764361.0, 16240.0, 1117.0, 195.0, 104.0, 51.0, 29.0, 27.0, 19.0, 17.0, 7.0, 14.0, 7.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0066375732421875, -0.006417214870452881, -0.006196856498718262, -0.005976498126983643, -0.0057561397552490234, -0.005535781383514404, -0.005315423011779785, -0.005095064640045166, -0.004874706268310547, -0.004654347896575928, -0.004433989524841309, -0.0042136311531066895, -0.00399327278137207, -0.003772914409637451, -0.003552556037902832, -0.003332197666168213, -0.0031118392944335938, -0.0028914809226989746, -0.0026711225509643555, -0.0024507641792297363, -0.002230405807495117, -0.002010047435760498, -0.001789689064025879, -0.0015693306922912598, -0.0013489723205566406, -0.0011286139488220215, -0.0009082555770874023, -0.0006878972053527832, -0.00046753883361816406, -0.0002471804618835449, -2.682209014892578e-05, 0.00019353628158569336, 0.0004138946533203125, 0.0006342530250549316, 0.0008546113967895508, 0.00107496976852417, 0.001295328140258789, 0.0015156865119934082, 0.0017360448837280273, 0.0019564032554626465, 0.0021767616271972656, 0.0023971199989318848, 0.002617478370666504, 0.002837836742401123, 0.003058195114135742, 0.0032785534858703613, 0.0034989118576049805, 0.0037192702293395996, 0.003939628601074219, 0.004159986972808838, 0.004380345344543457, 0.004600703716278076, 0.004821062088012695, 0.0050414204597473145, 0.005261778831481934, 0.005482137203216553, 0.005702495574951172, 0.005922853946685791, 0.00614321231842041, 0.006363570690155029, 0.0065839290618896484, 0.006804287433624268, 0.007024645805358887, 0.007245004177093506, 0.007465362548828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 4.0, 16.0, 13.0, 37.0, 46.0, 105.0, 189.0, 248.0, 148.0, 83.0, 40.0, 25.0, 17.0, 11.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.00111119425855577, -0.001089525525458157, -0.001067856908775866, -0.0010461881756782532, -0.0010245195589959621, -0.0010028508258983493, -0.0009811822092160583, -0.0009595134761184454, -0.0009378448012284935, -0.0009161761263385415, -0.0008945074514485896, -0.0008728387765586376, -0.0008511700434610248, -0.0008295013685710728, -0.0008078326936811209, -0.0007861640187911689, -0.000764495343901217, -0.000742826669011265, -0.0007211579941213131, -0.0006994893192313612, -0.0006778206443414092, -0.0006561519112437963, -0.0006344832363538444, -0.0006128145614638925, -0.0005911458865739405, -0.0005694772116839886, -0.0005478085367940366, -0.0005261398619040847, -0.0005044711288064718, -0.00048280248302035034, -0.00046113377902656794, -0.000439465104136616, -0.0004177964583504945, -0.00039612778346054256, -0.00037445907946676016, -0.0003527904045768082, -0.00033112172968685627, -0.0003094530547969043, -0.0002877843799069524, -0.00026611567591317, -0.00024444700102321804, -0.0002227783261332661, -0.00020110963669139892, -0.00017944094724953175, -0.0001577722723595798, -0.00013610359746962786, -0.00011443490802776068, -9.276621858589351e-05, -7.109754369594157e-05, -4.942886153003201e-05, -2.776017936412245e-05, -6.091497198212892e-06, 1.5577184967696667e-05, 3.7245867133606225e-05, 5.8914549299515784e-05, 8.058323874138296e-05, 0.0001022519136313349, 0.00012392058852128685, 0.00014558927796315402, 0.0001672579674050212, 0.00018892664229497313, 0.00021059531718492508, 0.00023226400662679225, 0.0002539326960686594, 0.00027560137095861137]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 12.0, 9.0, 6.0, 17.0, 21.0, 15.0, 27.0, 28.0, 33.0, 40.0, 48.0, 42.0, 40.0, 46.0, 58.0, 49.0, 54.0, 51.0, 46.0, 50.0, 37.0, 39.0, 43.0, 25.0, 32.0, 24.0, 28.0, 14.0, 13.0, 12.0, 9.0, 4.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0001927018165588379, -0.00018705707043409348, -0.00018141232430934906, -0.00017576757818460464, -0.00017012283205986023, -0.00016447808593511581, -0.0001588333398103714, -0.00015318859368562698, -0.00014754384756088257, -0.00014189910143613815, -0.00013625435531139374, -0.00013060960918664932, -0.0001249648630619049, -0.00011932011693716049, -0.00011367537081241608, -0.00010803062468767166, -0.00010238587856292725, -9.674113243818283e-05, -9.109638631343842e-05, -8.5451640188694e-05, -7.980689406394958e-05, -7.416214793920517e-05, -6.851740181446075e-05, -6.287265568971634e-05, -5.7227909564971924e-05, -5.158316344022751e-05, -4.593841731548309e-05, -4.029367119073868e-05, -3.464892506599426e-05, -2.9004178941249847e-05, -2.3359432816505432e-05, -1.7714686691761017e-05, -1.2069940567016602e-05, -6.425194442272186e-06, -7.80448317527771e-07, 4.864297807216644e-06, 1.050904393196106e-05, 1.6153790056705475e-05, 2.179853618144989e-05, 2.7443282306194305e-05, 3.308802843093872e-05, 3.8732774555683136e-05, 4.437752068042755e-05, 5.0022266805171967e-05, 5.566701292991638e-05, 6.13117590546608e-05, 6.695650517940521e-05, 7.260125130414963e-05, 7.824599742889404e-05, 8.389074355363846e-05, 8.953548967838287e-05, 9.518023580312729e-05, 0.0001008249819278717, 0.00010646972805261612, 0.00011211447417736053, 0.00011775922030210495, 0.00012340396642684937, 0.00012904871255159378, 0.0001346934586763382, 0.0001403382048010826, 0.00014598295092582703, 0.00015162769705057144, 0.00015727244317531586, 0.00016291718930006027, 0.0001685619354248047]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 6.0, 7.0, 18.0, 16.0, 14.0, 12.0, 19.0, 24.0, 28.0, 22.0, 23.0, 34.0, 32.0, 44.0, 39.0, 33.0, 32.0, 33.0, 43.0, 45.0, 51.0, 30.0, 35.0, 42.0, 36.0, 30.0, 31.0, 28.0, 21.0, 24.0, 16.0, 19.0, 15.0, 12.0, 12.0, 14.0, 10.0, 11.0, 2.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.625, -4.498931884765625, -4.37286376953125, -4.246795654296875, -4.1207275390625, -3.994659423828125, -3.86859130859375, -3.742523193359375, -3.616455078125, -3.490386962890625, -3.36431884765625, -3.238250732421875, -3.1121826171875, -2.986114501953125, -2.86004638671875, -2.733978271484375, -2.60791015625, -2.481842041015625, -2.35577392578125, -2.229705810546875, -2.1036376953125, -1.977569580078125, -1.85150146484375, -1.725433349609375, -1.599365234375, -1.473297119140625, -1.34722900390625, -1.221160888671875, -1.0950927734375, -0.969024658203125, -0.84295654296875, -0.716888427734375, -0.5908203125, -0.464752197265625, -0.33868408203125, -0.212615966796875, -0.0865478515625, 0.039520263671875, 0.16558837890625, 0.291656494140625, 0.417724609375, 0.543792724609375, 0.66986083984375, 0.795928955078125, 0.9219970703125, 1.048065185546875, 1.17413330078125, 1.300201416015625, 1.42626953125, 1.552337646484375, 1.67840576171875, 1.804473876953125, 1.9305419921875, 2.056610107421875, 2.18267822265625, 2.308746337890625, 2.434814453125, 2.560882568359375, 2.68695068359375, 2.813018798828125, 2.9390869140625, 3.065155029296875, 3.19122314453125, 3.317291259765625, 3.443359375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 6.0, 12.0, 11.0, 27.0, 33.0, 49.0, 59.0, 82.0, 138.0, 216.0, 316.0, 512.0, 784.0, 1154.0, 1976.0, 3350.0, 5653.0, 10131.0, 19394.0, 43950.0, 116288.0, 303441.0, 321516.0, 125963.0, 47450.0, 20506.0, 10701.0, 5858.0, 3400.0, 2015.0, 1236.0, 813.0, 484.0, 318.0, 254.0, 141.0, 105.0, 72.0, 45.0, 34.0, 21.0, 11.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75494384765625, -5.5567626953125, -5.35858154296875, -5.160400390625, -4.96221923828125, -4.7640380859375, -4.56585693359375, -4.36767578125, -4.16949462890625, -3.9713134765625, -3.77313232421875, -3.574951171875, -3.37677001953125, -3.1785888671875, -2.98040771484375, -2.7822265625, -2.58404541015625, -2.3858642578125, -2.18768310546875, -1.989501953125, -1.79132080078125, -1.5931396484375, -1.39495849609375, -1.19677734375, -0.99859619140625, -0.8004150390625, -0.60223388671875, -0.404052734375, -0.20587158203125, -0.0076904296875, 0.19049072265625, 0.388671875, 0.58685302734375, 0.7850341796875, 0.98321533203125, 1.181396484375, 1.37957763671875, 1.5777587890625, 1.77593994140625, 1.97412109375, 2.17230224609375, 2.3704833984375, 2.56866455078125, 2.766845703125, 2.96502685546875, 3.1632080078125, 3.36138916015625, 3.5595703125, 3.75775146484375, 3.9559326171875, 4.15411376953125, 4.352294921875, 4.55047607421875, 4.7486572265625, 4.94683837890625, 5.14501953125, 5.34320068359375, 5.5413818359375, 5.73956298828125, 5.937744140625, 6.13592529296875, 6.3341064453125, 6.53228759765625, 6.73046875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 9.0, 5.0, 10.0, 14.0, 15.0, 15.0, 20.0, 27.0, 23.0, 20.0, 31.0, 38.0, 40.0, 50.0, 63.0, 75.0, 139.0, 252.0, 1406.0, 248.0, 129.0, 62.0, 59.0, 40.0, 51.0, 33.0, 27.0, 22.0, 30.0, 15.0, 16.0, 13.0, 10.0, 8.0, 8.0, 6.0, 7.0, 1.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3671875, -12.9285888671875, -12.489990234375, -12.0513916015625, -11.61279296875, -11.1741943359375, -10.735595703125, -10.2969970703125, -9.8583984375, -9.4197998046875, -8.981201171875, -8.5426025390625, -8.10400390625, -7.6654052734375, -7.226806640625, -6.7882080078125, -6.349609375, -5.9110107421875, -5.472412109375, -5.0338134765625, -4.59521484375, -4.1566162109375, -3.718017578125, -3.2794189453125, -2.8408203125, -2.4022216796875, -1.963623046875, -1.5250244140625, -1.08642578125, -0.6478271484375, -0.209228515625, 0.2293701171875, 0.66796875, 1.1065673828125, 1.545166015625, 1.9837646484375, 2.42236328125, 2.8609619140625, 3.299560546875, 3.7381591796875, 4.1767578125, 4.6153564453125, 5.053955078125, 5.4925537109375, 5.93115234375, 6.3697509765625, 6.808349609375, 7.2469482421875, 7.685546875, 8.1241455078125, 8.562744140625, 9.0013427734375, 9.43994140625, 9.8785400390625, 10.317138671875, 10.7557373046875, 11.1943359375, 11.6329345703125, 12.071533203125, 12.5101318359375, 12.94873046875, 13.3873291015625, 13.825927734375, 14.2645263671875, 14.703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 13.0, 11.0, 17.0, 26.0, 31.0, 54.0, 81.0, 88.0, 162.0, 286.0, 514.0, 1076.0, 3235.0, 15708.0, 135203.0, 2454310.0, 491251.0, 34495.0, 5874.0, 1649.0, 633.0, 346.0, 200.0, 138.0, 78.0, 59.0, 37.0, 35.0, 25.0, 17.0, 11.0, 13.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.947509765625, -15.41064453125, -14.873779296875, -14.3369140625, -13.800048828125, -13.26318359375, -12.726318359375, -12.189453125, -11.652587890625, -11.11572265625, -10.578857421875, -10.0419921875, -9.505126953125, -8.96826171875, -8.431396484375, -7.89453125, -7.357666015625, -6.82080078125, -6.283935546875, -5.7470703125, -5.210205078125, -4.67333984375, -4.136474609375, -3.599609375, -3.062744140625, -2.52587890625, -1.989013671875, -1.4521484375, -0.915283203125, -0.37841796875, 0.158447265625, 0.6953125, 1.232177734375, 1.76904296875, 2.305908203125, 2.8427734375, 3.379638671875, 3.91650390625, 4.453369140625, 4.990234375, 5.527099609375, 6.06396484375, 6.600830078125, 7.1376953125, 7.674560546875, 8.21142578125, 8.748291015625, 9.28515625, 9.822021484375, 10.35888671875, 10.895751953125, 11.4326171875, 11.969482421875, 12.50634765625, 13.043212890625, 13.580078125, 14.116943359375, 14.65380859375, 15.190673828125, 15.7275390625, 16.264404296875, 16.80126953125, 17.338134765625, 17.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 45.0, 275.0, 450.0, 212.0, 32.0, 1.0], "bins": [-228.4581756591797, -224.67642211914062, -220.89466857910156, -217.1129150390625, -213.33116149902344, -209.54940795898438, -205.76763916015625, -201.98590087890625, -198.20413208007812, -194.42237854003906, -190.640625, -186.85887145996094, -183.07711791992188, -179.2953643798828, -175.51361083984375, -171.73184204101562, -167.95010375976562, -164.16835021972656, -160.3865966796875, -156.60484313964844, -152.82308959960938, -149.0413360595703, -145.25958251953125, -141.47781372070312, -137.69606018066406, -133.914306640625, -130.13255310058594, -126.35079956054688, -122.56903839111328, -118.78728485107422, -115.00553131103516, -111.2237777709961, -107.44202423095703, -103.66027069091797, -99.8785171508789, -96.09675598144531, -92.31500244140625, -88.53324890136719, -84.75149536132812, -80.96974182128906, -77.18798828125, -73.40623474121094, -69.62448120117188, -65.84272766113281, -62.060970306396484, -58.279212951660156, -54.497459411621094, -50.71570587158203, -46.93395233154297, -43.152198791503906, -39.37044143676758, -35.588687896728516, -31.806934356689453, -28.025178909301758, -24.243423461914062, -20.461669921875, -16.679912567138672, -12.898158073425293, -9.116403579711914, -5.334648132324219, -1.5528936386108398, 2.228860855102539, 6.010616302490234, 9.792369842529297, 13.574124336242676]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 2.0, 11.0, 5.0, 12.0, 15.0, 11.0, 8.0, 16.0, 12.0, 28.0, 21.0, 20.0, 44.0, 36.0, 39.0, 35.0, 50.0, 43.0, 37.0, 50.0, 45.0, 46.0, 41.0, 37.0, 32.0, 41.0, 39.0, 32.0, 18.0, 28.0, 30.0, 15.0, 17.0, 8.0, 13.0, 6.0, 9.0, 15.0, 11.0, 9.0, 2.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.09288787841797, -35.01768493652344, -33.942481994628906, -32.867279052734375, -31.79207420349121, -30.71687126159668, -29.641666412353516, -28.566463470458984, -27.491260528564453, -26.416057586669922, -25.34085464477539, -24.265649795532227, -23.190446853637695, -22.115243911743164, -21.0400390625, -19.96483612060547, -18.889633178710938, -17.814430236816406, -16.739227294921875, -15.664022445678711, -14.58881950378418, -13.513616561889648, -12.4384126663208, -11.363208770751953, -10.288005828857422, -9.21280288696289, -8.137598991394043, -7.0623955726623535, -5.987192153930664, -4.911988735198975, -3.836785316467285, -2.7615818977355957, -1.6863784790039062, -0.6111750602722168, 0.46402835845947266, 1.539231777191162, 2.6144351959228516, 3.689638614654541, 4.7648420333862305, 5.84004545211792, 6.915248870849609, 7.990452289581299, 9.065655708312988, 10.140859603881836, 11.216062545776367, 12.291265487670898, 13.366469383239746, 14.441673278808594, 15.516876220703125, 16.592079162597656, 17.667282104492188, 18.74248695373535, 19.817689895629883, 20.892892837524414, 21.968097686767578, 23.04330062866211, 24.11850357055664, 25.193706512451172, 26.268909454345703, 27.344114303588867, 28.4193172454834, 29.49452018737793, 30.569725036621094, 31.644927978515625, 32.720130920410156]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 1.0, 8.0, 5.0, 7.0, 5.0, 6.0, 13.0, 18.0, 14.0, 17.0, 18.0, 15.0, 21.0, 24.0, 25.0, 25.0, 39.0, 31.0, 37.0, 20.0, 50.0, 30.0, 50.0, 39.0, 46.0, 29.0, 39.0, 38.0, 34.0, 35.0, 37.0, 17.0, 21.0, 20.0, 30.0, 16.0, 21.0, 18.0, 15.0, 12.0, 9.0, 16.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 2.0], "bins": [-4.7265625, -4.599578857421875, -4.47259521484375, -4.345611572265625, -4.2186279296875, -4.091644287109375, -3.96466064453125, -3.837677001953125, -3.710693359375, -3.583709716796875, -3.45672607421875, -3.329742431640625, -3.2027587890625, -3.075775146484375, -2.94879150390625, -2.821807861328125, -2.69482421875, -2.567840576171875, -2.44085693359375, -2.313873291015625, -2.1868896484375, -2.059906005859375, -1.93292236328125, -1.805938720703125, -1.678955078125, -1.551971435546875, -1.42498779296875, -1.298004150390625, -1.1710205078125, -1.044036865234375, -0.91705322265625, -0.790069580078125, -0.6630859375, -0.536102294921875, -0.40911865234375, -0.282135009765625, -0.1551513671875, -0.028167724609375, 0.09881591796875, 0.225799560546875, 0.352783203125, 0.479766845703125, 0.60675048828125, 0.733734130859375, 0.8607177734375, 0.987701416015625, 1.11468505859375, 1.241668701171875, 1.36865234375, 1.495635986328125, 1.62261962890625, 1.749603271484375, 1.8765869140625, 2.003570556640625, 2.13055419921875, 2.257537841796875, 2.384521484375, 2.511505126953125, 2.63848876953125, 2.765472412109375, 2.8924560546875, 3.019439697265625, 3.14642333984375, 3.273406982421875, 3.400390625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 6.0, 8.0, 7.0, 5.0, 7.0, 14.0, 19.0, 29.0, 34.0, 47.0, 67.0, 135.0, 216.0, 452.0, 805.0, 1526.0, 3234.0, 7592.0, 21529.0, 79508.0, 361455.0, 1517815.0, 1652139.0, 415171.0, 91828.0, 24597.0, 8537.0, 3641.0, 1660.0, 919.0, 498.0, 307.0, 165.0, 115.0, 58.0, 43.0, 32.0, 15.0, 20.0, 8.0, 8.0, 4.0, 2.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.6640625, -7.44537353515625, -7.2266845703125, -7.00799560546875, -6.789306640625, -6.57061767578125, -6.3519287109375, -6.13323974609375, -5.91455078125, -5.69586181640625, -5.4771728515625, -5.25848388671875, -5.039794921875, -4.82110595703125, -4.6024169921875, -4.38372802734375, -4.1650390625, -3.94635009765625, -3.7276611328125, -3.50897216796875, -3.290283203125, -3.07159423828125, -2.8529052734375, -2.63421630859375, -2.41552734375, -2.19683837890625, -1.9781494140625, -1.75946044921875, -1.540771484375, -1.32208251953125, -1.1033935546875, -0.88470458984375, -0.666015625, -0.44732666015625, -0.2286376953125, -0.00994873046875, 0.208740234375, 0.42742919921875, 0.6461181640625, 0.86480712890625, 1.08349609375, 1.30218505859375, 1.5208740234375, 1.73956298828125, 1.958251953125, 2.17694091796875, 2.3956298828125, 2.61431884765625, 2.8330078125, 3.05169677734375, 3.2703857421875, 3.48907470703125, 3.707763671875, 3.92645263671875, 4.1451416015625, 4.36383056640625, 4.58251953125, 4.80120849609375, 5.0198974609375, 5.23858642578125, 5.457275390625, 5.67596435546875, 5.8946533203125, 6.11334228515625, 6.33203125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 8.0, 6.0, 16.0, 15.0, 19.0, 34.0, 40.0, 83.0, 108.0, 158.0, 212.0, 313.0, 410.0, 593.0, 568.0, 422.0, 348.0, 211.0, 153.0, 109.0, 79.0, 44.0, 26.0, 25.0, 15.0, 11.0, 7.0, 11.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51171875, -7.25286865234375, -6.9940185546875, -6.73516845703125, -6.476318359375, -6.21746826171875, -5.9586181640625, -5.69976806640625, -5.44091796875, -5.18206787109375, -4.9232177734375, -4.66436767578125, -4.405517578125, -4.14666748046875, -3.8878173828125, -3.62896728515625, -3.3701171875, -3.11126708984375, -2.8524169921875, -2.59356689453125, -2.334716796875, -2.07586669921875, -1.8170166015625, -1.55816650390625, -1.29931640625, -1.04046630859375, -0.7816162109375, -0.52276611328125, -0.263916015625, -0.00506591796875, 0.2537841796875, 0.51263427734375, 0.771484375, 1.03033447265625, 1.2891845703125, 1.54803466796875, 1.806884765625, 2.06573486328125, 2.3245849609375, 2.58343505859375, 2.84228515625, 3.10113525390625, 3.3599853515625, 3.61883544921875, 3.877685546875, 4.13653564453125, 4.3953857421875, 4.65423583984375, 4.9130859375, 5.17193603515625, 5.4307861328125, 5.68963623046875, 5.948486328125, 6.20733642578125, 6.4661865234375, 6.72503662109375, 6.98388671875, 7.24273681640625, 7.5015869140625, 7.76043701171875, 8.019287109375, 8.27813720703125, 8.5369873046875, 8.79583740234375, 9.0546875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 11.0, 17.0, 9.0, 22.0, 24.0, 46.0, 65.0, 113.0, 174.0, 350.0, 772.0, 2563.0, 13255.0, 212913.0, 3605022.0, 336952.0, 17146.0, 2937.0, 938.0, 402.0, 208.0, 107.0, 76.0, 62.0, 20.0, 18.0, 15.0, 15.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.8740234375, -24.154296875, -23.4345703125, -22.71484375, -21.9951171875, -21.275390625, -20.5556640625, -19.8359375, -19.1162109375, -18.396484375, -17.6767578125, -16.95703125, -16.2373046875, -15.517578125, -14.7978515625, -14.078125, -13.3583984375, -12.638671875, -11.9189453125, -11.19921875, -10.4794921875, -9.759765625, -9.0400390625, -8.3203125, -7.6005859375, -6.880859375, -6.1611328125, -5.44140625, -4.7216796875, -4.001953125, -3.2822265625, -2.5625, -1.8427734375, -1.123046875, -0.4033203125, 0.31640625, 1.0361328125, 1.755859375, 2.4755859375, 3.1953125, 3.9150390625, 4.634765625, 5.3544921875, 6.07421875, 6.7939453125, 7.513671875, 8.2333984375, 8.953125, 9.6728515625, 10.392578125, 11.1123046875, 11.83203125, 12.5517578125, 13.271484375, 13.9912109375, 14.7109375, 15.4306640625, 16.150390625, 16.8701171875, 17.58984375, 18.3095703125, 19.029296875, 19.7490234375, 20.46875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 44.0, 239.0, 458.0, 223.0, 40.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.15943145751953, -55.67448425292969, -51.18954086303711, -46.70459747314453, -42.21965026855469, -37.734703063964844, -33.249759674072266, -28.764814376831055, -24.279869079589844, -19.794923782348633, -15.309978485107422, -10.825033187866211, -6.340087890625, -1.855142593383789, 2.629802703857422, 7.114748001098633, 11.599693298339844, 16.084638595581055, 20.569583892822266, 25.054529190063477, 29.539474487304688, 34.02442169189453, 38.50936508178711, 42.99430847167969, 47.47925567626953, 51.964202880859375, 56.44914627075195, 60.93408966064453, 65.41903686523438, 69.90398406982422, 74.38893127441406, 78.87387084960938, 83.35881042480469, 87.84375762939453, 92.32870483398438, 96.81364440917969, 101.29859161376953, 105.78353881835938, 110.26847839355469, 114.75342559814453, 119.23837280273438, 123.72332000732422, 128.20826721191406, 132.69320678710938, 137.17816162109375, 141.66310119628906, 146.14804077148438, 150.63299560546875, 155.11793518066406, 159.60287475585938, 164.08782958984375, 168.57276916503906, 173.05770874023438, 177.54266357421875, 182.02760314941406, 186.51255798339844, 190.99749755859375, 195.48243713378906, 199.96739196777344, 204.45233154296875, 208.93728637695312, 213.42222595214844, 217.90716552734375, 222.39212036132812, 226.87705993652344]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 7.0, 8.0, 7.0, 19.0, 16.0, 14.0, 13.0, 22.0, 20.0, 25.0, 28.0, 28.0, 35.0, 32.0, 39.0, 38.0, 30.0, 33.0, 37.0, 35.0, 42.0, 32.0, 41.0, 42.0, 32.0, 38.0, 38.0, 21.0, 30.0, 25.0, 20.0, 20.0, 22.0, 20.0, 8.0, 15.0, 13.0, 9.0, 8.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-24.05582618713379, -23.329723358154297, -22.603622436523438, -21.877519607543945, -21.151416778564453, -20.425315856933594, -19.6992130279541, -18.97311019897461, -18.24700927734375, -17.520906448364258, -16.7948055267334, -16.068702697753906, -15.342599868774414, -14.616497993469238, -13.890396118164062, -13.16429328918457, -12.438190460205078, -11.712088584899902, -10.98598575592041, -10.259883880615234, -9.533781051635742, -8.807679176330566, -8.08157730102539, -7.355474948883057, -6.629372596740723, -5.903270244598389, -5.177167892456055, -4.451066017150879, -3.724963665008545, -2.998861312866211, -2.272759437561035, -1.5466570854187012, -0.8205528259277344, -0.09445059299468994, 0.6316516399383545, 1.3577537536621094, 2.0838561058044434, 2.8099584579467773, 3.536060333251953, 4.262162685394287, 4.988265037536621, 5.714367389678955, 6.440469741821289, 7.166571617126465, 7.892673969268799, 8.618776321411133, 9.344878196716309, 10.070980072021484, 10.797082901000977, 11.523184776306152, 12.249287605285645, 12.97538948059082, 13.701492309570312, 14.427594184875488, 15.153696060180664, 15.879798889160156, 16.605899810791016, 17.332002639770508, 18.058103561401367, 18.78420639038086, 19.51030921936035, 20.236412048339844, 20.962512969970703, 21.688615798950195, 22.414718627929688]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 8.0, 12.0, 9.0, 13.0, 9.0, 12.0, 16.0, 13.0, 19.0, 31.0, 19.0, 12.0, 31.0, 34.0, 33.0, 36.0, 33.0, 30.0, 39.0, 40.0, 47.0, 31.0, 31.0, 45.0, 32.0, 36.0, 35.0, 35.0, 29.0, 25.0, 19.0, 23.0, 26.0, 25.0, 21.0, 13.0, 12.0, 13.0, 10.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.640625, -4.510589599609375, -4.38055419921875, -4.250518798828125, -4.1204833984375, -3.990447998046875, -3.86041259765625, -3.730377197265625, -3.600341796875, -3.470306396484375, -3.34027099609375, -3.210235595703125, -3.0802001953125, -2.950164794921875, -2.82012939453125, -2.690093994140625, -2.56005859375, -2.430023193359375, -2.29998779296875, -2.169952392578125, -2.0399169921875, -1.909881591796875, -1.77984619140625, -1.649810791015625, -1.519775390625, -1.389739990234375, -1.25970458984375, -1.129669189453125, -0.9996337890625, -0.869598388671875, -0.73956298828125, -0.609527587890625, -0.4794921875, -0.349456787109375, -0.21942138671875, -0.089385986328125, 0.0406494140625, 0.170684814453125, 0.30072021484375, 0.430755615234375, 0.560791015625, 0.690826416015625, 0.82086181640625, 0.950897216796875, 1.0809326171875, 1.210968017578125, 1.34100341796875, 1.471038818359375, 1.60107421875, 1.731109619140625, 1.86114501953125, 1.991180419921875, 2.1212158203125, 2.251251220703125, 2.38128662109375, 2.511322021484375, 2.641357421875, 2.771392822265625, 2.90142822265625, 3.031463623046875, 3.1614990234375, 3.291534423828125, 3.42156982421875, 3.551605224609375, 3.681640625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 16.0, 22.0, 39.0, 62.0, 65.0, 129.0, 163.0, 233.0, 401.0, 642.0, 912.0, 1355.0, 1977.0, 3016.0, 4568.0, 7157.0, 10657.0, 16430.0, 26320.0, 43260.0, 75871.0, 144626.0, 282185.0, 190852.0, 95884.0, 53646.0, 31573.0, 19703.0, 12554.0, 8239.0, 5368.0, 3477.0, 2425.0, 1610.0, 1073.0, 663.0, 435.0, 283.0, 231.0, 148.0, 94.0, 54.0, 42.0, 25.0, 17.0, 9.0, 13.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.156005859375, -0.1509227752685547, -0.14583969116210938, -0.14075660705566406, -0.13567352294921875, -0.13059043884277344, -0.12550735473632812, -0.12042427062988281, -0.1153411865234375, -0.11025810241699219, -0.10517501831054688, -0.10009193420410156, -0.09500885009765625, -0.08992576599121094, -0.08484268188476562, -0.07975959777832031, -0.074676513671875, -0.06959342956542969, -0.06451034545898438, -0.05942726135253906, -0.05434417724609375, -0.04926109313964844, -0.044178009033203125, -0.03909492492675781, -0.0340118408203125, -0.028928756713867188, -0.023845672607421875, -0.018762588500976562, -0.01367950439453125, -0.008596420288085938, -0.003513336181640625, 0.0015697479248046875, 0.00665283203125, 0.011735916137695312, 0.016819000244140625, 0.021902084350585938, 0.02698516845703125, 0.03206825256347656, 0.037151336669921875, 0.04223442077636719, 0.0473175048828125, 0.05240058898925781, 0.057483673095703125, 0.06256675720214844, 0.06764984130859375, 0.07273292541503906, 0.07781600952148438, 0.08289909362792969, 0.087982177734375, 0.09306526184082031, 0.09814834594726562, 0.10323143005371094, 0.10831451416015625, 0.11339759826660156, 0.11848068237304688, 0.12356376647949219, 0.1286468505859375, 0.1337299346923828, 0.13881301879882812, 0.14389610290527344, 0.14897918701171875, 0.15406227111816406, 0.15914535522460938, 0.1642284393310547, 0.1693115234375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 4.0, 3.0, 8.0, 9.0, 12.0, 11.0, 8.0, 14.0, 21.0, 14.0, 22.0, 27.0, 19.0, 32.0, 28.0, 39.0, 34.0, 36.0, 41.0, 45.0, 38.0, 1072.0, 48.0, 42.0, 32.0, 30.0, 41.0, 24.0, 39.0, 33.0, 30.0, 25.0, 17.0, 23.0, 16.0, 21.0, 11.0, 14.0, 5.0, 10.0, 6.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.537933349609375, -3.41375732421875, -3.289581298828125, -3.1654052734375, -3.041229248046875, -2.91705322265625, -2.792877197265625, -2.668701171875, -2.544525146484375, -2.42034912109375, -2.296173095703125, -2.1719970703125, -2.047821044921875, -1.92364501953125, -1.799468994140625, -1.67529296875, -1.551116943359375, -1.42694091796875, -1.302764892578125, -1.1785888671875, -1.054412841796875, -0.93023681640625, -0.806060791015625, -0.681884765625, -0.557708740234375, -0.43353271484375, -0.309356689453125, -0.1851806640625, -0.061004638671875, 0.06317138671875, 0.187347412109375, 0.3115234375, 0.435699462890625, 0.55987548828125, 0.684051513671875, 0.8082275390625, 0.932403564453125, 1.05657958984375, 1.180755615234375, 1.304931640625, 1.429107666015625, 1.55328369140625, 1.677459716796875, 1.8016357421875, 1.925811767578125, 2.04998779296875, 2.174163818359375, 2.29833984375, 2.422515869140625, 2.54669189453125, 2.670867919921875, 2.7950439453125, 2.919219970703125, 3.04339599609375, 3.167572021484375, 3.291748046875, 3.415924072265625, 3.54010009765625, 3.664276123046875, 3.7884521484375, 3.912628173828125, 4.03680419921875, 4.160980224609375, 4.28515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 25.0, 34.0, 52.0, 67.0, 84.0, 130.0, 172.0, 246.0, 342.0, 459.0, 613.0, 886.0, 1247.0, 1631.0, 2326.0, 3319.0, 4559.0, 6274.0, 8840.0, 12787.0, 18205.0, 26840.0, 40401.0, 65178.0, 111778.0, 232978.0, 1225629.0, 122952.0, 70677.0, 43718.0, 28533.0, 19228.0, 13491.0, 9531.0, 6624.0, 4763.0, 3394.0, 2514.0, 1920.0, 1366.0, 958.0, 721.0, 455.0, 362.0, 222.0, 173.0, 115.0, 94.0, 61.0, 45.0, 33.0, 20.0, 17.0, 15.0, 5.0, 7.0, 4.0], "bins": [-0.062469482421875, -0.060581207275390625, -0.05869293212890625, -0.056804656982421875, -0.0549163818359375, -0.053028106689453125, -0.05113983154296875, -0.049251556396484375, -0.04736328125, -0.045475006103515625, -0.04358673095703125, -0.041698455810546875, -0.0398101806640625, -0.037921905517578125, -0.03603363037109375, -0.034145355224609375, -0.032257080078125, -0.030368804931640625, -0.02848052978515625, -0.026592254638671875, -0.0247039794921875, -0.022815704345703125, -0.02092742919921875, -0.019039154052734375, -0.01715087890625, -0.015262603759765625, -0.01337432861328125, -0.011486053466796875, -0.0095977783203125, -0.007709503173828125, -0.00582122802734375, -0.003932952880859375, -0.002044677734375, -0.000156402587890625, 0.00173187255859375, 0.003620147705078125, 0.0055084228515625, 0.007396697998046875, 0.00928497314453125, 0.011173248291015625, 0.0130615234375, 0.014949798583984375, 0.01683807373046875, 0.018726348876953125, 0.0206146240234375, 0.022502899169921875, 0.02439117431640625, 0.026279449462890625, 0.028167724609375, 0.030055999755859375, 0.03194427490234375, 0.033832550048828125, 0.0357208251953125, 0.037609100341796875, 0.03949737548828125, 0.041385650634765625, 0.04327392578125, 0.045162200927734375, 0.04705047607421875, 0.048938751220703125, 0.0508270263671875, 0.052715301513671875, 0.05460357666015625, 0.056491851806640625, 0.058380126953125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 9.0, 7.0, 13.0, 25.0, 31.0, 34.0, 45.0, 62.0, 80.0, 122.0, 141.0, 104.0, 73.0, 51.0, 39.0, 26.0, 29.0, 13.0, 11.0, 9.0, 12.0, 8.0, 10.0, 3.0, 5.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005860328674316406, -0.000567898154258728, -0.0005497634410858154, -0.0005316287279129028, -0.0005134940147399902, -0.0004953593015670776, -0.00047722458839416504, -0.00045908987522125244, -0.00044095516204833984, -0.00042282044887542725, -0.00040468573570251465, -0.00038655102252960205, -0.00036841630935668945, -0.00035028159618377686, -0.00033214688301086426, -0.00031401216983795166, -0.00029587745666503906, -0.00027774274349212646, -0.00025960803031921387, -0.00024147331714630127, -0.00022333860397338867, -0.00020520389080047607, -0.00018706917762756348, -0.00016893446445465088, -0.00015079975128173828, -0.00013266503810882568, -0.00011453032493591309, -9.639561176300049e-05, -7.826089859008789e-05, -6.012618541717529e-05, -4.1991472244262695e-05, -2.3856759071350098e-05, -5.7220458984375e-06, 1.2412667274475098e-05, 3.0547380447387695e-05, 4.868209362030029e-05, 6.681680679321289e-05, 8.495151996612549e-05, 0.00010308623313903809, 0.00012122094631195068, 0.00013935565948486328, 0.00015749037265777588, 0.00017562508583068848, 0.00019375979900360107, 0.00021189451217651367, 0.00023002922534942627, 0.00024816393852233887, 0.00026629865169525146, 0.00028443336486816406, 0.00030256807804107666, 0.00032070279121398926, 0.00033883750438690186, 0.00035697221755981445, 0.00037510693073272705, 0.00039324164390563965, 0.00041137635707855225, 0.00042951107025146484, 0.00044764578342437744, 0.00046578049659729004, 0.00048391520977020264, 0.0005020499229431152, 0.0005201846361160278, 0.0005383193492889404, 0.000556454062461853, 0.0005745887756347656]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 10.0, 7.0, 13.0, 12.0, 18.0, 21.0, 34.0, 49.0, 86.0, 197.0, 2066.0, 1012311.0, 33020.0, 331.0, 106.0, 82.0, 38.0, 39.0, 26.0, 12.0, 4.0, 11.0, 13.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01427459716796875, -0.01382458209991455, -0.013374567031860352, -0.012924551963806152, -0.012474536895751953, -0.012024521827697754, -0.011574506759643555, -0.011124491691589355, -0.010674476623535156, -0.010224461555480957, -0.009774446487426758, -0.009324431419372559, -0.00887441635131836, -0.00842440128326416, -0.007974386215209961, -0.007524371147155762, -0.0070743560791015625, -0.006624341011047363, -0.006174325942993164, -0.005724310874938965, -0.005274295806884766, -0.004824280738830566, -0.004374265670776367, -0.003924250602722168, -0.0034742355346679688, -0.0030242204666137695, -0.0025742053985595703, -0.002124190330505371, -0.0016741752624511719, -0.0012241601943969727, -0.0007741451263427734, -0.0003241300582885742, 0.000125885009765625, 0.0005759000778198242, 0.0010259151458740234, 0.0014759302139282227, 0.0019259452819824219, 0.002375960350036621, 0.0028259754180908203, 0.0032759904861450195, 0.0037260055541992188, 0.004176020622253418, 0.004626035690307617, 0.005076050758361816, 0.005526065826416016, 0.005976080894470215, 0.006426095962524414, 0.006876111030578613, 0.0073261260986328125, 0.007776141166687012, 0.008226156234741211, 0.00867617130279541, 0.00912618637084961, 0.009576201438903809, 0.010026216506958008, 0.010476231575012207, 0.010926246643066406, 0.011376261711120605, 0.011826276779174805, 0.012276291847229004, 0.012726306915283203, 0.013176321983337402, 0.013626337051391602, 0.0140763521194458, 0.0145263671875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 11.0, 101.0, 676.0, 209.0, 21.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033415743382647634, -0.00026288485969416797, -0.0001916122855618596, -0.00012033971142955124, -4.906713729724288e-05, 2.2205436835065484e-05, 9.347801096737385e-05, 0.00016475055599585176, 0.00023602315923199058, 0.00030729573336429894, 0.0003785683074966073, 0.00044984088162891567, 0.000521113455761224, 0.0005923860007897019, 0.0006636586040258408, 0.0007349311490543187, 0.0008062037522904575, 0.0008774762973189354, 0.0009487489005550742, 0.001020021503791213, 0.00109129399061203, 0.0011625665938481688, 0.0012338391970843077, 0.0013051116839051247, 0.0013763844035565853, 0.0014476570067927241, 0.001518929610028863, 0.00159020209684968, 0.0016614747000858188, 0.0017327473033219576, 0.0018040197901427746, 0.0018752923933789134, 0.0019465647637844086, 0.0020178372506052256, 0.002089109970256686, 0.002160382457077503, 0.002231655176728964, 0.002302927663549781, 0.002374200150370598, 0.0024454728700220585, 0.0025167453568428755, 0.0025880178436636925, 0.002659290563315153, 0.00273056305013597, 0.002801835536956787, 0.0028731082566082478, 0.0029443807434290648, 0.0030156532302498817, 0.0030869259499013424, 0.0031581984367221594, 0.00322947115637362, 0.003300743643194437, 0.0033720163628458977, 0.0034432888496667147, 0.0035145613364875317, 0.0035858340561389923, 0.0036571065429598093, 0.0037283790297806263, 0.003799651749432087, 0.003870924236252904, 0.003942196723073721, 0.004013469442725182, 0.004084742162376642, 0.004156014416366816, 0.004227287136018276]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 7.0, 9.0, 10.0, 11.0, 18.0, 15.0, 21.0, 25.0, 35.0, 27.0, 18.0, 31.0, 42.0, 34.0, 36.0, 55.0, 41.0, 48.0, 48.0, 43.0, 53.0, 33.0, 43.0, 38.0, 49.0, 26.0, 28.0, 29.0, 25.0, 10.0, 25.0, 12.0, 4.0, 9.0, 8.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002391338348388672, -0.0002312762662768364, -0.0002234186977148056, -0.0002155611291527748, -0.00020770356059074402, -0.00019984599202871323, -0.00019198842346668243, -0.00018413085490465164, -0.00017627328634262085, -0.00016841571778059006, -0.00016055814921855927, -0.00015270058065652847, -0.00014484301209449768, -0.0001369854435324669, -0.0001291278749704361, -0.0001212703064084053, -0.00011341273784637451, -0.00010555516928434372, -9.769760072231293e-05, -8.984003216028214e-05, -8.198246359825134e-05, -7.412489503622055e-05, -6.626732647418976e-05, -5.8409757912158966e-05, -5.0552189350128174e-05, -4.269462078809738e-05, -3.483705222606659e-05, -2.6979483664035797e-05, -1.9121915102005005e-05, -1.1264346539974213e-05, -3.4067779779434204e-06, 4.450790584087372e-06, 1.2308359146118164e-05, 2.0165927708148956e-05, 2.802349627017975e-05, 3.588106483221054e-05, 4.373863339424133e-05, 5.1596201956272125e-05, 5.945377051830292e-05, 6.731133908033371e-05, 7.51689076423645e-05, 8.30264762043953e-05, 9.088404476642609e-05, 9.874161332845688e-05, 0.00010659918189048767, 0.00011445675045251846, 0.00012231431901454926, 0.00013017188757658005, 0.00013802945613861084, 0.00014588702470064163, 0.00015374459326267242, 0.00016160216182470322, 0.000169459730386734, 0.0001773172989487648, 0.0001851748675107956, 0.00019303243607282639, 0.00020089000463485718, 0.00020874757319688797, 0.00021660514175891876, 0.00022446271032094955, 0.00023232027888298035, 0.00024017784744501114, 0.00024803541600704193, 0.0002558929845690727, 0.0002637505531311035]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 8.0, 12.0, 9.0, 13.0, 9.0, 12.0, 16.0, 13.0, 19.0, 31.0, 19.0, 12.0, 31.0, 34.0, 33.0, 36.0, 33.0, 30.0, 39.0, 40.0, 47.0, 31.0, 31.0, 45.0, 32.0, 36.0, 35.0, 35.0, 29.0, 25.0, 19.0, 23.0, 26.0, 25.0, 21.0, 13.0, 12.0, 13.0, 10.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.640625, -4.510589599609375, -4.38055419921875, -4.250518798828125, -4.1204833984375, -3.990447998046875, -3.86041259765625, -3.730377197265625, -3.600341796875, -3.470306396484375, -3.34027099609375, -3.210235595703125, -3.0802001953125, -2.950164794921875, -2.82012939453125, -2.690093994140625, -2.56005859375, -2.430023193359375, -2.29998779296875, -2.169952392578125, -2.0399169921875, -1.909881591796875, -1.77984619140625, -1.649810791015625, -1.519775390625, -1.389739990234375, -1.25970458984375, -1.129669189453125, -0.9996337890625, -0.869598388671875, -0.73956298828125, -0.609527587890625, -0.4794921875, -0.349456787109375, -0.21942138671875, -0.089385986328125, 0.0406494140625, 0.170684814453125, 0.30072021484375, 0.430755615234375, 0.560791015625, 0.690826416015625, 0.82086181640625, 0.950897216796875, 1.0809326171875, 1.210968017578125, 1.34100341796875, 1.471038818359375, 1.60107421875, 1.731109619140625, 1.86114501953125, 1.991180419921875, 2.1212158203125, 2.251251220703125, 2.38128662109375, 2.511322021484375, 2.641357421875, 2.771392822265625, 2.90142822265625, 3.031463623046875, 3.1614990234375, 3.291534423828125, 3.42156982421875, 3.551605224609375, 3.681640625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 4.0, 12.0, 14.0, 14.0, 20.0, 21.0, 45.0, 46.0, 79.0, 125.0, 170.0, 228.0, 395.0, 701.0, 1140.0, 1935.0, 3716.0, 6685.0, 12810.0, 26560.0, 60354.0, 182171.0, 480187.0, 163080.0, 56389.0, 24782.0, 12206.0, 6268.0, 3503.0, 1921.0, 1142.0, 652.0, 388.0, 252.0, 168.0, 108.0, 71.0, 54.0, 34.0, 36.0, 20.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.68359375, -6.45672607421875, -6.2298583984375, -6.00299072265625, -5.776123046875, -5.54925537109375, -5.3223876953125, -5.09552001953125, -4.86865234375, -4.64178466796875, -4.4149169921875, -4.18804931640625, -3.961181640625, -3.73431396484375, -3.5074462890625, -3.28057861328125, -3.0537109375, -2.82684326171875, -2.5999755859375, -2.37310791015625, -2.146240234375, -1.91937255859375, -1.6925048828125, -1.46563720703125, -1.23876953125, -1.01190185546875, -0.7850341796875, -0.55816650390625, -0.331298828125, -0.10443115234375, 0.1224365234375, 0.34930419921875, 0.576171875, 0.80303955078125, 1.0299072265625, 1.25677490234375, 1.483642578125, 1.71051025390625, 1.9373779296875, 2.16424560546875, 2.39111328125, 2.61798095703125, 2.8448486328125, 3.07171630859375, 3.298583984375, 3.52545166015625, 3.7523193359375, 3.97918701171875, 4.2060546875, 4.43292236328125, 4.6597900390625, 4.88665771484375, 5.113525390625, 5.34039306640625, 5.5672607421875, 5.79412841796875, 6.02099609375, 6.24786376953125, 6.4747314453125, 6.70159912109375, 6.928466796875, 7.15533447265625, 7.3822021484375, 7.60906982421875, 7.8359375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 11.0, 10.0, 10.0, 30.0, 22.0, 24.0, 40.0, 33.0, 36.0, 29.0, 54.0, 69.0, 69.0, 112.0, 201.0, 1392.0, 252.0, 121.0, 91.0, 76.0, 42.0, 39.0, 31.0, 42.0, 39.0, 25.0, 27.0, 14.0, 19.0, 18.0, 8.0, 14.0, 8.0, 6.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7734375, -12.3699951171875, -11.966552734375, -11.5631103515625, -11.15966796875, -10.7562255859375, -10.352783203125, -9.9493408203125, -9.5458984375, -9.1424560546875, -8.739013671875, -8.3355712890625, -7.93212890625, -7.5286865234375, -7.125244140625, -6.7218017578125, -6.318359375, -5.9149169921875, -5.511474609375, -5.1080322265625, -4.70458984375, -4.3011474609375, -3.897705078125, -3.4942626953125, -3.0908203125, -2.6873779296875, -2.283935546875, -1.8804931640625, -1.47705078125, -1.0736083984375, -0.670166015625, -0.2667236328125, 0.13671875, 0.5401611328125, 0.943603515625, 1.3470458984375, 1.75048828125, 2.1539306640625, 2.557373046875, 2.9608154296875, 3.3642578125, 3.7677001953125, 4.171142578125, 4.5745849609375, 4.97802734375, 5.3814697265625, 5.784912109375, 6.1883544921875, 6.591796875, 6.9952392578125, 7.398681640625, 7.8021240234375, 8.20556640625, 8.6090087890625, 9.012451171875, 9.4158935546875, 9.8193359375, 10.2227783203125, 10.626220703125, 11.0296630859375, 11.43310546875, 11.8365478515625, 12.239990234375, 12.6434326171875, 13.046875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 8.0, 10.0, 14.0, 10.0, 12.0, 27.0, 34.0, 53.0, 76.0, 126.0, 182.0, 264.0, 461.0, 827.0, 2060.0, 7056.0, 37158.0, 412344.0, 2486086.0, 170518.0, 20528.0, 4531.0, 1477.0, 692.0, 416.0, 239.0, 139.0, 97.0, 64.0, 58.0, 28.0, 24.0, 18.0, 12.0, 17.0, 10.0, 6.0, 1.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 4.0], "bins": [-18.9375, -18.4163818359375, -17.895263671875, -17.3741455078125, -16.85302734375, -16.3319091796875, -15.810791015625, -15.2896728515625, -14.7685546875, -14.2474365234375, -13.726318359375, -13.2052001953125, -12.68408203125, -12.1629638671875, -11.641845703125, -11.1207275390625, -10.599609375, -10.0784912109375, -9.557373046875, -9.0362548828125, -8.51513671875, -7.9940185546875, -7.472900390625, -6.9517822265625, -6.4306640625, -5.9095458984375, -5.388427734375, -4.8673095703125, -4.34619140625, -3.8250732421875, -3.303955078125, -2.7828369140625, -2.26171875, -1.7406005859375, -1.219482421875, -0.6983642578125, -0.17724609375, 0.3438720703125, 0.864990234375, 1.3861083984375, 1.9072265625, 2.4283447265625, 2.949462890625, 3.4705810546875, 3.99169921875, 4.5128173828125, 5.033935546875, 5.5550537109375, 6.076171875, 6.5972900390625, 7.118408203125, 7.6395263671875, 8.16064453125, 8.6817626953125, 9.202880859375, 9.7239990234375, 10.2451171875, 10.7662353515625, 11.287353515625, 11.8084716796875, 12.32958984375, 12.8507080078125, 13.371826171875, 13.8929443359375, 14.4140625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 87.0, 509.0, 368.0, 45.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-250.22364807128906, -245.8242950439453, -241.4249267578125, -237.02557373046875, -232.62620544433594, -228.2268524169922, -223.82748413085938, -219.42813110351562, -215.02877807617188, -210.62942504882812, -206.2300567626953, -201.83070373535156, -197.43133544921875, -193.031982421875, -188.6326141357422, -184.23326110839844, -179.83389282226562, -175.43453979492188, -171.03517150878906, -166.6358184814453, -162.2364501953125, -157.83709716796875, -153.43772888183594, -149.0383758544922, -144.63900756835938, -140.23965454101562, -135.8402862548828, -131.44093322753906, -127.04156494140625, -122.6422119140625, -118.24285125732422, -113.84349060058594, -109.44413757324219, -105.0447769165039, -100.64541625976562, -96.24605560302734, -91.84669494628906, -87.44734191894531, -83.04798126220703, -78.64862060546875, -74.24925994873047, -69.84989929199219, -65.4505386352539, -61.05118179321289, -56.65182113647461, -52.25246047973633, -47.85310363769531, -43.45374298095703, -39.05438232421875, -34.65502166748047, -30.25566291809082, -25.856304168701172, -21.45694351196289, -17.05758285522461, -12.658224105834961, -8.258865356445312, -3.8595046997070312, 0.5398550033569336, 4.939214706420898, 9.338574409484863, 13.737934112548828, 18.13729476928711, 22.536653518676758, 26.936012268066406, 31.335372924804688]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 5.0, 6.0, 5.0, 6.0, 12.0, 10.0, 17.0, 30.0, 16.0, 20.0, 17.0, 21.0, 33.0, 29.0, 31.0, 17.0, 42.0, 28.0, 35.0, 44.0, 35.0, 37.0, 32.0, 33.0, 41.0, 38.0, 25.0, 46.0, 29.0, 31.0, 31.0, 26.0, 17.0, 17.0, 14.0, 21.0, 17.0, 5.0, 17.0, 12.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0], "bins": [-30.363006591796875, -29.4329833984375, -28.502960205078125, -27.57293701171875, -26.642915725708008, -25.712892532348633, -24.782869338989258, -23.852846145629883, -22.922822952270508, -21.992799758911133, -21.062776565551758, -20.132755279541016, -19.20273208618164, -18.272708892822266, -17.34268569946289, -16.412662506103516, -15.482640266418457, -14.552617073059082, -13.622594833374023, -12.692571640014648, -11.762548446655273, -10.832525253295898, -9.90250301361084, -8.972479820251465, -8.042457580566406, -7.1124348640441895, -6.1824116706848145, -5.252388954162598, -4.322365760803223, -3.392343044281006, -2.462320327758789, -1.532297134399414, -0.6022739410400391, 0.32774895429611206, 1.2577718496322632, 2.1877946853637695, 3.1178176403045654, 4.047840595245361, 4.977863311767578, 5.907886505126953, 6.83790922164917, 7.767931938171387, 8.697955131530762, 9.62797737121582, 10.558000564575195, 11.48802375793457, 12.418046951293945, 13.34807014465332, 14.278092384338379, 15.208115577697754, 16.138137817382812, 17.068161010742188, 17.998184204101562, 18.928207397460938, 19.858230590820312, 20.788253784179688, 21.71827507019043, 22.648298263549805, 23.57832145690918, 24.508342742919922, 25.438365936279297, 26.368389129638672, 27.298412322998047, 28.228435516357422, 29.158458709716797]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 11.0, 7.0, 6.0, 17.0, 15.0, 13.0, 13.0, 17.0, 19.0, 26.0, 20.0, 20.0, 36.0, 31.0, 24.0, 41.0, 31.0, 27.0, 37.0, 37.0, 36.0, 35.0, 38.0, 39.0, 39.0, 38.0, 32.0, 33.0, 21.0, 26.0, 19.0, 22.0, 27.0, 19.0, 17.0, 14.0, 13.0, 14.0, 11.0, 5.0, 9.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.11468505859375, -3.9871826171875, -3.85968017578125, -3.732177734375, -3.60467529296875, -3.4771728515625, -3.34967041015625, -3.22216796875, -3.09466552734375, -2.9671630859375, -2.83966064453125, -2.712158203125, -2.58465576171875, -2.4571533203125, -2.32965087890625, -2.2021484375, -2.07464599609375, -1.9471435546875, -1.81964111328125, -1.692138671875, -1.56463623046875, -1.4371337890625, -1.30963134765625, -1.18212890625, -1.05462646484375, -0.9271240234375, -0.79962158203125, -0.672119140625, -0.54461669921875, -0.4171142578125, -0.28961181640625, -0.162109375, -0.03460693359375, 0.0928955078125, 0.22039794921875, 0.347900390625, 0.47540283203125, 0.6029052734375, 0.73040771484375, 0.85791015625, 0.98541259765625, 1.1129150390625, 1.24041748046875, 1.367919921875, 1.49542236328125, 1.6229248046875, 1.75042724609375, 1.8779296875, 2.00543212890625, 2.1329345703125, 2.26043701171875, 2.387939453125, 2.51544189453125, 2.6429443359375, 2.77044677734375, 2.89794921875, 3.02545166015625, 3.1529541015625, 3.28045654296875, 3.407958984375, 3.53546142578125, 3.6629638671875, 3.79046630859375, 3.91796875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 10.0, 12.0, 24.0, 33.0, 44.0, 63.0, 83.0, 122.0, 187.0, 301.0, 487.0, 887.0, 1822.0, 4047.0, 10502.0, 36558.0, 208679.0, 1468096.0, 2044994.0, 340484.0, 53285.0, 13435.0, 5010.0, 2236.0, 1098.0, 638.0, 388.0, 236.0, 139.0, 93.0, 65.0, 47.0, 41.0, 23.0, 21.0, 12.0, 15.0, 10.0, 4.0, 4.0, 2.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.7767333984375, -8.475341796875, -8.1739501953125, -7.87255859375, -7.5711669921875, -7.269775390625, -6.9683837890625, -6.6669921875, -6.3656005859375, -6.064208984375, -5.7628173828125, -5.46142578125, -5.1600341796875, -4.858642578125, -4.5572509765625, -4.255859375, -3.9544677734375, -3.653076171875, -3.3516845703125, -3.05029296875, -2.7489013671875, -2.447509765625, -2.1461181640625, -1.8447265625, -1.5433349609375, -1.241943359375, -0.9405517578125, -0.63916015625, -0.3377685546875, -0.036376953125, 0.2650146484375, 0.56640625, 0.8677978515625, 1.169189453125, 1.4705810546875, 1.77197265625, 2.0733642578125, 2.374755859375, 2.6761474609375, 2.9775390625, 3.2789306640625, 3.580322265625, 3.8817138671875, 4.18310546875, 4.4844970703125, 4.785888671875, 5.0872802734375, 5.388671875, 5.6900634765625, 5.991455078125, 6.2928466796875, 6.59423828125, 6.8956298828125, 7.197021484375, 7.4984130859375, 7.7998046875, 8.1011962890625, 8.402587890625, 8.7039794921875, 9.00537109375, 9.3067626953125, 9.608154296875, 9.9095458984375, 10.2109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 12.0, 10.0, 13.0, 18.0, 23.0, 28.0, 26.0, 35.0, 47.0, 50.0, 97.0, 131.0, 180.0, 192.0, 281.0, 373.0, 422.0, 429.0, 422.0, 312.0, 246.0, 150.0, 129.0, 97.0, 67.0, 62.0, 50.0, 38.0, 26.0, 20.0, 16.0, 12.0, 17.0, 6.0, 5.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.80078125, -5.6025390625, -5.404296875, -5.2060546875, -5.0078125, -4.8095703125, -4.611328125, -4.4130859375, -4.21484375, -4.0166015625, -3.818359375, -3.6201171875, -3.421875, -3.2236328125, -3.025390625, -2.8271484375, -2.62890625, -2.4306640625, -2.232421875, -2.0341796875, -1.8359375, -1.6376953125, -1.439453125, -1.2412109375, -1.04296875, -0.8447265625, -0.646484375, -0.4482421875, -0.25, -0.0517578125, 0.146484375, 0.3447265625, 0.54296875, 0.7412109375, 0.939453125, 1.1376953125, 1.3359375, 1.5341796875, 1.732421875, 1.9306640625, 2.12890625, 2.3271484375, 2.525390625, 2.7236328125, 2.921875, 3.1201171875, 3.318359375, 3.5166015625, 3.71484375, 3.9130859375, 4.111328125, 4.3095703125, 4.5078125, 4.7060546875, 4.904296875, 5.1025390625, 5.30078125, 5.4990234375, 5.697265625, 5.8955078125, 6.09375, 6.2919921875, 6.490234375, 6.6884765625, 6.88671875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 4.0, 5.0, 9.0, 10.0, 12.0, 27.0, 16.0, 26.0, 30.0, 51.0, 80.0, 100.0, 168.0, 248.0, 411.0, 802.0, 1760.0, 5027.0, 21086.0, 139569.0, 1843245.0, 1999434.0, 150385.0, 22486.0, 5377.0, 1823.0, 860.0, 439.0, 250.0, 148.0, 104.0, 74.0, 54.0, 39.0, 36.0, 23.0, 14.0, 15.0, 8.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-17.40625, -16.9229736328125, -16.439697265625, -15.9564208984375, -15.47314453125, -14.9898681640625, -14.506591796875, -14.0233154296875, -13.5400390625, -13.0567626953125, -12.573486328125, -12.0902099609375, -11.60693359375, -11.1236572265625, -10.640380859375, -10.1571044921875, -9.673828125, -9.1905517578125, -8.707275390625, -8.2239990234375, -7.74072265625, -7.2574462890625, -6.774169921875, -6.2908935546875, -5.8076171875, -5.3243408203125, -4.841064453125, -4.3577880859375, -3.87451171875, -3.3912353515625, -2.907958984375, -2.4246826171875, -1.94140625, -1.4581298828125, -0.974853515625, -0.4915771484375, -0.00830078125, 0.4749755859375, 0.958251953125, 1.4415283203125, 1.9248046875, 2.4080810546875, 2.891357421875, 3.3746337890625, 3.85791015625, 4.3411865234375, 4.824462890625, 5.3077392578125, 5.791015625, 6.2742919921875, 6.757568359375, 7.2408447265625, 7.72412109375, 8.2073974609375, 8.690673828125, 9.1739501953125, 9.6572265625, 10.1405029296875, 10.623779296875, 11.1070556640625, 11.59033203125, 12.0736083984375, 12.556884765625, 13.0401611328125, 13.5234375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 13.0, 63.0, 191.0, 350.0, 259.0, 102.0, 29.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.66197204589844, -52.304664611816406, -48.947357177734375, -45.59005355834961, -42.23274612426758, -38.87543869018555, -35.51813507080078, -32.16082763671875, -28.80352020263672, -25.446212768554688, -22.08890724182129, -18.73160171508789, -15.37429428100586, -12.016986846923828, -8.65968132019043, -5.302375793457031, -1.945068359375, 1.4122381210327148, 4.76954460144043, 8.126851081848145, 11.48415756225586, 14.84146499633789, 18.19877052307129, 21.556076049804688, 24.91338348388672, 28.27069091796875, 31.62799644470215, 34.98530197143555, 38.34260940551758, 41.69991683959961, 45.057220458984375, 48.414527893066406, 51.77183532714844, 55.12914276123047, 58.4864501953125, 61.843753814697266, 65.20106506347656, 68.55836486816406, 71.9156723022461, 75.27297973632812, 78.63028717041016, 81.98759460449219, 85.34490203857422, 88.70220947265625, 92.05950927734375, 95.41682434082031, 98.77412414550781, 102.13143157958984, 105.48873901367188, 108.8460464477539, 112.20335388183594, 115.56066131591797, 118.91796875, 122.2752685546875, 125.63257598876953, 128.98988342285156, 132.34719848632812, 135.70449829101562, 139.0618133544922, 142.4191131591797, 145.77642822265625, 149.13372802734375, 152.4910430908203, 155.8483428955078, 159.2056427001953]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 5.0, 4.0, 9.0, 7.0, 15.0, 14.0, 21.0, 20.0, 19.0, 27.0, 26.0, 34.0, 27.0, 37.0, 34.0, 37.0, 38.0, 35.0, 48.0, 43.0, 38.0, 42.0, 35.0, 38.0, 52.0, 35.0, 31.0, 30.0, 27.0, 21.0, 24.0, 26.0, 12.0, 17.0, 9.0, 14.0, 9.0, 11.0, 5.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.901531219482422, -24.117189407348633, -23.33284568786621, -22.548503875732422, -21.76416015625, -20.97981834411621, -20.195476531982422, -19.4111328125, -18.626789093017578, -17.84244728088379, -17.058103561401367, -16.273761749267578, -15.489418029785156, -14.705076217651367, -13.920733451843262, -13.136390686035156, -12.352048873901367, -11.567706108093262, -10.783363342285156, -9.999021530151367, -9.214677810668945, -8.430335998535156, -7.645993232727051, -6.861650466918945, -6.07730770111084, -5.292964935302734, -4.508622169494629, -3.7242798805236816, -2.939937114715576, -2.1555943489074707, -1.3712520599365234, -0.586909294128418, 0.1974334716796875, 0.9817761182785034, 1.7661187648773193, 2.5504612922668457, 3.334804058074951, 4.119146823883057, 4.903489112854004, 5.687831878662109, 6.472174644470215, 7.25651741027832, 8.040860176086426, 8.825202941894531, 9.60954475402832, 10.393888473510742, 11.178230285644531, 11.962573051452637, 12.746915817260742, 13.531258583068848, 14.315601348876953, 15.099943161010742, 15.884286880493164, 16.668628692626953, 17.452972412109375, 18.237314224243164, 19.021656036376953, 19.805997848510742, 20.590341567993164, 21.374683380126953, 22.159027099609375, 22.943368911743164, 23.727710723876953, 24.512054443359375, 25.296398162841797]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 13.0, 10.0, 5.0, 11.0, 9.0, 13.0, 18.0, 9.0, 21.0, 19.0, 17.0, 21.0, 32.0, 25.0, 32.0, 23.0, 44.0, 28.0, 31.0, 41.0, 40.0, 36.0, 42.0, 38.0, 36.0, 36.0, 40.0, 41.0, 19.0, 34.0, 28.0, 24.0, 22.0, 17.0, 15.0, 18.0, 16.0, 8.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.56640625, -4.43212890625, -4.2978515625, -4.16357421875, -4.029296875, -3.89501953125, -3.7607421875, -3.62646484375, -3.4921875, -3.35791015625, -3.2236328125, -3.08935546875, -2.955078125, -2.82080078125, -2.6865234375, -2.55224609375, -2.41796875, -2.28369140625, -2.1494140625, -2.01513671875, -1.880859375, -1.74658203125, -1.6123046875, -1.47802734375, -1.34375, -1.20947265625, -1.0751953125, -0.94091796875, -0.806640625, -0.67236328125, -0.5380859375, -0.40380859375, -0.26953125, -0.13525390625, -0.0009765625, 0.13330078125, 0.267578125, 0.40185546875, 0.5361328125, 0.67041015625, 0.8046875, 0.93896484375, 1.0732421875, 1.20751953125, 1.341796875, 1.47607421875, 1.6103515625, 1.74462890625, 1.87890625, 2.01318359375, 2.1474609375, 2.28173828125, 2.416015625, 2.55029296875, 2.6845703125, 2.81884765625, 2.953125, 3.08740234375, 3.2216796875, 3.35595703125, 3.490234375, 3.62451171875, 3.7587890625, 3.89306640625, 4.02734375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 17.0, 19.0, 21.0, 36.0, 50.0, 70.0, 95.0, 134.0, 217.0, 349.0, 500.0, 642.0, 992.0, 1479.0, 2147.0, 3254.0, 4769.0, 7232.0, 10630.0, 16475.0, 24964.0, 39789.0, 66783.0, 120375.0, 252705.0, 221679.0, 107766.0, 60248.0, 36537.0, 23065.0, 15085.0, 9913.0, 6745.0, 4512.0, 2954.0, 1979.0, 1412.0, 908.0, 590.0, 466.0, 306.0, 191.0, 137.0, 103.0, 75.0, 37.0, 33.0, 22.0, 22.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.156982421875, -0.15221214294433594, -0.14744186401367188, -0.1426715850830078, -0.13790130615234375, -0.1331310272216797, -0.12836074829101562, -0.12359046936035156, -0.1188201904296875, -0.11404991149902344, -0.10927963256835938, -0.10450935363769531, -0.09973907470703125, -0.09496879577636719, -0.09019851684570312, -0.08542823791503906, -0.080657958984375, -0.07588768005371094, -0.07111740112304688, -0.06634712219238281, -0.06157684326171875, -0.05680656433105469, -0.052036285400390625, -0.04726600646972656, -0.0424957275390625, -0.03772544860839844, -0.032955169677734375, -0.028184890747070312, -0.02341461181640625, -0.018644332885742188, -0.013874053955078125, -0.009103775024414062, -0.00433349609375, 0.0004367828369140625, 0.005207061767578125, 0.009977340698242188, 0.01474761962890625, 0.019517898559570312, 0.024288177490234375, 0.029058456420898438, 0.0338287353515625, 0.03859901428222656, 0.043369293212890625, 0.04813957214355469, 0.05290985107421875, 0.05768013000488281, 0.062450408935546875, 0.06722068786621094, 0.071990966796875, 0.07676124572753906, 0.08153152465820312, 0.08630180358886719, 0.09107208251953125, 0.09584236145019531, 0.10061264038085938, 0.10538291931152344, 0.1101531982421875, 0.11492347717285156, 0.11969375610351562, 0.12446403503417969, 0.12923431396484375, 0.1340045928955078, 0.13877487182617188, 0.14354515075683594, 0.1483154296875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 9.0, 14.0, 9.0, 10.0, 15.0, 19.0, 24.0, 15.0, 24.0, 24.0, 34.0, 39.0, 32.0, 32.0, 38.0, 34.0, 41.0, 29.0, 38.0, 1056.0, 38.0, 41.0, 47.0, 38.0, 41.0, 34.0, 28.0, 24.0, 17.0, 20.0, 21.0, 14.0, 15.0, 13.0, 16.0, 12.0, 13.0, 6.0, 9.0, 5.0, 12.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.383758544921875, -3.27532958984375, -3.166900634765625, -3.0584716796875, -2.950042724609375, -2.84161376953125, -2.733184814453125, -2.624755859375, -2.516326904296875, -2.40789794921875, -2.299468994140625, -2.1910400390625, -2.082611083984375, -1.97418212890625, -1.865753173828125, -1.75732421875, -1.648895263671875, -1.54046630859375, -1.432037353515625, -1.3236083984375, -1.215179443359375, -1.10675048828125, -0.998321533203125, -0.889892578125, -0.781463623046875, -0.67303466796875, -0.564605712890625, -0.4561767578125, -0.347747802734375, -0.23931884765625, -0.130889892578125, -0.0224609375, 0.085968017578125, 0.19439697265625, 0.302825927734375, 0.4112548828125, 0.519683837890625, 0.62811279296875, 0.736541748046875, 0.844970703125, 0.953399658203125, 1.06182861328125, 1.170257568359375, 1.2786865234375, 1.387115478515625, 1.49554443359375, 1.603973388671875, 1.71240234375, 1.820831298828125, 1.92926025390625, 2.037689208984375, 2.1461181640625, 2.254547119140625, 2.36297607421875, 2.471405029296875, 2.579833984375, 2.688262939453125, 2.79669189453125, 2.905120849609375, 3.0135498046875, 3.121978759765625, 3.23040771484375, 3.338836669921875, 3.447265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 8.0, 4.0, 11.0, 21.0, 30.0, 46.0, 66.0, 87.0, 131.0, 201.0, 312.0, 411.0, 594.0, 903.0, 1406.0, 2067.0, 2996.0, 4286.0, 6288.0, 9321.0, 14073.0, 21696.0, 34385.0, 55239.0, 94115.0, 175796.0, 1300306.0, 150478.0, 83028.0, 49185.0, 30456.0, 19474.0, 13070.0, 8712.0, 6034.0, 3901.0, 2505.0, 1703.0, 1175.0, 827.0, 577.0, 408.0, 251.0, 174.0, 128.0, 74.0, 54.0, 42.0, 27.0, 15.0, 15.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.0672607421875, -0.06518363952636719, -0.06310653686523438, -0.06102943420410156, -0.05895233154296875, -0.05687522888183594, -0.054798126220703125, -0.05272102355957031, -0.0506439208984375, -0.04856681823730469, -0.046489715576171875, -0.04441261291503906, -0.04233551025390625, -0.04025840759277344, -0.038181304931640625, -0.03610420227050781, -0.034027099609375, -0.03194999694824219, -0.029872894287109375, -0.027795791625976562, -0.02571868896484375, -0.023641586303710938, -0.021564483642578125, -0.019487380981445312, -0.0174102783203125, -0.015333175659179688, -0.013256072998046875, -0.011178970336914062, -0.00910186767578125, -0.0070247650146484375, -0.004947662353515625, -0.0028705596923828125, -0.00079345703125, 0.0012836456298828125, 0.003360748291015625, 0.0054378509521484375, 0.00751495361328125, 0.009592056274414062, 0.011669158935546875, 0.013746261596679688, 0.0158233642578125, 0.017900466918945312, 0.019977569580078125, 0.022054672241210938, 0.02413177490234375, 0.026208877563476562, 0.028285980224609375, 0.030363082885742188, 0.032440185546875, 0.03451728820800781, 0.036594390869140625, 0.03867149353027344, 0.04074859619140625, 0.04282569885253906, 0.044902801513671875, 0.04697990417480469, 0.0490570068359375, 0.05113410949707031, 0.053211212158203125, 0.05528831481933594, 0.05736541748046875, 0.05944252014160156, 0.061519622802734375, 0.06359672546386719, 0.065673828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 11.0, 5.0, 6.0, 7.0, 9.0, 13.0, 17.0, 16.0, 19.0, 17.0, 10.0, 33.0, 37.0, 56.0, 76.0, 108.0, 125.0, 127.0, 61.0, 52.0, 43.0, 27.0, 15.0, 16.0, 14.0, 12.0, 3.0, 9.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0003745555877685547, -0.00036362186074256897, -0.00035268813371658325, -0.00034175440669059753, -0.0003308206796646118, -0.0003198869526386261, -0.0003089532256126404, -0.00029801949858665466, -0.00028708577156066895, -0.00027615204453468323, -0.0002652183175086975, -0.0002542845904827118, -0.00024335086345672607, -0.00023241713643074036, -0.00022148340940475464, -0.00021054968237876892, -0.0001996159553527832, -0.00018868222832679749, -0.00017774850130081177, -0.00016681477427482605, -0.00015588104724884033, -0.00014494732022285461, -0.0001340135931968689, -0.00012307986617088318, -0.00011214613914489746, -0.00010121241211891174, -9.027868509292603e-05, -7.934495806694031e-05, -6.841123104095459e-05, -5.747750401496887e-05, -4.6543776988983154e-05, -3.5610049962997437e-05, -2.467632293701172e-05, -1.3742595911026001e-05, -2.808868885040283e-06, 8.124858140945435e-06, 1.9058585166931152e-05, 2.999231219291687e-05, 4.092603921890259e-05, 5.1859766244888306e-05, 6.279349327087402e-05, 7.372722029685974e-05, 8.466094732284546e-05, 9.559467434883118e-05, 0.0001065284013748169, 0.00011746212840080261, 0.00012839585542678833, 0.00013932958245277405, 0.00015026330947875977, 0.00016119703650474548, 0.0001721307635307312, 0.00018306449055671692, 0.00019399821758270264, 0.00020493194460868835, 0.00021586567163467407, 0.0002267993986606598, 0.0002377331256866455, 0.0002486668527126312, 0.00025960057973861694, 0.00027053430676460266, 0.0002814680337905884, 0.0002924017608165741, 0.0003033354878425598, 0.00031426921486854553, 0.00032520294189453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 9.0, 7.0, 6.0, 18.0, 17.0, 22.0, 37.0, 67.0, 120.0, 244.0, 2139.0, 776753.0, 267178.0, 1378.0, 200.0, 104.0, 54.0, 26.0, 23.0, 18.0, 18.0, 17.0, 12.0, 9.0, 6.0, 5.0, 8.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00846099853515625, -0.008178353309631348, -0.007895708084106445, -0.007613062858581543, -0.007330417633056641, -0.007047772407531738, -0.006765127182006836, -0.006482481956481934, -0.006199836730957031, -0.005917191505432129, -0.0056345462799072266, -0.005351901054382324, -0.005069255828857422, -0.0047866106033325195, -0.004503965377807617, -0.004221320152282715, -0.0039386749267578125, -0.00365602970123291, -0.003373384475708008, -0.0030907392501831055, -0.002808094024658203, -0.0025254487991333008, -0.0022428035736083984, -0.001960158348083496, -0.0016775131225585938, -0.0013948678970336914, -0.001112222671508789, -0.0008295774459838867, -0.0005469322204589844, -0.00026428699493408203, 1.8358230590820312e-05, 0.00030100345611572266, 0.000583648681640625, 0.0008662939071655273, 0.0011489391326904297, 0.001431584358215332, 0.0017142295837402344, 0.0019968748092651367, 0.002279520034790039, 0.0025621652603149414, 0.0028448104858398438, 0.003127455711364746, 0.0034101009368896484, 0.0036927461624145508, 0.003975391387939453, 0.0042580366134643555, 0.004540681838989258, 0.00482332706451416, 0.0051059722900390625, 0.005388617515563965, 0.005671262741088867, 0.0059539079666137695, 0.006236553192138672, 0.006519198417663574, 0.0068018436431884766, 0.007084488868713379, 0.007367134094238281, 0.007649779319763184, 0.007932424545288086, 0.008215069770812988, 0.00849771499633789, 0.008780360221862793, 0.009063005447387695, 0.009345650672912598, 0.0096282958984375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 13.0, 32.0, 122.0, 371.0, 344.0, 97.0, 22.0, 10.0, 5.0, 0.0, 1.0], "bins": [-0.0019118670606985688, -0.001878263894468546, -0.001844660728238523, -0.0018110575620085, -0.0017774543957784772, -0.0017438512295484543, -0.0017102480633184314, -0.0016766448970884085, -0.0016430417308583856, -0.0016094385646283627, -0.0015758353983983397, -0.0015422322321683168, -0.001508629065938294, -0.001475025899708271, -0.0014414227334782481, -0.0014078195672482252, -0.0013742165174335241, -0.0013406133512035012, -0.0013070101849734783, -0.0012734070187434554, -0.0012398038525134325, -0.0012062006862834096, -0.0011725975200533867, -0.0011389943538233638, -0.0011053911875933409, -0.001071788021363318, -0.001038184855133295, -0.0010045816889032722, -0.0009709785226732492, -0.0009373753564432263, -0.0009037721902132034, -0.0008701690239831805, -0.0008365659159608185, -0.0008029627497307956, -0.0007693595835007727, -0.0007357564172707498, -0.0007021532510407269, -0.000668550084810704, -0.000634946976788342, -0.0006013438105583191, -0.0005677405861206353, -0.0005341374198906124, -0.0005005342536605895, -0.00046693108743056655, -0.00043332792120054364, -0.00039972475497052073, -0.0003661216178443283, -0.0003325184516143054, -0.0002989153144881129, -0.00026531214825809, -0.0002317089820280671, -0.00019810583034995943, -0.00016450266411993653, -0.00013089949788991362, -9.729634621180594e-05, -6.369317998178303e-05, -3.0089999199844897e-05, 3.5131633921992034e-06, 3.7116325984243304e-05, 7.07194849383086e-05, 0.0001043226511683315, 0.0001379258173983544, 0.0001715289690764621, 0.000205132135306485, 0.0002387353015365079]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 10.0, 11.0, 11.0, 18.0, 18.0, 18.0, 19.0, 26.0, 25.0, 32.0, 37.0, 36.0, 45.0, 36.0, 36.0, 34.0, 56.0, 44.0, 41.0, 38.0, 30.0, 45.0, 30.0, 29.0, 25.0, 29.0, 21.0, 23.0, 32.0, 23.0, 21.0, 12.0, 13.0, 10.0, 6.0, 8.0, 4.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.00018358230590820312, -0.00017814245074987411, -0.0001727025955915451, -0.0001672627404332161, -0.00016182288527488708, -0.00015638303011655807, -0.00015094317495822906, -0.00014550331979990005, -0.00014006346464157104, -0.00013462360948324203, -0.00012918375432491302, -0.00012374389916658401, -0.000118304044008255, -0.000112864188849926, -0.00010742433369159698, -0.00010198447853326797, -9.654462337493896e-05, -9.110476821660995e-05, -8.566491305828094e-05, -8.022505789995193e-05, -7.478520274162292e-05, -6.934534758329391e-05, -6.39054924249649e-05, -5.8465637266635895e-05, -5.3025782108306885e-05, -4.7585926949977875e-05, -4.2146071791648865e-05, -3.6706216633319855e-05, -3.1266361474990845e-05, -2.5826506316661835e-05, -2.0386651158332825e-05, -1.4946796000003815e-05, -9.506940841674805e-06, -4.067085683345795e-06, 1.3727694749832153e-06, 6.812624633312225e-06, 1.2252479791641235e-05, 1.7692334949970245e-05, 2.3132190108299255e-05, 2.8572045266628265e-05, 3.4011900424957275e-05, 3.9451755583286285e-05, 4.4891610741615295e-05, 5.0331465899944305e-05, 5.5771321058273315e-05, 6.121117621660233e-05, 6.665103137493134e-05, 7.209088653326035e-05, 7.753074169158936e-05, 8.297059684991837e-05, 8.841045200824738e-05, 9.385030716657639e-05, 9.92901623249054e-05, 0.0001047300174832344, 0.00011016987264156342, 0.00011560972779989243, 0.00012104958295822144, 0.00012648943811655045, 0.00013192929327487946, 0.00013736914843320847, 0.00014280900359153748, 0.00014824885874986649, 0.0001536887139081955, 0.0001591285690665245, 0.00016456842422485352]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 13.0, 10.0, 5.0, 11.0, 9.0, 13.0, 18.0, 9.0, 21.0, 19.0, 17.0, 21.0, 32.0, 25.0, 32.0, 23.0, 44.0, 28.0, 31.0, 41.0, 40.0, 36.0, 42.0, 38.0, 36.0, 36.0, 40.0, 41.0, 19.0, 34.0, 28.0, 24.0, 22.0, 17.0, 16.0, 17.0, 16.0, 8.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.56640625, -4.43212890625, -4.2978515625, -4.16357421875, -4.029296875, -3.89501953125, -3.7607421875, -3.62646484375, -3.4921875, -3.35791015625, -3.2236328125, -3.08935546875, -2.955078125, -2.82080078125, -2.6865234375, -2.55224609375, -2.41796875, -2.28369140625, -2.1494140625, -2.01513671875, -1.880859375, -1.74658203125, -1.6123046875, -1.47802734375, -1.34375, -1.20947265625, -1.0751953125, -0.94091796875, -0.806640625, -0.67236328125, -0.5380859375, -0.40380859375, -0.26953125, -0.13525390625, -0.0009765625, 0.13330078125, 0.267578125, 0.40185546875, 0.5361328125, 0.67041015625, 0.8046875, 0.93896484375, 1.0732421875, 1.20751953125, 1.341796875, 1.47607421875, 1.6103515625, 1.74462890625, 1.87890625, 2.01318359375, 2.1474609375, 2.28173828125, 2.416015625, 2.55029296875, 2.6845703125, 2.81884765625, 2.953125, 3.08740234375, 3.2216796875, 3.35595703125, 3.490234375, 3.62451171875, 3.7587890625, 3.89306640625, 4.02734375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 21.0, 15.0, 32.0, 39.0, 51.0, 79.0, 145.0, 204.0, 270.0, 426.0, 576.0, 851.0, 1321.0, 1877.0, 2814.0, 4212.0, 6554.0, 10138.0, 15775.0, 25844.0, 41298.0, 69659.0, 119766.0, 189829.0, 205443.0, 139415.0, 81699.0, 48792.0, 29395.0, 18343.0, 11556.0, 7391.0, 4910.0, 3151.0, 2118.0, 1523.0, 971.0, 652.0, 437.0, 318.0, 222.0, 130.0, 104.0, 60.0, 39.0, 21.0, 19.0, 15.0, 12.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-5.125, -4.97039794921875, -4.8157958984375, -4.66119384765625, -4.506591796875, -4.35198974609375, -4.1973876953125, -4.04278564453125, -3.88818359375, -3.73358154296875, -3.5789794921875, -3.42437744140625, -3.269775390625, -3.11517333984375, -2.9605712890625, -2.80596923828125, -2.6513671875, -2.49676513671875, -2.3421630859375, -2.18756103515625, -2.032958984375, -1.87835693359375, -1.7237548828125, -1.56915283203125, -1.41455078125, -1.25994873046875, -1.1053466796875, -0.95074462890625, -0.796142578125, -0.64154052734375, -0.4869384765625, -0.33233642578125, -0.177734375, -0.02313232421875, 0.1314697265625, 0.28607177734375, 0.440673828125, 0.59527587890625, 0.7498779296875, 0.90447998046875, 1.05908203125, 1.21368408203125, 1.3682861328125, 1.52288818359375, 1.677490234375, 1.83209228515625, 1.9866943359375, 2.14129638671875, 2.2958984375, 2.45050048828125, 2.6051025390625, 2.75970458984375, 2.914306640625, 3.06890869140625, 3.2235107421875, 3.37811279296875, 3.53271484375, 3.68731689453125, 3.8419189453125, 3.99652099609375, 4.151123046875, 4.30572509765625, 4.4603271484375, 4.61492919921875, 4.76953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 12.0, 1.0, 4.0, 9.0, 10.0, 7.0, 12.0, 7.0, 10.0, 15.0, 14.0, 24.0, 32.0, 31.0, 27.0, 34.0, 49.0, 48.0, 57.0, 70.0, 102.0, 139.0, 199.0, 1263.0, 193.0, 153.0, 104.0, 63.0, 54.0, 52.0, 41.0, 31.0, 28.0, 23.0, 19.0, 20.0, 11.0, 18.0, 10.0, 15.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-12.296875, -11.9183349609375, -11.539794921875, -11.1612548828125, -10.78271484375, -10.4041748046875, -10.025634765625, -9.6470947265625, -9.2685546875, -8.8900146484375, -8.511474609375, -8.1329345703125, -7.75439453125, -7.3758544921875, -6.997314453125, -6.6187744140625, -6.240234375, -5.8616943359375, -5.483154296875, -5.1046142578125, -4.72607421875, -4.3475341796875, -3.968994140625, -3.5904541015625, -3.2119140625, -2.8333740234375, -2.454833984375, -2.0762939453125, -1.69775390625, -1.3192138671875, -0.940673828125, -0.5621337890625, -0.18359375, 0.1949462890625, 0.573486328125, 0.9520263671875, 1.33056640625, 1.7091064453125, 2.087646484375, 2.4661865234375, 2.8447265625, 3.2232666015625, 3.601806640625, 3.9803466796875, 4.35888671875, 4.7374267578125, 5.115966796875, 5.4945068359375, 5.873046875, 6.2515869140625, 6.630126953125, 7.0086669921875, 7.38720703125, 7.7657470703125, 8.144287109375, 8.5228271484375, 8.9013671875, 9.2799072265625, 9.658447265625, 10.0369873046875, 10.41552734375, 10.7940673828125, 11.172607421875, 11.5511474609375, 11.9296875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 12.0, 17.0, 19.0, 28.0, 33.0, 54.0, 78.0, 82.0, 126.0, 150.0, 228.0, 311.0, 450.0, 722.0, 1243.0, 2136.0, 4468.0, 10167.0, 27395.0, 94993.0, 506575.0, 1917699.0, 446380.0, 86990.0, 25913.0, 9643.0, 4216.0, 2175.0, 1150.0, 709.0, 440.0, 286.0, 215.0, 152.0, 110.0, 67.0, 61.0, 42.0, 36.0, 30.0, 15.0, 21.0, 16.0, 9.0, 5.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.65625, -11.2972412109375, -10.938232421875, -10.5792236328125, -10.22021484375, -9.8612060546875, -9.502197265625, -9.1431884765625, -8.7841796875, -8.4251708984375, -8.066162109375, -7.7071533203125, -7.34814453125, -6.9891357421875, -6.630126953125, -6.2711181640625, -5.912109375, -5.5531005859375, -5.194091796875, -4.8350830078125, -4.47607421875, -4.1170654296875, -3.758056640625, -3.3990478515625, -3.0400390625, -2.6810302734375, -2.322021484375, -1.9630126953125, -1.60400390625, -1.2449951171875, -0.885986328125, -0.5269775390625, -0.16796875, 0.1910400390625, 0.550048828125, 0.9090576171875, 1.26806640625, 1.6270751953125, 1.986083984375, 2.3450927734375, 2.7041015625, 3.0631103515625, 3.422119140625, 3.7811279296875, 4.14013671875, 4.4991455078125, 4.858154296875, 5.2171630859375, 5.576171875, 5.9351806640625, 6.294189453125, 6.6531982421875, 7.01220703125, 7.3712158203125, 7.730224609375, 8.0892333984375, 8.4482421875, 8.8072509765625, 9.166259765625, 9.5252685546875, 9.88427734375, 10.2432861328125, 10.602294921875, 10.9613037109375, 11.3203125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 13.0, 107.0, 491.0, 338.0, 49.0, 13.0, 3.0, 0.0, 0.0, 1.0], "bins": [-445.2985534667969, -437.456787109375, -429.6150207519531, -421.7732238769531, -413.93145751953125, -406.0896911621094, -398.2479248046875, -390.4061279296875, -382.5643615722656, -374.72259521484375, -366.8808288574219, -359.0390319824219, -351.197265625, -343.3554992675781, -335.51373291015625, -327.67193603515625, -319.8301696777344, -311.9884033203125, -304.1466369628906, -296.3048400878906, -288.46307373046875, -280.6213073730469, -272.779541015625, -264.937744140625, -257.0959777832031, -249.25421142578125, -241.4124298095703, -233.57066345214844, -225.7288818359375, -217.88711547851562, -210.0453338623047, -202.2035675048828, -194.36180114746094, -186.52003479003906, -178.67825317382812, -170.83648681640625, -162.9947052001953, -155.15293884277344, -147.3111572265625, -139.46939086914062, -131.6276092529297, -123.78583526611328, -115.94406127929688, -108.10228729248047, -100.26051330566406, -92.41874694824219, -84.57696533203125, -76.73519897460938, -68.89341735839844, -61.05164337158203, -53.209869384765625, -45.36809539794922, -37.52632141113281, -29.684551239013672, -21.842777252197266, -14.00100326538086, -6.159233093261719, 1.6825404167175293, 9.524313926696777, 17.366086959838867, 25.207860946655273, 33.04963302612305, 40.89140701293945, 48.73318099975586, 56.574954986572266]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 5.0, 13.0, 4.0, 6.0, 16.0, 11.0, 16.0, 12.0, 21.0, 24.0, 24.0, 27.0, 29.0, 18.0, 44.0, 31.0, 37.0, 29.0, 40.0, 34.0, 37.0, 37.0, 61.0, 38.0, 39.0, 47.0, 31.0, 38.0, 28.0, 30.0, 23.0, 23.0, 22.0, 21.0, 14.0, 9.0, 9.0, 13.0, 6.0, 7.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.93986129760742, -31.80710792541504, -30.674354553222656, -29.54159927368164, -28.408845901489258, -27.276092529296875, -26.14333724975586, -25.010583877563477, -23.877830505371094, -22.74507713317871, -21.612323760986328, -20.479568481445312, -19.34681510925293, -18.214061737060547, -17.08130645751953, -15.948553085327148, -14.815799713134766, -13.683046340942383, -12.550292015075684, -11.417537689208984, -10.284784317016602, -9.152030944824219, -8.01927661895752, -6.8865227699279785, -5.7537689208984375, -4.6210150718688965, -3.4882612228393555, -2.3555073738098145, -1.2227535247802734, -0.08999967575073242, 1.0427541732788086, 2.1755080223083496, 3.308258056640625, 4.441011905670166, 5.573765754699707, 6.706519603729248, 7.839273452758789, 8.972026824951172, 10.104781150817871, 11.23753547668457, 12.370288848876953, 13.503042221069336, 14.635796546936035, 15.768550872802734, 16.901304244995117, 18.0340576171875, 19.166812896728516, 20.2995662689209, 21.43231964111328, 22.565073013305664, 23.697826385498047, 24.830581665039062, 25.963335037231445, 27.096088409423828, 28.228843688964844, 29.361597061157227, 30.49435043334961, 31.627103805541992, 32.759857177734375, 33.89261245727539, 35.025367736816406, 36.158119201660156, 37.29087448120117, 38.42362594604492, 39.55638122558594]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 6.0, 8.0, 10.0, 12.0, 8.0, 8.0, 9.0, 20.0, 18.0, 18.0, 21.0, 19.0, 28.0, 23.0, 21.0, 33.0, 36.0, 34.0, 37.0, 30.0, 43.0, 43.0, 31.0, 26.0, 33.0, 47.0, 30.0, 35.0, 22.0, 37.0, 21.0, 26.0, 26.0, 19.0, 27.0, 19.0, 17.0, 15.0, 8.0, 7.0, 6.0, 14.0, 7.0, 7.0, 6.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.6640625, -4.52679443359375, -4.3895263671875, -4.25225830078125, -4.114990234375, -3.97772216796875, -3.8404541015625, -3.70318603515625, -3.56591796875, -3.42864990234375, -3.2913818359375, -3.15411376953125, -3.016845703125, -2.87957763671875, -2.7423095703125, -2.60504150390625, -2.4677734375, -2.33050537109375, -2.1932373046875, -2.05596923828125, -1.918701171875, -1.78143310546875, -1.6441650390625, -1.50689697265625, -1.36962890625, -1.23236083984375, -1.0950927734375, -0.95782470703125, -0.820556640625, -0.68328857421875, -0.5460205078125, -0.40875244140625, -0.271484375, -0.13421630859375, 0.0030517578125, 0.14031982421875, 0.277587890625, 0.41485595703125, 0.5521240234375, 0.68939208984375, 0.82666015625, 0.96392822265625, 1.1011962890625, 1.23846435546875, 1.375732421875, 1.51300048828125, 1.6502685546875, 1.78753662109375, 1.9248046875, 2.06207275390625, 2.1993408203125, 2.33660888671875, 2.473876953125, 2.61114501953125, 2.7484130859375, 2.88568115234375, 3.02294921875, 3.16021728515625, 3.2974853515625, 3.43475341796875, 3.572021484375, 3.70928955078125, 3.8465576171875, 3.98382568359375, 4.12109375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 11.0, 8.0, 14.0, 19.0, 28.0, 44.0, 54.0, 72.0, 119.0, 147.0, 203.0, 270.0, 423.0, 576.0, 818.0, 1190.0, 1882.0, 2849.0, 4956.0, 8802.0, 18863.0, 50128.0, 185571.0, 855820.0, 2080893.0, 734155.0, 162894.0, 44920.0, 17290.0, 8303.0, 4652.0, 2832.0, 1705.0, 1173.0, 787.0, 521.0, 376.0, 255.0, 185.0, 148.0, 100.0, 60.0, 52.0, 27.0, 24.0, 9.0, 18.0, 9.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.703125, -7.45819091796875, -7.2132568359375, -6.96832275390625, -6.723388671875, -6.47845458984375, -6.2335205078125, -5.98858642578125, -5.74365234375, -5.49871826171875, -5.2537841796875, -5.00885009765625, -4.763916015625, -4.51898193359375, -4.2740478515625, -4.02911376953125, -3.7841796875, -3.53924560546875, -3.2943115234375, -3.04937744140625, -2.804443359375, -2.55950927734375, -2.3145751953125, -2.06964111328125, -1.82470703125, -1.57977294921875, -1.3348388671875, -1.08990478515625, -0.844970703125, -0.60003662109375, -0.3551025390625, -0.11016845703125, 0.134765625, 0.37969970703125, 0.6246337890625, 0.86956787109375, 1.114501953125, 1.35943603515625, 1.6043701171875, 1.84930419921875, 2.09423828125, 2.33917236328125, 2.5841064453125, 2.82904052734375, 3.073974609375, 3.31890869140625, 3.5638427734375, 3.80877685546875, 4.0537109375, 4.29864501953125, 4.5435791015625, 4.78851318359375, 5.033447265625, 5.27838134765625, 5.5233154296875, 5.76824951171875, 6.01318359375, 6.25811767578125, 6.5030517578125, 6.74798583984375, 6.992919921875, 7.23785400390625, 7.4827880859375, 7.72772216796875, 7.97265625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 14.0, 7.0, 11.0, 15.0, 18.0, 32.0, 54.0, 59.0, 74.0, 107.0, 179.0, 252.0, 393.0, 505.0, 682.0, 554.0, 379.0, 251.0, 127.0, 102.0, 65.0, 52.0, 31.0, 28.0, 16.0, 17.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8125, -9.5098876953125, -9.207275390625, -8.9046630859375, -8.60205078125, -8.2994384765625, -7.996826171875, -7.6942138671875, -7.3916015625, -7.0889892578125, -6.786376953125, -6.4837646484375, -6.18115234375, -5.8785400390625, -5.575927734375, -5.2733154296875, -4.970703125, -4.6680908203125, -4.365478515625, -4.0628662109375, -3.76025390625, -3.4576416015625, -3.155029296875, -2.8524169921875, -2.5498046875, -2.2471923828125, -1.944580078125, -1.6419677734375, -1.33935546875, -1.0367431640625, -0.734130859375, -0.4315185546875, -0.12890625, 0.1737060546875, 0.476318359375, 0.7789306640625, 1.08154296875, 1.3841552734375, 1.686767578125, 1.9893798828125, 2.2919921875, 2.5946044921875, 2.897216796875, 3.1998291015625, 3.50244140625, 3.8050537109375, 4.107666015625, 4.4102783203125, 4.712890625, 5.0155029296875, 5.318115234375, 5.6207275390625, 5.92333984375, 6.2259521484375, 6.528564453125, 6.8311767578125, 7.1337890625, 7.4364013671875, 7.739013671875, 8.0416259765625, 8.34423828125, 8.6468505859375, 8.949462890625, 9.2520751953125, 9.5546875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 16.0, 30.0, 47.0, 75.0, 117.0, 188.0, 327.0, 628.0, 1079.0, 2504.0, 6608.0, 23828.0, 167610.0, 2979044.0, 928226.0, 62954.0, 13081.0, 4184.0, 1781.0, 861.0, 442.0, 267.0, 135.0, 91.0, 48.0, 37.0, 26.0, 10.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.96875, -20.3291015625, -19.689453125, -19.0498046875, -18.41015625, -17.7705078125, -17.130859375, -16.4912109375, -15.8515625, -15.2119140625, -14.572265625, -13.9326171875, -13.29296875, -12.6533203125, -12.013671875, -11.3740234375, -10.734375, -10.0947265625, -9.455078125, -8.8154296875, -8.17578125, -7.5361328125, -6.896484375, -6.2568359375, -5.6171875, -4.9775390625, -4.337890625, -3.6982421875, -3.05859375, -2.4189453125, -1.779296875, -1.1396484375, -0.5, 0.1396484375, 0.779296875, 1.4189453125, 2.05859375, 2.6982421875, 3.337890625, 3.9775390625, 4.6171875, 5.2568359375, 5.896484375, 6.5361328125, 7.17578125, 7.8154296875, 8.455078125, 9.0947265625, 9.734375, 10.3740234375, 11.013671875, 11.6533203125, 12.29296875, 12.9326171875, 13.572265625, 14.2119140625, 14.8515625, 15.4912109375, 16.130859375, 16.7705078125, 17.41015625, 18.0498046875, 18.689453125, 19.3291015625, 19.96875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [3.0, 16.0, 60.0, 348.0, 424.0, 137.0, 23.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.02175521850586, -17.56312370300293, -12.104493141174316, -6.645862579345703, -1.1872310638427734, 4.271400451660156, 9.730030059814453, 15.188663482666016, 20.647293090820312, 26.105924606323242, 31.564556121826172, 37.02318572998047, 42.48181915283203, 47.94044876098633, 53.399078369140625, 58.85771179199219, 64.31634521484375, 69.77497863769531, 75.23360443115234, 80.6922378540039, 86.15087127685547, 91.6094970703125, 97.06813049316406, 102.52676391601562, 107.98538970947266, 113.44402313232422, 118.90264892578125, 124.36128234863281, 129.81991577148438, 135.27854919433594, 140.7371826171875, 146.19580078125, 151.65443420410156, 157.11306762695312, 162.5717010498047, 168.03033447265625, 173.48895263671875, 178.9475860595703, 184.40621948242188, 189.86485290527344, 195.323486328125, 200.78211975097656, 206.24075317382812, 211.69937133789062, 217.1580047607422, 222.61663818359375, 228.0752716064453, 233.53390502929688, 238.99252319335938, 244.45115661621094, 249.9097900390625, 255.368408203125, 260.8270568847656, 266.2856750488281, 271.74432373046875, 277.20294189453125, 282.6615905761719, 288.1202087402344, 293.578857421875, 299.0374755859375, 304.4961242675781, 309.9547424316406, 315.41339111328125, 320.87200927734375, 326.33062744140625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 3.0, 7.0, 6.0, 7.0, 8.0, 9.0, 11.0, 20.0, 21.0, 20.0, 24.0, 28.0, 22.0, 27.0, 28.0, 38.0, 35.0, 43.0, 37.0, 49.0, 54.0, 38.0, 46.0, 44.0, 40.0, 35.0, 30.0, 36.0, 33.0, 25.0, 28.0, 28.0, 16.0, 11.0, 16.0, 10.0, 13.0, 8.0, 9.0, 7.0, 7.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.29015350341797, -26.372365951538086, -25.454578399658203, -24.536788940429688, -23.619001388549805, -22.701213836669922, -21.78342628479004, -20.865638732910156, -19.94784927368164, -19.030061721801758, -18.112274169921875, -17.19448471069336, -16.276697158813477, -15.358909606933594, -14.441122055053711, -13.523334503173828, -12.605546951293945, -11.687759399414062, -10.769970893859863, -9.85218334197998, -8.934394836425781, -8.016607284545898, -7.098819732666016, -6.181031703948975, -5.263243675231934, -4.345455646514893, -3.4276678562164307, -2.5098800659179688, -1.5920920372009277, -0.6743040084838867, 0.2434835433959961, 1.161271572113037, 2.079059600830078, 2.996847629547119, 3.914635419845581, 4.832423210144043, 5.750211238861084, 6.667999267578125, 7.585786819458008, 8.50357437133789, 9.42136287689209, 10.339150428771973, 11.256938934326172, 12.174726486206055, 13.092514038085938, 14.010302543640137, 14.92809009552002, 15.845878601074219, 16.7636661529541, 17.681453704833984, 18.599241256713867, 19.51702880859375, 20.434818267822266, 21.35260581970215, 22.27039337158203, 23.188180923461914, 24.105968475341797, 25.02375602722168, 25.941543579101562, 26.859333038330078, 27.77712059020996, 28.694908142089844, 29.612695693969727, 30.53048324584961, 31.448272705078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 6.0, 9.0, 12.0, 21.0, 17.0, 23.0, 20.0, 35.0, 23.0, 30.0, 35.0, 35.0, 29.0, 41.0, 33.0, 41.0, 33.0, 51.0, 39.0, 37.0, 33.0, 38.0, 37.0, 36.0, 30.0, 26.0, 27.0, 32.0, 32.0, 21.0, 18.0, 16.0, 10.0, 10.0, 6.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.400146484375, -5.23779296875, -5.075439453125, -4.9130859375, -4.750732421875, -4.58837890625, -4.426025390625, -4.263671875, -4.101318359375, -3.93896484375, -3.776611328125, -3.6142578125, -3.451904296875, -3.28955078125, -3.127197265625, -2.96484375, -2.802490234375, -2.64013671875, -2.477783203125, -2.3154296875, -2.153076171875, -1.99072265625, -1.828369140625, -1.666015625, -1.503662109375, -1.34130859375, -1.178955078125, -1.0166015625, -0.854248046875, -0.69189453125, -0.529541015625, -0.3671875, -0.204833984375, -0.04248046875, 0.119873046875, 0.2822265625, 0.444580078125, 0.60693359375, 0.769287109375, 0.931640625, 1.093994140625, 1.25634765625, 1.418701171875, 1.5810546875, 1.743408203125, 1.90576171875, 2.068115234375, 2.23046875, 2.392822265625, 2.55517578125, 2.717529296875, 2.8798828125, 3.042236328125, 3.20458984375, 3.366943359375, 3.529296875, 3.691650390625, 3.85400390625, 4.016357421875, 4.1787109375, 4.341064453125, 4.50341796875, 4.665771484375, 4.828125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 5.0, 10.0, 20.0, 23.0, 47.0, 47.0, 66.0, 110.0, 146.0, 198.0, 281.0, 455.0, 673.0, 932.0, 1283.0, 1884.0, 2638.0, 3964.0, 5737.0, 8309.0, 11807.0, 17408.0, 25686.0, 38718.0, 59696.0, 94983.0, 161028.0, 221048.0, 142178.0, 85234.0, 53966.0, 35153.0, 23267.0, 15762.0, 11014.0, 7736.0, 5168.0, 3605.0, 2540.0, 1689.0, 1268.0, 871.0, 612.0, 404.0, 260.0, 184.0, 144.0, 99.0, 62.0, 49.0, 34.0, 17.0, 16.0, 14.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.140380859375, -0.1359081268310547, -0.13143539428710938, -0.12696266174316406, -0.12248992919921875, -0.11801719665527344, -0.11354446411132812, -0.10907173156738281, -0.1045989990234375, -0.10012626647949219, -0.09565353393554688, -0.09118080139160156, -0.08670806884765625, -0.08223533630371094, -0.07776260375976562, -0.07328987121582031, -0.068817138671875, -0.06434440612792969, -0.059871673583984375, -0.05539894104003906, -0.05092620849609375, -0.04645347595214844, -0.041980743408203125, -0.03750801086425781, -0.0330352783203125, -0.028562545776367188, -0.024089813232421875, -0.019617080688476562, -0.01514434814453125, -0.010671615600585938, -0.006198883056640625, -0.0017261505126953125, 0.00274658203125, 0.0072193145751953125, 0.011692047119140625, 0.016164779663085938, 0.02063751220703125, 0.025110244750976562, 0.029582977294921875, 0.03405570983886719, 0.0385284423828125, 0.04300117492675781, 0.047473907470703125, 0.05194664001464844, 0.05641937255859375, 0.06089210510253906, 0.06536483764648438, 0.06983757019042969, 0.074310302734375, 0.07878303527832031, 0.08325576782226562, 0.08772850036621094, 0.09220123291015625, 0.09667396545410156, 0.10114669799804688, 0.10561943054199219, 0.1100921630859375, 0.11456489562988281, 0.11903762817382812, 0.12351036071777344, 0.12798309326171875, 0.13245582580566406, 0.13692855834960938, 0.1414012908935547, 0.1458740234375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 9.0, 9.0, 8.0, 23.0, 7.0, 27.0, 21.0, 18.0, 19.0, 24.0, 36.0, 29.0, 22.0, 49.0, 25.0, 40.0, 35.0, 34.0, 1070.0, 56.0, 37.0, 42.0, 49.0, 36.0, 23.0, 35.0, 38.0, 33.0, 17.0, 25.0, 12.0, 17.0, 9.0, 13.0, 13.0, 6.0, 8.0, 11.0, 3.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0], "bins": [-4.46875, -4.33966064453125, -4.2105712890625, -4.08148193359375, -3.952392578125, -3.82330322265625, -3.6942138671875, -3.56512451171875, -3.43603515625, -3.30694580078125, -3.1778564453125, -3.04876708984375, -2.919677734375, -2.79058837890625, -2.6614990234375, -2.53240966796875, -2.4033203125, -2.27423095703125, -2.1451416015625, -2.01605224609375, -1.886962890625, -1.75787353515625, -1.6287841796875, -1.49969482421875, -1.37060546875, -1.24151611328125, -1.1124267578125, -0.98333740234375, -0.854248046875, -0.72515869140625, -0.5960693359375, -0.46697998046875, -0.337890625, -0.20880126953125, -0.0797119140625, 0.04937744140625, 0.178466796875, 0.30755615234375, 0.4366455078125, 0.56573486328125, 0.69482421875, 0.82391357421875, 0.9530029296875, 1.08209228515625, 1.211181640625, 1.34027099609375, 1.4693603515625, 1.59844970703125, 1.7275390625, 1.85662841796875, 1.9857177734375, 2.11480712890625, 2.243896484375, 2.37298583984375, 2.5020751953125, 2.63116455078125, 2.76025390625, 2.88934326171875, 3.0184326171875, 3.14752197265625, 3.276611328125, 3.40570068359375, 3.5347900390625, 3.66387939453125, 3.79296875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 11.0, 22.0, 31.0, 23.0, 55.0, 77.0, 101.0, 153.0, 176.0, 282.0, 394.0, 523.0, 805.0, 1070.0, 1625.0, 2154.0, 3116.0, 4411.0, 6118.0, 8910.0, 12948.0, 19168.0, 28479.0, 44137.0, 71601.0, 123191.0, 1200283.0, 256551.0, 115251.0, 67271.0, 41893.0, 27159.0, 17954.0, 12331.0, 8596.0, 5958.0, 4213.0, 2830.0, 2080.0, 1478.0, 1073.0, 709.0, 572.0, 399.0, 287.0, 199.0, 141.0, 104.0, 64.0, 44.0, 36.0, 27.0, 19.0, 11.0, 6.0, 5.0, 2.0, 5.0], "bins": [-0.07073974609375, -0.06859207153320312, -0.06644439697265625, -0.06429672241210938, -0.0621490478515625, -0.060001373291015625, -0.05785369873046875, -0.055706024169921875, -0.053558349609375, -0.051410675048828125, -0.04926300048828125, -0.047115325927734375, -0.0449676513671875, -0.042819976806640625, -0.04067230224609375, -0.038524627685546875, -0.036376953125, -0.034229278564453125, -0.03208160400390625, -0.029933929443359375, -0.0277862548828125, -0.025638580322265625, -0.02349090576171875, -0.021343231201171875, -0.019195556640625, -0.017047882080078125, -0.01490020751953125, -0.012752532958984375, -0.0106048583984375, -0.008457183837890625, -0.00630950927734375, -0.004161834716796875, -0.00201416015625, 0.000133514404296875, 0.00228118896484375, 0.004428863525390625, 0.0065765380859375, 0.008724212646484375, 0.01087188720703125, 0.013019561767578125, 0.015167236328125, 0.017314910888671875, 0.01946258544921875, 0.021610260009765625, 0.0237579345703125, 0.025905609130859375, 0.02805328369140625, 0.030200958251953125, 0.0323486328125, 0.034496307373046875, 0.03664398193359375, 0.038791656494140625, 0.0409393310546875, 0.043087005615234375, 0.04523468017578125, 0.047382354736328125, 0.049530029296875, 0.051677703857421875, 0.05382537841796875, 0.055973052978515625, 0.0581207275390625, 0.060268402099609375, 0.06241607666015625, 0.06456375122070312, 0.06671142578125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 8.0, 6.0, 7.0, 12.0, 9.0, 18.0, 21.0, 46.0, 67.0, 92.0, 149.0, 169.0, 109.0, 84.0, 47.0, 32.0, 22.0, 10.0, 15.0, 12.0, 5.0, 5.0, 6.0, 5.0, 10.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007337108254432678, -0.0007116347551345825, -0.0006895586848258972, -0.0006674826145172119, -0.0006454065442085266, -0.0006233304738998413, -0.000601254403591156, -0.0005791783332824707, -0.0005571022629737854, -0.0005350261926651001, -0.0005129501223564148, -0.0004908740520477295, -0.0004687979817390442, -0.0004467219114303589, -0.0004246458411216736, -0.0004025697708129883, -0.000380493700504303, -0.0003584176301956177, -0.0003363415598869324, -0.00031426548957824707, -0.00029218941926956177, -0.00027011334896087646, -0.00024803727865219116, -0.00022596120834350586, -0.00020388513803482056, -0.00018180906772613525, -0.00015973299741744995, -0.00013765692710876465, -0.00011558085680007935, -9.350478649139404e-05, -7.142871618270874e-05, -4.935264587402344e-05, -2.7276575565338135e-05, -5.200505256652832e-06, 1.687556505203247e-05, 3.8951635360717773e-05, 6.1027705669403076e-05, 8.310377597808838e-05, 0.00010517984628677368, 0.00012725591659545898, 0.0001493319869041443, 0.0001714080572128296, 0.0001934841275215149, 0.0002155601978302002, 0.0002376362681388855, 0.0002597123384475708, 0.0002817884087562561, 0.0003038644790649414, 0.0003259405493736267, 0.000348016619682312, 0.0003700926899909973, 0.0003921687602996826, 0.0004142448306083679, 0.0004363209009170532, 0.0004583969712257385, 0.00048047304153442383, 0.0005025491118431091, 0.0005246251821517944, 0.0005467012524604797, 0.000568777322769165, 0.0005908533930778503, 0.0006129294633865356, 0.000635005533695221, 0.0006570816040039062]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 2.0, 10.0, 2.0, 7.0, 7.0, 6.0, 11.0, 19.0, 17.0, 37.0, 75.0, 113.0, 304.0, 1730.0, 985389.0, 59750.0, 592.0, 209.0, 111.0, 47.0, 27.0, 16.0, 16.0, 7.0, 4.0, 9.0, 6.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01580810546875, -0.015277624130249023, -0.014747142791748047, -0.01421666145324707, -0.013686180114746094, -0.013155698776245117, -0.01262521743774414, -0.012094736099243164, -0.011564254760742188, -0.011033773422241211, -0.010503292083740234, -0.009972810745239258, -0.009442329406738281, -0.008911848068237305, -0.008381366729736328, -0.007850885391235352, -0.007320404052734375, -0.0067899227142333984, -0.006259441375732422, -0.005728960037231445, -0.005198478698730469, -0.004667997360229492, -0.004137516021728516, -0.003607034683227539, -0.0030765533447265625, -0.002546072006225586, -0.0020155906677246094, -0.0014851093292236328, -0.0009546279907226562, -0.0004241466522216797, 0.00010633468627929688, 0.0006368160247802734, 0.00116729736328125, 0.0016977787017822266, 0.002228260040283203, 0.0027587413787841797, 0.0032892227172851562, 0.003819704055786133, 0.004350185394287109, 0.004880666732788086, 0.0054111480712890625, 0.005941629409790039, 0.006472110748291016, 0.007002592086791992, 0.007533073425292969, 0.008063554763793945, 0.008594036102294922, 0.009124517440795898, 0.009654998779296875, 0.010185480117797852, 0.010715961456298828, 0.011246442794799805, 0.011776924133300781, 0.012307405471801758, 0.012837886810302734, 0.013368368148803711, 0.013898849487304688, 0.014429330825805664, 0.01495981216430664, 0.015490293502807617, 0.016020774841308594, 0.01655125617980957, 0.017081737518310547, 0.017612218856811523, 0.0181427001953125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 42.0, 599.0, 341.0, 28.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016375152627006173, -0.0015273196622729301, -0.001417124061845243, -0.0013069284614175558, -0.0011967328609898686, -0.0010865372605621815, -0.0009763416019268334, -0.0008661460014991462, -0.0007559504010714591, -0.0006457548006437719, -0.0005355592002160847, -0.0004253635706845671, -0.0003151679702568799, -0.0002049723407253623, -9.477674029767513e-05, 1.5418860130012035e-05, 0.0001256144605576992, 0.00023581006098538637, 0.00034600566141307354, 0.00045620129094459116, 0.0005663968622684479, 0.000676592520903796, 0.0007867881213314831, 0.0008969837217591703, 0.0010071792639791965, 0.0011173748644068837, 0.0012275704648345709, 0.001337766065262258, 0.0014479616656899452, 0.0015581573825329542, 0.0016683528665453196, 0.0017785485833883286, 0.0018887443002313375, 0.0019989400170743465, 0.002109135501086712, 0.002219331217929721, 0.0023295267019420862, 0.002439722418785095, 0.0025499179027974606, 0.0026601136196404696, 0.002770309103652835, 0.002880504820495844, 0.0029907003045082092, 0.0031008960213512182, 0.0032110915053635836, 0.0033212872222065926, 0.003431482706218958, 0.003541678423061967, 0.003651874139904976, 0.003762069856747985, 0.0038722653407603502, 0.003982461057603359, 0.0040926565416157246, 0.00420285202562809, 0.0043130479753017426, 0.004423243459314108, 0.004533438943326473, 0.004643634427338839, 0.004753830377012491, 0.004864025861024857, 0.004974221345037222, 0.005084416829049587, 0.00519461277872324, 0.005304808262735605, 0.005415003746747971]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 8.0, 10.0, 11.0, 15.0, 10.0, 17.0, 27.0, 32.0, 30.0, 49.0, 36.0, 47.0, 41.0, 45.0, 56.0, 51.0, 53.0, 55.0, 47.0, 41.0, 45.0, 41.0, 46.0, 42.0, 32.0, 20.0, 21.0, 20.0, 14.0, 8.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002808570861816406, -0.0002685869112610817, -0.00025631673634052277, -0.00024404656141996384, -0.0002317763864994049, -0.00021950621157884598, -0.00020723603665828705, -0.00019496586173772812, -0.0001826956868171692, -0.00017042551189661026, -0.00015815533697605133, -0.0001458851620554924, -0.00013361498713493347, -0.00012134481221437454, -0.00010907463729381561, -9.680446237325668e-05, -8.453428745269775e-05, -7.226411253213882e-05, -5.9993937611579895e-05, -4.7723762691020966e-05, -3.5453587770462036e-05, -2.3183412849903107e-05, -1.0913237929344177e-05, 1.3569369912147522e-06, 1.3627111911773682e-05, 2.589728683233261e-05, 3.816746175289154e-05, 5.043763667345047e-05, 6.27078115940094e-05, 7.497798651456833e-05, 8.724816143512726e-05, 9.951833635568619e-05, 0.00011178851127624512, 0.00012405868619680405, 0.00013632886111736298, 0.0001485990360379219, 0.00016086921095848083, 0.00017313938587903976, 0.0001854095607995987, 0.00019767973572015762, 0.00020994991064071655, 0.00022222008556127548, 0.0002344902604818344, 0.00024676043540239334, 0.00025903061032295227, 0.0002713007852435112, 0.00028357096016407013, 0.00029584113508462906, 0.000308111310005188, 0.0003203814849257469, 0.00033265165984630585, 0.0003449218347668648, 0.0003571920096874237, 0.00036946218460798264, 0.00038173235952854156, 0.0003940025344491005, 0.0004062727093696594, 0.00041854288429021835, 0.0004308130592107773, 0.0004430832341313362, 0.00045535340905189514, 0.00046762358397245407, 0.000479893758893013, 0.0004921639338135719, 0.0005044341087341309]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 6.0, 9.0, 12.0, 21.0, 17.0, 23.0, 20.0, 35.0, 23.0, 30.0, 35.0, 35.0, 29.0, 41.0, 33.0, 41.0, 33.0, 51.0, 39.0, 37.0, 33.0, 38.0, 37.0, 36.0, 30.0, 26.0, 27.0, 32.0, 32.0, 21.0, 18.0, 16.0, 10.0, 10.0, 6.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.400146484375, -5.23779296875, -5.075439453125, -4.9130859375, -4.750732421875, -4.58837890625, -4.426025390625, -4.263671875, -4.101318359375, -3.93896484375, -3.776611328125, -3.6142578125, -3.451904296875, -3.28955078125, -3.127197265625, -2.96484375, -2.802490234375, -2.64013671875, -2.477783203125, -2.3154296875, -2.153076171875, -1.99072265625, -1.828369140625, -1.666015625, -1.503662109375, -1.34130859375, -1.178955078125, -1.0166015625, -0.854248046875, -0.69189453125, -0.529541015625, -0.3671875, -0.204833984375, -0.04248046875, 0.119873046875, 0.2822265625, 0.444580078125, 0.60693359375, 0.769287109375, 0.931640625, 1.093994140625, 1.25634765625, 1.418701171875, 1.5810546875, 1.743408203125, 1.90576171875, 2.068115234375, 2.23046875, 2.392822265625, 2.55517578125, 2.717529296875, 2.8798828125, 3.042236328125, 3.20458984375, 3.366943359375, 3.529296875, 3.691650390625, 3.85400390625, 4.016357421875, 4.1787109375, 4.341064453125, 4.50341796875, 4.665771484375, 4.828125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 26.0, 23.0, 36.0, 69.0, 78.0, 132.0, 223.0, 320.0, 450.0, 709.0, 997.0, 1588.0, 2590.0, 3951.0, 6320.0, 10119.0, 15997.0, 24858.0, 40777.0, 71067.0, 142353.0, 288369.0, 204338.0, 96239.0, 52505.0, 31271.0, 19390.0, 12306.0, 7859.0, 4909.0, 3117.0, 1961.0, 1223.0, 844.0, 515.0, 335.0, 189.0, 145.0, 110.0, 67.0, 56.0, 34.0, 24.0, 12.0, 15.0, 9.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75286865234375, -5.5526123046875, -5.35235595703125, -5.152099609375, -4.95184326171875, -4.7515869140625, -4.55133056640625, -4.35107421875, -4.15081787109375, -3.9505615234375, -3.75030517578125, -3.550048828125, -3.34979248046875, -3.1495361328125, -2.94927978515625, -2.7490234375, -2.54876708984375, -2.3485107421875, -2.14825439453125, -1.947998046875, -1.74774169921875, -1.5474853515625, -1.34722900390625, -1.14697265625, -0.94671630859375, -0.7464599609375, -0.54620361328125, -0.345947265625, -0.14569091796875, 0.0545654296875, 0.25482177734375, 0.455078125, 0.65533447265625, 0.8555908203125, 1.05584716796875, 1.256103515625, 1.45635986328125, 1.6566162109375, 1.85687255859375, 2.05712890625, 2.25738525390625, 2.4576416015625, 2.65789794921875, 2.858154296875, 3.05841064453125, 3.2586669921875, 3.45892333984375, 3.6591796875, 3.85943603515625, 4.0596923828125, 4.25994873046875, 4.460205078125, 4.66046142578125, 4.8607177734375, 5.06097412109375, 5.26123046875, 5.46148681640625, 5.6617431640625, 5.86199951171875, 6.062255859375, 6.26251220703125, 6.4627685546875, 6.66302490234375, 6.86328125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 15.0, 10.0, 20.0, 11.0, 27.0, 35.0, 37.0, 30.0, 39.0, 45.0, 34.0, 60.0, 78.0, 112.0, 168.0, 231.0, 1293.0, 186.0, 121.0, 76.0, 68.0, 48.0, 47.0, 45.0, 28.0, 38.0, 28.0, 22.0, 19.0, 16.0, 17.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.546875, -17.073974609375, -16.60107421875, -16.128173828125, -15.6552734375, -15.182373046875, -14.70947265625, -14.236572265625, -13.763671875, -13.290771484375, -12.81787109375, -12.344970703125, -11.8720703125, -11.399169921875, -10.92626953125, -10.453369140625, -9.98046875, -9.507568359375, -9.03466796875, -8.561767578125, -8.0888671875, -7.615966796875, -7.14306640625, -6.670166015625, -6.197265625, -5.724365234375, -5.25146484375, -4.778564453125, -4.3056640625, -3.832763671875, -3.35986328125, -2.886962890625, -2.4140625, -1.941162109375, -1.46826171875, -0.995361328125, -0.5224609375, -0.049560546875, 0.42333984375, 0.896240234375, 1.369140625, 1.842041015625, 2.31494140625, 2.787841796875, 3.2607421875, 3.733642578125, 4.20654296875, 4.679443359375, 5.15234375, 5.625244140625, 6.09814453125, 6.571044921875, 7.0439453125, 7.516845703125, 7.98974609375, 8.462646484375, 8.935546875, 9.408447265625, 9.88134765625, 10.354248046875, 10.8271484375, 11.300048828125, 11.77294921875, 12.245849609375, 12.71875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 3.0, 10.0, 10.0, 18.0, 22.0, 31.0, 54.0, 66.0, 110.0, 163.0, 223.0, 329.0, 462.0, 663.0, 1015.0, 1803.0, 3364.0, 7640.0, 22644.0, 92216.0, 897734.0, 1914844.0, 150484.0, 31920.0, 9869.0, 4151.0, 2104.0, 1292.0, 759.0, 518.0, 341.0, 244.0, 168.0, 126.0, 76.0, 70.0, 39.0, 28.0, 25.0, 16.0, 17.0, 9.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.136474609375, -15.60107421875, -15.065673828125, -14.5302734375, -13.994873046875, -13.45947265625, -12.924072265625, -12.388671875, -11.853271484375, -11.31787109375, -10.782470703125, -10.2470703125, -9.711669921875, -9.17626953125, -8.640869140625, -8.10546875, -7.570068359375, -7.03466796875, -6.499267578125, -5.9638671875, -5.428466796875, -4.89306640625, -4.357666015625, -3.822265625, -3.286865234375, -2.75146484375, -2.216064453125, -1.6806640625, -1.145263671875, -0.60986328125, -0.074462890625, 0.4609375, 0.996337890625, 1.53173828125, 2.067138671875, 2.6025390625, 3.137939453125, 3.67333984375, 4.208740234375, 4.744140625, 5.279541015625, 5.81494140625, 6.350341796875, 6.8857421875, 7.421142578125, 7.95654296875, 8.491943359375, 9.02734375, 9.562744140625, 10.09814453125, 10.633544921875, 11.1689453125, 11.704345703125, 12.23974609375, 12.775146484375, 13.310546875, 13.845947265625, 14.38134765625, 14.916748046875, 15.4521484375, 15.987548828125, 16.52294921875, 17.058349609375, 17.59375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 29.0, 46.0, 177.0, 383.0, 245.0, 86.0, 20.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.758544921875, -214.1777801513672, -207.59701538085938, -201.01625061035156, -194.43548583984375, -187.854736328125, -181.2739715576172, -174.69320678710938, -168.11244201660156, -161.53167724609375, -154.95091247558594, -148.37014770507812, -141.78939819335938, -135.2086181640625, -128.62786865234375, -122.04710388183594, -115.46633911132812, -108.88557434082031, -102.3048095703125, -95.72405242919922, -89.1432876586914, -82.5625228881836, -75.98176574707031, -69.4010009765625, -62.82023620605469, -56.239471435546875, -49.65871047973633, -43.07794952392578, -36.49718475341797, -29.916419982910156, -23.33565902709961, -16.754898071289062, -10.174118041992188, -3.593355178833008, 2.987407684326172, 9.568170547485352, 16.14893341064453, 22.729698181152344, 29.31045913696289, 35.89122009277344, 42.47198486328125, 49.05274963378906, 55.63351058959961, 62.214271545410156, 68.79503631591797, 75.37580108642578, 81.95655822753906, 88.53732299804688, 95.11808776855469, 101.6988525390625, 108.27961730957031, 114.8603744506836, 121.4411392211914, 128.02191162109375, 134.6026611328125, 141.1834259033203, 147.76419067382812, 154.34495544433594, 160.92572021484375, 167.50648498535156, 174.08724975585938, 180.66799926757812, 187.24876403808594, 193.82952880859375, 200.41029357910156]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 8.0, 6.0, 4.0, 12.0, 20.0, 10.0, 14.0, 25.0, 24.0, 15.0, 29.0, 29.0, 20.0, 36.0, 38.0, 26.0, 50.0, 48.0, 43.0, 37.0, 23.0, 35.0, 38.0, 39.0, 34.0, 30.0, 29.0, 45.0, 32.0, 18.0, 37.0, 29.0, 25.0, 14.0, 18.0, 15.0, 8.0, 9.0, 5.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.59511947631836, -36.26951599121094, -34.943912506103516, -33.618309020996094, -32.29270935058594, -30.967103958129883, -29.641502380371094, -28.315898895263672, -26.99029541015625, -25.664691925048828, -24.339088439941406, -23.013486862182617, -21.687883377075195, -20.362279891967773, -19.036678314208984, -17.711074829101562, -16.38547134399414, -15.059867858886719, -13.734265327453613, -12.408662796020508, -11.083059310913086, -9.757455825805664, -8.431853294372559, -7.106250762939453, -5.780647277832031, -4.455044269561768, -3.129441261291504, -1.8038382530212402, -0.47823524475097656, 0.8473677635192871, 2.172970771789551, 3.4985733032226562, 4.8241729736328125, 6.149775981903076, 7.47537899017334, 8.800981521606445, 10.126585006713867, 11.452188491821289, 12.777791023254395, 14.1033935546875, 15.428997039794922, 16.754600524902344, 18.080204010009766, 19.405805587768555, 20.731409072875977, 22.0570125579834, 23.382614135742188, 24.70821762084961, 26.03382110595703, 27.359424591064453, 28.685028076171875, 30.010629653930664, 31.336233139038086, 32.661834716796875, 33.9874382019043, 35.31304168701172, 36.63864517211914, 37.96424865722656, 39.289852142333984, 40.615455627441406, 41.94105529785156, 43.266658782958984, 44.592262268066406, 45.91786575317383, 47.24346923828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 3.0, 10.0, 7.0, 16.0, 6.0, 16.0, 16.0, 10.0, 23.0, 23.0, 25.0, 18.0, 36.0, 34.0, 32.0, 34.0, 31.0, 32.0, 34.0, 41.0, 42.0, 31.0, 32.0, 47.0, 39.0, 31.0, 31.0, 39.0, 39.0, 38.0, 18.0, 30.0, 24.0, 10.0, 16.0, 23.0, 15.0, 11.0, 6.0, 8.0, 1.0, 10.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.890625, -5.71673583984375, -5.5428466796875, -5.36895751953125, -5.195068359375, -5.02117919921875, -4.8472900390625, -4.67340087890625, -4.49951171875, -4.32562255859375, -4.1517333984375, -3.97784423828125, -3.803955078125, -3.63006591796875, -3.4561767578125, -3.28228759765625, -3.1083984375, -2.93450927734375, -2.7606201171875, -2.58673095703125, -2.412841796875, -2.23895263671875, -2.0650634765625, -1.89117431640625, -1.71728515625, -1.54339599609375, -1.3695068359375, -1.19561767578125, -1.021728515625, -0.84783935546875, -0.6739501953125, -0.50006103515625, -0.326171875, -0.15228271484375, 0.0216064453125, 0.19549560546875, 0.369384765625, 0.54327392578125, 0.7171630859375, 0.89105224609375, 1.06494140625, 1.23883056640625, 1.4127197265625, 1.58660888671875, 1.760498046875, 1.93438720703125, 2.1082763671875, 2.28216552734375, 2.4560546875, 2.62994384765625, 2.8038330078125, 2.97772216796875, 3.151611328125, 3.32550048828125, 3.4993896484375, 3.67327880859375, 3.84716796875, 4.02105712890625, 4.1949462890625, 4.36883544921875, 4.542724609375, 4.71661376953125, 4.8905029296875, 5.06439208984375, 5.23828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 5.0, 13.0, 15.0, 23.0, 23.0, 36.0, 45.0, 58.0, 86.0, 127.0, 189.0, 338.0, 647.0, 1914.0, 8705.0, 169969.0, 3963731.0, 40889.0, 4867.0, 1270.0, 501.0, 272.0, 179.0, 80.0, 76.0, 58.0, 46.0, 29.0, 17.0, 18.0, 13.0, 13.0, 9.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.81298828125, -44.2509765625, -42.68896484375, -41.126953125, -39.56494140625, -38.0029296875, -36.44091796875, -34.87890625, -33.31689453125, -31.7548828125, -30.19287109375, -28.630859375, -27.06884765625, -25.5068359375, -23.94482421875, -22.3828125, -20.82080078125, -19.2587890625, -17.69677734375, -16.134765625, -14.57275390625, -13.0107421875, -11.44873046875, -9.88671875, -8.32470703125, -6.7626953125, -5.20068359375, -3.638671875, -2.07666015625, -0.5146484375, 1.04736328125, 2.609375, 4.17138671875, 5.7333984375, 7.29541015625, 8.857421875, 10.41943359375, 11.9814453125, 13.54345703125, 15.10546875, 16.66748046875, 18.2294921875, 19.79150390625, 21.353515625, 22.91552734375, 24.4775390625, 26.03955078125, 27.6015625, 29.16357421875, 30.7255859375, 32.28759765625, 33.849609375, 35.41162109375, 36.9736328125, 38.53564453125, 40.09765625, 41.65966796875, 43.2216796875, 44.78369140625, 46.345703125, 47.90771484375, 49.4697265625, 51.03173828125, 52.59375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 21.0, 17.0, 58.0, 79.0, 164.0, 334.0, 715.0, 1436.0, 720.0, 249.0, 112.0, 75.0, 33.0, 21.0, 7.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.328125, -13.593017578125, -12.85791015625, -12.122802734375, -11.3876953125, -10.652587890625, -9.91748046875, -9.182373046875, -8.447265625, -7.712158203125, -6.97705078125, -6.241943359375, -5.5068359375, -4.771728515625, -4.03662109375, -3.301513671875, -2.56640625, -1.831298828125, -1.09619140625, -0.361083984375, 0.3740234375, 1.109130859375, 1.84423828125, 2.579345703125, 3.314453125, 4.049560546875, 4.78466796875, 5.519775390625, 6.2548828125, 6.989990234375, 7.72509765625, 8.460205078125, 9.1953125, 9.930419921875, 10.66552734375, 11.400634765625, 12.1357421875, 12.870849609375, 13.60595703125, 14.341064453125, 15.076171875, 15.811279296875, 16.54638671875, 17.281494140625, 18.0166015625, 18.751708984375, 19.48681640625, 20.221923828125, 20.95703125, 21.692138671875, 22.42724609375, 23.162353515625, 23.8974609375, 24.632568359375, 25.36767578125, 26.102783203125, 26.837890625, 27.572998046875, 28.30810546875, 29.043212890625, 29.7783203125, 30.513427734375, 31.24853515625, 31.983642578125, 32.71875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 10.0, 12.0, 22.0, 27.0, 68.0, 163.0, 394.0, 938.0, 3039.0, 15951.0, 1631968.0, 2519084.0, 17629.0, 3273.0, 1018.0, 362.0, 150.0, 71.0, 44.0, 19.0, 18.0, 8.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.71875, -41.81982421875, -39.9208984375, -38.02197265625, -36.123046875, -34.22412109375, -32.3251953125, -30.42626953125, -28.52734375, -26.62841796875, -24.7294921875, -22.83056640625, -20.931640625, -19.03271484375, -17.1337890625, -15.23486328125, -13.3359375, -11.43701171875, -9.5380859375, -7.63916015625, -5.740234375, -3.84130859375, -1.9423828125, -0.04345703125, 1.85546875, 3.75439453125, 5.6533203125, 7.55224609375, 9.451171875, 11.35009765625, 13.2490234375, 15.14794921875, 17.046875, 18.94580078125, 20.8447265625, 22.74365234375, 24.642578125, 26.54150390625, 28.4404296875, 30.33935546875, 32.23828125, 34.13720703125, 36.0361328125, 37.93505859375, 39.833984375, 41.73291015625, 43.6318359375, 45.53076171875, 47.4296875, 49.32861328125, 51.2275390625, 53.12646484375, 55.025390625, 56.92431640625, 58.8232421875, 60.72216796875, 62.62109375, 64.52001953125, 66.4189453125, 68.31787109375, 70.216796875, 72.11572265625, 74.0146484375, 75.91357421875, 77.8125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [2.0, 105.0, 740.0, 170.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.89746856689453, -22.230972290039062, -8.564477920532227, 5.102016448974609, 18.768512725830078, 32.43500518798828, 46.10150146484375, 59.76799774169922, 73.43449401855469, 87.10099029541016, 100.76748657226562, 114.43397521972656, 128.10047912597656, 141.7669677734375, 155.4334716796875, 169.09996032714844, 182.76644897460938, 196.4329376220703, 210.0994415283203, 223.76593017578125, 237.43243408203125, 251.0989227294922, 264.7654113769531, 278.4319152832031, 292.0984191894531, 305.7649230957031, 319.431396484375, 333.097900390625, 346.764404296875, 360.430908203125, 374.0973815917969, 387.7638854980469, 401.4303894042969, 415.0968933105469, 428.76336669921875, 442.42987060546875, 456.09637451171875, 469.76287841796875, 483.4293518066406, 497.0958557128906, 510.7623596191406, 524.4288330078125, 538.0953369140625, 551.7618408203125, 565.4283447265625, 579.0948486328125, 592.7613525390625, 606.4278564453125, 620.0942993164062, 633.7608032226562, 647.4273071289062, 661.0938110351562, 674.76025390625, 688.4267578125, 702.09326171875, 715.759765625, 729.42626953125, 743.0927734375, 756.75927734375, 770.42578125, 784.0922241210938, 797.7587280273438, 811.4252319335938, 825.0917358398438, 838.7582397460938]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 7.0, 12.0, 10.0, 11.0, 10.0, 20.0, 26.0, 22.0, 30.0, 30.0, 42.0, 44.0, 38.0, 54.0, 51.0, 53.0, 44.0, 31.0, 36.0, 38.0, 34.0, 44.0, 45.0, 33.0, 38.0, 23.0, 29.0, 21.0, 31.0, 15.0, 16.0, 13.0, 6.0, 5.0, 11.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.707557678222656, -38.42266845703125, -37.13777542114258, -35.852882385253906, -34.5679931640625, -33.283103942871094, -31.998210906982422, -30.713319778442383, -29.428428649902344, -28.143537521362305, -26.858646392822266, -25.573755264282227, -24.288864135742188, -23.00397300720215, -21.71908187866211, -20.43419075012207, -19.14929962158203, -17.864408493041992, -16.579517364501953, -15.294626235961914, -14.009735107421875, -12.724843978881836, -11.439952850341797, -10.155061721801758, -8.870170593261719, -7.58527946472168, -6.300388336181641, -5.015497207641602, -3.7306060791015625, -2.4457149505615234, -1.1608238220214844, 0.12406730651855469, 1.4089622497558594, 2.6938533782958984, 3.9787445068359375, 5.263635635375977, 6.548526763916016, 7.833417892456055, 9.118309020996094, 10.403200149536133, 11.688091278076172, 12.972982406616211, 14.25787353515625, 15.542764663696289, 16.827655792236328, 18.112546920776367, 19.397438049316406, 20.682329177856445, 21.967220306396484, 23.252111434936523, 24.537002563476562, 25.8218936920166, 27.10678482055664, 28.39167594909668, 29.67656707763672, 30.961458206176758, 32.2463493347168, 33.53124237060547, 34.816131591796875, 36.10102081298828, 37.38591384887695, 38.670806884765625, 39.95569610595703, 41.24058532714844, 42.52547836303711]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 6.0, 8.0, 17.0, 13.0, 19.0, 16.0, 28.0, 26.0, 30.0, 46.0, 30.0, 35.0, 34.0, 34.0, 35.0, 43.0, 41.0, 52.0, 50.0, 46.0, 44.0, 48.0, 31.0, 32.0, 20.0, 31.0, 32.0, 27.0, 20.0, 16.0, 13.0, 13.0, 16.0, 10.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.7242431640625, -5.526611328125, -5.3289794921875, -5.13134765625, -4.9337158203125, -4.736083984375, -4.5384521484375, -4.3408203125, -4.1431884765625, -3.945556640625, -3.7479248046875, -3.55029296875, -3.3526611328125, -3.155029296875, -2.9573974609375, -2.759765625, -2.5621337890625, -2.364501953125, -2.1668701171875, -1.96923828125, -1.7716064453125, -1.573974609375, -1.3763427734375, -1.1787109375, -0.9810791015625, -0.783447265625, -0.5858154296875, -0.38818359375, -0.1905517578125, 0.007080078125, 0.2047119140625, 0.40234375, 0.5999755859375, 0.797607421875, 0.9952392578125, 1.19287109375, 1.3905029296875, 1.588134765625, 1.7857666015625, 1.9833984375, 2.1810302734375, 2.378662109375, 2.5762939453125, 2.77392578125, 2.9715576171875, 3.169189453125, 3.3668212890625, 3.564453125, 3.7620849609375, 3.959716796875, 4.1573486328125, 4.35498046875, 4.5526123046875, 4.750244140625, 4.9478759765625, 5.1455078125, 5.3431396484375, 5.540771484375, 5.7384033203125, 5.93603515625, 6.1336669921875, 6.331298828125, 6.5289306640625, 6.7265625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 10.0, 23.0, 28.0, 31.0, 73.0, 105.0, 149.0, 222.0, 352.0, 550.0, 871.0, 1376.0, 2100.0, 3465.0, 5733.0, 9373.0, 15598.0, 26042.0, 45571.0, 81833.0, 154295.0, 263621.0, 196452.0, 103565.0, 56464.0, 31967.0, 19120.0, 11473.0, 6814.0, 4158.0, 2655.0, 1645.0, 1020.0, 612.0, 378.0, 259.0, 188.0, 122.0, 82.0, 52.0, 31.0, 19.0, 13.0, 10.0, 12.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2080078125, -0.20183372497558594, -0.19565963745117188, -0.1894855499267578, -0.18331146240234375, -0.1771373748779297, -0.17096328735351562, -0.16478919982910156, -0.1586151123046875, -0.15244102478027344, -0.14626693725585938, -0.1400928497314453, -0.13391876220703125, -0.1277446746826172, -0.12157058715820312, -0.11539649963378906, -0.109222412109375, -0.10304832458496094, -0.09687423706054688, -0.09070014953613281, -0.08452606201171875, -0.07835197448730469, -0.07217788696289062, -0.06600379943847656, -0.0598297119140625, -0.05365562438964844, -0.047481536865234375, -0.04130744934082031, -0.03513336181640625, -0.028959274291992188, -0.022785186767578125, -0.016611099243164062, -0.01043701171875, -0.0042629241943359375, 0.001911163330078125, 0.008085250854492188, 0.01425933837890625, 0.020433425903320312, 0.026607513427734375, 0.03278160095214844, 0.0389556884765625, 0.04512977600097656, 0.051303863525390625, 0.05747795104980469, 0.06365203857421875, 0.06982612609863281, 0.07600021362304688, 0.08217430114746094, 0.088348388671875, 0.09452247619628906, 0.10069656372070312, 0.10687065124511719, 0.11304473876953125, 0.11921882629394531, 0.12539291381835938, 0.13156700134277344, 0.1377410888671875, 0.14391517639160156, 0.15008926391601562, 0.1562633514404297, 0.16243743896484375, 0.1686115264892578, 0.17478561401367188, 0.18095970153808594, 0.1871337890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 12.0, 11.0, 9.0, 11.0, 17.0, 21.0, 14.0, 24.0, 25.0, 25.0, 27.0, 30.0, 34.0, 33.0, 46.0, 48.0, 55.0, 45.0, 1079.0, 49.0, 43.0, 41.0, 28.0, 52.0, 31.0, 28.0, 19.0, 17.0, 26.0, 22.0, 20.0, 18.0, 10.0, 13.0, 12.0, 5.0, 8.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.19921875, -6.02752685546875, -5.8558349609375, -5.68414306640625, -5.512451171875, -5.34075927734375, -5.1690673828125, -4.99737548828125, -4.82568359375, -4.65399169921875, -4.4822998046875, -4.31060791015625, -4.138916015625, -3.96722412109375, -3.7955322265625, -3.62384033203125, -3.4521484375, -3.28045654296875, -3.1087646484375, -2.93707275390625, -2.765380859375, -2.59368896484375, -2.4219970703125, -2.25030517578125, -2.07861328125, -1.90692138671875, -1.7352294921875, -1.56353759765625, -1.391845703125, -1.22015380859375, -1.0484619140625, -0.87677001953125, -0.705078125, -0.53338623046875, -0.3616943359375, -0.19000244140625, -0.018310546875, 0.15338134765625, 0.3250732421875, 0.49676513671875, 0.66845703125, 0.84014892578125, 1.0118408203125, 1.18353271484375, 1.355224609375, 1.52691650390625, 1.6986083984375, 1.87030029296875, 2.0419921875, 2.21368408203125, 2.3853759765625, 2.55706787109375, 2.728759765625, 2.90045166015625, 3.0721435546875, 3.24383544921875, 3.41552734375, 3.58721923828125, 3.7589111328125, 3.93060302734375, 4.102294921875, 4.27398681640625, 4.4456787109375, 4.61737060546875, 4.7890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 7.0, 10.0, 11.0, 12.0, 21.0, 37.0, 52.0, 57.0, 96.0, 109.0, 178.0, 234.0, 373.0, 559.0, 850.0, 1253.0, 1891.0, 2841.0, 4538.0, 7006.0, 10963.0, 17213.0, 28047.0, 46035.0, 80060.0, 143195.0, 1290677.0, 195928.0, 107408.0, 60800.0, 35771.0, 21785.0, 13867.0, 8854.0, 5571.0, 3760.0, 2385.0, 1614.0, 999.0, 664.0, 486.0, 312.0, 193.0, 128.0, 86.0, 67.0, 43.0, 21.0, 14.0, 14.0, 12.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0], "bins": [-0.0875244140625, -0.08485221862792969, -0.08218002319335938, -0.07950782775878906, -0.07683563232421875, -0.07416343688964844, -0.07149124145507812, -0.06881904602050781, -0.0661468505859375, -0.06347465515136719, -0.060802459716796875, -0.05813026428222656, -0.05545806884765625, -0.05278587341308594, -0.050113677978515625, -0.04744148254394531, -0.044769287109375, -0.04209709167480469, -0.039424896240234375, -0.03675270080566406, -0.03408050537109375, -0.03140830993652344, -0.028736114501953125, -0.026063919067382812, -0.0233917236328125, -0.020719528198242188, -0.018047332763671875, -0.015375137329101562, -0.01270294189453125, -0.010030746459960938, -0.007358551025390625, -0.0046863555908203125, -0.00201416015625, 0.0006580352783203125, 0.003330230712890625, 0.0060024261474609375, 0.00867462158203125, 0.011346817016601562, 0.014019012451171875, 0.016691207885742188, 0.0193634033203125, 0.022035598754882812, 0.024707794189453125, 0.027379989624023438, 0.03005218505859375, 0.03272438049316406, 0.035396575927734375, 0.03806877136230469, 0.040740966796875, 0.04341316223144531, 0.046085357666015625, 0.04875755310058594, 0.05142974853515625, 0.05410194396972656, 0.056774139404296875, 0.05944633483886719, 0.0621185302734375, 0.06479072570800781, 0.06746292114257812, 0.07013511657714844, 0.07280731201171875, 0.07547950744628906, 0.07815170288085938, 0.08082389831542969, 0.08349609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 5.0, 11.0, 14.0, 7.0, 11.0, 20.0, 12.0, 19.0, 24.0, 27.0, 39.0, 34.0, 72.0, 76.0, 107.0, 87.0, 78.0, 55.0, 43.0, 39.0, 48.0, 19.0, 16.0, 15.0, 16.0, 11.0, 16.0, 12.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005183219909667969, -0.0005003586411476135, -0.0004823952913284302, -0.0004644319415092468, -0.0004464685916900635, -0.0004285052418708801, -0.0004105418920516968, -0.00039257854223251343, -0.0003746151924133301, -0.00035665184259414673, -0.0003386884927749634, -0.00032072514295578003, -0.0003027617931365967, -0.00028479844331741333, -0.00026683509349823, -0.00024887174367904663, -0.00023090839385986328, -0.00021294504404067993, -0.00019498169422149658, -0.00017701834440231323, -0.00015905499458312988, -0.00014109164476394653, -0.00012312829494476318, -0.00010516494512557983, -8.720159530639648e-05, -6.923824548721313e-05, -5.1274895668029785e-05, -3.3311545848846436e-05, -1.5348196029663086e-05, 2.6151537895202637e-06, 2.0578503608703613e-05, 3.854185342788696e-05, 5.650520324707031e-05, 7.446855306625366e-05, 9.243190288543701e-05, 0.00011039525270462036, 0.0001283586025238037, 0.00014632195234298706, 0.0001642853021621704, 0.00018224865198135376, 0.0002002120018005371, 0.00021817535161972046, 0.0002361387014389038, 0.00025410205125808716, 0.0002720654010772705, 0.00029002875089645386, 0.0003079921007156372, 0.00032595545053482056, 0.0003439188003540039, 0.00036188215017318726, 0.0003798454999923706, 0.00039780884981155396, 0.0004157721996307373, 0.00043373554944992065, 0.000451698899269104, 0.00046966224908828735, 0.0004876255989074707, 0.000505588948726654, 0.0005235522985458374, 0.0005415156483650208, 0.0005594789981842041, 0.0005774423480033875, 0.0005954056978225708, 0.0006133690476417542, 0.0006313323974609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 10.0, 17.0, 17.0, 20.0, 20.0, 28.0, 39.0, 74.0, 92.0, 194.0, 359.0, 1980.0, 264832.0, 776533.0, 3268.0, 489.0, 189.0, 110.0, 58.0, 34.0, 25.0, 18.0, 24.0, 11.0, 9.0, 16.0, 11.0, 8.0, 9.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.01486968994140625, -0.014445781707763672, -0.014021873474121094, -0.013597965240478516, -0.013174057006835938, -0.01275014877319336, -0.012326240539550781, -0.011902332305908203, -0.011478424072265625, -0.011054515838623047, -0.010630607604980469, -0.01020669937133789, -0.009782791137695312, -0.009358882904052734, -0.008934974670410156, -0.008511066436767578, -0.008087158203125, -0.007663249969482422, -0.007239341735839844, -0.006815433502197266, -0.0063915252685546875, -0.005967617034912109, -0.005543708801269531, -0.005119800567626953, -0.004695892333984375, -0.004271984100341797, -0.0038480758666992188, -0.0034241676330566406, -0.0030002593994140625, -0.0025763511657714844, -0.0021524429321289062, -0.0017285346984863281, -0.00130462646484375, -0.0008807182312011719, -0.00045680999755859375, -3.2901763916015625e-05, 0.0003910064697265625, 0.0008149147033691406, 0.0012388229370117188, 0.0016627311706542969, 0.002086639404296875, 0.002510547637939453, 0.0029344558715820312, 0.0033583641052246094, 0.0037822723388671875, 0.004206180572509766, 0.004630088806152344, 0.005053997039794922, 0.0054779052734375, 0.005901813507080078, 0.006325721740722656, 0.006749629974365234, 0.0071735382080078125, 0.007597446441650391, 0.008021354675292969, 0.008445262908935547, 0.008869171142578125, 0.009293079376220703, 0.009716987609863281, 0.01014089584350586, 0.010564804077148438, 0.010988712310791016, 0.011412620544433594, 0.011836528778076172, 0.01226043701171875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 33.0, 247.0, 601.0, 111.0, 15.0, 4.0], "bins": [-0.0061801765114068985, -0.006077658850699663, -0.0059751407243311405, -0.005872623063623905, -0.00577010540291667, -0.005667587276548147, -0.005565069615840912, -0.005462551489472389, -0.005360033828765154, -0.0052575161680579185, -0.005154998041689396, -0.005052480380982161, -0.004949962720274925, -0.004847444593906403, -0.004744926933199167, -0.004642409272491932, -0.004539891146123409, -0.004437373485416174, -0.004334855359047651, -0.004232337698340416, -0.004129820037633181, -0.004027301911264658, -0.003924784250557423, -0.0038222663570195436, -0.0037197486963123083, -0.0036172308027744293, -0.003514713142067194, -0.003412195248529315, -0.003309677354991436, -0.0032071596942842007, -0.0031046418007463217, -0.0030021239072084427, -0.0028996060136705637, -0.0027970881201326847, -0.0026945704594254494, -0.0025920525658875704, -0.0024895346723496914, -0.002387017011642456, -0.002284499118104577, -0.002181981224566698, -0.0020794635638594627, -0.0019769456703215837, -0.0018744278931990266, -0.0017719101160764694, -0.0016693922225385904, -0.0015668744454160333, -0.001464356668293476, -0.0013618387747555971, -0.0012593208812177181, -0.001156803104095161, -0.001054285210557282, -0.0009517674334347248, -0.0008492495398968458, -0.0007467317627742887, -0.0006442139274440706, -0.0005416960921138525, -0.00043917822767980397, -0.0003366603923495859, -0.00023414257157128304, -0.0001316247507929802, -2.9106915462762117e-05, 7.34108907636255e-05, 0.00017592872609384358, 0.00027844656142406166, 0.00038096439675427973]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 5.0, 16.0, 14.0, 11.0, 15.0, 22.0, 18.0, 30.0, 24.0, 28.0, 28.0, 36.0, 43.0, 41.0, 40.0, 37.0, 35.0, 57.0, 55.0, 46.0, 40.0, 41.0, 37.0, 43.0, 23.0, 20.0, 16.0, 28.0, 21.0, 19.0, 9.0, 14.0, 10.0, 10.0, 9.0, 8.0, 9.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00036454200744628906, -0.0003531603142619133, -0.00034177862107753754, -0.0003303969278931618, -0.000319015234708786, -0.00030763354152441025, -0.0002962518483400345, -0.0002848701551556587, -0.00027348846197128296, -0.0002621067687869072, -0.00025072507560253143, -0.00023934338241815567, -0.0002279616892337799, -0.00021657999604940414, -0.00020519830286502838, -0.00019381660968065262, -0.00018243491649627686, -0.0001710532233119011, -0.00015967153012752533, -0.00014828983694314957, -0.0001369081437587738, -0.00012552645057439804, -0.00011414475739002228, -0.00010276306420564651, -9.138137102127075e-05, -7.999967783689499e-05, -6.861798465251923e-05, -5.723629146814346e-05, -4.58545982837677e-05, -3.447290509939194e-05, -2.3091211915016174e-05, -1.1709518730640411e-05, -3.2782554626464844e-07, 1.1053867638111115e-05, 2.2435560822486877e-05, 3.381725400686264e-05, 4.51989471912384e-05, 5.6580640375614166e-05, 6.796233355998993e-05, 7.934402674436569e-05, 9.072571992874146e-05, 0.00010210741311311722, 0.00011348910629749298, 0.00012487079948186874, 0.0001362524926662445, 0.00014763418585062027, 0.00015901587903499603, 0.0001703975722193718, 0.00018177926540374756, 0.00019316095858812332, 0.00020454265177249908, 0.00021592434495687485, 0.0002273060381412506, 0.00023868773132562637, 0.00025006942451000214, 0.0002614511176943779, 0.00027283281087875366, 0.0002842145040631294, 0.0002955961972475052, 0.00030697789043188095, 0.0003183595836162567, 0.0003297412768006325, 0.00034112296998500824, 0.000352504663169384, 0.00036388635635375977]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 6.0, 8.0, 17.0, 13.0, 19.0, 16.0, 28.0, 26.0, 30.0, 46.0, 30.0, 35.0, 34.0, 34.0, 35.0, 43.0, 41.0, 52.0, 50.0, 46.0, 44.0, 48.0, 31.0, 32.0, 20.0, 31.0, 32.0, 27.0, 20.0, 16.0, 13.0, 13.0, 16.0, 10.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.7242431640625, -5.526611328125, -5.3289794921875, -5.13134765625, -4.9337158203125, -4.736083984375, -4.5384521484375, -4.3408203125, -4.1431884765625, -3.945556640625, -3.7479248046875, -3.55029296875, -3.3526611328125, -3.155029296875, -2.9573974609375, -2.759765625, -2.5621337890625, -2.364501953125, -2.1668701171875, -1.96923828125, -1.7716064453125, -1.573974609375, -1.3763427734375, -1.1787109375, -0.9810791015625, -0.783447265625, -0.5858154296875, -0.38818359375, -0.1905517578125, 0.007080078125, 0.2047119140625, 0.40234375, 0.5999755859375, 0.797607421875, 0.9952392578125, 1.19287109375, 1.3905029296875, 1.588134765625, 1.7857666015625, 1.9833984375, 2.1810302734375, 2.378662109375, 2.5762939453125, 2.77392578125, 2.9715576171875, 3.169189453125, 3.3668212890625, 3.564453125, 3.7620849609375, 3.959716796875, 4.1573486328125, 4.35498046875, 4.5526123046875, 4.750244140625, 4.9478759765625, 5.1455078125, 5.3431396484375, 5.540771484375, 5.7384033203125, 5.93603515625, 6.1336669921875, 6.331298828125, 6.5289306640625, 6.7265625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 11.0, 8.0, 13.0, 14.0, 32.0, 63.0, 129.0, 258.0, 539.0, 1497.0, 4147.0, 16373.0, 83455.0, 490559.0, 372037.0, 61172.0, 12546.0, 3565.0, 1139.0, 506.0, 219.0, 107.0, 52.0, 35.0, 15.0, 12.0, 13.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-23.390625, -22.679931640625, -21.96923828125, -21.258544921875, -20.5478515625, -19.837158203125, -19.12646484375, -18.415771484375, -17.705078125, -16.994384765625, -16.28369140625, -15.572998046875, -14.8623046875, -14.151611328125, -13.44091796875, -12.730224609375, -12.01953125, -11.308837890625, -10.59814453125, -9.887451171875, -9.1767578125, -8.466064453125, -7.75537109375, -7.044677734375, -6.333984375, -5.623291015625, -4.91259765625, -4.201904296875, -3.4912109375, -2.780517578125, -2.06982421875, -1.359130859375, -0.6484375, 0.062255859375, 0.77294921875, 1.483642578125, 2.1943359375, 2.905029296875, 3.61572265625, 4.326416015625, 5.037109375, 5.747802734375, 6.45849609375, 7.169189453125, 7.8798828125, 8.590576171875, 9.30126953125, 10.011962890625, 10.72265625, 11.433349609375, 12.14404296875, 12.854736328125, 13.5654296875, 14.276123046875, 14.98681640625, 15.697509765625, 16.408203125, 17.118896484375, 17.82958984375, 18.540283203125, 19.2509765625, 19.961669921875, 20.67236328125, 21.383056640625, 22.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 17.0, 16.0, 24.0, 23.0, 37.0, 30.0, 64.0, 63.0, 79.0, 109.0, 187.0, 293.0, 1342.0, 187.0, 131.0, 100.0, 71.0, 49.0, 54.0, 32.0, 28.0, 23.0, 20.0, 11.0, 8.0, 12.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.9375, -17.32177734375, -16.7060546875, -16.09033203125, -15.474609375, -14.85888671875, -14.2431640625, -13.62744140625, -13.01171875, -12.39599609375, -11.7802734375, -11.16455078125, -10.548828125, -9.93310546875, -9.3173828125, -8.70166015625, -8.0859375, -7.47021484375, -6.8544921875, -6.23876953125, -5.623046875, -5.00732421875, -4.3916015625, -3.77587890625, -3.16015625, -2.54443359375, -1.9287109375, -1.31298828125, -0.697265625, -0.08154296875, 0.5341796875, 1.14990234375, 1.765625, 2.38134765625, 2.9970703125, 3.61279296875, 4.228515625, 4.84423828125, 5.4599609375, 6.07568359375, 6.69140625, 7.30712890625, 7.9228515625, 8.53857421875, 9.154296875, 9.77001953125, 10.3857421875, 11.00146484375, 11.6171875, 12.23291015625, 12.8486328125, 13.46435546875, 14.080078125, 14.69580078125, 15.3115234375, 15.92724609375, 16.54296875, 17.15869140625, 17.7744140625, 18.39013671875, 19.005859375, 19.62158203125, 20.2373046875, 20.85302734375, 21.46875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 12.0, 12.0, 15.0, 35.0, 37.0, 53.0, 79.0, 114.0, 155.0, 213.0, 333.0, 571.0, 1068.0, 3763.0, 50418.0, 2942086.0, 137825.0, 5739.0, 1326.0, 668.0, 385.0, 263.0, 174.0, 113.0, 84.0, 53.0, 35.0, 33.0, 27.0, 5.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.4189453125, -38.087890625, -36.7568359375, -35.42578125, -34.0947265625, -32.763671875, -31.4326171875, -30.1015625, -28.7705078125, -27.439453125, -26.1083984375, -24.77734375, -23.4462890625, -22.115234375, -20.7841796875, -19.453125, -18.1220703125, -16.791015625, -15.4599609375, -14.12890625, -12.7978515625, -11.466796875, -10.1357421875, -8.8046875, -7.4736328125, -6.142578125, -4.8115234375, -3.48046875, -2.1494140625, -0.818359375, 0.5126953125, 1.84375, 3.1748046875, 4.505859375, 5.8369140625, 7.16796875, 8.4990234375, 9.830078125, 11.1611328125, 12.4921875, 13.8232421875, 15.154296875, 16.4853515625, 17.81640625, 19.1474609375, 20.478515625, 21.8095703125, 23.140625, 24.4716796875, 25.802734375, 27.1337890625, 28.46484375, 29.7958984375, 31.126953125, 32.4580078125, 33.7890625, 35.1201171875, 36.451171875, 37.7822265625, 39.11328125, 40.4443359375, 41.775390625, 43.1064453125, 44.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 21.0, 47.0, 122.0, 239.0, 286.0, 176.0, 77.0, 27.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.66944885253906, -95.56439971923828, -91.4593505859375, -87.35430145263672, -83.24925231933594, -79.14420318603516, -75.03915405273438, -70.9341049194336, -66.82905578613281, -62.72400665283203, -58.61895751953125, -54.51390838623047, -50.40885925292969, -46.303810119628906, -42.198760986328125, -38.093711853027344, -33.98866271972656, -29.88361358642578, -25.778564453125, -21.67351531982422, -17.568466186523438, -13.463417053222656, -9.358367919921875, -5.253318786621094, -1.1482696533203125, 2.9567794799804688, 7.06182861328125, 11.166877746582031, 15.271926879882812, 19.376976013183594, 23.482025146484375, 27.587074279785156, 31.692108154296875, 35.797157287597656, 39.90220642089844, 44.00725555419922, 48.1123046875, 52.21735382080078, 56.32240295410156, 60.427452087402344, 64.53250122070312, 68.6375503540039, 72.74259948730469, 76.84764862060547, 80.95269775390625, 85.05774688720703, 89.16279602050781, 93.2678451538086, 97.37289428710938, 101.47794342041016, 105.58299255371094, 109.68804168701172, 113.7930908203125, 117.89813995361328, 122.00318908691406, 126.10823822021484, 130.21328735351562, 134.31832885742188, 138.4233856201172, 142.5284423828125, 146.63348388671875, 150.738525390625, 154.8435821533203, 158.94863891601562, 163.05368041992188]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 10.0, 5.0, 7.0, 11.0, 12.0, 14.0, 18.0, 17.0, 31.0, 21.0, 28.0, 23.0, 27.0, 39.0, 39.0, 32.0, 27.0, 38.0, 40.0, 43.0, 50.0, 45.0, 38.0, 44.0, 32.0, 37.0, 35.0, 36.0, 25.0, 24.0, 23.0, 23.0, 13.0, 16.0, 11.0, 11.0, 11.0, 6.0, 5.0, 7.0, 7.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.98893356323242, -49.46489715576172, -47.94085693359375, -46.41682052612305, -44.892784118652344, -43.368743896484375, -41.84470748901367, -40.32067108154297, -38.796630859375, -37.2725944519043, -35.74855422973633, -34.224517822265625, -32.700477600097656, -31.176441192626953, -29.65240478515625, -28.128366470336914, -26.604328155517578, -25.080289840698242, -23.556251525878906, -22.032215118408203, -20.508176803588867, -18.98413848876953, -17.460102081298828, -15.936063766479492, -14.412025451660156, -12.88798713684082, -11.3639497756958, -9.839912414550781, -8.315874099731445, -6.791836261749268, -5.26779842376709, -3.7437610626220703, -2.2197265625, -0.6956887245178223, 0.8283491134643555, 2.352386951446533, 3.876424789428711, 5.400462627410889, 6.924500465393066, 8.448537826538086, 9.972576141357422, 11.496614456176758, 13.020651817321777, 14.544689178466797, 16.068727493286133, 17.59276580810547, 19.116802215576172, 20.640840530395508, 22.164878845214844, 23.68891716003418, 25.212955474853516, 26.73699188232422, 28.261030197143555, 29.78506851196289, 31.309104919433594, 32.83314514160156, 34.357181549072266, 35.88121795654297, 37.40525817871094, 38.92929458618164, 40.453330993652344, 41.97737121582031, 43.501407623291016, 45.02544403076172, 46.54948425292969]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 6.0, 9.0, 13.0, 12.0, 13.0, 17.0, 25.0, 22.0, 28.0, 36.0, 29.0, 31.0, 33.0, 40.0, 40.0, 47.0, 43.0, 42.0, 45.0, 44.0, 49.0, 46.0, 39.0, 33.0, 28.0, 24.0, 32.0, 24.0, 24.0, 19.0, 10.0, 15.0, 18.0, 6.0, 9.0, 14.0, 3.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.52154541015625, -6.3282470703125, -6.13494873046875, -5.941650390625, -5.74835205078125, -5.5550537109375, -5.36175537109375, -5.16845703125, -4.97515869140625, -4.7818603515625, -4.58856201171875, -4.395263671875, -4.20196533203125, -4.0086669921875, -3.81536865234375, -3.6220703125, -3.42877197265625, -3.2354736328125, -3.04217529296875, -2.848876953125, -2.65557861328125, -2.4622802734375, -2.26898193359375, -2.07568359375, -1.88238525390625, -1.6890869140625, -1.49578857421875, -1.302490234375, -1.10919189453125, -0.9158935546875, -0.72259521484375, -0.529296875, -0.33599853515625, -0.1427001953125, 0.05059814453125, 0.243896484375, 0.43719482421875, 0.6304931640625, 0.82379150390625, 1.01708984375, 1.21038818359375, 1.4036865234375, 1.59698486328125, 1.790283203125, 1.98358154296875, 2.1768798828125, 2.37017822265625, 2.5634765625, 2.75677490234375, 2.9500732421875, 3.14337158203125, 3.336669921875, 3.52996826171875, 3.7232666015625, 3.91656494140625, 4.10986328125, 4.30316162109375, 4.4964599609375, 4.68975830078125, 4.883056640625, 5.07635498046875, 5.2696533203125, 5.46295166015625, 5.65625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 8.0, 4.0, 11.0, 22.0, 38.0, 78.0, 112.0, 221.0, 382.0, 653.0, 1177.0, 2302.0, 5997.0, 23638.0, 404287.0, 3264174.0, 454559.0, 25200.0, 6208.0, 2456.0, 1172.0, 633.0, 407.0, 247.0, 119.0, 72.0, 45.0, 19.0, 14.0, 5.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.171875, -17.576416015625, -16.98095703125, -16.385498046875, -15.7900390625, -15.194580078125, -14.59912109375, -14.003662109375, -13.408203125, -12.812744140625, -12.21728515625, -11.621826171875, -11.0263671875, -10.430908203125, -9.83544921875, -9.239990234375, -8.64453125, -8.049072265625, -7.45361328125, -6.858154296875, -6.2626953125, -5.667236328125, -5.07177734375, -4.476318359375, -3.880859375, -3.285400390625, -2.68994140625, -2.094482421875, -1.4990234375, -0.903564453125, -0.30810546875, 0.287353515625, 0.8828125, 1.478271484375, 2.07373046875, 2.669189453125, 3.2646484375, 3.860107421875, 4.45556640625, 5.051025390625, 5.646484375, 6.241943359375, 6.83740234375, 7.432861328125, 8.0283203125, 8.623779296875, 9.21923828125, 9.814697265625, 10.41015625, 11.005615234375, 11.60107421875, 12.196533203125, 12.7919921875, 13.387451171875, 13.98291015625, 14.578369140625, 15.173828125, 15.769287109375, 16.36474609375, 16.960205078125, 17.5556640625, 18.151123046875, 18.74658203125, 19.342041015625, 19.9375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 12.0, 9.0, 19.0, 22.0, 37.0, 44.0, 66.0, 136.0, 189.0, 300.0, 457.0, 740.0, 678.0, 447.0, 310.0, 180.0, 133.0, 85.0, 55.0, 35.0, 27.0, 20.0, 16.0, 10.0, 3.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.688232421875, -10.30615234375, -9.924072265625, -9.5419921875, -9.159912109375, -8.77783203125, -8.395751953125, -8.013671875, -7.631591796875, -7.24951171875, -6.867431640625, -6.4853515625, -6.103271484375, -5.72119140625, -5.339111328125, -4.95703125, -4.574951171875, -4.19287109375, -3.810791015625, -3.4287109375, -3.046630859375, -2.66455078125, -2.282470703125, -1.900390625, -1.518310546875, -1.13623046875, -0.754150390625, -0.3720703125, 0.010009765625, 0.39208984375, 0.774169921875, 1.15625, 1.538330078125, 1.92041015625, 2.302490234375, 2.6845703125, 3.066650390625, 3.44873046875, 3.830810546875, 4.212890625, 4.594970703125, 4.97705078125, 5.359130859375, 5.7412109375, 6.123291015625, 6.50537109375, 6.887451171875, 7.26953125, 7.651611328125, 8.03369140625, 8.415771484375, 8.7978515625, 9.179931640625, 9.56201171875, 9.944091796875, 10.326171875, 10.708251953125, 11.09033203125, 11.472412109375, 11.8544921875, 12.236572265625, 12.61865234375, 13.000732421875, 13.3828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 9.0, 5.0, 17.0, 33.0, 46.0, 63.0, 125.0, 192.0, 378.0, 792.0, 1869.0, 5212.0, 21332.0, 221749.0, 3631149.0, 278130.0, 23819.0, 5669.0, 1900.0, 833.0, 417.0, 233.0, 134.0, 56.0, 40.0, 29.0, 12.0, 13.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.1865234375, -22.451171875, -21.7158203125, -20.98046875, -20.2451171875, -19.509765625, -18.7744140625, -18.0390625, -17.3037109375, -16.568359375, -15.8330078125, -15.09765625, -14.3623046875, -13.626953125, -12.8916015625, -12.15625, -11.4208984375, -10.685546875, -9.9501953125, -9.21484375, -8.4794921875, -7.744140625, -7.0087890625, -6.2734375, -5.5380859375, -4.802734375, -4.0673828125, -3.33203125, -2.5966796875, -1.861328125, -1.1259765625, -0.390625, 0.3447265625, 1.080078125, 1.8154296875, 2.55078125, 3.2861328125, 4.021484375, 4.7568359375, 5.4921875, 6.2275390625, 6.962890625, 7.6982421875, 8.43359375, 9.1689453125, 9.904296875, 10.6396484375, 11.375, 12.1103515625, 12.845703125, 13.5810546875, 14.31640625, 15.0517578125, 15.787109375, 16.5224609375, 17.2578125, 17.9931640625, 18.728515625, 19.4638671875, 20.19921875, 20.9345703125, 21.669921875, 22.4052734375, 23.140625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 14.0, 97.0, 381.0, 369.0, 131.0, 17.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.70587158203125, -128.3730926513672, -123.04029846191406, -117.70751190185547, -112.37472534179688, -107.04193878173828, -101.70915222167969, -96.37637329101562, -91.0435791015625, -85.7107925415039, -80.37800598144531, -75.04521942138672, -69.71243286132812, -64.37964630126953, -59.0468635559082, -53.71407699584961, -48.38129425048828, -43.04850769042969, -37.715721130371094, -32.3829345703125, -27.05014991760254, -21.717363357543945, -16.384578704833984, -11.05179214477539, -5.719005584716797, -0.38621950149536133, 4.946566581726074, 10.279352188110352, 15.612138748168945, 20.94492530822754, 26.2777099609375, 31.610496520996094, 36.94328308105469, 42.27606964111328, 47.608856201171875, 52.94164276123047, 58.27442932128906, 63.607215881347656, 68.94000244140625, 74.27278137207031, 79.60557556152344, 84.93836212158203, 90.27114868164062, 95.60393524169922, 100.93672180175781, 106.2695083618164, 111.602294921875, 116.93507385253906, 122.26786041259766, 127.60064697265625, 132.9334259033203, 138.26622009277344, 143.5989990234375, 148.93179321289062, 154.2645721435547, 159.5973663330078, 164.93014526367188, 170.26292419433594, 175.59571838378906, 180.92849731445312, 186.26129150390625, 191.5940704345703, 196.92686462402344, 202.2596435546875, 207.59243774414062]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 11.0, 15.0, 23.0, 16.0, 26.0, 43.0, 55.0, 40.0, 57.0, 52.0, 63.0, 80.0, 85.0, 60.0, 60.0, 76.0, 60.0, 53.0, 44.0, 28.0, 26.0, 3.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.37450408935547, -67.34610748291016, -65.31771850585938, -63.28932189941406, -61.26092529296875, -59.23252868652344, -57.20413589477539, -55.175743103027344, -53.14734649658203, -51.11894989013672, -49.09055709838867, -47.062164306640625, -45.03376770019531, -43.00537109375, -40.97697830200195, -38.948585510253906, -36.920188903808594, -34.89179229736328, -32.863399505615234, -30.835004806518555, -28.806610107421875, -26.778215408325195, -24.749820709228516, -22.721426010131836, -20.693031311035156, -18.664636611938477, -16.636241912841797, -14.607847213745117, -12.579452514648438, -10.551057815551758, -8.522663116455078, -6.494268417358398, -4.465869903564453, -2.4374752044677734, -0.40908050537109375, 1.619314193725586, 3.6477088928222656, 5.676103591918945, 7.704498291015625, 9.732892990112305, 11.761287689208984, 13.789682388305664, 15.818077087402344, 17.846471786499023, 19.874866485595703, 21.903261184692383, 23.931655883789062, 25.960050582885742, 27.988445281982422, 30.0168399810791, 32.04523468017578, 34.073631286621094, 36.10202407836914, 38.13041687011719, 40.1588134765625, 42.18721008300781, 44.21560287475586, 46.243995666503906, 48.27239227294922, 50.30078887939453, 52.32918167114258, 54.357574462890625, 56.38597106933594, 58.41436767578125, 60.4427604675293]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 13.0, 7.0, 16.0, 11.0, 18.0, 25.0, 21.0, 28.0, 25.0, 39.0, 30.0, 38.0, 29.0, 35.0, 33.0, 36.0, 40.0, 36.0, 50.0, 34.0, 37.0, 28.0, 42.0, 28.0, 31.0, 35.0, 29.0, 28.0, 21.0, 21.0, 18.0, 19.0, 11.0, 11.0, 14.0, 8.0, 4.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.97686767578125, -4.8092041015625, -4.64154052734375, -4.473876953125, -4.30621337890625, -4.1385498046875, -3.97088623046875, -3.80322265625, -3.63555908203125, -3.4678955078125, -3.30023193359375, -3.132568359375, -2.96490478515625, -2.7972412109375, -2.62957763671875, -2.4619140625, -2.29425048828125, -2.1265869140625, -1.95892333984375, -1.791259765625, -1.62359619140625, -1.4559326171875, -1.28826904296875, -1.12060546875, -0.95294189453125, -0.7852783203125, -0.61761474609375, -0.449951171875, -0.28228759765625, -0.1146240234375, 0.05303955078125, 0.220703125, 0.38836669921875, 0.5560302734375, 0.72369384765625, 0.891357421875, 1.05902099609375, 1.2266845703125, 1.39434814453125, 1.56201171875, 1.72967529296875, 1.8973388671875, 2.06500244140625, 2.232666015625, 2.40032958984375, 2.5679931640625, 2.73565673828125, 2.9033203125, 3.07098388671875, 3.2386474609375, 3.40631103515625, 3.573974609375, 3.74163818359375, 3.9093017578125, 4.07696533203125, 4.24462890625, 4.41229248046875, 4.5799560546875, 4.74761962890625, 4.915283203125, 5.08294677734375, 5.2506103515625, 5.41827392578125, 5.5859375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 4.0, 9.0, 15.0, 22.0, 28.0, 50.0, 77.0, 97.0, 128.0, 226.0, 301.0, 488.0, 703.0, 1033.0, 1550.0, 2314.0, 3562.0, 5375.0, 8054.0, 12101.0, 18168.0, 27374.0, 43215.0, 71542.0, 125205.0, 228969.0, 207752.0, 111111.0, 64414.0, 39626.0, 25123.0, 16421.0, 11088.0, 7229.0, 4943.0, 3390.0, 2208.0, 1511.0, 985.0, 707.0, 475.0, 309.0, 205.0, 135.0, 106.0, 75.0, 45.0, 27.0, 26.0, 12.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15978622436523438, -0.15477752685546875, -0.14976882934570312, -0.1447601318359375, -0.13975143432617188, -0.13474273681640625, -0.12973403930664062, -0.124725341796875, -0.11971664428710938, -0.11470794677734375, -0.10969924926757812, -0.1046905517578125, -0.09968185424804688, -0.09467315673828125, -0.08966445922851562, -0.08465576171875, -0.07964706420898438, -0.07463836669921875, -0.06962966918945312, -0.0646209716796875, -0.059612274169921875, -0.05460357666015625, -0.049594879150390625, -0.044586181640625, -0.039577484130859375, -0.03456878662109375, -0.029560089111328125, -0.0245513916015625, -0.019542694091796875, -0.01453399658203125, -0.009525299072265625, -0.0045166015625, 0.000492095947265625, 0.00550079345703125, 0.010509490966796875, 0.0155181884765625, 0.020526885986328125, 0.02553558349609375, 0.030544281005859375, 0.035552978515625, 0.040561676025390625, 0.04557037353515625, 0.050579071044921875, 0.0555877685546875, 0.060596466064453125, 0.06560516357421875, 0.07061386108398438, 0.07562255859375, 0.08063125610351562, 0.08563995361328125, 0.09064865112304688, 0.0956573486328125, 0.10066604614257812, 0.10567474365234375, 0.11068344116210938, 0.115692138671875, 0.12070083618164062, 0.12570953369140625, 0.13071823120117188, 0.1357269287109375, 0.14073562622070312, 0.14574432373046875, 0.15075302124023438, 0.15576171875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 9.0, 10.0, 14.0, 14.0, 21.0, 18.0, 29.0, 27.0, 25.0, 33.0, 30.0, 49.0, 41.0, 26.0, 41.0, 28.0, 45.0, 49.0, 1072.0, 40.0, 22.0, 28.0, 42.0, 28.0, 36.0, 20.0, 33.0, 21.0, 20.0, 15.0, 29.0, 7.0, 16.0, 18.0, 11.0, 10.0, 6.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4453125, -4.28656005859375, -4.1278076171875, -3.96905517578125, -3.810302734375, -3.65155029296875, -3.4927978515625, -3.33404541015625, -3.17529296875, -3.01654052734375, -2.8577880859375, -2.69903564453125, -2.540283203125, -2.38153076171875, -2.2227783203125, -2.06402587890625, -1.9052734375, -1.74652099609375, -1.5877685546875, -1.42901611328125, -1.270263671875, -1.11151123046875, -0.9527587890625, -0.79400634765625, -0.63525390625, -0.47650146484375, -0.3177490234375, -0.15899658203125, -0.000244140625, 0.15850830078125, 0.3172607421875, 0.47601318359375, 0.634765625, 0.79351806640625, 0.9522705078125, 1.11102294921875, 1.269775390625, 1.42852783203125, 1.5872802734375, 1.74603271484375, 1.90478515625, 2.06353759765625, 2.2222900390625, 2.38104248046875, 2.539794921875, 2.69854736328125, 2.8572998046875, 3.01605224609375, 3.1748046875, 3.33355712890625, 3.4923095703125, 3.65106201171875, 3.809814453125, 3.96856689453125, 4.1273193359375, 4.28607177734375, 4.44482421875, 4.60357666015625, 4.7623291015625, 4.92108154296875, 5.079833984375, 5.23858642578125, 5.3973388671875, 5.55609130859375, 5.71484375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 5.0, 14.0, 23.0, 32.0, 55.0, 89.0, 157.0, 225.0, 375.0, 669.0, 987.0, 1761.0, 2870.0, 4626.0, 7647.0, 12831.0, 22120.0, 39295.0, 73723.0, 149206.0, 1347233.0, 211501.0, 100252.0, 51773.0, 28340.0, 16374.0, 9950.0, 5949.0, 3504.0, 2101.0, 1293.0, 784.0, 496.0, 308.0, 190.0, 127.0, 79.0, 47.0, 33.0, 28.0, 11.0, 16.0, 4.0, 4.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11102294921875, -0.10740947723388672, -0.10379600524902344, -0.10018253326416016, -0.09656906127929688, -0.0929555892944336, -0.08934211730957031, -0.08572864532470703, -0.08211517333984375, -0.07850170135498047, -0.07488822937011719, -0.0712747573852539, -0.06766128540039062, -0.06404781341552734, -0.06043434143066406, -0.05682086944580078, -0.0532073974609375, -0.04959392547607422, -0.04598045349121094, -0.042366981506347656, -0.038753509521484375, -0.035140037536621094, -0.03152656555175781, -0.02791309356689453, -0.02429962158203125, -0.02068614959716797, -0.017072677612304688, -0.013459205627441406, -0.009845733642578125, -0.006232261657714844, -0.0026187896728515625, 0.0009946823120117188, 0.004608154296875, 0.008221626281738281, 0.011835098266601562, 0.015448570251464844, 0.019062042236328125, 0.022675514221191406, 0.026288986206054688, 0.02990245819091797, 0.03351593017578125, 0.03712940216064453, 0.04074287414550781, 0.044356346130371094, 0.047969818115234375, 0.051583290100097656, 0.05519676208496094, 0.05881023406982422, 0.0624237060546875, 0.06603717803955078, 0.06965065002441406, 0.07326412200927734, 0.07687759399414062, 0.0804910659790039, 0.08410453796386719, 0.08771800994873047, 0.09133148193359375, 0.09494495391845703, 0.09855842590332031, 0.1021718978881836, 0.10578536987304688, 0.10939884185791016, 0.11301231384277344, 0.11662578582763672, 0.1202392578125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 9.0, 17.0, 35.0, 40.0, 56.0, 80.0, 96.0, 197.0, 164.0, 94.0, 57.0, 42.0, 27.0, 25.0, 14.0, 7.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006814002990722656, -0.0006584897637367249, -0.0006355792284011841, -0.0006126686930656433, -0.0005897581577301025, -0.0005668476223945618, -0.000543937087059021, -0.0005210265517234802, -0.0004981160163879395, -0.0004752054810523987, -0.0004522949457168579, -0.00042938441038131714, -0.00040647387504577637, -0.0003835633397102356, -0.0003606528043746948, -0.00033774226903915405, -0.0003148317337036133, -0.0002919211983680725, -0.00026901066303253174, -0.00024610012769699097, -0.0002231895923614502, -0.00020027905702590942, -0.00017736852169036865, -0.00015445798635482788, -0.0001315474510192871, -0.00010863691568374634, -8.572638034820557e-05, -6.28158450126648e-05, -3.9905309677124023e-05, -1.6994774341583252e-05, 5.9157609939575195e-06, 2.882629632949829e-05, 5.173683166503906e-05, 7.464736700057983e-05, 9.75579023361206e-05, 0.00012046843767166138, 0.00014337897300720215, 0.00016628950834274292, 0.0001892000436782837, 0.00021211057901382446, 0.00023502111434936523, 0.000257931649684906, 0.0002808421850204468, 0.00030375272035598755, 0.0003266632556915283, 0.0003495737910270691, 0.00037248432636260986, 0.00039539486169815063, 0.0004183053970336914, 0.0004412159323692322, 0.00046412646770477295, 0.0004870370030403137, 0.0005099475383758545, 0.0005328580737113953, 0.000555768609046936, 0.0005786791443824768, 0.0006015896797180176, 0.0006245002150535583, 0.0006474107503890991, 0.0006703212857246399, 0.0006932318210601807, 0.0007161423563957214, 0.0007390528917312622, 0.000761963427066803, 0.0007848739624023438]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 9.0, 7.0, 11.0, 17.0, 25.0, 40.0, 53.0, 130.0, 396.0, 22311.0, 1023468.0, 1599.0, 214.0, 101.0, 60.0, 46.0, 20.0, 14.0, 9.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01800537109375, -0.017480134963989258, -0.016954898834228516, -0.016429662704467773, -0.01590442657470703, -0.015379190444946289, -0.014853954315185547, -0.014328718185424805, -0.013803482055664062, -0.01327824592590332, -0.012753009796142578, -0.012227773666381836, -0.011702537536621094, -0.011177301406860352, -0.01065206527709961, -0.010126829147338867, -0.009601593017578125, -0.009076356887817383, -0.00855112075805664, -0.008025884628295898, -0.007500648498535156, -0.006975412368774414, -0.006450176239013672, -0.00592494010925293, -0.0053997039794921875, -0.004874467849731445, -0.004349231719970703, -0.003823995590209961, -0.0032987594604492188, -0.0027735233306884766, -0.0022482872009277344, -0.0017230510711669922, -0.00119781494140625, -0.0006725788116455078, -0.00014734268188476562, 0.00037789344787597656, 0.0009031295776367188, 0.001428365707397461, 0.001953601837158203, 0.0024788379669189453, 0.0030040740966796875, 0.0035293102264404297, 0.004054546356201172, 0.004579782485961914, 0.005105018615722656, 0.0056302547454833984, 0.006155490875244141, 0.006680727005004883, 0.007205963134765625, 0.007731199264526367, 0.00825643539428711, 0.008781671524047852, 0.009306907653808594, 0.009832143783569336, 0.010357379913330078, 0.01088261604309082, 0.011407852172851562, 0.011933088302612305, 0.012458324432373047, 0.012983560562133789, 0.013508796691894531, 0.014034032821655273, 0.014559268951416016, 0.015084505081176758, 0.0156097412109375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 16.0, 156.0, 658.0, 160.0, 19.0, 3.0], "bins": [-0.004613654688000679, -0.004537419881671667, -0.004461185075342655, -0.004384950269013643, -0.004308715462684631, -0.004232480656355619, -0.0041562458500266075, -0.004080011043697596, -0.004003776237368584, -0.003927541431039572, -0.00385130662471056, -0.003775071818381548, -0.003698837012052536, -0.003622602205723524, -0.003546367399394512, -0.0034701325930655003, -0.0033938977867364883, -0.0033176629804074764, -0.0032414281740784645, -0.0031651933677494526, -0.0030889585614204407, -0.0030127237550914288, -0.002936488948762417, -0.002860254142433405, -0.002784019336104393, -0.002707784529775381, -0.002631549723446369, -0.0025553149171173573, -0.0024790801107883453, -0.0024028453044593334, -0.0023266104981303215, -0.0022503756918013096, -0.0021741408854722977, -0.0020979060791432858, -0.002021671272814274, -0.001945436466485262, -0.00186920166015625, -0.001792966853827238, -0.0017167320474982262, -0.0016404972411692142, -0.0015642623184248805, -0.0014880275120958686, -0.0014117927057668567, -0.0013355578994378448, -0.0012593230931088328, -0.001183088286779821, -0.001106853480450809, -0.001030618674121797, -0.0009543838677927852, -0.0008781490614637733, -0.0008019142551347613, -0.0007256794488057494, -0.0006494446424767375, -0.0005732098361477256, -0.0004969750298187137, -0.00042074022348970175, -0.00034450541716068983, -0.0002682706108316779, -0.000192035804502666, -0.00011580099817365408, -3.956619184464216e-05, 3.6668614484369755e-05, 0.00011290342081338167, 0.0001891382271423936, 0.0002653730334714055]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 8.0, 17.0, 15.0, 17.0, 16.0, 12.0, 21.0, 20.0, 17.0, 25.0, 31.0, 37.0, 39.0, 36.0, 40.0, 38.0, 41.0, 44.0, 38.0, 28.0, 46.0, 37.0, 43.0, 44.0, 32.0, 36.0, 26.0, 20.0, 25.0, 22.0, 16.0, 10.0, 13.0, 19.0, 14.0, 7.0, 7.0, 6.0, 7.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00025153160095214844, -0.0002434970811009407, -0.00023546256124973297, -0.00022742804139852524, -0.0002193935215473175, -0.00021135900169610977, -0.00020332448184490204, -0.0001952899619936943, -0.00018725544214248657, -0.00017922092229127884, -0.0001711864024400711, -0.00016315188258886337, -0.00015511736273765564, -0.0001470828428864479, -0.00013904832303524017, -0.00013101380318403244, -0.0001229792833328247, -0.00011494476348161697, -0.00010691024363040924, -9.887572377920151e-05, -9.084120392799377e-05, -8.280668407678604e-05, -7.477216422557831e-05, -6.673764437437057e-05, -5.870312452316284e-05, -5.066860467195511e-05, -4.2634084820747375e-05, -3.459956496953964e-05, -2.656504511833191e-05, -1.8530525267124176e-05, -1.0496005415916443e-05, -2.4614855647087097e-06, 5.5730342864990234e-06, 1.3607554137706757e-05, 2.164207398891449e-05, 2.9676593840122223e-05, 3.7711113691329956e-05, 4.574563354253769e-05, 5.378015339374542e-05, 6.181467324495316e-05, 6.984919309616089e-05, 7.788371294736862e-05, 8.591823279857635e-05, 9.395275264978409e-05, 0.00010198727250099182, 0.00011002179235219955, 0.00011805631220340729, 0.00012609083205461502, 0.00013412535190582275, 0.0001421598717570305, 0.00015019439160823822, 0.00015822891145944595, 0.0001662634313106537, 0.00017429795116186142, 0.00018233247101306915, 0.00019036699086427689, 0.00019840151071548462, 0.00020643603056669235, 0.00021447055041790009, 0.00022250507026910782, 0.00023053959012031555, 0.00023857410997152328, 0.000246608629822731, 0.00025464314967393875, 0.0002626776695251465]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 13.0, 6.0, 17.0, 11.0, 18.0, 25.0, 21.0, 28.0, 25.0, 39.0, 30.0, 38.0, 29.0, 35.0, 33.0, 36.0, 40.0, 36.0, 50.0, 34.0, 37.0, 28.0, 42.0, 28.0, 31.0, 35.0, 29.0, 28.0, 21.0, 21.0, 18.0, 19.0, 11.0, 11.0, 14.0, 8.0, 4.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.97686767578125, -4.8092041015625, -4.64154052734375, -4.473876953125, -4.30621337890625, -4.1385498046875, -3.97088623046875, -3.80322265625, -3.63555908203125, -3.4678955078125, -3.30023193359375, -3.132568359375, -2.96490478515625, -2.7972412109375, -2.62957763671875, -2.4619140625, -2.29425048828125, -2.1265869140625, -1.95892333984375, -1.791259765625, -1.62359619140625, -1.4559326171875, -1.28826904296875, -1.12060546875, -0.95294189453125, -0.7852783203125, -0.61761474609375, -0.449951171875, -0.28228759765625, -0.1146240234375, 0.05303955078125, 0.220703125, 0.38836669921875, 0.5560302734375, 0.72369384765625, 0.891357421875, 1.05902099609375, 1.2266845703125, 1.39434814453125, 1.56201171875, 1.72967529296875, 1.8973388671875, 2.06500244140625, 2.232666015625, 2.40032958984375, 2.5679931640625, 2.73565673828125, 2.9033203125, 3.07098388671875, 3.2386474609375, 3.40631103515625, 3.573974609375, 3.74163818359375, 3.9093017578125, 4.07696533203125, 4.24462890625, 4.41229248046875, 4.5799560546875, 4.74761962890625, 4.915283203125, 5.08294677734375, 5.2506103515625, 5.41827392578125, 5.5859375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 2.0, 3.0, 9.0, 5.0, 11.0, 21.0, 30.0, 50.0, 85.0, 107.0, 219.0, 420.0, 855.0, 1874.0, 4212.0, 10889.0, 31505.0, 112851.0, 496300.0, 288961.0, 66624.0, 20438.0, 7220.0, 3031.0, 1347.0, 662.0, 357.0, 172.0, 115.0, 55.0, 39.0, 20.0, 20.0, 10.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.7059326171875, -11.325927734375, -10.9459228515625, -10.56591796875, -10.1859130859375, -9.805908203125, -9.4259033203125, -9.0458984375, -8.6658935546875, -8.285888671875, -7.9058837890625, -7.52587890625, -7.1458740234375, -6.765869140625, -6.3858642578125, -6.005859375, -5.6258544921875, -5.245849609375, -4.8658447265625, -4.48583984375, -4.1058349609375, -3.725830078125, -3.3458251953125, -2.9658203125, -2.5858154296875, -2.205810546875, -1.8258056640625, -1.44580078125, -1.0657958984375, -0.685791015625, -0.3057861328125, 0.07421875, 0.4542236328125, 0.834228515625, 1.2142333984375, 1.59423828125, 1.9742431640625, 2.354248046875, 2.7342529296875, 3.1142578125, 3.4942626953125, 3.874267578125, 4.2542724609375, 4.63427734375, 5.0142822265625, 5.394287109375, 5.7742919921875, 6.154296875, 6.5343017578125, 6.914306640625, 7.2943115234375, 7.67431640625, 8.0543212890625, 8.434326171875, 8.8143310546875, 9.1943359375, 9.5743408203125, 9.954345703125, 10.3343505859375, 10.71435546875, 11.0943603515625, 11.474365234375, 11.8543701171875, 12.234375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 6.0, 12.0, 2.0, 10.0, 11.0, 11.0, 12.0, 15.0, 24.0, 33.0, 43.0, 40.0, 57.0, 81.0, 102.0, 188.0, 363.0, 1406.0, 175.0, 105.0, 78.0, 49.0, 49.0, 38.0, 31.0, 23.0, 21.0, 18.0, 17.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.398193359375, -17.85888671875, -17.319580078125, -16.7802734375, -16.240966796875, -15.70166015625, -15.162353515625, -14.623046875, -14.083740234375, -13.54443359375, -13.005126953125, -12.4658203125, -11.926513671875, -11.38720703125, -10.847900390625, -10.30859375, -9.769287109375, -9.22998046875, -8.690673828125, -8.1513671875, -7.612060546875, -7.07275390625, -6.533447265625, -5.994140625, -5.454833984375, -4.91552734375, -4.376220703125, -3.8369140625, -3.297607421875, -2.75830078125, -2.218994140625, -1.6796875, -1.140380859375, -0.60107421875, -0.061767578125, 0.4775390625, 1.016845703125, 1.55615234375, 2.095458984375, 2.634765625, 3.174072265625, 3.71337890625, 4.252685546875, 4.7919921875, 5.331298828125, 5.87060546875, 6.409912109375, 6.94921875, 7.488525390625, 8.02783203125, 8.567138671875, 9.1064453125, 9.645751953125, 10.18505859375, 10.724365234375, 11.263671875, 11.802978515625, 12.34228515625, 12.881591796875, 13.4208984375, 13.960205078125, 14.49951171875, 15.038818359375, 15.578125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 6.0, 7.0, 11.0, 14.0, 21.0, 30.0, 38.0, 72.0, 110.0, 159.0, 227.0, 388.0, 694.0, 1621.0, 5860.0, 1483335.0, 1643553.0, 6190.0, 1577.0, 687.0, 400.0, 239.0, 180.0, 91.0, 69.0, 42.0, 30.0, 21.0, 11.0, 11.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.53125, -32.28955078125, -31.0478515625, -29.80615234375, -28.564453125, -27.32275390625, -26.0810546875, -24.83935546875, -23.59765625, -22.35595703125, -21.1142578125, -19.87255859375, -18.630859375, -17.38916015625, -16.1474609375, -14.90576171875, -13.6640625, -12.42236328125, -11.1806640625, -9.93896484375, -8.697265625, -7.45556640625, -6.2138671875, -4.97216796875, -3.73046875, -2.48876953125, -1.2470703125, -0.00537109375, 1.236328125, 2.47802734375, 3.7197265625, 4.96142578125, 6.203125, 7.44482421875, 8.6865234375, 9.92822265625, 11.169921875, 12.41162109375, 13.6533203125, 14.89501953125, 16.13671875, 17.37841796875, 18.6201171875, 19.86181640625, 21.103515625, 22.34521484375, 23.5869140625, 24.82861328125, 26.0703125, 27.31201171875, 28.5537109375, 29.79541015625, 31.037109375, 32.27880859375, 33.5205078125, 34.76220703125, 36.00390625, 37.24560546875, 38.4873046875, 39.72900390625, 40.970703125, 42.21240234375, 43.4541015625, 44.69580078125, 45.9375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 22.0, 171.0, 518.0, 266.0, 31.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.76693725585938, -214.76980590820312, -207.77267456054688, -200.7755584716797, -193.77842712402344, -186.7812957763672, -179.78416442871094, -172.78704833984375, -165.7899169921875, -158.79278564453125, -151.795654296875, -144.7985382080078, -137.80140686035156, -130.8042755126953, -123.80714416503906, -116.81002044677734, -109.8128890991211, -102.81575775146484, -95.81863403320312, -88.82150268554688, -81.82437896728516, -74.8272476196289, -67.83012390136719, -60.83299255371094, -53.83586502075195, -46.83873748779297, -39.841609954833984, -32.844482421875, -25.847352981567383, -18.850223541259766, -11.853096008300781, -4.855968475341797, 2.1411590576171875, 9.138286590576172, 16.135414123535156, 23.132543563842773, 30.129671096801758, 37.126800537109375, 44.12392807006836, 51.121055603027344, 58.11818313598633, 65.11531066894531, 72.11244201660156, 79.10956573486328, 86.10669708251953, 93.10382080078125, 100.1009521484375, 107.09808349609375, 114.09520721435547, 121.09233856201172, 128.08946228027344, 135.0865936279297, 142.08372497558594, 149.08084106445312, 156.07797241210938, 163.07510375976562, 170.07223510742188, 177.06936645507812, 184.06649780273438, 191.06361389160156, 198.0607452392578, 205.05787658691406, 212.0550079345703, 219.0521240234375, 226.04925537109375]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 4.0, 12.0, 18.0, 6.0, 17.0, 20.0, 15.0, 18.0, 23.0, 21.0, 26.0, 37.0, 30.0, 34.0, 30.0, 41.0, 40.0, 42.0, 29.0, 49.0, 42.0, 49.0, 40.0, 37.0, 44.0, 34.0, 25.0, 31.0, 29.0, 20.0, 23.0, 18.0, 20.0, 12.0, 11.0, 8.0, 5.0, 9.0, 5.0, 5.0, 1.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.837921142578125, -37.444236755371094, -36.05055236816406, -34.65686798095703, -33.263179779052734, -31.869495391845703, -30.475811004638672, -29.08212661743164, -27.688440322875977, -26.294755935668945, -24.90106964111328, -23.50738525390625, -22.11370086669922, -20.720014572143555, -19.326330184936523, -17.93264389038086, -16.538959503173828, -15.14527416229248, -13.751588821411133, -12.357904434204102, -10.964219093322754, -9.570533752441406, -8.176849365234375, -6.783164024353027, -5.38947868347168, -3.995793581008911, -2.6021084785461426, -1.2084236145019531, 0.18526172637939453, 1.5789470672607422, 2.9726314544677734, 4.366316795349121, 5.760002136230469, 7.153687477111816, 8.547372817993164, 9.941057205200195, 11.334742546081543, 12.72842788696289, 14.122112274169922, 15.51579761505127, 16.909482955932617, 18.30316734313965, 19.696853637695312, 21.090538024902344, 22.484222412109375, 23.87790870666504, 25.27159309387207, 26.665279388427734, 28.058963775634766, 29.452648162841797, 30.84633445739746, 32.240020751953125, 33.633705139160156, 35.02738952636719, 36.42107391357422, 37.81475830078125, 39.20844268798828, 40.60212707519531, 41.995811462402344, 43.389495849609375, 44.78318405151367, 46.1768684387207, 47.570552825927734, 48.964237213134766, 50.35792541503906]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 7.0, 7.0, 12.0, 16.0, 17.0, 14.0, 20.0, 22.0, 20.0, 28.0, 33.0, 32.0, 36.0, 32.0, 32.0, 32.0, 39.0, 41.0, 32.0, 40.0, 38.0, 34.0, 38.0, 43.0, 33.0, 35.0, 32.0, 31.0, 25.0, 20.0, 22.0, 11.0, 19.0, 15.0, 13.0, 15.0, 8.0, 10.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.484375, -5.31842041015625, -5.1524658203125, -4.98651123046875, -4.820556640625, -4.65460205078125, -4.4886474609375, -4.32269287109375, -4.15673828125, -3.99078369140625, -3.8248291015625, -3.65887451171875, -3.492919921875, -3.32696533203125, -3.1610107421875, -2.99505615234375, -2.8291015625, -2.66314697265625, -2.4971923828125, -2.33123779296875, -2.165283203125, -1.99932861328125, -1.8333740234375, -1.66741943359375, -1.50146484375, -1.33551025390625, -1.1695556640625, -1.00360107421875, -0.837646484375, -0.67169189453125, -0.5057373046875, -0.33978271484375, -0.173828125, -0.00787353515625, 0.1580810546875, 0.32403564453125, 0.489990234375, 0.65594482421875, 0.8218994140625, 0.98785400390625, 1.15380859375, 1.31976318359375, 1.4857177734375, 1.65167236328125, 1.817626953125, 1.98358154296875, 2.1495361328125, 2.31549072265625, 2.4814453125, 2.64739990234375, 2.8133544921875, 2.97930908203125, 3.145263671875, 3.31121826171875, 3.4771728515625, 3.64312744140625, 3.80908203125, 3.97503662109375, 4.1409912109375, 4.30694580078125, 4.472900390625, 4.63885498046875, 4.8048095703125, 4.97076416015625, 5.13671875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 9.0, 11.0, 14.0, 11.0, 33.0, 30.0, 40.0, 37.0, 68.0, 110.0, 131.0, 166.0, 223.0, 320.0, 453.0, 660.0, 1038.0, 1605.0, 2715.0, 4971.0, 9889.0, 26003.0, 141450.0, 1081529.0, 2331394.0, 495122.0, 61913.0, 16687.0, 7325.0, 3798.0, 2206.0, 1312.0, 894.0, 604.0, 383.0, 302.0, 205.0, 174.0, 103.0, 83.0, 63.0, 57.0, 39.0, 25.0, 26.0, 16.0, 9.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.7879638671875, -10.419677734375, -10.0513916015625, -9.68310546875, -9.3148193359375, -8.946533203125, -8.5782470703125, -8.2099609375, -7.8416748046875, -7.473388671875, -7.1051025390625, -6.73681640625, -6.3685302734375, -6.000244140625, -5.6319580078125, -5.263671875, -4.8953857421875, -4.527099609375, -4.1588134765625, -3.79052734375, -3.4222412109375, -3.053955078125, -2.6856689453125, -2.3173828125, -1.9490966796875, -1.580810546875, -1.2125244140625, -0.84423828125, -0.4759521484375, -0.107666015625, 0.2606201171875, 0.62890625, 0.9971923828125, 1.365478515625, 1.7337646484375, 2.10205078125, 2.4703369140625, 2.838623046875, 3.2069091796875, 3.5751953125, 3.9434814453125, 4.311767578125, 4.6800537109375, 5.04833984375, 5.4166259765625, 5.784912109375, 6.1531982421875, 6.521484375, 6.8897705078125, 7.258056640625, 7.6263427734375, 7.99462890625, 8.3629150390625, 8.731201171875, 9.0994873046875, 9.4677734375, 9.8360595703125, 10.204345703125, 10.5726318359375, 10.94091796875, 11.3092041015625, 11.677490234375, 12.0457763671875, 12.4140625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 9.0, 21.0, 38.0, 49.0, 90.0, 127.0, 217.0, 340.0, 562.0, 852.0, 658.0, 433.0, 252.0, 156.0, 88.0, 63.0, 31.0, 22.0, 21.0, 13.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4765625, -9.0594482421875, -8.642333984375, -8.2252197265625, -7.80810546875, -7.3909912109375, -6.973876953125, -6.5567626953125, -6.1396484375, -5.7225341796875, -5.305419921875, -4.8883056640625, -4.47119140625, -4.0540771484375, -3.636962890625, -3.2198486328125, -2.802734375, -2.3856201171875, -1.968505859375, -1.5513916015625, -1.13427734375, -0.7171630859375, -0.300048828125, 0.1170654296875, 0.5341796875, 0.9512939453125, 1.368408203125, 1.7855224609375, 2.20263671875, 2.6197509765625, 3.036865234375, 3.4539794921875, 3.87109375, 4.2882080078125, 4.705322265625, 5.1224365234375, 5.53955078125, 5.9566650390625, 6.373779296875, 6.7908935546875, 7.2080078125, 7.6251220703125, 8.042236328125, 8.4593505859375, 8.87646484375, 9.2935791015625, 9.710693359375, 10.1278076171875, 10.544921875, 10.9620361328125, 11.379150390625, 11.7962646484375, 12.21337890625, 12.6304931640625, 13.047607421875, 13.4647216796875, 13.8818359375, 14.2989501953125, 14.716064453125, 15.1331787109375, 15.55029296875, 15.9674072265625, 16.384521484375, 16.8016357421875, 17.21875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 12.0, 9.0, 28.0, 31.0, 50.0, 57.0, 114.0, 162.0, 289.0, 526.0, 1436.0, 4722.0, 28356.0, 707687.0, 3349882.0, 87461.0, 9578.0, 2232.0, 753.0, 355.0, 199.0, 125.0, 75.0, 39.0, 29.0, 19.0, 15.0, 10.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -19.9091796875, -19.177734375, -18.4462890625, -17.71484375, -16.9833984375, -16.251953125, -15.5205078125, -14.7890625, -14.0576171875, -13.326171875, -12.5947265625, -11.86328125, -11.1318359375, -10.400390625, -9.6689453125, -8.9375, -8.2060546875, -7.474609375, -6.7431640625, -6.01171875, -5.2802734375, -4.548828125, -3.8173828125, -3.0859375, -2.3544921875, -1.623046875, -0.8916015625, -0.16015625, 0.5712890625, 1.302734375, 2.0341796875, 2.765625, 3.4970703125, 4.228515625, 4.9599609375, 5.69140625, 6.4228515625, 7.154296875, 7.8857421875, 8.6171875, 9.3486328125, 10.080078125, 10.8115234375, 11.54296875, 12.2744140625, 13.005859375, 13.7373046875, 14.46875, 15.2001953125, 15.931640625, 16.6630859375, 17.39453125, 18.1259765625, 18.857421875, 19.5888671875, 20.3203125, 21.0517578125, 21.783203125, 22.5146484375, 23.24609375, 23.9775390625, 24.708984375, 25.4404296875, 26.171875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 70.0, 677.0, 261.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-499.9446105957031, -488.7540588378906, -477.5635070800781, -466.3729553222656, -455.1824035644531, -443.9918518066406, -432.8013000488281, -421.6107482910156, -410.4201965332031, -399.2296447753906, -388.0390930175781, -376.8485412597656, -365.6579895019531, -354.4674377441406, -343.2768859863281, -332.0863342285156, -320.895751953125, -309.7052001953125, -298.5146484375, -287.3240966796875, -276.133544921875, -264.9429931640625, -253.75244140625, -242.5618896484375, -231.371337890625, -220.1807861328125, -208.990234375, -197.7996826171875, -186.609130859375, -175.4185791015625, -164.22802734375, -153.0374755859375, -141.84693908691406, -130.65638732910156, -119.46583557128906, -108.27528381347656, -97.08473205566406, -85.89418029785156, -74.70362091064453, -63.51306915283203, -52.32251739501953, -41.13196563720703, -29.9414119720459, -18.750858306884766, -7.560306549072266, 3.6302452087402344, 14.82080078125, 26.0113525390625, 37.201904296875, 48.3924560546875, 59.5830078125, 70.7735595703125, 81.964111328125, 93.1546630859375, 104.34522247314453, 115.53577423095703, 126.72632598876953, 137.91688537597656, 149.10743713378906, 160.29798889160156, 171.48854064941406, 182.67909240722656, 193.86964416503906, 205.06019592285156, 216.25074768066406]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 15.0, 13.0, 12.0, 14.0, 23.0, 24.0, 22.0, 31.0, 33.0, 42.0, 33.0, 42.0, 45.0, 49.0, 52.0, 53.0, 61.0, 41.0, 41.0, 39.0, 36.0, 49.0, 38.0, 35.0, 16.0, 18.0, 17.0, 19.0, 16.0, 14.0, 9.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-48.039894104003906, -46.751075744628906, -45.462257385253906, -44.173439025878906, -42.884620666503906, -41.595802307128906, -40.306983947753906, -39.018165588378906, -37.729347229003906, -36.440528869628906, -35.151710510253906, -33.862892150878906, -32.574073791503906, -31.285255432128906, -29.996435165405273, -28.707616806030273, -27.41879653930664, -26.12997817993164, -24.84115982055664, -23.55234146118164, -22.26352310180664, -20.97470474243164, -19.685884475708008, -18.397066116333008, -17.108247756958008, -15.819429397583008, -14.530611038208008, -13.241791725158691, -11.952973365783691, -10.664155006408691, -9.375335693359375, -8.086517333984375, -6.797698974609375, -5.508880615234375, -4.220061779022217, -2.9312431812286377, -1.6424245834350586, -0.3536062240600586, 0.9352126121520996, 2.224031448364258, 3.512849807739258, 4.801668167114258, 6.090487003326416, 7.379305839538574, 8.668124198913574, 9.956942558288574, 11.24576187133789, 12.53458023071289, 13.82339859008789, 15.11221694946289, 16.40103530883789, 17.68985366821289, 18.97867202758789, 20.26749038696289, 21.556310653686523, 22.845129013061523, 24.133947372436523, 25.422765731811523, 26.711584091186523, 28.000402450561523, 29.289222717285156, 30.578041076660156, 31.866859436035156, 33.155677795410156, 34.444496154785156]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 4.0, 8.0, 10.0, 6.0, 8.0, 14.0, 20.0, 12.0, 23.0, 21.0, 30.0, 24.0, 34.0, 35.0, 24.0, 37.0, 39.0, 32.0, 38.0, 50.0, 38.0, 36.0, 37.0, 41.0, 38.0, 33.0, 25.0, 40.0, 27.0, 28.0, 29.0, 16.0, 10.0, 20.0, 11.0, 10.0, 15.0, 11.0, 13.0, 10.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.34375, -5.1767578125, -5.009765625, -4.8427734375, -4.67578125, -4.5087890625, -4.341796875, -4.1748046875, -4.0078125, -3.8408203125, -3.673828125, -3.5068359375, -3.33984375, -3.1728515625, -3.005859375, -2.8388671875, -2.671875, -2.5048828125, -2.337890625, -2.1708984375, -2.00390625, -1.8369140625, -1.669921875, -1.5029296875, -1.3359375, -1.1689453125, -1.001953125, -0.8349609375, -0.66796875, -0.5009765625, -0.333984375, -0.1669921875, 0.0, 0.1669921875, 0.333984375, 0.5009765625, 0.66796875, 0.8349609375, 1.001953125, 1.1689453125, 1.3359375, 1.5029296875, 1.669921875, 1.8369140625, 2.00390625, 2.1708984375, 2.337890625, 2.5048828125, 2.671875, 2.8388671875, 3.005859375, 3.1728515625, 3.33984375, 3.5068359375, 3.673828125, 3.8408203125, 4.0078125, 4.1748046875, 4.341796875, 4.5087890625, 4.67578125, 4.8427734375, 5.009765625, 5.1767578125, 5.34375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 11.0, 9.0, 14.0, 25.0, 28.0, 64.0, 67.0, 120.0, 152.0, 276.0, 414.0, 551.0, 780.0, 1175.0, 1751.0, 2468.0, 3739.0, 5378.0, 7953.0, 11753.0, 17426.0, 26033.0, 41394.0, 68597.0, 126762.0, 241114.0, 211937.0, 108364.0, 60361.0, 37100.0, 23621.0, 15783.0, 10468.0, 7232.0, 4957.0, 3405.0, 2302.0, 1638.0, 1070.0, 687.0, 517.0, 323.0, 224.0, 151.0, 127.0, 89.0, 52.0, 27.0, 30.0, 16.0, 15.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1663818359375, -0.16132164001464844, -0.15626144409179688, -0.1512012481689453, -0.14614105224609375, -0.1410808563232422, -0.13602066040039062, -0.13096046447753906, -0.1259002685546875, -0.12084007263183594, -0.11577987670898438, -0.11071968078613281, -0.10565948486328125, -0.10059928894042969, -0.09553909301757812, -0.09047889709472656, -0.085418701171875, -0.08035850524902344, -0.07529830932617188, -0.07023811340332031, -0.06517791748046875, -0.06011772155761719, -0.055057525634765625, -0.04999732971191406, -0.0449371337890625, -0.03987693786621094, -0.034816741943359375, -0.029756546020507812, -0.02469635009765625, -0.019636154174804688, -0.014575958251953125, -0.009515762329101562, -0.00445556640625, 0.0006046295166015625, 0.005664825439453125, 0.010725021362304688, 0.01578521728515625, 0.020845413208007812, 0.025905609130859375, 0.030965805053710938, 0.0360260009765625, 0.04108619689941406, 0.046146392822265625, 0.05120658874511719, 0.05626678466796875, 0.06132698059082031, 0.06638717651367188, 0.07144737243652344, 0.076507568359375, 0.08156776428222656, 0.08662796020507812, 0.09168815612792969, 0.09674835205078125, 0.10180854797363281, 0.10686874389648438, 0.11192893981933594, 0.1169891357421875, 0.12204933166503906, 0.12710952758789062, 0.1321697235107422, 0.13722991943359375, 0.1422901153564453, 0.14735031127929688, 0.15241050720214844, 0.157470703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 0.0, 5.0, 6.0, 8.0, 5.0, 13.0, 10.0, 19.0, 19.0, 19.0, 20.0, 20.0, 19.0, 29.0, 32.0, 37.0, 36.0, 36.0, 35.0, 39.0, 38.0, 29.0, 1062.0, 37.0, 26.0, 56.0, 44.0, 48.0, 35.0, 32.0, 35.0, 13.0, 31.0, 24.0, 13.0, 14.0, 12.0, 17.0, 14.0, 4.0, 12.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.87109375, -4.71942138671875, -4.5677490234375, -4.41607666015625, -4.264404296875, -4.11273193359375, -3.9610595703125, -3.80938720703125, -3.65771484375, -3.50604248046875, -3.3543701171875, -3.20269775390625, -3.051025390625, -2.89935302734375, -2.7476806640625, -2.59600830078125, -2.4443359375, -2.29266357421875, -2.1409912109375, -1.98931884765625, -1.837646484375, -1.68597412109375, -1.5343017578125, -1.38262939453125, -1.23095703125, -1.07928466796875, -0.9276123046875, -0.77593994140625, -0.624267578125, -0.47259521484375, -0.3209228515625, -0.16925048828125, -0.017578125, 0.13409423828125, 0.2857666015625, 0.43743896484375, 0.589111328125, 0.74078369140625, 0.8924560546875, 1.04412841796875, 1.19580078125, 1.34747314453125, 1.4991455078125, 1.65081787109375, 1.802490234375, 1.95416259765625, 2.1058349609375, 2.25750732421875, 2.4091796875, 2.56085205078125, 2.7125244140625, 2.86419677734375, 3.015869140625, 3.16754150390625, 3.3192138671875, 3.47088623046875, 3.62255859375, 3.77423095703125, 3.9259033203125, 4.07757568359375, 4.229248046875, 4.38092041015625, 4.5325927734375, 4.68426513671875, 4.8359375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 2.0, 12.0, 17.0, 9.0, 28.0, 28.0, 57.0, 79.0, 106.0, 177.0, 251.0, 370.0, 546.0, 841.0, 1126.0, 1674.0, 2428.0, 3455.0, 5184.0, 7621.0, 11771.0, 18063.0, 28643.0, 47428.0, 82636.0, 152420.0, 1301055.0, 183555.0, 98100.0, 55093.0, 33206.0, 20706.0, 13384.0, 8779.0, 5956.0, 3773.0, 2741.0, 1883.0, 1202.0, 804.0, 588.0, 405.0, 289.0, 209.0, 125.0, 106.0, 70.0, 48.0, 27.0, 25.0, 13.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.085693359375, -0.08289718627929688, -0.08010101318359375, -0.07730484008789062, -0.0745086669921875, -0.07171249389648438, -0.06891632080078125, -0.06612014770507812, -0.063323974609375, -0.060527801513671875, -0.05773162841796875, -0.054935455322265625, -0.0521392822265625, -0.049343109130859375, -0.04654693603515625, -0.043750762939453125, -0.04095458984375, -0.038158416748046875, -0.03536224365234375, -0.032566070556640625, -0.0297698974609375, -0.026973724365234375, -0.02417755126953125, -0.021381378173828125, -0.018585205078125, -0.015789031982421875, -0.01299285888671875, -0.010196685791015625, -0.0074005126953125, -0.004604339599609375, -0.00180816650390625, 0.000988006591796875, 0.0037841796875, 0.006580352783203125, 0.00937652587890625, 0.012172698974609375, 0.0149688720703125, 0.017765045166015625, 0.02056121826171875, 0.023357391357421875, 0.026153564453125, 0.028949737548828125, 0.03174591064453125, 0.034542083740234375, 0.0373382568359375, 0.040134429931640625, 0.04293060302734375, 0.045726776123046875, 0.04852294921875, 0.051319122314453125, 0.05411529541015625, 0.056911468505859375, 0.0597076416015625, 0.06250381469726562, 0.06529998779296875, 0.06809616088867188, 0.070892333984375, 0.07368850708007812, 0.07648468017578125, 0.07928085327148438, 0.0820770263671875, 0.08487319946289062, 0.08766937255859375, 0.09046554565429688, 0.09326171875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 5.0, 2.0, 7.0, 11.0, 15.0, 20.0, 22.0, 34.0, 57.0, 89.0, 118.0, 166.0, 144.0, 81.0, 57.0, 41.0, 30.0, 28.0, 15.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011606216430664062, -0.001123964786529541, -0.0010873079299926758, -0.0010506510734558105, -0.0010139942169189453, -0.00097733736038208, -0.0009406805038452148, -0.0009040236473083496, -0.0008673667907714844, -0.0008307099342346191, -0.0007940530776977539, -0.0007573962211608887, -0.0007207393646240234, -0.0006840825080871582, -0.000647425651550293, -0.0006107687950134277, -0.0005741119384765625, -0.0005374550819396973, -0.000500798225402832, -0.0004641413688659668, -0.00042748451232910156, -0.00039082765579223633, -0.0003541707992553711, -0.00031751394271850586, -0.0002808570861816406, -0.0002442002296447754, -0.00020754337310791016, -0.00017088651657104492, -0.0001342296600341797, -9.757280349731445e-05, -6.091594696044922e-05, -2.4259090423583984e-05, 1.239776611328125e-05, 4.9054622650146484e-05, 8.571147918701172e-05, 0.00012236833572387695, 0.0001590251922607422, 0.00019568204879760742, 0.00023233890533447266, 0.0002689957618713379, 0.0003056526184082031, 0.00034230947494506836, 0.0003789663314819336, 0.00041562318801879883, 0.00045228004455566406, 0.0004889369010925293, 0.0005255937576293945, 0.0005622506141662598, 0.000598907470703125, 0.0006355643272399902, 0.0006722211837768555, 0.0007088780403137207, 0.0007455348968505859, 0.0007821917533874512, 0.0008188486099243164, 0.0008555054664611816, 0.0008921623229980469, 0.0009288191795349121, 0.0009654760360717773, 0.0010021328926086426, 0.0010387897491455078, 0.001075446605682373, 0.0011121034622192383, 0.0011487603187561035, 0.0011854171752929688]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 2.0, 7.0, 6.0, 19.0, 21.0, 35.0, 44.0, 47.0, 115.0, 186.0, 479.0, 10880.0, 1033895.0, 1994.0, 368.0, 181.0, 75.0, 53.0, 38.0, 27.0, 16.0, 13.0, 10.0, 3.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023681640625, -0.022949695587158203, -0.022217750549316406, -0.02148580551147461, -0.020753860473632812, -0.020021915435791016, -0.01928997039794922, -0.018558025360107422, -0.017826080322265625, -0.017094135284423828, -0.01636219024658203, -0.015630245208740234, -0.014898300170898438, -0.01416635513305664, -0.013434410095214844, -0.012702465057373047, -0.01197052001953125, -0.011238574981689453, -0.010506629943847656, -0.00977468490600586, -0.009042739868164062, -0.008310794830322266, -0.007578849792480469, -0.006846904754638672, -0.006114959716796875, -0.005383014678955078, -0.004651069641113281, -0.003919124603271484, -0.0031871795654296875, -0.0024552345275878906, -0.0017232894897460938, -0.0009913444519042969, -0.0002593994140625, 0.0004725456237792969, 0.0012044906616210938, 0.0019364356994628906, 0.0026683807373046875, 0.0034003257751464844, 0.004132270812988281, 0.004864215850830078, 0.005596160888671875, 0.006328105926513672, 0.007060050964355469, 0.007791996002197266, 0.008523941040039062, 0.00925588607788086, 0.009987831115722656, 0.010719776153564453, 0.01145172119140625, 0.012183666229248047, 0.012915611267089844, 0.01364755630493164, 0.014379501342773438, 0.015111446380615234, 0.01584339141845703, 0.016575336456298828, 0.017307281494140625, 0.018039226531982422, 0.01877117156982422, 0.019503116607666016, 0.020235061645507812, 0.02096700668334961, 0.021698951721191406, 0.022430896759033203, 0.023162841796875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 67.0, 396.0, 436.0, 77.0, 19.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002718091243878007, -0.0026244448963552713, -0.0025307987816631794, -0.002437152434140444, -0.002343506319448352, -0.0022498599719256163, -0.0021562138572335243, -0.0020625675097107887, -0.001968921162188053, -0.0018752749310806394, -0.0017816286999732256, -0.00168798235245049, -0.001594336237758398, -0.0015006898902356625, -0.0014070436591282487, -0.001313397428020835, -0.001219751313328743, -0.0011261050822213292, -0.0010324588511139154, -0.0009388125617988408, -0.000845166330691427, -0.0007515200995840132, -0.0006578738102689385, -0.0005642275791615248, -0.000470581348054111, -0.00037693511694669724, -0.000283288856735453, -0.00018964259652420878, -9.599636541679502e-05, -2.3501343093812466e-06, 9.129615500569344e-05, 0.0001849423861131072, 0.000278588617220521, 0.00037223484832793474, 0.00046588110853917897, 0.0005595273687504232, 0.000653173599857837, 0.0007468198309652507, 0.0008404661202803254, 0.0009341123513877392, 0.001027758582495153, 0.0011214048136025667, 0.0012150510447099805, 0.0013086972758173943, 0.0014023436233401299, 0.0014959897380322218, 0.0015896360855549574, 0.0016832823166623712, 0.001776928547769785, 0.0018705747788771987, 0.0019642210099846125, 0.002057867357507348, 0.00215151347219944, 0.0022451598197221756, 0.002338806167244911, 0.002432452281937003, 0.002526098396629095, 0.0026197447441518307, 0.0027133908588439226, 0.002807037206366658, 0.00290068332105875, 0.0029943296685814857, 0.0030879760161042213, 0.0031816221307963133, 0.003275268478319049]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 13.0, 13.0, 11.0, 19.0, 10.0, 23.0, 12.0, 18.0, 18.0, 29.0, 36.0, 40.0, 32.0, 34.0, 36.0, 36.0, 39.0, 42.0, 33.0, 34.0, 40.0, 37.0, 43.0, 37.0, 29.0, 34.0, 34.0, 32.0, 25.0, 24.0, 21.0, 24.0, 11.0, 16.0, 14.0, 7.0, 9.0, 7.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005884170532226562, -0.0005696052685379982, -0.0005507934838533401, -0.0005319816991686821, -0.000513169914484024, -0.000494358129799366, -0.00047554634511470795, -0.0004567345604300499, -0.00043792277574539185, -0.0004191109910607338, -0.00040029920637607574, -0.0003814874216914177, -0.00036267563700675964, -0.0003438638523221016, -0.00032505206763744354, -0.0003062402829527855, -0.00028742849826812744, -0.0002686167135834694, -0.00024980492889881134, -0.0002309931442141533, -0.00021218135952949524, -0.0001933695748448372, -0.00017455779016017914, -0.0001557460054755211, -0.00013693422079086304, -0.00011812243610620499, -9.931065142154694e-05, -8.049886673688889e-05, -6.168708205223083e-05, -4.2875297367572784e-05, -2.4063512682914734e-05, -5.251727998256683e-06, 1.3560056686401367e-05, 3.237184137105942e-05, 5.118362605571747e-05, 6.999541074037552e-05, 8.880719542503357e-05, 0.00010761898010969162, 0.00012643076479434967, 0.00014524254947900772, 0.00016405433416366577, 0.00018286611884832382, 0.00020167790353298187, 0.00022048968821763992, 0.00023930147290229797, 0.000258113257586956, 0.0002769250422716141, 0.0002957368269562721, 0.0003145486116409302, 0.0003333603963255882, 0.0003521721810102463, 0.00037098396569490433, 0.0003897957503795624, 0.00040860753506422043, 0.0004274193197488785, 0.00044623110443353653, 0.0004650428891181946, 0.00048385467380285263, 0.0005026664584875107, 0.0005214782431721687, 0.0005402900278568268, 0.0005591018125414848, 0.0005779135972261429, 0.0005967253819108009, 0.000615537166595459]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 4.0, 8.0, 10.0, 6.0, 8.0, 14.0, 20.0, 12.0, 23.0, 21.0, 30.0, 24.0, 34.0, 35.0, 24.0, 37.0, 39.0, 32.0, 38.0, 50.0, 38.0, 36.0, 37.0, 41.0, 38.0, 33.0, 25.0, 40.0, 27.0, 28.0, 29.0, 15.0, 11.0, 20.0, 11.0, 10.0, 15.0, 11.0, 13.0, 10.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.34375, -5.1767578125, -5.009765625, -4.8427734375, -4.67578125, -4.5087890625, -4.341796875, -4.1748046875, -4.0078125, -3.8408203125, -3.673828125, -3.5068359375, -3.33984375, -3.1728515625, -3.005859375, -2.8388671875, -2.671875, -2.5048828125, -2.337890625, -2.1708984375, -2.00390625, -1.8369140625, -1.669921875, -1.5029296875, -1.3359375, -1.1689453125, -1.001953125, -0.8349609375, -0.66796875, -0.5009765625, -0.333984375, -0.1669921875, 0.0, 0.1669921875, 0.333984375, 0.5009765625, 0.66796875, 0.8349609375, 1.001953125, 1.1689453125, 1.3359375, 1.5029296875, 1.669921875, 1.8369140625, 2.00390625, 2.1708984375, 2.337890625, 2.5048828125, 2.671875, 2.8388671875, 3.005859375, 3.1728515625, 3.33984375, 3.5068359375, 3.673828125, 3.8408203125, 4.0078125, 4.1748046875, 4.341796875, 4.5087890625, 4.67578125, 4.8427734375, 5.009765625, 5.1767578125, 5.34375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 10.0, 13.0, 20.0, 25.0, 22.0, 35.0, 72.0, 71.0, 101.0, 153.0, 202.0, 293.0, 401.0, 566.0, 906.0, 1496.0, 2390.0, 4314.0, 7759.0, 14504.0, 27194.0, 53712.0, 106715.0, 209371.0, 276948.0, 166821.0, 83728.0, 41892.0, 21580.0, 11539.0, 6337.0, 3513.0, 2009.0, 1283.0, 826.0, 485.0, 370.0, 259.0, 186.0, 133.0, 84.0, 64.0, 41.0, 28.0, 23.0, 16.0, 15.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.2734375, -5.11029052734375, -4.9471435546875, -4.78399658203125, -4.620849609375, -4.45770263671875, -4.2945556640625, -4.13140869140625, -3.96826171875, -3.80511474609375, -3.6419677734375, -3.47882080078125, -3.315673828125, -3.15252685546875, -2.9893798828125, -2.82623291015625, -2.6630859375, -2.49993896484375, -2.3367919921875, -2.17364501953125, -2.010498046875, -1.84735107421875, -1.6842041015625, -1.52105712890625, -1.35791015625, -1.19476318359375, -1.0316162109375, -0.86846923828125, -0.705322265625, -0.54217529296875, -0.3790283203125, -0.21588134765625, -0.052734375, 0.11041259765625, 0.2735595703125, 0.43670654296875, 0.599853515625, 0.76300048828125, 0.9261474609375, 1.08929443359375, 1.25244140625, 1.41558837890625, 1.5787353515625, 1.74188232421875, 1.905029296875, 2.06817626953125, 2.2313232421875, 2.39447021484375, 2.5576171875, 2.72076416015625, 2.8839111328125, 3.04705810546875, 3.210205078125, 3.37335205078125, 3.5364990234375, 3.69964599609375, 3.86279296875, 4.02593994140625, 4.1890869140625, 4.35223388671875, 4.515380859375, 4.67852783203125, 4.8416748046875, 5.00482177734375, 5.16796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 4.0, 9.0, 11.0, 7.0, 12.0, 25.0, 19.0, 30.0, 33.0, 51.0, 58.0, 78.0, 79.0, 149.0, 299.0, 1400.0, 267.0, 140.0, 77.0, 56.0, 50.0, 41.0, 25.0, 26.0, 24.0, 15.0, 13.0, 9.0, 16.0, 7.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.3868408203125, -12.812744140625, -12.2386474609375, -11.66455078125, -11.0904541015625, -10.516357421875, -9.9422607421875, -9.3681640625, -8.7940673828125, -8.219970703125, -7.6458740234375, -7.07177734375, -6.4976806640625, -5.923583984375, -5.3494873046875, -4.775390625, -4.2012939453125, -3.627197265625, -3.0531005859375, -2.47900390625, -1.9049072265625, -1.330810546875, -0.7567138671875, -0.1826171875, 0.3914794921875, 0.965576171875, 1.5396728515625, 2.11376953125, 2.6878662109375, 3.261962890625, 3.8360595703125, 4.41015625, 4.9842529296875, 5.558349609375, 6.1324462890625, 6.70654296875, 7.2806396484375, 7.854736328125, 8.4288330078125, 9.0029296875, 9.5770263671875, 10.151123046875, 10.7252197265625, 11.29931640625, 11.8734130859375, 12.447509765625, 13.0216064453125, 13.595703125, 14.1697998046875, 14.743896484375, 15.3179931640625, 15.89208984375, 16.4661865234375, 17.040283203125, 17.6143798828125, 18.1884765625, 18.7625732421875, 19.336669921875, 19.9107666015625, 20.48486328125, 21.0589599609375, 21.633056640625, 22.2071533203125, 22.78125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 11.0, 12.0, 8.0, 12.0, 16.0, 14.0, 32.0, 46.0, 31.0, 48.0, 71.0, 102.0, 178.0, 312.0, 662.0, 3235.0, 86730.0, 2972088.0, 77559.0, 3015.0, 641.0, 308.0, 166.0, 114.0, 73.0, 64.0, 40.0, 25.0, 28.0, 16.0, 15.0, 11.0, 4.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-30.859375, -30.077880859375, -29.29638671875, -28.514892578125, -27.7333984375, -26.951904296875, -26.17041015625, -25.388916015625, -24.607421875, -23.825927734375, -23.04443359375, -22.262939453125, -21.4814453125, -20.699951171875, -19.91845703125, -19.136962890625, -18.35546875, -17.573974609375, -16.79248046875, -16.010986328125, -15.2294921875, -14.447998046875, -13.66650390625, -12.885009765625, -12.103515625, -11.322021484375, -10.54052734375, -9.759033203125, -8.9775390625, -8.196044921875, -7.41455078125, -6.633056640625, -5.8515625, -5.070068359375, -4.28857421875, -3.507080078125, -2.7255859375, -1.944091796875, -1.16259765625, -0.381103515625, 0.400390625, 1.181884765625, 1.96337890625, 2.744873046875, 3.5263671875, 4.307861328125, 5.08935546875, 5.870849609375, 6.65234375, 7.433837890625, 8.21533203125, 8.996826171875, 9.7783203125, 10.559814453125, 11.34130859375, 12.122802734375, 12.904296875, 13.685791015625, 14.46728515625, 15.248779296875, 16.0302734375, 16.811767578125, 17.59326171875, 18.374755859375, 19.15625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 12.0, 50.0, 118.0, 212.0, 241.0, 193.0, 111.0, 46.0, 15.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.87434768676758, -34.32606506347656, -31.777782440185547, -29.22949981689453, -26.681217193603516, -24.1329345703125, -21.584651947021484, -19.03636932373047, -16.488086700439453, -13.939804077148438, -11.391521453857422, -8.843238830566406, -6.294956207275391, -3.746673583984375, -1.1983909606933594, 1.3498916625976562, 3.898174285888672, 6.4464569091796875, 8.994739532470703, 11.543022155761719, 14.091304779052734, 16.63958740234375, 19.187870025634766, 21.73615264892578, 24.284435272216797, 26.832717895507812, 29.381000518798828, 31.929283142089844, 34.47756576538086, 37.025848388671875, 39.57413101196289, 42.122413635253906, 44.670692443847656, 47.21897506713867, 49.76725769042969, 52.3155403137207, 54.86382293701172, 57.412105560302734, 59.96038818359375, 62.508670806884766, 65.05695343017578, 67.60523986816406, 70.15351867675781, 72.70179748535156, 75.25008392333984, 77.79837036132812, 80.34664916992188, 82.89492797851562, 85.4432144165039, 87.99150085449219, 90.53977966308594, 93.08805847167969, 95.63634490966797, 98.18463134765625, 100.73291015625, 103.28118896484375, 105.82947540283203, 108.37776184082031, 110.92604064941406, 113.47431945800781, 116.0226058959961, 118.57089233398438, 121.11917114257812, 123.66744995117188, 126.21573638916016]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 13.0, 22.0, 14.0, 14.0, 16.0, 25.0, 23.0, 26.0, 32.0, 34.0, 44.0, 45.0, 36.0, 48.0, 46.0, 38.0, 55.0, 34.0, 39.0, 43.0, 40.0, 41.0, 38.0, 28.0, 22.0, 24.0, 19.0, 19.0, 18.0, 15.0, 13.0, 11.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-43.98972702026367, -42.67571258544922, -41.3616943359375, -40.04767990112305, -38.73366165161133, -37.419647216796875, -36.105628967285156, -34.7916145324707, -33.47760009765625, -32.1635856628418, -30.849567413330078, -29.535551071166992, -28.221534729003906, -26.907520294189453, -25.593503952026367, -24.27948760986328, -22.965469360351562, -21.651453018188477, -20.33743667602539, -19.023420333862305, -17.70940399169922, -16.395389556884766, -15.08137321472168, -13.767356872558594, -12.453340530395508, -11.139324188232422, -9.825307846069336, -8.511292457580566, -7.1972761154174805, -5.8832597732543945, -4.569243907928467, -3.255228042602539, -1.9412155151367188, -0.6271994113922119, 0.6868166923522949, 2.0008327960968018, 3.3148488998413086, 4.6288652420043945, 5.942881107330322, 7.25689697265625, 8.570913314819336, 9.884929656982422, 11.198945999145508, 12.512961387634277, 13.826977729797363, 15.14099407196045, 16.45500946044922, 17.769025802612305, 19.08304214477539, 20.397058486938477, 21.711074829101562, 23.02509117126465, 24.339107513427734, 25.653121948242188, 26.967138290405273, 28.28115463256836, 29.595170974731445, 30.90918731689453, 32.223201751708984, 33.5372200012207, 34.851234436035156, 36.165252685546875, 37.47926712036133, 38.79328155517578, 40.1072998046875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 7.0, 8.0, 12.0, 12.0, 18.0, 11.0, 16.0, 14.0, 22.0, 15.0, 29.0, 18.0, 31.0, 39.0, 40.0, 33.0, 42.0, 38.0, 27.0, 40.0, 42.0, 36.0, 34.0, 37.0, 37.0, 27.0, 33.0, 32.0, 25.0, 20.0, 17.0, 15.0, 13.0, 21.0, 22.0, 12.0, 14.0, 13.0, 8.0, 7.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.2578125, -5.0858154296875, -4.913818359375, -4.7418212890625, -4.56982421875, -4.3978271484375, -4.225830078125, -4.0538330078125, -3.8818359375, -3.7098388671875, -3.537841796875, -3.3658447265625, -3.19384765625, -3.0218505859375, -2.849853515625, -2.6778564453125, -2.505859375, -2.3338623046875, -2.161865234375, -1.9898681640625, -1.81787109375, -1.6458740234375, -1.473876953125, -1.3018798828125, -1.1298828125, -0.9578857421875, -0.785888671875, -0.6138916015625, -0.44189453125, -0.2698974609375, -0.097900390625, 0.0740966796875, 0.24609375, 0.4180908203125, 0.590087890625, 0.7620849609375, 0.93408203125, 1.1060791015625, 1.278076171875, 1.4500732421875, 1.6220703125, 1.7940673828125, 1.966064453125, 2.1380615234375, 2.31005859375, 2.4820556640625, 2.654052734375, 2.8260498046875, 2.998046875, 3.1700439453125, 3.342041015625, 3.5140380859375, 3.68603515625, 3.8580322265625, 4.030029296875, 4.2020263671875, 4.3740234375, 4.5460205078125, 4.718017578125, 4.8900146484375, 5.06201171875, 5.2340087890625, 5.406005859375, 5.5780029296875, 5.75]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 6.0, 6.0, 17.0, 12.0, 7.0, 11.0, 13.0, 27.0, 32.0, 42.0, 59.0, 81.0, 150.0, 201.0, 359.0, 680.0, 1403.0, 3079.0, 8223.0, 28132.0, 167334.0, 2439550.0, 1411730.0, 100443.0, 20768.0, 6644.0, 2591.0, 1155.0, 610.0, 335.0, 177.0, 100.0, 67.0, 45.0, 37.0, 23.0, 27.0, 17.0, 16.0, 8.0, 15.0, 8.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.3125, -31.26611328125, -30.2197265625, -29.17333984375, -28.126953125, -27.08056640625, -26.0341796875, -24.98779296875, -23.94140625, -22.89501953125, -21.8486328125, -20.80224609375, -19.755859375, -18.70947265625, -17.6630859375, -16.61669921875, -15.5703125, -14.52392578125, -13.4775390625, -12.43115234375, -11.384765625, -10.33837890625, -9.2919921875, -8.24560546875, -7.19921875, -6.15283203125, -5.1064453125, -4.06005859375, -3.013671875, -1.96728515625, -0.9208984375, 0.12548828125, 1.171875, 2.21826171875, 3.2646484375, 4.31103515625, 5.357421875, 6.40380859375, 7.4501953125, 8.49658203125, 9.54296875, 10.58935546875, 11.6357421875, 12.68212890625, 13.728515625, 14.77490234375, 15.8212890625, 16.86767578125, 17.9140625, 18.96044921875, 20.0068359375, 21.05322265625, 22.099609375, 23.14599609375, 24.1923828125, 25.23876953125, 26.28515625, 27.33154296875, 28.3779296875, 29.42431640625, 30.470703125, 31.51708984375, 32.5634765625, 33.60986328125, 34.65625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 14.0, 15.0, 27.0, 46.0, 56.0, 101.0, 233.0, 417.0, 779.0, 930.0, 612.0, 379.0, 212.0, 114.0, 58.0, 37.0, 24.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.78125, -28.767578125, -27.75390625, -26.740234375, -25.7265625, -24.712890625, -23.69921875, -22.685546875, -21.671875, -20.658203125, -19.64453125, -18.630859375, -17.6171875, -16.603515625, -15.58984375, -14.576171875, -13.5625, -12.548828125, -11.53515625, -10.521484375, -9.5078125, -8.494140625, -7.48046875, -6.466796875, -5.453125, -4.439453125, -3.42578125, -2.412109375, -1.3984375, -0.384765625, 0.62890625, 1.642578125, 2.65625, 3.669921875, 4.68359375, 5.697265625, 6.7109375, 7.724609375, 8.73828125, 9.751953125, 10.765625, 11.779296875, 12.79296875, 13.806640625, 14.8203125, 15.833984375, 16.84765625, 17.861328125, 18.875, 19.888671875, 20.90234375, 21.916015625, 22.9296875, 23.943359375, 24.95703125, 25.970703125, 26.984375, 27.998046875, 29.01171875, 30.025390625, 31.0390625, 32.052734375, 33.06640625, 34.080078125, 35.09375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 13.0, 14.0, 17.0, 24.0, 36.0, 46.0, 66.0, 66.0, 106.0, 182.0, 330.0, 718.0, 2214.0, 8853.0, 46328.0, 521715.0, 3272750.0, 298418.0, 32413.0, 6643.0, 1829.0, 609.0, 279.0, 184.0, 107.0, 77.0, 48.0, 39.0, 34.0, 32.0, 17.0, 19.0, 16.0, 6.0, 10.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.375, -35.2861328125, -34.197265625, -33.1083984375, -32.01953125, -30.9306640625, -29.841796875, -28.7529296875, -27.6640625, -26.5751953125, -25.486328125, -24.3974609375, -23.30859375, -22.2197265625, -21.130859375, -20.0419921875, -18.953125, -17.8642578125, -16.775390625, -15.6865234375, -14.59765625, -13.5087890625, -12.419921875, -11.3310546875, -10.2421875, -9.1533203125, -8.064453125, -6.9755859375, -5.88671875, -4.7978515625, -3.708984375, -2.6201171875, -1.53125, -0.4423828125, 0.646484375, 1.7353515625, 2.82421875, 3.9130859375, 5.001953125, 6.0908203125, 7.1796875, 8.2685546875, 9.357421875, 10.4462890625, 11.53515625, 12.6240234375, 13.712890625, 14.8017578125, 15.890625, 16.9794921875, 18.068359375, 19.1572265625, 20.24609375, 21.3349609375, 22.423828125, 23.5126953125, 24.6015625, 25.6904296875, 26.779296875, 27.8681640625, 28.95703125, 30.0458984375, 31.134765625, 32.2236328125, 33.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 27.0, 22.0, 16.0, 32.0, 45.0, 61.0, 69.0, 77.0, 77.0, 101.0, 80.0, 67.0, 77.0, 54.0, 40.0, 26.0, 30.0, 17.0, 15.0, 11.0, 2.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-119.81044006347656, -115.21060180664062, -110.61077117919922, -106.01094055175781, -101.41110229492188, -96.81126403808594, -92.21143341064453, -87.61160278320312, -83.01176452636719, -78.41192626953125, -73.81209564208984, -69.21226501464844, -64.6124267578125, -60.01259231567383, -55.412757873535156, -50.812923431396484, -46.21308898925781, -41.61325454711914, -37.01342010498047, -32.4135856628418, -27.813751220703125, -23.213916778564453, -18.61408233642578, -14.01424789428711, -9.414413452148438, -4.814579010009766, -0.21474456787109375, 4.385089874267578, 8.98492431640625, 13.584758758544922, 18.184593200683594, 22.784427642822266, 27.384246826171875, 31.984081268310547, 36.58391571044922, 41.18375015258789, 45.78358459472656, 50.383419036865234, 54.983253479003906, 59.58308792114258, 64.18292236328125, 68.78276062011719, 73.3825912475586, 77.982421875, 82.58226013183594, 87.18209838867188, 91.78192901611328, 96.38175964355469, 100.98159790039062, 105.58143615722656, 110.18126678466797, 114.78109741210938, 119.38093566894531, 123.98077392578125, 128.58059692382812, 133.18043518066406, 137.7802734375, 142.38011169433594, 146.97994995117188, 151.57977294921875, 156.1796112060547, 160.77944946289062, 165.3792724609375, 169.97911071777344, 174.57894897460938]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 8.0, 13.0, 12.0, 9.0, 13.0, 22.0, 15.0, 18.0, 21.0, 26.0, 24.0, 35.0, 29.0, 28.0, 36.0, 43.0, 39.0, 44.0, 54.0, 37.0, 51.0, 29.0, 36.0, 41.0, 33.0, 31.0, 32.0, 39.0, 34.0, 23.0, 25.0, 18.0, 17.0, 13.0, 6.0, 8.0, 8.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-103.0640869140625, -100.19120025634766, -97.31831359863281, -94.44542694091797, -91.57254028320312, -88.69965362548828, -85.82676696777344, -82.95388793945312, -80.08099365234375, -77.2081069946289, -74.33522033691406, -71.46233367919922, -68.58944702148438, -65.71656036376953, -62.84367752075195, -59.97079086303711, -57.09790802001953, -54.22502136230469, -51.352134704589844, -48.479248046875, -45.606361389160156, -42.73347473144531, -39.860591888427734, -36.98770523071289, -34.11481857299805, -31.241931915283203, -28.36904525756836, -25.49616050720215, -22.623273849487305, -19.75038719177246, -16.87750244140625, -14.004615783691406, -11.131729125976562, -8.258842468261719, -5.385956764221191, -2.513071060180664, 0.3598155975341797, 3.2327022552490234, 6.105587005615234, 8.978473663330078, 11.851360321044922, 14.724246978759766, 17.59713363647461, 20.47001838684082, 23.342905044555664, 26.215791702270508, 29.08867645263672, 31.961563110351562, 34.834449768066406, 37.70733642578125, 40.580223083496094, 43.45310974121094, 46.32599639892578, 49.198883056640625, 52.0717658996582, 54.94465255737305, 57.81753921508789, 60.690425872802734, 63.56331253051758, 66.43619537353516, 69.30908203125, 72.18196868896484, 75.05485534667969, 77.92774200439453, 80.80062866210938]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 6.0, 16.0, 15.0, 15.0, 19.0, 18.0, 21.0, 26.0, 21.0, 31.0, 23.0, 35.0, 42.0, 43.0, 50.0, 44.0, 50.0, 43.0, 41.0, 47.0, 52.0, 37.0, 32.0, 38.0, 34.0, 39.0, 28.0, 31.0, 19.0, 17.0, 9.0, 10.0, 11.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-250.625, -243.646484375, -236.66796875, -229.689453125, -222.7109375, -215.732421875, -208.75390625, -201.775390625, -194.796875, -187.818359375, -180.83984375, -173.861328125, -166.8828125, -159.904296875, -152.92578125, -145.947265625, -138.96875, -131.990234375, -125.01171875, -118.033203125, -111.0546875, -104.076171875, -97.09765625, -90.119140625, -83.140625, -76.162109375, -69.18359375, -62.205078125, -55.2265625, -48.248046875, -41.26953125, -34.291015625, -27.3125, -20.333984375, -13.35546875, -6.376953125, 0.6015625, 7.580078125, 14.55859375, 21.537109375, 28.515625, 35.494140625, 42.47265625, 49.451171875, 56.4296875, 63.408203125, 70.38671875, 77.365234375, 84.34375, 91.322265625, 98.30078125, 105.279296875, 112.2578125, 119.236328125, 126.21484375, 133.193359375, 140.171875, 147.150390625, 154.12890625, 161.107421875, 168.0859375, 175.064453125, 182.04296875, 189.021484375, 196.0]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 10.0, 18.0, 17.0, 21.0, 51.0, 87.0, 119.0, 142.0, 245.0, 428.0, 628.0, 964.0, 1668.0, 2590.0, 4469.0, 7540.0, 13304.0, 23379.0, 42008.0, 79523.0, 173573.0, 360450.0, 165376.0, 77008.0, 40903.0, 22577.0, 12837.0, 7327.0, 4410.0, 2580.0, 1628.0, 956.0, 579.0, 407.0, 239.0, 173.0, 129.0, 56.0, 41.0, 28.0, 23.0, 14.0, 16.0, 2.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5390625, -7.3138427734375, -7.088623046875, -6.8634033203125, -6.63818359375, -6.4129638671875, -6.187744140625, -5.9625244140625, -5.7373046875, -5.5120849609375, -5.286865234375, -5.0616455078125, -4.83642578125, -4.6112060546875, -4.385986328125, -4.1607666015625, -3.935546875, -3.7103271484375, -3.485107421875, -3.2598876953125, -3.03466796875, -2.8094482421875, -2.584228515625, -2.3590087890625, -2.1337890625, -1.9085693359375, -1.683349609375, -1.4581298828125, -1.23291015625, -1.0076904296875, -0.782470703125, -0.5572509765625, -0.33203125, -0.1068115234375, 0.118408203125, 0.3436279296875, 0.56884765625, 0.7940673828125, 1.019287109375, 1.2445068359375, 1.4697265625, 1.6949462890625, 1.920166015625, 2.1453857421875, 2.37060546875, 2.5958251953125, 2.821044921875, 3.0462646484375, 3.271484375, 3.4967041015625, 3.721923828125, 3.9471435546875, 4.17236328125, 4.3975830078125, 4.622802734375, 4.8480224609375, 5.0732421875, 5.2984619140625, 5.523681640625, 5.7489013671875, 5.97412109375, 6.1993408203125, 6.424560546875, 6.6497802734375, 6.875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 5.0, 7.0, 13.0, 9.0, 15.0, 16.0, 17.0, 16.0, 25.0, 18.0, 27.0, 25.0, 38.0, 41.0, 30.0, 30.0, 34.0, 42.0, 44.0, 37.0, 1071.0, 29.0, 33.0, 42.0, 39.0, 30.0, 32.0, 32.0, 24.0, 28.0, 31.0, 12.0, 19.0, 12.0, 22.0, 14.0, 14.0, 14.0, 5.0, 6.0, 5.0, 3.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.5, -133.83984375, -129.1796875, -124.51953125, -119.859375, -115.19921875, -110.5390625, -105.87890625, -101.21875, -96.55859375, -91.8984375, -87.23828125, -82.578125, -77.91796875, -73.2578125, -68.59765625, -63.9375, -59.27734375, -54.6171875, -49.95703125, -45.296875, -40.63671875, -35.9765625, -31.31640625, -26.65625, -21.99609375, -17.3359375, -12.67578125, -8.015625, -3.35546875, 1.3046875, 5.96484375, 10.625, 15.28515625, 19.9453125, 24.60546875, 29.265625, 33.92578125, 38.5859375, 43.24609375, 47.90625, 52.56640625, 57.2265625, 61.88671875, 66.546875, 71.20703125, 75.8671875, 80.52734375, 85.1875, 89.84765625, 94.5078125, 99.16796875, 103.828125, 108.48828125, 113.1484375, 117.80859375, 122.46875, 127.12890625, 131.7890625, 136.44921875, 141.109375, 145.76953125, 150.4296875, 155.08984375, 159.75]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 12.0, 16.0, 13.0, 39.0, 44.0, 77.0, 101.0, 172.0, 254.0, 352.0, 550.0, 821.0, 1265.0, 1849.0, 2820.0, 4292.0, 6624.0, 10201.0, 15684.0, 25178.0, 40450.0, 67584.0, 124013.0, 1322280.0, 217783.0, 100715.0, 57103.0, 35064.0, 21866.0, 14004.0, 8888.0, 5835.0, 3855.0, 2526.0, 1654.0, 1054.0, 705.0, 462.0, 294.0, 215.0, 135.0, 95.0, 70.0, 39.0, 22.0, 16.0, 14.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.95703125, -3.8365478515625, -3.716064453125, -3.5955810546875, -3.47509765625, -3.3546142578125, -3.234130859375, -3.1136474609375, -2.9931640625, -2.8726806640625, -2.752197265625, -2.6317138671875, -2.51123046875, -2.3907470703125, -2.270263671875, -2.1497802734375, -2.029296875, -1.9088134765625, -1.788330078125, -1.6678466796875, -1.54736328125, -1.4268798828125, -1.306396484375, -1.1859130859375, -1.0654296875, -0.9449462890625, -0.824462890625, -0.7039794921875, -0.58349609375, -0.4630126953125, -0.342529296875, -0.2220458984375, -0.1015625, 0.0189208984375, 0.139404296875, 0.2598876953125, 0.38037109375, 0.5008544921875, 0.621337890625, 0.7418212890625, 0.8623046875, 0.9827880859375, 1.103271484375, 1.2237548828125, 1.34423828125, 1.4647216796875, 1.585205078125, 1.7056884765625, 1.826171875, 1.9466552734375, 2.067138671875, 2.1876220703125, 2.30810546875, 2.4285888671875, 2.549072265625, 2.6695556640625, 2.7900390625, 2.9105224609375, 3.031005859375, 3.1514892578125, 3.27197265625, 3.3924560546875, 3.512939453125, 3.6334228515625, 3.75390625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 10.0, 6.0, 11.0, 15.0, 8.0, 16.0, 15.0, 24.0, 26.0, 39.0, 49.0, 58.0, 55.0, 79.0, 82.0, 84.0, 62.0, 55.0, 60.0, 54.0, 32.0, 28.0, 23.0, 24.0, 17.0, 12.0, 10.0, 8.0, 3.0, 5.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015625, -0.015136480331420898, -0.014647960662841797, -0.014159440994262695, -0.013670921325683594, -0.013182401657104492, -0.01269388198852539, -0.012205362319946289, -0.011716842651367188, -0.011228322982788086, -0.010739803314208984, -0.010251283645629883, -0.009762763977050781, -0.00927424430847168, -0.008785724639892578, -0.008297204971313477, -0.007808685302734375, -0.0073201656341552734, -0.006831645965576172, -0.00634312629699707, -0.005854606628417969, -0.005366086959838867, -0.004877567291259766, -0.004389047622680664, -0.0039005279541015625, -0.003412008285522461, -0.0029234886169433594, -0.002434968948364258, -0.0019464492797851562, -0.0014579296112060547, -0.0009694099426269531, -0.00048089027404785156, 7.62939453125e-06, 0.0004961490631103516, 0.0009846687316894531, 0.0014731884002685547, 0.0019617080688476562, 0.002450227737426758, 0.0029387474060058594, 0.003427267074584961, 0.0039157867431640625, 0.004404306411743164, 0.004892826080322266, 0.005381345748901367, 0.005869865417480469, 0.00635838508605957, 0.006846904754638672, 0.0073354244232177734, 0.007823944091796875, 0.008312463760375977, 0.008800983428955078, 0.00928950309753418, 0.009778022766113281, 0.010266542434692383, 0.010755062103271484, 0.011243581771850586, 0.011732101440429688, 0.012220621109008789, 0.01270914077758789, 0.013197660446166992, 0.013686180114746094, 0.014174699783325195, 0.014663219451904297, 0.015151739120483398, 0.0156402587890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 4.0, 15.0, 19.0, 28.0, 49.0, 92.0, 112.0, 188.0, 374.0, 595.0, 1023.0, 1945.0, 3838.0, 8340.0, 18819.0, 48435.0, 152236.0, 500630.0, 208434.0, 60946.0, 23005.0, 9705.0, 4585.0, 2295.0, 1214.0, 656.0, 367.0, 232.0, 123.0, 75.0, 64.0, 41.0, 26.0, 9.0, 10.0, 8.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09222412109375, -0.08955955505371094, -0.08689498901367188, -0.08423042297363281, -0.08156585693359375, -0.07890129089355469, -0.07623672485351562, -0.07357215881347656, -0.0709075927734375, -0.06824302673339844, -0.06557846069335938, -0.06291389465332031, -0.06024932861328125, -0.05758476257324219, -0.054920196533203125, -0.05225563049316406, -0.049591064453125, -0.04692649841308594, -0.044261932373046875, -0.04159736633300781, -0.03893280029296875, -0.03626823425292969, -0.033603668212890625, -0.030939102172851562, -0.0282745361328125, -0.025609970092773438, -0.022945404052734375, -0.020280838012695312, -0.01761627197265625, -0.014951705932617188, -0.012287139892578125, -0.009622573852539062, -0.0069580078125, -0.0042934417724609375, -0.001628875732421875, 0.0010356903076171875, 0.00370025634765625, 0.0063648223876953125, 0.009029388427734375, 0.011693954467773438, 0.0143585205078125, 0.017023086547851562, 0.019687652587890625, 0.022352218627929688, 0.02501678466796875, 0.027681350708007812, 0.030345916748046875, 0.03301048278808594, 0.035675048828125, 0.03833961486816406, 0.041004180908203125, 0.04366874694824219, 0.04633331298828125, 0.04899787902832031, 0.051662445068359375, 0.05432701110839844, 0.0569915771484375, 0.05965614318847656, 0.062320709228515625, 0.06498527526855469, 0.06764984130859375, 0.07031440734863281, 0.07297897338867188, 0.07564353942871094, 0.07830810546875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 3.0, 11.0, 7.0, 7.0, 9.0, 18.0, 20.0, 22.0, 29.0, 38.0, 55.0, 61.0, 67.0, 73.0, 74.0, 84.0, 72.0, 72.0, 47.0, 44.0, 44.0, 33.0, 25.0, 19.0, 15.0, 13.0, 3.0, 7.0, 3.0, 9.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0177143607288599, -0.017120180651545525, -0.016525998711586, -0.01593181863427162, -0.01533763762563467, -0.014743456616997719, -0.014149276539683342, -0.01355509553104639, -0.012960914522409439, -0.012366733513772488, -0.011772552505135536, -0.01117837242782116, -0.010584191419184208, -0.009990010410547256, -0.00939583033323288, -0.008801649324595928, -0.008207468315958977, -0.007613287307322025, -0.007019106764346361, -0.006424926221370697, -0.005830745212733746, -0.005236564204096794, -0.00464238366112113, -0.004048203118145466, -0.0034540221095085144, -0.0028598413337022066, -0.002265660557895899, -0.001671479782089591, -0.0010772990062832832, -0.00048311823047697544, 0.00011106254532933235, 0.0007052430883049965, 0.0012994222342967987, 0.0018936030101031065, 0.0024877837859094143, 0.003081964561715722, 0.00367614533752203, 0.004270326346158981, 0.0048645068891346455, 0.00545868743211031, 0.006052868440747261, 0.0066470494493842125, 0.007241229992359877, 0.00783541053533554, 0.008429591543972492, 0.009023772552609444, 0.00961795262992382, 0.010212133638560772, 0.010806314647197723, 0.011400495655834675, 0.011994676664471626, 0.012588856741786003, 0.013183037750422955, 0.013777218759059906, 0.014371398836374283, 0.014965579845011234, 0.015559760853648186, 0.016153940930962563, 0.01674812287092209, 0.017342302948236465, 0.017936483025550842, 0.01853066496551037, 0.019124845042824745, 0.01971902698278427, 0.020313207060098648]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 14.0, 14.0, 13.0, 17.0, 10.0, 31.0, 21.0, 24.0, 35.0, 27.0, 34.0, 31.0, 36.0, 42.0, 46.0, 54.0, 37.0, 31.0, 39.0, 45.0, 46.0, 42.0, 33.0, 32.0, 23.0, 34.0, 22.0, 25.0, 24.0, 20.0, 15.0, 19.0, 8.0, 5.0, 6.0, 11.0, 5.0, 3.0, 0.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.011652886867523193, -0.011288831941783428, -0.010924777016043663, -0.010560722090303898, -0.010196667164564133, -0.009832612238824368, -0.009468557313084602, -0.009104502387344837, -0.008740447461605072, -0.008376392535865307, -0.008012337610125542, -0.0076482826843857765, -0.007284227758646011, -0.006920172832906246, -0.006556117907166481, -0.006192062981426716, -0.005828008055686951, -0.0054639531299471855, -0.00509989820420742, -0.004735843278467655, -0.00437178835272789, -0.004007733426988125, -0.0036436785012483597, -0.0032796235755085945, -0.0029155686497688293, -0.002551513724029064, -0.002187458798289299, -0.0018234038725495338, -0.0014593489468097687, -0.0010952940210700035, -0.0007312390953302383, -0.0003671841695904732, -3.129243850708008e-06, 0.00036092568188905716, 0.0007249806076288223, 0.0010890355333685875, 0.0014530904591083527, 0.0018171453848481178, 0.002181200310587883, 0.002545255236327648, 0.0029093101620674133, 0.0032733650878071785, 0.0036374200135469437, 0.004001474939286709, 0.004365529865026474, 0.004729584790766239, 0.005093639716506004, 0.0054576946422457695, 0.005821749567985535, 0.0061858044937253, 0.006549859419465065, 0.00691391434520483, 0.007277969270944595, 0.0076420241966843605, 0.008006079122424126, 0.00837013404816389, 0.008734188973903656, 0.009098243899643421, 0.009462298825383186, 0.009826353751122952, 0.010190408676862717, 0.010554463602602482, 0.010918518528342247, 0.011282573454082012, 0.011646628379821777]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 6.0, 16.0, 15.0, 15.0, 19.0, 18.0, 21.0, 26.0, 21.0, 31.0, 23.0, 34.0, 43.0, 43.0, 50.0, 44.0, 49.0, 44.0, 41.0, 46.0, 53.0, 37.0, 31.0, 39.0, 33.0, 40.0, 28.0, 29.0, 21.0, 17.0, 9.0, 10.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-250.625, -243.6484375, -236.671875, -229.6953125, -222.71875, -215.7421875, -208.765625, -201.7890625, -194.8125, -187.8359375, -180.859375, -173.8828125, -166.90625, -159.9296875, -152.953125, -145.9765625, -139.0, -132.0234375, -125.046875, -118.0703125, -111.09375, -104.1171875, -97.140625, -90.1640625, -83.1875, -76.2109375, -69.234375, -62.2578125, -55.28125, -48.3046875, -41.328125, -34.3515625, -27.375, -20.3984375, -13.421875, -6.4453125, 0.53125, 7.5078125, 14.484375, 21.4609375, 28.4375, 35.4140625, 42.390625, 49.3671875, 56.34375, 63.3203125, 70.296875, 77.2734375, 84.25, 91.2265625, 98.203125, 105.1796875, 112.15625, 119.1328125, 126.109375, 133.0859375, 140.0625, 147.0390625, 154.015625, 160.9921875, 167.96875, 174.9453125, 181.921875, 188.8984375, 195.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 4.0, 13.0, 6.0, 8.0, 19.0, 13.0, 22.0, 22.0, 22.0, 27.0, 41.0, 62.0, 87.0, 172.0, 270.0, 567.0, 1804.0, 14631.0, 440088.0, 567335.0, 19808.0, 1988.0, 651.0, 302.0, 184.0, 115.0, 62.0, 57.0, 42.0, 30.0, 28.0, 20.0, 7.0, 12.0, 10.0, 5.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-49.65625, -48.27880859375, -46.9013671875, -45.52392578125, -44.146484375, -42.76904296875, -41.3916015625, -40.01416015625, -38.63671875, -37.25927734375, -35.8818359375, -34.50439453125, -33.126953125, -31.74951171875, -30.3720703125, -28.99462890625, -27.6171875, -26.23974609375, -24.8623046875, -23.48486328125, -22.107421875, -20.72998046875, -19.3525390625, -17.97509765625, -16.59765625, -15.22021484375, -13.8427734375, -12.46533203125, -11.087890625, -9.71044921875, -8.3330078125, -6.95556640625, -5.578125, -4.20068359375, -2.8232421875, -1.44580078125, -0.068359375, 1.30908203125, 2.6865234375, 4.06396484375, 5.44140625, 6.81884765625, 8.1962890625, 9.57373046875, 10.951171875, 12.32861328125, 13.7060546875, 15.08349609375, 16.4609375, 17.83837890625, 19.2158203125, 20.59326171875, 21.970703125, 23.34814453125, 24.7255859375, 26.10302734375, 27.48046875, 28.85791015625, 30.2353515625, 31.61279296875, 32.990234375, 34.36767578125, 35.7451171875, 37.12255859375, 38.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 18.0, 19.0, 24.0, 20.0, 36.0, 33.0, 43.0, 65.0, 62.0, 79.0, 80.0, 2105.0, 75.0, 48.0, 63.0, 50.0, 46.0, 47.0, 25.0, 24.0, 14.0, 11.0, 10.0, 10.0, 10.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-443.0, -429.23046875, -415.4609375, -401.69140625, -387.921875, -374.15234375, -360.3828125, -346.61328125, -332.84375, -319.07421875, -305.3046875, -291.53515625, -277.765625, -263.99609375, -250.2265625, -236.45703125, -222.6875, -208.91796875, -195.1484375, -181.37890625, -167.609375, -153.83984375, -140.0703125, -126.30078125, -112.53125, -98.76171875, -84.9921875, -71.22265625, -57.453125, -43.68359375, -29.9140625, -16.14453125, -2.375, 11.39453125, 25.1640625, 38.93359375, 52.703125, 66.47265625, 80.2421875, 94.01171875, 107.78125, 121.55078125, 135.3203125, 149.08984375, 162.859375, 176.62890625, 190.3984375, 204.16796875, 217.9375, 231.70703125, 245.4765625, 259.24609375, 273.015625, 286.78515625, 300.5546875, 314.32421875, 328.09375, 341.86328125, 355.6328125, 369.40234375, 383.171875, 396.94140625, 410.7109375, 424.48046875, 438.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 12.0, 12.0, 19.0, 34.0, 75.0, 147.0, 333.0, 1014.0, 5484.0, 92770.0, 2982915.0, 57071.0, 4294.0, 929.0, 303.0, 135.0, 56.0, 31.0, 19.0, 5.0, 10.0, 9.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.84375, -38.71923828125, -37.5947265625, -36.47021484375, -35.345703125, -34.22119140625, -33.0966796875, -31.97216796875, -30.84765625, -29.72314453125, -28.5986328125, -27.47412109375, -26.349609375, -25.22509765625, -24.1005859375, -22.97607421875, -21.8515625, -20.72705078125, -19.6025390625, -18.47802734375, -17.353515625, -16.22900390625, -15.1044921875, -13.97998046875, -12.85546875, -11.73095703125, -10.6064453125, -9.48193359375, -8.357421875, -7.23291015625, -6.1083984375, -4.98388671875, -3.859375, -2.73486328125, -1.6103515625, -0.48583984375, 0.638671875, 1.76318359375, 2.8876953125, 4.01220703125, 5.13671875, 6.26123046875, 7.3857421875, 8.51025390625, 9.634765625, 10.75927734375, 11.8837890625, 13.00830078125, 14.1328125, 15.25732421875, 16.3818359375, 17.50634765625, 18.630859375, 19.75537109375, 20.8798828125, 22.00439453125, 23.12890625, 24.25341796875, 25.3779296875, 26.50244140625, 27.626953125, 28.75146484375, 29.8759765625, 31.00048828125, 32.125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 5.0, 8.0, 14.0, 15.0, 22.0, 43.0, 51.0, 91.0, 196.0, 204.0, 153.0, 68.0, 29.0, 35.0, 15.0, 10.0, 7.0, 2.0, 6.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-559.679443359375, -539.1724853515625, -518.66552734375, -498.1585998535156, -477.6516418457031, -457.1446838378906, -436.63775634765625, -416.13079833984375, -395.62384033203125, -375.11688232421875, -354.60992431640625, -334.1029968261719, -313.5960388183594, -293.0890808105469, -272.5821533203125, -252.0751953125, -231.5682373046875, -211.061279296875, -190.55433654785156, -170.04739379882812, -149.54043579101562, -129.03347778320312, -108.52653503417969, -88.01959228515625, -67.51263427734375, -47.00568389892578, -26.498733520507812, -5.991783142089844, 14.515167236328125, 35.022117614746094, 55.52906799316406, 76.0360107421875, 96.54296875, 117.04991912841797, 137.55686950683594, 158.06381225585938, 178.57077026367188, 199.07772827148438, 219.5846710205078, 240.09161376953125, 260.59857177734375, 281.10552978515625, 301.61248779296875, 322.1194152832031, 342.6263732910156, 363.1333312988281, 383.6402587890625, 404.147216796875, 424.6541748046875, 445.1611328125, 465.6680908203125, 486.1750183105469, 506.6819763183594, 527.1889038085938, 547.6958618164062, 568.2028198242188, 588.7097778320312, 609.2167358398438, 629.7236938476562, 650.2306518554688, 670.737548828125, 691.2445068359375, 711.75146484375, 732.2584228515625, 752.765380859375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 5.0, 7.0, 11.0, 17.0, 23.0, 16.0, 23.0, 18.0, 13.0, 26.0, 24.0, 27.0, 31.0, 55.0, 44.0, 43.0, 48.0, 49.0, 50.0, 40.0, 33.0, 34.0, 44.0, 29.0, 34.0, 27.0, 48.0, 29.0, 26.0, 18.0, 18.0, 12.0, 15.0, 7.0, 8.0, 9.0, 2.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-704.7015380859375, -684.605224609375, -664.5088500976562, -644.4125366210938, -624.316162109375, -604.2198486328125, -584.1234741210938, -564.0271606445312, -543.9307861328125, -523.83447265625, -503.73809814453125, -483.6417541503906, -463.54541015625, -443.4490661621094, -423.35272216796875, -403.25640869140625, -383.1600646972656, -363.063720703125, -342.9673767089844, -322.87103271484375, -302.7746887207031, -282.6783447265625, -262.58203125, -242.4856719970703, -222.3893280029297, -202.29298400878906, -182.19664001464844, -162.10031127929688, -142.00396728515625, -121.9076156616211, -101.811279296875, -81.71493530273438, -61.61859130859375, -41.522247314453125, -21.425907135009766, -1.3295669555664062, 18.76677703857422, 38.863121032714844, 58.95945739746094, 79.05580139160156, 99.15214538574219, 119.24848937988281, 139.34483337402344, 159.441162109375, 179.53750610351562, 199.63385009765625, 219.73019409179688, 239.8265380859375, 259.9228820800781, 280.01922607421875, 300.1155700683594, 320.2119140625, 340.3082580566406, 360.40460205078125, 380.50091552734375, 400.5972900390625, 420.693603515625, 440.7899475097656, 460.88629150390625, 480.9826354980469, 501.0789794921875, 521.17529296875, 541.2716674804688, 561.3679809570312, 581.46435546875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 10.0, 9.0, 9.0, 12.0, 22.0, 24.0, 29.0, 37.0, 27.0, 51.0, 54.0, 109.0, 177.0, 263.0, 552.0, 1553.0, 5682.0, 1025233.0, 10269.0, 2567.0, 775.0, 362.0, 226.0, 138.0, 71.0, 51.0, 41.0, 27.0, 30.0, 12.0, 14.0, 17.0, 11.0, 18.0, 11.0, 7.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-148.81954956054688, -144.12600708007812, -139.43246459960938, -134.73892211914062, -130.0453643798828, -125.35182189941406, -120.65827941894531, -115.96473693847656, -111.27119445800781, -106.57765197753906, -101.88410186767578, -97.19055938720703, -92.49701690673828, -87.803466796875, -83.10992431640625, -78.4163818359375, -73.72283172607422, -69.02928924560547, -64.33573913574219, -59.64219665527344, -54.94865417480469, -50.25510787963867, -45.561561584472656, -40.868019104003906, -36.17447280883789, -31.480928421020508, -26.787384033203125, -22.09383773803711, -17.400293350219727, -12.706748962402344, -8.013202667236328, -3.319660186767578, 1.3738861083984375, 6.0674309730529785, 10.76097583770752, 15.454521179199219, 20.1480655670166, 24.841609954833984, 29.53515625, 34.22869873046875, 38.922245025634766, 43.61579132080078, 48.30933380126953, 53.00288009643555, 57.69642639160156, 62.38996887207031, 67.08351135253906, 71.77705383300781, 76.4706039428711, 81.16414642333984, 85.85769653320312, 90.55123901367188, 95.24478149414062, 99.93832397460938, 104.63187408447266, 109.3254165649414, 114.01896667480469, 118.71250915527344, 123.40605926513672, 128.099609375, 132.79315185546875, 137.4866943359375, 142.18023681640625, 146.873779296875, 151.56732177734375]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 2.0, 5.0, 12.0, 12.0, 24.0, 30.0, 65.0, 85.0, 155.0, 286.0, 550.0, 2039.0, 49823.0, 51402116.0, 6298.0, 911.0, 310.0, 159.0, 93.0, 56.0, 30.0, 10.0, 15.0, 17.0, 15.0, 6.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-407.26434326171875, -394.21893310546875, -381.1735534667969, -368.1281433105469, -355.082763671875, -342.037353515625, -328.991943359375, -315.9465637207031, -302.90118408203125, -289.85577392578125, -276.8103942871094, -263.7649841308594, -250.7196044921875, -237.6741943359375, -224.62879943847656, -211.58340454101562, -198.53799438476562, -185.4925994873047, -172.44720458984375, -159.40179443359375, -146.35641479492188, -133.31100463867188, -120.26560974121094, -107.22021484375, -94.17481994628906, -81.12942504882812, -68.08403015136719, -55.03862762451172, -41.99323272705078, -28.947837829589844, -15.902435302734375, -2.8570404052734375, 10.188385009765625, 23.233781814575195, 36.279178619384766, 49.32457733154297, 62.369972229003906, 75.41536712646484, 88.46076965332031, 101.50616455078125, 114.55155944824219, 127.59695434570312, 140.64234924316406, 153.687744140625, 166.733154296875, 179.77853393554688, 192.82394409179688, 205.8693389892578, 218.91473388671875, 231.9601287841797, 245.00552368164062, 258.0509338378906, 271.0963134765625, 284.1417236328125, 297.1871337890625, 310.2325134277344, 323.27789306640625, 336.32330322265625, 349.3686828613281, 362.4140930175781, 375.45947265625, 388.5048828125, 401.55029296875, 414.5956726074219, 427.6410827636719]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 2.0, 8.0, 21.0, 19.0, 33.0, 61.0, 75.0, 119.0, 196.0, 338.0, 471.0, 742.0, 1195.0, 1776.0, 2593.0, 3998.0, 6034.0, 9242.0, 14371.0, 23046.0, 36345.0, 58880.0, 99671.0, 175856.0, 340920.0, 783054.0, 3871106.0, 385483.0, 195006.0, 109252.0, 64453.0, 38800.0, 24846.0, 15508.0, 9789.0, 6259.0, 4011.0, 2649.0, 1727.0, 1129.0, 739.0, 530.0, 325.0, 246.0, 170.0, 116.0, 85.0, 42.0, 35.0, 29.0, 14.0, 5.0, 0.0, 2.0, 2.0, 1.0, 5.0], "bins": [-1.134765625, -1.1004638671875, -1.066162109375, -1.0318603515625, -0.99755859375, -0.9632568359375, -0.928955078125, -0.8946533203125, -0.8603515625, -0.8260498046875, -0.791748046875, -0.7574462890625, -0.72314453125, -0.6888427734375, -0.654541015625, -0.6202392578125, -0.5859375, -0.5516357421875, -0.517333984375, -0.4830322265625, -0.44873046875, -0.4144287109375, -0.380126953125, -0.3458251953125, -0.3115234375, -0.2772216796875, -0.242919921875, -0.2086181640625, -0.17431640625, -0.1400146484375, -0.105712890625, -0.0714111328125, -0.037109375, -0.0028076171875, 0.031494140625, 0.0657958984375, 0.10009765625, 0.1343994140625, 0.168701171875, 0.2030029296875, 0.2373046875, 0.2716064453125, 0.305908203125, 0.3402099609375, 0.37451171875, 0.4088134765625, 0.443115234375, 0.4774169921875, 0.51171875, 0.5460205078125, 0.580322265625, 0.6146240234375, 0.64892578125, 0.6832275390625, 0.717529296875, 0.7518310546875, 0.7861328125, 0.8204345703125, 0.854736328125, 0.8890380859375, 0.92333984375, 0.9576416015625, 0.991943359375, 1.0262451171875, 1.060546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 11.0, 5.0, 7.0, 15.0, 12.0, 13.0, 24.0, 13.0, 36.0, 24.0, 32.0, 37.0, 35.0, 37.0, 41.0, 35.0, 39.0, 53.0, 1064.0, 41.0, 54.0, 44.0, 35.0, 35.0, 33.0, 32.0, 26.0, 27.0, 28.0, 12.0, 22.0, 17.0, 12.0, 9.0, 10.0, 11.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.0, -65.90234375, -63.8046875, -61.70703125, -59.609375, -57.51171875, -55.4140625, -53.31640625, -51.21875, -49.12109375, -47.0234375, -44.92578125, -42.828125, -40.73046875, -38.6328125, -36.53515625, -34.4375, -32.33984375, -30.2421875, -28.14453125, -26.046875, -23.94921875, -21.8515625, -19.75390625, -17.65625, -15.55859375, -13.4609375, -11.36328125, -9.265625, -7.16796875, -5.0703125, -2.97265625, -0.875, 1.22265625, 3.3203125, 5.41796875, 7.515625, 9.61328125, 11.7109375, 13.80859375, 15.90625, 18.00390625, 20.1015625, 22.19921875, 24.296875, 26.39453125, 28.4921875, 30.58984375, 32.6875, 34.78515625, 36.8828125, 38.98046875, 41.078125, 43.17578125, 45.2734375, 47.37109375, 49.46875, 51.56640625, 53.6640625, 55.76171875, 57.859375, 59.95703125, 62.0546875, 64.15234375, 66.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 9.0, 9.0, 30.0, 38.0, 45.0, 68.0, 120.0, 158.0, 226.0, 349.0, 481.0, 754.0, 1175.0, 1732.0, 2617.0, 4137.0, 6467.0, 10102.0, 15675.0, 25011.0, 39961.0, 66043.0, 114546.0, 215911.0, 440240.0, 3932259.0, 674187.0, 332650.0, 168221.0, 92687.0, 54211.0, 33213.0, 20643.0, 13314.0, 8331.0, 5452.0, 3527.0, 2330.0, 1530.0, 971.0, 661.0, 425.0, 270.0, 190.0, 126.0, 78.0, 61.0, 54.0, 41.0, 29.0, 14.0, 15.0, 9.0, 10.0, 5.0, 4.0], "bins": [-0.94775390625, -0.9197235107421875, -0.891693115234375, -0.8636627197265625, -0.83563232421875, -0.8076019287109375, -0.779571533203125, -0.7515411376953125, -0.7235107421875, -0.6954803466796875, -0.667449951171875, -0.6394195556640625, -0.61138916015625, -0.5833587646484375, -0.555328369140625, -0.5272979736328125, -0.499267578125, -0.4712371826171875, -0.443206787109375, -0.4151763916015625, -0.38714599609375, -0.3591156005859375, -0.331085205078125, -0.3030548095703125, -0.2750244140625, -0.2469940185546875, -0.218963623046875, -0.1909332275390625, -0.16290283203125, -0.1348724365234375, -0.106842041015625, -0.0788116455078125, -0.05078125, -0.0227508544921875, 0.005279541015625, 0.0333099365234375, 0.06134033203125, 0.0893707275390625, 0.117401123046875, 0.1454315185546875, 0.1734619140625, 0.2014923095703125, 0.229522705078125, 0.2575531005859375, 0.28558349609375, 0.3136138916015625, 0.341644287109375, 0.3696746826171875, 0.397705078125, 0.4257354736328125, 0.453765869140625, 0.4817962646484375, 0.50982666015625, 0.5378570556640625, 0.565887451171875, 0.5939178466796875, 0.6219482421875, 0.6499786376953125, 0.678009033203125, 0.7060394287109375, 0.73406982421875, 0.7621002197265625, 0.790130615234375, 0.8181610107421875, 0.84619140625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 3.0, 11.0, 10.0, 10.0, 12.0, 11.0, 10.0, 13.0, 14.0, 23.0, 19.0, 20.0, 19.0, 29.0, 31.0, 38.0, 31.0, 30.0, 42.0, 30.0, 34.0, 1061.0, 33.0, 51.0, 36.0, 40.0, 37.0, 40.0, 31.0, 33.0, 23.0, 14.0, 25.0, 15.0, 21.0, 19.0, 11.0, 14.0, 14.0, 8.0, 8.0, 8.0, 6.0, 6.0, 5.0, 4.0, 1.0, 8.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-47.78125, -46.2177734375, -44.654296875, -43.0908203125, -41.52734375, -39.9638671875, -38.400390625, -36.8369140625, -35.2734375, -33.7099609375, -32.146484375, -30.5830078125, -29.01953125, -27.4560546875, -25.892578125, -24.3291015625, -22.765625, -21.2021484375, -19.638671875, -18.0751953125, -16.51171875, -14.9482421875, -13.384765625, -11.8212890625, -10.2578125, -8.6943359375, -7.130859375, -5.5673828125, -4.00390625, -2.4404296875, -0.876953125, 0.6865234375, 2.25, 3.8134765625, 5.376953125, 6.9404296875, 8.50390625, 10.0673828125, 11.630859375, 13.1943359375, 14.7578125, 16.3212890625, 17.884765625, 19.4482421875, 21.01171875, 22.5751953125, 24.138671875, 25.7021484375, 27.265625, 28.8291015625, 30.392578125, 31.9560546875, 33.51953125, 35.0830078125, 36.646484375, 38.2099609375, 39.7734375, 41.3369140625, 42.900390625, 44.4638671875, 46.02734375, 47.5908203125, 49.154296875, 50.7177734375, 52.28125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 11.0, 18.0, 12.0, 23.0, 31.0, 34.0, 50.0, 58.0, 69.0, 116.0, 127.0, 134.0, 199.0, 260.0, 333.0, 466.0, 702.0, 981.0, 1525.0, 2588.0, 5597.0, 14041.0, 42023.0, 198596.0, 5906098.0, 77368.0, 21565.0, 8411.0, 3772.0, 1990.0, 1154.0, 790.0, 535.0, 407.0, 308.0, 241.0, 218.0, 152.0, 101.0, 82.0, 52.0, 55.0, 40.0, 32.0, 19.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.30078125, -4.16302490234375, -4.0252685546875, -3.88751220703125, -3.749755859375, -3.61199951171875, -3.4742431640625, -3.33648681640625, -3.19873046875, -3.06097412109375, -2.9232177734375, -2.78546142578125, -2.647705078125, -2.50994873046875, -2.3721923828125, -2.23443603515625, -2.0966796875, -1.95892333984375, -1.8211669921875, -1.68341064453125, -1.545654296875, -1.40789794921875, -1.2701416015625, -1.13238525390625, -0.99462890625, -0.85687255859375, -0.7191162109375, -0.58135986328125, -0.443603515625, -0.30584716796875, -0.1680908203125, -0.03033447265625, 0.107421875, 0.24517822265625, 0.3829345703125, 0.52069091796875, 0.658447265625, 0.79620361328125, 0.9339599609375, 1.07171630859375, 1.20947265625, 1.34722900390625, 1.4849853515625, 1.62274169921875, 1.760498046875, 1.89825439453125, 2.0360107421875, 2.17376708984375, 2.3115234375, 2.44927978515625, 2.5870361328125, 2.72479248046875, 2.862548828125, 3.00030517578125, 3.1380615234375, 3.27581787109375, 3.41357421875, 3.55133056640625, 3.6890869140625, 3.82684326171875, 3.964599609375, 4.10235595703125, 4.2401123046875, 4.37786865234375, 4.515625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 8.0, 9.0, 11.0, 10.0, 9.0, 21.0, 18.0, 15.0, 23.0, 19.0, 27.0, 23.0, 33.0, 35.0, 36.0, 27.0, 29.0, 33.0, 31.0, 41.0, 1073.0, 32.0, 47.0, 32.0, 37.0, 27.0, 32.0, 34.0, 36.0, 31.0, 18.0, 31.0, 14.0, 15.0, 14.0, 19.0, 16.0, 16.0, 10.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-52.0625, -50.552734375, -49.04296875, -47.533203125, -46.0234375, -44.513671875, -43.00390625, -41.494140625, -39.984375, -38.474609375, -36.96484375, -35.455078125, -33.9453125, -32.435546875, -30.92578125, -29.416015625, -27.90625, -26.396484375, -24.88671875, -23.376953125, -21.8671875, -20.357421875, -18.84765625, -17.337890625, -15.828125, -14.318359375, -12.80859375, -11.298828125, -9.7890625, -8.279296875, -6.76953125, -5.259765625, -3.75, -2.240234375, -0.73046875, 0.779296875, 2.2890625, 3.798828125, 5.30859375, 6.818359375, 8.328125, 9.837890625, 11.34765625, 12.857421875, 14.3671875, 15.876953125, 17.38671875, 18.896484375, 20.40625, 21.916015625, 23.42578125, 24.935546875, 26.4453125, 27.955078125, 29.46484375, 30.974609375, 32.484375, 33.994140625, 35.50390625, 37.013671875, 38.5234375, 40.033203125, 41.54296875, 43.052734375, 44.5625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 13.0, 128.0, 808.0, 31.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-701.2349853515625, -687.2791748046875, -673.3233032226562, -659.3674926757812, -645.4116821289062, -631.4558715820312, -617.5, -603.544189453125, -589.58837890625, -575.632568359375, -561.6766967773438, -547.7208862304688, -533.7650756835938, -519.8092651367188, -505.8533935546875, -491.8975830078125, -477.9417419433594, -463.98590087890625, -450.03009033203125, -436.0742492675781, -422.1184387207031, -408.16259765625, -394.206787109375, -380.2509460449219, -366.29510498046875, -352.3392639160156, -338.3834533691406, -324.4276123046875, -310.4718017578125, -296.5159606933594, -282.56011962890625, -268.60430908203125, -254.64846801757812, -240.69264221191406, -226.73681640625, -212.78097534179688, -198.82516479492188, -184.86932373046875, -170.9134979248047, -156.95767211914062, -143.00184631347656, -129.0460205078125, -115.09019470214844, -101.13436126708984, -87.17853546142578, -73.22270965576172, -59.266876220703125, -45.31105041503906, -31.355224609375, -17.399396896362305, -3.4435691833496094, 10.512260437011719, 24.46808624267578, 38.423912048339844, 52.37974548339844, 66.3355712890625, 80.29139709472656, 94.24722290039062, 108.20304870605469, 122.15888214111328, 136.11471557617188, 150.07052612304688, 164.0263671875, 177.98219299316406, 191.93801879882812]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 1.0, 4.0, 10.0, 10.0, 16.0, 15.0, 18.0, 22.0, 26.0, 33.0, 22.0, 37.0, 31.0, 44.0, 41.0, 40.0, 46.0, 42.0, 46.0, 48.0, 44.0, 45.0, 41.0, 39.0, 40.0, 35.0, 27.0, 24.0, 23.0, 20.0, 15.0, 15.0, 12.0, 12.0, 9.0, 9.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.25540161132812, -123.369873046875, -119.48434448242188, -115.59882354736328, -111.71329498291016, -107.82776641845703, -103.94224548339844, -100.05671691894531, -96.17118835449219, -92.28565979003906, -88.40013122558594, -84.51461029052734, -80.62908172607422, -76.7435531616211, -72.8580322265625, -68.97250366210938, -65.08697509765625, -61.201446533203125, -57.315921783447266, -53.430397033691406, -49.54486846923828, -45.659339904785156, -41.7738151550293, -37.88829040527344, -34.00276184082031, -30.11723518371582, -26.231708526611328, -22.346181869506836, -18.460655212402344, -14.575128555297852, -10.68960189819336, -6.804075241088867, -2.918548583984375, 0.9669780731201172, 4.852504730224609, 8.738031387329102, 12.623558044433594, 16.509084701538086, 20.394611358642578, 24.28013801574707, 28.165664672851562, 32.05119323730469, 35.93671798706055, 39.822242736816406, 43.70777130126953, 47.593299865722656, 51.478824615478516, 55.364349365234375, 59.2498779296875, 63.135406494140625, 67.02093505859375, 70.90645599365234, 74.79198455810547, 78.6775131225586, 82.56303405761719, 86.44856262207031, 90.33409118652344, 94.21961975097656, 98.10514831542969, 101.99066925048828, 105.8761978149414, 109.76172637939453, 113.64724731445312, 117.53277587890625, 121.41830444335938]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 0.0, 6.0, 2.0, 6.0, 2.0, 1.0, 6.0, 0.0, 4.0, 3.0, 7.0, 18.0, 6.0, 3.0, 1.0, 16.0, 5.0, 14.0, 15.0, 11.0, 15.0, 14.0, 24.0, 26.0, 39.0, 76.0, 103.0, 360.0, 2873.0, 56601.0, 4117218.0, 14809.0, 1520.0, 213.0, 46.0, 30.0, 35.0, 33.0, 19.0, 15.0, 10.0, 18.0, 4.0, 12.0, 8.0, 8.0, 2.0, 6.0, 5.0, 8.0, 0.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-0.1676025390625, -0.1627063751220703, -0.15781021118164062, -0.15291404724121094, -0.14801788330078125, -0.14312171936035156, -0.13822555541992188, -0.1333293914794922, -0.1284332275390625, -0.12353706359863281, -0.11864089965820312, -0.11374473571777344, -0.10884857177734375, -0.10395240783691406, -0.09905624389648438, -0.09416007995605469, -0.089263916015625, -0.08436775207519531, -0.07947158813476562, -0.07457542419433594, -0.06967926025390625, -0.06478309631347656, -0.059886932373046875, -0.05499076843261719, -0.0500946044921875, -0.04519844055175781, -0.040302276611328125, -0.03540611267089844, -0.03050994873046875, -0.025613784790039062, -0.020717620849609375, -0.015821456909179688, -0.01092529296875, -0.0060291290283203125, -0.001132965087890625, 0.0037631988525390625, 0.00865936279296875, 0.013555526733398438, 0.018451690673828125, 0.023347854614257812, 0.0282440185546875, 0.03314018249511719, 0.038036346435546875, 0.04293251037597656, 0.04782867431640625, 0.05272483825683594, 0.057621002197265625, 0.06251716613769531, 0.067413330078125, 0.07230949401855469, 0.07720565795898438, 0.08210182189941406, 0.08699798583984375, 0.09189414978027344, 0.09679031372070312, 0.10168647766113281, 0.1065826416015625, 0.11147880554199219, 0.11637496948242188, 0.12127113342285156, 0.12616729736328125, 0.13106346130371094, 0.13595962524414062, 0.1408557891845703, 0.145751953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 10.0, 6.0, 7.0, 13.0, 13.0, 17.0, 715.0, 94.0, 20.0, 15.0, 6.0, 4.0, 10.0, 11.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1058349609375, -0.10268402099609375, -0.0995330810546875, -0.09638214111328125, -0.093231201171875, -0.09008026123046875, -0.0869293212890625, -0.08377838134765625, -0.08062744140625, -0.07747650146484375, -0.0743255615234375, -0.07117462158203125, -0.068023681640625, -0.06487274169921875, -0.0617218017578125, -0.05857086181640625, -0.055419921875, -0.05226898193359375, -0.0491180419921875, -0.04596710205078125, -0.042816162109375, -0.03966522216796875, -0.0365142822265625, -0.03336334228515625, -0.03021240234375, -0.02706146240234375, -0.0239105224609375, -0.02075958251953125, -0.017608642578125, -0.01445770263671875, -0.0113067626953125, -0.00815582275390625, -0.0050048828125, -0.00185394287109375, 0.0012969970703125, 0.00444793701171875, 0.007598876953125, 0.01074981689453125, 0.0139007568359375, 0.01705169677734375, 0.02020263671875, 0.02335357666015625, 0.0265045166015625, 0.02965545654296875, 0.032806396484375, 0.03595733642578125, 0.0391082763671875, 0.04225921630859375, 0.04541015625, 0.04856109619140625, 0.0517120361328125, 0.05486297607421875, 0.058013916015625, 0.06116485595703125, 0.0643157958984375, 0.06746673583984375, 0.07061767578125, 0.07376861572265625, 0.0769195556640625, 0.08007049560546875, 0.083221435546875, 0.08637237548828125, 0.0895233154296875, 0.09267425537109375, 0.0958251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 2.0, 5.0, 14.0, 2.0, 12.0, 19.0, 21.0, 37.0, 71.0, 108.0, 138.0, 313.0, 537.0, 1440.0, 5015.0, 204959.0, 3970652.0, 8460.0, 1577.0, 458.0, 177.0, 83.0, 58.0, 39.0, 18.0, 19.0, 7.0, 7.0, 5.0, 5.0, 4.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177490234375, -0.17196083068847656, -0.16643142700195312, -0.1609020233154297, -0.15537261962890625, -0.1498432159423828, -0.14431381225585938, -0.13878440856933594, -0.1332550048828125, -0.12772560119628906, -0.12219619750976562, -0.11666679382324219, -0.11113739013671875, -0.10560798645019531, -0.10007858276367188, -0.09454917907714844, -0.089019775390625, -0.08349037170410156, -0.07796096801757812, -0.07243156433105469, -0.06690216064453125, -0.06137275695800781, -0.055843353271484375, -0.05031394958496094, -0.0447845458984375, -0.03925514221191406, -0.033725738525390625, -0.028196334838867188, -0.02266693115234375, -0.017137527465820312, -0.011608123779296875, -0.0060787200927734375, -0.00054931640625, 0.0049800872802734375, 0.010509490966796875, 0.016038894653320312, 0.02156829833984375, 0.027097702026367188, 0.032627105712890625, 0.03815650939941406, 0.0436859130859375, 0.04921531677246094, 0.054744720458984375, 0.06027412414550781, 0.06580352783203125, 0.07133293151855469, 0.07686233520507812, 0.08239173889160156, 0.087921142578125, 0.09345054626464844, 0.09897994995117188, 0.10450935363769531, 0.11003875732421875, 0.11556816101074219, 0.12109756469726562, 0.12662696838378906, 0.1321563720703125, 0.13768577575683594, 0.14321517944335938, 0.1487445831298828, 0.15427398681640625, 0.1598033905029297, 0.16533279418945312, 0.17086219787597656, 0.1763916015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 7.0, 4.0, 24.0, 67.0, 290.0, 2684.0, 719.0, 151.0, 48.0, 22.0, 14.0, 3.0, 7.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1121826171875, -0.10921096801757812, -0.10623931884765625, -0.10326766967773438, -0.1002960205078125, -0.09732437133789062, -0.09435272216796875, -0.09138107299804688, -0.088409423828125, -0.08543777465820312, -0.08246612548828125, -0.07949447631835938, -0.0765228271484375, -0.07355117797851562, -0.07057952880859375, -0.06760787963867188, -0.06463623046875, -0.061664581298828125, -0.05869293212890625, -0.055721282958984375, -0.0527496337890625, -0.049777984619140625, -0.04680633544921875, -0.043834686279296875, -0.040863037109375, -0.037891387939453125, -0.03491973876953125, -0.031948089599609375, -0.0289764404296875, -0.026004791259765625, -0.02303314208984375, -0.020061492919921875, -0.01708984375, -0.014118194580078125, -0.01114654541015625, -0.008174896240234375, -0.0052032470703125, -0.002231597900390625, 0.00074005126953125, 0.003711700439453125, 0.006683349609375, 0.009654998779296875, 0.01262664794921875, 0.015598297119140625, 0.0185699462890625, 0.021541595458984375, 0.02451324462890625, 0.027484893798828125, 0.03045654296875, 0.033428192138671875, 0.03639984130859375, 0.039371490478515625, 0.0423431396484375, 0.045314788818359375, 0.04828643798828125, 0.051258087158203125, 0.054229736328125, 0.057201385498046875, 0.06017303466796875, 0.06314468383789062, 0.0661163330078125, 0.06908798217773438, 0.07205963134765625, 0.07503128051757812, 0.0780029296875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 10.0, 27.0, 606.0, 305.0, 27.0, 9.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5389622449874878, -0.5269617438316345, -0.5149612426757812, -0.502960741519928, -0.4909602701663971, -0.4789597690105438, -0.46695929765701294, -0.45495879650115967, -0.4429582953453064, -0.4309577941894531, -0.41895729303359985, -0.40695682168006897, -0.3949563205242157, -0.3829558193683624, -0.37095534801483154, -0.35895484685897827, -0.346954345703125, -0.33495384454727173, -0.32295334339141846, -0.3109528720378876, -0.2989523708820343, -0.28695186972618103, -0.27495139837265015, -0.2629508972167969, -0.2509503960609436, -0.23894989490509033, -0.22694940865039825, -0.21494892239570618, -0.2029484212398529, -0.19094792008399963, -0.17894743382930756, -0.16694694757461548, -0.1549464464187622, -0.14294594526290894, -0.13094545900821686, -0.11894496530294418, -0.10694447159767151, -0.09494397789239883, -0.08294348418712616, -0.07094299048185349, -0.05894249677658081, -0.046942003071308136, -0.03494150936603546, -0.022941015660762787, -0.010940521955490112, 0.0010599717497825623, 0.013060465455055237, 0.02506095916032791, 0.037061452865600586, 0.04906194657087326, 0.061062440276145935, 0.07306293398141861, 0.08506342768669128, 0.09706392139196396, 0.10906441509723663, 0.12106490880250931, 0.13306540250778198, 0.14506590366363525, 0.15706638991832733, 0.1690668761730194, 0.18106737732887268, 0.19306787848472595, 0.20506836473941803, 0.2170688509941101, 0.22906935214996338]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 10.0, 7.0, 5.0, 9.0, 5.0, 13.0, 26.0, 44.0, 55.0, 101.0, 128.0, 132.0, 131.0, 96.0, 75.0, 42.0, 22.0, 16.0, 11.0, 7.0, 5.0, 10.0, 5.0, 5.0, 0.0, 7.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.39849191904067993, -0.3884199559688568, -0.3783479928970337, -0.3682760000228882, -0.35820403695106506, -0.34813207387924194, -0.33806008100509644, -0.3279881179332733, -0.3179161548614502, -0.3078441917896271, -0.29777222871780396, -0.28770023584365845, -0.2776282727718353, -0.2675563097000122, -0.2574843168258667, -0.24741235375404358, -0.23734039068222046, -0.22726842761039734, -0.21719644963741302, -0.2071244716644287, -0.1970525085926056, -0.18698054552078247, -0.17690856754779816, -0.16683658957481384, -0.15676462650299072, -0.1466926634311676, -0.1366206854581833, -0.12654870748519897, -0.11647674441337585, -0.10640477389097214, -0.09633280336856842, -0.0862608328461647, -0.07618886232376099, -0.06611689180135727, -0.05604492127895355, -0.045972950756549835, -0.03590098023414612, -0.0258290097117424, -0.015757039189338684, -0.005685068666934967, 0.00438690185546875, 0.014458872377872467, 0.024530842900276184, 0.0346028134226799, 0.04467478394508362, 0.054746754467487335, 0.06481872498989105, 0.07489069551229477, 0.08496266603469849, 0.0950346365571022, 0.10510660707950592, 0.11517857760190964, 0.12525054812431335, 0.13532251119613647, 0.1453944891691208, 0.1554664671421051, 0.16553843021392822, 0.17561039328575134, 0.18568237125873566, 0.19575434923171997, 0.2058263123035431, 0.2158982753753662, 0.22597025334835052, 0.23604223132133484, 0.24611419439315796]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 18.0, 17.0, 36.0, 59.0, 73.0, 108.0, 184.0, 206.0, 343.0, 451.0, 765.0, 1075.0, 1660.0, 2695.0, 4454.0, 8430.0, 18642.0, 175983.0, 790616.0, 20833.0, 9017.0, 4853.0, 2737.0, 1818.0, 1130.0, 721.0, 504.0, 333.0, 204.0, 181.0, 122.0, 75.0, 58.0, 39.0, 20.0, 28.0, 21.0, 7.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444580078125, -0.4297904968261719, -0.41500091552734375, -0.4002113342285156, -0.3854217529296875, -0.3706321716308594, -0.35584259033203125, -0.3410530090332031, -0.326263427734375, -0.3114738464355469, -0.29668426513671875, -0.2818946838378906, -0.2671051025390625, -0.2523155212402344, -0.23752593994140625, -0.22273635864257812, -0.20794677734375, -0.19315719604492188, -0.17836761474609375, -0.16357803344726562, -0.1487884521484375, -0.13399887084960938, -0.11920928955078125, -0.10441970825195312, -0.089630126953125, -0.07484054565429688, -0.06005096435546875, -0.045261383056640625, -0.0304718017578125, -0.015682220458984375, -0.00089263916015625, 0.013896942138671875, 0.0286865234375, 0.043476104736328125, 0.05826568603515625, 0.07305526733398438, 0.0878448486328125, 0.10263442993164062, 0.11742401123046875, 0.13221359252929688, 0.147003173828125, 0.16179275512695312, 0.17658233642578125, 0.19137191772460938, 0.2061614990234375, 0.22095108032226562, 0.23574066162109375, 0.2505302429199219, 0.26531982421875, 0.2801094055175781, 0.29489898681640625, 0.3096885681152344, 0.3244781494140625, 0.3392677307128906, 0.35405731201171875, 0.3688468933105469, 0.383636474609375, 0.3984260559082031, 0.41321563720703125, 0.4280052185058594, 0.4427947998046875, 0.4575843811035156, 0.47237396240234375, 0.4871635437011719, 0.501953125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 11.0, 13.0, 10.0, 69.0, 739.0, 27.0, 14.0, 12.0, 3.0, 7.0, 10.0, 7.0, 3.0, 4.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10589599609375, -0.10278129577636719, -0.09966659545898438, -0.09655189514160156, -0.09343719482421875, -0.09032249450683594, -0.08720779418945312, -0.08409309387207031, -0.0809783935546875, -0.07786369323730469, -0.07474899291992188, -0.07163429260253906, -0.06851959228515625, -0.06540489196777344, -0.062290191650390625, -0.05917549133300781, -0.056060791015625, -0.05294609069824219, -0.049831390380859375, -0.04671669006347656, -0.04360198974609375, -0.04048728942871094, -0.037372589111328125, -0.03425788879394531, -0.0311431884765625, -0.028028488159179688, -0.024913787841796875, -0.021799087524414062, -0.01868438720703125, -0.015569686889648438, -0.012454986572265625, -0.009340286254882812, -0.0062255859375, -0.0031108856201171875, 3.814697265625e-06, 0.0031185150146484375, 0.00623321533203125, 0.009347915649414062, 0.012462615966796875, 0.015577316284179688, 0.0186920166015625, 0.021806716918945312, 0.024921417236328125, 0.028036117553710938, 0.03115081787109375, 0.03426551818847656, 0.037380218505859375, 0.04049491882324219, 0.043609619140625, 0.04672431945800781, 0.049839019775390625, 0.05295372009277344, 0.05606842041015625, 0.05918312072753906, 0.062297821044921875, 0.06541252136230469, 0.0685272216796875, 0.07164192199707031, 0.07475662231445312, 0.07787132263183594, 0.08098602294921875, 0.08410072326660156, 0.08721542358398438, 0.09033012390136719, 0.09344482421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 8.0, 13.0, 20.0, 30.0, 32.0, 59.0, 49.0, 68.0, 86.0, 93.0, 135.0, 199.0, 353.0, 678.0, 1159.0, 2412.0, 5854.0, 16505.0, 63494.0, 549617.0, 339015.0, 46358.0, 12779.0, 4772.0, 2133.0, 1013.0, 577.0, 287.0, 173.0, 144.0, 82.0, 84.0, 67.0, 64.0, 36.0, 34.0, 15.0, 16.0, 10.0, 6.0, 11.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.251708984375, -0.24449729919433594, -0.23728561401367188, -0.2300739288330078, -0.22286224365234375, -0.2156505584716797, -0.20843887329101562, -0.20122718811035156, -0.1940155029296875, -0.18680381774902344, -0.17959213256835938, -0.1723804473876953, -0.16516876220703125, -0.1579570770263672, -0.15074539184570312, -0.14353370666503906, -0.136322021484375, -0.12911033630371094, -0.12189865112304688, -0.11468696594238281, -0.10747528076171875, -0.10026359558105469, -0.09305191040039062, -0.08584022521972656, -0.0786285400390625, -0.07141685485839844, -0.06420516967773438, -0.05699348449707031, -0.04978179931640625, -0.04257011413574219, -0.035358428955078125, -0.028146743774414062, -0.02093505859375, -0.013723373413085938, -0.006511688232421875, 0.0006999969482421875, 0.00791168212890625, 0.015123367309570312, 0.022335052490234375, 0.029546737670898438, 0.0367584228515625, 0.04397010803222656, 0.051181793212890625, 0.05839347839355469, 0.06560516357421875, 0.07281684875488281, 0.08002853393554688, 0.08724021911621094, 0.094451904296875, 0.10166358947753906, 0.10887527465820312, 0.11608695983886719, 0.12329864501953125, 0.1305103302001953, 0.13772201538085938, 0.14493370056152344, 0.1521453857421875, 0.15935707092285156, 0.16656875610351562, 0.1737804412841797, 0.18099212646484375, 0.1882038116455078, 0.19541549682617188, 0.20262718200683594, 0.2098388671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 8.0, 7.0, 13.0, 18.0, 13.0, 21.0, 18.0, 18.0, 20.0, 21.0, 27.0, 26.0, 26.0, 36.0, 33.0, 36.0, 44.0, 29.0, 47.0, 36.0, 33.0, 43.0, 49.0, 38.0, 37.0, 33.0, 31.0, 35.0, 35.0, 23.0, 13.0, 23.0, 13.0, 15.0, 17.0, 9.0, 22.0, 4.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.37841796875, -0.3673553466796875, -0.356292724609375, -0.3452301025390625, -0.33416748046875, -0.3231048583984375, -0.312042236328125, -0.3009796142578125, -0.2899169921875, -0.2788543701171875, -0.267791748046875, -0.2567291259765625, -0.24566650390625, -0.2346038818359375, -0.223541259765625, -0.2124786376953125, -0.201416015625, -0.1903533935546875, -0.179290771484375, -0.1682281494140625, -0.15716552734375, -0.1461029052734375, -0.135040283203125, -0.1239776611328125, -0.1129150390625, -0.1018524169921875, -0.090789794921875, -0.0797271728515625, -0.06866455078125, -0.0576019287109375, -0.046539306640625, -0.0354766845703125, -0.0244140625, -0.0133514404296875, -0.002288818359375, 0.0087738037109375, 0.01983642578125, 0.0308990478515625, 0.041961669921875, 0.0530242919921875, 0.0640869140625, 0.0751495361328125, 0.086212158203125, 0.0972747802734375, 0.10833740234375, 0.1194000244140625, 0.130462646484375, 0.1415252685546875, 0.152587890625, 0.1636505126953125, 0.174713134765625, 0.1857757568359375, 0.19683837890625, 0.2079010009765625, 0.218963623046875, 0.2300262451171875, 0.2410888671875, 0.2521514892578125, 0.263214111328125, 0.2742767333984375, 0.28533935546875, 0.2964019775390625, 0.307464599609375, 0.3185272216796875, 0.32958984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 7.0, 8.0, 9.0, 17.0, 16.0, 36.0, 59.0, 108.0, 230.0, 476.0, 1163.0, 4851.0, 174406.0, 857683.0, 7082.0, 1422.0, 490.0, 205.0, 107.0, 61.0, 31.0, 24.0, 14.0, 8.0, 12.0, 8.0, 7.0, 2.0, 0.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.114013671875, -0.11109733581542969, -0.10818099975585938, -0.10526466369628906, -0.10234832763671875, -0.09943199157714844, -0.09651565551757812, -0.09359931945800781, -0.0906829833984375, -0.08776664733886719, -0.08485031127929688, -0.08193397521972656, -0.07901763916015625, -0.07610130310058594, -0.07318496704101562, -0.07026863098144531, -0.067352294921875, -0.06443595886230469, -0.061519622802734375, -0.05860328674316406, -0.05568695068359375, -0.05277061462402344, -0.049854278564453125, -0.04693794250488281, -0.0440216064453125, -0.04110527038574219, -0.038188934326171875, -0.03527259826660156, -0.03235626220703125, -0.029439926147460938, -0.026523590087890625, -0.023607254028320312, -0.02069091796875, -0.017774581909179688, -0.014858245849609375, -0.011941909790039062, -0.00902557373046875, -0.0061092376708984375, -0.003192901611328125, -0.0002765655517578125, 0.0026397705078125, 0.0055561065673828125, 0.008472442626953125, 0.011388778686523438, 0.01430511474609375, 0.017221450805664062, 0.020137786865234375, 0.023054122924804688, 0.025970458984375, 0.028886795043945312, 0.031803131103515625, 0.03471946716308594, 0.03763580322265625, 0.04055213928222656, 0.043468475341796875, 0.04638481140136719, 0.0493011474609375, 0.05221748352050781, 0.055133819580078125, 0.05805015563964844, 0.06096649169921875, 0.06388282775878906, 0.06679916381835938, 0.06971549987792969, 0.0726318359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 10.0, 13.0, 22.0, 22.0, 54.0, 57.0, 78.0, 82.0, 102.0, 111.0, 92.0, 81.0, 76.0, 54.0, 43.0, 20.0, 18.0, 10.0, 7.0, 11.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.329183578491211e-05, -1.2675300240516663e-05, -1.2058764696121216e-05, -1.1442229151725769e-05, -1.0825693607330322e-05, -1.0209158062934875e-05, -9.592622518539429e-06, -8.976086974143982e-06, -8.359551429748535e-06, -7.743015885353088e-06, -7.126480340957642e-06, -6.509944796562195e-06, -5.893409252166748e-06, -5.276873707771301e-06, -4.6603381633758545e-06, -4.043802618980408e-06, -3.427267074584961e-06, -2.810731530189514e-06, -2.1941959857940674e-06, -1.5776604413986206e-06, -9.611248970031738e-07, -3.4458935260772705e-07, 2.7194619178771973e-07, 8.884817361831665e-07, 1.5050172805786133e-06, 2.12155282497406e-06, 2.738088369369507e-06, 3.3546239137649536e-06, 3.9711594581604e-06, 4.587695002555847e-06, 5.204230546951294e-06, 5.820766091346741e-06, 6.4373016357421875e-06, 7.053837180137634e-06, 7.670372724533081e-06, 8.286908268928528e-06, 8.903443813323975e-06, 9.519979357719421e-06, 1.0136514902114868e-05, 1.0753050446510315e-05, 1.1369585990905762e-05, 1.1986121535301208e-05, 1.2602657079696655e-05, 1.3219192624092102e-05, 1.3835728168487549e-05, 1.4452263712882996e-05, 1.5068799257278442e-05, 1.568533480167389e-05, 1.6301870346069336e-05, 1.6918405890464783e-05, 1.753494143486023e-05, 1.8151476979255676e-05, 1.8768012523651123e-05, 1.938454806804657e-05, 2.0001083612442017e-05, 2.0617619156837463e-05, 2.123415470123291e-05, 2.1850690245628357e-05, 2.2467225790023804e-05, 2.308376133441925e-05, 2.3700296878814697e-05, 2.4316832423210144e-05, 2.493336796760559e-05, 2.5549903512001038e-05, 2.6166439056396484e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 13.0, 14.0, 19.0, 29.0, 36.0, 55.0, 92.0, 127.0, 257.0, 494.0, 1062.0, 2937.0, 10760.0, 98576.0, 884489.0, 39317.0, 6505.0, 1997.0, 789.0, 426.0, 203.0, 102.0, 80.0, 48.0, 36.0, 22.0, 12.0, 13.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06585693359375, -0.06388139724731445, -0.061905860900878906, -0.05993032455444336, -0.05795478820800781, -0.055979251861572266, -0.05400371551513672, -0.05202817916870117, -0.050052642822265625, -0.04807710647583008, -0.04610157012939453, -0.044126033782958984, -0.04215049743652344, -0.04017496109008789, -0.038199424743652344, -0.0362238883972168, -0.03424835205078125, -0.0322728157043457, -0.030297279357910156, -0.02832174301147461, -0.026346206665039062, -0.024370670318603516, -0.02239513397216797, -0.020419597625732422, -0.018444061279296875, -0.016468524932861328, -0.014492988586425781, -0.012517452239990234, -0.010541915893554688, -0.00856637954711914, -0.006590843200683594, -0.004615306854248047, -0.0026397705078125, -0.0006642341613769531, 0.0013113021850585938, 0.0032868385314941406, 0.0052623748779296875, 0.007237911224365234, 0.009213447570800781, 0.011188983917236328, 0.013164520263671875, 0.015140056610107422, 0.01711559295654297, 0.019091129302978516, 0.021066665649414062, 0.02304220199584961, 0.025017738342285156, 0.026993274688720703, 0.02896881103515625, 0.030944347381591797, 0.032919883728027344, 0.03489542007446289, 0.03687095642089844, 0.038846492767333984, 0.04082202911376953, 0.04279756546020508, 0.044773101806640625, 0.04674863815307617, 0.04872417449951172, 0.050699710845947266, 0.05267524719238281, 0.05465078353881836, 0.056626319885253906, 0.05860185623168945, 0.060577392578125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 2.0, 9.0, 9.0, 8.0, 26.0, 14.0, 27.0, 36.0, 45.0, 78.0, 76.0, 110.0, 107.0, 108.0, 73.0, 63.0, 51.0, 31.0, 41.0, 24.0, 11.0, 14.0, 7.0, 5.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1173095703125, -0.11426067352294922, -0.11121177673339844, -0.10816287994384766, -0.10511398315429688, -0.1020650863647461, -0.09901618957519531, -0.09596729278564453, -0.09291839599609375, -0.08986949920654297, -0.08682060241699219, -0.0837717056274414, -0.08072280883789062, -0.07767391204833984, -0.07462501525878906, -0.07157611846923828, -0.0685272216796875, -0.06547832489013672, -0.06242942810058594, -0.059380531311035156, -0.056331634521484375, -0.053282737731933594, -0.05023384094238281, -0.04718494415283203, -0.04413604736328125, -0.04108715057373047, -0.03803825378417969, -0.034989356994628906, -0.031940460205078125, -0.028891563415527344, -0.025842666625976562, -0.02279376983642578, -0.019744873046875, -0.01669597625732422, -0.013647079467773438, -0.010598182678222656, -0.007549285888671875, -0.004500389099121094, -0.0014514923095703125, 0.0015974044799804688, 0.00464630126953125, 0.007695198059082031, 0.010744094848632812, 0.013792991638183594, 0.016841888427734375, 0.019890785217285156, 0.022939682006835938, 0.02598857879638672, 0.0290374755859375, 0.03208637237548828, 0.03513526916503906, 0.038184165954589844, 0.041233062744140625, 0.044281959533691406, 0.04733085632324219, 0.05037975311279297, 0.05342864990234375, 0.05647754669189453, 0.05952644348144531, 0.0625753402709961, 0.06562423706054688, 0.06867313385009766, 0.07172203063964844, 0.07477092742919922, 0.07781982421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 37.0, 670.0, 261.0, 23.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.026463508605957, -12.754094123840332, -12.48172378540039, -12.209354400634766, -11.936984062194824, -11.6646146774292, -11.392244338989258, -11.119874954223633, -10.847505569458008, -10.575136184692383, -10.302765846252441, -10.030396461486816, -9.758026123046875, -9.48565673828125, -9.213286399841309, -8.940917015075684, -8.668546676635742, -8.396177291870117, -8.123806953430176, -7.851437091827393, -7.579067230224609, -7.306697845458984, -7.034327983856201, -6.761958122253418, -6.489588260650635, -6.217218399047852, -5.944848537445068, -5.672478675842285, -5.40010929107666, -5.127738952636719, -4.855369567871094, -4.5829997062683105, -4.310628890991211, -4.038259029388428, -3.7658891677856445, -3.4935195446014404, -3.2211496829986572, -2.948779821395874, -2.67641019821167, -2.4040403366088867, -2.1316704750061035, -1.8593006134033203, -1.5869308710098267, -1.314561128616333, -1.0421912670135498, -0.7698214054107666, -0.49745166301727295, -0.2250819206237793, 0.047287940979003906, 0.31965774297714233, 0.5920275449752808, 0.8643973469734192, 1.1367671489715576, 1.4091370105743408, 1.6815067529678345, 1.9538764953613281, 2.2262463569641113, 2.4986162185668945, 2.7709860801696777, 3.043355703353882, 3.315725564956665, 3.5880954265594482, 3.8604650497436523, 4.1328349113464355, 4.405204772949219]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 7.0, 9.0, 12.0, 20.0, 26.0, 54.0, 93.0, 110.0, 153.0, 158.0, 104.0, 71.0, 58.0, 26.0, 25.0, 8.0, 15.0, 5.0, 8.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.521082878112793, -7.284963607788086, -7.048844337463379, -6.812725067138672, -6.576605796813965, -6.340486526489258, -6.104366779327393, -5.8682475090026855, -5.6321282386779785, -5.3960089683532715, -5.1598896980285645, -4.923770427703857, -4.687650680541992, -4.451531410217285, -4.215412139892578, -3.979292869567871, -3.743173599243164, -3.507054328918457, -3.27093505859375, -3.034815549850464, -2.798696279525757, -2.56257700920105, -2.3264575004577637, -2.0903382301330566, -1.8542189598083496, -1.6180996894836426, -1.381980299949646, -1.1458609104156494, -0.9097416400909424, -0.6736223697662354, -0.43750298023223877, -0.2013835906982422, 0.034735679626464844, 0.27085500955581665, 0.5069743394851685, 0.7430936694145203, 0.9792129993438721, 1.215332269668579, 1.4514516592025757, 1.6875710487365723, 1.9236903190612793, 2.1598095893859863, 2.3959288597106934, 2.6320483684539795, 2.8681676387786865, 3.1042869091033936, 3.3404064178466797, 3.5765256881713867, 3.8126449584960938, 4.048764228820801, 4.284883499145508, 4.521002769470215, 4.757122039794922, 4.993241310119629, 5.229361057281494, 5.465480327606201, 5.701599597930908, 5.937718868255615, 6.173838138580322, 6.409957408905029, 6.6460771560668945, 6.882196426391602, 7.118315696716309, 7.354434967041016, 7.590554237365723]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 13.0, 24.0, 22.0, 31.0, 56.0, 91.0, 163.0, 257.0, 476.0, 858.0, 1551.0, 3380.0, 7397.0, 22416.0, 4055415.0, 83882.0, 11475.0, 3939.0, 1548.0, 659.0, 298.0, 117.0, 71.0, 45.0, 29.0, 14.0, 14.0, 14.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0461883544921875, -1.013275146484375, -0.9803619384765625, -0.94744873046875, -0.9145355224609375, -0.881622314453125, -0.8487091064453125, -0.8157958984375, -0.7828826904296875, -0.749969482421875, -0.7170562744140625, -0.68414306640625, -0.6512298583984375, -0.618316650390625, -0.5854034423828125, -0.552490234375, -0.5195770263671875, -0.486663818359375, -0.4537506103515625, -0.42083740234375, -0.3879241943359375, -0.355010986328125, -0.3220977783203125, -0.2891845703125, -0.2562713623046875, -0.223358154296875, -0.1904449462890625, -0.15753173828125, -0.1246185302734375, -0.091705322265625, -0.0587921142578125, -0.02587890625, 0.0070343017578125, 0.039947509765625, 0.0728607177734375, 0.10577392578125, 0.1386871337890625, 0.171600341796875, 0.2045135498046875, 0.2374267578125, 0.2703399658203125, 0.303253173828125, 0.3361663818359375, 0.36907958984375, 0.4019927978515625, 0.434906005859375, 0.4678192138671875, 0.500732421875, 0.5336456298828125, 0.566558837890625, 0.5994720458984375, 0.63238525390625, 0.6652984619140625, 0.698211669921875, 0.7311248779296875, 0.7640380859375, 0.7969512939453125, 0.829864501953125, 0.8627777099609375, 0.89569091796875, 0.9286041259765625, 0.961517333984375, 0.9944305419921875, 1.02734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 10.0, 3.0, 7.0, 7.0, 11.0, 9.0, 21.0, 18.0, 442.0, 355.0, 27.0, 7.0, 15.0, 10.0, 7.0, 11.0, 8.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.0982208251953125, -0.095306396484375, -0.0923919677734375, -0.0894775390625, -0.0865631103515625, -0.083648681640625, -0.0807342529296875, -0.07781982421875, -0.0749053955078125, -0.071990966796875, -0.0690765380859375, -0.066162109375, -0.0632476806640625, -0.060333251953125, -0.0574188232421875, -0.05450439453125, -0.0515899658203125, -0.048675537109375, -0.0457611083984375, -0.0428466796875, -0.0399322509765625, -0.037017822265625, -0.0341033935546875, -0.03118896484375, -0.0282745361328125, -0.025360107421875, -0.0224456787109375, -0.01953125, -0.0166168212890625, -0.013702392578125, -0.0107879638671875, -0.00787353515625, -0.0049591064453125, -0.002044677734375, 0.0008697509765625, 0.0037841796875, 0.0066986083984375, 0.009613037109375, 0.0125274658203125, 0.01544189453125, 0.0183563232421875, 0.021270751953125, 0.0241851806640625, 0.027099609375, 0.0300140380859375, 0.032928466796875, 0.0358428955078125, 0.03875732421875, 0.0416717529296875, 0.044586181640625, 0.0475006103515625, 0.0504150390625, 0.0533294677734375, 0.056243896484375, 0.0591583251953125, 0.06207275390625, 0.0649871826171875, 0.067901611328125, 0.0708160400390625, 0.07373046875, 0.0766448974609375, 0.079559326171875, 0.0824737548828125, 0.08538818359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 12.0, 15.0, 16.0, 16.0, 33.0, 62.0, 74.0, 119.0, 279.0, 594.0, 1315.0, 4059.0, 18178.0, 224298.0, 3864296.0, 62010.0, 12017.0, 3791.0, 1532.0, 697.0, 357.0, 168.0, 111.0, 59.0, 38.0, 30.0, 18.0, 14.0, 13.0, 9.0, 10.0, 7.0, 8.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.457275390625, -0.44309234619140625, -0.4289093017578125, -0.41472625732421875, -0.400543212890625, -0.38636016845703125, -0.3721771240234375, -0.35799407958984375, -0.34381103515625, -0.32962799072265625, -0.3154449462890625, -0.30126190185546875, -0.287078857421875, -0.27289581298828125, -0.2587127685546875, -0.24452972412109375, -0.2303466796875, -0.21616363525390625, -0.2019805908203125, -0.18779754638671875, -0.173614501953125, -0.15943145751953125, -0.1452484130859375, -0.13106536865234375, -0.11688232421875, -0.10269927978515625, -0.0885162353515625, -0.07433319091796875, -0.060150146484375, -0.04596710205078125, -0.0317840576171875, -0.01760101318359375, -0.00341796875, 0.01076507568359375, 0.0249481201171875, 0.03913116455078125, 0.053314208984375, 0.06749725341796875, 0.0816802978515625, 0.09586334228515625, 0.11004638671875, 0.12422943115234375, 0.1384124755859375, 0.15259552001953125, 0.166778564453125, 0.18096160888671875, 0.1951446533203125, 0.20932769775390625, 0.2235107421875, 0.23769378662109375, 0.2518768310546875, 0.26605987548828125, 0.280242919921875, 0.29442596435546875, 0.3086090087890625, 0.32279205322265625, 0.33697509765625, 0.35115814208984375, 0.3653411865234375, 0.37952423095703125, 0.393707275390625, 0.40789031982421875, 0.4220733642578125, 0.43625640869140625, 0.450439453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 7.0, 11.0, 9.0, 8.0, 8.0, 18.0, 32.0, 47.0, 59.0, 131.0, 724.0, 2162.0, 268.0, 122.0, 78.0, 58.0, 49.0, 43.0, 31.0, 26.0, 21.0, 17.0, 18.0, 16.0, 11.0, 11.0, 11.0, 7.0, 5.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.0792236328125, -0.07650566101074219, -0.07378768920898438, -0.07106971740722656, -0.06835174560546875, -0.06563377380371094, -0.06291580200195312, -0.06019783020019531, -0.0574798583984375, -0.05476188659667969, -0.052043914794921875, -0.04932594299316406, -0.04660797119140625, -0.04388999938964844, -0.041172027587890625, -0.03845405578613281, -0.035736083984375, -0.03301811218261719, -0.030300140380859375, -0.027582168579101562, -0.02486419677734375, -0.022146224975585938, -0.019428253173828125, -0.016710281372070312, -0.0139923095703125, -0.011274337768554688, -0.008556365966796875, -0.0058383941650390625, -0.00312042236328125, -0.0004024505615234375, 0.002315521240234375, 0.0050334930419921875, 0.00775146484375, 0.010469436645507812, 0.013187408447265625, 0.015905380249023438, 0.01862335205078125, 0.021341323852539062, 0.024059295654296875, 0.026777267456054688, 0.0294952392578125, 0.03221321105957031, 0.034931182861328125, 0.03764915466308594, 0.04036712646484375, 0.04308509826660156, 0.045803070068359375, 0.04852104187011719, 0.051239013671875, 0.05395698547363281, 0.056674957275390625, 0.05939292907714844, 0.06211090087890625, 0.06482887268066406, 0.06754684448242188, 0.07026481628417969, 0.0729827880859375, 0.07570075988769531, 0.07841873168945312, 0.08113670349121094, 0.08385467529296875, 0.08657264709472656, 0.08929061889648438, 0.09200859069824219, 0.0947265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 746.0, 246.0, 10.0, 4.0, 4.0, 1.0, 1.0], "bins": [-14.510116577148438, -14.259368896484375, -14.008621215820312, -13.75787353515625, -13.507124900817871, -13.256377220153809, -13.005629539489746, -12.754881858825684, -12.504134178161621, -12.253386497497559, -12.002638816833496, -11.751890182495117, -11.501142501831055, -11.250394821166992, -10.99964714050293, -10.748899459838867, -10.498151779174805, -10.247404098510742, -9.99665641784668, -9.745908737182617, -9.495160102844238, -9.244412422180176, -8.993664741516113, -8.74291706085205, -8.492168426513672, -8.24142074584961, -7.990672588348389, -7.739924907684326, -7.489177227020264, -7.238429069519043, -6.9876813888549805, -6.736933708190918, -6.486185073852539, -6.235437393188477, -5.984689235687256, -5.733941555023193, -5.483193874359131, -5.23244571685791, -4.981698036193848, -4.730950355529785, -4.480202674865723, -4.22945499420166, -3.9787070751190186, -3.727959156036377, -3.4772114753723145, -3.226463556289673, -2.9757156372070312, -2.7249679565429688, -2.474220037460327, -2.2234721183776855, -1.972724437713623, -1.7219765186309814, -1.4712287187576294, -1.2204809188842773, -0.9697329998016357, -0.7189851999282837, -0.46823740005493164, -0.2174895703792572, 0.033258259296417236, 0.28400611877441406, 0.5347539186477661, 0.7855017185211182, 1.0362496376037598, 1.2869974374771118, 1.5377452373504639]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 10.0, 12.0, 20.0, 27.0, 57.0, 72.0, 109.0, 100.0, 124.0, 104.0, 90.0, 95.0, 57.0, 45.0, 32.0, 18.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5981602668762207, -1.5600923299789429, -1.5220245122909546, -1.4839565753936768, -1.4458887577056885, -1.4078208208084106, -1.3697530031204224, -1.3316850662231445, -1.2936172485351562, -1.2555493116378784, -1.2174814939498901, -1.1794135570526123, -1.141345739364624, -1.1032778024673462, -1.065209984779358, -1.02714204788208, -0.9890741109848022, -0.9510062336921692, -0.9129383563995361, -0.8748704791069031, -0.83680260181427, -0.7987346649169922, -0.7606667876243591, -0.7225989103317261, -0.684531033039093, -0.64646315574646, -0.6083952784538269, -0.5703274011611938, -0.532259464263916, -0.49419161677360535, -0.4561237096786499, -0.41805583238601685, -0.37998783588409424, -0.3419199585914612, -0.3038520812988281, -0.2657841742038727, -0.22771629691123962, -0.18964841961860657, -0.15158052742481232, -0.11351263523101807, -0.07544475793838501, -0.037376873195171356, 0.0006910115480422974, 0.03875889629125595, 0.0768267810344696, 0.11489465832710266, 0.1529625505208969, 0.19103044271469116, 0.22909832000732422, 0.2671661972999573, 0.30523407459259033, 0.3433019816875458, 0.38136985898017883, 0.4194377362728119, 0.45750564336776733, 0.4955735206604004, 0.5336413979530334, 0.5717092752456665, 0.6097771525382996, 0.6478450298309326, 0.6859129667282104, 0.7239807844161987, 0.7620487213134766, 0.8001165986061096, 0.8381844758987427]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 12.0, 17.0, 25.0, 34.0, 46.0, 83.0, 133.0, 178.0, 298.0, 510.0, 960.0, 1922.0, 4525.0, 11776.0, 43058.0, 915777.0, 47523.0, 12429.0, 4803.0, 2041.0, 949.0, 525.0, 339.0, 175.0, 119.0, 83.0, 55.0, 48.0, 27.0, 14.0, 7.0, 9.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49951171875, -0.48314666748046875, -0.4667816162109375, -0.45041656494140625, -0.434051513671875, -0.41768646240234375, -0.4013214111328125, -0.38495635986328125, -0.36859130859375, -0.35222625732421875, -0.3358612060546875, -0.31949615478515625, -0.303131103515625, -0.28676605224609375, -0.2704010009765625, -0.25403594970703125, -0.2376708984375, -0.22130584716796875, -0.2049407958984375, -0.18857574462890625, -0.172210693359375, -0.15584564208984375, -0.1394805908203125, -0.12311553955078125, -0.10675048828125, -0.09038543701171875, -0.0740203857421875, -0.05765533447265625, -0.041290283203125, -0.02492523193359375, -0.0085601806640625, 0.00780487060546875, 0.024169921875, 0.04053497314453125, 0.0569000244140625, 0.07326507568359375, 0.089630126953125, 0.10599517822265625, 0.1223602294921875, 0.13872528076171875, 0.15509033203125, 0.17145538330078125, 0.1878204345703125, 0.20418548583984375, 0.220550537109375, 0.23691558837890625, 0.2532806396484375, 0.26964569091796875, 0.2860107421875, 0.30237579345703125, 0.3187408447265625, 0.33510589599609375, 0.351470947265625, 0.36783599853515625, 0.3842010498046875, 0.40056610107421875, 0.41693115234375, 0.43329620361328125, 0.4496612548828125, 0.46602630615234375, 0.482391357421875, 0.49875640869140625, 0.5151214599609375, 0.5314865112304688, 0.5478515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 5.0, 9.0, 8.0, 12.0, 18.0, 13.0, 81.0, 429.0, 294.0, 46.0, 12.0, 12.0, 8.0, 10.0, 10.0, 6.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10260200500488281, -0.09955215454101562, -0.09650230407714844, -0.09345245361328125, -0.09040260314941406, -0.08735275268554688, -0.08430290222167969, -0.0812530517578125, -0.07820320129394531, -0.07515335083007812, -0.07210350036621094, -0.06905364990234375, -0.06600379943847656, -0.06295394897460938, -0.05990409851074219, -0.056854248046875, -0.05380439758300781, -0.050754547119140625, -0.04770469665527344, -0.04465484619140625, -0.04160499572753906, -0.038555145263671875, -0.03550529479980469, -0.0324554443359375, -0.029405593872070312, -0.026355743408203125, -0.023305892944335938, -0.02025604248046875, -0.017206192016601562, -0.014156341552734375, -0.011106491088867188, -0.008056640625, -0.0050067901611328125, -0.001956939697265625, 0.0010929107666015625, 0.00414276123046875, 0.0071926116943359375, 0.010242462158203125, 0.013292312622070312, 0.0163421630859375, 0.019392013549804688, 0.022441864013671875, 0.025491714477539062, 0.02854156494140625, 0.03159141540527344, 0.034641265869140625, 0.03769111633300781, 0.040740966796875, 0.04379081726074219, 0.046840667724609375, 0.04989051818847656, 0.05294036865234375, 0.05599021911621094, 0.059040069580078125, 0.06208992004394531, 0.0651397705078125, 0.06818962097167969, 0.07123947143554688, 0.07428932189941406, 0.07733917236328125, 0.08038902282714844, 0.08343887329101562, 0.08648872375488281, 0.08953857421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 4.0, 3.0, 10.0, 9.0, 7.0, 11.0, 4.0, 12.0, 9.0, 21.0, 27.0, 32.0, 26.0, 39.0, 64.0, 98.0, 151.0, 256.0, 467.0, 900.0, 2171.0, 7366.0, 44771.0, 594949.0, 357426.0, 30581.0, 5546.0, 1735.0, 749.0, 392.0, 246.0, 115.0, 82.0, 50.0, 43.0, 25.0, 19.0, 26.0, 21.0, 14.0, 11.0, 12.0, 16.0, 10.0, 7.0, 9.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.3134765625, -0.304229736328125, -0.29498291015625, -0.285736083984375, -0.2764892578125, -0.267242431640625, -0.25799560546875, -0.248748779296875, -0.239501953125, -0.230255126953125, -0.22100830078125, -0.211761474609375, -0.2025146484375, -0.193267822265625, -0.18402099609375, -0.174774169921875, -0.16552734375, -0.156280517578125, -0.14703369140625, -0.137786865234375, -0.1285400390625, -0.119293212890625, -0.11004638671875, -0.100799560546875, -0.091552734375, -0.082305908203125, -0.07305908203125, -0.063812255859375, -0.0545654296875, -0.045318603515625, -0.03607177734375, -0.026824951171875, -0.017578125, -0.008331298828125, 0.00091552734375, 0.010162353515625, 0.0194091796875, 0.028656005859375, 0.03790283203125, 0.047149658203125, 0.056396484375, 0.065643310546875, 0.07489013671875, 0.084136962890625, 0.0933837890625, 0.102630615234375, 0.11187744140625, 0.121124267578125, 0.13037109375, 0.139617919921875, 0.14886474609375, 0.158111572265625, 0.1673583984375, 0.176605224609375, 0.18585205078125, 0.195098876953125, 0.204345703125, 0.213592529296875, 0.22283935546875, 0.232086181640625, 0.2413330078125, 0.250579833984375, 0.25982666015625, 0.269073486328125, 0.2783203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 5.0, 11.0, 10.0, 9.0, 8.0, 9.0, 19.0, 24.0, 18.0, 25.0, 18.0, 30.0, 33.0, 34.0, 40.0, 29.0, 45.0, 44.0, 44.0, 36.0, 33.0, 39.0, 28.0, 51.0, 35.0, 38.0, 37.0, 25.0, 23.0, 24.0, 11.0, 23.0, 21.0, 17.0, 16.0, 11.0, 11.0, 17.0, 9.0, 13.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.220458984375, -0.21431541442871094, -0.20817184448242188, -0.2020282745361328, -0.19588470458984375, -0.1897411346435547, -0.18359756469726562, -0.17745399475097656, -0.1713104248046875, -0.16516685485839844, -0.15902328491210938, -0.1528797149658203, -0.14673614501953125, -0.1405925750732422, -0.13444900512695312, -0.12830543518066406, -0.122161865234375, -0.11601829528808594, -0.10987472534179688, -0.10373115539550781, -0.09758758544921875, -0.09144401550292969, -0.08530044555664062, -0.07915687561035156, -0.0730133056640625, -0.06686973571777344, -0.060726165771484375, -0.05458259582519531, -0.04843902587890625, -0.04229545593261719, -0.036151885986328125, -0.030008316040039062, -0.02386474609375, -0.017721176147460938, -0.011577606201171875, -0.0054340362548828125, 0.00070953369140625, 0.0068531036376953125, 0.012996673583984375, 0.019140243530273438, 0.0252838134765625, 0.03142738342285156, 0.037570953369140625, 0.04371452331542969, 0.04985809326171875, 0.05600166320800781, 0.062145233154296875, 0.06828880310058594, 0.074432373046875, 0.08057594299316406, 0.08671951293945312, 0.09286308288574219, 0.09900665283203125, 0.10515022277832031, 0.11129379272460938, 0.11743736267089844, 0.1235809326171875, 0.12972450256347656, 0.13586807250976562, 0.1420116424560547, 0.14815521240234375, 0.1542987823486328, 0.16044235229492188, 0.16658592224121094, 0.1727294921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 8.0, 13.0, 13.0, 8.0, 21.0, 28.0, 59.0, 76.0, 181.0, 386.0, 873.0, 2975.0, 17053.0, 977829.0, 42477.0, 4320.0, 1249.0, 451.0, 233.0, 108.0, 40.0, 32.0, 27.0, 24.0, 10.0, 15.0, 3.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1954345703125, -0.18995094299316406, -0.18446731567382812, -0.1789836883544922, -0.17350006103515625, -0.1680164337158203, -0.16253280639648438, -0.15704917907714844, -0.1515655517578125, -0.14608192443847656, -0.14059829711914062, -0.1351146697998047, -0.12963104248046875, -0.12414741516113281, -0.11866378784179688, -0.11318016052246094, -0.107696533203125, -0.10221290588378906, -0.09672927856445312, -0.09124565124511719, -0.08576202392578125, -0.08027839660644531, -0.07479476928710938, -0.06931114196777344, -0.0638275146484375, -0.05834388732910156, -0.052860260009765625, -0.04737663269042969, -0.04189300537109375, -0.03640937805175781, -0.030925750732421875, -0.025442123413085938, -0.01995849609375, -0.014474868774414062, -0.008991241455078125, -0.0035076141357421875, 0.00197601318359375, 0.0074596405029296875, 0.012943267822265625, 0.018426895141601562, 0.0239105224609375, 0.029394149780273438, 0.034877777099609375, 0.04036140441894531, 0.04584503173828125, 0.05132865905761719, 0.056812286376953125, 0.06229591369628906, 0.067779541015625, 0.07326316833496094, 0.07874679565429688, 0.08423042297363281, 0.08971405029296875, 0.09519767761230469, 0.10068130493164062, 0.10616493225097656, 0.1116485595703125, 0.11713218688964844, 0.12261581420898438, 0.1280994415283203, 0.13358306884765625, 0.1390666961669922, 0.14455032348632812, 0.15003395080566406, 0.155517578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 4.0, 2.0, 8.0, 2.0, 12.0, 24.0, 445.0, 399.0, 37.0, 14.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002301931381225586, -0.00022413022816181183, -0.00021806731820106506, -0.0002120044082403183, -0.00020594149827957153, -0.00019987858831882477, -0.000193815678358078, -0.00018775276839733124, -0.00018168985843658447, -0.0001756269484758377, -0.00016956403851509094, -0.00016350112855434418, -0.0001574382185935974, -0.00015137530863285065, -0.00014531239867210388, -0.00013924948871135712, -0.00013318657875061035, -0.00012712366878986359, -0.00012106075882911682, -0.00011499784886837006, -0.00010893493890762329, -0.00010287202894687653, -9.680911898612976e-05, -9.0746209025383e-05, -8.468329906463623e-05, -7.862038910388947e-05, -7.25574791431427e-05, -6.649456918239594e-05, -6.043165922164917e-05, -5.4368749260902405e-05, -4.830583930015564e-05, -4.2242929339408875e-05, -3.618001937866211e-05, -3.0117109417915344e-05, -2.405419945716858e-05, -1.7991289496421814e-05, -1.1928379535675049e-05, -5.865469574928284e-06, 1.9744038581848145e-07, 6.260350346565247e-06, 1.2323260307312012e-05, 1.8386170268058777e-05, 2.4449080228805542e-05, 3.0511990189552307e-05, 3.657490015029907e-05, 4.263781011104584e-05, 4.87007200717926e-05, 5.476363003253937e-05, 6.082653999328613e-05, 6.68894499540329e-05, 7.295235991477966e-05, 7.901526987552643e-05, 8.50781798362732e-05, 9.114108979701996e-05, 9.720399975776672e-05, 0.00010326690971851349, 0.00010932981967926025, 0.00011539272964000702, 0.00012145563960075378, 0.00012751854956150055, 0.00013358145952224731, 0.00013964436948299408, 0.00014570727944374084, 0.0001517701894044876, 0.00015783309936523438]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 13.0, 30.0, 39.0, 42.0, 95.0, 198.0, 345.0, 894.0, 3145.0, 23462.0, 915796.0, 95150.0, 6617.0, 1541.0, 543.0, 275.0, 133.0, 91.0, 50.0, 32.0, 19.0, 6.0, 9.0, 3.0, 8.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1541748046875, -0.1491546630859375, -0.144134521484375, -0.1391143798828125, -0.13409423828125, -0.1290740966796875, -0.124053955078125, -0.1190338134765625, -0.114013671875, -0.1089935302734375, -0.103973388671875, -0.0989532470703125, -0.09393310546875, -0.0889129638671875, -0.083892822265625, -0.0788726806640625, -0.0738525390625, -0.0688323974609375, -0.063812255859375, -0.0587921142578125, -0.05377197265625, -0.0487518310546875, -0.043731689453125, -0.0387115478515625, -0.03369140625, -0.0286712646484375, -0.023651123046875, -0.0186309814453125, -0.01361083984375, -0.0085906982421875, -0.003570556640625, 0.0014495849609375, 0.0064697265625, 0.0114898681640625, 0.016510009765625, 0.0215301513671875, 0.02655029296875, 0.0315704345703125, 0.036590576171875, 0.0416107177734375, 0.046630859375, 0.0516510009765625, 0.056671142578125, 0.0616912841796875, 0.06671142578125, 0.0717315673828125, 0.076751708984375, 0.0817718505859375, 0.0867919921875, 0.0918121337890625, 0.096832275390625, 0.1018524169921875, 0.10687255859375, 0.1118927001953125, 0.116912841796875, 0.1219329833984375, 0.126953125, 0.1319732666015625, 0.136993408203125, 0.1420135498046875, 0.14703369140625, 0.1520538330078125, 0.157073974609375, 0.1620941162109375, 0.1671142578125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 8.0, 17.0, 12.0, 16.0, 44.0, 39.0, 62.0, 86.0, 92.0, 133.0, 124.0, 109.0, 74.0, 45.0, 49.0, 20.0, 19.0, 14.0, 10.0, 2.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08362388610839844, -0.08008956909179688, -0.07655525207519531, -0.07302093505859375, -0.06948661804199219, -0.06595230102539062, -0.06241798400878906, -0.0588836669921875, -0.05534934997558594, -0.051815032958984375, -0.04828071594238281, -0.04474639892578125, -0.04121208190917969, -0.037677764892578125, -0.03414344787597656, -0.030609130859375, -0.027074813842773438, -0.023540496826171875, -0.020006179809570312, -0.01647186279296875, -0.012937545776367188, -0.009403228759765625, -0.0058689117431640625, -0.0023345947265625, 0.0011997222900390625, 0.004734039306640625, 0.008268356323242188, 0.01180267333984375, 0.015336990356445312, 0.018871307373046875, 0.022405624389648438, 0.02593994140625, 0.029474258422851562, 0.033008575439453125, 0.03654289245605469, 0.04007720947265625, 0.04361152648925781, 0.047145843505859375, 0.05068016052246094, 0.0542144775390625, 0.05774879455566406, 0.061283111572265625, 0.06481742858886719, 0.06835174560546875, 0.07188606262207031, 0.07542037963867188, 0.07895469665527344, 0.082489013671875, 0.08602333068847656, 0.08955764770507812, 0.09309196472167969, 0.09662628173828125, 0.10016059875488281, 0.10369491577148438, 0.10722923278808594, 0.1107635498046875, 0.11429786682128906, 0.11783218383789062, 0.12136650085449219, 0.12490081787109375, 0.1284351348876953, 0.13196945190429688, 0.13550376892089844, 0.1390380859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 22.0, 134.0, 503.0, 240.0, 54.0, 17.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.889031171798706, -2.817814588546753, -2.746598243713379, -2.675381660461426, -2.6041650772094727, -2.5329487323760986, -2.4617321491241455, -2.3905158042907715, -2.3192992210388184, -2.2480826377868652, -2.176866292953491, -2.105649709701538, -2.034433364868164, -1.963216781616211, -1.8920001983642578, -1.8207837343215942, -1.7495672702789307, -1.678350806236267, -1.6071343421936035, -1.5359177589416504, -1.4647012948989868, -1.3934848308563232, -1.3222682476043701, -1.2510517835617065, -1.179835319519043, -1.1086188554763794, -1.0374023914337158, -0.9661858081817627, -0.8949693441390991, -0.8237528800964355, -0.7525363564491272, -0.6813198328018188, -0.6101036071777344, -0.5388871431350708, -0.46767061948776245, -0.3964541256427765, -0.3252376317977905, -0.25402113795280457, -0.1828046441078186, -0.11158815026283264, -0.04037165641784668, 0.030844837427139282, 0.10206133127212524, 0.1732778251171112, 0.24449431896209717, 0.31571081280708313, 0.3869273066520691, 0.45814380049705505, 0.529360294342041, 0.6005767583847046, 0.6717932820320129, 0.7430098056793213, 0.8142262697219849, 0.8854427337646484, 0.9566592574119568, 1.0278757810592651, 1.0990922451019287, 1.1703087091445923, 1.2415251731872559, 1.312741756439209, 1.3839582204818726, 1.4551746845245361, 1.5263912677764893, 1.5976077318191528, 1.6688241958618164]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 10.0, 7.0, 9.0, 7.0, 11.0, 16.0, 24.0, 30.0, 42.0, 43.0, 54.0, 61.0, 69.0, 82.0, 73.0, 69.0, 56.0, 65.0, 57.0, 38.0, 38.0, 22.0, 21.0, 17.0, 20.0, 12.0, 7.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9664127826690674, -1.9060291051864624, -1.8456453084945679, -1.785261631011963, -1.7248778343200684, -1.6644941568374634, -1.6041104793548584, -1.5437266826629639, -1.4833428859710693, -1.4229592084884644, -1.3625754117965698, -1.3021917343139648, -1.2418079376220703, -1.1814242601394653, -1.1210405826568604, -1.0606567859649658, -1.0002731084823608, -0.9398893713951111, -0.8795056343078613, -0.8191219568252563, -0.7587381601333618, -0.6983544826507568, -0.6379707455635071, -0.5775870084762573, -0.5172032713890076, -0.4568195343017578, -0.39643579721450806, -0.3360520899295807, -0.27566835284233093, -0.21528461575508118, -0.1549009084701538, -0.09451717138290405, -0.0341334342956543, 0.026250295341014862, 0.08663402497768402, 0.14701774716377258, 0.20740148425102234, 0.2677852213382721, 0.32816892862319946, 0.3885526657104492, 0.448936402797699, 0.5093201398849487, 0.5697038769721985, 0.6300876140594482, 0.6904712915420532, 0.7508550882339478, 0.8112387657165527, 0.8716225028038025, 0.9320062398910522, 0.992389976978302, 1.0527737140655518, 1.1131573915481567, 1.1735411882400513, 1.2339248657226562, 1.2943086624145508, 1.3546923398971558, 1.4150760173797607, 1.4754596948623657, 1.5358434915542603, 1.5962271690368652, 1.6566109657287598, 1.7169946432113647, 1.7773783206939697, 1.8377621173858643, 1.8981459140777588]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 12.0, 12.0, 18.0, 18.0, 28.0, 67.0, 59.0, 82.0, 120.0, 259.0, 521.0, 1201.0, 2664.0, 8070.0, 97311.0, 4065752.0, 13045.0, 2894.0, 1117.0, 505.0, 234.0, 93.0, 53.0, 35.0, 25.0, 15.0, 14.0, 8.0, 6.0, 11.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1512908935546875, -1.113128662109375, -1.0749664306640625, -1.03680419921875, -0.9986419677734375, -0.960479736328125, -0.9223175048828125, -0.8841552734375, -0.8459930419921875, -0.807830810546875, -0.7696685791015625, -0.73150634765625, -0.6933441162109375, -0.655181884765625, -0.6170196533203125, -0.578857421875, -0.5406951904296875, -0.502532958984375, -0.4643707275390625, -0.42620849609375, -0.3880462646484375, -0.349884033203125, -0.3117218017578125, -0.2735595703125, -0.2353973388671875, -0.197235107421875, -0.1590728759765625, -0.12091064453125, -0.0827484130859375, -0.044586181640625, -0.0064239501953125, 0.03173828125, 0.0699005126953125, 0.108062744140625, 0.1462249755859375, 0.18438720703125, 0.2225494384765625, 0.260711669921875, 0.2988739013671875, 0.3370361328125, 0.3751983642578125, 0.413360595703125, 0.4515228271484375, 0.48968505859375, 0.5278472900390625, 0.566009521484375, 0.6041717529296875, 0.642333984375, 0.6804962158203125, 0.718658447265625, 0.7568206787109375, 0.79498291015625, 0.8331451416015625, 0.871307373046875, 0.9094696044921875, 0.9476318359375, 0.9857940673828125, 1.023956298828125, 1.0621185302734375, 1.10028076171875, 1.1384429931640625, 1.176605224609375, 1.2147674560546875, 1.2529296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 7.0, 9.0, 5.0, 12.0, 8.0, 19.0, 13.0, 28.0, 159.0, 418.0, 214.0, 47.0, 15.0, 12.0, 13.0, 9.0, 7.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10174560546875, -0.09870433807373047, -0.09566307067871094, -0.0926218032836914, -0.08958053588867188, -0.08653926849365234, -0.08349800109863281, -0.08045673370361328, -0.07741546630859375, -0.07437419891357422, -0.07133293151855469, -0.06829166412353516, -0.06525039672851562, -0.062209129333496094, -0.05916786193847656, -0.05612659454345703, -0.0530853271484375, -0.05004405975341797, -0.04700279235839844, -0.043961524963378906, -0.040920257568359375, -0.037878990173339844, -0.03483772277832031, -0.03179645538330078, -0.02875518798828125, -0.02571392059326172, -0.022672653198242188, -0.019631385803222656, -0.016590118408203125, -0.013548851013183594, -0.010507583618164062, -0.007466316223144531, -0.004425048828125, -0.0013837814331054688, 0.0016574859619140625, 0.004698753356933594, 0.007740020751953125, 0.010781288146972656, 0.013822555541992188, 0.01686382293701172, 0.01990509033203125, 0.02294635772705078, 0.025987625122070312, 0.029028892517089844, 0.032070159912109375, 0.035111427307128906, 0.03815269470214844, 0.04119396209716797, 0.0442352294921875, 0.04727649688720703, 0.05031776428222656, 0.053359031677246094, 0.056400299072265625, 0.059441566467285156, 0.06248283386230469, 0.06552410125732422, 0.06856536865234375, 0.07160663604736328, 0.07464790344238281, 0.07768917083740234, 0.08073043823242188, 0.0837717056274414, 0.08681297302246094, 0.08985424041748047, 0.0928955078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 6.0, 12.0, 6.0, 9.0, 12.0, 12.0, 26.0, 32.0, 42.0, 67.0, 114.0, 242.0, 868.0, 6484.0, 3175249.0, 1003323.0, 6356.0, 854.0, 264.0, 110.0, 67.0, 34.0, 28.0, 13.0, 9.0, 14.0, 3.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8319625854492188, -0.8011322021484375, -0.7703018188476562, -0.739471435546875, -0.7086410522460938, -0.6778106689453125, -0.6469802856445312, -0.61614990234375, -0.5853195190429688, -0.5544891357421875, -0.5236587524414062, -0.492828369140625, -0.46199798583984375, -0.4311676025390625, -0.40033721923828125, -0.3695068359375, -0.33867645263671875, -0.3078460693359375, -0.27701568603515625, -0.246185302734375, -0.21535491943359375, -0.1845245361328125, -0.15369415283203125, -0.12286376953125, -0.09203338623046875, -0.0612030029296875, -0.03037261962890625, 0.000457763671875, 0.03128814697265625, 0.0621185302734375, 0.09294891357421875, 0.123779296875, 0.15460968017578125, 0.1854400634765625, 0.21627044677734375, 0.247100830078125, 0.27793121337890625, 0.3087615966796875, 0.33959197998046875, 0.37042236328125, 0.40125274658203125, 0.4320831298828125, 0.46291351318359375, 0.493743896484375, 0.5245742797851562, 0.5554046630859375, 0.5862350463867188, 0.6170654296875, 0.6478958129882812, 0.6787261962890625, 0.7095565795898438, 0.740386962890625, 0.7712173461914062, 0.8020477294921875, 0.8328781127929688, 0.86370849609375, 0.8945388793945312, 0.9253692626953125, 0.9561996459960938, 0.987030029296875, 1.0178604125976562, 1.0486907958984375, 1.0795211791992188, 1.1103515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 8.0, 13.0, 17.0, 20.0, 42.0, 55.0, 106.0, 406.0, 2709.0, 279.0, 134.0, 61.0, 50.0, 23.0, 23.0, 28.0, 15.0, 11.0, 7.0, 6.0, 8.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.141357421875, -0.1375732421875, -0.1337890625, -0.1300048828125, -0.126220703125, -0.1224365234375, -0.11865234375, -0.1148681640625, -0.111083984375, -0.1072998046875, -0.103515625, -0.0997314453125, -0.095947265625, -0.0921630859375, -0.08837890625, -0.0845947265625, -0.080810546875, -0.0770263671875, -0.0732421875, -0.0694580078125, -0.065673828125, -0.0618896484375, -0.05810546875, -0.0543212890625, -0.050537109375, -0.0467529296875, -0.04296875, -0.0391845703125, -0.035400390625, -0.0316162109375, -0.02783203125, -0.0240478515625, -0.020263671875, -0.0164794921875, -0.0126953125, -0.0089111328125, -0.005126953125, -0.0013427734375, 0.00244140625, 0.0062255859375, 0.010009765625, 0.0137939453125, 0.017578125, 0.0213623046875, 0.025146484375, 0.0289306640625, 0.03271484375, 0.0364990234375, 0.040283203125, 0.0440673828125, 0.0478515625, 0.0516357421875, 0.055419921875, 0.0592041015625, 0.06298828125, 0.0667724609375, 0.070556640625, 0.0743408203125, 0.078125, 0.0819091796875, 0.085693359375, 0.0894775390625, 0.09326171875, 0.0970458984375, 0.100830078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 665.0, 330.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.783815383911133, -6.660317420959473, -6.5368194580078125, -6.413321018218994, -6.289823055267334, -6.166325092315674, -6.042827129364014, -5.919328689575195, -5.795830726623535, -5.672332763671875, -5.548834800720215, -5.4253363609313965, -5.301838397979736, -5.178340435028076, -5.054842472076416, -4.931344032287598, -4.8078460693359375, -4.684348106384277, -4.560850143432617, -4.437351703643799, -4.313853740692139, -4.1903557777404785, -4.066857814788818, -3.943359613418579, -3.819861650466919, -3.696363687515259, -3.5728654861450195, -3.4493675231933594, -3.32586932182312, -3.20237135887146, -3.0788731575012207, -2.9553751945495605, -2.831876754760742, -2.708378791809082, -2.5848805904388428, -2.4613826274871826, -2.3378844261169434, -2.214386463165283, -2.090888261795044, -1.9673902988433838, -1.8438923358917236, -1.720394253730774, -1.5968961715698242, -1.4733980894088745, -1.3499000072479248, -1.2264020442962646, -1.1029038429260254, -0.9794058203697205, -0.855907678604126, -0.7324095964431763, -0.6089115142822266, -0.48541346192359924, -0.36191537976264954, -0.23841732740402222, -0.11491924524307251, 0.008578836917877197, 0.1320769190788269, 0.2555750012397766, 0.3790730834007263, 0.5025711059570312, 0.626069188117981, 0.7495672702789307, 0.8730653524398804, 0.9965634346008301, 1.1200615167617798]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 5.0, 8.0, 7.0, 13.0, 31.0, 38.0, 59.0, 60.0, 76.0, 102.0, 86.0, 106.0, 85.0, 72.0, 70.0, 53.0, 35.0, 25.0, 21.0, 13.0, 7.0, 5.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5499835014343262, -0.5298078060150146, -0.5096321702003479, -0.4894564747810364, -0.46928080916404724, -0.4491051435470581, -0.42892947793006897, -0.40875381231307983, -0.3885781168937683, -0.3684024512767792, -0.34822678565979004, -0.3280510902404785, -0.3078754246234894, -0.28769975900650024, -0.2675240933895111, -0.24734841287136078, -0.22717276215553284, -0.2069970965385437, -0.18682141602039337, -0.16664575040340424, -0.1464700698852539, -0.12629440426826477, -0.10611873865127563, -0.0859430581331253, -0.06576739251613617, -0.04559171944856644, -0.025416050106287003, -0.005240380764007568, 0.014935292303562164, 0.0351109653711319, 0.05528663098812103, 0.07546231150627136, 0.0956379771232605, 0.11581365019083023, 0.13598932325839996, 0.1561649888753891, 0.17634066939353943, 0.19651633501052856, 0.2166920006275177, 0.23686768114566803, 0.25704336166381836, 0.2772190272808075, 0.29739469289779663, 0.31757038831710815, 0.3377460539340973, 0.3579217195510864, 0.37809738516807556, 0.3982730507850647, 0.41844871640205383, 0.43862438201904297, 0.4588000476360321, 0.47897571325302124, 0.49915140867233276, 0.5193270444869995, 0.539502739906311, 0.5596784353256226, 0.5798540711402893, 0.6000297665596008, 0.6202054023742676, 0.6403810977935791, 0.6605567336082458, 0.6807324290275574, 0.7009080648422241, 0.7210837602615356, 0.7412594556808472]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 17.0, 9.0, 19.0, 27.0, 17.0, 24.0, 31.0, 43.0, 60.0, 87.0, 145.0, 194.0, 274.0, 491.0, 930.0, 1892.0, 4380.0, 14350.0, 139988.0, 841478.0, 31321.0, 6917.0, 2784.0, 1217.0, 636.0, 400.0, 233.0, 137.0, 115.0, 89.0, 49.0, 27.0, 38.0, 30.0, 19.0, 18.0, 12.0, 17.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.45361328125, -0.4390869140625, -0.424560546875, -0.4100341796875, -0.3955078125, -0.3809814453125, -0.366455078125, -0.3519287109375, -0.33740234375, -0.3228759765625, -0.308349609375, -0.2938232421875, -0.279296875, -0.2647705078125, -0.250244140625, -0.2357177734375, -0.22119140625, -0.2066650390625, -0.192138671875, -0.1776123046875, -0.1630859375, -0.1485595703125, -0.134033203125, -0.1195068359375, -0.10498046875, -0.0904541015625, -0.075927734375, -0.0614013671875, -0.046875, -0.0323486328125, -0.017822265625, -0.0032958984375, 0.01123046875, 0.0257568359375, 0.040283203125, 0.0548095703125, 0.0693359375, 0.0838623046875, 0.098388671875, 0.1129150390625, 0.12744140625, 0.1419677734375, 0.156494140625, 0.1710205078125, 0.185546875, 0.2000732421875, 0.214599609375, 0.2291259765625, 0.24365234375, 0.2581787109375, 0.272705078125, 0.2872314453125, 0.3017578125, 0.3162841796875, 0.330810546875, 0.3453369140625, 0.35986328125, 0.3743896484375, 0.388916015625, 0.4034423828125, 0.41796875, 0.4324951171875, 0.447021484375, 0.4615478515625, 0.47607421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 10.0, 14.0, 16.0, 17.0, 116.0, 325.0, 304.0, 104.0, 27.0, 18.0, 9.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.0956888198852539, -0.09268379211425781, -0.08967876434326172, -0.08667373657226562, -0.08366870880126953, -0.08066368103027344, -0.07765865325927734, -0.07465362548828125, -0.07164859771728516, -0.06864356994628906, -0.06563854217529297, -0.06263351440429688, -0.05962848663330078, -0.05662345886230469, -0.053618431091308594, -0.0506134033203125, -0.047608375549316406, -0.04460334777832031, -0.04159832000732422, -0.038593292236328125, -0.03558826446533203, -0.03258323669433594, -0.029578208923339844, -0.02657318115234375, -0.023568153381347656, -0.020563125610351562, -0.01755809783935547, -0.014553070068359375, -0.011548042297363281, -0.008543014526367188, -0.005537986755371094, -0.002532958984375, 0.00047206878662109375, 0.0034770965576171875, 0.006482124328613281, 0.009487152099609375, 0.012492179870605469, 0.015497207641601562, 0.018502235412597656, 0.02150726318359375, 0.024512290954589844, 0.027517318725585938, 0.03052234649658203, 0.033527374267578125, 0.03653240203857422, 0.03953742980957031, 0.042542457580566406, 0.0455474853515625, 0.048552513122558594, 0.05155754089355469, 0.05456256866455078, 0.057567596435546875, 0.06057262420654297, 0.06357765197753906, 0.06658267974853516, 0.06958770751953125, 0.07259273529052734, 0.07559776306152344, 0.07860279083251953, 0.08160781860351562, 0.08461284637451172, 0.08761787414550781, 0.0906229019165039, 0.0936279296875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 13.0, 8.0, 10.0, 7.0, 19.0, 20.0, 19.0, 32.0, 51.0, 59.0, 67.0, 105.0, 130.0, 223.0, 326.0, 582.0, 1009.0, 2020.0, 6162.0, 40531.0, 798150.0, 179255.0, 13120.0, 3282.0, 1399.0, 664.0, 403.0, 275.0, 173.0, 103.0, 90.0, 50.0, 42.0, 33.0, 26.0, 10.0, 18.0, 15.0, 11.0, 9.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.420166015625, -0.4073333740234375, -0.394500732421875, -0.3816680908203125, -0.36883544921875, -0.3560028076171875, -0.343170166015625, -0.3303375244140625, -0.3175048828125, -0.3046722412109375, -0.291839599609375, -0.2790069580078125, -0.26617431640625, -0.2533416748046875, -0.240509033203125, -0.2276763916015625, -0.21484375, -0.2020111083984375, -0.189178466796875, -0.1763458251953125, -0.16351318359375, -0.1506805419921875, -0.137847900390625, -0.1250152587890625, -0.1121826171875, -0.0993499755859375, -0.086517333984375, -0.0736846923828125, -0.06085205078125, -0.0480194091796875, -0.035186767578125, -0.0223541259765625, -0.009521484375, 0.0033111572265625, 0.016143798828125, 0.0289764404296875, 0.04180908203125, 0.0546417236328125, 0.067474365234375, 0.0803070068359375, 0.0931396484375, 0.1059722900390625, 0.118804931640625, 0.1316375732421875, 0.14447021484375, 0.1573028564453125, 0.170135498046875, 0.1829681396484375, 0.19580078125, 0.2086334228515625, 0.221466064453125, 0.2342987060546875, 0.24713134765625, 0.2599639892578125, 0.272796630859375, 0.2856292724609375, 0.2984619140625, 0.3112945556640625, 0.324127197265625, 0.3369598388671875, 0.34979248046875, 0.3626251220703125, 0.375457763671875, 0.3882904052734375, 0.401123046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 9.0, 10.0, 11.0, 13.0, 15.0, 26.0, 19.0, 26.0, 31.0, 26.0, 41.0, 36.0, 39.0, 43.0, 51.0, 48.0, 41.0, 46.0, 38.0, 44.0, 45.0, 31.0, 39.0, 35.0, 30.0, 31.0, 22.0, 23.0, 14.0, 13.0, 13.0, 17.0, 15.0, 7.0, 6.0, 7.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1868896484375, -0.18124008178710938, -0.17559051513671875, -0.16994094848632812, -0.1642913818359375, -0.15864181518554688, -0.15299224853515625, -0.14734268188476562, -0.141693115234375, -0.13604354858398438, -0.13039398193359375, -0.12474441528320312, -0.1190948486328125, -0.11344528198242188, -0.10779571533203125, -0.10214614868164062, -0.09649658203125, -0.09084701538085938, -0.08519744873046875, -0.07954788208007812, -0.0738983154296875, -0.06824874877929688, -0.06259918212890625, -0.056949615478515625, -0.051300048828125, -0.045650482177734375, -0.04000091552734375, -0.034351348876953125, -0.0287017822265625, -0.023052215576171875, -0.01740264892578125, -0.011753082275390625, -0.006103515625, -0.000453948974609375, 0.00519561767578125, 0.010845184326171875, 0.0164947509765625, 0.022144317626953125, 0.02779388427734375, 0.033443450927734375, 0.039093017578125, 0.044742584228515625, 0.05039215087890625, 0.056041717529296875, 0.0616912841796875, 0.06734085083007812, 0.07299041748046875, 0.07863998413085938, 0.08428955078125, 0.08993911743164062, 0.09558868408203125, 0.10123825073242188, 0.1068878173828125, 0.11253738403320312, 0.11818695068359375, 0.12383651733398438, 0.129486083984375, 0.13513565063476562, 0.14078521728515625, 0.14643478393554688, 0.1520843505859375, 0.15773391723632812, 0.16338348388671875, 0.16903305053710938, 0.1746826171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 24.0, 35.0, 54.0, 96.0, 137.0, 280.0, 577.0, 1474.0, 6130.0, 65073.0, 918035.0, 48975.0, 5258.0, 1279.0, 477.0, 224.0, 130.0, 63.0, 49.0, 41.0, 32.0, 17.0, 14.0, 9.0, 7.0, 2.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.25537109375, -0.24795913696289062, -0.24054718017578125, -0.23313522338867188, -0.2257232666015625, -0.21831130981445312, -0.21089935302734375, -0.20348739624023438, -0.196075439453125, -0.18866348266601562, -0.18125152587890625, -0.17383956909179688, -0.1664276123046875, -0.15901565551757812, -0.15160369873046875, -0.14419174194335938, -0.13677978515625, -0.12936782836914062, -0.12195587158203125, -0.11454391479492188, -0.1071319580078125, -0.09972000122070312, -0.09230804443359375, -0.08489608764648438, -0.077484130859375, -0.07007217407226562, -0.06266021728515625, -0.055248260498046875, -0.0478363037109375, -0.040424346923828125, -0.03301239013671875, -0.025600433349609375, -0.0181884765625, -0.010776519775390625, -0.00336456298828125, 0.004047393798828125, 0.0114593505859375, 0.018871307373046875, 0.02628326416015625, 0.033695220947265625, 0.041107177734375, 0.048519134521484375, 0.05593109130859375, 0.06334304809570312, 0.0707550048828125, 0.07816696166992188, 0.08557891845703125, 0.09299087524414062, 0.10040283203125, 0.10781478881835938, 0.11522674560546875, 0.12263870239257812, 0.1300506591796875, 0.13746261596679688, 0.14487457275390625, 0.15228652954101562, 0.159698486328125, 0.16711044311523438, 0.17452239990234375, 0.18193435668945312, 0.1893463134765625, 0.19675827026367188, 0.20417022705078125, 0.21158218383789062, 0.218994140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 10.0, 3.0, 3.0, 13.0, 4.0, 11.0, 13.0, 20.0, 27.0, 39.0, 56.0, 57.0, 108.0, 249.0, 112.0, 66.0, 58.0, 34.0, 31.0, 20.0, 15.0, 16.0, 9.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00022661685943603516, -0.00022023916244506836, -0.00021386146545410156, -0.00020748376846313477, -0.00020110607147216797, -0.00019472837448120117, -0.00018835067749023438, -0.00018197298049926758, -0.00017559528350830078, -0.00016921758651733398, -0.0001628398895263672, -0.0001564621925354004, -0.0001500844955444336, -0.0001437067985534668, -0.0001373291015625, -0.0001309514045715332, -0.0001245737075805664, -0.00011819601058959961, -0.00011181831359863281, -0.00010544061660766602, -9.906291961669922e-05, -9.268522262573242e-05, -8.630752563476562e-05, -7.992982864379883e-05, -7.355213165283203e-05, -6.717443466186523e-05, -6.079673767089844e-05, -5.441904067993164e-05, -4.8041343688964844e-05, -4.166364669799805e-05, -3.528594970703125e-05, -2.8908252716064453e-05, -2.2530555725097656e-05, -1.615285873413086e-05, -9.775161743164062e-06, -3.3974647521972656e-06, 2.9802322387695312e-06, 9.357929229736328e-06, 1.5735626220703125e-05, 2.2113323211669922e-05, 2.849102020263672e-05, 3.4868717193603516e-05, 4.124641418457031e-05, 4.762411117553711e-05, 5.4001808166503906e-05, 6.03795051574707e-05, 6.67572021484375e-05, 7.31348991394043e-05, 7.95125961303711e-05, 8.589029312133789e-05, 9.226799011230469e-05, 9.864568710327148e-05, 0.00010502338409423828, 0.00011140108108520508, 0.00011777877807617188, 0.00012415647506713867, 0.00013053417205810547, 0.00013691186904907227, 0.00014328956604003906, 0.00014966726303100586, 0.00015604496002197266, 0.00016242265701293945, 0.00016880035400390625, 0.00017517805099487305, 0.00018155574798583984]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 14.0, 8.0, 11.0, 26.0, 39.0, 55.0, 72.0, 176.0, 385.0, 971.0, 5173.0, 321141.0, 712628.0, 5960.0, 1100.0, 386.0, 167.0, 78.0, 55.0, 29.0, 26.0, 17.0, 7.0, 7.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.496826171875, -0.48223114013671875, -0.4676361083984375, -0.45304107666015625, -0.438446044921875, -0.42385101318359375, -0.4092559814453125, -0.39466094970703125, -0.38006591796875, -0.36547088623046875, -0.3508758544921875, -0.33628082275390625, -0.321685791015625, -0.30709075927734375, -0.2924957275390625, -0.27790069580078125, -0.2633056640625, -0.24871063232421875, -0.2341156005859375, -0.21952056884765625, -0.204925537109375, -0.19033050537109375, -0.1757354736328125, -0.16114044189453125, -0.14654541015625, -0.13195037841796875, -0.1173553466796875, -0.10276031494140625, -0.088165283203125, -0.07357025146484375, -0.0589752197265625, -0.04438018798828125, -0.02978515625, -0.01519012451171875, -0.0005950927734375, 0.01399993896484375, 0.028594970703125, 0.04319000244140625, 0.0577850341796875, 0.07238006591796875, 0.08697509765625, 0.10157012939453125, 0.1161651611328125, 0.13076019287109375, 0.145355224609375, 0.15995025634765625, 0.1745452880859375, 0.18914031982421875, 0.2037353515625, 0.21833038330078125, 0.2329254150390625, 0.24752044677734375, 0.262115478515625, 0.27671051025390625, 0.2913055419921875, 0.30590057373046875, 0.32049560546875, 0.33509063720703125, 0.3496856689453125, 0.36428070068359375, 0.378875732421875, 0.39347076416015625, 0.4080657958984375, 0.42266082763671875, 0.437255859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 5.0, 10.0, 9.0, 15.0, 16.0, 37.0, 49.0, 91.0, 142.0, 184.0, 144.0, 96.0, 51.0, 31.0, 24.0, 17.0, 11.0, 15.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2091064453125, -0.2036876678466797, -0.19826889038085938, -0.19285011291503906, -0.18743133544921875, -0.18201255798339844, -0.17659378051757812, -0.1711750030517578, -0.1657562255859375, -0.1603374481201172, -0.15491867065429688, -0.14949989318847656, -0.14408111572265625, -0.13866233825683594, -0.13324356079101562, -0.1278247833251953, -0.122406005859375, -0.11698722839355469, -0.11156845092773438, -0.10614967346191406, -0.10073089599609375, -0.09531211853027344, -0.08989334106445312, -0.08447456359863281, -0.0790557861328125, -0.07363700866699219, -0.06821823120117188, -0.06279945373535156, -0.05738067626953125, -0.05196189880371094, -0.046543121337890625, -0.04112434387207031, -0.03570556640625, -0.030286788940429688, -0.024868011474609375, -0.019449234008789062, -0.01403045654296875, -0.008611679077148438, -0.003192901611328125, 0.0022258758544921875, 0.0076446533203125, 0.013063430786132812, 0.018482208251953125, 0.023900985717773438, 0.02931976318359375, 0.03473854064941406, 0.040157318115234375, 0.04557609558105469, 0.050994873046875, 0.05641365051269531, 0.061832427978515625, 0.06725120544433594, 0.07266998291015625, 0.07808876037597656, 0.08350753784179688, 0.08892631530761719, 0.0943450927734375, 0.09976387023925781, 0.10518264770507812, 0.11060142517089844, 0.11602020263671875, 0.12143898010253906, 0.12685775756835938, 0.1322765350341797, 0.1376953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 12.0, 24.0, 90.0, 377.0, 401.0, 69.0, 13.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6290292739868164, -3.5252389907836914, -3.4214487075805664, -3.3176584243774414, -3.2138681411743164, -3.1100778579711914, -3.0062878131866455, -2.9024975299835205, -2.7987072467803955, -2.6949169635772705, -2.5911266803741455, -2.4873363971710205, -2.3835463523864746, -2.2797560691833496, -2.1759657859802246, -2.0721755027770996, -1.9683852195739746, -1.8645949363708496, -1.7608046531677246, -1.6570144891738892, -1.5532242059707642, -1.4494339227676392, -1.3456437587738037, -1.2418534755706787, -1.1380631923675537, -1.0342729091644287, -0.9304826855659485, -0.8266924619674683, -0.7229021787643433, -0.6191118955612183, -0.515321671962738, -0.4115314483642578, -0.3077414035797119, -0.2039511501789093, -0.10016089677810669, 0.003629356622695923, 0.10741961002349854, 0.21120989322662354, 0.31500011682510376, 0.418790340423584, 0.522580623626709, 0.626370906829834, 0.7301611304283142, 0.8339513540267944, 0.9377416372299194, 1.0415319204330444, 1.1453220844268799, 1.2491123676300049, 1.3529026508331299, 1.4566929340362549, 1.5604832172393799, 1.6642733812332153, 1.7680636644363403, 1.8718539476394653, 1.9756441116333008, 2.079434394836426, 2.183224678039551, 2.287014961242676, 2.390805244445801, 2.494595527648926, 2.598385810852051, 2.702176094055176, 2.8059661388397217, 2.9097564220428467, 3.0135467052459717]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 9.0, 5.0, 12.0, 21.0, 20.0, 28.0, 50.0, 40.0, 44.0, 60.0, 54.0, 55.0, 82.0, 66.0, 70.0, 58.0, 70.0, 59.0, 38.0, 38.0, 34.0, 20.0, 23.0, 9.0, 12.0, 4.0, 10.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.2630128860473633, -2.1985321044921875, -2.134051561355591, -2.069571018218994, -2.0050902366638184, -1.9406095743179321, -1.876128911972046, -1.8116482496261597, -1.7471675872802734, -1.6826869249343872, -1.618206262588501, -1.5537256002426147, -1.4892449378967285, -1.4247642755508423, -1.360283613204956, -1.2958029508590698, -1.2313222885131836, -1.1668416261672974, -1.1023609638214111, -1.037880301475525, -0.9733996391296387, -0.9089189767837524, -0.8444383144378662, -0.77995765209198, -0.7154769897460938, -0.6509963274002075, -0.5865156650543213, -0.5220350027084351, -0.45755434036254883, -0.3930736780166626, -0.32859301567077637, -0.26411235332489014, -0.1996316909790039, -0.13515102863311768, -0.07067036628723145, -0.006189703941345215, 0.058290958404541016, 0.12277162075042725, 0.18725228309631348, 0.2517329454421997, 0.31621360778808594, 0.38069427013397217, 0.4451749324798584, 0.5096555948257446, 0.5741362571716309, 0.6386169195175171, 0.7030975818634033, 0.7675782442092896, 0.8320589065551758, 0.896539568901062, 0.9610202312469482, 1.0255008935928345, 1.0899815559387207, 1.154462218284607, 1.2189428806304932, 1.2834235429763794, 1.3479042053222656, 1.4123848676681519, 1.476865530014038, 1.5413461923599243, 1.6058268547058105, 1.6703075170516968, 1.734788179397583, 1.7992688417434692, 1.8637495040893555]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 17.0, 24.0, 55.0, 124.0, 442.0, 5764.0, 4184984.0, 2458.0, 285.0, 65.0, 21.0, 17.0, 18.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.7738037109375, -2.672607421875, -2.5714111328125, -2.47021484375, -2.3690185546875, -2.267822265625, -2.1666259765625, -2.0654296875, -1.9642333984375, -1.863037109375, -1.7618408203125, -1.66064453125, -1.5594482421875, -1.458251953125, -1.3570556640625, -1.255859375, -1.1546630859375, -1.053466796875, -0.9522705078125, -0.85107421875, -0.7498779296875, -0.648681640625, -0.5474853515625, -0.4462890625, -0.3450927734375, -0.243896484375, -0.1427001953125, -0.04150390625, 0.0596923828125, 0.160888671875, 0.2620849609375, 0.36328125, 0.4644775390625, 0.565673828125, 0.6668701171875, 0.76806640625, 0.8692626953125, 0.970458984375, 1.0716552734375, 1.1728515625, 1.2740478515625, 1.375244140625, 1.4764404296875, 1.57763671875, 1.6788330078125, 1.780029296875, 1.8812255859375, 1.982421875, 2.0836181640625, 2.184814453125, 2.2860107421875, 2.38720703125, 2.4884033203125, 2.589599609375, 2.6907958984375, 2.7919921875, 2.8931884765625, 2.994384765625, 3.0955810546875, 3.19677734375, 3.2979736328125, 3.399169921875, 3.5003662109375, 3.6015625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 15.0, 9.0, 15.0, 18.0, 42.0, 165.0, 289.0, 275.0, 99.0, 30.0, 16.0, 8.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.09336280822753906, -0.09010696411132812, -0.08685111999511719, -0.08359527587890625, -0.08033943176269531, -0.07708358764648438, -0.07382774353027344, -0.0705718994140625, -0.06731605529785156, -0.06406021118164062, -0.06080436706542969, -0.05754852294921875, -0.05429267883300781, -0.051036834716796875, -0.04778099060058594, -0.044525146484375, -0.04126930236816406, -0.038013458251953125, -0.03475761413574219, -0.03150177001953125, -0.028245925903320312, -0.024990081787109375, -0.021734237670898438, -0.0184783935546875, -0.015222549438476562, -0.011966705322265625, -0.008710861206054688, -0.00545501708984375, -0.0021991729736328125, 0.001056671142578125, 0.0043125152587890625, 0.007568359375, 0.010824203491210938, 0.014080047607421875, 0.017335891723632812, 0.02059173583984375, 0.023847579956054688, 0.027103424072265625, 0.030359268188476562, 0.0336151123046875, 0.03687095642089844, 0.040126800537109375, 0.04338264465332031, 0.04663848876953125, 0.04989433288574219, 0.053150177001953125, 0.05640602111816406, 0.059661865234375, 0.06291770935058594, 0.06617355346679688, 0.06942939758300781, 0.07268524169921875, 0.07594108581542969, 0.07919692993164062, 0.08245277404785156, 0.0857086181640625, 0.08896446228027344, 0.09222030639648438, 0.09547615051269531, 0.09873199462890625, 0.10198783874511719, 0.10524368286132812, 0.10849952697753906, 0.11175537109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 7.0, 11.0, 13.0, 18.0, 36.0, 56.0, 68.0, 99.0, 208.0, 424.0, 849.0, 2526.0, 13032.0, 3572018.0, 589218.0, 11049.0, 2514.0, 981.0, 418.0, 240.0, 179.0, 105.0, 61.0, 46.0, 32.0, 23.0, 9.0, 8.0, 4.0, 6.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5830078125, -0.5621414184570312, -0.5412750244140625, -0.5204086303710938, -0.499542236328125, -0.47867584228515625, -0.4578094482421875, -0.43694305419921875, -0.41607666015625, -0.39521026611328125, -0.3743438720703125, -0.35347747802734375, -0.332611083984375, -0.31174468994140625, -0.2908782958984375, -0.27001190185546875, -0.2491455078125, -0.22827911376953125, -0.2074127197265625, -0.18654632568359375, -0.165679931640625, -0.14481353759765625, -0.1239471435546875, -0.10308074951171875, -0.08221435546875, -0.06134796142578125, -0.0404815673828125, -0.01961517333984375, 0.001251220703125, 0.02211761474609375, 0.0429840087890625, 0.06385040283203125, 0.084716796875, 0.10558319091796875, 0.1264495849609375, 0.14731597900390625, 0.168182373046875, 0.18904876708984375, 0.2099151611328125, 0.23078155517578125, 0.25164794921875, 0.27251434326171875, 0.2933807373046875, 0.31424713134765625, 0.335113525390625, 0.35597991943359375, 0.3768463134765625, 0.39771270751953125, 0.4185791015625, 0.43944549560546875, 0.4603118896484375, 0.48117828369140625, 0.502044677734375, 0.5229110717773438, 0.5437774658203125, 0.5646438598632812, 0.58551025390625, 0.6063766479492188, 0.6272430419921875, 0.6481094360351562, 0.668975830078125, 0.6898422241210938, 0.7107086181640625, 0.7315750122070312, 0.75244140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 8.0, 6.0, 19.0, 23.0, 35.0, 74.0, 202.0, 2515.0, 844.0, 150.0, 59.0, 37.0, 24.0, 18.0, 13.0, 5.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07672882080078125, -0.0726470947265625, -0.06856536865234375, -0.064483642578125, -0.06040191650390625, -0.0563201904296875, -0.05223846435546875, -0.04815673828125, -0.04407501220703125, -0.0399932861328125, -0.03591156005859375, -0.031829833984375, -0.02774810791015625, -0.0236663818359375, -0.01958465576171875, -0.0155029296875, -0.01142120361328125, -0.0073394775390625, -0.00325775146484375, 0.000823974609375, 0.00490570068359375, 0.0089874267578125, 0.01306915283203125, 0.01715087890625, 0.02123260498046875, 0.0253143310546875, 0.02939605712890625, 0.033477783203125, 0.03755950927734375, 0.0416412353515625, 0.04572296142578125, 0.0498046875, 0.05388641357421875, 0.0579681396484375, 0.06204986572265625, 0.066131591796875, 0.07021331787109375, 0.0742950439453125, 0.07837677001953125, 0.08245849609375, 0.08654022216796875, 0.0906219482421875, 0.09470367431640625, 0.098785400390625, 0.10286712646484375, 0.1069488525390625, 0.11103057861328125, 0.1151123046875, 0.11919403076171875, 0.1232757568359375, 0.12735748291015625, 0.131439208984375, 0.13552093505859375, 0.1396026611328125, 0.14368438720703125, 0.14776611328125, 0.15184783935546875, 0.1559295654296875, 0.16001129150390625, 0.164093017578125, 0.16817474365234375, 0.1722564697265625, 0.17633819580078125, 0.180419921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 13.0, 162.0, 755.0, 63.0, 13.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944117307662964, -2.871133327484131, -2.7981491088867188, -2.7251651287078857, -2.6521811485290527, -2.5791969299316406, -2.5062129497528076, -2.4332289695739746, -2.3602447509765625, -2.2872607707977295, -2.2142765522003174, -2.1412925720214844, -2.0683085918426514, -1.9953244924545288, -1.9223403930664062, -1.8493564128875732, -1.7763724327087402, -1.7033883333206177, -1.6304043531417847, -1.557420253753662, -1.484436273574829, -1.4114521741867065, -1.338468074798584, -1.265484094619751, -1.1924999952316284, -1.1195158958435059, -1.0465319156646729, -0.9735478162765503, -0.9005637764930725, -0.8275797367095947, -0.7545956373214722, -0.6816115975379944, -0.6086273193359375, -0.5356432795524597, -0.46265920996665955, -0.3896751403808594, -0.3166911005973816, -0.2437070608139038, -0.17072299122810364, -0.09773892164230347, -0.024754881858825684, 0.04822917282581329, 0.12121322751045227, 0.19419728219509125, 0.2671813368797302, 0.340165376663208, 0.4131494462490082, 0.48613351583480835, 0.5591175556182861, 0.6321015954017639, 0.7050856351852417, 0.7780697345733643, 0.851053774356842, 0.9240378141403198, 0.9970219135284424, 1.0700058937072754, 1.142989993095398, 1.2159740924835205, 1.2889580726623535, 1.361942172050476, 1.4349262714385986, 1.5079102516174316, 1.5808943510055542, 1.6538784503936768, 1.7268624305725098]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 6.0, 9.0, 14.0, 16.0, 15.0, 32.0, 20.0, 40.0, 54.0, 48.0, 42.0, 58.0, 57.0, 59.0, 48.0, 49.0, 66.0, 64.0, 50.0, 45.0, 34.0, 28.0, 42.0, 25.0, 21.0, 9.0, 8.0, 10.0, 5.0, 2.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4465025067329407, -0.4348994791507721, -0.42329642176628113, -0.41169339418411255, -0.4000903367996216, -0.388487309217453, -0.3768842816352844, -0.36528122425079346, -0.3536781668663025, -0.3420751392841339, -0.33047208189964294, -0.31886905431747437, -0.3072659969329834, -0.2956629693508148, -0.28405994176864624, -0.2724568843841553, -0.2608538568019867, -0.24925081431865692, -0.23764777183532715, -0.22604474425315857, -0.2144416868686676, -0.20283865928649902, -0.19123561680316925, -0.17963257431983948, -0.1680295318365097, -0.15642648935317993, -0.14482344686985016, -0.13322040438652039, -0.12161736935377121, -0.11001432687044144, -0.09841129183769226, -0.08680824935436249, -0.07520520687103271, -0.06360216438770294, -0.05199912562966347, -0.04039608687162399, -0.02879304438829422, -0.017190001904964447, -0.005586966872215271, 0.006016075611114502, 0.017619118094444275, 0.0292221587151289, 0.04082519933581352, 0.052428238093853, 0.06403128057718277, 0.07563432306051254, 0.08723735809326172, 0.09884040057659149, 0.11044344305992126, 0.12204648554325104, 0.1336495280265808, 0.1452525556087494, 0.15685561299324036, 0.16845864057540894, 0.1800616830587387, 0.19166472554206848, 0.20326776802539825, 0.21487081050872803, 0.2264738529920578, 0.23807689547538757, 0.24967992305755615, 0.2612829804420471, 0.2728860080242157, 0.2844890356063843, 0.29609209299087524]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 8.0, 5.0, 8.0, 8.0, 10.0, 14.0, 13.0, 16.0, 10.0, 23.0, 36.0, 54.0, 65.0, 113.0, 112.0, 166.0, 219.0, 339.0, 420.0, 774.0, 1280.0, 2803.0, 9042.0, 56144.0, 800351.0, 152910.0, 15154.0, 4135.0, 1621.0, 895.0, 534.0, 348.0, 228.0, 178.0, 136.0, 107.0, 68.0, 50.0, 44.0, 29.0, 22.0, 17.0, 11.0, 11.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291015625, -0.2821083068847656, -0.27320098876953125, -0.2642936706542969, -0.2553863525390625, -0.24647903442382812, -0.23757171630859375, -0.22866439819335938, -0.219757080078125, -0.21084976196289062, -0.20194244384765625, -0.19303512573242188, -0.1841278076171875, -0.17522048950195312, -0.16631317138671875, -0.15740585327148438, -0.14849853515625, -0.13959121704101562, -0.13068389892578125, -0.12177658081054688, -0.1128692626953125, -0.10396194458007812, -0.09505462646484375, -0.08614730834960938, -0.077239990234375, -0.06833267211914062, -0.05942535400390625, -0.050518035888671875, -0.0416107177734375, -0.032703399658203125, -0.02379608154296875, -0.014888763427734375, -0.0059814453125, 0.002925872802734375, 0.01183319091796875, 0.020740509033203125, 0.0296478271484375, 0.038555145263671875, 0.04746246337890625, 0.056369781494140625, 0.065277099609375, 0.07418441772460938, 0.08309173583984375, 0.09199905395507812, 0.1009063720703125, 0.10981369018554688, 0.11872100830078125, 0.12762832641601562, 0.13653564453125, 0.14544296264648438, 0.15435028076171875, 0.16325759887695312, 0.1721649169921875, 0.18107223510742188, 0.18997955322265625, 0.19888687133789062, 0.207794189453125, 0.21670150756835938, 0.22560882568359375, 0.23451614379882812, 0.2434234619140625, 0.2523307800292969, 0.26123809814453125, 0.2701454162597656, 0.279052734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 11.0, 17.0, 16.0, 22.0, 70.0, 166.0, 290.0, 250.0, 91.0, 35.0, 9.0, 10.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1014404296875, -0.09822463989257812, -0.09500885009765625, -0.09179306030273438, -0.0885772705078125, -0.08536148071289062, -0.08214569091796875, -0.07892990112304688, -0.075714111328125, -0.07249832153320312, -0.06928253173828125, -0.06606674194335938, -0.0628509521484375, -0.059635162353515625, -0.05641937255859375, -0.053203582763671875, -0.04998779296875, -0.046772003173828125, -0.04355621337890625, -0.040340423583984375, -0.0371246337890625, -0.033908843994140625, -0.03069305419921875, -0.027477264404296875, -0.024261474609375, -0.021045684814453125, -0.01782989501953125, -0.014614105224609375, -0.0113983154296875, -0.008182525634765625, -0.00496673583984375, -0.001750946044921875, 0.00146484375, 0.004680633544921875, 0.00789642333984375, 0.011112213134765625, 0.0143280029296875, 0.017543792724609375, 0.02075958251953125, 0.023975372314453125, 0.027191162109375, 0.030406951904296875, 0.03362274169921875, 0.036838531494140625, 0.0400543212890625, 0.043270111083984375, 0.04648590087890625, 0.049701690673828125, 0.05291748046875, 0.056133270263671875, 0.05934906005859375, 0.06256484985351562, 0.0657806396484375, 0.06899642944335938, 0.07221221923828125, 0.07542800903320312, 0.078643798828125, 0.08185958862304688, 0.08507537841796875, 0.08829116821289062, 0.0915069580078125, 0.09472274780273438, 0.09793853759765625, 0.10115432739257812, 0.1043701171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 5.0, 12.0, 20.0, 20.0, 35.0, 34.0, 45.0, 84.0, 120.0, 168.0, 250.0, 378.0, 652.0, 1274.0, 2564.0, 7550.0, 50289.0, 684883.0, 270945.0, 20606.0, 4433.0, 1782.0, 913.0, 498.0, 308.0, 214.0, 155.0, 95.0, 51.0, 40.0, 36.0, 26.0, 13.0, 17.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.33251953125, -0.3232307434082031, -0.31394195556640625, -0.3046531677246094, -0.2953643798828125, -0.2860755920410156, -0.27678680419921875, -0.2674980163574219, -0.258209228515625, -0.24892044067382812, -0.23963165283203125, -0.23034286499023438, -0.2210540771484375, -0.21176528930664062, -0.20247650146484375, -0.19318771362304688, -0.18389892578125, -0.17461013793945312, -0.16532135009765625, -0.15603256225585938, -0.1467437744140625, -0.13745498657226562, -0.12816619873046875, -0.11887741088867188, -0.109588623046875, -0.10029983520507812, -0.09101104736328125, -0.08172225952148438, -0.0724334716796875, -0.06314468383789062, -0.05385589599609375, -0.044567108154296875, -0.0352783203125, -0.025989532470703125, -0.01670074462890625, -0.007411956787109375, 0.0018768310546875, 0.011165618896484375, 0.02045440673828125, 0.029743194580078125, 0.039031982421875, 0.048320770263671875, 0.05760955810546875, 0.06689834594726562, 0.0761871337890625, 0.08547592163085938, 0.09476470947265625, 0.10405349731445312, 0.11334228515625, 0.12263107299804688, 0.13191986083984375, 0.14120864868164062, 0.1504974365234375, 0.15978622436523438, 0.16907501220703125, 0.17836380004882812, 0.187652587890625, 0.19694137573242188, 0.20623016357421875, 0.21551895141601562, 0.2248077392578125, 0.23409652709960938, 0.24338531494140625, 0.2526741027832031, 0.261962890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 9.0, 9.0, 9.0, 10.0, 16.0, 12.0, 27.0, 24.0, 35.0, 37.0, 26.0, 41.0, 61.0, 54.0, 46.0, 49.0, 57.0, 43.0, 41.0, 50.0, 44.0, 48.0, 52.0, 33.0, 26.0, 27.0, 24.0, 16.0, 17.0, 14.0, 10.0, 11.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.270263671875, -0.2636280059814453, -0.2569923400878906, -0.25035667419433594, -0.24372100830078125, -0.23708534240722656, -0.23044967651367188, -0.2238140106201172, -0.2171783447265625, -0.2105426788330078, -0.20390701293945312, -0.19727134704589844, -0.19063568115234375, -0.18400001525878906, -0.17736434936523438, -0.1707286834716797, -0.164093017578125, -0.1574573516845703, -0.15082168579101562, -0.14418601989746094, -0.13755035400390625, -0.13091468811035156, -0.12427902221679688, -0.11764335632324219, -0.1110076904296875, -0.10437202453613281, -0.09773635864257812, -0.09110069274902344, -0.08446502685546875, -0.07782936096191406, -0.07119369506835938, -0.06455802917480469, -0.05792236328125, -0.05128669738769531, -0.044651031494140625, -0.03801536560058594, -0.03137969970703125, -0.024744033813476562, -0.018108367919921875, -0.011472702026367188, -0.0048370361328125, 0.0017986297607421875, 0.008434295654296875, 0.015069961547851562, 0.02170562744140625, 0.028341293334960938, 0.034976959228515625, 0.04161262512207031, 0.048248291015625, 0.05488395690917969, 0.061519622802734375, 0.06815528869628906, 0.07479095458984375, 0.08142662048339844, 0.08806228637695312, 0.09469795227050781, 0.1013336181640625, 0.10796928405761719, 0.11460494995117188, 0.12124061584472656, 0.12787628173828125, 0.13451194763183594, 0.14114761352539062, 0.1477832794189453, 0.1544189453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 2.0, 9.0, 15.0, 22.0, 23.0, 33.0, 65.0, 111.0, 219.0, 420.0, 978.0, 2565.0, 10290.0, 153450.0, 830715.0, 40999.0, 5514.0, 1711.0, 667.0, 308.0, 176.0, 86.0, 49.0, 35.0, 20.0, 20.0, 15.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1686840057373047, -0.16329574584960938, -0.15790748596191406, -0.15251922607421875, -0.14713096618652344, -0.14174270629882812, -0.1363544464111328, -0.1309661865234375, -0.1255779266357422, -0.12018966674804688, -0.11480140686035156, -0.10941314697265625, -0.10402488708496094, -0.09863662719726562, -0.09324836730957031, -0.087860107421875, -0.08247184753417969, -0.07708358764648438, -0.07169532775878906, -0.06630706787109375, -0.06091880798339844, -0.055530548095703125, -0.05014228820800781, -0.0447540283203125, -0.03936576843261719, -0.033977508544921875, -0.028589248657226562, -0.02320098876953125, -0.017812728881835938, -0.012424468994140625, -0.0070362091064453125, -0.00164794921875, 0.0037403106689453125, 0.009128570556640625, 0.014516830444335938, 0.01990509033203125, 0.025293350219726562, 0.030681610107421875, 0.03606986999511719, 0.0414581298828125, 0.04684638977050781, 0.052234649658203125, 0.05762290954589844, 0.06301116943359375, 0.06839942932128906, 0.07378768920898438, 0.07917594909667969, 0.084564208984375, 0.08995246887207031, 0.09534072875976562, 0.10072898864746094, 0.10611724853515625, 0.11150550842285156, 0.11689376831054688, 0.12228202819824219, 0.1276702880859375, 0.1330585479736328, 0.13844680786132812, 0.14383506774902344, 0.14922332763671875, 0.15461158752441406, 0.15999984741210938, 0.1653881072998047, 0.1707763671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 2.0, 5.0, 9.0, 8.0, 8.0, 9.0, 14.0, 19.0, 31.0, 45.0, 99.0, 212.0, 233.0, 105.0, 57.0, 34.0, 32.0, 19.0, 15.0, 10.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001747608184814453, -0.00016832351684570312, -0.00016188621520996094, -0.00015544891357421875, -0.00014901161193847656, -0.00014257431030273438, -0.0001361370086669922, -0.00012969970703125, -0.0001232624053955078, -0.00011682510375976562, -0.00011038780212402344, -0.00010395050048828125, -9.751319885253906e-05, -9.107589721679688e-05, -8.463859558105469e-05, -7.82012939453125e-05, -7.176399230957031e-05, -6.532669067382812e-05, -5.888938903808594e-05, -5.245208740234375e-05, -4.601478576660156e-05, -3.9577484130859375e-05, -3.314018249511719e-05, -2.6702880859375e-05, -2.0265579223632812e-05, -1.3828277587890625e-05, -7.3909759521484375e-06, -9.5367431640625e-07, 5.4836273193359375e-06, 1.1920928955078125e-05, 1.8358230590820312e-05, 2.47955322265625e-05, 3.123283386230469e-05, 3.7670135498046875e-05, 4.410743713378906e-05, 5.054473876953125e-05, 5.698204040527344e-05, 6.341934204101562e-05, 6.985664367675781e-05, 7.62939453125e-05, 8.273124694824219e-05, 8.916854858398438e-05, 9.560585021972656e-05, 0.00010204315185546875, 0.00010848045349121094, 0.00011491775512695312, 0.00012135505676269531, 0.0001277923583984375, 0.0001342296600341797, 0.00014066696166992188, 0.00014710426330566406, 0.00015354156494140625, 0.00015997886657714844, 0.00016641616821289062, 0.0001728534698486328, 0.000179290771484375, 0.0001857280731201172, 0.00019216537475585938, 0.00019860267639160156, 0.00020503997802734375, 0.00021147727966308594, 0.00021791458129882812, 0.0002243518829345703, 0.0002307891845703125, 0.0002372264862060547]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 13.0, 13.0, 24.0, 37.0, 57.0, 72.0, 129.0, 193.0, 391.0, 728.0, 1630.0, 4203.0, 15172.0, 144186.0, 783347.0, 80667.0, 11271.0, 3484.0, 1373.0, 644.0, 363.0, 180.0, 113.0, 61.0, 60.0, 35.0, 20.0, 17.0, 13.0, 17.0, 8.0, 11.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.173828125, -0.1690521240234375, -0.164276123046875, -0.1595001220703125, -0.15472412109375, -0.1499481201171875, -0.145172119140625, -0.1403961181640625, -0.1356201171875, -0.1308441162109375, -0.126068115234375, -0.1212921142578125, -0.11651611328125, -0.1117401123046875, -0.106964111328125, -0.1021881103515625, -0.097412109375, -0.0926361083984375, -0.087860107421875, -0.0830841064453125, -0.07830810546875, -0.0735321044921875, -0.068756103515625, -0.0639801025390625, -0.0592041015625, -0.0544281005859375, -0.049652099609375, -0.0448760986328125, -0.04010009765625, -0.0353240966796875, -0.030548095703125, -0.0257720947265625, -0.02099609375, -0.0162200927734375, -0.011444091796875, -0.0066680908203125, -0.00189208984375, 0.0028839111328125, 0.007659912109375, 0.0124359130859375, 0.0172119140625, 0.0219879150390625, 0.026763916015625, 0.0315399169921875, 0.03631591796875, 0.0410919189453125, 0.045867919921875, 0.0506439208984375, 0.055419921875, 0.0601959228515625, 0.064971923828125, 0.0697479248046875, 0.07452392578125, 0.0792999267578125, 0.084075927734375, 0.0888519287109375, 0.0936279296875, 0.0984039306640625, 0.103179931640625, 0.1079559326171875, 0.11273193359375, 0.1175079345703125, 0.122283935546875, 0.1270599365234375, 0.1318359375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 7.0, 17.0, 17.0, 28.0, 51.0, 52.0, 85.0, 91.0, 120.0, 127.0, 86.0, 88.0, 57.0, 36.0, 33.0, 27.0, 13.0, 16.0, 13.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.13589859008789062, -0.13190460205078125, -0.12791061401367188, -0.1239166259765625, -0.11992263793945312, -0.11592864990234375, -0.11193466186523438, -0.107940673828125, -0.10394668579101562, -0.09995269775390625, -0.09595870971679688, -0.0919647216796875, -0.08797073364257812, -0.08397674560546875, -0.07998275756835938, -0.07598876953125, -0.07199478149414062, -0.06800079345703125, -0.06400680541992188, -0.0600128173828125, -0.056018829345703125, -0.05202484130859375, -0.048030853271484375, -0.044036865234375, -0.040042877197265625, -0.03604888916015625, -0.032054901123046875, -0.0280609130859375, -0.024066925048828125, -0.02007293701171875, -0.016078948974609375, -0.0120849609375, -0.008090972900390625, -0.00409698486328125, -0.000102996826171875, 0.0038909912109375, 0.007884979248046875, 0.01187896728515625, 0.015872955322265625, 0.019866943359375, 0.023860931396484375, 0.02785491943359375, 0.031848907470703125, 0.0358428955078125, 0.039836883544921875, 0.04383087158203125, 0.047824859619140625, 0.05181884765625, 0.055812835693359375, 0.05980682373046875, 0.06380081176757812, 0.0677947998046875, 0.07178878784179688, 0.07578277587890625, 0.07977676391601562, 0.083770751953125, 0.08776473999023438, 0.09175872802734375, 0.09575271606445312, 0.0997467041015625, 0.10374069213867188, 0.10773468017578125, 0.11172866821289062, 0.11572265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 25.0, 379.0, 580.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.153179168701172, -11.932692527770996, -11.712206840515137, -11.491720199584961, -11.271233558654785, -11.05074691772461, -10.83026123046875, -10.609774589538574, -10.389287948608398, -10.168801307678223, -9.948315620422363, -9.727828979492188, -9.507342338562012, -9.286855697631836, -9.066370010375977, -8.8458833694458, -8.625396728515625, -8.40491008758545, -8.18442440032959, -7.963937759399414, -7.743451118469238, -7.522964954376221, -7.302478313446045, -7.081992149353027, -6.86150598526001, -6.641019821166992, -6.420533180236816, -6.200047016143799, -5.979560375213623, -5.7590742111206055, -5.53858757019043, -5.318101406097412, -5.097614765167236, -4.877128601074219, -4.656641960144043, -4.436155796051025, -4.21566915512085, -3.995182991027832, -3.7746963500976562, -3.5542101860046387, -3.333723545074463, -3.113237142562866, -2.8927507400512695, -2.672264337539673, -2.451777935028076, -2.2312917709350586, -2.010805130004883, -1.7903188467025757, -1.5698325634002686, -1.3493461608886719, -1.1288597583770752, -0.9083734154701233, -0.6878870129585266, -0.4674006700515747, -0.24691426753997803, -0.026427865028381348, 0.19405853748321533, 0.414544939994812, 0.6350313425064087, 0.8555176854133606, 1.0760040283203125, 1.2964904308319092, 1.5169768333435059, 1.7374632358551025, 1.9579496383666992]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 12.0, 12.0, 5.0, 10.0, 21.0, 22.0, 32.0, 44.0, 47.0, 49.0, 55.0, 69.0, 73.0, 63.0, 57.0, 58.0, 55.0, 44.0, 47.0, 41.0, 36.0, 35.0, 21.0, 27.0, 17.0, 17.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.251816749572754, -1.1966667175292969, -1.1415166854858398, -1.0863665342330933, -1.0312165021896362, -0.9760664701461792, -0.9209163784980774, -0.8657662868499756, -0.8106162548065186, -0.7554662227630615, -0.7003161311149597, -0.6451660394668579, -0.5900160074234009, -0.5348659753799438, -0.47971588373184204, -0.4245658218860626, -0.3694157600402832, -0.3142656981945038, -0.25911563634872437, -0.20396557450294495, -0.14881551265716553, -0.09366545081138611, -0.03851538896560669, 0.01663467288017273, 0.07178473472595215, 0.12693479657173157, 0.182084858417511, 0.2372349202632904, 0.2923849821090698, 0.34753504395484924, 0.40268510580062866, 0.4578351676464081, 0.5129852294921875, 0.5681352615356445, 0.6232853531837463, 0.6784354448318481, 0.7335854768753052, 0.7887355089187622, 0.843885600566864, 0.8990356922149658, 0.9541857242584229, 1.0093357563018799, 1.064485788345337, 1.1196359395980835, 1.1747859716415405, 1.2299360036849976, 1.2850861549377441, 1.3402361869812012, 1.3953862190246582, 1.4505362510681152, 1.5056862831115723, 1.5608364343643188, 1.6159864664077759, 1.671136498451233, 1.7262866497039795, 1.7814366817474365, 1.8365867137908936, 1.8917367458343506, 1.9468867778778076, 2.0020368099212646, 2.057187080383301, 2.112337112426758, 2.167487144470215, 2.222637176513672, 2.277787208557129]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 8.0, 7.0, 16.0, 16.0, 23.0, 35.0, 71.0, 114.0, 220.0, 527.0, 1580.0, 8503.0, 4056540.0, 121050.0, 3924.0, 929.0, 320.0, 161.0, 75.0, 51.0, 38.0, 19.0, 15.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5664443969726562, -0.5445098876953125, -0.5225753784179688, -0.500640869140625, -0.47870635986328125, -0.4567718505859375, -0.43483734130859375, -0.41290283203125, -0.39096832275390625, -0.3690338134765625, -0.34709930419921875, -0.325164794921875, -0.30323028564453125, -0.2812957763671875, -0.25936126708984375, -0.2374267578125, -0.21549224853515625, -0.1935577392578125, -0.17162322998046875, -0.149688720703125, -0.12775421142578125, -0.1058197021484375, -0.08388519287109375, -0.06195068359375, -0.04001617431640625, -0.0180816650390625, 0.00385284423828125, 0.025787353515625, 0.04772186279296875, 0.0696563720703125, 0.09159088134765625, 0.113525390625, 0.13545989990234375, 0.1573944091796875, 0.17932891845703125, 0.201263427734375, 0.22319793701171875, 0.2451324462890625, 0.26706695556640625, 0.28900146484375, 0.31093597412109375, 0.3328704833984375, 0.35480499267578125, 0.376739501953125, 0.39867401123046875, 0.4206085205078125, 0.44254302978515625, 0.4644775390625, 0.48641204833984375, 0.5083465576171875, 0.5302810668945312, 0.552215576171875, 0.5741500854492188, 0.5960845947265625, 0.6180191040039062, 0.63995361328125, 0.6618881225585938, 0.6838226318359375, 0.7057571411132812, 0.727691650390625, 0.7496261596679688, 0.7715606689453125, 0.7934951782226562, 0.8154296875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 15.0, 18.0, 17.0, 53.0, 126.0, 219.0, 245.0, 163.0, 81.0, 27.0, 13.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093017578125, -0.08992671966552734, -0.08683586120605469, -0.08374500274658203, -0.08065414428710938, -0.07756328582763672, -0.07447242736816406, -0.0713815689086914, -0.06829071044921875, -0.0651998519897461, -0.06210899353027344, -0.05901813507080078, -0.055927276611328125, -0.05283641815185547, -0.04974555969238281, -0.046654701232910156, -0.0435638427734375, -0.040472984313964844, -0.03738212585449219, -0.03429126739501953, -0.031200408935546875, -0.02810955047607422, -0.025018692016601562, -0.021927833557128906, -0.01883697509765625, -0.015746116638183594, -0.012655258178710938, -0.009564399719238281, -0.006473541259765625, -0.0033826828002929688, -0.0002918243408203125, 0.0027990341186523438, 0.005889892578125, 0.008980751037597656, 0.012071609497070312, 0.015162467956542969, 0.018253326416015625, 0.02134418487548828, 0.024435043334960938, 0.027525901794433594, 0.03061676025390625, 0.033707618713378906, 0.03679847717285156, 0.03988933563232422, 0.042980194091796875, 0.04607105255126953, 0.04916191101074219, 0.052252769470214844, 0.0553436279296875, 0.058434486389160156, 0.06152534484863281, 0.06461620330810547, 0.06770706176757812, 0.07079792022705078, 0.07388877868652344, 0.0769796371459961, 0.08007049560546875, 0.0831613540649414, 0.08625221252441406, 0.08934307098388672, 0.09243392944335938, 0.09552478790283203, 0.09861564636230469, 0.10170650482177734, 0.10479736328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 3.0, 4.0, 9.0, 16.0, 17.0, 22.0, 34.0, 56.0, 115.0, 222.0, 433.0, 929.0, 2340.0, 9778.0, 192169.0, 3960707.0, 21379.0, 3742.0, 1240.0, 532.0, 222.0, 136.0, 64.0, 33.0, 41.0, 7.0, 8.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48046875, -0.46506500244140625, -0.4496612548828125, -0.43425750732421875, -0.418853759765625, -0.40345001220703125, -0.3880462646484375, -0.37264251708984375, -0.35723876953125, -0.34183502197265625, -0.3264312744140625, -0.31102752685546875, -0.295623779296875, -0.28022003173828125, -0.2648162841796875, -0.24941253662109375, -0.2340087890625, -0.21860504150390625, -0.2032012939453125, -0.18779754638671875, -0.172393798828125, -0.15699005126953125, -0.1415863037109375, -0.12618255615234375, -0.11077880859375, -0.09537506103515625, -0.0799713134765625, -0.06456756591796875, -0.049163818359375, -0.03376007080078125, -0.0183563232421875, -0.00295257568359375, 0.012451171875, 0.02785491943359375, 0.0432586669921875, 0.05866241455078125, 0.074066162109375, 0.08946990966796875, 0.1048736572265625, 0.12027740478515625, 0.13568115234375, 0.15108489990234375, 0.1664886474609375, 0.18189239501953125, 0.197296142578125, 0.21269989013671875, 0.2281036376953125, 0.24350738525390625, 0.2589111328125, 0.27431488037109375, 0.2897186279296875, 0.30512237548828125, 0.320526123046875, 0.33592987060546875, 0.3513336181640625, 0.36673736572265625, 0.38214111328125, 0.39754486083984375, 0.4129486083984375, 0.42835235595703125, 0.443756103515625, 0.45915985107421875, 0.4745635986328125, 0.48996734619140625, 0.50537109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 11.0, 13.0, 25.0, 51.0, 123.0, 719.0, 2718.0, 239.0, 72.0, 30.0, 19.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12194061279296875, -0.1179046630859375, -0.11386871337890625, -0.109832763671875, -0.10579681396484375, -0.1017608642578125, -0.09772491455078125, -0.09368896484375, -0.08965301513671875, -0.0856170654296875, -0.08158111572265625, -0.077545166015625, -0.07350921630859375, -0.0694732666015625, -0.06543731689453125, -0.0614013671875, -0.05736541748046875, -0.0533294677734375, -0.04929351806640625, -0.045257568359375, -0.04122161865234375, -0.0371856689453125, -0.03314971923828125, -0.02911376953125, -0.02507781982421875, -0.0210418701171875, -0.01700592041015625, -0.012969970703125, -0.00893402099609375, -0.0048980712890625, -0.00086212158203125, 0.003173828125, 0.00720977783203125, 0.0112457275390625, 0.01528167724609375, 0.019317626953125, 0.02335357666015625, 0.0273895263671875, 0.03142547607421875, 0.03546142578125, 0.03949737548828125, 0.0435333251953125, 0.04756927490234375, 0.051605224609375, 0.05564117431640625, 0.0596771240234375, 0.06371307373046875, 0.0677490234375, 0.07178497314453125, 0.0758209228515625, 0.07985687255859375, 0.083892822265625, 0.08792877197265625, 0.0919647216796875, 0.09600067138671875, 0.10003662109375, 0.10407257080078125, 0.1081085205078125, 0.11214447021484375, 0.116180419921875, 0.12021636962890625, 0.1242523193359375, 0.12828826904296875, 0.13232421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 19.0, 194.0, 723.0, 54.0, 13.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944915771484375, -2.886420726776123, -2.82792592048645, -2.7694308757781982, -2.7109360694885254, -2.6524410247802734, -2.5939462184906006, -2.5354511737823486, -2.476956367492676, -2.418461322784424, -2.359966516494751, -2.301471471786499, -2.242976665496826, -2.184481620788574, -2.1259868144989014, -2.0674917697906494, -2.0089969635009766, -1.9505020380020142, -1.8920071125030518, -1.8335121870040894, -1.775017261505127, -1.7165223360061646, -1.6580274105072021, -1.5995323657989502, -1.5410373210906982, -1.4825423955917358, -1.4240474700927734, -1.365552544593811, -1.3070576190948486, -1.2485626935958862, -1.1900677680969238, -1.1315727233886719, -1.073077917098999, -1.0145829916000366, -0.9560880661010742, -0.8975931406021118, -0.8390982151031494, -0.780603289604187, -0.7221083045005798, -0.6636133790016174, -0.605118453502655, -0.5466235280036926, -0.4881286025047302, -0.42963364720344543, -0.37113872170448303, -0.31264379620552063, -0.25414884090423584, -0.19565391540527344, -0.13715898990631104, -0.07866405695676804, -0.020169124007225037, 0.03832581639289856, 0.09682074189186096, 0.15531566739082336, 0.21381062269210815, 0.27230554819107056, 0.33080047369003296, 0.38929539918899536, 0.44779032468795776, 0.5062853097915649, 0.5647802352905273, 0.6232751607894897, 0.6817700862884521, 0.7402650117874146, 0.798759937286377]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 2.0, 10.0, 15.0, 12.0, 12.0, 19.0, 23.0, 26.0, 21.0, 36.0, 42.0, 41.0, 41.0, 38.0, 51.0, 54.0, 54.0, 48.0, 59.0, 58.0, 49.0, 31.0, 31.0, 45.0, 43.0, 15.0, 18.0, 19.0, 15.0, 16.0, 7.0, 12.0, 13.0, 8.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2920803427696228, -0.2838532328605652, -0.27562612295150757, -0.26739904284477234, -0.2591719329357147, -0.2509448230266571, -0.24271772801876068, -0.23449063301086426, -0.22626352310180664, -0.21803641319274902, -0.2098093181848526, -0.20158222317695618, -0.19335511326789856, -0.18512800335884094, -0.17690090835094452, -0.1686738133430481, -0.16044670343399048, -0.15221959352493286, -0.14399249851703644, -0.13576540350914001, -0.1275382936000824, -0.11931119114160538, -0.11108408868312836, -0.10285698622465134, -0.09462988376617432, -0.0864027813076973, -0.07817567884922028, -0.06994857639074326, -0.061721473932266235, -0.053494371473789215, -0.045267269015312195, -0.037040166556835175, -0.028813064098358154, -0.020585961639881134, -0.012358859181404114, -0.0041317567229270935, 0.004095345735549927, 0.012322448194026947, 0.020549550652503967, 0.028776653110980988, 0.03700375556945801, 0.04523085802793503, 0.05345796048641205, 0.06168506294488907, 0.06991216540336609, 0.07813926786184311, 0.08636637032032013, 0.09459347277879715, 0.10282057523727417, 0.11104767769575119, 0.11927478015422821, 0.12750187516212463, 0.13572898507118225, 0.14395609498023987, 0.1521831899881363, 0.16041028499603271, 0.16863739490509033, 0.17686450481414795, 0.18509159982204437, 0.1933186948299408, 0.2015458047389984, 0.20977291464805603, 0.21800000965595245, 0.22622710466384888, 0.2344542145729065]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 19.0, 14.0, 27.0, 38.0, 44.0, 56.0, 90.0, 118.0, 157.0, 241.0, 380.0, 603.0, 990.0, 2230.0, 7859.0, 68327.0, 825119.0, 125418.0, 11039.0, 2683.0, 1185.0, 619.0, 378.0, 275.0, 176.0, 121.0, 92.0, 68.0, 49.0, 34.0, 24.0, 17.0, 14.0, 6.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.25162506103515625, -0.2425079345703125, -0.23339080810546875, -0.224273681640625, -0.21515655517578125, -0.2060394287109375, -0.19692230224609375, -0.18780517578125, -0.17868804931640625, -0.1695709228515625, -0.16045379638671875, -0.151336669921875, -0.14221954345703125, -0.1331024169921875, -0.12398529052734375, -0.1148681640625, -0.10575103759765625, -0.0966339111328125, -0.08751678466796875, -0.078399658203125, -0.06928253173828125, -0.0601654052734375, -0.05104827880859375, -0.04193115234375, -0.03281402587890625, -0.0236968994140625, -0.01457977294921875, -0.005462646484375, 0.00365447998046875, 0.0127716064453125, 0.02188873291015625, 0.031005859375, 0.04012298583984375, 0.0492401123046875, 0.05835723876953125, 0.067474365234375, 0.07659149169921875, 0.0857086181640625, 0.09482574462890625, 0.10394287109375, 0.11305999755859375, 0.1221771240234375, 0.13129425048828125, 0.140411376953125, 0.14952850341796875, 0.1586456298828125, 0.16776275634765625, 0.1768798828125, 0.18599700927734375, 0.1951141357421875, 0.20423126220703125, 0.213348388671875, 0.22246551513671875, 0.2315826416015625, 0.24069976806640625, 0.24981689453125, 0.25893402099609375, 0.2680511474609375, 0.27716827392578125, 0.286285400390625, 0.29540252685546875, 0.3045196533203125, 0.31363677978515625, 0.32275390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 6.0, 20.0, 9.0, 26.0, 68.0, 127.0, 222.0, 234.0, 144.0, 82.0, 36.0, 9.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09480094909667969, -0.09164047241210938, -0.08847999572753906, -0.08531951904296875, -0.08215904235839844, -0.07899856567382812, -0.07583808898925781, -0.0726776123046875, -0.06951713562011719, -0.06635665893554688, -0.06319618225097656, -0.06003570556640625, -0.05687522888183594, -0.053714752197265625, -0.05055427551269531, -0.047393798828125, -0.04423332214355469, -0.041072845458984375, -0.03791236877441406, -0.03475189208984375, -0.03159141540527344, -0.028430938720703125, -0.025270462036132812, -0.0221099853515625, -0.018949508666992188, -0.015789031982421875, -0.012628555297851562, -0.00946807861328125, -0.0063076019287109375, -0.003147125244140625, 1.33514404296875e-05, 0.003173828125, 0.0063343048095703125, 0.009494781494140625, 0.012655258178710938, 0.01581573486328125, 0.018976211547851562, 0.022136688232421875, 0.025297164916992188, 0.0284576416015625, 0.03161811828613281, 0.034778594970703125, 0.03793907165527344, 0.04109954833984375, 0.04426002502441406, 0.047420501708984375, 0.05058097839355469, 0.053741455078125, 0.05690193176269531, 0.060062408447265625, 0.06322288513183594, 0.06638336181640625, 0.06954383850097656, 0.07270431518554688, 0.07586479187011719, 0.0790252685546875, 0.08218574523925781, 0.08534622192382812, 0.08850669860839844, 0.09166717529296875, 0.09482765197753906, 0.09798812866210938, 0.10114860534667969, 0.10430908203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 11.0, 12.0, 16.0, 27.0, 27.0, 39.0, 86.0, 124.0, 264.0, 489.0, 965.0, 2391.0, 7433.0, 43299.0, 760428.0, 209280.0, 16509.0, 4095.0, 1512.0, 694.0, 349.0, 191.0, 95.0, 81.0, 35.0, 32.0, 13.0, 11.0, 15.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.34722137451171875, -0.3355560302734375, -0.32389068603515625, -0.312225341796875, -0.30055999755859375, -0.2888946533203125, -0.27722930908203125, -0.26556396484375, -0.25389862060546875, -0.2422332763671875, -0.23056793212890625, -0.218902587890625, -0.20723724365234375, -0.1955718994140625, -0.18390655517578125, -0.1722412109375, -0.16057586669921875, -0.1489105224609375, -0.13724517822265625, -0.125579833984375, -0.11391448974609375, -0.1022491455078125, -0.09058380126953125, -0.07891845703125, -0.06725311279296875, -0.0555877685546875, -0.04392242431640625, -0.032257080078125, -0.02059173583984375, -0.0089263916015625, 0.00273895263671875, 0.014404296875, 0.02606964111328125, 0.0377349853515625, 0.04940032958984375, 0.061065673828125, 0.07273101806640625, 0.0843963623046875, 0.09606170654296875, 0.10772705078125, 0.11939239501953125, 0.1310577392578125, 0.14272308349609375, 0.154388427734375, 0.16605377197265625, 0.1777191162109375, 0.18938446044921875, 0.2010498046875, 0.21271514892578125, 0.2243804931640625, 0.23604583740234375, 0.247711181640625, 0.25937652587890625, 0.2710418701171875, 0.28270721435546875, 0.29437255859375, 0.30603790283203125, 0.3177032470703125, 0.32936859130859375, 0.341033935546875, 0.35269927978515625, 0.3643646240234375, 0.37602996826171875, 0.3876953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 12.0, 19.0, 18.0, 29.0, 32.0, 33.0, 52.0, 48.0, 54.0, 64.0, 62.0, 72.0, 65.0, 72.0, 52.0, 45.0, 42.0, 37.0, 32.0, 20.0, 27.0, 19.0, 21.0, 12.0, 8.0, 5.0, 12.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.29052734375, -0.28219032287597656, -0.2738533020019531, -0.2655162811279297, -0.25717926025390625, -0.2488422393798828, -0.24050521850585938, -0.23216819763183594, -0.2238311767578125, -0.21549415588378906, -0.20715713500976562, -0.1988201141357422, -0.19048309326171875, -0.1821460723876953, -0.17380905151367188, -0.16547203063964844, -0.157135009765625, -0.14879798889160156, -0.14046096801757812, -0.1321239471435547, -0.12378692626953125, -0.11544990539550781, -0.10711288452148438, -0.09877586364746094, -0.0904388427734375, -0.08210182189941406, -0.07376480102539062, -0.06542778015136719, -0.05709075927734375, -0.04875373840332031, -0.040416717529296875, -0.03207969665527344, -0.02374267578125, -0.015405654907226562, -0.007068634033203125, 0.0012683868408203125, 0.00960540771484375, 0.017942428588867188, 0.026279449462890625, 0.03461647033691406, 0.0429534912109375, 0.05129051208496094, 0.059627532958984375, 0.06796455383300781, 0.07630157470703125, 0.08463859558105469, 0.09297561645507812, 0.10131263732910156, 0.109649658203125, 0.11798667907714844, 0.12632369995117188, 0.1346607208251953, 0.14299774169921875, 0.1513347625732422, 0.15967178344726562, 0.16800880432128906, 0.1763458251953125, 0.18468284606933594, 0.19301986694335938, 0.2013568878173828, 0.20969390869140625, 0.2180309295654297, 0.22636795043945312, 0.23470497131347656, 0.2430419921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 12.0, 12.0, 22.0, 26.0, 44.0, 61.0, 79.0, 112.0, 182.0, 236.0, 378.0, 696.0, 1607.0, 4612.0, 52068.0, 974863.0, 8616.0, 2466.0, 1010.0, 499.0, 272.0, 187.0, 126.0, 98.0, 66.0, 55.0, 40.0, 34.0, 15.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.394775390625, -0.38126373291015625, -0.3677520751953125, -0.35424041748046875, -0.340728759765625, -0.32721710205078125, -0.3137054443359375, -0.30019378662109375, -0.28668212890625, -0.27317047119140625, -0.2596588134765625, -0.24614715576171875, -0.232635498046875, -0.21912384033203125, -0.2056121826171875, -0.19210052490234375, -0.1785888671875, -0.16507720947265625, -0.1515655517578125, -0.13805389404296875, -0.124542236328125, -0.11103057861328125, -0.0975189208984375, -0.08400726318359375, -0.07049560546875, -0.05698394775390625, -0.0434722900390625, -0.02996063232421875, -0.016448974609375, -0.00293731689453125, 0.0105743408203125, 0.02408599853515625, 0.03759765625, 0.05110931396484375, 0.0646209716796875, 0.07813262939453125, 0.091644287109375, 0.10515594482421875, 0.1186676025390625, 0.13217926025390625, 0.14569091796875, 0.15920257568359375, 0.1727142333984375, 0.18622589111328125, 0.199737548828125, 0.21324920654296875, 0.2267608642578125, 0.24027252197265625, 0.2537841796875, 0.26729583740234375, 0.2808074951171875, 0.29431915283203125, 0.307830810546875, 0.32134246826171875, 0.3348541259765625, 0.34836578369140625, 0.36187744140625, 0.37538909912109375, 0.3889007568359375, 0.40241241455078125, 0.415924072265625, 0.42943572998046875, 0.4429473876953125, 0.45645904541015625, 0.469970703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 6.0, 9.0, 9.0, 6.0, 10.0, 15.0, 9.0, 20.0, 32.0, 33.0, 37.0, 37.0, 43.0, 69.0, 100.0, 92.0, 82.0, 54.0, 62.0, 57.0, 37.0, 32.0, 26.0, 24.0, 18.0, 18.0, 15.0, 8.0, 3.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.125471115112305e-05, -8.846446871757507e-05, -8.56742262840271e-05, -8.288398385047913e-05, -8.009374141693115e-05, -7.730349898338318e-05, -7.45132565498352e-05, -7.172301411628723e-05, -6.893277168273926e-05, -6.614252924919128e-05, -6.335228681564331e-05, -6.056204438209534e-05, -5.777180194854736e-05, -5.498155951499939e-05, -5.2191317081451416e-05, -4.940107464790344e-05, -4.661083221435547e-05, -4.3820589780807495e-05, -4.103034734725952e-05, -3.824010491371155e-05, -3.5449862480163574e-05, -3.26596200466156e-05, -2.9869377613067627e-05, -2.7079135179519653e-05, -2.428889274597168e-05, -2.1498650312423706e-05, -1.8708407878875732e-05, -1.591816544532776e-05, -1.3127923011779785e-05, -1.0337680578231812e-05, -7.547438144683838e-06, -4.757195711135864e-06, -1.9669532775878906e-06, 8.23289155960083e-07, 3.6135315895080566e-06, 6.40377402305603e-06, 9.194016456604004e-06, 1.1984258890151978e-05, 1.4774501323699951e-05, 1.7564743757247925e-05, 2.03549861907959e-05, 2.3145228624343872e-05, 2.5935471057891846e-05, 2.872571349143982e-05, 3.151595592498779e-05, 3.4306198358535767e-05, 3.709644079208374e-05, 3.9886683225631714e-05, 4.267692565917969e-05, 4.546716809272766e-05, 4.8257410526275635e-05, 5.104765295982361e-05, 5.383789539337158e-05, 5.6628137826919556e-05, 5.941838026046753e-05, 6.22086226940155e-05, 6.499886512756348e-05, 6.778910756111145e-05, 7.057934999465942e-05, 7.33695924282074e-05, 7.615983486175537e-05, 7.895007729530334e-05, 8.174031972885132e-05, 8.453056216239929e-05, 8.732080459594727e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 6.0, 11.0, 10.0, 13.0, 5.0, 23.0, 21.0, 23.0, 30.0, 48.0, 63.0, 111.0, 194.0, 322.0, 695.0, 1476.0, 3702.0, 12068.0, 178932.0, 817142.0, 24037.0, 5429.0, 2139.0, 890.0, 439.0, 247.0, 151.0, 79.0, 66.0, 42.0, 40.0, 27.0, 17.0, 9.0, 12.0, 5.0, 4.0, 8.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1595458984375, -0.15367889404296875, -0.1478118896484375, -0.14194488525390625, -0.136077880859375, -0.13021087646484375, -0.1243438720703125, -0.11847686767578125, -0.11260986328125, -0.10674285888671875, -0.1008758544921875, -0.09500885009765625, -0.089141845703125, -0.08327484130859375, -0.0774078369140625, -0.07154083251953125, -0.065673828125, -0.05980682373046875, -0.0539398193359375, -0.04807281494140625, -0.042205810546875, -0.03633880615234375, -0.0304718017578125, -0.02460479736328125, -0.01873779296875, -0.01287078857421875, -0.0070037841796875, -0.00113677978515625, 0.004730224609375, 0.01059722900390625, 0.0164642333984375, 0.02233123779296875, 0.0281982421875, 0.03406524658203125, 0.0399322509765625, 0.04579925537109375, 0.051666259765625, 0.05753326416015625, 0.0634002685546875, 0.06926727294921875, 0.07513427734375, 0.08100128173828125, 0.0868682861328125, 0.09273529052734375, 0.098602294921875, 0.10446929931640625, 0.1103363037109375, 0.11620330810546875, 0.1220703125, 0.12793731689453125, 0.1338043212890625, 0.13967132568359375, 0.145538330078125, 0.15140533447265625, 0.1572723388671875, 0.16313934326171875, 0.16900634765625, 0.17487335205078125, 0.1807403564453125, 0.18660736083984375, 0.192474365234375, 0.19834136962890625, 0.2042083740234375, 0.21007537841796875, 0.2159423828125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 11.0, 27.0, 52.0, 161.0, 264.0, 230.0, 123.0, 55.0, 24.0, 10.0, 5.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3033027648925781, -0.29508209228515625, -0.2868614196777344, -0.2786407470703125, -0.2704200744628906, -0.26219940185546875, -0.2539787292480469, -0.245758056640625, -0.23753738403320312, -0.22931671142578125, -0.22109603881835938, -0.2128753662109375, -0.20465469360351562, -0.19643402099609375, -0.18821334838867188, -0.17999267578125, -0.17177200317382812, -0.16355133056640625, -0.15533065795898438, -0.1471099853515625, -0.13888931274414062, -0.13066864013671875, -0.12244796752929688, -0.114227294921875, -0.10600662231445312, -0.09778594970703125, -0.08956527709960938, -0.0813446044921875, -0.07312393188476562, -0.06490325927734375, -0.056682586669921875, -0.0484619140625, -0.040241241455078125, -0.03202056884765625, -0.023799896240234375, -0.0155792236328125, -0.007358551025390625, 0.00086212158203125, 0.009082794189453125, 0.017303466796875, 0.025524139404296875, 0.03374481201171875, 0.041965484619140625, 0.0501861572265625, 0.058406829833984375, 0.06662750244140625, 0.07484817504882812, 0.08306884765625, 0.09128952026367188, 0.09951019287109375, 0.10773086547851562, 0.1159515380859375, 0.12417221069335938, 0.13239288330078125, 0.14061355590820312, 0.148834228515625, 0.15705490112304688, 0.16527557373046875, 0.17349624633789062, 0.1817169189453125, 0.18993759155273438, 0.19815826416015625, 0.20637893676757812, 0.214599609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 15.0, 40.0, 111.0, 333.0, 337.0, 108.0, 31.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.772488594055176, -4.659119606018066, -4.545750617980957, -4.432381629943848, -4.319012641906738, -4.205643653869629, -4.0922746658325195, -3.97890567779541, -3.865536689758301, -3.7521677017211914, -3.638798713684082, -3.5254297256469727, -3.4120607376098633, -3.298691749572754, -3.1853227615356445, -3.071953773498535, -2.958585023880005, -2.8452160358428955, -2.731847047805786, -2.6184780597686768, -2.5051090717315674, -2.391740083694458, -2.2783713340759277, -2.1650023460388184, -2.051633358001709, -1.9382643699645996, -1.8248953819274902, -1.7115263938903809, -1.5981574058532715, -1.484788417816162, -1.3714195489883423, -1.258050560951233, -1.144681692123413, -1.0313127040863037, -0.9179437160491943, -0.8045747876167297, -0.6912057995796204, -0.577836811542511, -0.4644678831100464, -0.351098895072937, -0.23772990703582764, -0.12436093389987946, -0.010991960763931274, 0.10237699747085571, 0.2157459855079651, 0.32911497354507446, 0.44248390197753906, 0.5558528900146484, 0.6692218780517578, 0.7825908660888672, 0.8959598541259766, 1.009328842163086, 1.1226978302001953, 1.2360668182373047, 1.3494356870651245, 1.4628046751022339, 1.5761736631393433, 1.6895426511764526, 1.802911639213562, 1.9162805080413818, 2.029649496078491, 2.1430184841156006, 2.25638747215271, 2.3697564601898193, 2.4831254482269287]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 17.0, 19.0, 28.0, 25.0, 38.0, 36.0, 47.0, 47.0, 57.0, 70.0, 55.0, 52.0, 49.0, 51.0, 39.0, 53.0, 50.0, 47.0, 39.0, 22.0, 20.0, 15.0, 17.0, 11.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5680876970291138, -1.5160160064697266, -1.4639441967010498, -1.411872386932373, -1.3598006963729858, -1.3077290058135986, -1.2556571960449219, -1.2035853862762451, -1.151513695716858, -1.0994420051574707, -1.047370195388794, -0.995298445224762, -0.94322669506073, -0.891154944896698, -0.839083194732666, -0.787011444568634, -0.734939694404602, -0.6828679442405701, -0.6307961940765381, -0.5787244439125061, -0.5266526937484741, -0.47458094358444214, -0.42250919342041016, -0.3704374432563782, -0.3183656930923462, -0.2662939429283142, -0.21422219276428223, -0.16215044260025024, -0.11007869243621826, -0.05800694227218628, -0.005935192108154297, 0.046136558055877686, 0.09820842742919922, 0.1502801775932312, 0.20235192775726318, 0.25442367792129517, 0.30649542808532715, 0.35856717824935913, 0.4106389284133911, 0.4627106785774231, 0.5147824287414551, 0.5668541789054871, 0.618925929069519, 0.670997679233551, 0.723069429397583, 0.775141179561615, 0.827212929725647, 0.879284679889679, 0.9313564300537109, 0.9834281802177429, 1.035499930381775, 1.087571620941162, 1.1396434307098389, 1.1917152404785156, 1.2437869310379028, 1.29585862159729, 1.3479304313659668, 1.4000022411346436, 1.4520739316940308, 1.504145622253418, 1.5562174320220947, 1.6082892417907715, 1.6603609323501587, 1.712432622909546, 1.7645044326782227]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 21.0, 23.0, 54.0, 102.0, 258.0, 848.0, 6127.0, 4109695.0, 74126.0, 2219.0, 479.0, 154.0, 60.0, 49.0, 28.0, 7.0, 19.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7734375, -0.7498550415039062, -0.7262725830078125, -0.7026901245117188, -0.679107666015625, -0.6555252075195312, -0.6319427490234375, -0.6083602905273438, -0.58477783203125, -0.5611953735351562, -0.5376129150390625, -0.5140304565429688, -0.490447998046875, -0.46686553955078125, -0.4432830810546875, -0.41970062255859375, -0.3961181640625, -0.37253570556640625, -0.3489532470703125, -0.32537078857421875, -0.301788330078125, -0.27820587158203125, -0.2546234130859375, -0.23104095458984375, -0.20745849609375, -0.18387603759765625, -0.1602935791015625, -0.13671112060546875, -0.113128662109375, -0.08954620361328125, -0.0659637451171875, -0.04238128662109375, -0.018798828125, 0.00478363037109375, 0.0283660888671875, 0.05194854736328125, 0.075531005859375, 0.09911346435546875, 0.1226959228515625, 0.14627838134765625, 0.16986083984375, 0.19344329833984375, 0.2170257568359375, 0.24060821533203125, 0.264190673828125, 0.28777313232421875, 0.3113555908203125, 0.33493804931640625, 0.3585205078125, 0.38210296630859375, 0.4056854248046875, 0.42926788330078125, 0.452850341796875, 0.47643280029296875, 0.5000152587890625, 0.5235977172851562, 0.54718017578125, 0.5707626342773438, 0.5943450927734375, 0.6179275512695312, 0.641510009765625, 0.6650924682617188, 0.6886749267578125, 0.7122573852539062, 0.73583984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 9.0, 26.0, 43.0, 79.0, 129.0, 216.0, 181.0, 150.0, 73.0, 38.0, 21.0, 8.0, 9.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09136486053466797, -0.08830833435058594, -0.0852518081665039, -0.08219528198242188, -0.07913875579833984, -0.07608222961425781, -0.07302570343017578, -0.06996917724609375, -0.06691265106201172, -0.06385612487792969, -0.060799598693847656, -0.057743072509765625, -0.054686546325683594, -0.05163002014160156, -0.04857349395751953, -0.0455169677734375, -0.04246044158935547, -0.03940391540527344, -0.036347389221191406, -0.033290863037109375, -0.030234336853027344, -0.027177810668945312, -0.02412128448486328, -0.02106475830078125, -0.01800823211669922, -0.014951705932617188, -0.011895179748535156, -0.008838653564453125, -0.005782127380371094, -0.0027256011962890625, 0.00033092498779296875, 0.003387451171875, 0.006443977355957031, 0.009500503540039062, 0.012557029724121094, 0.015613555908203125, 0.018670082092285156, 0.021726608276367188, 0.02478313446044922, 0.02783966064453125, 0.03089618682861328, 0.03395271301269531, 0.037009239196777344, 0.040065765380859375, 0.043122291564941406, 0.04617881774902344, 0.04923534393310547, 0.0522918701171875, 0.05534839630126953, 0.05840492248535156, 0.061461448669433594, 0.06451797485351562, 0.06757450103759766, 0.07063102722167969, 0.07368755340576172, 0.07674407958984375, 0.07980060577392578, 0.08285713195800781, 0.08591365814208984, 0.08897018432617188, 0.0920267105102539, 0.09508323669433594, 0.09813976287841797, 0.1011962890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 11.0, 13.0, 23.0, 29.0, 60.0, 89.0, 177.0, 414.0, 1100.0, 4916.0, 153116.0, 4023207.0, 8529.0, 1680.0, 486.0, 221.0, 81.0, 57.0, 37.0, 14.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.970703125, -0.9465179443359375, -0.922332763671875, -0.8981475830078125, -0.87396240234375, -0.8497772216796875, -0.825592041015625, -0.8014068603515625, -0.7772216796875, -0.7530364990234375, -0.728851318359375, -0.7046661376953125, -0.68048095703125, -0.6562957763671875, -0.632110595703125, -0.6079254150390625, -0.583740234375, -0.5595550537109375, -0.535369873046875, -0.5111846923828125, -0.48699951171875, -0.4628143310546875, -0.438629150390625, -0.4144439697265625, -0.3902587890625, -0.3660736083984375, -0.341888427734375, -0.3177032470703125, -0.29351806640625, -0.2693328857421875, -0.245147705078125, -0.2209625244140625, -0.19677734375, -0.1725921630859375, -0.148406982421875, -0.1242218017578125, -0.10003662109375, -0.0758514404296875, -0.051666259765625, -0.0274810791015625, -0.0032958984375, 0.0208892822265625, 0.045074462890625, 0.0692596435546875, 0.09344482421875, 0.1176300048828125, 0.141815185546875, 0.1660003662109375, 0.190185546875, 0.2143707275390625, 0.238555908203125, 0.2627410888671875, 0.28692626953125, 0.3111114501953125, 0.335296630859375, 0.3594818115234375, 0.3836669921875, 0.4078521728515625, 0.432037353515625, 0.4562225341796875, 0.48040771484375, 0.5045928955078125, 0.528778076171875, 0.5529632568359375, 0.5771484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 16.0, 29.0, 69.0, 288.0, 3327.0, 245.0, 46.0, 17.0, 12.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.21020889282226562, -0.20459747314453125, -0.19898605346679688, -0.1933746337890625, -0.18776321411132812, -0.18215179443359375, -0.17654037475585938, -0.170928955078125, -0.16531753540039062, -0.15970611572265625, -0.15409469604492188, -0.1484832763671875, -0.14287185668945312, -0.13726043701171875, -0.13164901733398438, -0.12603759765625, -0.12042617797851562, -0.11481475830078125, -0.10920333862304688, -0.1035919189453125, -0.09798049926757812, -0.09236907958984375, -0.08675765991210938, -0.081146240234375, -0.07553482055664062, -0.06992340087890625, -0.06431198120117188, -0.0587005615234375, -0.053089141845703125, -0.04747772216796875, -0.041866302490234375, -0.0362548828125, -0.030643463134765625, -0.02503204345703125, -0.019420623779296875, -0.0138092041015625, -0.008197784423828125, -0.00258636474609375, 0.003025054931640625, 0.008636474609375, 0.014247894287109375, 0.01985931396484375, 0.025470733642578125, 0.0310821533203125, 0.036693572998046875, 0.04230499267578125, 0.047916412353515625, 0.05352783203125, 0.059139251708984375, 0.06475067138671875, 0.07036209106445312, 0.0759735107421875, 0.08158493041992188, 0.08719635009765625, 0.09280776977539062, 0.098419189453125, 0.10403060913085938, 0.10964202880859375, 0.11525344848632812, 0.1208648681640625, 0.12647628784179688, 0.13208770751953125, 0.13769912719726562, 0.143310546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 10.0, 59.0, 351.0, 524.0, 56.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796971321105957, -1.7426871061325073, -1.6884030103683472, -1.6341187953948975, -1.5798345804214478, -1.5255504846572876, -1.471266269683838, -1.4169821739196777, -1.362697958946228, -1.3084137439727783, -1.2541296482086182, -1.1998454332351685, -1.1455612182617188, -1.0912771224975586, -1.0369929075241089, -0.982708752155304, -0.9284245371818542, -0.8741403818130493, -0.8198561668395996, -0.7655720114707947, -0.7112878561019897, -0.65700364112854, -0.6027194857597351, -0.5484353303909302, -0.49415114521980286, -0.43986696004867554, -0.3855828046798706, -0.3312986195087433, -0.27701443433761597, -0.22273027896881104, -0.16844609379768372, -0.11416193842887878, -0.059877753257751465, -0.005593579262495041, 0.04869059473276138, 0.1029747724533081, 0.15725894272327423, 0.21154311299324036, 0.2658272981643677, 0.3201114535331726, 0.3743956387042999, 0.42867982387542725, 0.4829639792442322, 0.5372481346130371, 0.5915323495864868, 0.6458165049552917, 0.7001006603240967, 0.7543848752975464, 0.8086690306663513, 0.8629531860351562, 0.917237401008606, 0.9715215563774109, 1.0258057117462158, 1.0800899267196655, 1.1343741416931152, 1.1886582374572754, 1.242942452430725, 1.2972266674041748, 1.351510763168335, 1.4057949781417847, 1.4600791931152344, 1.5143632888793945, 1.5686475038528442, 1.622931718826294, 1.677215814590454]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 9.0, 10.0, 11.0, 14.0, 18.0, 31.0, 30.0, 32.0, 39.0, 36.0, 50.0, 52.0, 65.0, 61.0, 60.0, 59.0, 63.0, 53.0, 56.0, 31.0, 41.0, 34.0, 38.0, 16.0, 17.0, 17.0, 7.0, 5.0, 5.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3317965865135193, -0.32152053713798523, -0.31124448776245117, -0.3009684383869171, -0.29069238901138306, -0.2804163098335266, -0.27014029026031494, -0.2598642110824585, -0.24958816170692444, -0.23931211233139038, -0.22903606295585632, -0.21876001358032227, -0.20848394930362701, -0.19820789992809296, -0.1879318505525589, -0.17765578627586365, -0.16737975180149078, -0.15710370242595673, -0.14682765305042267, -0.13655158877372742, -0.12627553939819336, -0.1159994900226593, -0.10572344064712524, -0.09544738382101059, -0.08517133444547653, -0.07489528506994247, -0.06461922824382782, -0.05434317886829376, -0.044067125767469406, -0.03379107266664505, -0.023515023291110992, -0.013238966464996338, -0.0029629170894622803, 0.007313135080039501, 0.017589187249541283, 0.02786523848772049, 0.038141291588544846, 0.0484173446893692, 0.05869339406490326, 0.06896945089101791, 0.07924550026655197, 0.08952154964208603, 0.09979760646820068, 0.11007365584373474, 0.1203497052192688, 0.13062575459480286, 0.14090180397033691, 0.15117786824703217, 0.16145391762256622, 0.17172996699810028, 0.18200601637363434, 0.1922820806503296, 0.20255813002586365, 0.2128341794013977, 0.22311022877693176, 0.23338627815246582, 0.24366232752799988, 0.25393837690353394, 0.264214426279068, 0.27449047565460205, 0.2847665250301361, 0.29504257440567017, 0.3053186535835266, 0.31559470295906067, 0.3258707523345947]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 5.0, 8.0, 9.0, 10.0, 16.0, 17.0, 31.0, 50.0, 73.0, 123.0, 187.0, 303.0, 569.0, 1118.0, 2759.0, 10632.0, 96672.0, 835743.0, 85329.0, 9657.0, 2754.0, 1090.0, 538.0, 325.0, 154.0, 118.0, 75.0, 55.0, 33.0, 27.0, 20.0, 17.0, 8.0, 3.0, 6.0, 1.0, 6.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.255126953125, -0.24511337280273438, -0.23509979248046875, -0.22508621215820312, -0.2150726318359375, -0.20505905151367188, -0.19504547119140625, -0.18503189086914062, -0.175018310546875, -0.16500473022460938, -0.15499114990234375, -0.14497756958007812, -0.1349639892578125, -0.12495040893554688, -0.11493682861328125, -0.10492324829101562, -0.09490966796875, -0.08489608764648438, -0.07488250732421875, -0.06486892700195312, -0.0548553466796875, -0.044841766357421875, -0.03482818603515625, -0.024814605712890625, -0.014801025390625, -0.004787445068359375, 0.00522613525390625, 0.015239715576171875, 0.0252532958984375, 0.035266876220703125, 0.04528045654296875, 0.055294036865234375, 0.0653076171875, 0.07532119750976562, 0.08533477783203125, 0.09534835815429688, 0.1053619384765625, 0.11537551879882812, 0.12538909912109375, 0.13540267944335938, 0.145416259765625, 0.15542984008789062, 0.16544342041015625, 0.17545700073242188, 0.1854705810546875, 0.19548416137695312, 0.20549774169921875, 0.21551132202148438, 0.22552490234375, 0.23553848266601562, 0.24555206298828125, 0.2555656433105469, 0.2655792236328125, 0.2755928039550781, 0.28560638427734375, 0.2956199645996094, 0.305633544921875, 0.3156471252441406, 0.32566070556640625, 0.3356742858886719, 0.3456878662109375, 0.3557014465332031, 0.36571502685546875, 0.3757286071777344, 0.3857421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 6.0, 9.0, 22.0, 30.0, 54.0, 90.0, 171.0, 192.0, 160.0, 131.0, 49.0, 40.0, 18.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0921630859375, -0.08923912048339844, -0.08631515502929688, -0.08339118957519531, -0.08046722412109375, -0.07754325866699219, -0.07461929321289062, -0.07169532775878906, -0.0687713623046875, -0.06584739685058594, -0.06292343139648438, -0.05999946594238281, -0.05707550048828125, -0.05415153503417969, -0.051227569580078125, -0.04830360412597656, -0.045379638671875, -0.04245567321777344, -0.039531707763671875, -0.03660774230957031, -0.03368377685546875, -0.030759811401367188, -0.027835845947265625, -0.024911880493164062, -0.0219879150390625, -0.019063949584960938, -0.016139984130859375, -0.013216018676757812, -0.01029205322265625, -0.0073680877685546875, -0.004444122314453125, -0.0015201568603515625, 0.00140380859375, 0.0043277740478515625, 0.007251739501953125, 0.010175704956054688, 0.01309967041015625, 0.016023635864257812, 0.018947601318359375, 0.021871566772460938, 0.0247955322265625, 0.027719497680664062, 0.030643463134765625, 0.03356742858886719, 0.03649139404296875, 0.03941535949707031, 0.042339324951171875, 0.04526329040527344, 0.048187255859375, 0.05111122131347656, 0.054035186767578125, 0.05695915222167969, 0.05988311767578125, 0.06280708312988281, 0.06573104858398438, 0.06865501403808594, 0.0715789794921875, 0.07450294494628906, 0.07742691040039062, 0.08035087585449219, 0.08327484130859375, 0.08619880676269531, 0.08912277221679688, 0.09204673767089844, 0.094970703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 7.0, 8.0, 16.0, 10.0, 28.0, 19.0, 35.0, 44.0, 61.0, 92.0, 130.0, 199.0, 271.0, 424.0, 753.0, 1477.0, 3296.0, 8694.0, 30525.0, 176676.0, 656045.0, 131086.0, 24951.0, 7484.0, 2881.0, 1344.0, 698.0, 396.0, 286.0, 200.0, 120.0, 84.0, 50.0, 38.0, 26.0, 22.0, 12.0, 11.0, 10.0, 10.0, 7.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.204345703125, -0.1978435516357422, -0.19134140014648438, -0.18483924865722656, -0.17833709716796875, -0.17183494567871094, -0.16533279418945312, -0.1588306427001953, -0.1523284912109375, -0.1458263397216797, -0.13932418823242188, -0.13282203674316406, -0.12631988525390625, -0.11981773376464844, -0.11331558227539062, -0.10681343078613281, -0.100311279296875, -0.09380912780761719, -0.08730697631835938, -0.08080482482910156, -0.07430267333984375, -0.06780052185058594, -0.061298370361328125, -0.05479621887207031, -0.0482940673828125, -0.04179191589355469, -0.035289764404296875, -0.028787612915039062, -0.02228546142578125, -0.015783309936523438, -0.009281158447265625, -0.0027790069580078125, 0.00372314453125, 0.010225296020507812, 0.016727447509765625, 0.023229598999023438, 0.02973175048828125, 0.03623390197753906, 0.042736053466796875, 0.04923820495605469, 0.0557403564453125, 0.06224250793457031, 0.06874465942382812, 0.07524681091308594, 0.08174896240234375, 0.08825111389160156, 0.09475326538085938, 0.10125541687011719, 0.107757568359375, 0.11425971984863281, 0.12076187133789062, 0.12726402282714844, 0.13376617431640625, 0.14026832580566406, 0.14677047729492188, 0.1532726287841797, 0.1597747802734375, 0.1662769317626953, 0.17277908325195312, 0.17928123474121094, 0.18578338623046875, 0.19228553771972656, 0.19878768920898438, 0.2052898406982422, 0.2117919921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 5.0, 7.0, 16.0, 11.0, 16.0, 17.0, 14.0, 17.0, 22.0, 38.0, 24.0, 18.0, 41.0, 24.0, 38.0, 39.0, 39.0, 39.0, 31.0, 42.0, 44.0, 42.0, 42.0, 43.0, 30.0, 34.0, 41.0, 22.0, 31.0, 22.0, 24.0, 20.0, 11.0, 22.0, 14.0, 9.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.177490234375, -0.17191123962402344, -0.16633224487304688, -0.1607532501220703, -0.15517425537109375, -0.1495952606201172, -0.14401626586914062, -0.13843727111816406, -0.1328582763671875, -0.12727928161621094, -0.12170028686523438, -0.11612129211425781, -0.11054229736328125, -0.10496330261230469, -0.09938430786132812, -0.09380531311035156, -0.088226318359375, -0.08264732360839844, -0.07706832885742188, -0.07148933410644531, -0.06591033935546875, -0.06033134460449219, -0.054752349853515625, -0.04917335510253906, -0.0435943603515625, -0.03801536560058594, -0.032436370849609375, -0.026857376098632812, -0.02127838134765625, -0.015699386596679688, -0.010120391845703125, -0.0045413970947265625, 0.00103759765625, 0.0066165924072265625, 0.012195587158203125, 0.017774581909179688, 0.02335357666015625, 0.028932571411132812, 0.034511566162109375, 0.04009056091308594, 0.0456695556640625, 0.05124855041503906, 0.056827545166015625, 0.06240653991699219, 0.06798553466796875, 0.07356452941894531, 0.07914352416992188, 0.08472251892089844, 0.090301513671875, 0.09588050842285156, 0.10145950317382812, 0.10703849792480469, 0.11261749267578125, 0.11819648742675781, 0.12377548217773438, 0.12935447692871094, 0.1349334716796875, 0.14051246643066406, 0.14609146118164062, 0.1516704559326172, 0.15724945068359375, 0.1628284454345703, 0.16840744018554688, 0.17398643493652344, 0.1795654296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 10.0, 11.0, 10.0, 10.0, 31.0, 37.0, 58.0, 86.0, 139.0, 261.0, 537.0, 1189.0, 3098.0, 11869.0, 108733.0, 830764.0, 77292.0, 9568.0, 2643.0, 1074.0, 445.0, 256.0, 140.0, 96.0, 62.0, 41.0, 26.0, 17.0, 9.0, 11.0, 4.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11126708984375, -0.10748767852783203, -0.10370826721191406, -0.0999288558959961, -0.09614944458007812, -0.09237003326416016, -0.08859062194824219, -0.08481121063232422, -0.08103179931640625, -0.07725238800048828, -0.07347297668457031, -0.06969356536865234, -0.06591415405273438, -0.062134742736816406, -0.05835533142089844, -0.05457592010498047, -0.0507965087890625, -0.04701709747314453, -0.04323768615722656, -0.039458274841308594, -0.035678863525390625, -0.031899452209472656, -0.028120040893554688, -0.02434062957763672, -0.02056121826171875, -0.01678180694580078, -0.013002395629882812, -0.009222984313964844, -0.005443572998046875, -0.0016641616821289062, 0.0021152496337890625, 0.005894660949707031, 0.009674072265625, 0.013453483581542969, 0.017232894897460938, 0.021012306213378906, 0.024791717529296875, 0.028571128845214844, 0.03235054016113281, 0.03612995147705078, 0.03990936279296875, 0.04368877410888672, 0.04746818542480469, 0.051247596740722656, 0.055027008056640625, 0.058806419372558594, 0.06258583068847656, 0.06636524200439453, 0.0701446533203125, 0.07392406463623047, 0.07770347595214844, 0.0814828872680664, 0.08526229858398438, 0.08904170989990234, 0.09282112121582031, 0.09660053253173828, 0.10037994384765625, 0.10415935516357422, 0.10793876647949219, 0.11171817779541016, 0.11549758911132812, 0.1192770004272461, 0.12305641174316406, 0.12683582305908203, 0.130615234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 10.0, 8.0, 15.0, 18.0, 19.0, 32.0, 34.0, 52.0, 53.0, 69.0, 97.0, 124.0, 95.0, 78.0, 46.0, 33.0, 29.0, 28.0, 25.0, 20.0, 18.0, 5.0, 11.0, 7.0, 5.0, 10.0, 4.0, 8.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.82012939453125e-05, -7.562246173620224e-05, -7.304362952709198e-05, -7.046479731798172e-05, -6.788596510887146e-05, -6.53071328997612e-05, -6.272830069065094e-05, -6.014946848154068e-05, -5.757063627243042e-05, -5.499180406332016e-05, -5.24129718542099e-05, -4.983413964509964e-05, -4.725530743598938e-05, -4.467647522687912e-05, -4.209764301776886e-05, -3.95188108086586e-05, -3.693997859954834e-05, -3.436114639043808e-05, -3.178231418132782e-05, -2.920348197221756e-05, -2.66246497631073e-05, -2.404581755399704e-05, -2.146698534488678e-05, -1.888815313577652e-05, -1.630932092666626e-05, -1.3730488717556e-05, -1.115165650844574e-05, -8.57282429933548e-06, -5.99399209022522e-06, -3.4151598811149597e-06, -8.363276720046997e-07, 1.7425045371055603e-06, 4.32133674621582e-06, 6.90016895532608e-06, 9.47900116443634e-06, 1.20578333735466e-05, 1.463666558265686e-05, 1.721549779176712e-05, 1.979433000087738e-05, 2.237316220998764e-05, 2.49519944190979e-05, 2.753082662820816e-05, 3.010965883731842e-05, 3.268849104642868e-05, 3.526732325553894e-05, 3.78461554646492e-05, 4.042498767375946e-05, 4.300381988286972e-05, 4.558265209197998e-05, 4.816148430109024e-05, 5.07403165102005e-05, 5.331914871931076e-05, 5.589798092842102e-05, 5.847681313753128e-05, 6.105564534664154e-05, 6.36344775557518e-05, 6.621330976486206e-05, 6.879214197397232e-05, 7.137097418308258e-05, 7.394980639219284e-05, 7.65286386013031e-05, 7.910747081041336e-05, 8.168630301952362e-05, 8.426513522863388e-05, 8.684396743774414e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 11.0, 17.0, 9.0, 19.0, 22.0, 37.0, 40.0, 75.0, 114.0, 133.0, 220.0, 356.0, 590.0, 1177.0, 2397.0, 5347.0, 16255.0, 84129.0, 701185.0, 195141.0, 26965.0, 7887.0, 3018.0, 1385.0, 766.0, 414.0, 236.0, 170.0, 114.0, 79.0, 61.0, 44.0, 30.0, 23.0, 20.0, 16.0, 4.0, 7.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.091552734375, -0.08856868743896484, -0.08558464050292969, -0.08260059356689453, -0.07961654663085938, -0.07663249969482422, -0.07364845275878906, -0.0706644058227539, -0.06768035888671875, -0.0646963119506836, -0.06171226501464844, -0.05872821807861328, -0.055744171142578125, -0.05276012420654297, -0.04977607727050781, -0.046792030334472656, -0.0438079833984375, -0.040823936462402344, -0.03783988952636719, -0.03485584259033203, -0.031871795654296875, -0.02888774871826172, -0.025903701782226562, -0.022919654846191406, -0.01993560791015625, -0.016951560974121094, -0.013967514038085938, -0.010983467102050781, -0.007999420166015625, -0.005015373229980469, -0.0020313262939453125, 0.0009527206420898438, 0.003936767578125, 0.006920814514160156, 0.009904861450195312, 0.012888908386230469, 0.015872955322265625, 0.01885700225830078, 0.021841049194335938, 0.024825096130371094, 0.02780914306640625, 0.030793190002441406, 0.03377723693847656, 0.03676128387451172, 0.039745330810546875, 0.04272937774658203, 0.04571342468261719, 0.048697471618652344, 0.0516815185546875, 0.054665565490722656, 0.05764961242675781, 0.06063365936279297, 0.06361770629882812, 0.06660175323486328, 0.06958580017089844, 0.0725698471069336, 0.07555389404296875, 0.0785379409790039, 0.08152198791503906, 0.08450603485107422, 0.08749008178710938, 0.09047412872314453, 0.09345817565917969, 0.09644222259521484, 0.09942626953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 11.0, 13.0, 20.0, 24.0, 49.0, 75.0, 115.0, 158.0, 174.0, 107.0, 71.0, 52.0, 27.0, 19.0, 10.0, 12.0, 5.0, 6.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.172607421875, -0.16793251037597656, -0.16325759887695312, -0.1585826873779297, -0.15390777587890625, -0.1492328643798828, -0.14455795288085938, -0.13988304138183594, -0.1352081298828125, -0.13053321838378906, -0.12585830688476562, -0.12118339538574219, -0.11650848388671875, -0.11183357238769531, -0.10715866088867188, -0.10248374938964844, -0.097808837890625, -0.09313392639160156, -0.08845901489257812, -0.08378410339355469, -0.07910919189453125, -0.07443428039550781, -0.06975936889648438, -0.06508445739746094, -0.0604095458984375, -0.05573463439941406, -0.051059722900390625, -0.04638481140136719, -0.04170989990234375, -0.03703498840332031, -0.032360076904296875, -0.027685165405273438, -0.02301025390625, -0.018335342407226562, -0.013660430908203125, -0.008985519409179688, -0.00431060791015625, 0.0003643035888671875, 0.005039215087890625, 0.009714126586914062, 0.0143890380859375, 0.019063949584960938, 0.023738861083984375, 0.028413772583007812, 0.03308868408203125, 0.03776359558105469, 0.042438507080078125, 0.04711341857910156, 0.051788330078125, 0.05646324157714844, 0.061138153076171875, 0.06581306457519531, 0.07048797607421875, 0.07516288757324219, 0.07983779907226562, 0.08451271057128906, 0.0891876220703125, 0.09386253356933594, 0.09853744506835938, 0.10321235656738281, 0.10788726806640625, 0.11256217956542969, 0.11723709106445312, 0.12191200256347656, 0.1265869140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 22.0, 73.0, 365.0, 428.0, 86.0, 18.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.296441078186035, -4.186485767364502, -4.076530456542969, -3.9665749073028564, -3.8566195964813232, -3.74666428565979, -3.6367087364196777, -3.5267534255981445, -3.4167981147766113, -3.306842803955078, -3.196887493133545, -3.0869319438934326, -2.9769766330718994, -2.867021322250366, -2.757065773010254, -2.6471104621887207, -2.5371551513671875, -2.4271998405456543, -2.317244529724121, -2.207288980484009, -2.0973336696624756, -1.9873783588409424, -1.8774229288101196, -1.7674674987792969, -1.6575121879577637, -1.5475568771362305, -1.4376014471054077, -1.327646017074585, -1.2176907062530518, -1.1077353954315186, -0.9977799654006958, -0.8878245949745178, -0.7778692245483398, -0.6679138541221619, -0.5579584836959839, -0.4480031132698059, -0.33804774284362793, -0.22809237241744995, -0.11813700199127197, -0.008181631565093994, 0.10177373886108398, 0.21172910928726196, 0.32168447971343994, 0.4316398501396179, 0.5415952205657959, 0.6515505909919739, 0.7615059614181519, 0.8714613318443298, 0.9814167022705078, 1.091372013092041, 1.2013274431228638, 1.3112828731536865, 1.4212381839752197, 1.531193494796753, 1.6411489248275757, 1.7511043548583984, 1.8610596656799316, 1.9710149765014648, 2.080970287322998, 2.1909258365631104, 2.3008811473846436, 2.4108364582061768, 2.520792007446289, 2.6307473182678223, 2.7407026290893555]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 10.0, 19.0, 7.0, 24.0, 27.0, 34.0, 36.0, 23.0, 65.0, 51.0, 39.0, 60.0, 55.0, 65.0, 70.0, 50.0, 48.0, 50.0, 38.0, 39.0, 35.0, 37.0, 19.0, 14.0, 17.0, 17.0, 10.0, 12.0, 10.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.976169228553772, -0.932508111000061, -0.8888469934463501, -0.8451858758926392, -0.8015247583389282, -0.7578636407852173, -0.7142025828361511, -0.6705414652824402, -0.6268803477287292, -0.5832192301750183, -0.5395581126213074, -0.4958970248699188, -0.4522359073162079, -0.40857478976249695, -0.3649137020111084, -0.32125258445739746, -0.2775914669036865, -0.23393034934997559, -0.19026924669742584, -0.1466081440448761, -0.10294702649116516, -0.059285908937454224, -0.015624821186065674, 0.028036296367645264, 0.0716974139213562, 0.11535852402448654, 0.15901963412761688, 0.20268073678016663, 0.24634185433387756, 0.2900029718875885, 0.33366405963897705, 0.377325177192688, 0.4209862947463989, 0.46464741230010986, 0.5083085298538208, 0.5519696474075317, 0.5956307649612427, 0.6392918825149536, 0.6829529404640198, 0.7266140580177307, 0.7702751755714417, 0.8139362931251526, 0.8575974106788635, 0.9012584686279297, 0.9449195861816406, 0.9885807037353516, 1.0322418212890625, 1.0759029388427734, 1.1195640563964844, 1.1632251739501953, 1.2068862915039062, 1.2505474090576172, 1.2942085266113281, 1.337869644165039, 1.38153076171875, 1.425191879272461, 1.4688529968261719, 1.5125141143798828, 1.5561752319335938, 1.5998363494873047, 1.6434974670410156, 1.6871585845947266, 1.7308197021484375, 1.7744808197021484, 1.8181418180465698]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 4.0, 3.0, 12.0, 13.0, 12.0, 23.0, 34.0, 59.0, 87.0, 134.0, 282.0, 526.0, 1290.0, 4424.0, 26498.0, 3661290.0, 477847.0, 16311.0, 3333.0, 1082.0, 446.0, 209.0, 122.0, 83.0, 48.0, 27.0, 26.0, 13.0, 11.0, 11.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.3885231018066406, -0.37738800048828125, -0.3662528991699219, -0.3551177978515625, -0.3439826965332031, -0.33284759521484375, -0.3217124938964844, -0.310577392578125, -0.2994422912597656, -0.28830718994140625, -0.2771720886230469, -0.2660369873046875, -0.2549018859863281, -0.24376678466796875, -0.23263168334960938, -0.22149658203125, -0.21036148071289062, -0.19922637939453125, -0.18809127807617188, -0.1769561767578125, -0.16582107543945312, -0.15468597412109375, -0.14355087280273438, -0.132415771484375, -0.12128067016601562, -0.11014556884765625, -0.09901046752929688, -0.0878753662109375, -0.07674026489257812, -0.06560516357421875, -0.054470062255859375, -0.0433349609375, -0.032199859619140625, -0.02106475830078125, -0.009929656982421875, 0.0012054443359375, 0.012340545654296875, 0.02347564697265625, 0.034610748291015625, 0.045745849609375, 0.056880950927734375, 0.06801605224609375, 0.07915115356445312, 0.0902862548828125, 0.10142135620117188, 0.11255645751953125, 0.12369155883789062, 0.13482666015625, 0.14596176147460938, 0.15709686279296875, 0.16823196411132812, 0.1793670654296875, 0.19050216674804688, 0.20163726806640625, 0.21277236938476562, 0.223907470703125, 0.23504257202148438, 0.24617767333984375, 0.2573127746582031, 0.2684478759765625, 0.2795829772949219, 0.29071807861328125, 0.3018531799316406, 0.31298828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 10.0, 13.0, 19.0, 31.0, 68.0, 122.0, 167.0, 200.0, 146.0, 101.0, 52.0, 31.0, 14.0, 13.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0926513671875, -0.08968544006347656, -0.08671951293945312, -0.08375358581542969, -0.08078765869140625, -0.07782173156738281, -0.07485580444335938, -0.07188987731933594, -0.0689239501953125, -0.06595802307128906, -0.06299209594726562, -0.06002616882324219, -0.05706024169921875, -0.05409431457519531, -0.051128387451171875, -0.04816246032714844, -0.045196533203125, -0.04223060607910156, -0.039264678955078125, -0.03629875183105469, -0.03333282470703125, -0.030366897583007812, -0.027400970458984375, -0.024435043334960938, -0.0214691162109375, -0.018503189086914062, -0.015537261962890625, -0.012571334838867188, -0.00960540771484375, -0.0066394805908203125, -0.003673553466796875, -0.0007076263427734375, 0.00225830078125, 0.0052242279052734375, 0.008190155029296875, 0.011156082153320312, 0.01412200927734375, 0.017087936401367188, 0.020053863525390625, 0.023019790649414062, 0.0259857177734375, 0.028951644897460938, 0.031917572021484375, 0.03488349914550781, 0.03784942626953125, 0.04081535339355469, 0.043781280517578125, 0.04674720764160156, 0.049713134765625, 0.05267906188964844, 0.055644989013671875, 0.05861091613769531, 0.06157684326171875, 0.06454277038574219, 0.06750869750976562, 0.07047462463378906, 0.0734405517578125, 0.07640647888183594, 0.07937240600585938, 0.08233833312988281, 0.08530426025390625, 0.08827018737792969, 0.09123611450195312, 0.09420204162597656, 0.09716796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 14.0, 18.0, 17.0, 31.0, 42.0, 91.0, 148.0, 243.0, 499.0, 1150.0, 3314.0, 15548.0, 226204.0, 3887875.0, 48825.0, 7042.0, 1813.0, 704.0, 307.0, 146.0, 89.0, 50.0, 34.0, 27.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3946342468261719, -0.38375091552734375, -0.3728675842285156, -0.3619842529296875, -0.3511009216308594, -0.34021759033203125, -0.3293342590332031, -0.318450927734375, -0.3075675964355469, -0.29668426513671875, -0.2858009338378906, -0.2749176025390625, -0.2640342712402344, -0.25315093994140625, -0.24226760864257812, -0.23138427734375, -0.22050094604492188, -0.20961761474609375, -0.19873428344726562, -0.1878509521484375, -0.17696762084960938, -0.16608428955078125, -0.15520095825195312, -0.144317626953125, -0.13343429565429688, -0.12255096435546875, -0.11166763305664062, -0.1007843017578125, -0.08990097045898438, -0.07901763916015625, -0.06813430786132812, -0.0572509765625, -0.046367645263671875, -0.03548431396484375, -0.024600982666015625, -0.0137176513671875, -0.002834320068359375, 0.00804901123046875, 0.018932342529296875, 0.029815673828125, 0.040699005126953125, 0.05158233642578125, 0.062465667724609375, 0.0733489990234375, 0.08423233032226562, 0.09511566162109375, 0.10599899291992188, 0.11688232421875, 0.12776565551757812, 0.13864898681640625, 0.14953231811523438, 0.1604156494140625, 0.17129898071289062, 0.18218231201171875, 0.19306564331054688, 0.203948974609375, 0.21483230590820312, 0.22571563720703125, 0.23659896850585938, 0.2474822998046875, 0.2583656311035156, 0.26924896240234375, 0.2801322937011719, 0.291015625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 16.0, 27.0, 52.0, 79.0, 197.0, 816.0, 2258.0, 366.0, 111.0, 57.0, 27.0, 20.0, 11.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.18842697143554688, -0.18386077880859375, -0.17929458618164062, -0.1747283935546875, -0.17016220092773438, -0.16559600830078125, -0.16102981567382812, -0.156463623046875, -0.15189743041992188, -0.14733123779296875, -0.14276504516601562, -0.1381988525390625, -0.13363265991210938, -0.12906646728515625, -0.12450027465820312, -0.11993408203125, -0.11536788940429688, -0.11080169677734375, -0.10623550415039062, -0.1016693115234375, -0.09710311889648438, -0.09253692626953125, -0.08797073364257812, -0.083404541015625, -0.07883834838867188, -0.07427215576171875, -0.06970596313476562, -0.0651397705078125, -0.060573577880859375, -0.05600738525390625, -0.051441192626953125, -0.046875, -0.042308807373046875, -0.03774261474609375, -0.033176422119140625, -0.0286102294921875, -0.024044036865234375, -0.01947784423828125, -0.014911651611328125, -0.010345458984375, -0.005779266357421875, -0.00121307373046875, 0.003353118896484375, 0.0079193115234375, 0.012485504150390625, 0.01705169677734375, 0.021617889404296875, 0.02618408203125, 0.030750274658203125, 0.03531646728515625, 0.039882659912109375, 0.0444488525390625, 0.049015045166015625, 0.05358123779296875, 0.058147430419921875, 0.062713623046875, 0.06727981567382812, 0.07184600830078125, 0.07641220092773438, 0.0809783935546875, 0.08554458618164062, 0.09011077880859375, 0.09467697143554688, 0.0992431640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 12.0, 28.0, 91.0, 184.0, 347.0, 247.0, 61.0, 23.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.449288010597229, -0.418795108795166, -0.38830217719078064, -0.35780927538871765, -0.3273163437843323, -0.2968234419822693, -0.2663305401802063, -0.23583760857582092, -0.20534469187259674, -0.17485177516937256, -0.14435885846614838, -0.11386594921350479, -0.08337303251028061, -0.052880123257637024, -0.022387206554412842, 0.00810571014881134, 0.03859862685203552, 0.0690915435552597, 0.09958446025848389, 0.13007736206054688, 0.16057029366493225, 0.19106319546699524, 0.22155611217021942, 0.2520490288734436, 0.2825419306755066, 0.3130348324775696, 0.34352776408195496, 0.37402066588401794, 0.4045135974884033, 0.4350064992904663, 0.4654994010925293, 0.4959923326969147, 0.5264852643013, 0.556978166103363, 0.587471067905426, 0.6179640293121338, 0.6484569311141968, 0.6789498329162598, 0.7094427347183228, 0.7399356365203857, 0.7704285979270935, 0.8009214997291565, 0.8314144015312195, 0.8619073629379272, 0.8924002647399902, 0.9228931665420532, 0.9533860683441162, 0.9838789701461792, 1.0143718719482422, 1.0448647737503052, 1.0753576755523682, 1.1058505773544312, 1.1363434791564941, 1.1668365001678467, 1.1973294019699097, 1.2278223037719727, 1.2583152055740356, 1.2888081073760986, 1.3193010091781616, 1.3497939109802246, 1.3802868127822876, 1.4107797145843506, 1.4412727355957031, 1.4717656373977661, 1.502258539199829]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 11.0, 12.0, 28.0, 30.0, 38.0, 47.0, 44.0, 73.0, 59.0, 81.0, 75.0, 60.0, 61.0, 61.0, 58.0, 51.0, 45.0, 44.0, 28.0, 36.0, 23.0, 11.0, 9.0, 11.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5464600324630737, -0.5318363308906555, -0.5172126293182373, -0.5025889277458191, -0.4879651963710785, -0.4733414947986603, -0.4587177634239197, -0.44409406185150146, -0.42947036027908325, -0.41484665870666504, -0.4002229571342468, -0.3855992257595062, -0.370975524187088, -0.3563518226146698, -0.3417280912399292, -0.327104389667511, -0.3124806880950928, -0.29785698652267456, -0.28323328495025635, -0.26860955357551575, -0.25398585200309753, -0.23936215043067932, -0.22473843395709991, -0.2101147174835205, -0.1954910159111023, -0.18086731433868408, -0.16624359786510468, -0.15161988139152527, -0.13699617981910706, -0.12237247079610825, -0.10774876177310944, -0.09312505275011063, -0.07850134372711182, -0.063877634704113, -0.0492539256811142, -0.03463021665811539, -0.020006507635116577, -0.005382798612117767, 0.009240910410881042, 0.023864619433879852, 0.03848832845687866, 0.05311203747987747, 0.06773574650287628, 0.08235945552587509, 0.0969831645488739, 0.11160687357187271, 0.12623058259487152, 0.14085429906845093, 0.15547800064086914, 0.17010170221328735, 0.18472541868686676, 0.19934913516044617, 0.21397283673286438, 0.2285965383052826, 0.243220254778862, 0.2578439712524414, 0.2724676728248596, 0.28709137439727783, 0.30171507596969604, 0.31633880734443665, 0.33096250891685486, 0.34558621048927307, 0.36020994186401367, 0.3748336434364319, 0.3894573450088501]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 3.0, 8.0, 8.0, 17.0, 26.0, 36.0, 40.0, 51.0, 79.0, 120.0, 208.0, 337.0, 547.0, 1137.0, 2931.0, 10573.0, 81968.0, 832629.0, 100043.0, 12005.0, 3159.0, 1174.0, 564.0, 310.0, 176.0, 118.0, 83.0, 56.0, 46.0, 21.0, 29.0, 16.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.369384765625, -0.3589897155761719, -0.34859466552734375, -0.3381996154785156, -0.3278045654296875, -0.3174095153808594, -0.30701446533203125, -0.2966194152832031, -0.286224365234375, -0.2758293151855469, -0.26543426513671875, -0.2550392150878906, -0.2446441650390625, -0.23424911499023438, -0.22385406494140625, -0.21345901489257812, -0.20306396484375, -0.19266891479492188, -0.18227386474609375, -0.17187881469726562, -0.1614837646484375, -0.15108871459960938, -0.14069366455078125, -0.13029861450195312, -0.119903564453125, -0.10950851440429688, -0.09911346435546875, -0.08871841430664062, -0.0783233642578125, -0.06792831420898438, -0.05753326416015625, -0.047138214111328125, -0.0367431640625, -0.026348114013671875, -0.01595306396484375, -0.005558013916015625, 0.0048370361328125, 0.015232086181640625, 0.02562713623046875, 0.036022186279296875, 0.046417236328125, 0.056812286376953125, 0.06720733642578125, 0.07760238647460938, 0.0879974365234375, 0.09839248657226562, 0.10878753662109375, 0.11918258666992188, 0.12957763671875, 0.13997268676757812, 0.15036773681640625, 0.16076278686523438, 0.1711578369140625, 0.18155288696289062, 0.19194793701171875, 0.20234298706054688, 0.212738037109375, 0.22313308715820312, 0.23352813720703125, 0.24392318725585938, 0.2543182373046875, 0.2647132873535156, 0.27510833740234375, 0.2855033874511719, 0.2958984375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 12.0, 8.0, 13.0, 16.0, 34.0, 68.0, 110.0, 169.0, 201.0, 148.0, 88.0, 61.0, 40.0, 13.0, 9.0, 7.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.0936279296875, -0.09063720703125, -0.087646484375, -0.08465576171875, -0.0816650390625, -0.07867431640625, -0.07568359375, -0.07269287109375, -0.0697021484375, -0.06671142578125, -0.063720703125, -0.06072998046875, -0.0577392578125, -0.05474853515625, -0.0517578125, -0.04876708984375, -0.0457763671875, -0.04278564453125, -0.039794921875, -0.03680419921875, -0.0338134765625, -0.03082275390625, -0.02783203125, -0.02484130859375, -0.0218505859375, -0.01885986328125, -0.015869140625, -0.01287841796875, -0.0098876953125, -0.00689697265625, -0.00390625, -0.00091552734375, 0.0020751953125, 0.00506591796875, 0.008056640625, 0.01104736328125, 0.0140380859375, 0.01702880859375, 0.02001953125, 0.02301025390625, 0.0260009765625, 0.02899169921875, 0.031982421875, 0.03497314453125, 0.0379638671875, 0.04095458984375, 0.0439453125, 0.04693603515625, 0.0499267578125, 0.05291748046875, 0.055908203125, 0.05889892578125, 0.0618896484375, 0.06488037109375, 0.06787109375, 0.07086181640625, 0.0738525390625, 0.07684326171875, 0.079833984375, 0.08282470703125, 0.0858154296875, 0.08880615234375, 0.091796875, 0.09478759765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 16.0, 12.0, 15.0, 15.0, 27.0, 34.0, 60.0, 67.0, 111.0, 170.0, 217.0, 399.0, 631.0, 1133.0, 2114.0, 4385.0, 11041.0, 33562.0, 159299.0, 641184.0, 142587.0, 31508.0, 10584.0, 4347.0, 2164.0, 1084.0, 652.0, 370.0, 225.0, 153.0, 120.0, 75.0, 58.0, 36.0, 31.0, 16.0, 13.0, 14.0, 4.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.211181640625, -0.20554542541503906, -0.19990921020507812, -0.1942729949951172, -0.18863677978515625, -0.1830005645751953, -0.17736434936523438, -0.17172813415527344, -0.1660919189453125, -0.16045570373535156, -0.15481948852539062, -0.1491832733154297, -0.14354705810546875, -0.1379108428955078, -0.13227462768554688, -0.12663841247558594, -0.121002197265625, -0.11536598205566406, -0.10972976684570312, -0.10409355163574219, -0.09845733642578125, -0.09282112121582031, -0.08718490600585938, -0.08154869079589844, -0.0759124755859375, -0.07027626037597656, -0.06464004516601562, -0.05900382995605469, -0.05336761474609375, -0.04773139953613281, -0.042095184326171875, -0.03645896911621094, -0.03082275390625, -0.025186538696289062, -0.019550323486328125, -0.013914108276367188, -0.00827789306640625, -0.0026416778564453125, 0.002994537353515625, 0.008630752563476562, 0.0142669677734375, 0.019903182983398438, 0.025539398193359375, 0.031175613403320312, 0.03681182861328125, 0.04244804382324219, 0.048084259033203125, 0.05372047424316406, 0.059356689453125, 0.06499290466308594, 0.07062911987304688, 0.07626533508300781, 0.08190155029296875, 0.08753776550292969, 0.09317398071289062, 0.09881019592285156, 0.1044464111328125, 0.11008262634277344, 0.11571884155273438, 0.12135505676269531, 0.12699127197265625, 0.1326274871826172, 0.13826370239257812, 0.14389991760253906, 0.1495361328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 9.0, 11.0, 9.0, 15.0, 23.0, 25.0, 35.0, 28.0, 41.0, 37.0, 59.0, 50.0, 51.0, 61.0, 63.0, 74.0, 54.0, 53.0, 52.0, 40.0, 34.0, 31.0, 30.0, 25.0, 26.0, 9.0, 11.0, 3.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.274658203125, -0.2673473358154297, -0.2600364685058594, -0.25272560119628906, -0.24541473388671875, -0.23810386657714844, -0.23079299926757812, -0.2234821319580078, -0.2161712646484375, -0.2088603973388672, -0.20154953002929688, -0.19423866271972656, -0.18692779541015625, -0.17961692810058594, -0.17230606079101562, -0.1649951934814453, -0.157684326171875, -0.1503734588623047, -0.14306259155273438, -0.13575172424316406, -0.12844085693359375, -0.12112998962402344, -0.11381912231445312, -0.10650825500488281, -0.0991973876953125, -0.09188652038574219, -0.08457565307617188, -0.07726478576660156, -0.06995391845703125, -0.06264305114746094, -0.055332183837890625, -0.04802131652832031, -0.04071044921875, -0.03339958190917969, -0.026088714599609375, -0.018777847290039062, -0.01146697998046875, -0.0041561126708984375, 0.003154754638671875, 0.010465621948242188, 0.0177764892578125, 0.025087356567382812, 0.032398223876953125, 0.03970909118652344, 0.04701995849609375, 0.05433082580566406, 0.061641693115234375, 0.06895256042480469, 0.076263427734375, 0.08357429504394531, 0.09088516235351562, 0.09819602966308594, 0.10550689697265625, 0.11281776428222656, 0.12012863159179688, 0.1274394989013672, 0.1347503662109375, 0.1420612335205078, 0.14937210083007812, 0.15668296813964844, 0.16399383544921875, 0.17130470275878906, 0.17861557006835938, 0.1859264373779297, 0.1932373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 7.0, 7.0, 13.0, 15.0, 28.0, 37.0, 47.0, 89.0, 143.0, 303.0, 741.0, 2285.0, 8319.0, 45936.0, 873661.0, 99405.0, 12416.0, 3132.0, 1052.0, 406.0, 180.0, 107.0, 60.0, 52.0, 24.0, 18.0, 13.0, 17.0, 4.0, 2.0, 2.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16552734375, -0.15974807739257812, -0.15396881103515625, -0.14818954467773438, -0.1424102783203125, -0.13663101196289062, -0.13085174560546875, -0.12507247924804688, -0.119293212890625, -0.11351394653320312, -0.10773468017578125, -0.10195541381835938, -0.0961761474609375, -0.09039688110351562, -0.08461761474609375, -0.07883834838867188, -0.07305908203125, -0.06727981567382812, -0.06150054931640625, -0.055721282958984375, -0.0499420166015625, -0.044162750244140625, -0.03838348388671875, -0.032604217529296875, -0.026824951171875, -0.021045684814453125, -0.01526641845703125, -0.009487152099609375, -0.0037078857421875, 0.002071380615234375, 0.00785064697265625, 0.013629913330078125, 0.0194091796875, 0.025188446044921875, 0.03096771240234375, 0.036746978759765625, 0.0425262451171875, 0.048305511474609375, 0.05408477783203125, 0.059864044189453125, 0.065643310546875, 0.07142257690429688, 0.07720184326171875, 0.08298110961914062, 0.0887603759765625, 0.09453964233398438, 0.10031890869140625, 0.10609817504882812, 0.11187744140625, 0.11765670776367188, 0.12343597412109375, 0.12921524047851562, 0.1349945068359375, 0.14077377319335938, 0.14655303955078125, 0.15233230590820312, 0.158111572265625, 0.16389083862304688, 0.16967010498046875, 0.17544937133789062, 0.1812286376953125, 0.18700790405273438, 0.19278717041015625, 0.19856643676757812, 0.204345703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 7.0, 8.0, 5.0, 3.0, 7.0, 8.0, 14.0, 20.0, 20.0, 16.0, 25.0, 32.0, 42.0, 67.0, 72.0, 107.0, 97.0, 104.0, 81.0, 53.0, 32.0, 25.0, 21.0, 20.0, 18.0, 16.0, 14.0, 6.0, 10.0, 8.0, 7.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.153915405273438e-05, -7.901154458522797e-05, -7.648393511772156e-05, -7.395632565021515e-05, -7.142871618270874e-05, -6.890110671520233e-05, -6.637349724769592e-05, -6.384588778018951e-05, -6.13182783126831e-05, -5.87906688451767e-05, -5.626305937767029e-05, -5.373544991016388e-05, -5.120784044265747e-05, -4.868023097515106e-05, -4.615262150764465e-05, -4.3625012040138245e-05, -4.1097402572631836e-05, -3.856979310512543e-05, -3.604218363761902e-05, -3.351457417011261e-05, -3.09869647026062e-05, -2.8459355235099792e-05, -2.5931745767593384e-05, -2.3404136300086975e-05, -2.0876526832580566e-05, -1.8348917365074158e-05, -1.582130789756775e-05, -1.329369843006134e-05, -1.0766088962554932e-05, -8.238479495048523e-06, -5.710870027542114e-06, -3.1832605600357056e-06, -6.556510925292969e-07, 1.8719583749771118e-06, 4.3995678424835205e-06, 6.927177309989929e-06, 9.454786777496338e-06, 1.1982396245002747e-05, 1.4510005712509155e-05, 1.7037615180015564e-05, 1.9565224647521973e-05, 2.209283411502838e-05, 2.462044358253479e-05, 2.71480530500412e-05, 2.9675662517547607e-05, 3.2203271985054016e-05, 3.4730881452560425e-05, 3.7258490920066833e-05, 3.978610038757324e-05, 4.231370985507965e-05, 4.484131932258606e-05, 4.736892879009247e-05, 4.989653825759888e-05, 5.2424147725105286e-05, 5.4951757192611694e-05, 5.74793666601181e-05, 6.000697612762451e-05, 6.253458559513092e-05, 6.506219506263733e-05, 6.758980453014374e-05, 7.011741399765015e-05, 7.264502346515656e-05, 7.517263293266296e-05, 7.770024240016937e-05, 8.022785186767578e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 16.0, 28.0, 31.0, 50.0, 73.0, 88.0, 184.0, 205.0, 397.0, 664.0, 1299.0, 2639.0, 5931.0, 15977.0, 75319.0, 795829.0, 116039.0, 19827.0, 7246.0, 3161.0, 1538.0, 793.0, 444.0, 278.0, 158.0, 91.0, 59.0, 48.0, 26.0, 21.0, 13.0, 10.0, 12.0, 9.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10601806640625, -0.10203075408935547, -0.09804344177246094, -0.0940561294555664, -0.09006881713867188, -0.08608150482177734, -0.08209419250488281, -0.07810688018798828, -0.07411956787109375, -0.07013225555419922, -0.06614494323730469, -0.062157630920410156, -0.058170318603515625, -0.054183006286621094, -0.05019569396972656, -0.04620838165283203, -0.0422210693359375, -0.03823375701904297, -0.03424644470214844, -0.030259132385253906, -0.026271820068359375, -0.022284507751464844, -0.018297195434570312, -0.014309883117675781, -0.01032257080078125, -0.006335258483886719, -0.0023479461669921875, 0.0016393661499023438, 0.005626678466796875, 0.009613990783691406, 0.013601303100585938, 0.01758861541748047, 0.021575927734375, 0.02556324005126953, 0.029550552368164062, 0.033537864685058594, 0.037525177001953125, 0.041512489318847656, 0.04549980163574219, 0.04948711395263672, 0.05347442626953125, 0.05746173858642578, 0.06144905090332031, 0.06543636322021484, 0.06942367553710938, 0.0734109878540039, 0.07739830017089844, 0.08138561248779297, 0.0853729248046875, 0.08936023712158203, 0.09334754943847656, 0.0973348617553711, 0.10132217407226562, 0.10530948638916016, 0.10929679870605469, 0.11328411102294922, 0.11727142333984375, 0.12125873565673828, 0.1252460479736328, 0.12923336029052734, 0.13322067260742188, 0.1372079849243164, 0.14119529724121094, 0.14518260955810547, 0.149169921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 8.0, 13.0, 14.0, 20.0, 50.0, 74.0, 194.0, 330.0, 109.0, 49.0, 30.0, 17.0, 21.0, 8.0, 7.0, 3.0, 8.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2073974609375, -0.1998004913330078, -0.19220352172851562, -0.18460655212402344, -0.17700958251953125, -0.16941261291503906, -0.16181564331054688, -0.1542186737060547, -0.1466217041015625, -0.1390247344970703, -0.13142776489257812, -0.12383079528808594, -0.11623382568359375, -0.10863685607910156, -0.10103988647460938, -0.09344291687011719, -0.085845947265625, -0.07824897766113281, -0.07065200805664062, -0.06305503845214844, -0.05545806884765625, -0.04786109924316406, -0.040264129638671875, -0.03266716003417969, -0.0250701904296875, -0.017473220825195312, -0.009876251220703125, -0.0022792816162109375, 0.00531768798828125, 0.012914657592773438, 0.020511627197265625, 0.028108596801757812, 0.03570556640625, 0.04330253601074219, 0.050899505615234375, 0.05849647521972656, 0.06609344482421875, 0.07369041442871094, 0.08128738403320312, 0.08888435363769531, 0.0964813232421875, 0.10407829284667969, 0.11167526245117188, 0.11927223205566406, 0.12686920166015625, 0.13446617126464844, 0.14206314086914062, 0.1496601104736328, 0.157257080078125, 0.1648540496826172, 0.17245101928710938, 0.18004798889160156, 0.18764495849609375, 0.19524192810058594, 0.20283889770507812, 0.2104358673095703, 0.2180328369140625, 0.2256298065185547, 0.23322677612304688, 0.24082374572753906, 0.24842071533203125, 0.25601768493652344, 0.2636146545410156, 0.2712116241455078, 0.27880859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 21.0, 11.0, 19.0, 68.0, 176.0, 328.0, 269.0, 73.0, 25.0, 2.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7482235431671143, -3.662583827972412, -3.576944351196289, -3.491304636001587, -3.4056649208068848, -3.3200254440307617, -3.2343857288360596, -3.1487460136413574, -3.0631065368652344, -2.9774668216705322, -2.891827344894409, -2.806187629699707, -2.720547914505005, -2.6349081993103027, -2.5492687225341797, -2.4636290073394775, -2.3779892921447754, -2.2923495769500732, -2.20671010017395, -2.121070384979248, -2.035430669784546, -1.9497910737991333, -1.8641514778137207, -1.7785117626190186, -1.692872166633606, -1.6072325706481934, -1.5215928554534912, -1.4359532594680786, -1.350313663482666, -1.2646739482879639, -1.1790343523025513, -1.0933947563171387, -1.0077552795410156, -0.9221156239509583, -0.8364759683609009, -0.7508363723754883, -0.6651967167854309, -0.5795570611953735, -0.49391746520996094, -0.40827780961990356, -0.3226381540298462, -0.23699851334095, -0.15135887265205383, -0.06571924686431885, 0.019920408725738525, 0.1055600643157959, 0.1911996603012085, 0.27683931589126587, 0.36247897148132324, 0.4481186270713806, 0.533758282661438, 0.6193978786468506, 0.705037534236908, 0.7906771898269653, 0.8763167858123779, 0.9619564414024353, 1.0475960969924927, 1.1332356929779053, 1.2188754081726074, 1.30451500415802, 1.3901546001434326, 1.4757943153381348, 1.5614339113235474, 1.64707350730896, 1.732713222503662]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 7.0, 2.0, 11.0, 11.0, 8.0, 13.0, 12.0, 14.0, 28.0, 22.0, 32.0, 35.0, 36.0, 29.0, 42.0, 44.0, 42.0, 44.0, 51.0, 53.0, 56.0, 42.0, 36.0, 27.0, 35.0, 33.0, 40.0, 30.0, 23.0, 22.0, 16.0, 17.0, 21.0, 20.0, 8.0, 8.0, 4.0, 4.0, 5.0, 6.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0845484733581543, -1.0480408668518066, -1.0115331411361694, -0.9750255346298218, -0.9385178685188293, -0.9020102024078369, -0.8655025959014893, -0.8289949297904968, -0.7924872636795044, -0.755979597568512, -0.7194719910621643, -0.6829643249511719, -0.6464566588401794, -0.609948992729187, -0.5734413862228394, -0.5369337201118469, -0.5004261136054993, -0.4639184772968292, -0.4274108111858368, -0.39090317487716675, -0.3543955087661743, -0.3178878724575043, -0.28138023614883423, -0.2448725700378418, -0.20836493372917175, -0.17185728251934052, -0.13534963130950928, -0.09884199500083923, -0.062334343791007996, -0.025826692581176758, 0.010680943727493286, 0.04718860983848572, 0.08369624614715576, 0.120203897356987, 0.15671154856681824, 0.19321918487548828, 0.22972683608531952, 0.26623448729515076, 0.3027421236038208, 0.33924978971481323, 0.3757574260234833, 0.4122650623321533, 0.44877272844314575, 0.4852803647518158, 0.5217880010604858, 0.5582956671714783, 0.5948033332824707, 0.6313109397888184, 0.6678186058998108, 0.7043262720108032, 0.7408338785171509, 0.7773415446281433, 0.8138492107391357, 0.8503568172454834, 0.8868644833564758, 0.9233721494674683, 0.9598797559738159, 0.9963874220848083, 1.0328950881958008, 1.0694026947021484, 1.105910301208496, 1.1424180269241333, 1.178925633430481, 1.2154333591461182, 1.2519409656524658]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 13.0, 15.0, 19.0, 42.0, 69.0, 136.0, 283.0, 609.0, 1920.0, 12701.0, 3996934.0, 173006.0, 6254.0, 1314.0, 471.0, 215.0, 111.0, 58.0, 42.0, 18.0, 15.0, 10.0, 0.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467529296875, -0.4518623352050781, -0.43619537353515625, -0.4205284118652344, -0.4048614501953125, -0.3891944885253906, -0.37352752685546875, -0.3578605651855469, -0.342193603515625, -0.3265266418457031, -0.31085968017578125, -0.2951927185058594, -0.2795257568359375, -0.2638587951660156, -0.24819183349609375, -0.23252487182617188, -0.21685791015625, -0.20119094848632812, -0.18552398681640625, -0.16985702514648438, -0.1541900634765625, -0.13852310180664062, -0.12285614013671875, -0.10718917846679688, -0.091522216796875, -0.07585525512695312, -0.06018829345703125, -0.044521331787109375, -0.0288543701171875, -0.013187408447265625, 0.00247955322265625, 0.018146514892578125, 0.0338134765625, 0.049480438232421875, 0.06514739990234375, 0.08081436157226562, 0.0964813232421875, 0.11214828491210938, 0.12781524658203125, 0.14348220825195312, 0.159149169921875, 0.17481613159179688, 0.19048309326171875, 0.20615005493164062, 0.2218170166015625, 0.23748397827148438, 0.25315093994140625, 0.2688179016113281, 0.28448486328125, 0.3001518249511719, 0.31581878662109375, 0.3314857482910156, 0.3471527099609375, 0.3628196716308594, 0.37848663330078125, 0.3941535949707031, 0.409820556640625, 0.4254875183105469, 0.44115447998046875, 0.4568214416503906, 0.4724884033203125, 0.4881553649902344, 0.5038223266601562, 0.5194892883300781, 0.53515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 12.0, 22.0, 32.0, 65.0, 115.0, 155.0, 180.0, 127.0, 113.0, 67.0, 42.0, 25.0, 12.0, 10.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09369945526123047, -0.09071922302246094, -0.0877389907836914, -0.08475875854492188, -0.08177852630615234, -0.07879829406738281, -0.07581806182861328, -0.07283782958984375, -0.06985759735107422, -0.06687736511230469, -0.06389713287353516, -0.060916900634765625, -0.057936668395996094, -0.05495643615722656, -0.05197620391845703, -0.0489959716796875, -0.04601573944091797, -0.04303550720214844, -0.040055274963378906, -0.037075042724609375, -0.034094810485839844, -0.031114578247070312, -0.02813434600830078, -0.02515411376953125, -0.02217388153076172, -0.019193649291992188, -0.016213417053222656, -0.013233184814453125, -0.010252952575683594, -0.0072727203369140625, -0.004292488098144531, -0.001312255859375, 0.0016679763793945312, 0.0046482086181640625, 0.007628440856933594, 0.010608673095703125, 0.013588905334472656, 0.016569137573242188, 0.01954936981201172, 0.02252960205078125, 0.02550983428955078, 0.028490066528320312, 0.031470298767089844, 0.034450531005859375, 0.037430763244628906, 0.04041099548339844, 0.04339122772216797, 0.0463714599609375, 0.04935169219970703, 0.05233192443847656, 0.055312156677246094, 0.058292388916015625, 0.061272621154785156, 0.06425285339355469, 0.06723308563232422, 0.07021331787109375, 0.07319355010986328, 0.07617378234863281, 0.07915401458740234, 0.08213424682617188, 0.0851144790649414, 0.08809471130371094, 0.09107494354248047, 0.09405517578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 12.0, 22.0, 27.0, 46.0, 54.0, 56.0, 99.0, 134.0, 175.0, 247.0, 321.0, 473.0, 667.0, 1106.0, 2260.0, 7380.0, 48461.0, 3934971.0, 176400.0, 13965.0, 3456.0, 1401.0, 781.0, 543.0, 346.0, 265.0, 168.0, 135.0, 103.0, 45.0, 45.0, 27.0, 26.0, 20.0, 13.0, 6.0, 1.0, 7.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.368408203125, -0.3591289520263672, -0.3498497009277344, -0.34057044982910156, -0.33129119873046875, -0.32201194763183594, -0.3127326965332031, -0.3034534454345703, -0.2941741943359375, -0.2848949432373047, -0.2756156921386719, -0.26633644104003906, -0.25705718994140625, -0.24777793884277344, -0.23849868774414062, -0.2292194366455078, -0.219940185546875, -0.2106609344482422, -0.20138168334960938, -0.19210243225097656, -0.18282318115234375, -0.17354393005371094, -0.16426467895507812, -0.1549854278564453, -0.1457061767578125, -0.1364269256591797, -0.12714767456054688, -0.11786842346191406, -0.10858917236328125, -0.09930992126464844, -0.09003067016601562, -0.08075141906738281, -0.07147216796875, -0.06219291687011719, -0.052913665771484375, -0.04363441467285156, -0.03435516357421875, -0.025075912475585938, -0.015796661376953125, -0.0065174102783203125, 0.0027618408203125, 0.012041091918945312, 0.021320343017578125, 0.030599594116210938, 0.03987884521484375, 0.04915809631347656, 0.058437347412109375, 0.06771659851074219, 0.076995849609375, 0.08627510070800781, 0.09555435180664062, 0.10483360290527344, 0.11411285400390625, 0.12339210510253906, 0.13267135620117188, 0.1419506072998047, 0.1512298583984375, 0.1605091094970703, 0.16978836059570312, 0.17906761169433594, 0.18834686279296875, 0.19762611389160156, 0.20690536499023438, 0.2161846160888672, 0.2254638671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 10.0, 19.0, 40.0, 94.0, 415.0, 3033.0, 334.0, 64.0, 28.0, 14.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2269287109375, -0.2214508056640625, -0.215972900390625, -0.2104949951171875, -0.20501708984375, -0.1995391845703125, -0.194061279296875, -0.1885833740234375, -0.18310546875, -0.1776275634765625, -0.172149658203125, -0.1666717529296875, -0.16119384765625, -0.1557159423828125, -0.150238037109375, -0.1447601318359375, -0.1392822265625, -0.1338043212890625, -0.128326416015625, -0.1228485107421875, -0.11737060546875, -0.1118927001953125, -0.106414794921875, -0.1009368896484375, -0.095458984375, -0.0899810791015625, -0.084503173828125, -0.0790252685546875, -0.07354736328125, -0.0680694580078125, -0.062591552734375, -0.0571136474609375, -0.0516357421875, -0.0461578369140625, -0.040679931640625, -0.0352020263671875, -0.02972412109375, -0.0242462158203125, -0.018768310546875, -0.0132904052734375, -0.0078125, -0.0023345947265625, 0.003143310546875, 0.0086212158203125, 0.01409912109375, 0.0195770263671875, 0.025054931640625, 0.0305328369140625, 0.0360107421875, 0.0414886474609375, 0.046966552734375, 0.0524444580078125, 0.05792236328125, 0.0634002685546875, 0.068878173828125, 0.0743560791015625, 0.079833984375, 0.0853118896484375, 0.090789794921875, 0.0962677001953125, 0.10174560546875, 0.1072235107421875, 0.112701416015625, 0.1181793212890625, 0.1236572265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 9.0, 13.0, 46.0, 109.0, 384.0, 340.0, 88.0, 14.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1068203449249268, -2.0655229091644287, -2.0242257118225098, -1.9829282760620117, -1.9416308403015137, -1.9003335237503052, -1.8590360879898071, -1.8177387714385986, -1.7764413356781006, -1.735144019126892, -1.693846583366394, -1.6525492668151855, -1.6112518310546875, -1.569954514503479, -1.528657078742981, -1.4873597621917725, -1.4460623264312744, -1.404765009880066, -1.3634675741195679, -1.3221702575683594, -1.2808728218078613, -1.2395755052566528, -1.1982780694961548, -1.1569807529449463, -1.1156834363937378, -1.0743861198425293, -1.0330886840820312, -0.991791307926178, -0.9504939317703247, -0.9091965556144714, -0.8678991794586182, -0.8266018629074097, -0.7853043675422668, -0.7440069913864136, -0.7027096152305603, -0.661412239074707, -0.6201148629188538, -0.5788174867630005, -0.537520170211792, -0.49622276425361633, -0.45492538809776306, -0.4136280119419098, -0.3723306357860565, -0.33103328943252563, -0.28973591327667236, -0.2484385222196579, -0.20714116096496582, -0.16584378480911255, -0.12454640865325928, -0.083249032497406, -0.04195166379213333, -0.0006542950868606567, 0.040643081068992615, 0.08194045722484589, 0.12323781847953796, 0.16453519463539124, 0.2058325707912445, 0.24712994694709778, 0.28842732310295105, 0.32972466945648193, 0.3710220456123352, 0.4123194217681885, 0.45361679792404175, 0.494914174079895, 0.5362115502357483]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 11.0, 7.0, 14.0, 14.0, 15.0, 14.0, 20.0, 36.0, 26.0, 45.0, 35.0, 47.0, 46.0, 52.0, 48.0, 43.0, 55.0, 54.0, 43.0, 48.0, 47.0, 43.0, 41.0, 29.0, 30.0, 23.0, 23.0, 18.0, 18.0, 19.0, 12.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2975556254386902, -0.2845814824104309, -0.27160730957984924, -0.25863316655158997, -0.2456590086221695, -0.23268485069274902, -0.21971070766448975, -0.20673654973506927, -0.1937623918056488, -0.18078823387622833, -0.16781407594680786, -0.15483993291854858, -0.1418657749891281, -0.12889161705970764, -0.11591746658086777, -0.1029433161020279, -0.08996915817260742, -0.07699500024318695, -0.06402084976434708, -0.051046695560216904, -0.03807254135608673, -0.02509838342666626, -0.012124232947826385, 0.0008499175310134888, 0.01382407546043396, 0.026798229664564133, 0.039772383868694305, 0.05274653807282448, 0.06572069227695465, 0.07869485020637512, 0.091669000685215, 0.10464315116405487, 0.11761730909347534, 0.1305914670228958, 0.14356562495231628, 0.15653976798057556, 0.16951392590999603, 0.1824880838394165, 0.19546222686767578, 0.20843638479709625, 0.22141054272651672, 0.2343847006559372, 0.24735885858535767, 0.26033300161361694, 0.2733071446418762, 0.2862813174724579, 0.29925546050071716, 0.31222963333129883, 0.3252037763595581, 0.3381779193878174, 0.35115209221839905, 0.3641262352466583, 0.37710040807724, 0.39007455110549927, 0.40304869413375854, 0.4160228371620178, 0.4289970099925995, 0.44197115302085876, 0.45494532585144043, 0.4679194688796997, 0.480893611907959, 0.49386778473854065, 0.5068419575691223, 0.5198161005973816, 0.5327902436256409]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 1.0, 4.0, 4.0, 11.0, 11.0, 16.0, 31.0, 28.0, 47.0, 83.0, 95.0, 150.0, 227.0, 344.0, 605.0, 1210.0, 2542.0, 7392.0, 30398.0, 226056.0, 673792.0, 82208.0, 14841.0, 4352.0, 1856.0, 872.0, 475.0, 289.0, 199.0, 131.0, 75.0, 62.0, 32.0, 25.0, 24.0, 11.0, 14.0, 7.0, 7.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.262451171875, -0.2543182373046875, -0.246185302734375, -0.2380523681640625, -0.22991943359375, -0.2217864990234375, -0.213653564453125, -0.2055206298828125, -0.1973876953125, -0.1892547607421875, -0.181121826171875, -0.1729888916015625, -0.16485595703125, -0.1567230224609375, -0.148590087890625, -0.1404571533203125, -0.13232421875, -0.1241912841796875, -0.116058349609375, -0.1079254150390625, -0.09979248046875, -0.0916595458984375, -0.083526611328125, -0.0753936767578125, -0.0672607421875, -0.0591278076171875, -0.050994873046875, -0.0428619384765625, -0.03472900390625, -0.0265960693359375, -0.018463134765625, -0.0103302001953125, -0.002197265625, 0.0059356689453125, 0.014068603515625, 0.0222015380859375, 0.03033447265625, 0.0384674072265625, 0.046600341796875, 0.0547332763671875, 0.0628662109375, 0.0709991455078125, 0.079132080078125, 0.0872650146484375, 0.09539794921875, 0.1035308837890625, 0.111663818359375, 0.1197967529296875, 0.1279296875, 0.1360626220703125, 0.144195556640625, 0.1523284912109375, 0.16046142578125, 0.1685943603515625, 0.176727294921875, 0.1848602294921875, 0.1929931640625, 0.2011260986328125, 0.209259033203125, 0.2173919677734375, 0.22552490234375, 0.2336578369140625, 0.241790771484375, 0.2499237060546875, 0.258056640625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 13.0, 11.0, 31.0, 44.0, 73.0, 110.0, 156.0, 156.0, 121.0, 98.0, 66.0, 43.0, 29.0, 15.0, 13.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097412109375, -0.09440135955810547, -0.09139060974121094, -0.0883798599243164, -0.08536911010742188, -0.08235836029052734, -0.07934761047363281, -0.07633686065673828, -0.07332611083984375, -0.07031536102294922, -0.06730461120605469, -0.06429386138916016, -0.061283111572265625, -0.058272361755371094, -0.05526161193847656, -0.05225086212158203, -0.0492401123046875, -0.04622936248779297, -0.04321861267089844, -0.040207862854003906, -0.037197113037109375, -0.034186363220214844, -0.031175613403320312, -0.02816486358642578, -0.02515411376953125, -0.02214336395263672, -0.019132614135742188, -0.016121864318847656, -0.013111114501953125, -0.010100364685058594, -0.0070896148681640625, -0.004078865051269531, -0.001068115234375, 0.0019426345825195312, 0.0049533843994140625, 0.007964134216308594, 0.010974884033203125, 0.013985633850097656, 0.016996383666992188, 0.02000713348388672, 0.02301788330078125, 0.02602863311767578, 0.029039382934570312, 0.032050132751464844, 0.035060882568359375, 0.038071632385253906, 0.04108238220214844, 0.04409313201904297, 0.0471038818359375, 0.05011463165283203, 0.05312538146972656, 0.056136131286621094, 0.059146881103515625, 0.062157630920410156, 0.06516838073730469, 0.06817913055419922, 0.07118988037109375, 0.07420063018798828, 0.07721138000488281, 0.08022212982177734, 0.08323287963867188, 0.0862436294555664, 0.08925437927246094, 0.09226512908935547, 0.09527587890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 14.0, 16.0, 16.0, 38.0, 55.0, 113.0, 121.0, 247.0, 455.0, 1027.0, 2399.0, 7356.0, 33275.0, 365486.0, 578564.0, 44925.0, 9191.0, 2880.0, 1091.0, 553.0, 281.0, 145.0, 98.0, 54.0, 39.0, 22.0, 18.0, 16.0, 15.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2844085693359375, -0.274627685546875, -0.2648468017578125, -0.25506591796875, -0.2452850341796875, -0.235504150390625, -0.2257232666015625, -0.2159423828125, -0.2061614990234375, -0.196380615234375, -0.1865997314453125, -0.17681884765625, -0.1670379638671875, -0.157257080078125, -0.1474761962890625, -0.1376953125, -0.1279144287109375, -0.118133544921875, -0.1083526611328125, -0.09857177734375, -0.0887908935546875, -0.079010009765625, -0.0692291259765625, -0.0594482421875, -0.0496673583984375, -0.039886474609375, -0.0301055908203125, -0.02032470703125, -0.0105438232421875, -0.000762939453125, 0.0090179443359375, 0.018798828125, 0.0285797119140625, 0.038360595703125, 0.0481414794921875, 0.05792236328125, 0.0677032470703125, 0.077484130859375, 0.0872650146484375, 0.0970458984375, 0.1068267822265625, 0.116607666015625, 0.1263885498046875, 0.13616943359375, 0.1459503173828125, 0.155731201171875, 0.1655120849609375, 0.17529296875, 0.1850738525390625, 0.194854736328125, 0.2046356201171875, 0.21441650390625, 0.2241973876953125, 0.233978271484375, 0.2437591552734375, 0.2535400390625, 0.2633209228515625, 0.273101806640625, 0.2828826904296875, 0.29266357421875, 0.3024444580078125, 0.312225341796875, 0.3220062255859375, 0.331787109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 11.0, 14.0, 8.0, 13.0, 16.0, 17.0, 16.0, 24.0, 30.0, 35.0, 34.0, 42.0, 44.0, 33.0, 51.0, 54.0, 44.0, 60.0, 42.0, 46.0, 37.0, 49.0, 39.0, 40.0, 35.0, 25.0, 21.0, 15.0, 17.0, 15.0, 7.0, 7.0, 12.0, 2.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2412109375, -0.2338104248046875, -0.226409912109375, -0.2190093994140625, -0.21160888671875, -0.2042083740234375, -0.196807861328125, -0.1894073486328125, -0.1820068359375, -0.1746063232421875, -0.167205810546875, -0.1598052978515625, -0.15240478515625, -0.1450042724609375, -0.137603759765625, -0.1302032470703125, -0.122802734375, -0.1154022216796875, -0.108001708984375, -0.1006011962890625, -0.09320068359375, -0.0858001708984375, -0.078399658203125, -0.0709991455078125, -0.0635986328125, -0.0561981201171875, -0.048797607421875, -0.0413970947265625, -0.03399658203125, -0.0265960693359375, -0.019195556640625, -0.0117950439453125, -0.00439453125, 0.0030059814453125, 0.010406494140625, 0.0178070068359375, 0.02520751953125, 0.0326080322265625, 0.040008544921875, 0.0474090576171875, 0.0548095703125, 0.0622100830078125, 0.069610595703125, 0.0770111083984375, 0.08441162109375, 0.0918121337890625, 0.099212646484375, 0.1066131591796875, 0.114013671875, 0.1214141845703125, 0.128814697265625, 0.1362152099609375, 0.14361572265625, 0.1510162353515625, 0.158416748046875, 0.1658172607421875, 0.1732177734375, 0.1806182861328125, 0.188018798828125, 0.1954193115234375, 0.20281982421875, 0.2102203369140625, 0.217620849609375, 0.2250213623046875, 0.232421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 13.0, 16.0, 24.0, 25.0, 66.0, 147.0, 318.0, 698.0, 2742.0, 85185.0, 951640.0, 5862.0, 1042.0, 369.0, 191.0, 75.0, 47.0, 25.0, 24.0, 9.0, 6.0, 11.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.583984375, -0.56689453125, -0.5498046875, -0.53271484375, -0.515625, -0.49853515625, -0.4814453125, -0.46435546875, -0.447265625, -0.43017578125, -0.4130859375, -0.39599609375, -0.37890625, -0.36181640625, -0.3447265625, -0.32763671875, -0.310546875, -0.29345703125, -0.2763671875, -0.25927734375, -0.2421875, -0.22509765625, -0.2080078125, -0.19091796875, -0.173828125, -0.15673828125, -0.1396484375, -0.12255859375, -0.10546875, -0.08837890625, -0.0712890625, -0.05419921875, -0.037109375, -0.02001953125, -0.0029296875, 0.01416015625, 0.03125, 0.04833984375, 0.0654296875, 0.08251953125, 0.099609375, 0.11669921875, 0.1337890625, 0.15087890625, 0.16796875, 0.18505859375, 0.2021484375, 0.21923828125, 0.236328125, 0.25341796875, 0.2705078125, 0.28759765625, 0.3046875, 0.32177734375, 0.3388671875, 0.35595703125, 0.373046875, 0.39013671875, 0.4072265625, 0.42431640625, 0.44140625, 0.45849609375, 0.4755859375, 0.49267578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 13.0, 12.0, 18.0, 14.0, 20.0, 27.0, 22.0, 33.0, 45.0, 60.0, 90.0, 113.0, 99.0, 91.0, 63.0, 47.0, 39.0, 27.0, 26.0, 26.0, 21.0, 11.0, 14.0, 9.0, 9.0, 12.0, 3.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.655952453613281e-05, -9.356345981359482e-05, -9.056739509105682e-05, -8.757133036851883e-05, -8.457526564598083e-05, -8.157920092344284e-05, -7.858313620090485e-05, -7.558707147836685e-05, -7.259100675582886e-05, -6.959494203329086e-05, -6.659887731075287e-05, -6.360281258821487e-05, -6.060674786567688e-05, -5.7610683143138885e-05, -5.461461842060089e-05, -5.16185536980629e-05, -4.86224889755249e-05, -4.562642425298691e-05, -4.2630359530448914e-05, -3.963429480791092e-05, -3.6638230085372925e-05, -3.364216536283493e-05, -3.0646100640296936e-05, -2.765003591775894e-05, -2.4653971195220947e-05, -2.1657906472682953e-05, -1.866184175014496e-05, -1.5665777027606964e-05, -1.266971230506897e-05, -9.673647582530975e-06, -6.677582859992981e-06, -3.6815181374549866e-06, -6.854534149169922e-07, 2.310611307621002e-06, 5.306676030158997e-06, 8.302740752696991e-06, 1.1298805475234985e-05, 1.429487019777298e-05, 1.7290934920310974e-05, 2.028699964284897e-05, 2.3283064365386963e-05, 2.6279129087924957e-05, 2.927519381046295e-05, 3.2271258533000946e-05, 3.526732325553894e-05, 3.8263387978076935e-05, 4.125945270061493e-05, 4.4255517423152924e-05, 4.725158214569092e-05, 5.024764686822891e-05, 5.324371159076691e-05, 5.62397763133049e-05, 5.9235841035842896e-05, 6.223190575838089e-05, 6.522797048091888e-05, 6.822403520345688e-05, 7.122009992599487e-05, 7.421616464853287e-05, 7.721222937107086e-05, 8.020829409360886e-05, 8.320435881614685e-05, 8.620042353868484e-05, 8.919648826122284e-05, 9.219255298376083e-05, 9.518861770629883e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 5.0, 8.0, 6.0, 12.0, 16.0, 22.0, 24.0, 29.0, 56.0, 90.0, 192.0, 319.0, 761.0, 1987.0, 6923.0, 47078.0, 895140.0, 81873.0, 9492.0, 2610.0, 965.0, 409.0, 203.0, 111.0, 75.0, 56.0, 30.0, 16.0, 6.0, 7.0, 0.0, 14.0, 9.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248046875, -0.2406635284423828, -0.23328018188476562, -0.22589683532714844, -0.21851348876953125, -0.21113014221191406, -0.20374679565429688, -0.1963634490966797, -0.1889801025390625, -0.1815967559814453, -0.17421340942382812, -0.16683006286621094, -0.15944671630859375, -0.15206336975097656, -0.14468002319335938, -0.1372966766357422, -0.129913330078125, -0.12252998352050781, -0.11514663696289062, -0.10776329040527344, -0.10037994384765625, -0.09299659729003906, -0.08561325073242188, -0.07822990417480469, -0.0708465576171875, -0.06346321105957031, -0.056079864501953125, -0.04869651794433594, -0.04131317138671875, -0.03392982482910156, -0.026546478271484375, -0.019163131713867188, -0.01177978515625, -0.0043964385986328125, 0.002986907958984375, 0.010370254516601562, 0.01775360107421875, 0.025136947631835938, 0.032520294189453125, 0.03990364074707031, 0.0472869873046875, 0.05467033386230469, 0.062053680419921875, 0.06943702697753906, 0.07682037353515625, 0.08420372009277344, 0.09158706665039062, 0.09897041320800781, 0.106353759765625, 0.11373710632324219, 0.12112045288085938, 0.12850379943847656, 0.13588714599609375, 0.14327049255371094, 0.15065383911132812, 0.1580371856689453, 0.1654205322265625, 0.1728038787841797, 0.18018722534179688, 0.18757057189941406, 0.19495391845703125, 0.20233726501464844, 0.20972061157226562, 0.2171039581298828, 0.2244873046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 7.0, 8.0, 13.0, 14.0, 24.0, 50.0, 67.0, 119.0, 275.0, 159.0, 102.0, 44.0, 30.0, 16.0, 11.0, 10.0, 7.0, 9.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3042259216308594, -0.29570770263671875, -0.2871894836425781, -0.2786712646484375, -0.2701530456542969, -0.26163482666015625, -0.2531166076660156, -0.244598388671875, -0.23608016967773438, -0.22756195068359375, -0.21904373168945312, -0.2105255126953125, -0.20200729370117188, -0.19348907470703125, -0.18497085571289062, -0.17645263671875, -0.16793441772460938, -0.15941619873046875, -0.15089797973632812, -0.1423797607421875, -0.13386154174804688, -0.12534332275390625, -0.11682510375976562, -0.108306884765625, -0.09978866577148438, -0.09127044677734375, -0.08275222778320312, -0.0742340087890625, -0.06571578979492188, -0.05719757080078125, -0.048679351806640625, -0.0401611328125, -0.031642913818359375, -0.02312469482421875, -0.014606475830078125, -0.0060882568359375, 0.002429962158203125, 0.01094818115234375, 0.019466400146484375, 0.027984619140625, 0.036502838134765625, 0.04502105712890625, 0.053539276123046875, 0.0620574951171875, 0.07057571411132812, 0.07909393310546875, 0.08761215209960938, 0.09613037109375, 0.10464859008789062, 0.11316680908203125, 0.12168502807617188, 0.1302032470703125, 0.13872146606445312, 0.14723968505859375, 0.15575790405273438, 0.164276123046875, 0.17279434204101562, 0.18131256103515625, 0.18983078002929688, 0.1983489990234375, 0.20686721801757812, 0.21538543701171875, 0.22390365600585938, 0.232421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 41.0, 322.0, 580.0, 40.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.710500717163086, -11.44558334350586, -11.180665016174316, -10.91574764251709, -10.650829315185547, -10.38591194152832, -10.120994567871094, -9.85607624053955, -9.591158866882324, -9.326241493225098, -9.061323165893555, -8.796405792236328, -8.531487464904785, -8.266570091247559, -8.001651763916016, -7.736734390258789, -7.471816539764404, -7.2068986892700195, -6.941980838775635, -6.67706298828125, -6.412145614624023, -6.147227764129639, -5.882309913635254, -5.617392063140869, -5.352474212646484, -5.0875563621521, -4.822638511657715, -4.557721138000488, -4.2928032875061035, -4.027885437011719, -3.762967586517334, -3.498049736022949, -3.233132839202881, -2.968214988708496, -2.7032973766326904, -2.4383795261383057, -2.1734619140625, -1.9085440635681152, -1.6436262130737305, -1.3787084817886353, -1.11379075050354, -0.8488730192184448, -0.5839552283287048, -0.31903743743896484, -0.05411970615386963, 0.21079802513122559, 0.47571587562561035, 0.7406336069107056, 1.0055513381958008, 1.270469069480896, 1.5353868007659912, 1.800304651260376, 2.0652222633361816, 2.3301401138305664, 2.595057964324951, 2.859975814819336, 3.1248934268951416, 3.3898112773895264, 3.654728889465332, 3.919646739959717, 4.184564590454102, 4.449481964111328, 4.714400291442871, 4.979317665100098, 5.244235515594482]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 10.0, 8.0, 15.0, 22.0, 27.0, 20.0, 30.0, 33.0, 62.0, 35.0, 55.0, 42.0, 56.0, 61.0, 67.0, 46.0, 54.0, 55.0, 37.0, 33.0, 47.0, 37.0, 23.0, 26.0, 19.0, 13.0, 11.0, 11.0, 14.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4613746404647827, -1.4001802206039429, -1.3389859199523926, -1.2777915000915527, -1.216597080230713, -1.155402660369873, -1.0942083597183228, -1.033013939857483, -0.9718195796012878, -0.9106252193450928, -0.8494307994842529, -0.7882364392280579, -0.7270420789718628, -0.665847659111023, -0.6046532988548279, -0.5434589385986328, -0.48226451873779297, -0.4210701286792755, -0.35987573862075806, -0.298681378364563, -0.23748698830604553, -0.17629259824752808, -0.11509823799133301, -0.05390384793281555, 0.007290542125701904, 0.06848492473363876, 0.12967930734157562, 0.19087368249893188, 0.25206807255744934, 0.3132624626159668, 0.37445682287216187, 0.4356512129306793, 0.4968454837799072, 0.5580398440361023, 0.6192342638969421, 0.6804286241531372, 0.741623044013977, 0.8028174042701721, 0.8640117645263672, 0.925206184387207, 0.9864005446434021, 1.0475949048995972, 1.108789324760437, 1.1699836254119873, 1.2311780452728271, 1.292372465133667, 1.3535668849945068, 1.4147611856460571, 1.475955605506897, 1.5371500253677368, 1.598344326019287, 1.659538745880127, 1.7207331657409668, 1.7819275856018066, 1.843121886253357, 1.9043163061141968, 1.965510606765747, 2.026705026626587, 2.0878994464874268, 2.1490936279296875, 2.2102880477905273, 2.271482467651367, 2.332676887512207, 2.393871307373047, 2.4550657272338867]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 8.0, 10.0, 13.0, 17.0, 41.0, 57.0, 80.0, 150.0, 280.0, 521.0, 1160.0, 2835.0, 9257.0, 48158.0, 3859858.0, 242071.0, 20550.0, 5454.0, 1947.0, 844.0, 418.0, 201.0, 127.0, 82.0, 41.0, 27.0, 22.0, 12.0, 8.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.268310546875, -0.26012420654296875, -0.2519378662109375, -0.24375152587890625, -0.235565185546875, -0.22737884521484375, -0.2191925048828125, -0.21100616455078125, -0.20281982421875, -0.19463348388671875, -0.1864471435546875, -0.17826080322265625, -0.170074462890625, -0.16188812255859375, -0.1537017822265625, -0.14551544189453125, -0.1373291015625, -0.12914276123046875, -0.1209564208984375, -0.11277008056640625, -0.104583740234375, -0.09639739990234375, -0.0882110595703125, -0.08002471923828125, -0.07183837890625, -0.06365203857421875, -0.0554656982421875, -0.04727935791015625, -0.039093017578125, -0.03090667724609375, -0.0227203369140625, -0.01453399658203125, -0.00634765625, 0.00183868408203125, 0.0100250244140625, 0.01821136474609375, 0.026397705078125, 0.03458404541015625, 0.0427703857421875, 0.05095672607421875, 0.05914306640625, 0.06732940673828125, 0.0755157470703125, 0.08370208740234375, 0.091888427734375, 0.10007476806640625, 0.1082611083984375, 0.11644744873046875, 0.1246337890625, 0.13282012939453125, 0.1410064697265625, 0.14919281005859375, 0.157379150390625, 0.16556549072265625, 0.1737518310546875, 0.18193817138671875, 0.19012451171875, 0.19831085205078125, 0.2064971923828125, 0.21468353271484375, 0.222869873046875, 0.23105621337890625, 0.2392425537109375, 0.24742889404296875, 0.255615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 8.0, 12.0, 20.0, 34.0, 47.0, 71.0, 98.0, 109.0, 138.0, 120.0, 109.0, 70.0, 46.0, 41.0, 23.0, 17.0, 10.0, 11.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09686279296875, -0.09388446807861328, -0.09090614318847656, -0.08792781829833984, -0.08494949340820312, -0.0819711685180664, -0.07899284362792969, -0.07601451873779297, -0.07303619384765625, -0.07005786895751953, -0.06707954406738281, -0.0641012191772461, -0.061122894287109375, -0.058144569396972656, -0.05516624450683594, -0.05218791961669922, -0.0492095947265625, -0.04623126983642578, -0.04325294494628906, -0.040274620056152344, -0.037296295166015625, -0.034317970275878906, -0.03133964538574219, -0.02836132049560547, -0.02538299560546875, -0.02240467071533203, -0.019426345825195312, -0.016448020935058594, -0.013469696044921875, -0.010491371154785156, -0.0075130462646484375, -0.004534721374511719, -0.001556396484375, 0.0014219284057617188, 0.0044002532958984375, 0.007378578186035156, 0.010356903076171875, 0.013335227966308594, 0.016313552856445312, 0.01929187774658203, 0.02227020263671875, 0.02524852752685547, 0.028226852416992188, 0.031205177307128906, 0.034183502197265625, 0.037161827087402344, 0.04014015197753906, 0.04311847686767578, 0.0460968017578125, 0.04907512664794922, 0.05205345153808594, 0.055031776428222656, 0.058010101318359375, 0.060988426208496094, 0.06396675109863281, 0.06694507598876953, 0.06992340087890625, 0.07290172576904297, 0.07588005065917969, 0.0788583755493164, 0.08183670043945312, 0.08481502532958984, 0.08779335021972656, 0.09077167510986328, 0.09375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 23.0, 29.0, 36.0, 65.0, 92.0, 113.0, 233.0, 440.0, 744.0, 1259.0, 2808.0, 8921.0, 74956.0, 4025171.0, 64996.0, 8380.0, 2918.0, 1324.0, 718.0, 388.0, 223.0, 139.0, 120.0, 64.0, 44.0, 18.0, 19.0, 7.0, 8.0, 5.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40478515625, -0.3933753967285156, -0.38196563720703125, -0.3705558776855469, -0.3591461181640625, -0.3477363586425781, -0.33632659912109375, -0.3249168395996094, -0.313507080078125, -0.3020973205566406, -0.29068756103515625, -0.2792778015136719, -0.2678680419921875, -0.2564582824707031, -0.24504852294921875, -0.23363876342773438, -0.22222900390625, -0.21081924438476562, -0.19940948486328125, -0.18799972534179688, -0.1765899658203125, -0.16518020629882812, -0.15377044677734375, -0.14236068725585938, -0.130950927734375, -0.11954116821289062, -0.10813140869140625, -0.09672164916992188, -0.0853118896484375, -0.07390213012695312, -0.06249237060546875, -0.051082611083984375, -0.0396728515625, -0.028263092041015625, -0.01685333251953125, -0.005443572998046875, 0.0059661865234375, 0.017375946044921875, 0.02878570556640625, 0.040195465087890625, 0.051605224609375, 0.06301498413085938, 0.07442474365234375, 0.08583450317382812, 0.0972442626953125, 0.10865402221679688, 0.12006378173828125, 0.13147354125976562, 0.14288330078125, 0.15429306030273438, 0.16570281982421875, 0.17711257934570312, 0.1885223388671875, 0.19993209838867188, 0.21134185791015625, 0.22275161743164062, 0.234161376953125, 0.24557113647460938, 0.25698089599609375, 0.2683906555175781, 0.2798004150390625, 0.2912101745605469, 0.30261993408203125, 0.3140296936035156, 0.325439453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 14.0, 34.0, 89.0, 501.0, 3077.0, 221.0, 55.0, 29.0, 18.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27099609375, -0.2633190155029297, -0.2556419372558594, -0.24796485900878906, -0.24028778076171875, -0.23261070251464844, -0.22493362426757812, -0.2172565460205078, -0.2095794677734375, -0.2019023895263672, -0.19422531127929688, -0.18654823303222656, -0.17887115478515625, -0.17119407653808594, -0.16351699829101562, -0.1558399200439453, -0.148162841796875, -0.1404857635498047, -0.13280868530273438, -0.12513160705566406, -0.11745452880859375, -0.10977745056152344, -0.10210037231445312, -0.09442329406738281, -0.0867462158203125, -0.07906913757324219, -0.07139205932617188, -0.06371498107910156, -0.05603790283203125, -0.04836082458496094, -0.040683746337890625, -0.03300666809082031, -0.02532958984375, -0.017652511596679688, -0.009975433349609375, -0.0022983551025390625, 0.00537872314453125, 0.013055801391601562, 0.020732879638671875, 0.028409957885742188, 0.0360870361328125, 0.04376411437988281, 0.051441192626953125, 0.05911827087402344, 0.06679534912109375, 0.07447242736816406, 0.08214950561523438, 0.08982658386230469, 0.097503662109375, 0.10518074035644531, 0.11285781860351562, 0.12053489685058594, 0.12821197509765625, 0.13588905334472656, 0.14356613159179688, 0.1512432098388672, 0.1589202880859375, 0.1665973663330078, 0.17427444458007812, 0.18195152282714844, 0.18962860107421875, 0.19730567932128906, 0.20498275756835938, 0.2126598358154297, 0.2203369140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 15.0, 41.0, 72.0, 199.0, 283.0, 214.0, 85.0, 50.0, 20.0, 5.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7644767761230469, -0.7356289625167847, -0.7067811489105225, -0.6779333353042603, -0.649085521697998, -0.6202377080917358, -0.5913898944854736, -0.5625420808792114, -0.5336942672729492, -0.504846453666687, -0.4759986400604248, -0.4471508264541626, -0.4183030128479004, -0.3894551992416382, -0.360607385635376, -0.33175957202911377, -0.30291175842285156, -0.27406394481658936, -0.24521613121032715, -0.21636831760406494, -0.18752050399780273, -0.15867269039154053, -0.12982487678527832, -0.10097706317901611, -0.0721292495727539, -0.0432814359664917, -0.014433622360229492, 0.014414191246032715, 0.04326200485229492, 0.07210981845855713, 0.10095763206481934, 0.12980544567108154, 0.15865325927734375, 0.18750107288360596, 0.21634888648986816, 0.24519670009613037, 0.2740445137023926, 0.3028923273086548, 0.331740140914917, 0.3605879545211792, 0.3894357681274414, 0.4182835817337036, 0.4471313953399658, 0.475979208946228, 0.5048270225524902, 0.5336748361587524, 0.5625226497650146, 0.5913704633712769, 0.6202182769775391, 0.6490660905838013, 0.6779139041900635, 0.7067617177963257, 0.7356095314025879, 0.7644573450088501, 0.7933051586151123, 0.8221529722213745, 0.8510007858276367, 0.8798485994338989, 0.9086964130401611, 0.9375442266464233, 0.9663920402526855, 0.9952398538589478, 1.02408766746521, 1.0529354810714722, 1.0817832946777344]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 7.0, 5.0, 5.0, 12.0, 9.0, 23.0, 18.0, 22.0, 19.0, 21.0, 36.0, 27.0, 28.0, 30.0, 38.0, 40.0, 38.0, 46.0, 44.0, 47.0, 32.0, 39.0, 35.0, 29.0, 45.0, 40.0, 34.0, 35.0, 35.0, 31.0, 16.0, 20.0, 13.0, 21.0, 10.0, 6.0, 7.0, 9.0, 5.0, 6.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3800247311592102, -0.3687201142311096, -0.35741546750068665, -0.34611085057258606, -0.3348062038421631, -0.3235015869140625, -0.3121969699859619, -0.30089232325553894, -0.28958767652511597, -0.2782830595970154, -0.2669784128665924, -0.2556737959384918, -0.24436914920806885, -0.23306453227996826, -0.22175990045070648, -0.2104552686214447, -0.19915065169334412, -0.18784601986408234, -0.17654138803482056, -0.16523677110671997, -0.153932124376297, -0.1426275074481964, -0.13132287561893463, -0.12001824378967285, -0.10871361196041107, -0.09740898013114929, -0.08610434830188751, -0.07479972392320633, -0.06349509209394455, -0.05219046026468277, -0.04088583588600159, -0.029581204056739807, -0.018276572227478027, -0.006971942260861397, 0.004332687705755234, 0.015637315809726715, 0.026941947638988495, 0.038246579468250275, 0.04955120384693146, 0.06085583567619324, 0.07216046750545502, 0.0834650993347168, 0.09476973116397858, 0.10607435554265976, 0.11737898737192154, 0.12868362665176392, 0.1399882435798645, 0.15129287540912628, 0.16259750723838806, 0.17390213906764984, 0.18520677089691162, 0.1965113878250122, 0.20781603455543518, 0.21912065148353577, 0.23042528331279755, 0.24172991514205933, 0.2530345320701599, 0.2643391489982605, 0.27564379572868347, 0.28694841265678406, 0.29825305938720703, 0.3095576763153076, 0.3208622932434082, 0.3321669399738312, 0.34347158670425415]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 9.0, 15.0, 16.0, 40.0, 44.0, 97.0, 131.0, 288.0, 611.0, 1787.0, 6866.0, 50388.0, 910813.0, 65977.0, 7944.0, 2024.0, 764.0, 352.0, 156.0, 74.0, 47.0, 38.0, 21.0, 21.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41943359375, -0.4061393737792969, -0.39284515380859375, -0.3795509338378906, -0.3662567138671875, -0.3529624938964844, -0.33966827392578125, -0.3263740539550781, -0.313079833984375, -0.2997856140136719, -0.28649139404296875, -0.2731971740722656, -0.2599029541015625, -0.24660873413085938, -0.23331451416015625, -0.22002029418945312, -0.20672607421875, -0.19343185424804688, -0.18013763427734375, -0.16684341430664062, -0.1535491943359375, -0.14025497436523438, -0.12696075439453125, -0.11366653442382812, -0.100372314453125, -0.08707809448242188, -0.07378387451171875, -0.060489654541015625, -0.0471954345703125, -0.033901214599609375, -0.02060699462890625, -0.007312774658203125, 0.0059814453125, 0.019275665283203125, 0.03256988525390625, 0.045864105224609375, 0.0591583251953125, 0.07245254516601562, 0.08574676513671875, 0.09904098510742188, 0.112335205078125, 0.12562942504882812, 0.13892364501953125, 0.15221786499023438, 0.1655120849609375, 0.17880630493164062, 0.19210052490234375, 0.20539474487304688, 0.21868896484375, 0.23198318481445312, 0.24527740478515625, 0.2585716247558594, 0.2718658447265625, 0.2851600646972656, 0.29845428466796875, 0.3117485046386719, 0.325042724609375, 0.3383369445800781, 0.35163116455078125, 0.3649253845214844, 0.3782196044921875, 0.3915138244628906, 0.40480804443359375, 0.4181022644042969, 0.431396484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 13.0, 20.0, 25.0, 55.0, 90.0, 89.0, 121.0, 116.0, 118.0, 97.0, 76.0, 58.0, 36.0, 20.0, 21.0, 17.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09857177734375, -0.09554195404052734, -0.09251213073730469, -0.08948230743408203, -0.08645248413085938, -0.08342266082763672, -0.08039283752441406, -0.0773630142211914, -0.07433319091796875, -0.0713033676147461, -0.06827354431152344, -0.06524372100830078, -0.062213897705078125, -0.05918407440185547, -0.05615425109863281, -0.053124427795410156, -0.0500946044921875, -0.047064781188964844, -0.04403495788574219, -0.04100513458251953, -0.037975311279296875, -0.03494548797607422, -0.03191566467285156, -0.028885841369628906, -0.02585601806640625, -0.022826194763183594, -0.019796371459960938, -0.01676654815673828, -0.013736724853515625, -0.010706901550292969, -0.0076770782470703125, -0.004647254943847656, -0.001617431640625, 0.0014123916625976562, 0.0044422149658203125, 0.007472038269042969, 0.010501861572265625, 0.013531684875488281, 0.016561508178710938, 0.019591331481933594, 0.02262115478515625, 0.025650978088378906, 0.028680801391601562, 0.03171062469482422, 0.034740447998046875, 0.03777027130126953, 0.04080009460449219, 0.043829917907714844, 0.0468597412109375, 0.049889564514160156, 0.05291938781738281, 0.05594921112060547, 0.058979034423828125, 0.06200885772705078, 0.06503868103027344, 0.0680685043334961, 0.07109832763671875, 0.0741281509399414, 0.07715797424316406, 0.08018779754638672, 0.08321762084960938, 0.08624744415283203, 0.08927726745605469, 0.09230709075927734, 0.0953369140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 10.0, 29.0, 27.0, 35.0, 62.0, 73.0, 119.0, 162.0, 336.0, 663.0, 1460.0, 3972.0, 14290.0, 109056.0, 856077.0, 48096.0, 8905.0, 2773.0, 1139.0, 498.0, 283.0, 155.0, 93.0, 66.0, 36.0, 23.0, 32.0, 14.0, 7.0, 8.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33251953125, -0.3225440979003906, -0.31256866455078125, -0.3025932312011719, -0.2926177978515625, -0.2826423645019531, -0.27266693115234375, -0.2626914978027344, -0.252716064453125, -0.24274063110351562, -0.23276519775390625, -0.22278976440429688, -0.2128143310546875, -0.20283889770507812, -0.19286346435546875, -0.18288803100585938, -0.17291259765625, -0.16293716430664062, -0.15296173095703125, -0.14298629760742188, -0.1330108642578125, -0.12303543090820312, -0.11305999755859375, -0.10308456420898438, -0.093109130859375, -0.08313369750976562, -0.07315826416015625, -0.06318283081054688, -0.0532073974609375, -0.043231964111328125, -0.03325653076171875, -0.023281097412109375, -0.0133056640625, -0.003330230712890625, 0.00664520263671875, 0.016620635986328125, 0.0265960693359375, 0.036571502685546875, 0.04654693603515625, 0.056522369384765625, 0.066497802734375, 0.07647323608398438, 0.08644866943359375, 0.09642410278320312, 0.1063995361328125, 0.11637496948242188, 0.12635040283203125, 0.13632583618164062, 0.14630126953125, 0.15627670288085938, 0.16625213623046875, 0.17622756958007812, 0.1862030029296875, 0.19617843627929688, 0.20615386962890625, 0.21612930297851562, 0.226104736328125, 0.23608016967773438, 0.24605560302734375, 0.2560310363769531, 0.2660064697265625, 0.2759819030761719, 0.28595733642578125, 0.2959327697753906, 0.305908203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 0.0, 3.0, 11.0, 6.0, 13.0, 16.0, 22.0, 29.0, 35.0, 40.0, 31.0, 50.0, 80.0, 82.0, 82.0, 72.0, 66.0, 63.0, 48.0, 65.0, 50.0, 39.0, 23.0, 15.0, 14.0, 8.0, 14.0, 5.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.3832244873046875, -0.372650146484375, -0.3620758056640625, -0.35150146484375, -0.3409271240234375, -0.330352783203125, -0.3197784423828125, -0.3092041015625, -0.2986297607421875, -0.288055419921875, -0.2774810791015625, -0.26690673828125, -0.2563323974609375, -0.245758056640625, -0.2351837158203125, -0.224609375, -0.2140350341796875, -0.203460693359375, -0.1928863525390625, -0.18231201171875, -0.1717376708984375, -0.161163330078125, -0.1505889892578125, -0.1400146484375, -0.1294403076171875, -0.118865966796875, -0.1082916259765625, -0.09771728515625, -0.0871429443359375, -0.076568603515625, -0.0659942626953125, -0.055419921875, -0.0448455810546875, -0.034271240234375, -0.0236968994140625, -0.01312255859375, -0.0025482177734375, 0.008026123046875, 0.0186004638671875, 0.0291748046875, 0.0397491455078125, 0.050323486328125, 0.0608978271484375, 0.07147216796875, 0.0820465087890625, 0.092620849609375, 0.1031951904296875, 0.11376953125, 0.1243438720703125, 0.134918212890625, 0.1454925537109375, 0.15606689453125, 0.1666412353515625, 0.177215576171875, 0.1877899169921875, 0.1983642578125, 0.2089385986328125, 0.219512939453125, 0.2300872802734375, 0.24066162109375, 0.2512359619140625, 0.261810302734375, 0.2723846435546875, 0.282958984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 13.0, 17.0, 23.0, 25.0, 58.0, 108.0, 157.0, 407.0, 1029.0, 5020.0, 65001.0, 927842.0, 43109.0, 4058.0, 933.0, 354.0, 175.0, 68.0, 43.0, 44.0, 19.0, 5.0, 9.0, 14.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.19758224487304688, -0.19167327880859375, -0.18576431274414062, -0.1798553466796875, -0.17394638061523438, -0.16803741455078125, -0.16212844848632812, -0.156219482421875, -0.15031051635742188, -0.14440155029296875, -0.13849258422851562, -0.1325836181640625, -0.12667465209960938, -0.12076568603515625, -0.11485671997070312, -0.10894775390625, -0.10303878784179688, -0.09712982177734375, -0.09122085571289062, -0.0853118896484375, -0.07940292358398438, -0.07349395751953125, -0.06758499145507812, -0.061676025390625, -0.055767059326171875, -0.04985809326171875, -0.043949127197265625, -0.0380401611328125, -0.032131195068359375, -0.02622222900390625, -0.020313262939453125, -0.014404296875, -0.008495330810546875, -0.00258636474609375, 0.003322601318359375, 0.0092315673828125, 0.015140533447265625, 0.02104949951171875, 0.026958465576171875, 0.032867431640625, 0.038776397705078125, 0.04468536376953125, 0.050594329833984375, 0.0565032958984375, 0.062412261962890625, 0.06832122802734375, 0.07423019409179688, 0.08013916015625, 0.08604812622070312, 0.09195709228515625, 0.09786605834960938, 0.1037750244140625, 0.10968399047851562, 0.11559295654296875, 0.12150192260742188, 0.127410888671875, 0.13331985473632812, 0.13922882080078125, 0.14513778686523438, 0.1510467529296875, 0.15695571899414062, 0.16286468505859375, 0.16877365112304688, 0.1746826171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 9.0, 9.0, 18.0, 24.0, 36.0, 45.0, 76.0, 115.0, 151.0, 145.0, 113.0, 70.0, 43.0, 32.0, 18.0, 19.0, 15.0, 8.0, 10.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.435415267944336e-05, -9.129848331212997e-05, -8.824281394481659e-05, -8.51871445775032e-05, -8.213147521018982e-05, -7.907580584287643e-05, -7.602013647556305e-05, -7.296446710824966e-05, -6.990879774093628e-05, -6.68531283736229e-05, -6.379745900630951e-05, -6.0741789638996124e-05, -5.768612027168274e-05, -5.4630450904369354e-05, -5.157478153705597e-05, -4.8519112169742584e-05, -4.54634428024292e-05, -4.2407773435115814e-05, -3.935210406780243e-05, -3.6296434700489044e-05, -3.324076533317566e-05, -3.0185095965862274e-05, -2.712942659854889e-05, -2.4073757231235504e-05, -2.101808786392212e-05, -1.7962418496608734e-05, -1.4906749129295349e-05, -1.1851079761981964e-05, -8.795410394668579e-06, -5.739741027355194e-06, -2.684071660041809e-06, 3.7159770727157593e-07, 3.427267074584961e-06, 6.482936441898346e-06, 9.538605809211731e-06, 1.2594275176525116e-05, 1.56499445438385e-05, 1.8705613911151886e-05, 2.176128327846527e-05, 2.4816952645778656e-05, 2.787262201309204e-05, 3.0928291380405426e-05, 3.398396074771881e-05, 3.7039630115032196e-05, 4.009529948234558e-05, 4.3150968849658966e-05, 4.620663821697235e-05, 4.9262307584285736e-05, 5.231797695159912e-05, 5.5373646318912506e-05, 5.842931568622589e-05, 6.148498505353928e-05, 6.454065442085266e-05, 6.759632378816605e-05, 7.065199315547943e-05, 7.370766252279282e-05, 7.67633318901062e-05, 7.981900125741959e-05, 8.287467062473297e-05, 8.593033999204636e-05, 8.898600935935974e-05, 9.204167872667313e-05, 9.509734809398651e-05, 9.81530174612999e-05, 0.00010120868682861328]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 15.0, 11.0, 17.0, 16.0, 33.0, 57.0, 88.0, 140.0, 257.0, 442.0, 935.0, 2887.0, 15500.0, 216035.0, 780499.0, 25326.0, 3824.0, 1227.0, 520.0, 278.0, 146.0, 98.0, 66.0, 45.0, 28.0, 16.0, 10.0, 9.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2137451171875, -0.20841598510742188, -0.20308685302734375, -0.19775772094726562, -0.1924285888671875, -0.18709945678710938, -0.18177032470703125, -0.17644119262695312, -0.171112060546875, -0.16578292846679688, -0.16045379638671875, -0.15512466430664062, -0.1497955322265625, -0.14446640014648438, -0.13913726806640625, -0.13380813598632812, -0.12847900390625, -0.12314987182617188, -0.11782073974609375, -0.11249160766601562, -0.1071624755859375, -0.10183334350585938, -0.09650421142578125, -0.09117507934570312, -0.085845947265625, -0.08051681518554688, -0.07518768310546875, -0.06985855102539062, -0.0645294189453125, -0.059200286865234375, -0.05387115478515625, -0.048542022705078125, -0.043212890625, -0.037883758544921875, -0.03255462646484375, -0.027225494384765625, -0.0218963623046875, -0.016567230224609375, -0.01123809814453125, -0.005908966064453125, -0.000579833984375, 0.004749298095703125, 0.01007843017578125, 0.015407562255859375, 0.0207366943359375, 0.026065826416015625, 0.03139495849609375, 0.036724090576171875, 0.04205322265625, 0.047382354736328125, 0.05271148681640625, 0.058040618896484375, 0.0633697509765625, 0.06869888305664062, 0.07402801513671875, 0.07935714721679688, 0.084686279296875, 0.09001541137695312, 0.09534454345703125, 0.10067367553710938, 0.1060028076171875, 0.11133193969726562, 0.11666107177734375, 0.12199020385742188, 0.1273193359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 11.0, 12.0, 15.0, 22.0, 20.0, 23.0, 25.0, 43.0, 58.0, 218.0, 266.0, 52.0, 33.0, 25.0, 34.0, 25.0, 10.0, 15.0, 11.0, 12.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1099853515625, -0.10632896423339844, -0.10267257690429688, -0.09901618957519531, -0.09535980224609375, -0.09170341491699219, -0.08804702758789062, -0.08439064025878906, -0.0807342529296875, -0.07707786560058594, -0.07342147827148438, -0.06976509094238281, -0.06610870361328125, -0.06245231628417969, -0.058795928955078125, -0.05513954162597656, -0.051483154296875, -0.04782676696777344, -0.044170379638671875, -0.04051399230957031, -0.03685760498046875, -0.03320121765136719, -0.029544830322265625, -0.025888442993164062, -0.0222320556640625, -0.018575668334960938, -0.014919281005859375, -0.011262893676757812, -0.00760650634765625, -0.0039501190185546875, -0.000293731689453125, 0.0033626556396484375, 0.00701904296875, 0.010675430297851562, 0.014331817626953125, 0.017988204956054688, 0.02164459228515625, 0.025300979614257812, 0.028957366943359375, 0.03261375427246094, 0.0362701416015625, 0.03992652893066406, 0.043582916259765625, 0.04723930358886719, 0.05089569091796875, 0.05455207824707031, 0.058208465576171875, 0.06186485290527344, 0.065521240234375, 0.06917762756347656, 0.07283401489257812, 0.07649040222167969, 0.08014678955078125, 0.08380317687988281, 0.08745956420898438, 0.09111595153808594, 0.0947723388671875, 0.09842872619628906, 0.10208511352539062, 0.10574150085449219, 0.10939788818359375, 0.11305427551269531, 0.11671066284179688, 0.12036705017089844, 0.1240234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 859.0, 146.0, 6.0], "bins": [-34.48314666748047, -33.9256477355957, -33.36814880371094, -32.810646057128906, -32.25314712524414, -31.695648193359375, -31.13814926147461, -30.58064842224121, -30.023149490356445, -29.46565055847168, -28.90814971923828, -28.350650787353516, -27.79315185546875, -27.23565101623535, -26.678152084350586, -26.120651245117188, -25.563152313232422, -25.005653381347656, -24.448152542114258, -23.890653610229492, -23.333152770996094, -22.775653839111328, -22.218154907226562, -21.660654067993164, -21.1031551361084, -20.545656204223633, -19.988155364990234, -19.43065643310547, -18.873157501220703, -18.315656661987305, -17.75815773010254, -17.20065689086914, -16.643157958984375, -16.08565902709961, -15.528158187866211, -14.970659255981445, -14.413159370422363, -13.855659484863281, -13.298160552978516, -12.740660667419434, -12.183160781860352, -11.62566089630127, -11.068161010742188, -10.510662078857422, -9.95316219329834, -9.395662307739258, -8.838163375854492, -8.28066349029541, -7.72316312789917, -7.165663719177246, -6.608163833618164, -6.050663948059082, -5.493164539337158, -4.935665130615234, -4.378165245056152, -3.8206655979156494, -3.2631659507751465, -2.7056663036346436, -2.1481666564941406, -1.5906670093536377, -1.0331673622131348, -0.47566771507263184, 0.0818319320678711, 0.639331579208374, 1.1968311071395874]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 6.0, 9.0, 9.0, 8.0, 16.0, 13.0, 25.0, 20.0, 29.0, 27.0, 39.0, 21.0, 32.0, 40.0, 48.0, 44.0, 61.0, 50.0, 47.0, 53.0, 32.0, 54.0, 41.0, 32.0, 39.0, 33.0, 22.0, 21.0, 22.0, 14.0, 20.0, 8.0, 12.0, 15.0, 11.0, 6.0, 6.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2465689182281494, -1.2084039449691772, -1.1702390909194946, -1.1320741176605225, -1.0939092636108398, -1.0557442903518677, -1.0175793170928955, -0.9794144630432129, -0.9412494897842407, -0.9030845761299133, -0.8649196624755859, -0.8267546892166138, -0.7885897755622864, -0.750424861907959, -0.7122599482536316, -0.6740950345993042, -0.6359301209449768, -0.5977652072906494, -0.559600293636322, -0.5214353799819946, -0.48327040672302246, -0.44510549306869507, -0.4069405794143677, -0.3687756359577179, -0.3306107223033905, -0.2924458086490631, -0.25428086519241333, -0.21611595153808594, -0.17795102298259735, -0.13978609442710876, -0.10162118077278137, -0.06345623731613159, -0.0252913236618042, 0.012873601168394089, 0.05103852599859238, 0.08920344710350037, 0.12736837565898895, 0.16553330421447754, 0.20369821786880493, 0.2418631613254547, 0.2800280749797821, 0.3181929886341095, 0.3563579320907593, 0.39452284574508667, 0.43268775939941406, 0.47085270285606384, 0.5090175867080688, 0.547182559967041, 0.5853474736213684, 0.6235123872756958, 0.6616773009300232, 0.6998422145843506, 0.7380071878433228, 0.7761721014976501, 0.8143370151519775, 0.8525019884109497, 0.8906668424606323, 0.9288317561149597, 0.9669966697692871, 1.0051616430282593, 1.043326497077942, 1.081491470336914, 1.1196563243865967, 1.1578212976455688, 1.195986270904541]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 11.0, 24.0, 28.0, 32.0, 93.0, 244.0, 753.0, 3201.0, 33354.0, 4099736.0, 51174.0, 4197.0, 873.0, 295.0, 114.0, 54.0, 35.0, 24.0, 11.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498291015625, -0.4825019836425781, -0.46671295166015625, -0.4509239196777344, -0.4351348876953125, -0.4193458557128906, -0.40355682373046875, -0.3877677917480469, -0.371978759765625, -0.3561897277832031, -0.34040069580078125, -0.3246116638183594, -0.3088226318359375, -0.2930335998535156, -0.27724456787109375, -0.2614555358886719, -0.24566650390625, -0.22987747192382812, -0.21408843994140625, -0.19829940795898438, -0.1825103759765625, -0.16672134399414062, -0.15093231201171875, -0.13514328002929688, -0.119354248046875, -0.10356521606445312, -0.08777618408203125, -0.07198715209960938, -0.0561981201171875, -0.040409088134765625, -0.02462005615234375, -0.008831024169921875, 0.0069580078125, 0.022747039794921875, 0.03853607177734375, 0.054325103759765625, 0.0701141357421875, 0.08590316772460938, 0.10169219970703125, 0.11748123168945312, 0.133270263671875, 0.14905929565429688, 0.16484832763671875, 0.18063735961914062, 0.1964263916015625, 0.21221542358398438, 0.22800445556640625, 0.24379348754882812, 0.25958251953125, 0.2753715515136719, 0.29116058349609375, 0.3069496154785156, 0.3227386474609375, 0.3385276794433594, 0.35431671142578125, 0.3701057434082031, 0.385894775390625, 0.4016838073730469, 0.41747283935546875, 0.4332618713378906, 0.4490509033203125, 0.4648399353027344, 0.48062896728515625, 0.4964179992675781, 0.51220703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 10.0, 9.0, 9.0, 20.0, 33.0, 43.0, 70.0, 82.0, 102.0, 119.0, 107.0, 105.0, 78.0, 68.0, 50.0, 23.0, 19.0, 25.0, 14.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1007080078125, -0.09765243530273438, -0.09459686279296875, -0.09154129028320312, -0.0884857177734375, -0.08543014526367188, -0.08237457275390625, -0.07931900024414062, -0.076263427734375, -0.07320785522460938, -0.07015228271484375, -0.06709671020507812, -0.0640411376953125, -0.060985565185546875, -0.05792999267578125, -0.054874420166015625, -0.05181884765625, -0.048763275146484375, -0.04570770263671875, -0.042652130126953125, -0.0395965576171875, -0.036540985107421875, -0.03348541259765625, -0.030429840087890625, -0.027374267578125, -0.024318695068359375, -0.02126312255859375, -0.018207550048828125, -0.0151519775390625, -0.012096405029296875, -0.00904083251953125, -0.005985260009765625, -0.0029296875, 0.000125885009765625, 0.00318145751953125, 0.006237030029296875, 0.0092926025390625, 0.012348175048828125, 0.01540374755859375, 0.018459320068359375, 0.021514892578125, 0.024570465087890625, 0.02762603759765625, 0.030681610107421875, 0.0337371826171875, 0.036792755126953125, 0.03984832763671875, 0.042903900146484375, 0.04595947265625, 0.049015045166015625, 0.05207061767578125, 0.055126190185546875, 0.0581817626953125, 0.061237335205078125, 0.06429290771484375, 0.06734848022460938, 0.070404052734375, 0.07345962524414062, 0.07651519775390625, 0.07957077026367188, 0.0826263427734375, 0.08568191528320312, 0.08873748779296875, 0.09179306030273438, 0.0948486328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 18.0, 22.0, 33.0, 68.0, 89.0, 177.0, 294.0, 496.0, 904.0, 2091.0, 7983.0, 83395.0, 4032252.0, 56045.0, 6706.0, 1786.0, 823.0, 461.0, 276.0, 139.0, 93.0, 57.0, 31.0, 17.0, 9.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390380859375, -0.3779640197753906, -0.36554718017578125, -0.3531303405761719, -0.3407135009765625, -0.3282966613769531, -0.31587982177734375, -0.3034629821777344, -0.291046142578125, -0.2786293029785156, -0.26621246337890625, -0.2537956237792969, -0.2413787841796875, -0.22896194458007812, -0.21654510498046875, -0.20412826538085938, -0.19171142578125, -0.17929458618164062, -0.16687774658203125, -0.15446090698242188, -0.1420440673828125, -0.12962722778320312, -0.11721038818359375, -0.10479354858398438, -0.092376708984375, -0.07995986938476562, -0.06754302978515625, -0.055126190185546875, -0.0427093505859375, -0.030292510986328125, -0.01787567138671875, -0.005458831787109375, 0.0069580078125, 0.019374847412109375, 0.03179168701171875, 0.044208526611328125, 0.0566253662109375, 0.06904220581054688, 0.08145904541015625, 0.09387588500976562, 0.106292724609375, 0.11870956420898438, 0.13112640380859375, 0.14354324340820312, 0.1559600830078125, 0.16837692260742188, 0.18079376220703125, 0.19321060180664062, 0.20562744140625, 0.21804428100585938, 0.23046112060546875, 0.24287796020507812, 0.2552947998046875, 0.2677116394042969, 0.28012847900390625, 0.2925453186035156, 0.304962158203125, 0.3173789978027344, 0.32979583740234375, 0.3422126770019531, 0.3546295166015625, 0.3670463562011719, 0.37946319580078125, 0.3918800354003906, 0.404296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 11.0, 13.0, 28.0, 56.0, 225.0, 2719.0, 819.0, 102.0, 45.0, 21.0, 12.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2066650390625, -0.20037269592285156, -0.19408035278320312, -0.1877880096435547, -0.18149566650390625, -0.1752033233642578, -0.16891098022460938, -0.16261863708496094, -0.1563262939453125, -0.15003395080566406, -0.14374160766601562, -0.1374492645263672, -0.13115692138671875, -0.12486457824707031, -0.11857223510742188, -0.11227989196777344, -0.105987548828125, -0.09969520568847656, -0.09340286254882812, -0.08711051940917969, -0.08081817626953125, -0.07452583312988281, -0.06823348999023438, -0.06194114685058594, -0.0556488037109375, -0.04935646057128906, -0.043064117431640625, -0.03677177429199219, -0.03047943115234375, -0.024187088012695312, -0.017894744873046875, -0.011602401733398438, -0.00531005859375, 0.0009822845458984375, 0.007274627685546875, 0.013566970825195312, 0.01985931396484375, 0.026151657104492188, 0.032444000244140625, 0.03873634338378906, 0.0450286865234375, 0.05132102966308594, 0.057613372802734375, 0.06390571594238281, 0.07019805908203125, 0.07649040222167969, 0.08278274536132812, 0.08907508850097656, 0.095367431640625, 0.10165977478027344, 0.10795211791992188, 0.11424446105957031, 0.12053680419921875, 0.1268291473388672, 0.13312149047851562, 0.13941383361816406, 0.1457061767578125, 0.15199851989746094, 0.15829086303710938, 0.1645832061767578, 0.17087554931640625, 0.1771678924560547, 0.18346023559570312, 0.18975257873535156, 0.196044921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 15.0, 47.0, 65.0, 174.0, 297.0, 212.0, 93.0, 51.0, 14.0, 10.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49684569239616394, -0.4729893207550049, -0.4491329491138458, -0.42527657747268677, -0.4014201760292053, -0.37756383419036865, -0.3537074327468872, -0.32985106110572815, -0.3059946894645691, -0.28213831782341003, -0.258281946182251, -0.23442555963993073, -0.21056918799877167, -0.1867128163576126, -0.16285642981529236, -0.1390000581741333, -0.11514368653297424, -0.09128731489181519, -0.06743093580007553, -0.043574556708335876, -0.01971818506717682, 0.004138186573982239, 0.02799457311630249, 0.05185094475746155, 0.0757073163986206, 0.09956368803977966, 0.12342006713151932, 0.14727644622325897, 0.17113281786441803, 0.1949891895055771, 0.21884557604789734, 0.2427019476890564, 0.26655828952789307, 0.2904146611690521, 0.3142710328102112, 0.3381274342536926, 0.3619837760925293, 0.38584017753601074, 0.4096965491771698, 0.43355292081832886, 0.4574092924594879, 0.481265664100647, 0.5051220655441284, 0.5289784073829651, 0.5528348088264465, 0.5766911506652832, 0.6005475521087646, 0.6244039535522461, 0.6482602953910828, 0.6721166968345642, 0.6959730386734009, 0.7198294401168823, 0.743685781955719, 0.7675421833992004, 0.7913985252380371, 0.8152549266815186, 0.839111328125, 0.8629677295684814, 0.8868240714073181, 0.9106804728507996, 0.9345368146896362, 0.9583932161331177, 0.9822496175765991, 1.006105899810791, 1.0299623012542725]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 6.0, 14.0, 19.0, 12.0, 13.0, 28.0, 31.0, 28.0, 36.0, 46.0, 48.0, 47.0, 61.0, 70.0, 70.0, 66.0, 61.0, 49.0, 55.0, 53.0, 50.0, 36.0, 29.0, 19.0, 17.0, 13.0, 9.0, 3.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36349231004714966, -0.34973224997520447, -0.3359721899032593, -0.3222121298313141, -0.3084520697593689, -0.2946920096874237, -0.2809319496154785, -0.2671718895435333, -0.25341182947158813, -0.23965176939964294, -0.22589170932769775, -0.21213164925575256, -0.19837158918380737, -0.18461152911186218, -0.170851469039917, -0.1570914089679718, -0.1433313637971878, -0.12957130372524261, -0.11581124365329742, -0.10205118358135223, -0.08829112350940704, -0.07453107088804245, -0.06077101081609726, -0.04701095074415207, -0.03325089067220688, -0.019490830600261688, -0.005730772390961647, 0.008029285818338394, 0.021789345890283585, 0.03554940223693848, 0.04930946230888367, 0.06306952238082886, 0.07682958245277405, 0.09058964252471924, 0.10434970259666443, 0.11810976266860962, 0.1318698227405548, 0.1456298828125, 0.1593899428844452, 0.17315000295639038, 0.18691006302833557, 0.20067012310028076, 0.21443018317222595, 0.22819024324417114, 0.24195030331611633, 0.2557103633880615, 0.2694704234600067, 0.2832304835319519, 0.2969905138015747, 0.3107505738735199, 0.3245106339454651, 0.3382706940174103, 0.35203075408935547, 0.36579081416130066, 0.37955087423324585, 0.39331093430519104, 0.40707099437713623, 0.4208310544490814, 0.4345911145210266, 0.4483511745929718, 0.462111234664917, 0.4758712947368622, 0.4896313548088074, 0.5033913850784302, 0.5171514749526978]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 9.0, 14.0, 22.0, 30.0, 45.0, 79.0, 109.0, 179.0, 299.0, 529.0, 1141.0, 2583.0, 7776.0, 29681.0, 264451.0, 675588.0, 48622.0, 10878.0, 3557.0, 1382.0, 642.0, 338.0, 215.0, 118.0, 73.0, 41.0, 33.0, 27.0, 25.0, 19.0, 15.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.217529296875, -0.2109661102294922, -0.20440292358398438, -0.19783973693847656, -0.19127655029296875, -0.18471336364746094, -0.17815017700195312, -0.1715869903564453, -0.1650238037109375, -0.1584606170654297, -0.15189743041992188, -0.14533424377441406, -0.13877105712890625, -0.13220787048339844, -0.12564468383789062, -0.11908149719238281, -0.112518310546875, -0.10595512390136719, -0.09939193725585938, -0.09282875061035156, -0.08626556396484375, -0.07970237731933594, -0.07313919067382812, -0.06657600402832031, -0.0600128173828125, -0.05344963073730469, -0.046886444091796875, -0.04032325744628906, -0.03376007080078125, -0.027196884155273438, -0.020633697509765625, -0.014070510864257812, -0.00750732421875, -0.0009441375732421875, 0.005619049072265625, 0.012182235717773438, 0.01874542236328125, 0.025308609008789062, 0.031871795654296875, 0.03843498229980469, 0.0449981689453125, 0.05156135559082031, 0.058124542236328125, 0.06468772888183594, 0.07125091552734375, 0.07781410217285156, 0.08437728881835938, 0.09094047546386719, 0.097503662109375, 0.10406684875488281, 0.11063003540039062, 0.11719322204589844, 0.12375640869140625, 0.13031959533691406, 0.13688278198242188, 0.1434459686279297, 0.1500091552734375, 0.1565723419189453, 0.16313552856445312, 0.16969871520996094, 0.17626190185546875, 0.18282508850097656, 0.18938827514648438, 0.1959514617919922, 0.2025146484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 13.0, 12.0, 18.0, 36.0, 36.0, 61.0, 99.0, 101.0, 105.0, 108.0, 98.0, 88.0, 67.0, 43.0, 33.0, 20.0, 20.0, 14.0, 14.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.103515625, -0.10038471221923828, -0.09725379943847656, -0.09412288665771484, -0.09099197387695312, -0.0878610610961914, -0.08473014831542969, -0.08159923553466797, -0.07846832275390625, -0.07533740997314453, -0.07220649719238281, -0.0690755844116211, -0.06594467163085938, -0.06281375885009766, -0.05968284606933594, -0.05655193328857422, -0.0534210205078125, -0.05029010772705078, -0.04715919494628906, -0.044028282165527344, -0.040897369384765625, -0.037766456604003906, -0.03463554382324219, -0.03150463104248047, -0.02837371826171875, -0.02524280548095703, -0.022111892700195312, -0.018980979919433594, -0.015850067138671875, -0.012719154357910156, -0.009588241577148438, -0.006457328796386719, -0.003326416015625, -0.00019550323486328125, 0.0029354095458984375, 0.006066322326660156, 0.009197235107421875, 0.012328147888183594, 0.015459060668945312, 0.01858997344970703, 0.02172088623046875, 0.02485179901123047, 0.027982711791992188, 0.031113624572753906, 0.034244537353515625, 0.037375450134277344, 0.04050636291503906, 0.04363727569580078, 0.0467681884765625, 0.04989910125732422, 0.05303001403808594, 0.056160926818847656, 0.059291839599609375, 0.062422752380371094, 0.06555366516113281, 0.06868457794189453, 0.07181549072265625, 0.07494640350341797, 0.07807731628417969, 0.0812082290649414, 0.08433914184570312, 0.08747005462646484, 0.09060096740722656, 0.09373188018798828, 0.09686279296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 6.0, 11.0, 22.0, 25.0, 35.0, 50.0, 73.0, 132.0, 228.0, 400.0, 867.0, 2081.0, 6551.0, 26575.0, 186767.0, 742393.0, 62874.0, 12956.0, 3651.0, 1428.0, 630.0, 300.0, 170.0, 106.0, 80.0, 37.0, 23.0, 18.0, 18.0, 17.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.22072982788085938, -0.21428680419921875, -0.20784378051757812, -0.2014007568359375, -0.19495773315429688, -0.18851470947265625, -0.18207168579101562, -0.175628662109375, -0.16918563842773438, -0.16274261474609375, -0.15629959106445312, -0.1498565673828125, -0.14341354370117188, -0.13697052001953125, -0.13052749633789062, -0.12408447265625, -0.11764144897460938, -0.11119842529296875, -0.10475540161132812, -0.0983123779296875, -0.09186935424804688, -0.08542633056640625, -0.07898330688476562, -0.072540283203125, -0.06609725952148438, -0.05965423583984375, -0.053211212158203125, -0.0467681884765625, -0.040325164794921875, -0.03388214111328125, -0.027439117431640625, -0.02099609375, -0.014553070068359375, -0.00811004638671875, -0.001667022705078125, 0.0047760009765625, 0.011219024658203125, 0.01766204833984375, 0.024105072021484375, 0.030548095703125, 0.036991119384765625, 0.04343414306640625, 0.049877166748046875, 0.0563201904296875, 0.06276321411132812, 0.06920623779296875, 0.07564926147460938, 0.08209228515625, 0.08853530883789062, 0.09497833251953125, 0.10142135620117188, 0.1078643798828125, 0.11430740356445312, 0.12075042724609375, 0.12719345092773438, 0.133636474609375, 0.14007949829101562, 0.14652252197265625, 0.15296554565429688, 0.1594085693359375, 0.16585159301757812, 0.17229461669921875, 0.17873764038085938, 0.1851806640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 11.0, 13.0, 15.0, 13.0, 22.0, 26.0, 32.0, 48.0, 44.0, 41.0, 43.0, 60.0, 59.0, 49.0, 54.0, 45.0, 44.0, 35.0, 37.0, 36.0, 34.0, 39.0, 43.0, 24.0, 18.0, 17.0, 17.0, 10.0, 13.0, 4.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27587890625, -0.2677764892578125, -0.259674072265625, -0.2515716552734375, -0.24346923828125, -0.2353668212890625, -0.227264404296875, -0.2191619873046875, -0.2110595703125, -0.2029571533203125, -0.194854736328125, -0.1867523193359375, -0.17864990234375, -0.1705474853515625, -0.162445068359375, -0.1543426513671875, -0.146240234375, -0.1381378173828125, -0.130035400390625, -0.1219329833984375, -0.11383056640625, -0.1057281494140625, -0.097625732421875, -0.0895233154296875, -0.0814208984375, -0.0733184814453125, -0.065216064453125, -0.0571136474609375, -0.04901123046875, -0.0409088134765625, -0.032806396484375, -0.0247039794921875, -0.0166015625, -0.0084991455078125, -0.000396728515625, 0.0077056884765625, 0.01580810546875, 0.0239105224609375, 0.032012939453125, 0.0401153564453125, 0.0482177734375, 0.0563201904296875, 0.064422607421875, 0.0725250244140625, 0.08062744140625, 0.0887298583984375, 0.096832275390625, 0.1049346923828125, 0.113037109375, 0.1211395263671875, 0.129241943359375, 0.1373443603515625, 0.14544677734375, 0.1535491943359375, 0.161651611328125, 0.1697540283203125, 0.1778564453125, 0.1859588623046875, 0.194061279296875, 0.2021636962890625, 0.21026611328125, 0.2183685302734375, 0.226470947265625, 0.2345733642578125, 0.24267578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 3.0, 10.0, 12.0, 13.0, 21.0, 28.0, 66.0, 100.0, 232.0, 541.0, 1723.0, 9890.0, 188998.0, 820126.0, 22581.0, 2848.0, 731.0, 287.0, 124.0, 59.0, 45.0, 28.0, 21.0, 12.0, 8.0, 9.0, 5.0, 5.0, 8.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1407470703125, -0.1365032196044922, -0.13225936889648438, -0.12801551818847656, -0.12377166748046875, -0.11952781677246094, -0.11528396606445312, -0.11104011535644531, -0.1067962646484375, -0.10255241394042969, -0.09830856323242188, -0.09406471252441406, -0.08982086181640625, -0.08557701110839844, -0.08133316040039062, -0.07708930969238281, -0.072845458984375, -0.06860160827636719, -0.06435775756835938, -0.06011390686035156, -0.05587005615234375, -0.05162620544433594, -0.047382354736328125, -0.04313850402832031, -0.0388946533203125, -0.03465080261230469, -0.030406951904296875, -0.026163101196289062, -0.02191925048828125, -0.017675399780273438, -0.013431549072265625, -0.009187698364257812, -0.00494384765625, -0.0006999969482421875, 0.003543853759765625, 0.0077877044677734375, 0.01203155517578125, 0.016275405883789062, 0.020519256591796875, 0.024763107299804688, 0.0290069580078125, 0.03325080871582031, 0.037494659423828125, 0.04173851013183594, 0.04598236083984375, 0.05022621154785156, 0.054470062255859375, 0.05871391296386719, 0.062957763671875, 0.06720161437988281, 0.07144546508789062, 0.07568931579589844, 0.07993316650390625, 0.08417701721191406, 0.08842086791992188, 0.09266471862792969, 0.0969085693359375, 0.10115242004394531, 0.10539627075195312, 0.10964012145996094, 0.11388397216796875, 0.11812782287597656, 0.12237167358398438, 0.1266155242919922, 0.130859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 1.0, 10.0, 15.0, 20.0, 30.0, 25.0, 61.0, 71.0, 88.0, 134.0, 135.0, 123.0, 81.0, 51.0, 37.0, 24.0, 19.0, 13.0, 9.0, 4.0, 8.0, 1.0, 5.0, 12.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18235969543457e-05, -6.908830255270004e-05, -6.635300815105438e-05, -6.361771374940872e-05, -6.088241934776306e-05, -5.81471249461174e-05, -5.541183054447174e-05, -5.267653614282608e-05, -4.994124174118042e-05, -4.720594733953476e-05, -4.44706529378891e-05, -4.173535853624344e-05, -3.900006413459778e-05, -3.626476973295212e-05, -3.352947533130646e-05, -3.07941809296608e-05, -2.8058886528015137e-05, -2.5323592126369476e-05, -2.2588297724723816e-05, -1.9853003323078156e-05, -1.7117708921432495e-05, -1.4382414519786835e-05, -1.1647120118141174e-05, -8.911825716495514e-06, -6.1765313148498535e-06, -3.441236913204193e-06, -7.059425115585327e-07, 2.0293518900871277e-06, 4.764646291732788e-06, 7.4999406933784485e-06, 1.0235235095024109e-05, 1.297052949666977e-05, 1.570582389831543e-05, 1.844111829996109e-05, 2.117641270160675e-05, 2.391170710325241e-05, 2.664700150489807e-05, 2.938229590654373e-05, 3.211759030818939e-05, 3.485288470983505e-05, 3.758817911148071e-05, 4.032347351312637e-05, 4.3058767914772034e-05, 4.5794062316417694e-05, 4.8529356718063354e-05, 5.1264651119709015e-05, 5.3999945521354675e-05, 5.6735239923000336e-05, 5.9470534324645996e-05, 6.220582872629166e-05, 6.494112312793732e-05, 6.767641752958298e-05, 7.041171193122864e-05, 7.31470063328743e-05, 7.588230073451996e-05, 7.861759513616562e-05, 8.135288953781128e-05, 8.408818393945694e-05, 8.68234783411026e-05, 8.955877274274826e-05, 9.229406714439392e-05, 9.502936154603958e-05, 9.776465594768524e-05, 0.0001004999503493309, 0.00010323524475097656]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 7.0, 17.0, 32.0, 60.0, 95.0, 227.0, 551.0, 2060.0, 15387.0, 770148.0, 247639.0, 9890.0, 1552.0, 493.0, 170.0, 93.0, 50.0, 21.0, 22.0, 11.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103271484375, -0.09833335876464844, -0.09339523315429688, -0.08845710754394531, -0.08351898193359375, -0.07858085632324219, -0.07364273071289062, -0.06870460510253906, -0.0637664794921875, -0.05882835388183594, -0.053890228271484375, -0.04895210266113281, -0.04401397705078125, -0.03907585144042969, -0.034137725830078125, -0.029199600219726562, -0.024261474609375, -0.019323348999023438, -0.014385223388671875, -0.009447097778320312, -0.00450897216796875, 0.0004291534423828125, 0.005367279052734375, 0.010305404663085938, 0.0152435302734375, 0.020181655883789062, 0.025119781494140625, 0.030057907104492188, 0.03499603271484375, 0.03993415832519531, 0.044872283935546875, 0.04981040954589844, 0.05474853515625, 0.05968666076660156, 0.06462478637695312, 0.06956291198730469, 0.07450103759765625, 0.07943916320800781, 0.08437728881835938, 0.08931541442871094, 0.0942535400390625, 0.09919166564941406, 0.10412979125976562, 0.10906791687011719, 0.11400604248046875, 0.11894416809082031, 0.12388229370117188, 0.12882041931152344, 0.133758544921875, 0.13869667053222656, 0.14363479614257812, 0.1485729217529297, 0.15351104736328125, 0.1584491729736328, 0.16338729858398438, 0.16832542419433594, 0.1732635498046875, 0.17820167541503906, 0.18313980102539062, 0.1880779266357422, 0.19301605224609375, 0.1979541778564453, 0.20289230346679688, 0.20783042907714844, 0.2127685546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 7.0, 9.0, 7.0, 8.0, 20.0, 33.0, 50.0, 51.0, 88.0, 274.0, 183.0, 74.0, 50.0, 39.0, 29.0, 13.0, 15.0, 10.0, 7.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08233642578125, -0.0787210464477539, -0.07510566711425781, -0.07149028778076172, -0.06787490844726562, -0.06425952911376953, -0.06064414978027344, -0.057028770446777344, -0.05341339111328125, -0.049798011779785156, -0.04618263244628906, -0.04256725311279297, -0.038951873779296875, -0.03533649444580078, -0.03172111511230469, -0.028105735778808594, -0.0244903564453125, -0.020874977111816406, -0.017259597778320312, -0.013644218444824219, -0.010028839111328125, -0.006413459777832031, -0.0027980804443359375, 0.0008172988891601562, 0.00443267822265625, 0.008048057556152344, 0.011663436889648438, 0.015278816223144531, 0.018894195556640625, 0.02250957489013672, 0.026124954223632812, 0.029740333557128906, 0.033355712890625, 0.036971092224121094, 0.04058647155761719, 0.04420185089111328, 0.047817230224609375, 0.05143260955810547, 0.05504798889160156, 0.058663368225097656, 0.06227874755859375, 0.06589412689208984, 0.06950950622558594, 0.07312488555908203, 0.07674026489257812, 0.08035564422607422, 0.08397102355957031, 0.0875864028930664, 0.0912017822265625, 0.0948171615600586, 0.09843254089355469, 0.10204792022705078, 0.10566329956054688, 0.10927867889404297, 0.11289405822753906, 0.11650943756103516, 0.12012481689453125, 0.12374019622802734, 0.12735557556152344, 0.13097095489501953, 0.13458633422851562, 0.13820171356201172, 0.1418170928955078, 0.1454324722290039, 0.1490478515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 573.0, 421.0, 12.0, 4.0], "bins": [-16.600149154663086, -16.327838897705078, -16.055530548095703, -15.783220291137695, -15.510910987854004, -15.238601684570312, -14.966291427612305, -14.693982124328613, -14.421672821044922, -14.14936351776123, -13.877053260803223, -13.604743957519531, -13.33243465423584, -13.060125350952148, -12.78781509399414, -12.51550579071045, -12.243196487426758, -11.970887184143066, -11.698576927185059, -11.426267623901367, -11.153958320617676, -10.881649017333984, -10.609338760375977, -10.337029457092285, -10.064719200134277, -9.792409896850586, -9.520099639892578, -9.247790336608887, -8.975481033325195, -8.703171730041504, -8.430861473083496, -8.158552169799805, -7.8862433433532715, -7.613933563232422, -7.3416242599487305, -7.069314479827881, -6.7970051765441895, -6.52469539642334, -6.252386093139648, -5.980076313018799, -5.707766532897949, -5.4354567527771, -5.163147449493408, -4.890837669372559, -4.618528366088867, -4.346218585968018, -4.073908805847168, -3.8015995025634766, -3.529290199279785, -3.2569806575775146, -2.984671115875244, -2.7123613357543945, -2.440052032470703, -2.1677422523498535, -1.895432710647583, -1.6231231689453125, -1.350813627243042, -1.0785040855407715, -0.8061944842338562, -0.5338848829269409, -0.2615753412246704, 0.010734200477600098, 0.28304386138916016, 0.5553534030914307, 0.827663004398346]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 6.0, 1.0, 5.0, 5.0, 3.0, 8.0, 11.0, 7.0, 14.0, 9.0, 12.0, 13.0, 20.0, 18.0, 24.0, 28.0, 33.0, 21.0, 30.0, 32.0, 32.0, 31.0, 28.0, 42.0, 39.0, 38.0, 45.0, 38.0, 46.0, 38.0, 30.0, 40.0, 32.0, 23.0, 23.0, 18.0, 26.0, 27.0, 13.0, 26.0, 18.0, 10.0, 8.0, 10.0, 6.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9027281999588013, -0.8719969391822815, -0.8412656188011169, -0.8105343580245972, -0.7798030376434326, -0.7490717768669128, -0.7183405160903931, -0.6876091957092285, -0.6568779349327087, -0.626146674156189, -0.5954153537750244, -0.5646840929985046, -0.5339527726173401, -0.5032215118408203, -0.47249022126197815, -0.441758930683136, -0.4110276401042938, -0.38029634952545166, -0.3495650589466095, -0.31883376836776733, -0.28810250759124756, -0.2573712170124054, -0.22663992643356323, -0.19590865075588226, -0.1651773601770401, -0.13444606959819794, -0.10371479392051697, -0.0729835033416748, -0.04225222021341324, -0.011520937085151672, 0.01921035349369049, 0.04994162917137146, 0.08067291975021362, 0.11140420287847519, 0.14213548600673676, 0.17286677658557892, 0.2035980522632599, 0.23432934284210205, 0.2650606334209442, 0.2957919239997864, 0.32652318477630615, 0.3572544753551483, 0.3879857659339905, 0.41871702671051025, 0.4494483172893524, 0.4801796078681946, 0.5109108686447144, 0.5416421890258789, 0.5723735094070435, 0.6031047701835632, 0.6338360905647278, 0.6645673513412476, 0.6952986717224121, 0.7260299324989319, 0.7567611932754517, 0.7874925136566162, 0.818223774433136, 0.8489550352096558, 0.8796863555908203, 0.9104176163673401, 0.9411489367485046, 0.9718801975250244, 1.002611517906189, 1.033342719078064, 1.0640740394592285]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 15.0, 10.0, 15.0, 27.0, 102.0, 254.0, 931.0, 7670.0, 4042339.0, 138076.0, 3841.0, 650.0, 189.0, 71.0, 34.0, 22.0, 9.0, 11.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0216293334960938, -0.9905242919921875, -0.9594192504882812, -0.928314208984375, -0.8972091674804688, -0.8661041259765625, -0.8349990844726562, -0.80389404296875, -0.7727890014648438, -0.7416839599609375, -0.7105789184570312, -0.679473876953125, -0.6483688354492188, -0.6172637939453125, -0.5861587524414062, -0.5550537109375, -0.5239486694335938, -0.4928436279296875, -0.46173858642578125, -0.430633544921875, -0.39952850341796875, -0.3684234619140625, -0.33731842041015625, -0.30621337890625, -0.27510833740234375, -0.2440032958984375, -0.21289825439453125, -0.181793212890625, -0.15068817138671875, -0.1195831298828125, -0.08847808837890625, -0.057373046875, -0.02626800537109375, 0.0048370361328125, 0.03594207763671875, 0.067047119140625, 0.09815216064453125, 0.1292572021484375, 0.16036224365234375, 0.19146728515625, 0.22257232666015625, 0.2536773681640625, 0.28478240966796875, 0.315887451171875, 0.34699249267578125, 0.3780975341796875, 0.40920257568359375, 0.4403076171875, 0.47141265869140625, 0.5025177001953125, 0.5336227416992188, 0.564727783203125, 0.5958328247070312, 0.6269378662109375, 0.6580429077148438, 0.68914794921875, 0.7202529907226562, 0.7513580322265625, 0.7824630737304688, 0.813568115234375, 0.8446731567382812, 0.8757781982421875, 0.9068832397460938, 0.93798828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 8.0, 15.0, 29.0, 31.0, 63.0, 67.0, 105.0, 108.0, 115.0, 109.0, 90.0, 70.0, 51.0, 43.0, 23.0, 21.0, 16.0, 9.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10394287109375, -0.10083866119384766, -0.09773445129394531, -0.09463024139404297, -0.09152603149414062, -0.08842182159423828, -0.08531761169433594, -0.0822134017944336, -0.07910919189453125, -0.0760049819946289, -0.07290077209472656, -0.06979656219482422, -0.06669235229492188, -0.06358814239501953, -0.06048393249511719, -0.057379722595214844, -0.0542755126953125, -0.051171302795410156, -0.04806709289550781, -0.04496288299560547, -0.041858673095703125, -0.03875446319580078, -0.03565025329589844, -0.032546043395996094, -0.02944183349609375, -0.026337623596191406, -0.023233413696289062, -0.02012920379638672, -0.017024993896484375, -0.013920783996582031, -0.010816574096679688, -0.007712364196777344, -0.004608154296875, -0.0015039443969726562, 0.0016002655029296875, 0.004704475402832031, 0.007808685302734375, 0.010912895202636719, 0.014017105102539062, 0.017121315002441406, 0.02022552490234375, 0.023329734802246094, 0.026433944702148438, 0.02953815460205078, 0.032642364501953125, 0.03574657440185547, 0.03885078430175781, 0.041954994201660156, 0.0450592041015625, 0.048163414001464844, 0.05126762390136719, 0.05437183380126953, 0.057476043701171875, 0.06058025360107422, 0.06368446350097656, 0.0667886734008789, 0.06989288330078125, 0.0729970932006836, 0.07610130310058594, 0.07920551300048828, 0.08230972290039062, 0.08541393280029297, 0.08851814270019531, 0.09162235260009766, 0.0947265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 6.0, 16.0, 20.0, 30.0, 30.0, 47.0, 71.0, 73.0, 105.0, 162.0, 269.0, 387.0, 693.0, 1213.0, 2525.0, 7550.0, 44504.0, 3855720.0, 255311.0, 16880.0, 4449.0, 1724.0, 903.0, 563.0, 314.0, 219.0, 124.0, 110.0, 69.0, 46.0, 40.0, 34.0, 21.0, 11.0, 12.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.375396728515625, -0.36187744140625, -0.348358154296875, -0.3348388671875, -0.321319580078125, -0.30780029296875, -0.294281005859375, -0.28076171875, -0.267242431640625, -0.25372314453125, -0.240203857421875, -0.2266845703125, -0.213165283203125, -0.19964599609375, -0.186126708984375, -0.172607421875, -0.159088134765625, -0.14556884765625, -0.132049560546875, -0.1185302734375, -0.105010986328125, -0.09149169921875, -0.077972412109375, -0.064453125, -0.050933837890625, -0.03741455078125, -0.023895263671875, -0.0103759765625, 0.003143310546875, 0.01666259765625, 0.030181884765625, 0.043701171875, 0.057220458984375, 0.07073974609375, 0.084259033203125, 0.0977783203125, 0.111297607421875, 0.12481689453125, 0.138336181640625, 0.15185546875, 0.165374755859375, 0.17889404296875, 0.192413330078125, 0.2059326171875, 0.219451904296875, 0.23297119140625, 0.246490478515625, 0.260009765625, 0.273529052734375, 0.28704833984375, 0.300567626953125, 0.3140869140625, 0.327606201171875, 0.34112548828125, 0.354644775390625, 0.3681640625, 0.381683349609375, 0.39520263671875, 0.408721923828125, 0.4222412109375, 0.435760498046875, 0.44927978515625, 0.462799072265625, 0.476318359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 21.0, 37.0, 173.0, 3066.0, 615.0, 80.0, 27.0, 16.0, 11.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322265625, -0.31180572509765625, -0.3013458251953125, -0.29088592529296875, -0.280426025390625, -0.26996612548828125, -0.2595062255859375, -0.24904632568359375, -0.23858642578125, -0.22812652587890625, -0.2176666259765625, -0.20720672607421875, -0.196746826171875, -0.18628692626953125, -0.1758270263671875, -0.16536712646484375, -0.1549072265625, -0.14444732666015625, -0.1339874267578125, -0.12352752685546875, -0.113067626953125, -0.10260772705078125, -0.0921478271484375, -0.08168792724609375, -0.07122802734375, -0.06076812744140625, -0.0503082275390625, -0.03984832763671875, -0.029388427734375, -0.01892852783203125, -0.0084686279296875, 0.00199127197265625, 0.012451171875, 0.02291107177734375, 0.0333709716796875, 0.04383087158203125, 0.054290771484375, 0.06475067138671875, 0.0752105712890625, 0.08567047119140625, 0.09613037109375, 0.10659027099609375, 0.1170501708984375, 0.12751007080078125, 0.137969970703125, 0.14842987060546875, 0.1588897705078125, 0.16934967041015625, 0.1798095703125, 0.19026947021484375, 0.2007293701171875, 0.21118927001953125, 0.221649169921875, 0.23210906982421875, 0.2425689697265625, 0.25302886962890625, 0.26348876953125, 0.27394866943359375, 0.2844085693359375, 0.29486846923828125, 0.305328369140625, 0.31578826904296875, 0.3262481689453125, 0.33670806884765625, 0.34716796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 10.0, 7.0, 19.0, 25.0, 39.0, 52.0, 99.0, 143.0, 172.0, 144.0, 123.0, 68.0, 36.0, 17.0, 11.0, 12.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.7999388575553894, -0.7821212410926819, -0.7643036246299744, -0.7464860081672668, -0.7286684513092041, -0.7108508348464966, -0.6930332183837891, -0.6752156019210815, -0.657397985458374, -0.6395803689956665, -0.621762752532959, -0.6039451360702515, -0.586127519607544, -0.5683099627494812, -0.5504923462867737, -0.5326747298240662, -0.5148571133613586, -0.4970394968986511, -0.4792218804359436, -0.46140429377555847, -0.44358667731285095, -0.42576906085014343, -0.4079514741897583, -0.3901338577270508, -0.37231624126434326, -0.35449862480163574, -0.3366810083389282, -0.3188634216785431, -0.30104580521583557, -0.28322818875312805, -0.2654106020927429, -0.2475929856300354, -0.2297753095626831, -0.21195769309997559, -0.19414009153842926, -0.17632248997688293, -0.15850487351417542, -0.1406872570514679, -0.12286965548992157, -0.10505204647779465, -0.08723443746566772, -0.0694168284535408, -0.05159921944141388, -0.03378161042928696, -0.015964001417160034, 0.0018536075949668884, 0.01967121660709381, 0.037488825619220734, 0.055306434631347656, 0.07312404364347458, 0.0909416526556015, 0.10875926166772842, 0.12657687067985535, 0.14439448714256287, 0.1622120887041092, 0.18002969026565552, 0.19784730672836304, 0.21566492319107056, 0.23348252475261688, 0.2513001263141632, 0.2691177427768707, 0.28693535923957825, 0.3047529458999634, 0.3225705623626709, 0.3403881788253784]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 7.0, 17.0, 17.0, 27.0, 20.0, 39.0, 35.0, 53.0, 51.0, 65.0, 59.0, 57.0, 57.0, 77.0, 67.0, 53.0, 46.0, 40.0, 34.0, 35.0, 24.0, 24.0, 20.0, 21.0, 14.0, 16.0, 2.0, 6.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4931862950325012, -0.4745917022228241, -0.45599713921546936, -0.43740254640579224, -0.4188079833984375, -0.4002133905887604, -0.38161879777908325, -0.3630242347717285, -0.3444296419620514, -0.32583504915237427, -0.30724048614501953, -0.2886458933353424, -0.2700513005256653, -0.25145673751831055, -0.23286214470863342, -0.2142675668001175, -0.19567298889160156, -0.17707841098308563, -0.1584838330745697, -0.13988924026489258, -0.12129466235637665, -0.10270008444786072, -0.08410549908876419, -0.06551091372966766, -0.04691633582115173, -0.028321754187345505, -0.009727172553539276, 0.008867409080266953, 0.02746199071407318, 0.04605656862258911, 0.06465115398168564, 0.08324573934078217, 0.1018403172492981, 0.12043489515781403, 0.13902947306632996, 0.15762406587600708, 0.176218643784523, 0.19481322169303894, 0.21340781450271606, 0.232002392411232, 0.2505969703197479, 0.26919156312942505, 0.2877861261367798, 0.3063807189464569, 0.32497531175613403, 0.34356987476348877, 0.3621644675731659, 0.380759060382843, 0.39935362339019775, 0.4179482161998749, 0.4365427792072296, 0.45513737201690674, 0.4737319350242615, 0.4923265278339386, 0.5109211206436157, 0.5295156836509705, 0.5481102466583252, 0.5667048096656799, 0.5852994322776794, 0.6038939952850342, 0.6224885582923889, 0.6410831212997437, 0.6596777439117432, 0.6782723069190979, 0.6968669295310974]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 20.0, 27.0, 54.0, 66.0, 124.0, 219.0, 470.0, 1084.0, 3153.0, 15151.0, 150078.0, 780443.0, 83253.0, 10291.0, 2371.0, 873.0, 364.0, 213.0, 102.0, 70.0, 36.0, 22.0, 14.0, 13.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4668159484863281, -0.45145416259765625, -0.4360923767089844, -0.4207305908203125, -0.4053688049316406, -0.39000701904296875, -0.3746452331542969, -0.359283447265625, -0.3439216613769531, -0.32855987548828125, -0.3131980895996094, -0.2978363037109375, -0.2824745178222656, -0.26711273193359375, -0.2517509460449219, -0.23638916015625, -0.22102737426757812, -0.20566558837890625, -0.19030380249023438, -0.1749420166015625, -0.15958023071289062, -0.14421844482421875, -0.12885665893554688, -0.113494873046875, -0.09813308715820312, -0.08277130126953125, -0.06740951538085938, -0.0520477294921875, -0.036685943603515625, -0.02132415771484375, -0.005962371826171875, 0.0093994140625, 0.024761199951171875, 0.04012298583984375, 0.055484771728515625, 0.0708465576171875, 0.08620834350585938, 0.10157012939453125, 0.11693191528320312, 0.132293701171875, 0.14765548706054688, 0.16301727294921875, 0.17837905883789062, 0.1937408447265625, 0.20910263061523438, 0.22446441650390625, 0.23982620239257812, 0.25518798828125, 0.2705497741699219, 0.28591156005859375, 0.3012733459472656, 0.3166351318359375, 0.3319969177246094, 0.34735870361328125, 0.3627204895019531, 0.378082275390625, 0.3934440612792969, 0.40880584716796875, 0.4241676330566406, 0.4395294189453125, 0.4548912048339844, 0.47025299072265625, 0.4856147766113281, 0.5009765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 13.0, 16.0, 21.0, 41.0, 58.0, 73.0, 108.0, 99.0, 112.0, 97.0, 80.0, 68.0, 56.0, 45.0, 36.0, 30.0, 17.0, 11.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1090087890625, -0.10567378997802734, -0.10233879089355469, -0.09900379180908203, -0.09566879272460938, -0.09233379364013672, -0.08899879455566406, -0.0856637954711914, -0.08232879638671875, -0.0789937973022461, -0.07565879821777344, -0.07232379913330078, -0.06898880004882812, -0.06565380096435547, -0.06231880187988281, -0.058983802795410156, -0.0556488037109375, -0.052313804626464844, -0.04897880554199219, -0.04564380645751953, -0.042308807373046875, -0.03897380828857422, -0.03563880920410156, -0.032303810119628906, -0.02896881103515625, -0.025633811950683594, -0.022298812866210938, -0.01896381378173828, -0.015628814697265625, -0.012293815612792969, -0.008958816528320312, -0.005623817443847656, -0.002288818359375, 0.0010461807250976562, 0.0043811798095703125, 0.007716178894042969, 0.011051177978515625, 0.014386177062988281, 0.017721176147460938, 0.021056175231933594, 0.02439117431640625, 0.027726173400878906, 0.031061172485351562, 0.03439617156982422, 0.037731170654296875, 0.04106616973876953, 0.04440116882324219, 0.047736167907714844, 0.0510711669921875, 0.054406166076660156, 0.05774116516113281, 0.06107616424560547, 0.06441116333007812, 0.06774616241455078, 0.07108116149902344, 0.0744161605834961, 0.07775115966796875, 0.0810861587524414, 0.08442115783691406, 0.08775615692138672, 0.09109115600585938, 0.09442615509033203, 0.09776115417480469, 0.10109615325927734, 0.10443115234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 5.0, 13.0, 21.0, 17.0, 25.0, 40.0, 48.0, 97.0, 146.0, 199.0, 373.0, 705.0, 1532.0, 3224.0, 9062.0, 39620.0, 451851.0, 484211.0, 41631.0, 9288.0, 3253.0, 1441.0, 717.0, 367.0, 220.0, 132.0, 100.0, 49.0, 40.0, 32.0, 22.0, 13.0, 8.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.423095703125, -0.4110107421875, -0.39892578125, -0.3868408203125, -0.374755859375, -0.3626708984375, -0.3505859375, -0.3385009765625, -0.326416015625, -0.3143310546875, -0.30224609375, -0.2901611328125, -0.278076171875, -0.2659912109375, -0.25390625, -0.2418212890625, -0.229736328125, -0.2176513671875, -0.20556640625, -0.1934814453125, -0.181396484375, -0.1693115234375, -0.1572265625, -0.1451416015625, -0.133056640625, -0.1209716796875, -0.10888671875, -0.0968017578125, -0.084716796875, -0.0726318359375, -0.060546875, -0.0484619140625, -0.036376953125, -0.0242919921875, -0.01220703125, -0.0001220703125, 0.011962890625, 0.0240478515625, 0.0361328125, 0.0482177734375, 0.060302734375, 0.0723876953125, 0.08447265625, 0.0965576171875, 0.108642578125, 0.1207275390625, 0.1328125, 0.1448974609375, 0.156982421875, 0.1690673828125, 0.18115234375, 0.1932373046875, 0.205322265625, 0.2174072265625, 0.2294921875, 0.2415771484375, 0.253662109375, 0.2657470703125, 0.27783203125, 0.2899169921875, 0.302001953125, 0.3140869140625, 0.326171875, 0.3382568359375, 0.350341796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 1.0, 9.0, 15.0, 6.0, 17.0, 16.0, 24.0, 22.0, 41.0, 36.0, 44.0, 80.0, 55.0, 56.0, 61.0, 67.0, 63.0, 65.0, 54.0, 46.0, 40.0, 35.0, 32.0, 26.0, 14.0, 18.0, 12.0, 7.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.384521484375, -0.372802734375, -0.361083984375, -0.349365234375, -0.337646484375, -0.325927734375, -0.314208984375, -0.302490234375, -0.290771484375, -0.279052734375, -0.267333984375, -0.255615234375, -0.243896484375, -0.232177734375, -0.220458984375, -0.208740234375, -0.197021484375, -0.185302734375, -0.173583984375, -0.161865234375, -0.150146484375, -0.138427734375, -0.126708984375, -0.114990234375, -0.103271484375, -0.091552734375, -0.079833984375, -0.068115234375, -0.056396484375, -0.044677734375, -0.032958984375, -0.021240234375, -0.009521484375, 0.002197265625, 0.013916015625, 0.025634765625, 0.037353515625, 0.049072265625, 0.060791015625, 0.072509765625, 0.084228515625, 0.095947265625, 0.107666015625, 0.119384765625, 0.131103515625, 0.142822265625, 0.154541015625, 0.166259765625, 0.177978515625, 0.189697265625, 0.201416015625, 0.213134765625, 0.224853515625, 0.236572265625, 0.248291015625, 0.260009765625, 0.271728515625, 0.283447265625, 0.295166015625, 0.306884765625, 0.318603515625, 0.330322265625, 0.342041015625, 0.353759765625, 0.365478515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 3.0, 10.0, 11.0, 13.0, 22.0, 29.0, 52.0, 53.0, 84.0, 135.0, 211.0, 337.0, 673.0, 1321.0, 3301.0, 13476.0, 752050.0, 261560.0, 9687.0, 2841.0, 1217.0, 585.0, 306.0, 178.0, 129.0, 78.0, 44.0, 49.0, 38.0, 21.0, 15.0, 15.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.42862701416015625, -0.4156036376953125, -0.40258026123046875, -0.389556884765625, -0.37653350830078125, -0.3635101318359375, -0.35048675537109375, -0.33746337890625, -0.32444000244140625, -0.3114166259765625, -0.29839324951171875, -0.285369873046875, -0.27234649658203125, -0.2593231201171875, -0.24629974365234375, -0.2332763671875, -0.22025299072265625, -0.2072296142578125, -0.19420623779296875, -0.181182861328125, -0.16815948486328125, -0.1551361083984375, -0.14211273193359375, -0.12908935546875, -0.11606597900390625, -0.1030426025390625, -0.09001922607421875, -0.076995849609375, -0.06397247314453125, -0.0509490966796875, -0.03792572021484375, -0.02490234375, -0.01187896728515625, 0.0011444091796875, 0.01416778564453125, 0.027191162109375, 0.04021453857421875, 0.0532379150390625, 0.06626129150390625, 0.07928466796875, 0.09230804443359375, 0.1053314208984375, 0.11835479736328125, 0.131378173828125, 0.14440155029296875, 0.1574249267578125, 0.17044830322265625, 0.1834716796875, 0.19649505615234375, 0.2095184326171875, 0.22254180908203125, 0.235565185546875, 0.24858856201171875, 0.2616119384765625, 0.27463531494140625, 0.28765869140625, 0.30068206787109375, 0.3137054443359375, 0.32672882080078125, 0.339752197265625, 0.35277557373046875, 0.3657989501953125, 0.37882232666015625, 0.391845703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 5.0, 10.0, 16.0, 17.0, 36.0, 48.0, 55.0, 70.0, 131.0, 137.0, 125.0, 101.0, 64.0, 42.0, 39.0, 30.0, 19.0, 18.0, 6.0, 5.0, 6.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015151500701904297, -0.00014660321176052094, -0.0001416914165019989, -0.00013677962124347687, -0.00013186782598495483, -0.0001269560307264328, -0.00012204423546791077, -0.00011713244020938873, -0.0001122206449508667, -0.00010730884969234467, -0.00010239705443382263, -9.74852591753006e-05, -9.257346391677856e-05, -8.766166865825653e-05, -8.27498733997345e-05, -7.783807814121246e-05, -7.292628288269043e-05, -6.80144876241684e-05, -6.310269236564636e-05, -5.819089710712433e-05, -5.3279101848602295e-05, -4.836730659008026e-05, -4.345551133155823e-05, -3.8543716073036194e-05, -3.363192081451416e-05, -2.8720125555992126e-05, -2.3808330297470093e-05, -1.889653503894806e-05, -1.3984739780426025e-05, -9.072944521903992e-06, -4.161149263381958e-06, 7.506459951400757e-07, 5.662441253662109e-06, 1.0574236512184143e-05, 1.5486031770706177e-05, 2.039782702922821e-05, 2.5309622287750244e-05, 3.0221417546272278e-05, 3.513321280479431e-05, 4.0045008063316345e-05, 4.495680332183838e-05, 4.986859858036041e-05, 5.4780393838882446e-05, 5.969218909740448e-05, 6.460398435592651e-05, 6.951577961444855e-05, 7.442757487297058e-05, 7.933937013149261e-05, 8.425116539001465e-05, 8.916296064853668e-05, 9.407475590705872e-05, 9.898655116558075e-05, 0.00010389834642410278, 0.00010881014168262482, 0.00011372193694114685, 0.00011863373219966888, 0.00012354552745819092, 0.00012845732271671295, 0.00013336911797523499, 0.00013828091323375702, 0.00014319270849227905, 0.00014810450375080109, 0.00015301629900932312, 0.00015792809426784515, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 11.0, 22.0, 23.0, 73.0, 154.0, 411.0, 1543.0, 22925.0, 1011717.0, 9942.0, 1105.0, 352.0, 137.0, 64.0, 25.0, 11.0, 6.0, 4.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7578125, -0.7344207763671875, -0.711029052734375, -0.6876373291015625, -0.66424560546875, -0.6408538818359375, -0.617462158203125, -0.5940704345703125, -0.5706787109375, -0.5472869873046875, -0.523895263671875, -0.5005035400390625, -0.47711181640625, -0.4537200927734375, -0.430328369140625, -0.4069366455078125, -0.383544921875, -0.3601531982421875, -0.336761474609375, -0.3133697509765625, -0.28997802734375, -0.2665863037109375, -0.243194580078125, -0.2198028564453125, -0.1964111328125, -0.1730194091796875, -0.149627685546875, -0.1262359619140625, -0.10284423828125, -0.0794525146484375, -0.056060791015625, -0.0326690673828125, -0.00927734375, 0.0141143798828125, 0.037506103515625, 0.0608978271484375, 0.08428955078125, 0.1076812744140625, 0.131072998046875, 0.1544647216796875, 0.1778564453125, 0.2012481689453125, 0.224639892578125, 0.2480316162109375, 0.27142333984375, 0.2948150634765625, 0.318206787109375, 0.3415985107421875, 0.364990234375, 0.3883819580078125, 0.411773681640625, 0.4351654052734375, 0.45855712890625, 0.4819488525390625, 0.505340576171875, 0.5287322998046875, 0.5521240234375, 0.5755157470703125, 0.598907470703125, 0.6222991943359375, 0.64569091796875, 0.6690826416015625, 0.692474365234375, 0.7158660888671875, 0.7392578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 10.0, 15.0, 46.0, 141.0, 512.0, 169.0, 45.0, 23.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5220947265625, -0.495361328125, -0.4686279296875, -0.44189453125, -0.4151611328125, -0.388427734375, -0.3616943359375, -0.3349609375, -0.3082275390625, -0.281494140625, -0.2547607421875, -0.22802734375, -0.2012939453125, -0.174560546875, -0.1478271484375, -0.12109375, -0.0943603515625, -0.067626953125, -0.0408935546875, -0.01416015625, 0.0125732421875, 0.039306640625, 0.0660400390625, 0.0927734375, 0.1195068359375, 0.146240234375, 0.1729736328125, 0.19970703125, 0.2264404296875, 0.253173828125, 0.2799072265625, 0.306640625, 0.3333740234375, 0.360107421875, 0.3868408203125, 0.41357421875, 0.4403076171875, 0.467041015625, 0.4937744140625, 0.5205078125, 0.5472412109375, 0.573974609375, 0.6007080078125, 0.62744140625, 0.6541748046875, 0.680908203125, 0.7076416015625, 0.734375, 0.7611083984375, 0.787841796875, 0.8145751953125, 0.84130859375, 0.8680419921875, 0.894775390625, 0.9215087890625, 0.9482421875, 0.9749755859375, 1.001708984375, 1.0284423828125, 1.05517578125, 1.0819091796875, 1.108642578125, 1.1353759765625, 1.162109375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 9.0, 17.0, 29.0, 59.0, 118.0, 194.0, 235.0, 176.0, 83.0, 36.0, 15.0, 8.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.157985687255859, -4.037571430206299, -3.917156934738159, -3.7967426776885986, -3.676328182220459, -3.5559139251708984, -3.435499429702759, -3.3150851726531982, -3.1946706771850586, -3.074256420135498, -2.9538419246673584, -2.833427667617798, -2.713013172149658, -2.5925989151000977, -2.472184419631958, -2.3517701625823975, -2.231355667114258, -2.1109414100646973, -1.9905269145965576, -1.8701125383377075, -1.7496981620788574, -1.6292839050292969, -1.5088694095611572, -1.3884551525115967, -1.2680408954620361, -1.147626519203186, -1.027212142944336, -0.9067977666854858, -0.7863833904266357, -0.6659690737724304, -0.5455546975135803, -0.4251403212547302, -0.30472588539123535, -0.18431150913238525, -0.06389714777469635, 0.056517213582992554, 0.17693158984184265, 0.29734593629837036, 0.41776031255722046, 0.5381746888160706, 0.6585890650749207, 0.7790034413337708, 0.8994178175926208, 1.0198321342468262, 1.1402465105056763, 1.2606608867645264, 1.3810752630233765, 1.5014896392822266, 1.6219040155410767, 1.7423183917999268, 1.8627327680587769, 1.983147144317627, 2.1035614013671875, 2.223975896835327, 2.3443901538848877, 2.4648046493530273, 2.585218906402588, 2.7056331634521484, 2.826047658920288, 2.9464619159698486, 3.0668764114379883, 3.187290668487549, 3.3077051639556885, 3.428119421005249, 3.5485339164733887]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 6.0, 9.0, 6.0, 4.0, 8.0, 13.0, 17.0, 20.0, 18.0, 28.0, 34.0, 45.0, 45.0, 41.0, 59.0, 45.0, 53.0, 53.0, 53.0, 44.0, 48.0, 41.0, 54.0, 43.0, 32.0, 27.0, 34.0, 24.0, 23.0, 20.0, 18.0, 13.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.561328887939453, -2.4870734214782715, -2.41281795501709, -2.338562488555908, -2.2643070220947266, -2.190051555633545, -2.1157960891723633, -2.0415403842926025, -1.967284917831421, -1.8930294513702393, -1.8187739849090576, -1.744518518447876, -1.6702629327774048, -1.5960074663162231, -1.5217519998550415, -1.4474964141845703, -1.3732410669326782, -1.2989856004714966, -1.224730134010315, -1.1504745483398438, -1.076219081878662, -1.0019636154174805, -0.9277081489562988, -0.8534526228904724, -0.7791971564292908, -0.7049416899681091, -0.6306861639022827, -0.5564306974411011, -0.48217520117759705, -0.407919704914093, -0.3336642384529114, -0.25940871238708496, -0.18515324592590332, -0.11089775711297989, -0.03664226830005646, 0.03761321306228638, 0.1118687093257904, 0.18612420558929443, 0.2603796720504761, 0.3346351981163025, 0.40889066457748413, 0.48314616084098816, 0.5574016571044922, 0.6316571235656738, 0.7059125900268555, 0.7801681160926819, 0.8544235825538635, 0.9286791086196899, 1.0029345750808716, 1.0771900415420532, 1.1514455080032349, 1.225701093673706, 1.2999565601348877, 1.3742120265960693, 1.448467493057251, 1.5227229595184326, 1.5969784259796143, 1.671233892440796, 1.7454893589019775, 1.8197448253631592, 1.8940004110336304, 1.968255877494812, 2.042511463165283, 2.116766929626465, 2.1910223960876465]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 13.0, 11.0, 22.0, 17.0, 38.0, 58.0, 104.0, 185.0, 234.0, 486.0, 909.0, 1835.0, 4201.0, 11720.0, 50951.0, 2982629.0, 1078251.0, 43814.0, 10908.0, 4004.0, 1767.0, 919.0, 490.0, 280.0, 170.0, 85.0, 53.0, 37.0, 24.0, 19.0, 8.0, 7.0, 11.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.2596549987792969, -0.25002288818359375, -0.24039077758789062, -0.2307586669921875, -0.22112655639648438, -0.21149444580078125, -0.20186233520507812, -0.192230224609375, -0.18259811401367188, -0.17296600341796875, -0.16333389282226562, -0.1537017822265625, -0.14406967163085938, -0.13443756103515625, -0.12480545043945312, -0.11517333984375, -0.10554122924804688, -0.09590911865234375, -0.08627700805664062, -0.0766448974609375, -0.06701278686523438, -0.05738067626953125, -0.047748565673828125, -0.038116455078125, -0.028484344482421875, -0.01885223388671875, -0.009220123291015625, 0.0004119873046875, 0.010044097900390625, 0.01967620849609375, 0.029308319091796875, 0.0389404296875, 0.048572540283203125, 0.05820465087890625, 0.06783676147460938, 0.0774688720703125, 0.08710098266601562, 0.09673309326171875, 0.10636520385742188, 0.115997314453125, 0.12562942504882812, 0.13526153564453125, 0.14489364624023438, 0.1545257568359375, 0.16415786743164062, 0.17378997802734375, 0.18342208862304688, 0.19305419921875, 0.20268630981445312, 0.21231842041015625, 0.22195053100585938, 0.2315826416015625, 0.24121475219726562, 0.25084686279296875, 0.2604789733886719, 0.270111083984375, 0.2797431945800781, 0.28937530517578125, 0.2990074157714844, 0.3086395263671875, 0.3182716369628906, 0.32790374755859375, 0.3375358581542969, 0.34716796875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 15.0, 7.0, 11.0, 16.0, 20.0, 30.0, 42.0, 50.0, 67.0, 72.0, 72.0, 79.0, 84.0, 74.0, 87.0, 53.0, 49.0, 40.0, 30.0, 26.0, 27.0, 18.0, 13.0, 10.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10955810546875, -0.10634708404541016, -0.10313606262207031, -0.09992504119873047, -0.09671401977539062, -0.09350299835205078, -0.09029197692871094, -0.0870809555053711, -0.08386993408203125, -0.0806589126586914, -0.07744789123535156, -0.07423686981201172, -0.07102584838867188, -0.06781482696533203, -0.06460380554199219, -0.061392784118652344, -0.0581817626953125, -0.054970741271972656, -0.05175971984863281, -0.04854869842529297, -0.045337677001953125, -0.04212665557861328, -0.03891563415527344, -0.035704612731933594, -0.03249359130859375, -0.029282569885253906, -0.026071548461914062, -0.02286052703857422, -0.019649505615234375, -0.01643848419189453, -0.013227462768554688, -0.010016441345214844, -0.006805419921875, -0.0035943984985351562, -0.0003833770751953125, 0.0028276443481445312, 0.006038665771484375, 0.009249687194824219, 0.012460708618164062, 0.015671730041503906, 0.01888275146484375, 0.022093772888183594, 0.025304794311523438, 0.02851581573486328, 0.031726837158203125, 0.03493785858154297, 0.03814888000488281, 0.041359901428222656, 0.0445709228515625, 0.047781944274902344, 0.05099296569824219, 0.05420398712158203, 0.057415008544921875, 0.06062602996826172, 0.06383705139160156, 0.0670480728149414, 0.07025909423828125, 0.0734701156616211, 0.07668113708496094, 0.07989215850830078, 0.08310317993164062, 0.08631420135498047, 0.08952522277832031, 0.09273624420166016, 0.095947265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 10.0, 7.0, 22.0, 25.0, 27.0, 68.0, 107.0, 172.0, 297.0, 460.0, 884.0, 1654.0, 3581.0, 11512.0, 94162.0, 3877589.0, 179242.0, 15842.0, 4316.0, 1891.0, 1049.0, 549.0, 319.0, 165.0, 101.0, 73.0, 33.0, 47.0, 18.0, 10.0, 15.0, 9.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.476318359375, -0.4625511169433594, -0.44878387451171875, -0.4350166320800781, -0.4212493896484375, -0.4074821472167969, -0.39371490478515625, -0.3799476623535156, -0.366180419921875, -0.3524131774902344, -0.33864593505859375, -0.3248786926269531, -0.3111114501953125, -0.2973442077636719, -0.28357696533203125, -0.2698097229003906, -0.25604248046875, -0.24227523803710938, -0.22850799560546875, -0.21474075317382812, -0.2009735107421875, -0.18720626831054688, -0.17343902587890625, -0.15967178344726562, -0.145904541015625, -0.13213729858398438, -0.11837005615234375, -0.10460281372070312, -0.0908355712890625, -0.07706832885742188, -0.06330108642578125, -0.049533843994140625, -0.0357666015625, -0.021999359130859375, -0.00823211669921875, 0.005535125732421875, 0.0193023681640625, 0.033069610595703125, 0.04683685302734375, 0.060604095458984375, 0.074371337890625, 0.08813858032226562, 0.10190582275390625, 0.11567306518554688, 0.1294403076171875, 0.14320755004882812, 0.15697479248046875, 0.17074203491210938, 0.18450927734375, 0.19827651977539062, 0.21204376220703125, 0.22581100463867188, 0.2395782470703125, 0.2533454895019531, 0.26711273193359375, 0.2808799743652344, 0.294647216796875, 0.3084144592285156, 0.32218170166015625, 0.3359489440917969, 0.3497161865234375, 0.3634834289550781, 0.37725067138671875, 0.3910179138183594, 0.40478515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 15.0, 14.0, 42.0, 130.0, 510.0, 2775.0, 397.0, 108.0, 24.0, 18.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.431640625, -0.42170143127441406, -0.4117622375488281, -0.4018230438232422, -0.39188385009765625, -0.3819446563720703, -0.3720054626464844, -0.36206626892089844, -0.3521270751953125, -0.34218788146972656, -0.3322486877441406, -0.3223094940185547, -0.31237030029296875, -0.3024311065673828, -0.2924919128417969, -0.28255271911621094, -0.272613525390625, -0.26267433166503906, -0.2527351379394531, -0.2427959442138672, -0.23285675048828125, -0.2229175567626953, -0.21297836303710938, -0.20303916931152344, -0.1930999755859375, -0.18316078186035156, -0.17322158813476562, -0.1632823944091797, -0.15334320068359375, -0.1434040069580078, -0.13346481323242188, -0.12352561950683594, -0.11358642578125, -0.10364723205566406, -0.09370803833007812, -0.08376884460449219, -0.07382965087890625, -0.06389045715332031, -0.053951263427734375, -0.04401206970214844, -0.0340728759765625, -0.024133682250976562, -0.014194488525390625, -0.0042552947998046875, 0.00568389892578125, 0.015623092651367188, 0.025562286376953125, 0.03550148010253906, 0.045440673828125, 0.05537986755371094, 0.06531906127929688, 0.07525825500488281, 0.08519744873046875, 0.09513664245605469, 0.10507583618164062, 0.11501502990722656, 0.1249542236328125, 0.13489341735839844, 0.14483261108398438, 0.1547718048095703, 0.16471099853515625, 0.1746501922607422, 0.18458938598632812, 0.19452857971191406, 0.2044677734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 16.0, 100.0, 348.0, 442.0, 79.0, 14.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.101809024810791, -4.994061470031738, -4.8863139152526855, -4.778566360473633, -4.670818328857422, -4.563070774078369, -4.455323219299316, -4.347575664520264, -4.239828109741211, -4.132080554962158, -4.0243330001831055, -3.9165852069854736, -3.808837652206421, -3.701089859008789, -3.5933423042297363, -3.4855947494506836, -3.3778469562530518, -3.270099401473999, -3.162351608276367, -3.0546040534973145, -2.9468564987182617, -2.839108943939209, -2.731361150741577, -2.6236135959625244, -2.5158658027648926, -2.40811824798584, -2.300370454788208, -2.1926229000091553, -2.0848753452301025, -1.9771276712417603, -1.869379997253418, -1.7616324424743652, -1.6538846492767334, -1.5461369752883911, -1.4383894205093384, -1.330641746520996, -1.2228941917419434, -1.115146517753601, -1.0073988437652588, -0.8996512293815613, -0.7919036149978638, -0.6841560006141663, -0.5764083862304688, -0.46866071224212646, -0.36091309785842896, -0.25316548347473145, -0.14541780948638916, -0.03767019510269165, 0.07007741928100586, 0.17782504856586456, 0.28557267785072327, 0.39332032203674316, 0.5010679364204407, 0.6088155508041382, 0.7165632247924805, 0.824310839176178, 0.9320584535598755, 1.0398061275482178, 1.1475536823272705, 1.2553013563156128, 1.363049030303955, 1.4707965850830078, 1.57854425907135, 1.6862919330596924, 1.7940394878387451]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 10.0, 7.0, 11.0, 11.0, 13.0, 13.0, 18.0, 21.0, 18.0, 20.0, 28.0, 32.0, 44.0, 49.0, 45.0, 50.0, 43.0, 39.0, 46.0, 41.0, 46.0, 51.0, 43.0, 35.0, 27.0, 34.0, 31.0, 29.0, 23.0, 26.0, 13.0, 24.0, 12.0, 11.0, 5.0, 7.0, 8.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0], "bins": [-0.8993347883224487, -0.8758382797241211, -0.8523417711257935, -0.8288452625274658, -0.8053486943244934, -0.7818521857261658, -0.7583556771278381, -0.7348591685295105, -0.7113626003265381, -0.6878660917282104, -0.6643695831298828, -0.6408730745315552, -0.6173765063285828, -0.5938799977302551, -0.5703834891319275, -0.5468869805335999, -0.5233904719352722, -0.4998939633369446, -0.47639742493629456, -0.4529009163379669, -0.4294043779373169, -0.40590786933898926, -0.3824113607406616, -0.358914852142334, -0.33541831374168396, -0.3119218051433563, -0.2884252667427063, -0.26492875814437866, -0.24143223464488983, -0.217935711145401, -0.19443920254707336, -0.17094267904758453, -0.14744609594345093, -0.1239495724439621, -0.10045305639505386, -0.07695654034614563, -0.0534600168466568, -0.02996349334716797, -0.006466984748840332, 0.0170295387506485, 0.04052606225013733, 0.06402258574962616, 0.0875191017985344, 0.11101561784744263, 0.13451214134693146, 0.1580086648464203, 0.18150517344474792, 0.20500169694423676, 0.22849822044372559, 0.2519947290420532, 0.27549126744270325, 0.2989877760410309, 0.3224843144416809, 0.34598082304000854, 0.3694773316383362, 0.3929738402366638, 0.41647037863731384, 0.4399668872356415, 0.4634634256362915, 0.48695993423461914, 0.5104564428329468, 0.5339529514312744, 0.557449460029602, 0.5809460282325745, 0.6044425368309021]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 12.0, 19.0, 36.0, 43.0, 90.0, 137.0, 247.0, 442.0, 954.0, 2180.0, 6229.0, 23835.0, 146770.0, 653325.0, 175509.0, 27232.0, 6954.0, 2392.0, 1017.0, 494.0, 266.0, 145.0, 74.0, 48.0, 27.0, 20.0, 12.0, 9.0, 10.0, 7.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.365631103515625, -0.35235595703125, -0.339080810546875, -0.3258056640625, -0.312530517578125, -0.29925537109375, -0.285980224609375, -0.272705078125, -0.259429931640625, -0.24615478515625, -0.232879638671875, -0.2196044921875, -0.206329345703125, -0.19305419921875, -0.179779052734375, -0.16650390625, -0.153228759765625, -0.13995361328125, -0.126678466796875, -0.1134033203125, -0.100128173828125, -0.08685302734375, -0.073577880859375, -0.060302734375, -0.047027587890625, -0.03375244140625, -0.020477294921875, -0.0072021484375, 0.006072998046875, 0.01934814453125, 0.032623291015625, 0.0458984375, 0.059173583984375, 0.07244873046875, 0.085723876953125, 0.0989990234375, 0.112274169921875, 0.12554931640625, 0.138824462890625, 0.152099609375, 0.165374755859375, 0.17864990234375, 0.191925048828125, 0.2052001953125, 0.218475341796875, 0.23175048828125, 0.245025634765625, 0.25830078125, 0.271575927734375, 0.28485107421875, 0.298126220703125, 0.3114013671875, 0.324676513671875, 0.33795166015625, 0.351226806640625, 0.364501953125, 0.377777099609375, 0.39105224609375, 0.404327392578125, 0.4176025390625, 0.430877685546875, 0.44415283203125, 0.457427978515625, 0.470703125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 7.0, 8.0, 10.0, 13.0, 11.0, 20.0, 32.0, 34.0, 40.0, 51.0, 47.0, 69.0, 78.0, 56.0, 77.0, 69.0, 59.0, 54.0, 53.0, 46.0, 43.0, 24.0, 25.0, 16.0, 21.0, 10.0, 8.0, 13.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10854911804199219, -0.10528182983398438, -0.10201454162597656, -0.09874725341796875, -0.09547996520996094, -0.09221267700195312, -0.08894538879394531, -0.0856781005859375, -0.08241081237792969, -0.07914352416992188, -0.07587623596191406, -0.07260894775390625, -0.06934165954589844, -0.06607437133789062, -0.06280708312988281, -0.059539794921875, -0.05627250671386719, -0.053005218505859375, -0.04973793029785156, -0.04647064208984375, -0.04320335388183594, -0.039936065673828125, -0.03666877746582031, -0.0334014892578125, -0.030134201049804688, -0.026866912841796875, -0.023599624633789062, -0.02033233642578125, -0.017065048217773438, -0.013797760009765625, -0.010530471801757812, -0.00726318359375, -0.0039958953857421875, -0.000728607177734375, 0.0025386810302734375, 0.00580596923828125, 0.009073257446289062, 0.012340545654296875, 0.015607833862304688, 0.0188751220703125, 0.022142410278320312, 0.025409698486328125, 0.028676986694335938, 0.03194427490234375, 0.03521156311035156, 0.038478851318359375, 0.04174613952636719, 0.045013427734375, 0.04828071594238281, 0.051548004150390625, 0.05481529235839844, 0.05808258056640625, 0.06134986877441406, 0.06461715698242188, 0.06788444519042969, 0.0711517333984375, 0.07441902160644531, 0.07768630981445312, 0.08095359802246094, 0.08422088623046875, 0.08748817443847656, 0.09075546264648438, 0.09402275085449219, 0.0972900390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 7.0, 6.0, 7.0, 12.0, 15.0, 22.0, 47.0, 70.0, 87.0, 159.0, 247.0, 421.0, 787.0, 1874.0, 4854.0, 17872.0, 117831.0, 752276.0, 124993.0, 18097.0, 4956.0, 1930.0, 883.0, 435.0, 233.0, 133.0, 82.0, 58.0, 44.0, 37.0, 21.0, 17.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0], "bins": [-0.66552734375, -0.6477851867675781, -0.6300430297851562, -0.6123008728027344, -0.5945587158203125, -0.5768165588378906, -0.5590744018554688, -0.5413322448730469, -0.523590087890625, -0.5058479309082031, -0.48810577392578125, -0.4703636169433594, -0.4526214599609375, -0.4348793029785156, -0.41713714599609375, -0.3993949890136719, -0.38165283203125, -0.3639106750488281, -0.34616851806640625, -0.3284263610839844, -0.3106842041015625, -0.2929420471191406, -0.27519989013671875, -0.2574577331542969, -0.239715576171875, -0.22197341918945312, -0.20423126220703125, -0.18648910522460938, -0.1687469482421875, -0.15100479125976562, -0.13326263427734375, -0.11552047729492188, -0.0977783203125, -0.08003616333007812, -0.06229400634765625, -0.044551849365234375, -0.0268096923828125, -0.009067535400390625, 0.00867462158203125, 0.026416778564453125, 0.044158935546875, 0.061901092529296875, 0.07964324951171875, 0.09738540649414062, 0.1151275634765625, 0.13286972045898438, 0.15061187744140625, 0.16835403442382812, 0.18609619140625, 0.20383834838867188, 0.22158050537109375, 0.23932266235351562, 0.2570648193359375, 0.2748069763183594, 0.29254913330078125, 0.3102912902832031, 0.328033447265625, 0.3457756042480469, 0.36351776123046875, 0.3812599182128906, 0.3990020751953125, 0.4167442321777344, 0.43448638916015625, 0.4522285461425781, 0.469970703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 10.0, 13.0, 16.0, 18.0, 29.0, 32.0, 44.0, 53.0, 47.0, 41.0, 53.0, 63.0, 55.0, 72.0, 46.0, 41.0, 56.0, 60.0, 43.0, 33.0, 36.0, 29.0, 26.0, 11.0, 7.0, 7.0, 7.0, 10.0, 10.0, 8.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6171875, -0.5978469848632812, -0.5785064697265625, -0.5591659545898438, -0.539825439453125, -0.5204849243164062, -0.5011444091796875, -0.48180389404296875, -0.46246337890625, -0.44312286376953125, -0.4237823486328125, -0.40444183349609375, -0.385101318359375, -0.36576080322265625, -0.3464202880859375, -0.32707977294921875, -0.3077392578125, -0.28839874267578125, -0.2690582275390625, -0.24971771240234375, -0.230377197265625, -0.21103668212890625, -0.1916961669921875, -0.17235565185546875, -0.15301513671875, -0.13367462158203125, -0.1143341064453125, -0.09499359130859375, -0.075653076171875, -0.05631256103515625, -0.0369720458984375, -0.01763153076171875, 0.001708984375, 0.02104949951171875, 0.0403900146484375, 0.05973052978515625, 0.079071044921875, 0.09841156005859375, 0.1177520751953125, 0.13709259033203125, 0.15643310546875, 0.17577362060546875, 0.1951141357421875, 0.21445465087890625, 0.233795166015625, 0.25313568115234375, 0.2724761962890625, 0.29181671142578125, 0.3111572265625, 0.33049774169921875, 0.3498382568359375, 0.36917877197265625, 0.388519287109375, 0.40785980224609375, 0.4272003173828125, 0.44654083251953125, 0.46588134765625, 0.48522186279296875, 0.5045623779296875, 0.5239028930664062, 0.543243408203125, 0.5625839233398438, 0.5819244384765625, 0.6012649536132812, 0.62060546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 13.0, 13.0, 26.0, 33.0, 58.0, 117.0, 150.0, 313.0, 667.0, 1720.0, 6164.0, 49868.0, 813363.0, 159395.0, 12210.0, 2583.0, 888.0, 441.0, 205.0, 121.0, 65.0, 36.0, 48.0, 11.0, 13.0, 9.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.384765625, -0.37334442138671875, -0.3619232177734375, -0.35050201416015625, -0.339080810546875, -0.32765960693359375, -0.3162384033203125, -0.30481719970703125, -0.29339599609375, -0.28197479248046875, -0.2705535888671875, -0.25913238525390625, -0.247711181640625, -0.23628997802734375, -0.2248687744140625, -0.21344757080078125, -0.2020263671875, -0.19060516357421875, -0.1791839599609375, -0.16776275634765625, -0.156341552734375, -0.14492034912109375, -0.1334991455078125, -0.12207794189453125, -0.11065673828125, -0.09923553466796875, -0.0878143310546875, -0.07639312744140625, -0.064971923828125, -0.05355072021484375, -0.0421295166015625, -0.03070831298828125, -0.019287109375, -0.00786590576171875, 0.0035552978515625, 0.01497650146484375, 0.026397705078125, 0.03781890869140625, 0.0492401123046875, 0.06066131591796875, 0.07208251953125, 0.08350372314453125, 0.0949249267578125, 0.10634613037109375, 0.117767333984375, 0.12918853759765625, 0.1406097412109375, 0.15203094482421875, 0.1634521484375, 0.17487335205078125, 0.1862945556640625, 0.19771575927734375, 0.209136962890625, 0.22055816650390625, 0.2319793701171875, 0.24340057373046875, 0.25482177734375, 0.26624298095703125, 0.2776641845703125, 0.28908538818359375, 0.300506591796875, 0.31192779541015625, 0.3233489990234375, 0.33477020263671875, 0.34619140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 12.0, 19.0, 28.0, 24.0, 45.0, 59.0, 72.0, 87.0, 115.0, 92.0, 88.0, 88.0, 59.0, 56.0, 33.0, 28.0, 20.0, 15.0, 13.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.952617645263672e-05, -8.549727499485016e-05, -8.14683735370636e-05, -7.743947207927704e-05, -7.341057062149048e-05, -6.938166916370392e-05, -6.535276770591736e-05, -6.13238662481308e-05, -5.729496479034424e-05, -5.326606333255768e-05, -4.923716187477112e-05, -4.520826041698456e-05, -4.1179358959198e-05, -3.715045750141144e-05, -3.312155604362488e-05, -2.9092654585838318e-05, -2.5063753128051758e-05, -2.1034851670265198e-05, -1.7005950212478638e-05, -1.2977048754692078e-05, -8.948147296905518e-06, -4.9192458391189575e-06, -8.903443813323975e-07, 3.1385570764541626e-06, 7.167458534240723e-06, 1.1196359992027283e-05, 1.5225261449813843e-05, 1.9254162907600403e-05, 2.3283064365386963e-05, 2.7311965823173523e-05, 3.134086728096008e-05, 3.536976873874664e-05, 3.93986701965332e-05, 4.342757165431976e-05, 4.745647311210632e-05, 5.148537456989288e-05, 5.551427602767944e-05, 5.9543177485466003e-05, 6.357207894325256e-05, 6.760098040103912e-05, 7.162988185882568e-05, 7.565878331661224e-05, 7.96876847743988e-05, 8.371658623218536e-05, 8.774548768997192e-05, 9.177438914775848e-05, 9.580329060554504e-05, 9.98321920633316e-05, 0.00010386109352111816, 0.00010788999497890472, 0.00011191889643669128, 0.00011594779789447784, 0.0001199766993522644, 0.00012400560081005096, 0.00012803450226783752, 0.00013206340372562408, 0.00013609230518341064, 0.0001401212066411972, 0.00014415010809898376, 0.00014817900955677032, 0.00015220791101455688, 0.00015623681247234344, 0.00016026571393013, 0.00016429461538791656, 0.00016832351684570312]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 9.0, 11.0, 15.0, 23.0, 46.0, 81.0, 143.0, 262.0, 415.0, 872.0, 2362.0, 10599.0, 100646.0, 821192.0, 97352.0, 10352.0, 2293.0, 860.0, 414.0, 218.0, 156.0, 89.0, 52.0, 33.0, 13.0, 13.0, 5.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31103515625, -0.3011589050292969, -0.29128265380859375, -0.2814064025878906, -0.2715301513671875, -0.2616539001464844, -0.25177764892578125, -0.24190139770507812, -0.232025146484375, -0.22214889526367188, -0.21227264404296875, -0.20239639282226562, -0.1925201416015625, -0.18264389038085938, -0.17276763916015625, -0.16289138793945312, -0.15301513671875, -0.14313888549804688, -0.13326263427734375, -0.12338638305664062, -0.1135101318359375, -0.10363388061523438, -0.09375762939453125, -0.08388137817382812, -0.074005126953125, -0.06412887573242188, -0.05425262451171875, -0.044376373291015625, -0.0345001220703125, -0.024623870849609375, -0.01474761962890625, -0.004871368408203125, 0.0050048828125, 0.014881134033203125, 0.02475738525390625, 0.034633636474609375, 0.0445098876953125, 0.054386138916015625, 0.06426239013671875, 0.07413864135742188, 0.084014892578125, 0.09389114379882812, 0.10376739501953125, 0.11364364624023438, 0.1235198974609375, 0.13339614868164062, 0.14327239990234375, 0.15314865112304688, 0.16302490234375, 0.17290115356445312, 0.18277740478515625, 0.19265365600585938, 0.2025299072265625, 0.21240615844726562, 0.22228240966796875, 0.23215866088867188, 0.242034912109375, 0.2519111633300781, 0.26178741455078125, 0.2716636657714844, 0.2815399169921875, 0.2914161682128906, 0.30129241943359375, 0.3111686706542969, 0.321044921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 6.0, 12.0, 22.0, 25.0, 34.0, 56.0, 87.0, 146.0, 206.0, 147.0, 88.0, 51.0, 45.0, 21.0, 14.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4208984375, -0.4070167541503906, -0.39313507080078125, -0.3792533874511719, -0.3653717041015625, -0.3514900207519531, -0.33760833740234375, -0.3237266540527344, -0.309844970703125, -0.2959632873535156, -0.28208160400390625, -0.2681999206542969, -0.2543182373046875, -0.24043655395507812, -0.22655487060546875, -0.21267318725585938, -0.19879150390625, -0.18490982055664062, -0.17102813720703125, -0.15714645385742188, -0.1432647705078125, -0.12938308715820312, -0.11550140380859375, -0.10161972045898438, -0.087738037109375, -0.07385635375976562, -0.05997467041015625, -0.046092987060546875, -0.0322113037109375, -0.018329620361328125, -0.00444793701171875, 0.009433746337890625, 0.0233154296875, 0.037197113037109375, 0.05107879638671875, 0.06496047973632812, 0.0788421630859375, 0.09272384643554688, 0.10660552978515625, 0.12048721313476562, 0.134368896484375, 0.14825057983398438, 0.16213226318359375, 0.17601394653320312, 0.1898956298828125, 0.20377731323242188, 0.21765899658203125, 0.23154067993164062, 0.24542236328125, 0.2593040466308594, 0.27318572998046875, 0.2870674133300781, 0.3009490966796875, 0.3148307800292969, 0.32871246337890625, 0.3425941467285156, 0.356475830078125, 0.3703575134277344, 0.38423919677734375, 0.3981208801269531, 0.4120025634765625, 0.4258842468261719, 0.43976593017578125, 0.4536476135253906, 0.467529296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 29.0, 114.0, 413.0, 360.0, 66.0, 14.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-18.472187042236328, -18.136234283447266, -17.800283432006836, -17.464330673217773, -17.128379821777344, -16.79242706298828, -16.45647621154785, -16.12052345275879, -15.784571647644043, -15.448619842529297, -15.11266803741455, -14.776716232299805, -14.440764427185059, -14.104812622070312, -13.76885986328125, -13.432908058166504, -13.096956253051758, -12.761004447937012, -12.425052642822266, -12.08910083770752, -11.753149032592773, -11.417196273803711, -11.081245422363281, -10.745292663574219, -10.409341812133789, -10.073390007019043, -9.737438201904297, -9.40148639678955, -9.065534591674805, -8.729581832885742, -8.393630981445312, -8.05767822265625, -7.721726417541504, -7.385774612426758, -7.049822807312012, -6.713871002197266, -6.377918720245361, -6.041966915130615, -5.706015110015869, -5.370062828063965, -5.034111022949219, -4.698159217834473, -4.362207412719727, -4.0262556076049805, -3.690303325653076, -3.35435152053833, -3.018399715423584, -2.682447671890259, -2.346496105194092, -2.0105443000793457, -1.6745922565460205, -1.3386404514312744, -1.0026885271072388, -0.6667366027832031, -0.33078479766845703, 0.005167245864868164, 0.34111905097961426, 0.6770709753036499, 1.0130228996276855, 1.3489747047424316, 1.6849266290664673, 2.020878553390503, 2.356830358505249, 2.692782402038574, 3.0287342071533203]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 3.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 32.0, 20.0, 30.0, 23.0, 28.0, 32.0, 51.0, 41.0, 30.0, 47.0, 60.0, 41.0, 41.0, 42.0, 47.0, 41.0, 35.0, 57.0, 43.0, 31.0, 29.0, 28.0, 15.0, 30.0, 14.0, 12.0, 13.0, 7.0, 10.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1834774017333984, -3.0944883823394775, -3.0054993629455566, -2.916510581970215, -2.827521562576294, -2.738532543182373, -2.649543523788452, -2.5605545043945312, -2.4715657234191895, -2.3825767040252686, -2.2935876846313477, -2.204598903656006, -2.115609884262085, -2.026620864868164, -1.9376318454742432, -1.8486428260803223, -1.7596538066864014, -1.6706647872924805, -1.5816758871078491, -1.4926868677139282, -1.4036979675292969, -1.314708948135376, -1.225719928741455, -1.1367309093475342, -1.0477420091629028, -0.9587530493736267, -0.8697640895843506, -0.7807750701904297, -0.6917861104011536, -0.6027971506118774, -0.5138081312179565, -0.4248191714286804, -0.3358302116394043, -0.24684123694896698, -0.15785226225852966, -0.06886327266693115, 0.02012568712234497, 0.1091146469116211, 0.198103666305542, 0.2870926260948181, 0.37608158588409424, 0.46507054567337036, 0.5540595054626465, 0.6430485248565674, 0.7320374846458435, 0.8210264444351196, 0.9100154638290405, 0.9990044236183167, 1.0879933834075928, 1.1769824028015137, 1.265971302986145, 1.354960322380066, 1.4439492225646973, 1.5329382419586182, 1.621927261352539, 1.71091628074646, 1.7999051809310913, 1.8888942003250122, 1.9778831005096436, 2.0668721199035645, 2.1558611392974854, 2.2448501586914062, 2.333838939666748, 2.422827959060669, 2.51181697845459]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 5.0, 8.0, 17.0, 18.0, 37.0, 60.0, 89.0, 143.0, 230.0, 358.0, 714.0, 1549.0, 4371.0, 21955.0, 3997562.0, 151801.0, 10216.0, 2729.0, 1069.0, 533.0, 300.0, 202.0, 106.0, 80.0, 47.0, 26.0, 18.0, 14.0, 11.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6250038146972656, -0.6088943481445312, -0.5927848815917969, -0.5766754150390625, -0.5605659484863281, -0.5444564819335938, -0.5283470153808594, -0.512237548828125, -0.4961280822753906, -0.48001861572265625, -0.4639091491699219, -0.4477996826171875, -0.4316902160644531, -0.41558074951171875, -0.3994712829589844, -0.38336181640625, -0.3672523498535156, -0.35114288330078125, -0.3350334167480469, -0.3189239501953125, -0.3028144836425781, -0.28670501708984375, -0.2705955505371094, -0.254486083984375, -0.23837661743164062, -0.22226715087890625, -0.20615768432617188, -0.1900482177734375, -0.17393875122070312, -0.15782928466796875, -0.14171981811523438, -0.1256103515625, -0.10950088500976562, -0.09339141845703125, -0.07728195190429688, -0.0611724853515625, -0.045063018798828125, -0.02895355224609375, -0.012844085693359375, 0.003265380859375, 0.019374847412109375, 0.03548431396484375, 0.051593780517578125, 0.0677032470703125, 0.08381271362304688, 0.09992218017578125, 0.11603164672851562, 0.13214111328125, 0.14825057983398438, 0.16436004638671875, 0.18046951293945312, 0.1965789794921875, 0.21268844604492188, 0.22879791259765625, 0.24490737915039062, 0.261016845703125, 0.2771263122558594, 0.29323577880859375, 0.3093452453613281, 0.3254547119140625, 0.3415641784667969, 0.35767364501953125, 0.3737831115722656, 0.389892578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 10.0, 6.0, 15.0, 20.0, 22.0, 29.0, 25.0, 39.0, 65.0, 58.0, 79.0, 79.0, 72.0, 65.0, 63.0, 71.0, 54.0, 46.0, 45.0, 37.0, 28.0, 27.0, 16.0, 8.0, 8.0, 5.0, 10.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1572265625, -0.15317344665527344, -0.14912033081054688, -0.1450672149658203, -0.14101409912109375, -0.1369609832763672, -0.13290786743164062, -0.12885475158691406, -0.1248016357421875, -0.12074851989746094, -0.11669540405273438, -0.11264228820800781, -0.10858917236328125, -0.10453605651855469, -0.10048294067382812, -0.09642982482910156, -0.092376708984375, -0.08832359313964844, -0.08427047729492188, -0.08021736145019531, -0.07616424560546875, -0.07211112976074219, -0.06805801391601562, -0.06400489807128906, -0.0599517822265625, -0.05589866638183594, -0.051845550537109375, -0.04779243469238281, -0.04373931884765625, -0.03968620300292969, -0.035633087158203125, -0.03157997131347656, -0.02752685546875, -0.023473739624023438, -0.019420623779296875, -0.015367507934570312, -0.01131439208984375, -0.0072612762451171875, -0.003208160400390625, 0.0008449554443359375, 0.0048980712890625, 0.008951187133789062, 0.013004302978515625, 0.017057418823242188, 0.02111053466796875, 0.025163650512695312, 0.029216766357421875, 0.03326988220214844, 0.037322998046875, 0.04137611389160156, 0.045429229736328125, 0.04948234558105469, 0.05353546142578125, 0.05758857727050781, 0.061641693115234375, 0.06569480895996094, 0.0697479248046875, 0.07380104064941406, 0.07785415649414062, 0.08190727233886719, 0.08596038818359375, 0.09001350402832031, 0.09406661987304688, 0.09811973571777344, 0.1021728515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 8.0, 12.0, 12.0, 28.0, 35.0, 24.0, 54.0, 66.0, 107.0, 148.0, 180.0, 249.0, 359.0, 508.0, 764.0, 1123.0, 2091.0, 4964.0, 15430.0, 110436.0, 3958032.0, 76783.0, 13005.0, 4427.0, 1967.0, 1111.0, 700.0, 458.0, 309.0, 216.0, 170.0, 149.0, 98.0, 48.0, 53.0, 49.0, 19.0, 24.0, 23.0, 6.0, 14.0, 1.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.4510002136230469, -0.43618011474609375, -0.4213600158691406, -0.4065399169921875, -0.3917198181152344, -0.37689971923828125, -0.3620796203613281, -0.347259521484375, -0.3324394226074219, -0.31761932373046875, -0.3027992248535156, -0.2879791259765625, -0.2731590270996094, -0.25833892822265625, -0.24351882934570312, -0.22869873046875, -0.21387863159179688, -0.19905853271484375, -0.18423843383789062, -0.1694183349609375, -0.15459823608398438, -0.13977813720703125, -0.12495803833007812, -0.110137939453125, -0.09531784057617188, -0.08049774169921875, -0.06567764282226562, -0.0508575439453125, -0.036037445068359375, -0.02121734619140625, -0.006397247314453125, 0.0084228515625, 0.023242950439453125, 0.03806304931640625, 0.052883148193359375, 0.0677032470703125, 0.08252334594726562, 0.09734344482421875, 0.11216354370117188, 0.126983642578125, 0.14180374145507812, 0.15662384033203125, 0.17144393920898438, 0.1862640380859375, 0.20108413696289062, 0.21590423583984375, 0.23072433471679688, 0.24554443359375, 0.2603645324707031, 0.27518463134765625, 0.2900047302246094, 0.3048248291015625, 0.3196449279785156, 0.33446502685546875, 0.3492851257324219, 0.364105224609375, 0.3789253234863281, 0.39374542236328125, 0.4085655212402344, 0.4233856201171875, 0.4382057189941406, 0.45302581787109375, 0.4678459167480469, 0.482666015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 19.0, 72.0, 445.0, 3269.0, 149.0, 62.0, 15.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1943359375, -0.18881607055664062, -0.18329620361328125, -0.17777633666992188, -0.1722564697265625, -0.16673660278320312, -0.16121673583984375, -0.15569686889648438, -0.150177001953125, -0.14465713500976562, -0.13913726806640625, -0.13361740112304688, -0.1280975341796875, -0.12257766723632812, -0.11705780029296875, -0.11153793334960938, -0.10601806640625, -0.10049819946289062, -0.09497833251953125, -0.08945846557617188, -0.0839385986328125, -0.07841873168945312, -0.07289886474609375, -0.06737899780273438, -0.061859130859375, -0.056339263916015625, -0.05081939697265625, -0.045299530029296875, -0.0397796630859375, -0.034259796142578125, -0.02873992919921875, -0.023220062255859375, -0.0177001953125, -0.012180328369140625, -0.00666046142578125, -0.001140594482421875, 0.0043792724609375, 0.009899139404296875, 0.01541900634765625, 0.020938873291015625, 0.026458740234375, 0.031978607177734375, 0.03749847412109375, 0.043018341064453125, 0.0485382080078125, 0.054058074951171875, 0.05957794189453125, 0.06509780883789062, 0.07061767578125, 0.07613754272460938, 0.08165740966796875, 0.08717727661132812, 0.0926971435546875, 0.09821701049804688, 0.10373687744140625, 0.10925674438476562, 0.114776611328125, 0.12029647827148438, 0.12581634521484375, 0.13133621215820312, 0.1368560791015625, 0.14237594604492188, 0.14789581298828125, 0.15341567993164062, 0.158935546875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 17.0, 14.0, 24.0, 55.0, 107.0, 140.0, 157.0, 149.0, 136.0, 72.0, 53.0, 28.0, 12.0, 12.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6229955554008484, -0.6078831553459167, -0.5927706956863403, -0.5776582956314087, -0.562545895576477, -0.5474334359169006, -0.532321035861969, -0.5172086358070374, -0.5020961761474609, -0.4869837462902069, -0.47187134623527527, -0.45675891637802124, -0.4416464865207672, -0.42653408646583557, -0.41142165660858154, -0.3963092565536499, -0.38119685649871826, -0.36608442664146423, -0.3509720265865326, -0.33585959672927856, -0.32074716687202454, -0.3056347668170929, -0.29052233695983887, -0.2754099369049072, -0.2602974772453308, -0.24518506228923798, -0.23007263243198395, -0.2149602174758911, -0.19984780251979828, -0.18473538756370544, -0.16962295770645142, -0.15451054275035858, -0.13939812779426575, -0.12428570538759232, -0.10917329043149948, -0.09406086802482605, -0.07894845306873322, -0.06383603066205978, -0.04872360825538635, -0.03361119329929352, -0.018498770892620087, -0.003386351279914379, 0.011726068332791328, 0.02683848887681961, 0.041950907558202744, 0.057063326239585876, 0.07217574864625931, 0.08728816360235214, 0.10240058600902557, 0.117513008415699, 0.13262543082237244, 0.14773784577846527, 0.1628502607345581, 0.17796269059181213, 0.19307510554790497, 0.2081875205039978, 0.22329995036125183, 0.23841236531734467, 0.2535247802734375, 0.26863721013069153, 0.28374963998794556, 0.2988620400428772, 0.3139744699001312, 0.32908689975738525, 0.3441992998123169]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 15.0, 7.0, 13.0, 11.0, 15.0, 29.0, 20.0, 29.0, 28.0, 35.0, 38.0, 39.0, 36.0, 48.0, 40.0, 43.0, 45.0, 42.0, 42.0, 42.0, 40.0, 34.0, 34.0, 44.0, 30.0, 34.0, 25.0, 18.0, 26.0, 20.0, 12.0, 14.0, 8.0, 8.0, 5.0, 1.0, 10.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25805431604385376, -0.24963845312595367, -0.2412225902080536, -0.2328067272901535, -0.22439086437225342, -0.21597498655319214, -0.20755912363529205, -0.19914326071739197, -0.19072739779949188, -0.1823115348815918, -0.1738956719636917, -0.16547980904579163, -0.15706393122673035, -0.14864808320999146, -0.14023220539093018, -0.1318163424730301, -0.12340047955513, -0.11498461663722992, -0.10656875371932983, -0.09815288335084915, -0.08973702043294907, -0.08132115751504898, -0.0729052871465683, -0.06448942422866821, -0.05607356131076813, -0.04765769839286804, -0.03924183174967766, -0.030825966969132423, -0.02241010218858719, -0.013994239270687103, -0.005578372627496719, 0.0028374940156936646, 0.01125335693359375, 0.019669221714138985, 0.02808508649468422, 0.0365009531378746, 0.04491681605577469, 0.053332678973674774, 0.06174854561686516, 0.07016441226005554, 0.07858027517795563, 0.08699613809585571, 0.0954120010137558, 0.10382787138223648, 0.11224373430013657, 0.12065959721803665, 0.12907546758651733, 0.13749133050441742, 0.1459071934223175, 0.1543230563402176, 0.16273891925811768, 0.17115478217601776, 0.17957064509391785, 0.18798652291297913, 0.1964023858308792, 0.2048182487487793, 0.21323411166667938, 0.22164997458457947, 0.23006583750247955, 0.23848170042037964, 0.24689757823944092, 0.2553134262561798, 0.2637293040752411, 0.27214515209198, 0.28056102991104126]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 8.0, 9.0, 13.0, 30.0, 31.0, 70.0, 126.0, 190.0, 368.0, 784.0, 1656.0, 3779.0, 10519.0, 35390.0, 188160.0, 602514.0, 157818.0, 30978.0, 9590.0, 3486.0, 1497.0, 695.0, 378.0, 183.0, 114.0, 66.0, 31.0, 17.0, 17.0, 9.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4077873229980469, -0.39345550537109375, -0.3791236877441406, -0.3647918701171875, -0.3504600524902344, -0.33612823486328125, -0.3217964172363281, -0.307464599609375, -0.2931327819824219, -0.27880096435546875, -0.2644691467285156, -0.2501373291015625, -0.23580551147460938, -0.22147369384765625, -0.20714187622070312, -0.19281005859375, -0.17847824096679688, -0.16414642333984375, -0.14981460571289062, -0.1354827880859375, -0.12115097045898438, -0.10681915283203125, -0.09248733520507812, -0.078155517578125, -0.06382369995117188, -0.04949188232421875, -0.035160064697265625, -0.0208282470703125, -0.006496429443359375, 0.00783538818359375, 0.022167205810546875, 0.0364990234375, 0.050830841064453125, 0.06516265869140625, 0.07949447631835938, 0.0938262939453125, 0.10815811157226562, 0.12248992919921875, 0.13682174682617188, 0.151153564453125, 0.16548538208007812, 0.17981719970703125, 0.19414901733398438, 0.2084808349609375, 0.22281265258789062, 0.23714447021484375, 0.2514762878417969, 0.26580810546875, 0.2801399230957031, 0.29447174072265625, 0.3088035583496094, 0.3231353759765625, 0.3374671936035156, 0.35179901123046875, 0.3661308288574219, 0.380462646484375, 0.3947944641113281, 0.40912628173828125, 0.4234580993652344, 0.4377899169921875, 0.4521217346191406, 0.46645355224609375, 0.4807853698730469, 0.4951171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 10.0, 19.0, 18.0, 23.0, 29.0, 23.0, 27.0, 41.0, 63.0, 53.0, 81.0, 64.0, 86.0, 70.0, 62.0, 53.0, 56.0, 48.0, 38.0, 40.0, 27.0, 17.0, 11.0, 14.0, 12.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1629638671875, -0.15884017944335938, -0.15471649169921875, -0.15059280395507812, -0.1464691162109375, -0.14234542846679688, -0.13822174072265625, -0.13409805297851562, -0.129974365234375, -0.12585067749023438, -0.12172698974609375, -0.11760330200195312, -0.1134796142578125, -0.10935592651367188, -0.10523223876953125, -0.10110855102539062, -0.09698486328125, -0.09286117553710938, -0.08873748779296875, -0.08461380004882812, -0.0804901123046875, -0.07636642456054688, -0.07224273681640625, -0.06811904907226562, -0.063995361328125, -0.059871673583984375, -0.05574798583984375, -0.051624298095703125, -0.0475006103515625, -0.043376922607421875, -0.03925323486328125, -0.035129547119140625, -0.031005859375, -0.026882171630859375, -0.02275848388671875, -0.018634796142578125, -0.0145111083984375, -0.010387420654296875, -0.00626373291015625, -0.002140045166015625, 0.001983642578125, 0.006107330322265625, 0.01023101806640625, 0.014354705810546875, 0.0184783935546875, 0.022602081298828125, 0.02672576904296875, 0.030849456787109375, 0.03497314453125, 0.039096832275390625, 0.04322052001953125, 0.047344207763671875, 0.0514678955078125, 0.055591583251953125, 0.05971527099609375, 0.06383895874023438, 0.067962646484375, 0.07208633422851562, 0.07621002197265625, 0.08033370971679688, 0.0844573974609375, 0.08858108520507812, 0.09270477294921875, 0.09682846069335938, 0.1009521484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 4.0, 12.0, 10.0, 23.0, 20.0, 26.0, 35.0, 55.0, 99.0, 134.0, 230.0, 333.0, 556.0, 921.0, 1707.0, 3545.0, 8304.0, 27038.0, 147167.0, 654281.0, 159162.0, 28331.0, 8665.0, 3636.0, 1730.0, 959.0, 575.0, 357.0, 195.0, 134.0, 97.0, 51.0, 53.0, 20.0, 20.0, 12.0, 9.0, 13.0, 8.0, 7.0, 2.0, 1.0, 6.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4716796875, -0.4567146301269531, -0.44174957275390625, -0.4267845153808594, -0.4118194580078125, -0.3968544006347656, -0.38188934326171875, -0.3669242858886719, -0.351959228515625, -0.3369941711425781, -0.32202911376953125, -0.3070640563964844, -0.2920989990234375, -0.2771339416503906, -0.26216888427734375, -0.24720382690429688, -0.23223876953125, -0.21727371215820312, -0.20230865478515625, -0.18734359741210938, -0.1723785400390625, -0.15741348266601562, -0.14244842529296875, -0.12748336791992188, -0.112518310546875, -0.09755325317382812, -0.08258819580078125, -0.06762313842773438, -0.0526580810546875, -0.037693023681640625, -0.02272796630859375, -0.007762908935546875, 0.0072021484375, 0.022167205810546875, 0.03713226318359375, 0.052097320556640625, 0.0670623779296875, 0.08202743530273438, 0.09699249267578125, 0.11195755004882812, 0.126922607421875, 0.14188766479492188, 0.15685272216796875, 0.17181777954101562, 0.1867828369140625, 0.20174789428710938, 0.21671295166015625, 0.23167800903320312, 0.24664306640625, 0.2616081237792969, 0.27657318115234375, 0.2915382385253906, 0.3065032958984375, 0.3214683532714844, 0.33643341064453125, 0.3513984680175781, 0.366363525390625, 0.3813285827636719, 0.39629364013671875, 0.4112586975097656, 0.4262237548828125, 0.4411888122558594, 0.45615386962890625, 0.4711189270019531, 0.486083984375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 6.0, 10.0, 15.0, 13.0, 37.0, 34.0, 35.0, 48.0, 48.0, 54.0, 69.0, 72.0, 59.0, 74.0, 65.0, 65.0, 49.0, 49.0, 42.0, 30.0, 28.0, 25.0, 19.0, 14.0, 10.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68994140625, -0.6648635864257812, -0.6397857666015625, -0.6147079467773438, -0.589630126953125, -0.5645523071289062, -0.5394744873046875, -0.5143966674804688, -0.48931884765625, -0.46424102783203125, -0.4391632080078125, -0.41408538818359375, -0.389007568359375, -0.36392974853515625, -0.3388519287109375, -0.31377410888671875, -0.2886962890625, -0.26361846923828125, -0.2385406494140625, -0.21346282958984375, -0.188385009765625, -0.16330718994140625, -0.1382293701171875, -0.11315155029296875, -0.08807373046875, -0.06299591064453125, -0.0379180908203125, -0.01284027099609375, 0.012237548828125, 0.03731536865234375, 0.0623931884765625, 0.08747100830078125, 0.112548828125, 0.13762664794921875, 0.1627044677734375, 0.18778228759765625, 0.212860107421875, 0.23793792724609375, 0.2630157470703125, 0.28809356689453125, 0.31317138671875, 0.33824920654296875, 0.3633270263671875, 0.38840484619140625, 0.413482666015625, 0.43856048583984375, 0.4636383056640625, 0.48871612548828125, 0.5137939453125, 0.5388717651367188, 0.5639495849609375, 0.5890274047851562, 0.614105224609375, 0.6391830444335938, 0.6642608642578125, 0.6893386840820312, 0.71441650390625, 0.7394943237304688, 0.7645721435546875, 0.7896499633789062, 0.814727783203125, 0.8398056030273438, 0.8648834228515625, 0.8899612426757812, 0.9150390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 21.0, 21.0, 30.0, 68.0, 132.0, 243.0, 736.0, 2845.0, 32082.0, 969000.0, 39054.0, 3006.0, 755.0, 283.0, 113.0, 72.0, 33.0, 24.0, 11.0, 9.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.41339874267578125, -0.3922271728515625, -0.37105560302734375, -0.349884033203125, -0.32871246337890625, -0.3075408935546875, -0.28636932373046875, -0.26519775390625, -0.24402618408203125, -0.2228546142578125, -0.20168304443359375, -0.180511474609375, -0.15933990478515625, -0.1381683349609375, -0.11699676513671875, -0.0958251953125, -0.07465362548828125, -0.0534820556640625, -0.03231048583984375, -0.011138916015625, 0.01003265380859375, 0.0312042236328125, 0.05237579345703125, 0.07354736328125, 0.09471893310546875, 0.1158905029296875, 0.13706207275390625, 0.158233642578125, 0.17940521240234375, 0.2005767822265625, 0.22174835205078125, 0.242919921875, 0.26409149169921875, 0.2852630615234375, 0.30643463134765625, 0.327606201171875, 0.34877777099609375, 0.3699493408203125, 0.39112091064453125, 0.41229248046875, 0.43346405029296875, 0.4546356201171875, 0.47580718994140625, 0.496978759765625, 0.5181503295898438, 0.5393218994140625, 0.5604934692382812, 0.5816650390625, 0.6028366088867188, 0.6240081787109375, 0.6451797485351562, 0.666351318359375, 0.6875228881835938, 0.7086944580078125, 0.7298660278320312, 0.75103759765625, 0.7722091674804688, 0.7933807373046875, 0.8145523071289062, 0.835723876953125, 0.8568954467773438, 0.8780670166015625, 0.8992385864257812, 0.92041015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 14.0, 10.0, 29.0, 53.0, 62.0, 102.0, 146.0, 186.0, 144.0, 108.0, 62.0, 29.0, 18.0, 17.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020694732666015625, -0.00020056962966918945, -0.00019419193267822266, -0.00018781423568725586, -0.00018143653869628906, -0.00017505884170532227, -0.00016868114471435547, -0.00016230344772338867, -0.00015592575073242188, -0.00014954805374145508, -0.00014317035675048828, -0.00013679265975952148, -0.0001304149627685547, -0.0001240372657775879, -0.0001176595687866211, -0.0001112818717956543, -0.0001049041748046875, -9.85264778137207e-05, -9.21487808227539e-05, -8.577108383178711e-05, -7.939338684082031e-05, -7.301568984985352e-05, -6.663799285888672e-05, -6.026029586791992e-05, -5.3882598876953125e-05, -4.750490188598633e-05, -4.112720489501953e-05, -3.4749507904052734e-05, -2.8371810913085938e-05, -2.199411392211914e-05, -1.5616416931152344e-05, -9.238719940185547e-06, -2.86102294921875e-06, 3.516674041748047e-06, 9.894371032714844e-06, 1.627206802368164e-05, 2.2649765014648438e-05, 2.9027462005615234e-05, 3.540515899658203e-05, 4.178285598754883e-05, 4.8160552978515625e-05, 5.453824996948242e-05, 6.091594696044922e-05, 6.729364395141602e-05, 7.367134094238281e-05, 8.004903793334961e-05, 8.64267349243164e-05, 9.28044319152832e-05, 9.918212890625e-05, 0.0001055598258972168, 0.0001119375228881836, 0.00011831521987915039, 0.0001246929168701172, 0.00013107061386108398, 0.00013744831085205078, 0.00014382600784301758, 0.00015020370483398438, 0.00015658140182495117, 0.00016295909881591797, 0.00016933679580688477, 0.00017571449279785156, 0.00018209218978881836, 0.00018846988677978516, 0.00019484758377075195, 0.00020122528076171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 6.0, 2.0, 8.0, 9.0, 19.0, 20.0, 33.0, 49.0, 83.0, 164.0, 280.0, 564.0, 1280.0, 3651.0, 16292.0, 219629.0, 750166.0, 45604.0, 6929.0, 2033.0, 833.0, 398.0, 185.0, 114.0, 69.0, 46.0, 21.0, 16.0, 12.0, 10.0, 12.0, 9.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.32464599609375, -0.3145751953125, -0.30450439453125, -0.29443359375, -0.28436279296875, -0.2742919921875, -0.26422119140625, -0.254150390625, -0.24407958984375, -0.2340087890625, -0.22393798828125, -0.2138671875, -0.20379638671875, -0.1937255859375, -0.18365478515625, -0.173583984375, -0.16351318359375, -0.1534423828125, -0.14337158203125, -0.13330078125, -0.12322998046875, -0.1131591796875, -0.10308837890625, -0.093017578125, -0.08294677734375, -0.0728759765625, -0.06280517578125, -0.052734375, -0.04266357421875, -0.0325927734375, -0.02252197265625, -0.012451171875, -0.00238037109375, 0.0076904296875, 0.01776123046875, 0.02783203125, 0.03790283203125, 0.0479736328125, 0.05804443359375, 0.068115234375, 0.07818603515625, 0.0882568359375, 0.09832763671875, 0.1083984375, 0.11846923828125, 0.1285400390625, 0.13861083984375, 0.148681640625, 0.15875244140625, 0.1688232421875, 0.17889404296875, 0.18896484375, 0.19903564453125, 0.2091064453125, 0.21917724609375, 0.229248046875, 0.23931884765625, 0.2493896484375, 0.25946044921875, 0.26953125, 0.27960205078125, 0.2896728515625, 0.29974365234375, 0.309814453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 9.0, 15.0, 23.0, 22.0, 25.0, 36.0, 56.0, 88.0, 128.0, 130.0, 133.0, 81.0, 57.0, 45.0, 34.0, 29.0, 21.0, 10.0, 10.0, 5.0, 2.0, 11.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37158203125, -0.3608589172363281, -0.35013580322265625, -0.3394126892089844, -0.3286895751953125, -0.3179664611816406, -0.30724334716796875, -0.2965202331542969, -0.285797119140625, -0.2750740051269531, -0.26435089111328125, -0.2536277770996094, -0.2429046630859375, -0.23218154907226562, -0.22145843505859375, -0.21073532104492188, -0.20001220703125, -0.18928909301757812, -0.17856597900390625, -0.16784286499023438, -0.1571197509765625, -0.14639663696289062, -0.13567352294921875, -0.12495040893554688, -0.114227294921875, -0.10350418090820312, -0.09278106689453125, -0.08205795288085938, -0.0713348388671875, -0.060611724853515625, -0.04988861083984375, -0.039165496826171875, -0.0284423828125, -0.017719268798828125, -0.00699615478515625, 0.003726959228515625, 0.0144500732421875, 0.025173187255859375, 0.03589630126953125, 0.046619415283203125, 0.057342529296875, 0.06806564331054688, 0.07878875732421875, 0.08951187133789062, 0.1002349853515625, 0.11095809936523438, 0.12168121337890625, 0.13240432739257812, 0.14312744140625, 0.15385055541992188, 0.16457366943359375, 0.17529678344726562, 0.1860198974609375, 0.19674301147460938, 0.20746612548828125, 0.21818923950195312, 0.228912353515625, 0.23963546752929688, 0.25035858154296875, 0.2610816955566406, 0.2718048095703125, 0.2825279235839844, 0.29325103759765625, 0.3039741516113281, 0.314697265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 4.0, 20.0, 53.0, 119.0, 222.0, 278.0, 177.0, 75.0, 28.0, 13.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.642379760742188, -9.41045093536377, -9.178521156311035, -8.946592330932617, -8.714662551879883, -8.482733726501465, -8.25080394744873, -8.018875122070312, -7.786945343017578, -7.555016040802002, -7.323086738586426, -7.09115743637085, -6.859228134155273, -6.627298831939697, -6.395369529724121, -6.163440704345703, -5.931511402130127, -5.699582099914551, -5.467652797698975, -5.235723495483398, -5.003794193267822, -4.771864891052246, -4.539936065673828, -4.308006286621094, -4.076077461242676, -3.8441481590270996, -3.6122188568115234, -3.3802895545959473, -3.148360252380371, -2.916430950164795, -2.684501886367798, -2.4525725841522217, -2.2206435203552246, -1.9887142181396484, -1.7567849159240723, -1.5248557329177856, -1.2929264307022095, -1.0609971284866333, -0.8290679454803467, -0.5971386432647705, -0.36520934104919434, -0.13328006863594055, 0.09864920377731323, 0.33057844638824463, 0.5625077486038208, 0.794437050819397, 1.0263662338256836, 1.2582955360412598, 1.490224838256836, 1.722154140472412, 1.9540834426879883, 2.1860127449035645, 2.4179420471191406, 2.649871349334717, 2.881800413131714, 3.11372971534729, 3.345659017562866, 3.5775883197784424, 3.8095176219940186, 4.041446685791016, 4.273375988006592, 4.505305290222168, 4.737234592437744, 4.96916389465332, 5.2010931968688965]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 6.0, 4.0, 3.0, 12.0, 12.0, 12.0, 6.0, 17.0, 19.0, 21.0, 30.0, 30.0, 28.0, 44.0, 42.0, 46.0, 48.0, 44.0, 46.0, 49.0, 61.0, 47.0, 59.0, 42.0, 46.0, 44.0, 28.0, 23.0, 20.0, 21.0, 18.0, 14.0, 13.0, 10.0, 7.0, 5.0, 6.0, 6.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1959125995635986, -3.0993895530700684, -3.002866268157959, -2.9063432216644287, -2.8098199367523193, -2.713296890258789, -2.6167736053466797, -2.5202505588531494, -2.423727512359619, -2.327204465866089, -2.2306811809539795, -2.134158134460449, -2.03763484954834, -1.9411118030548096, -1.8445886373519897, -1.74806547164917, -1.6515421867370605, -1.5550190210342407, -1.458495855331421, -1.3619728088378906, -1.2654495239257812, -1.168926477432251, -1.0724033117294312, -0.9758801460266113, -0.8793569803237915, -0.7828338146209717, -0.6863106489181519, -0.5897875428199768, -0.493264377117157, -0.39674121141433716, -0.3002181053161621, -0.20369493961334229, -0.10717201232910156, -0.010648861527442932, 0.0858742892742157, 0.18239742517471313, 0.27892059087753296, 0.3754437565803528, 0.47196686267852783, 0.5684900283813477, 0.6650131940841675, 0.7615363597869873, 0.8580595254898071, 0.9545826315879822, 1.0511057376861572, 1.1476290225982666, 1.2441520690917969, 1.3406752347946167, 1.4371984004974365, 1.5337215662002563, 1.6302447319030762, 1.7267677783966064, 1.8232910633087158, 1.919814109802246, 2.0163373947143555, 2.1128604412078857, 2.209383487701416, 2.3059065341949463, 2.4024298191070557, 2.498952865600586, 2.5954761505126953, 2.6919991970062256, 2.788522243499756, 2.8850455284118652, 2.9815688133239746]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 6.0, 7.0, 8.0, 14.0, 14.0, 23.0, 33.0, 61.0, 80.0, 110.0, 220.0, 332.0, 611.0, 1188.0, 2708.0, 7137.0, 31063.0, 3952858.0, 173193.0, 15834.0, 4709.0, 1974.0, 922.0, 467.0, 287.0, 142.0, 92.0, 74.0, 35.0, 21.0, 17.0, 12.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7001953125, -0.6830329895019531, -0.6658706665039062, -0.6487083435058594, -0.6315460205078125, -0.6143836975097656, -0.5972213745117188, -0.5800590515136719, -0.562896728515625, -0.5457344055175781, -0.5285720825195312, -0.5114097595214844, -0.4942474365234375, -0.4770851135253906, -0.45992279052734375, -0.4427604675292969, -0.42559814453125, -0.4084358215332031, -0.39127349853515625, -0.3741111755371094, -0.3569488525390625, -0.3397865295410156, -0.32262420654296875, -0.3054618835449219, -0.288299560546875, -0.2711372375488281, -0.25397491455078125, -0.23681259155273438, -0.2196502685546875, -0.20248794555664062, -0.18532562255859375, -0.16816329956054688, -0.1510009765625, -0.13383865356445312, -0.11667633056640625, -0.09951400756835938, -0.0823516845703125, -0.06518936157226562, -0.04802703857421875, -0.030864715576171875, -0.013702392578125, 0.003459930419921875, 0.02062225341796875, 0.037784576416015625, 0.0549468994140625, 0.07210922241210938, 0.08927154541015625, 0.10643386840820312, 0.12359619140625, 0.14075851440429688, 0.15792083740234375, 0.17508316040039062, 0.1922454833984375, 0.20940780639648438, 0.22657012939453125, 0.24373245239257812, 0.260894775390625, 0.2780570983886719, 0.29521942138671875, 0.3123817443847656, 0.3295440673828125, 0.3467063903808594, 0.36386871337890625, 0.3810310363769531, 0.398193359375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 7.0, 13.0, 17.0, 23.0, 31.0, 35.0, 46.0, 49.0, 70.0, 74.0, 84.0, 83.0, 63.0, 75.0, 71.0, 59.0, 46.0, 42.0, 24.0, 27.0, 19.0, 11.0, 12.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.212158203125, -0.20728492736816406, -0.20241165161132812, -0.1975383758544922, -0.19266510009765625, -0.1877918243408203, -0.18291854858398438, -0.17804527282714844, -0.1731719970703125, -0.16829872131347656, -0.16342544555664062, -0.1585521697998047, -0.15367889404296875, -0.1488056182861328, -0.14393234252929688, -0.13905906677246094, -0.134185791015625, -0.12931251525878906, -0.12443923950195312, -0.11956596374511719, -0.11469268798828125, -0.10981941223144531, -0.10494613647460938, -0.10007286071777344, -0.0951995849609375, -0.09032630920410156, -0.08545303344726562, -0.08057975769042969, -0.07570648193359375, -0.07083320617675781, -0.06595993041992188, -0.06108665466308594, -0.05621337890625, -0.05134010314941406, -0.046466827392578125, -0.04159355163574219, -0.03672027587890625, -0.03184700012207031, -0.026973724365234375, -0.022100448608398438, -0.0172271728515625, -0.012353897094726562, -0.007480621337890625, -0.0026073455810546875, 0.00226593017578125, 0.0071392059326171875, 0.012012481689453125, 0.016885757446289062, 0.021759033203125, 0.026632308959960938, 0.031505584716796875, 0.03637886047363281, 0.04125213623046875, 0.04612541198730469, 0.050998687744140625, 0.05587196350097656, 0.0607452392578125, 0.06561851501464844, 0.07049179077148438, 0.07536506652832031, 0.08023834228515625, 0.08511161804199219, 0.08998489379882812, 0.09485816955566406, 0.0997314453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 12.0, 7.0, 25.0, 21.0, 46.0, 51.0, 68.0, 100.0, 145.0, 187.0, 250.0, 434.0, 606.0, 966.0, 1687.0, 3049.0, 6478.0, 19508.0, 124772.0, 3913656.0, 92330.0, 16845.0, 5885.0, 2788.0, 1518.0, 886.0, 605.0, 413.0, 242.0, 205.0, 101.0, 107.0, 79.0, 60.0, 35.0, 30.0, 19.0, 19.0, 14.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.57470703125, -0.5569915771484375, -0.539276123046875, -0.5215606689453125, -0.50384521484375, -0.4861297607421875, -0.468414306640625, -0.4506988525390625, -0.4329833984375, -0.4152679443359375, -0.397552490234375, -0.3798370361328125, -0.36212158203125, -0.3444061279296875, -0.326690673828125, -0.3089752197265625, -0.291259765625, -0.2735443115234375, -0.255828857421875, -0.2381134033203125, -0.22039794921875, -0.2026824951171875, -0.184967041015625, -0.1672515869140625, -0.1495361328125, -0.1318206787109375, -0.114105224609375, -0.0963897705078125, -0.07867431640625, -0.0609588623046875, -0.043243408203125, -0.0255279541015625, -0.0078125, 0.0099029541015625, 0.027618408203125, 0.0453338623046875, 0.06304931640625, 0.0807647705078125, 0.098480224609375, 0.1161956787109375, 0.1339111328125, 0.1516265869140625, 0.169342041015625, 0.1870574951171875, 0.20477294921875, 0.2224884033203125, 0.240203857421875, 0.2579193115234375, 0.275634765625, 0.2933502197265625, 0.311065673828125, 0.3287811279296875, 0.34649658203125, 0.3642120361328125, 0.381927490234375, 0.3996429443359375, 0.4173583984375, 0.4350738525390625, 0.452789306640625, 0.4705047607421875, 0.48822021484375, 0.5059356689453125, 0.523651123046875, 0.5413665771484375, 0.55908203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 28.0, 70.0, 208.0, 3332.0, 278.0, 66.0, 31.0, 10.0, 11.0, 7.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3038444519042969, -0.29616546630859375, -0.2884864807128906, -0.2808074951171875, -0.2731285095214844, -0.26544952392578125, -0.2577705383300781, -0.250091552734375, -0.24241256713867188, -0.23473358154296875, -0.22705459594726562, -0.2193756103515625, -0.21169662475585938, -0.20401763916015625, -0.19633865356445312, -0.18865966796875, -0.18098068237304688, -0.17330169677734375, -0.16562271118164062, -0.1579437255859375, -0.15026473999023438, -0.14258575439453125, -0.13490676879882812, -0.127227783203125, -0.11954879760742188, -0.11186981201171875, -0.10419082641601562, -0.0965118408203125, -0.08883285522460938, -0.08115386962890625, -0.07347488403320312, -0.0657958984375, -0.058116912841796875, -0.05043792724609375, -0.042758941650390625, -0.0350799560546875, -0.027400970458984375, -0.01972198486328125, -0.012042999267578125, -0.004364013671875, 0.003314971923828125, 0.01099395751953125, 0.018672943115234375, 0.0263519287109375, 0.034030914306640625, 0.04170989990234375, 0.049388885498046875, 0.05706787109375, 0.06474685668945312, 0.07242584228515625, 0.08010482788085938, 0.0877838134765625, 0.09546279907226562, 0.10314178466796875, 0.11082077026367188, 0.118499755859375, 0.12617874145507812, 0.13385772705078125, 0.14153671264648438, 0.1492156982421875, 0.15689468383789062, 0.16457366943359375, 0.17225265502929688, 0.179931640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 9.0, 18.0, 44.0, 51.0, 153.0, 167.0, 219.0, 167.0, 80.0, 50.0, 29.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7165275812149048, -1.682455062866211, -1.6483824253082275, -1.6143099069595337, -1.5802373886108398, -1.5461647510528564, -1.5120922327041626, -1.4780197143554688, -1.4439470767974854, -1.4098745584487915, -1.375801920890808, -1.3417294025421143, -1.3076568841934204, -1.2735843658447266, -1.2395117282867432, -1.2054392099380493, -1.1713666915893555, -1.1372941732406616, -1.1032215356826782, -1.0691490173339844, -1.0350764989852905, -1.0010039806365967, -0.9669313430786133, -0.9328588247299194, -0.8987862467765808, -0.8647136688232422, -0.8306411504745483, -0.7965685725212097, -0.7624959945678711, -0.7284234762191772, -0.6943508982658386, -0.6602783203125, -0.6262056827545166, -0.592133104801178, -0.5580605864524841, -0.5239880084991455, -0.4899154603481293, -0.45584291219711304, -0.4217703342437744, -0.3876977860927582, -0.35362523794174194, -0.3195526897907257, -0.2854801416397095, -0.25140756368637085, -0.21733501553535461, -0.18326246738433838, -0.14918990433216095, -0.11511734127998352, -0.08104479312896729, -0.04697223752737045, -0.01289968192577362, 0.02117287367582321, 0.055245429277420044, 0.08931797742843628, 0.12339054048061371, 0.15746310353279114, 0.19153565168380737, 0.2256081998348236, 0.25968074798583984, 0.29375332593917847, 0.3278258740901947, 0.36189842224121094, 0.39597100019454956, 0.4300435483455658, 0.46411609649658203]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 9.0, 6.0, 12.0, 21.0, 21.0, 21.0, 21.0, 23.0, 26.0, 22.0, 26.0, 47.0, 53.0, 45.0, 39.0, 39.0, 45.0, 44.0, 55.0, 55.0, 35.0, 40.0, 32.0, 45.0, 34.0, 31.0, 20.0, 27.0, 21.0, 16.0, 12.0, 12.0, 9.0, 11.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.45489203929901123, -0.4417952001094818, -0.4286983609199524, -0.41560155153274536, -0.40250471234321594, -0.3894078731536865, -0.3763110339641571, -0.3632141947746277, -0.35011738538742065, -0.33702054619789124, -0.3239237070083618, -0.3108268976211548, -0.29773005843162537, -0.28463321924209595, -0.27153638005256653, -0.2584395408630371, -0.24534271657466888, -0.23224587738513947, -0.21914905309677124, -0.20605221390724182, -0.1929553896188736, -0.17985855042934418, -0.16676172614097595, -0.15366488695144653, -0.14056804776191711, -0.1274712085723877, -0.11437438428401947, -0.10127754509449005, -0.08818072080612183, -0.07508388161659241, -0.061987049877643585, -0.04889021813869476, -0.03579339385032654, -0.022696562111377716, -0.009599728509783745, 0.0034971050918102264, 0.01659393683075905, 0.02969077229499817, 0.04278760403394699, 0.05588443577289581, 0.06898126751184464, 0.08207809925079346, 0.09517493098974228, 0.1082717627286911, 0.12136860191822052, 0.13446542620658875, 0.14756226539611816, 0.16065910458564758, 0.1737559288740158, 0.18685276806354523, 0.19994959235191345, 0.21304643154144287, 0.2261432558298111, 0.23924009501934052, 0.25233691930770874, 0.26543375849723816, 0.2785305976867676, 0.291627436876297, 0.3047242760658264, 0.31782108545303345, 0.33091792464256287, 0.3440147638320923, 0.3571116030216217, 0.3702084422111511, 0.38330525159835815]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 11.0, 9.0, 10.0, 16.0, 22.0, 49.0, 88.0, 152.0, 299.0, 522.0, 1137.0, 2294.0, 5345.0, 14581.0, 54679.0, 318271.0, 516207.0, 99080.0, 22287.0, 7444.0, 3089.0, 1390.0, 751.0, 380.0, 201.0, 97.0, 58.0, 33.0, 14.0, 3.0, 14.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.484375, -0.4697761535644531, -0.45517730712890625, -0.4405784606933594, -0.4259796142578125, -0.4113807678222656, -0.39678192138671875, -0.3821830749511719, -0.367584228515625, -0.3529853820800781, -0.33838653564453125, -0.3237876892089844, -0.3091888427734375, -0.2945899963378906, -0.27999114990234375, -0.2653923034667969, -0.25079345703125, -0.23619461059570312, -0.22159576416015625, -0.20699691772460938, -0.1923980712890625, -0.17779922485351562, -0.16320037841796875, -0.14860153198242188, -0.134002685546875, -0.11940383911132812, -0.10480499267578125, -0.09020614624023438, -0.0756072998046875, -0.061008453369140625, -0.04640960693359375, -0.031810760498046875, -0.0172119140625, -0.002613067626953125, 0.01198577880859375, 0.026584625244140625, 0.0411834716796875, 0.055782318115234375, 0.07038116455078125, 0.08498001098632812, 0.099578857421875, 0.11417770385742188, 0.12877655029296875, 0.14337539672851562, 0.1579742431640625, 0.17257308959960938, 0.18717193603515625, 0.20177078247070312, 0.21636962890625, 0.23096847534179688, 0.24556732177734375, 0.2601661682128906, 0.2747650146484375, 0.2893638610839844, 0.30396270751953125, 0.3185615539550781, 0.333160400390625, 0.3477592468261719, 0.36235809326171875, 0.3769569396972656, 0.3915557861328125, 0.4061546325683594, 0.42075347900390625, 0.4353523254394531, 0.449951171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 9.0, 9.0, 8.0, 19.0, 25.0, 21.0, 28.0, 38.0, 43.0, 46.0, 62.0, 60.0, 52.0, 75.0, 71.0, 62.0, 63.0, 55.0, 57.0, 44.0, 34.0, 20.0, 24.0, 17.0, 15.0, 15.0, 13.0, 8.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.189208984375, -0.1845846176147461, -0.1799602508544922, -0.17533588409423828, -0.17071151733398438, -0.16608715057373047, -0.16146278381347656, -0.15683841705322266, -0.15221405029296875, -0.14758968353271484, -0.14296531677246094, -0.13834095001220703, -0.13371658325195312, -0.12909221649169922, -0.12446784973144531, -0.1198434829711914, -0.1152191162109375, -0.1105947494506836, -0.10597038269042969, -0.10134601593017578, -0.09672164916992188, -0.09209728240966797, -0.08747291564941406, -0.08284854888916016, -0.07822418212890625, -0.07359981536865234, -0.06897544860839844, -0.06435108184814453, -0.059726715087890625, -0.05510234832763672, -0.05047798156738281, -0.045853614807128906, -0.041229248046875, -0.036604881286621094, -0.03198051452636719, -0.02735614776611328, -0.022731781005859375, -0.01810741424560547, -0.013483047485351562, -0.008858680725097656, -0.00423431396484375, 0.00039005279541015625, 0.0050144195556640625, 0.009638786315917969, 0.014263153076171875, 0.01888751983642578, 0.023511886596679688, 0.028136253356933594, 0.0327606201171875, 0.037384986877441406, 0.04200935363769531, 0.04663372039794922, 0.051258087158203125, 0.05588245391845703, 0.06050682067871094, 0.06513118743896484, 0.06975555419921875, 0.07437992095947266, 0.07900428771972656, 0.08362865447998047, 0.08825302124023438, 0.09287738800048828, 0.09750175476074219, 0.1021261215209961, 0.10675048828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 6.0, 13.0, 18.0, 23.0, 37.0, 59.0, 107.0, 208.0, 350.0, 800.0, 2434.0, 12181.0, 402013.0, 611154.0, 14658.0, 2747.0, 878.0, 356.0, 203.0, 106.0, 68.0, 50.0, 21.0, 14.0, 16.0, 8.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99169921875, -0.9536209106445312, -0.9155426025390625, -0.8774642944335938, -0.839385986328125, -0.8013076782226562, -0.7632293701171875, -0.7251510620117188, -0.68707275390625, -0.6489944458007812, -0.6109161376953125, -0.5728378295898438, -0.534759521484375, -0.49668121337890625, -0.4586029052734375, -0.42052459716796875, -0.3824462890625, -0.34436798095703125, -0.3062896728515625, -0.26821136474609375, -0.230133056640625, -0.19205474853515625, -0.1539764404296875, -0.11589813232421875, -0.07781982421875, -0.03974151611328125, -0.0016632080078125, 0.03641510009765625, 0.074493408203125, 0.11257171630859375, 0.1506500244140625, 0.18872833251953125, 0.226806640625, 0.26488494873046875, 0.3029632568359375, 0.34104156494140625, 0.379119873046875, 0.41719818115234375, 0.4552764892578125, 0.49335479736328125, 0.53143310546875, 0.5695114135742188, 0.6075897216796875, 0.6456680297851562, 0.683746337890625, 0.7218246459960938, 0.7599029541015625, 0.7979812622070312, 0.8360595703125, 0.8741378784179688, 0.9122161865234375, 0.9502944946289062, 0.988372802734375, 1.0264511108398438, 1.0645294189453125, 1.1026077270507812, 1.14068603515625, 1.1787643432617188, 1.2168426513671875, 1.2549209594726562, 1.292999267578125, 1.3310775756835938, 1.3691558837890625, 1.4072341918945312, 1.4453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 7.0, 10.0, 17.0, 10.0, 25.0, 28.0, 33.0, 35.0, 46.0, 61.0, 50.0, 57.0, 72.0, 67.0, 65.0, 69.0, 55.0, 45.0, 59.0, 50.0, 30.0, 21.0, 18.0, 18.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7767257690429688, -0.7472991943359375, -0.7178726196289062, -0.688446044921875, -0.6590194702148438, -0.6295928955078125, -0.6001663208007812, -0.57073974609375, -0.5413131713867188, -0.5118865966796875, -0.48246002197265625, -0.453033447265625, -0.42360687255859375, -0.3941802978515625, -0.36475372314453125, -0.3353271484375, -0.30590057373046875, -0.2764739990234375, -0.24704742431640625, -0.217620849609375, -0.18819427490234375, -0.1587677001953125, -0.12934112548828125, -0.09991455078125, -0.07048797607421875, -0.0410614013671875, -0.01163482666015625, 0.017791748046875, 0.04721832275390625, 0.0766448974609375, 0.10607147216796875, 0.135498046875, 0.16492462158203125, 0.1943511962890625, 0.22377777099609375, 0.253204345703125, 0.28263092041015625, 0.3120574951171875, 0.34148406982421875, 0.37091064453125, 0.40033721923828125, 0.4297637939453125, 0.45919036865234375, 0.488616943359375, 0.5180435180664062, 0.5474700927734375, 0.5768966674804688, 0.6063232421875, 0.6357498168945312, 0.6651763916015625, 0.6946029663085938, 0.724029541015625, 0.7534561157226562, 0.7828826904296875, 0.8123092651367188, 0.84173583984375, 0.8711624145507812, 0.9005889892578125, 0.9300155639648438, 0.959442138671875, 0.9888687133789062, 1.0182952880859375, 1.0477218627929688, 1.0771484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 10.0, 13.0, 31.0, 65.0, 144.0, 393.0, 1447.0, 18329.0, 1016425.0, 10015.0, 1084.0, 298.0, 143.0, 78.0, 23.0, 17.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.3265380859375, -1.272216796875, -1.2178955078125, -1.16357421875, -1.1092529296875, -1.054931640625, -1.0006103515625, -0.9462890625, -0.8919677734375, -0.837646484375, -0.7833251953125, -0.72900390625, -0.6746826171875, -0.620361328125, -0.5660400390625, -0.51171875, -0.4573974609375, -0.403076171875, -0.3487548828125, -0.29443359375, -0.2401123046875, -0.185791015625, -0.1314697265625, -0.0771484375, -0.0228271484375, 0.031494140625, 0.0858154296875, 0.14013671875, 0.1944580078125, 0.248779296875, 0.3031005859375, 0.357421875, 0.4117431640625, 0.466064453125, 0.5203857421875, 0.57470703125, 0.6290283203125, 0.683349609375, 0.7376708984375, 0.7919921875, 0.8463134765625, 0.900634765625, 0.9549560546875, 1.00927734375, 1.0635986328125, 1.117919921875, 1.1722412109375, 1.2265625, 1.2808837890625, 1.335205078125, 1.3895263671875, 1.44384765625, 1.4981689453125, 1.552490234375, 1.6068115234375, 1.6611328125, 1.7154541015625, 1.769775390625, 1.8240966796875, 1.87841796875, 1.9327392578125, 1.987060546875, 2.0413818359375, 2.095703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 14.0, 17.0, 19.0, 27.0, 35.0, 51.0, 41.0, 75.0, 67.0, 76.0, 114.0, 93.0, 68.0, 64.0, 51.0, 42.0, 25.0, 28.0, 15.0, 16.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.08970832824707e-05, -8.780695497989655e-05, -8.471682667732239e-05, -8.162669837474823e-05, -7.853657007217407e-05, -7.544644176959991e-05, -7.235631346702576e-05, -6.92661851644516e-05, -6.617605686187744e-05, -6.308592855930328e-05, -5.9995800256729126e-05, -5.690567195415497e-05, -5.381554365158081e-05, -5.072541534900665e-05, -4.7635287046432495e-05, -4.454515874385834e-05, -4.145503044128418e-05, -3.836490213871002e-05, -3.5274773836135864e-05, -3.2184645533561707e-05, -2.909451723098755e-05, -2.600438892841339e-05, -2.2914260625839233e-05, -1.9824132323265076e-05, -1.6734004020690918e-05, -1.364387571811676e-05, -1.0553747415542603e-05, -7.463619112968445e-06, -4.373490810394287e-06, -1.2833625078201294e-06, 1.8067657947540283e-06, 4.896894097328186e-06, 7.987022399902344e-06, 1.1077150702476501e-05, 1.416727900505066e-05, 1.7257407307624817e-05, 2.0347535610198975e-05, 2.3437663912773132e-05, 2.652779221534729e-05, 2.9617920517921448e-05, 3.2708048820495605e-05, 3.579817712306976e-05, 3.888830542564392e-05, 4.197843372821808e-05, 4.5068562030792236e-05, 4.8158690333366394e-05, 5.124881863594055e-05, 5.433894693851471e-05, 5.742907524108887e-05, 6.0519203543663025e-05, 6.360933184623718e-05, 6.669946014881134e-05, 6.97895884513855e-05, 7.287971675395966e-05, 7.596984505653381e-05, 7.905997335910797e-05, 8.215010166168213e-05, 8.524022996425629e-05, 8.833035826683044e-05, 9.14204865694046e-05, 9.451061487197876e-05, 9.760074317455292e-05, 0.00010069087147712708, 0.00010378099977970123, 0.00010687112808227539]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 9.0, 15.0, 15.0, 33.0, 73.0, 138.0, 305.0, 762.0, 2849.0, 40938.0, 978501.0, 21482.0, 2274.0, 630.0, 246.0, 118.0, 63.0, 31.0, 17.0, 12.0, 3.0, 6.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9033203125, -0.8691253662109375, -0.834930419921875, -0.8007354736328125, -0.76654052734375, -0.7323455810546875, -0.698150634765625, -0.6639556884765625, -0.6297607421875, -0.5955657958984375, -0.561370849609375, -0.5271759033203125, -0.49298095703125, -0.4587860107421875, -0.424591064453125, -0.3903961181640625, -0.356201171875, -0.3220062255859375, -0.287811279296875, -0.2536163330078125, -0.21942138671875, -0.1852264404296875, -0.151031494140625, -0.1168365478515625, -0.0826416015625, -0.0484466552734375, -0.014251708984375, 0.0199432373046875, 0.05413818359375, 0.0883331298828125, 0.122528076171875, 0.1567230224609375, 0.19091796875, 0.2251129150390625, 0.259307861328125, 0.2935028076171875, 0.32769775390625, 0.3618927001953125, 0.396087646484375, 0.4302825927734375, 0.4644775390625, 0.4986724853515625, 0.532867431640625, 0.5670623779296875, 0.60125732421875, 0.6354522705078125, 0.669647216796875, 0.7038421630859375, 0.738037109375, 0.7722320556640625, 0.806427001953125, 0.8406219482421875, 0.87481689453125, 0.9090118408203125, 0.943206787109375, 0.9774017333984375, 1.0115966796875, 1.0457916259765625, 1.079986572265625, 1.1141815185546875, 1.14837646484375, 1.1825714111328125, 1.216766357421875, 1.2509613037109375, 1.28515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 20.0, 21.0, 21.0, 65.0, 111.0, 299.0, 248.0, 86.0, 47.0, 28.0, 22.0, 8.0, 6.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.1816558837890625, -1.144561767578125, -1.1074676513671875, -1.07037353515625, -1.0332794189453125, -0.996185302734375, -0.9590911865234375, -0.9219970703125, -0.8849029541015625, -0.847808837890625, -0.8107147216796875, -0.77362060546875, -0.7365264892578125, -0.699432373046875, -0.6623382568359375, -0.625244140625, -0.5881500244140625, -0.551055908203125, -0.5139617919921875, -0.47686767578125, -0.4397735595703125, -0.402679443359375, -0.3655853271484375, -0.3284912109375, -0.2913970947265625, -0.254302978515625, -0.2172088623046875, -0.18011474609375, -0.1430206298828125, -0.105926513671875, -0.0688323974609375, -0.03173828125, 0.0053558349609375, 0.042449951171875, 0.0795440673828125, 0.11663818359375, 0.1537322998046875, 0.190826416015625, 0.2279205322265625, 0.2650146484375, 0.3021087646484375, 0.339202880859375, 0.3762969970703125, 0.41339111328125, 0.4504852294921875, 0.487579345703125, 0.5246734619140625, 0.561767578125, 0.5988616943359375, 0.635955810546875, 0.6730499267578125, 0.71014404296875, 0.7472381591796875, 0.784332275390625, 0.8214263916015625, 0.8585205078125, 0.8956146240234375, 0.932708740234375, 0.9698028564453125, 1.00689697265625, 1.0439910888671875, 1.081085205078125, 1.1181793212890625, 1.1552734375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 34.0, 179.0, 582.0, 188.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.54459762573242, -31.744001388549805, -30.943405151367188, -30.14280891418457, -29.342212677001953, -28.54161834716797, -27.74102210998535, -26.940425872802734, -26.139829635620117, -25.3392333984375, -24.538637161254883, -23.738040924072266, -22.93744659423828, -22.13684844970703, -21.336254119873047, -20.53565788269043, -19.735061645507812, -18.934465408325195, -18.133869171142578, -17.33327293395996, -16.532676696777344, -15.732081413269043, -14.931486129760742, -14.130889892578125, -13.330293655395508, -12.52969741821289, -11.729101181030273, -10.928505897521973, -10.127909660339355, -9.327313423156738, -8.526718139648438, -7.72612190246582, -6.925527572631836, -6.124931335449219, -5.32433557510376, -4.523739814758301, -3.7231435775756836, -2.9225473403930664, -2.1219515800476074, -1.3213558197021484, -0.5207595825195312, 0.27983641624450684, 1.080432415008545, 1.881028413772583, 2.681624412536621, 3.4822206497192383, 4.282816410064697, 5.083412170410156, 5.884008407592773, 6.684604644775391, 7.48520040512085, 8.285796165466309, 9.086392402648926, 9.886988639831543, 10.687583923339844, 11.488180160522461, 12.288776397705078, 13.089372634887695, 13.889968872070312, 14.690564155578613, 15.49116039276123, 16.29175567626953, 17.09235191345215, 17.892948150634766, 18.693544387817383]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 5.0, 2.0, 8.0, 6.0, 14.0, 14.0, 16.0, 25.0, 20.0, 31.0, 38.0, 31.0, 45.0, 52.0, 50.0, 56.0, 65.0, 63.0, 52.0, 59.0, 50.0, 47.0, 37.0, 38.0, 23.0, 29.0, 32.0, 19.0, 7.0, 17.0, 12.0, 3.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.801705360412598, -4.664665222167969, -4.527624607086182, -4.390584468841553, -4.253543853759766, -4.116503715515137, -3.979463577270508, -3.8424232006073, -3.705382823944092, -3.568342447280884, -3.431302070617676, -3.294261932373047, -3.157221555709839, -3.020181179046631, -2.883141040802002, -2.746100664138794, -2.609060287475586, -2.472019910812378, -2.33497953414917, -2.197939395904541, -2.060899019241333, -1.923858642578125, -1.7868183851242065, -1.649778127670288, -1.51273775100708, -1.375697374343872, -1.2386571168899536, -1.1016168594360352, -0.9645764827728271, -0.8275361657142639, -0.6904958486557007, -0.5534555315971375, -0.4164149761199951, -0.2793746590614319, -0.14233434200286865, -0.00529402494430542, 0.1317462921142578, 0.26878660917282104, 0.4058269262313843, 0.5428672432899475, 0.6799075603485107, 0.816947877407074, 0.9539881944656372, 1.0910284519195557, 1.2280688285827637, 1.3651092052459717, 1.5021494626998901, 1.6391897201538086, 1.7762300968170166, 1.9132704734802246, 2.0503106117248535, 2.1873509883880615, 2.3243913650512695, 2.4614317417144775, 2.5984721183776855, 2.7355122566223145, 2.8725526332855225, 3.0095930099487305, 3.1466331481933594, 3.2836735248565674, 3.4207139015197754, 3.5577542781829834, 3.6947946548461914, 3.8318347930908203, 3.9688751697540283]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 9.0, 22.0, 34.0, 74.0, 125.0, 283.0, 555.0, 2165.0, 18343.0, 4149482.0, 19641.0, 2367.0, 646.0, 250.0, 111.0, 62.0, 34.0, 14.0, 21.0, 9.0, 9.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.131591796875, -2.07763671875, -2.023681640625, -1.9697265625, -1.915771484375, -1.86181640625, -1.807861328125, -1.75390625, -1.699951171875, -1.64599609375, -1.592041015625, -1.5380859375, -1.484130859375, -1.43017578125, -1.376220703125, -1.322265625, -1.268310546875, -1.21435546875, -1.160400390625, -1.1064453125, -1.052490234375, -0.99853515625, -0.944580078125, -0.890625, -0.836669921875, -0.78271484375, -0.728759765625, -0.6748046875, -0.620849609375, -0.56689453125, -0.512939453125, -0.458984375, -0.405029296875, -0.35107421875, -0.297119140625, -0.2431640625, -0.189208984375, -0.13525390625, -0.081298828125, -0.02734375, 0.026611328125, 0.08056640625, 0.134521484375, 0.1884765625, 0.242431640625, 0.29638671875, 0.350341796875, 0.404296875, 0.458251953125, 0.51220703125, 0.566162109375, 0.6201171875, 0.674072265625, 0.72802734375, 0.781982421875, 0.8359375, 0.889892578125, 0.94384765625, 0.997802734375, 1.0517578125, 1.105712890625, 1.15966796875, 1.213623046875, 1.267578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 10.0, 5.0, 11.0, 16.0, 17.0, 22.0, 25.0, 29.0, 35.0, 50.0, 52.0, 51.0, 54.0, 61.0, 59.0, 59.0, 58.0, 59.0, 44.0, 57.0, 46.0, 30.0, 37.0, 20.0, 22.0, 14.0, 16.0, 10.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1588134765625, -0.15386199951171875, -0.1489105224609375, -0.14395904541015625, -0.139007568359375, -0.13405609130859375, -0.1291046142578125, -0.12415313720703125, -0.11920166015625, -0.11425018310546875, -0.1092987060546875, -0.10434722900390625, -0.099395751953125, -0.09444427490234375, -0.0894927978515625, -0.08454132080078125, -0.07958984375, -0.07463836669921875, -0.0696868896484375, -0.06473541259765625, -0.059783935546875, -0.05483245849609375, -0.0498809814453125, -0.04492950439453125, -0.03997802734375, -0.03502655029296875, -0.0300750732421875, -0.02512359619140625, -0.020172119140625, -0.01522064208984375, -0.0102691650390625, -0.00531768798828125, -0.0003662109375, 0.00458526611328125, 0.0095367431640625, 0.01448822021484375, 0.019439697265625, 0.02439117431640625, 0.0293426513671875, 0.03429412841796875, 0.03924560546875, 0.04419708251953125, 0.0491485595703125, 0.05410003662109375, 0.059051513671875, 0.06400299072265625, 0.0689544677734375, 0.07390594482421875, 0.078857421875, 0.08380889892578125, 0.0887603759765625, 0.09371185302734375, 0.098663330078125, 0.10361480712890625, 0.1085662841796875, 0.11351776123046875, 0.11846923828125, 0.12342071533203125, 0.1283721923828125, 0.13332366943359375, 0.138275146484375, 0.14322662353515625, 0.1481781005859375, 0.15312957763671875, 0.1580810546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 8.0, 9.0, 6.0, 23.0, 20.0, 34.0, 61.0, 70.0, 115.0, 206.0, 351.0, 644.0, 1355.0, 3387.0, 13231.0, 3602592.0, 554068.0, 12094.0, 3139.0, 1295.0, 622.0, 362.0, 211.0, 125.0, 74.0, 49.0, 41.0, 21.0, 19.0, 12.0, 7.0, 11.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7158203125, -1.6706390380859375, -1.625457763671875, -1.5802764892578125, -1.53509521484375, -1.4899139404296875, -1.444732666015625, -1.3995513916015625, -1.3543701171875, -1.3091888427734375, -1.264007568359375, -1.2188262939453125, -1.17364501953125, -1.1284637451171875, -1.083282470703125, -1.0381011962890625, -0.992919921875, -0.9477386474609375, -0.902557373046875, -0.8573760986328125, -0.81219482421875, -0.7670135498046875, -0.721832275390625, -0.6766510009765625, -0.6314697265625, -0.5862884521484375, -0.541107177734375, -0.4959259033203125, -0.45074462890625, -0.4055633544921875, -0.360382080078125, -0.3152008056640625, -0.27001953125, -0.2248382568359375, -0.179656982421875, -0.1344757080078125, -0.08929443359375, -0.0441131591796875, 0.001068115234375, 0.0462493896484375, 0.0914306640625, 0.1366119384765625, 0.181793212890625, 0.2269744873046875, 0.27215576171875, 0.3173370361328125, 0.362518310546875, 0.4076995849609375, 0.452880859375, 0.4980621337890625, 0.543243408203125, 0.5884246826171875, 0.63360595703125, 0.6787872314453125, 0.723968505859375, 0.7691497802734375, 0.8143310546875, 0.8595123291015625, 0.904693603515625, 0.9498748779296875, 0.99505615234375, 1.0402374267578125, 1.085418701171875, 1.1305999755859375, 1.17578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 4.0, 7.0, 12.0, 26.0, 36.0, 92.0, 450.0, 3201.0, 140.0, 46.0, 21.0, 9.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33203125, -0.3241539001464844, -0.31627655029296875, -0.3083992004394531, -0.3005218505859375, -0.2926445007324219, -0.28476715087890625, -0.2768898010253906, -0.269012451171875, -0.2611351013183594, -0.25325775146484375, -0.24538040161132812, -0.2375030517578125, -0.22962570190429688, -0.22174835205078125, -0.21387100219726562, -0.20599365234375, -0.19811630249023438, -0.19023895263671875, -0.18236160278320312, -0.1744842529296875, -0.16660690307617188, -0.15872955322265625, -0.15085220336914062, -0.142974853515625, -0.13509750366210938, -0.12722015380859375, -0.11934280395507812, -0.1114654541015625, -0.10358810424804688, -0.09571075439453125, -0.08783340454101562, -0.0799560546875, -0.07207870483398438, -0.06420135498046875, -0.056324005126953125, -0.0484466552734375, -0.040569305419921875, -0.03269195556640625, -0.024814605712890625, -0.016937255859375, -0.009059906005859375, -0.00118255615234375, 0.006694793701171875, 0.0145721435546875, 0.022449493408203125, 0.03032684326171875, 0.038204193115234375, 0.04608154296875, 0.053958892822265625, 0.06183624267578125, 0.06971359252929688, 0.0775909423828125, 0.08546829223632812, 0.09334564208984375, 0.10122299194335938, 0.109100341796875, 0.11697769165039062, 0.12485504150390625, 0.13273239135742188, 0.1406097412109375, 0.14848709106445312, 0.15636444091796875, 0.16424179077148438, 0.172119140625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 8.0, 16.0, 24.0, 52.0, 95.0, 143.0, 205.0, 184.0, 135.0, 69.0, 38.0, 17.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3066192865371704, -1.2592202425003052, -1.2118213176727295, -1.1644222736358643, -1.117023229598999, -1.0696241855621338, -1.022225260734558, -0.9748262166976929, -0.9274272322654724, -0.880028247833252, -0.8326292037963867, -0.7852302193641663, -0.7378312349319458, -0.6904321908950806, -0.6430332064628601, -0.5956342220306396, -0.5482351779937744, -0.500836193561554, -0.4534371495246887, -0.40603816509246826, -0.3586391508579254, -0.31124013662338257, -0.2638411521911621, -0.21644213795661926, -0.16904312372207642, -0.12164411693811417, -0.07424511015415192, -0.026846110820770264, 0.020552903413772583, 0.06795191764831543, 0.11535090208053589, 0.16274991631507874, 0.21014904975891113, 0.257548063993454, 0.3049470782279968, 0.3523460626602173, 0.39974507689476013, 0.447144091129303, 0.49454307556152344, 0.5419421195983887, 0.5893411040306091, 0.6367400884628296, 0.6841391324996948, 0.7315381169319153, 0.7789371013641357, 0.826336145401001, 0.8737351298332214, 0.9211341142654419, 0.9685331583023071, 1.0159322023391724, 1.063331127166748, 1.1107301712036133, 1.1581292152404785, 1.2055282592773438, 1.2529271841049194, 1.3003262281417847, 1.3477251529693604, 1.3951241970062256, 1.4425231218338013, 1.4899221658706665, 1.5373212099075317, 1.5847201347351074, 1.6321191787719727, 1.679518222808838, 1.7269172668457031]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 12.0, 13.0, 13.0, 7.0, 10.0, 15.0, 23.0, 24.0, 25.0, 29.0, 31.0, 35.0, 31.0, 24.0, 43.0, 40.0, 40.0, 39.0, 49.0, 46.0, 44.0, 39.0, 38.0, 28.0, 45.0, 26.0, 35.0, 26.0, 25.0, 25.0, 27.0, 13.0, 20.0, 14.0, 14.0, 7.0, 9.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6180504560470581, -0.5989565849304199, -0.5798627138137817, -0.5607688426971436, -0.5416749715805054, -0.5225811004638672, -0.503487229347229, -0.48439332842826843, -0.46529945731163025, -0.44620558619499207, -0.4271117150783539, -0.4080178439617157, -0.3889239430427551, -0.36983007192611694, -0.35073620080947876, -0.3316423296928406, -0.3125484585762024, -0.2934545874595642, -0.274360716342926, -0.25526684522628784, -0.23617295920848846, -0.21707908809185028, -0.1979852020740509, -0.17889133095741272, -0.15979745984077454, -0.14070358872413635, -0.12160971015691757, -0.10251583158969879, -0.08342196047306061, -0.06432808935642242, -0.045234210789203644, -0.026140332221984863, -0.007046401500701904, 0.012047473341226578, 0.03114134818315506, 0.05023522302508354, 0.06932909786701202, 0.08842296898365021, 0.10751684755086899, 0.12661072611808777, 0.14570459723472595, 0.16479846835136414, 0.18389233946800232, 0.2029862254858017, 0.22208009660243988, 0.24117396771907806, 0.26026785373687744, 0.2793617248535156, 0.2984555959701538, 0.317549467086792, 0.3366433382034302, 0.35573720932006836, 0.37483108043670654, 0.3939249515533447, 0.4130188524723053, 0.4321127235889435, 0.45120659470558167, 0.47030046582221985, 0.48939433693885803, 0.5084882378578186, 0.5275821089744568, 0.546675980091095, 0.5657698512077332, 0.5848637223243713, 0.6039575934410095]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 18.0, 13.0, 19.0, 41.0, 56.0, 80.0, 161.0, 360.0, 629.0, 1598.0, 5181.0, 27970.0, 337749.0, 614470.0, 48735.0, 7682.0, 2183.0, 779.0, 385.0, 171.0, 115.0, 54.0, 43.0, 13.0, 16.0, 6.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8076171875, -0.7852630615234375, -0.762908935546875, -0.7405548095703125, -0.71820068359375, -0.6958465576171875, -0.673492431640625, -0.6511383056640625, -0.6287841796875, -0.6064300537109375, -0.584075927734375, -0.5617218017578125, -0.53936767578125, -0.5170135498046875, -0.494659423828125, -0.4723052978515625, -0.449951171875, -0.4275970458984375, -0.405242919921875, -0.3828887939453125, -0.36053466796875, -0.3381805419921875, -0.315826416015625, -0.2934722900390625, -0.2711181640625, -0.2487640380859375, -0.226409912109375, -0.2040557861328125, -0.18170166015625, -0.1593475341796875, -0.136993408203125, -0.1146392822265625, -0.09228515625, -0.0699310302734375, -0.047576904296875, -0.0252227783203125, -0.00286865234375, 0.0194854736328125, 0.041839599609375, 0.0641937255859375, 0.0865478515625, 0.1089019775390625, 0.131256103515625, 0.1536102294921875, 0.17596435546875, 0.1983184814453125, 0.220672607421875, 0.2430267333984375, 0.265380859375, 0.2877349853515625, 0.310089111328125, 0.3324432373046875, 0.35479736328125, 0.3771514892578125, 0.399505615234375, 0.4218597412109375, 0.4442138671875, 0.4665679931640625, 0.488922119140625, 0.5112762451171875, 0.53363037109375, 0.5559844970703125, 0.578338623046875, 0.6006927490234375, 0.623046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 7.0, 11.0, 16.0, 22.0, 22.0, 20.0, 33.0, 41.0, 39.0, 62.0, 48.0, 58.0, 58.0, 62.0, 57.0, 57.0, 52.0, 45.0, 45.0, 46.0, 36.0, 31.0, 27.0, 17.0, 17.0, 12.0, 11.0, 4.0, 9.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16457176208496094, -0.15922164916992188, -0.1538715362548828, -0.14852142333984375, -0.1431713104248047, -0.13782119750976562, -0.13247108459472656, -0.1271209716796875, -0.12177085876464844, -0.11642074584960938, -0.11107063293457031, -0.10572052001953125, -0.10037040710449219, -0.09502029418945312, -0.08967018127441406, -0.084320068359375, -0.07896995544433594, -0.07361984252929688, -0.06826972961425781, -0.06291961669921875, -0.05756950378417969, -0.052219390869140625, -0.04686927795410156, -0.0415191650390625, -0.03616905212402344, -0.030818939208984375, -0.025468826293945312, -0.02011871337890625, -0.014768600463867188, -0.009418487548828125, -0.0040683746337890625, 0.00128173828125, 0.0066318511962890625, 0.011981964111328125, 0.017332077026367188, 0.02268218994140625, 0.028032302856445312, 0.033382415771484375, 0.03873252868652344, 0.0440826416015625, 0.04943275451660156, 0.054782867431640625, 0.06013298034667969, 0.06548309326171875, 0.07083320617675781, 0.07618331909179688, 0.08153343200683594, 0.086883544921875, 0.09223365783691406, 0.09758377075195312, 0.10293388366699219, 0.10828399658203125, 0.11363410949707031, 0.11898422241210938, 0.12433433532714844, 0.1296844482421875, 0.13503456115722656, 0.14038467407226562, 0.1457347869873047, 0.15108489990234375, 0.1564350128173828, 0.16178512573242188, 0.16713523864746094, 0.1724853515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 9.0, 9.0, 23.0, 32.0, 30.0, 67.0, 86.0, 150.0, 283.0, 695.0, 2126.0, 10374.0, 305979.0, 707410.0, 16910.0, 2726.0, 857.0, 332.0, 174.0, 105.0, 58.0, 37.0, 16.0, 17.0, 7.0, 8.0, 10.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.416015625, -1.3831634521484375, -1.350311279296875, -1.3174591064453125, -1.28460693359375, -1.2517547607421875, -1.218902587890625, -1.1860504150390625, -1.1531982421875, -1.1203460693359375, -1.087493896484375, -1.0546417236328125, -1.02178955078125, -0.9889373779296875, -0.956085205078125, -0.9232330322265625, -0.890380859375, -0.8575286865234375, -0.824676513671875, -0.7918243408203125, -0.75897216796875, -0.7261199951171875, -0.693267822265625, -0.6604156494140625, -0.6275634765625, -0.5947113037109375, -0.561859130859375, -0.5290069580078125, -0.49615478515625, -0.4633026123046875, -0.430450439453125, -0.3975982666015625, -0.36474609375, -0.3318939208984375, -0.299041748046875, -0.2661895751953125, -0.23333740234375, -0.2004852294921875, -0.167633056640625, -0.1347808837890625, -0.1019287109375, -0.0690765380859375, -0.036224365234375, -0.0033721923828125, 0.02947998046875, 0.0623321533203125, 0.095184326171875, 0.1280364990234375, 0.160888671875, 0.1937408447265625, 0.226593017578125, 0.2594451904296875, 0.29229736328125, 0.3251495361328125, 0.358001708984375, 0.3908538818359375, 0.4237060546875, 0.4565582275390625, 0.489410400390625, 0.5222625732421875, 0.55511474609375, 0.5879669189453125, 0.620819091796875, 0.6536712646484375, 0.6865234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 17.0, 13.0, 13.0, 30.0, 29.0, 27.0, 35.0, 58.0, 57.0, 68.0, 65.0, 66.0, 77.0, 65.0, 62.0, 44.0, 40.0, 51.0, 36.0, 27.0, 30.0, 20.0, 23.0, 13.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94384765625, -0.9093399047851562, -0.8748321533203125, -0.8403244018554688, -0.805816650390625, -0.7713088989257812, -0.7368011474609375, -0.7022933959960938, -0.66778564453125, -0.6332778930664062, -0.5987701416015625, -0.5642623901367188, -0.529754638671875, -0.49524688720703125, -0.4607391357421875, -0.42623138427734375, -0.3917236328125, -0.35721588134765625, -0.3227081298828125, -0.28820037841796875, -0.253692626953125, -0.21918487548828125, -0.1846771240234375, -0.15016937255859375, -0.11566162109375, -0.08115386962890625, -0.0466461181640625, -0.01213836669921875, 0.022369384765625, 0.05687713623046875, 0.0913848876953125, 0.12589263916015625, 0.160400390625, 0.19490814208984375, 0.2294158935546875, 0.26392364501953125, 0.298431396484375, 0.33293914794921875, 0.3674468994140625, 0.40195465087890625, 0.43646240234375, 0.47097015380859375, 0.5054779052734375, 0.5399856567382812, 0.574493408203125, 0.6090011596679688, 0.6435089111328125, 0.6780166625976562, 0.7125244140625, 0.7470321655273438, 0.7815399169921875, 0.8160476684570312, 0.850555419921875, 0.8850631713867188, 0.9195709228515625, 0.9540786743164062, 0.98858642578125, 1.0230941772460938, 1.0576019287109375, 1.0921096801757812, 1.126617431640625, 1.1611251831054688, 1.1956329345703125, 1.2301406860351562, 1.2646484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 10.0, 16.0, 28.0, 100.0, 223.0, 785.0, 5090.0, 918788.0, 120327.0, 2382.0, 503.0, 152.0, 73.0, 35.0, 11.0, 15.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.041717529296875, -1.00140380859375, -0.961090087890625, -0.9207763671875, -0.880462646484375, -0.84014892578125, -0.799835205078125, -0.759521484375, -0.719207763671875, -0.67889404296875, -0.638580322265625, -0.5982666015625, -0.557952880859375, -0.51763916015625, -0.477325439453125, -0.43701171875, -0.396697998046875, -0.35638427734375, -0.316070556640625, -0.2757568359375, -0.235443115234375, -0.19512939453125, -0.154815673828125, -0.114501953125, -0.074188232421875, -0.03387451171875, 0.006439208984375, 0.0467529296875, 0.087066650390625, 0.12738037109375, 0.167694091796875, 0.2080078125, 0.248321533203125, 0.28863525390625, 0.328948974609375, 0.3692626953125, 0.409576416015625, 0.44989013671875, 0.490203857421875, 0.530517578125, 0.570831298828125, 0.61114501953125, 0.651458740234375, 0.6917724609375, 0.732086181640625, 0.77239990234375, 0.812713623046875, 0.85302734375, 0.893341064453125, 0.93365478515625, 0.973968505859375, 1.0142822265625, 1.054595947265625, 1.09490966796875, 1.135223388671875, 1.175537109375, 1.215850830078125, 1.25616455078125, 1.296478271484375, 1.3367919921875, 1.377105712890625, 1.41741943359375, 1.457733154296875, 1.498046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 15.0, 15.0, 19.0, 30.0, 30.0, 45.0, 63.0, 81.0, 111.0, 119.0, 104.0, 75.0, 81.0, 53.0, 38.0, 32.0, 24.0, 14.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00012874603271484375, -0.00012563727796077728, -0.00012252852320671082, -0.00011941976845264435, -0.00011631101369857788, -0.00011320225894451141, -0.00011009350419044495, -0.00010698474943637848, -0.00010387599468231201, -0.00010076723992824554, -9.765848517417908e-05, -9.454973042011261e-05, -9.144097566604614e-05, -8.833222091197968e-05, -8.522346615791321e-05, -8.211471140384674e-05, -7.900595664978027e-05, -7.58972018957138e-05, -7.278844714164734e-05, -6.967969238758087e-05, -6.65709376335144e-05, -6.346218287944794e-05, -6.035342812538147e-05, -5.7244673371315e-05, -5.4135918617248535e-05, -5.102716386318207e-05, -4.79184091091156e-05, -4.480965435504913e-05, -4.1700899600982666e-05, -3.85921448469162e-05, -3.548339009284973e-05, -3.2374635338783264e-05, -2.9265880584716797e-05, -2.615712583065033e-05, -2.3048371076583862e-05, -1.9939616322517395e-05, -1.6830861568450928e-05, -1.372210681438446e-05, -1.0613352060317993e-05, -7.504597306251526e-06, -4.395842552185059e-06, -1.2870877981185913e-06, 1.821666955947876e-06, 4.930421710014343e-06, 8.03917646408081e-06, 1.1147931218147278e-05, 1.4256685972213745e-05, 1.7365440726280212e-05, 2.047419548034668e-05, 2.3582950234413147e-05, 2.6691704988479614e-05, 2.980045974254608e-05, 3.290921449661255e-05, 3.6017969250679016e-05, 3.9126724004745483e-05, 4.223547875881195e-05, 4.534423351287842e-05, 4.8452988266944885e-05, 5.156174302101135e-05, 5.467049777507782e-05, 5.777925252914429e-05, 6.0888007283210754e-05, 6.399676203727722e-05, 6.710551679134369e-05, 7.021427154541016e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 4.0, 4.0, 13.0, 22.0, 47.0, 95.0, 174.0, 470.0, 1713.0, 14816.0, 907970.0, 117352.0, 4384.0, 877.0, 331.0, 116.0, 78.0, 38.0, 21.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1337890625, -1.1059722900390625, -1.078155517578125, -1.0503387451171875, -1.02252197265625, -0.9947052001953125, -0.966888427734375, -0.9390716552734375, -0.9112548828125, -0.8834381103515625, -0.855621337890625, -0.8278045654296875, -0.79998779296875, -0.7721710205078125, -0.744354248046875, -0.7165374755859375, -0.688720703125, -0.6609039306640625, -0.633087158203125, -0.6052703857421875, -0.57745361328125, -0.5496368408203125, -0.521820068359375, -0.4940032958984375, -0.4661865234375, -0.4383697509765625, -0.410552978515625, -0.3827362060546875, -0.35491943359375, -0.3271026611328125, -0.299285888671875, -0.2714691162109375, -0.24365234375, -0.2158355712890625, -0.188018798828125, -0.1602020263671875, -0.13238525390625, -0.1045684814453125, -0.076751708984375, -0.0489349365234375, -0.0211181640625, 0.0066986083984375, 0.034515380859375, 0.0623321533203125, 0.09014892578125, 0.1179656982421875, 0.145782470703125, 0.1735992431640625, 0.201416015625, 0.2292327880859375, 0.257049560546875, 0.2848663330078125, 0.31268310546875, 0.3404998779296875, 0.368316650390625, 0.3961334228515625, 0.4239501953125, 0.4517669677734375, 0.479583740234375, 0.5074005126953125, 0.53521728515625, 0.5630340576171875, 0.590850830078125, 0.6186676025390625, 0.646484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 8.0, 19.0, 29.0, 28.0, 48.0, 90.0, 132.0, 156.0, 169.0, 102.0, 71.0, 41.0, 44.0, 21.0, 16.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6992645263671875, -0.680755615234375, -0.6622467041015625, -0.64373779296875, -0.6252288818359375, -0.606719970703125, -0.5882110595703125, -0.5697021484375, -0.5511932373046875, -0.532684326171875, -0.5141754150390625, -0.49566650390625, -0.4771575927734375, -0.458648681640625, -0.4401397705078125, -0.421630859375, -0.4031219482421875, -0.384613037109375, -0.3661041259765625, -0.34759521484375, -0.3290863037109375, -0.310577392578125, -0.2920684814453125, -0.2735595703125, -0.2550506591796875, -0.236541748046875, -0.2180328369140625, -0.19952392578125, -0.1810150146484375, -0.162506103515625, -0.1439971923828125, -0.12548828125, -0.1069793701171875, -0.088470458984375, -0.0699615478515625, -0.05145263671875, -0.0329437255859375, -0.014434814453125, 0.0040740966796875, 0.0225830078125, 0.0410919189453125, 0.059600830078125, 0.0781097412109375, 0.09661865234375, 0.1151275634765625, 0.133636474609375, 0.1521453857421875, 0.170654296875, 0.1891632080078125, 0.207672119140625, 0.2261810302734375, 0.24468994140625, 0.2631988525390625, 0.281707763671875, 0.3002166748046875, 0.3187255859375, 0.3372344970703125, 0.355743408203125, 0.3742523193359375, 0.39276123046875, 0.4112701416015625, 0.429779052734375, 0.4482879638671875, 0.466796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 11.0, 63.0, 296.0, 433.0, 162.0, 26.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.198760986328125, -26.678014755249023, -26.157270431518555, -25.636524200439453, -25.115779876708984, -24.595033645629883, -24.07428741455078, -23.553543090820312, -23.03279685974121, -22.51205062866211, -21.99130630493164, -21.47056007385254, -20.94981575012207, -20.42906951904297, -19.9083251953125, -19.3875789642334, -18.866832733154297, -18.346086502075195, -17.825342178344727, -17.304595947265625, -16.783851623535156, -16.263105392456055, -15.74236011505127, -15.221614837646484, -14.700870513916016, -14.18012523651123, -13.659379959106445, -13.138633728027344, -12.617888450622559, -12.097143173217773, -11.576397895812988, -11.055652618408203, -10.534905433654785, -10.01416015625, -9.493414878845215, -8.97266960144043, -8.451923370361328, -7.931178092956543, -7.410432815551758, -6.889687538146973, -6.368941783905029, -5.848196506500244, -5.327450752258301, -4.806705474853516, -4.2859601974487305, -3.765214443206787, -3.244469165802002, -2.7237236499786377, -2.2029781341552734, -1.6822326183319092, -1.1614872217178345, -0.6407418251037598, -0.11999630928039551, 0.40074920654296875, 0.9214944839477539, 1.4422399997711182, 1.9629855155944824, 2.4837310314178467, 3.004476547241211, 3.525221824645996, 4.045967102050781, 4.566712856292725, 5.08745813369751, 5.608203887939453, 6.128949165344238]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 2.0, 12.0, 6.0, 10.0, 2.0, 13.0, 11.0, 14.0, 17.0, 17.0, 17.0, 27.0, 35.0, 27.0, 31.0, 24.0, 50.0, 32.0, 42.0, 49.0, 40.0, 46.0, 55.0, 37.0, 39.0, 54.0, 41.0, 30.0, 28.0, 28.0, 32.0, 20.0, 21.0, 17.0, 12.0, 17.0, 8.0, 9.0, 5.0, 6.0, 3.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.625253915786743, -3.512847900390625, -3.400442123413086, -3.288036346435547, -3.1756303310394287, -3.0632243156433105, -2.9508185386657715, -2.8384127616882324, -2.7260067462921143, -2.613600730895996, -2.501194953918457, -2.388789176940918, -2.2763831615448, -2.1639771461486816, -2.0515713691711426, -1.939165472984314, -1.8267595767974854, -1.7143536806106567, -1.6019477844238281, -1.4895418882369995, -1.377135992050171, -1.2647300958633423, -1.1523241996765137, -1.039918303489685, -0.9275124073028564, -0.8151065111160278, -0.7027006149291992, -0.5902947187423706, -0.477888822555542, -0.3654829263687134, -0.25307703018188477, -0.14067113399505615, -0.02826523780822754, 0.08414065837860107, 0.1965465545654297, 0.3089524507522583, 0.4213583469390869, 0.5337642431259155, 0.6461701393127441, 0.7585760354995728, 0.8709819316864014, 0.98338782787323, 1.0957937240600586, 1.2081996202468872, 1.3206055164337158, 1.4330114126205444, 1.545417308807373, 1.6578232049942017, 1.7702291011810303, 1.8826349973678589, 1.9950408935546875, 2.1074466705322266, 2.2198526859283447, 2.332258701324463, 2.444664478302002, 2.557070255279541, 2.669476270675659, 2.7818822860717773, 2.8942880630493164, 3.0066938400268555, 3.1190998554229736, 3.231505870819092, 3.343911647796631, 3.45631742477417, 3.568723440170288]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 5.0, 2.0, 11.0, 4.0, 8.0, 15.0, 18.0, 34.0, 45.0, 77.0, 106.0, 193.0, 324.0, 561.0, 1241.0, 3367.0, 15033.0, 318368.0, 3823686.0, 23414.0, 4701.0, 1561.0, 662.0, 323.0, 186.0, 117.0, 78.0, 49.0, 33.0, 22.0, 16.0, 13.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.1328125, -1.105255126953125, -1.07769775390625, -1.050140380859375, -1.0225830078125, -0.995025634765625, -0.96746826171875, -0.939910888671875, -0.912353515625, -0.884796142578125, -0.85723876953125, -0.829681396484375, -0.8021240234375, -0.774566650390625, -0.74700927734375, -0.719451904296875, -0.69189453125, -0.664337158203125, -0.63677978515625, -0.609222412109375, -0.5816650390625, -0.554107666015625, -0.52655029296875, -0.498992919921875, -0.471435546875, -0.443878173828125, -0.41632080078125, -0.388763427734375, -0.3612060546875, -0.333648681640625, -0.30609130859375, -0.278533935546875, -0.2509765625, -0.223419189453125, -0.19586181640625, -0.168304443359375, -0.1407470703125, -0.113189697265625, -0.08563232421875, -0.058074951171875, -0.030517578125, -0.002960205078125, 0.02459716796875, 0.052154541015625, 0.0797119140625, 0.107269287109375, 0.13482666015625, 0.162384033203125, 0.18994140625, 0.217498779296875, 0.24505615234375, 0.272613525390625, 0.3001708984375, 0.327728271484375, 0.35528564453125, 0.382843017578125, 0.410400390625, 0.437957763671875, 0.46551513671875, 0.493072509765625, 0.5206298828125, 0.548187255859375, 0.57574462890625, 0.603302001953125, 0.630859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 3.0, 8.0, 8.0, 12.0, 9.0, 19.0, 14.0, 35.0, 24.0, 31.0, 46.0, 62.0, 35.0, 56.0, 61.0, 66.0, 76.0, 64.0, 78.0, 40.0, 35.0, 50.0, 37.0, 29.0, 30.0, 18.0, 12.0, 9.0, 5.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.20751953125, -0.2017230987548828, -0.19592666625976562, -0.19013023376464844, -0.18433380126953125, -0.17853736877441406, -0.17274093627929688, -0.1669445037841797, -0.1611480712890625, -0.1553516387939453, -0.14955520629882812, -0.14375877380371094, -0.13796234130859375, -0.13216590881347656, -0.12636947631835938, -0.12057304382324219, -0.114776611328125, -0.10898017883300781, -0.10318374633789062, -0.09738731384277344, -0.09159088134765625, -0.08579444885253906, -0.07999801635742188, -0.07420158386230469, -0.0684051513671875, -0.06260871887207031, -0.056812286376953125, -0.05101585388183594, -0.04521942138671875, -0.03942298889160156, -0.033626556396484375, -0.027830123901367188, -0.02203369140625, -0.016237258911132812, -0.010440826416015625, -0.0046443939208984375, 0.00115203857421875, 0.0069484710693359375, 0.012744903564453125, 0.018541336059570312, 0.0243377685546875, 0.030134201049804688, 0.035930633544921875, 0.04172706604003906, 0.04752349853515625, 0.05331993103027344, 0.059116363525390625, 0.06491279602050781, 0.070709228515625, 0.07650566101074219, 0.08230209350585938, 0.08809852600097656, 0.09389495849609375, 0.09969139099121094, 0.10548782348632812, 0.11128425598144531, 0.1170806884765625, 0.12287712097167969, 0.12867355346679688, 0.13446998596191406, 0.14026641845703125, 0.14606285095214844, 0.15185928344726562, 0.1576557159423828, 0.1634521484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 18.0, 8.0, 15.0, 34.0, 41.0, 79.0, 114.0, 250.0, 657.0, 2326.0, 10367.0, 173912.0, 3974481.0, 25913.0, 4043.0, 1109.0, 422.0, 171.0, 94.0, 59.0, 45.0, 36.0, 15.0, 13.0, 11.0, 11.0, 2.0, 9.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.634765625, -1.589630126953125, -1.54449462890625, -1.499359130859375, -1.4542236328125, -1.409088134765625, -1.36395263671875, -1.318817138671875, -1.273681640625, -1.228546142578125, -1.18341064453125, -1.138275146484375, -1.0931396484375, -1.048004150390625, -1.00286865234375, -0.957733154296875, -0.91259765625, -0.867462158203125, -0.82232666015625, -0.777191162109375, -0.7320556640625, -0.686920166015625, -0.64178466796875, -0.596649169921875, -0.551513671875, -0.506378173828125, -0.46124267578125, -0.416107177734375, -0.3709716796875, -0.325836181640625, -0.28070068359375, -0.235565185546875, -0.1904296875, -0.145294189453125, -0.10015869140625, -0.055023193359375, -0.0098876953125, 0.035247802734375, 0.08038330078125, 0.125518798828125, 0.170654296875, 0.215789794921875, 0.26092529296875, 0.306060791015625, 0.3511962890625, 0.396331787109375, 0.44146728515625, 0.486602783203125, 0.53173828125, 0.576873779296875, 0.62200927734375, 0.667144775390625, 0.7122802734375, 0.757415771484375, 0.80255126953125, 0.847686767578125, 0.892822265625, 0.937957763671875, 0.98309326171875, 1.028228759765625, 1.0733642578125, 1.118499755859375, 1.16363525390625, 1.208770751953125, 1.25390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 8.0, 25.0, 34.0, 46.0, 115.0, 353.0, 2960.0, 282.0, 93.0, 61.0, 30.0, 14.0, 17.0, 7.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 3.0], "bins": [-0.638671875, -0.6257495880126953, -0.6128273010253906, -0.5999050140380859, -0.5869827270507812, -0.5740604400634766, -0.5611381530761719, -0.5482158660888672, -0.5352935791015625, -0.5223712921142578, -0.5094490051269531, -0.49652671813964844, -0.48360443115234375, -0.47068214416503906, -0.4577598571777344, -0.4448375701904297, -0.431915283203125, -0.4189929962158203, -0.4060707092285156, -0.39314842224121094, -0.38022613525390625, -0.36730384826660156, -0.3543815612792969, -0.3414592742919922, -0.3285369873046875, -0.3156147003173828, -0.3026924133300781, -0.28977012634277344, -0.27684783935546875, -0.26392555236816406, -0.2510032653808594, -0.2380809783935547, -0.22515869140625, -0.2122364044189453, -0.19931411743164062, -0.18639183044433594, -0.17346954345703125, -0.16054725646972656, -0.14762496948242188, -0.1347026824951172, -0.1217803955078125, -0.10885810852050781, -0.09593582153320312, -0.08301353454589844, -0.07009124755859375, -0.05716896057128906, -0.044246673583984375, -0.03132438659667969, -0.018402099609375, -0.0054798126220703125, 0.007442474365234375, 0.020364761352539062, 0.03328704833984375, 0.04620933532714844, 0.059131622314453125, 0.07205390930175781, 0.0849761962890625, 0.09789848327636719, 0.11082077026367188, 0.12374305725097656, 0.13666534423828125, 0.14958763122558594, 0.16250991821289062, 0.1754322052001953, 0.1883544921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 7.0, 13.0, 12.0, 16.0, 37.0, 45.0, 85.0, 147.0, 169.0, 155.0, 128.0, 76.0, 46.0, 26.0, 15.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.813605785369873, -1.7510530948638916, -1.6885004043579102, -1.6259477138519287, -1.5633951425552368, -1.5008424520492554, -1.438289761543274, -1.3757370710372925, -1.3131844997406006, -1.2506318092346191, -1.1880791187286377, -1.1255264282226562, -1.0629738569259644, -1.000421166419983, -0.9378684759140015, -0.87531578540802, -0.8127630949020386, -0.7502104043960571, -0.6876577734947205, -0.625105082988739, -0.5625524520874023, -0.4999997615814209, -0.43744707107543945, -0.3748944103717804, -0.31234174966812134, -0.24978908896446228, -0.18723641335964203, -0.12468373775482178, -0.06213107705116272, 0.0004215836524963379, 0.06297427415847778, 0.12552693486213684, 0.1880795955657959, 0.25063225626945496, 0.313184916973114, 0.37573760747909546, 0.4382902681827545, 0.5008429288864136, 0.563395619392395, 0.6259483098983765, 0.6885009407997131, 0.7510536313056946, 0.8136062622070312, 0.8761589527130127, 0.9387116432189941, 1.0012643337249756, 1.063817024230957, 1.126369595527649, 1.1889222860336304, 1.2514749765396118, 1.3140276670455933, 1.3765802383422852, 1.4391329288482666, 1.501685619354248, 1.5642383098602295, 1.626791000366211, 1.6893436908721924, 1.7518963813781738, 1.8144490718841553, 1.8770017623901367, 1.9395543336868286, 2.0021071434020996, 2.064659595489502, 2.1272122859954834, 2.189764976501465]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 11.0, 5.0, 8.0, 13.0, 17.0, 17.0, 17.0, 30.0, 24.0, 28.0, 37.0, 45.0, 48.0, 49.0, 69.0, 62.0, 52.0, 57.0, 54.0, 46.0, 57.0, 34.0, 38.0, 34.0, 26.0, 25.0, 21.0, 22.0, 11.0, 12.0, 8.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9570510983467102, -0.918036162853241, -0.8790212273597717, -0.8400062918663025, -0.8009912967681885, -0.7619763612747192, -0.72296142578125, -0.6839464902877808, -0.6449315547943115, -0.6059166193008423, -0.566901683807373, -0.5278867483139038, -0.4888717830181122, -0.44985684752464294, -0.4108418822288513, -0.3718269467353821, -0.33281201124191284, -0.2937970757484436, -0.25478214025497437, -0.21576717495918274, -0.1767522394657135, -0.13773730397224426, -0.09872235357761383, -0.0597074031829834, -0.02069246768951416, 0.018322475254535675, 0.05733741819858551, 0.09635236114263535, 0.13536730408668518, 0.17438223958015442, 0.21339718997478485, 0.2524121403694153, 0.2914271354675293, 0.33044207096099854, 0.3694570064544678, 0.4084719717502594, 0.44748690724372864, 0.4865018427371979, 0.5255168080329895, 0.5645317435264587, 0.603546679019928, 0.6425616145133972, 0.6815765500068665, 0.7205914855003357, 0.7596064805984497, 0.798621416091919, 0.8376363515853882, 0.8766512870788574, 0.9156662225723267, 0.9546811580657959, 0.9936960935592651, 1.0327110290527344, 1.0717259645462036, 1.1107409000396729, 1.149755835533142, 1.1887707710266113, 1.2277858257293701, 1.2668007612228394, 1.3058156967163086, 1.3448306322097778, 1.383845567703247, 1.4228605031967163, 1.4618754386901855, 1.5008904933929443, 1.539905309677124]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 9.0, 7.0, 13.0, 20.0, 33.0, 78.0, 109.0, 276.0, 518.0, 1302.0, 3795.0, 14472.0, 75954.0, 488421.0, 388131.0, 58453.0, 11688.0, 3278.0, 1041.0, 470.0, 224.0, 118.0, 53.0, 35.0, 14.0, 17.0, 6.0, 8.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5131072998046875, -0.492523193359375, -0.4719390869140625, -0.45135498046875, -0.4307708740234375, -0.410186767578125, -0.3896026611328125, -0.3690185546875, -0.3484344482421875, -0.327850341796875, -0.3072662353515625, -0.28668212890625, -0.2660980224609375, -0.245513916015625, -0.2249298095703125, -0.204345703125, -0.1837615966796875, -0.163177490234375, -0.1425933837890625, -0.12200927734375, -0.1014251708984375, -0.080841064453125, -0.0602569580078125, -0.0396728515625, -0.0190887451171875, 0.001495361328125, 0.0220794677734375, 0.04266357421875, 0.0632476806640625, 0.083831787109375, 0.1044158935546875, 0.125, 0.1455841064453125, 0.166168212890625, 0.1867523193359375, 0.20733642578125, 0.2279205322265625, 0.248504638671875, 0.2690887451171875, 0.2896728515625, 0.3102569580078125, 0.330841064453125, 0.3514251708984375, 0.37200927734375, 0.3925933837890625, 0.413177490234375, 0.4337615966796875, 0.454345703125, 0.4749298095703125, 0.495513916015625, 0.5160980224609375, 0.53668212890625, 0.5572662353515625, 0.577850341796875, 0.5984344482421875, 0.6190185546875, 0.6396026611328125, 0.660186767578125, 0.6807708740234375, 0.70135498046875, 0.7219390869140625, 0.742523193359375, 0.7631072998046875, 0.78369140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 10.0, 5.0, 6.0, 9.0, 12.0, 14.0, 23.0, 20.0, 23.0, 34.0, 48.0, 47.0, 53.0, 65.0, 60.0, 60.0, 66.0, 79.0, 54.0, 42.0, 38.0, 40.0, 25.0, 40.0, 35.0, 32.0, 16.0, 12.0, 12.0, 5.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.231201171875, -0.2251148223876953, -0.21902847290039062, -0.21294212341308594, -0.20685577392578125, -0.20076942443847656, -0.19468307495117188, -0.1885967254638672, -0.1825103759765625, -0.1764240264892578, -0.17033767700195312, -0.16425132751464844, -0.15816497802734375, -0.15207862854003906, -0.14599227905273438, -0.1399059295654297, -0.133819580078125, -0.1277332305908203, -0.12164688110351562, -0.11556053161621094, -0.10947418212890625, -0.10338783264160156, -0.09730148315429688, -0.09121513366699219, -0.0851287841796875, -0.07904243469238281, -0.07295608520507812, -0.06686973571777344, -0.06078338623046875, -0.05469703674316406, -0.048610687255859375, -0.04252433776855469, -0.03643798828125, -0.030351638793945312, -0.024265289306640625, -0.018178939819335938, -0.01209259033203125, -0.0060062408447265625, 8.0108642578125e-05, 0.0061664581298828125, 0.0122528076171875, 0.018339157104492188, 0.024425506591796875, 0.030511856079101562, 0.03659820556640625, 0.04268455505371094, 0.048770904541015625, 0.05485725402832031, 0.060943603515625, 0.06702995300292969, 0.07311630249023438, 0.07920265197753906, 0.08528900146484375, 0.09137535095214844, 0.09746170043945312, 0.10354804992675781, 0.1096343994140625, 0.11572074890136719, 0.12180709838867188, 0.12789344787597656, 0.13397979736328125, 0.14006614685058594, 0.14615249633789062, 0.1522388458251953, 0.1583251953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 11.0, 14.0, 18.0, 18.0, 25.0, 43.0, 38.0, 72.0, 107.0, 155.0, 217.0, 392.0, 678.0, 1470.0, 4229.0, 22178.0, 301824.0, 663196.0, 43415.0, 6399.0, 1936.0, 863.0, 429.0, 267.0, 160.0, 126.0, 81.0, 41.0, 39.0, 24.0, 18.0, 22.0, 6.0, 10.0, 6.0, 8.0, 2.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.96484375, -0.9365921020507812, -0.9083404541015625, -0.8800888061523438, -0.851837158203125, -0.8235855102539062, -0.7953338623046875, -0.7670822143554688, -0.73883056640625, -0.7105789184570312, -0.6823272705078125, -0.6540756225585938, -0.625823974609375, -0.5975723266601562, -0.5693206787109375, -0.5410690307617188, -0.5128173828125, -0.48456573486328125, -0.4563140869140625, -0.42806243896484375, -0.399810791015625, -0.37155914306640625, -0.3433074951171875, -0.31505584716796875, -0.28680419921875, -0.25855255126953125, -0.2303009033203125, -0.20204925537109375, -0.173797607421875, -0.14554595947265625, -0.1172943115234375, -0.08904266357421875, -0.060791015625, -0.03253936767578125, -0.0042877197265625, 0.02396392822265625, 0.052215576171875, 0.08046722412109375, 0.1087188720703125, 0.13697052001953125, 0.16522216796875, 0.19347381591796875, 0.2217254638671875, 0.24997711181640625, 0.278228759765625, 0.30648040771484375, 0.3347320556640625, 0.36298370361328125, 0.3912353515625, 0.41948699951171875, 0.4477386474609375, 0.47599029541015625, 0.504241943359375, 0.5324935913085938, 0.5607452392578125, 0.5889968872070312, 0.61724853515625, 0.6455001831054688, 0.6737518310546875, 0.7020034790039062, 0.730255126953125, 0.7585067749023438, 0.7867584228515625, 0.8150100708007812, 0.84326171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 4.0, 4.0, 9.0, 6.0, 12.0, 8.0, 20.0, 17.0, 17.0, 28.0, 30.0, 29.0, 40.0, 42.0, 35.0, 60.0, 60.0, 60.0, 67.0, 56.0, 61.0, 60.0, 42.0, 35.0, 19.0, 42.0, 28.0, 25.0, 17.0, 8.0, 12.0, 9.0, 10.0, 6.0, 11.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.1005859375, -1.0703506469726562, -1.0401153564453125, -1.0098800659179688, -0.979644775390625, -0.9494094848632812, -0.9191741943359375, -0.8889389038085938, -0.85870361328125, -0.8284683227539062, -0.7982330322265625, -0.7679977416992188, -0.737762451171875, -0.7075271606445312, -0.6772918701171875, -0.6470565795898438, -0.6168212890625, -0.5865859985351562, -0.5563507080078125, -0.5261154174804688, -0.495880126953125, -0.46564483642578125, -0.4354095458984375, -0.40517425537109375, -0.37493896484375, -0.34470367431640625, -0.3144683837890625, -0.28423309326171875, -0.253997802734375, -0.22376251220703125, -0.1935272216796875, -0.16329193115234375, -0.133056640625, -0.10282135009765625, -0.0725860595703125, -0.04235076904296875, -0.012115478515625, 0.01811981201171875, 0.0483551025390625, 0.07859039306640625, 0.10882568359375, 0.13906097412109375, 0.1692962646484375, 0.19953155517578125, 0.229766845703125, 0.26000213623046875, 0.2902374267578125, 0.32047271728515625, 0.3507080078125, 0.38094329833984375, 0.4111785888671875, 0.44141387939453125, 0.471649169921875, 0.5018844604492188, 0.5321197509765625, 0.5623550415039062, 0.59259033203125, 0.6228256225585938, 0.6530609130859375, 0.6832962036132812, 0.713531494140625, 0.7437667846679688, 0.7740020751953125, 0.8042373657226562, 0.83447265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 14.0, 20.0, 39.0, 61.0, 143.0, 235.0, 701.0, 2586.0, 32533.0, 972247.0, 35882.0, 2757.0, 727.0, 278.0, 148.0, 66.0, 40.0, 24.0, 12.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88330078125, -0.858428955078125, -0.83355712890625, -0.808685302734375, -0.7838134765625, -0.758941650390625, -0.73406982421875, -0.709197998046875, -0.684326171875, -0.659454345703125, -0.63458251953125, -0.609710693359375, -0.5848388671875, -0.559967041015625, -0.53509521484375, -0.510223388671875, -0.4853515625, -0.460479736328125, -0.43560791015625, -0.410736083984375, -0.3858642578125, -0.360992431640625, -0.33612060546875, -0.311248779296875, -0.286376953125, -0.261505126953125, -0.23663330078125, -0.211761474609375, -0.1868896484375, -0.162017822265625, -0.13714599609375, -0.112274169921875, -0.08740234375, -0.062530517578125, -0.03765869140625, -0.012786865234375, 0.0120849609375, 0.036956787109375, 0.06182861328125, 0.086700439453125, 0.111572265625, 0.136444091796875, 0.16131591796875, 0.186187744140625, 0.2110595703125, 0.235931396484375, 0.26080322265625, 0.285675048828125, 0.310546875, 0.335418701171875, 0.36029052734375, 0.385162353515625, 0.4100341796875, 0.434906005859375, 0.45977783203125, 0.484649658203125, 0.509521484375, 0.534393310546875, 0.55926513671875, 0.584136962890625, 0.6090087890625, 0.633880615234375, 0.65875244140625, 0.683624267578125, 0.70849609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 10.0, 21.0, 16.0, 37.0, 33.0, 51.0, 50.0, 69.0, 114.0, 149.0, 106.0, 78.0, 57.0, 51.0, 40.0, 26.0, 23.0, 11.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012046098709106445, -0.00011662300676107407, -0.00011278502643108368, -0.00010894704610109329, -0.0001051090657711029, -0.00010127108544111252, -9.743310511112213e-05, -9.359512478113174e-05, -8.975714445114136e-05, -8.591916412115097e-05, -8.208118379116058e-05, -7.82432034611702e-05, -7.440522313117981e-05, -7.056724280118942e-05, -6.672926247119904e-05, -6.289128214120865e-05, -5.905330181121826e-05, -5.5215321481227875e-05, -5.137734115123749e-05, -4.75393608212471e-05, -4.3701380491256714e-05, -3.986340016126633e-05, -3.602541983127594e-05, -3.218743950128555e-05, -2.8349459171295166e-05, -2.451147884130478e-05, -2.0673498511314392e-05, -1.6835518181324005e-05, -1.2997537851333618e-05, -9.159557521343231e-06, -5.321577191352844e-06, -1.4835968613624573e-06, 2.3543834686279297e-06, 6.192363798618317e-06, 1.0030344128608704e-05, 1.386832445859909e-05, 1.7706304788589478e-05, 2.1544285118579865e-05, 2.538226544857025e-05, 2.922024577856064e-05, 3.3058226108551025e-05, 3.689620643854141e-05, 4.07341867685318e-05, 4.4572167098522186e-05, 4.841014742851257e-05, 5.224812775850296e-05, 5.608610808849335e-05, 5.9924088418483734e-05, 6.376206874847412e-05, 6.760004907846451e-05, 7.14380294084549e-05, 7.527600973844528e-05, 7.911399006843567e-05, 8.295197039842606e-05, 8.678995072841644e-05, 9.062793105840683e-05, 9.446591138839722e-05, 9.83038917183876e-05, 0.00010214187204837799, 0.00010597985237836838, 0.00010981783270835876, 0.00011365581303834915, 0.00011749379336833954, 0.00012133177369832993, 0.0001251697540283203]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 13.0, 16.0, 25.0, 39.0, 83.0, 147.0, 288.0, 712.0, 2463.0, 20264.0, 849496.0, 165694.0, 6994.0, 1311.0, 486.0, 223.0, 135.0, 62.0, 42.0, 27.0, 8.0, 8.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5466690063476562, -0.5254669189453125, -0.5042648315429688, -0.483062744140625, -0.46186065673828125, -0.4406585693359375, -0.41945648193359375, -0.39825439453125, -0.37705230712890625, -0.3558502197265625, -0.33464813232421875, -0.313446044921875, -0.29224395751953125, -0.2710418701171875, -0.24983978271484375, -0.2286376953125, -0.20743560791015625, -0.1862335205078125, -0.16503143310546875, -0.143829345703125, -0.12262725830078125, -0.1014251708984375, -0.08022308349609375, -0.05902099609375, -0.03781890869140625, -0.0166168212890625, 0.00458526611328125, 0.025787353515625, 0.04698944091796875, 0.0681915283203125, 0.08939361572265625, 0.110595703125, 0.13179779052734375, 0.1529998779296875, 0.17420196533203125, 0.195404052734375, 0.21660614013671875, 0.2378082275390625, 0.25901031494140625, 0.28021240234375, 0.30141448974609375, 0.3226165771484375, 0.34381866455078125, 0.365020751953125, 0.38622283935546875, 0.4074249267578125, 0.42862701416015625, 0.4498291015625, 0.47103118896484375, 0.4922332763671875, 0.5134353637695312, 0.534637451171875, 0.5558395385742188, 0.5770416259765625, 0.5982437133789062, 0.61944580078125, 0.6406478881835938, 0.6618499755859375, 0.6830520629882812, 0.704254150390625, 0.7254562377929688, 0.7466583251953125, 0.7678604125976562, 0.7890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 5.0, 16.0, 22.0, 27.0, 58.0, 65.0, 136.0, 168.0, 172.0, 124.0, 77.0, 43.0, 32.0, 22.0, 11.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471923828125, -0.4530067443847656, -0.43408966064453125, -0.4151725769042969, -0.3962554931640625, -0.3773384094238281, -0.35842132568359375, -0.3395042419433594, -0.320587158203125, -0.3016700744628906, -0.28275299072265625, -0.2638359069824219, -0.2449188232421875, -0.22600173950195312, -0.20708465576171875, -0.18816757202148438, -0.16925048828125, -0.15033340454101562, -0.13141632080078125, -0.11249923706054688, -0.0935821533203125, -0.07466506958007812, -0.05574798583984375, -0.036830902099609375, -0.017913818359375, 0.001003265380859375, 0.01992034912109375, 0.038837432861328125, 0.0577545166015625, 0.07667160034179688, 0.09558868408203125, 0.11450576782226562, 0.1334228515625, 0.15233993530273438, 0.17125701904296875, 0.19017410278320312, 0.2090911865234375, 0.22800827026367188, 0.24692535400390625, 0.2658424377441406, 0.284759521484375, 0.3036766052246094, 0.32259368896484375, 0.3415107727050781, 0.3604278564453125, 0.3793449401855469, 0.39826202392578125, 0.4171791076660156, 0.43609619140625, 0.4550132751464844, 0.47393035888671875, 0.4928474426269531, 0.5117645263671875, 0.5306816101074219, 0.5495986938476562, 0.5685157775878906, 0.587432861328125, 0.6063499450683594, 0.6252670288085938, 0.6441841125488281, 0.6631011962890625, 0.6820182800292969, 0.7009353637695312, 0.7198524475097656, 0.73876953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 34.0, 175.0, 456.0, 269.0, 52.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.47958755493164, -17.929616928100586, -17.37964630126953, -16.829673767089844, -16.27970314025879, -15.729732513427734, -15.17976188659668, -14.629790306091309, -14.079818725585938, -13.529848098754883, -12.979876518249512, -12.429905891418457, -11.879934310913086, -11.329963684082031, -10.779993057250977, -10.230021476745605, -9.68005084991455, -9.130080223083496, -8.580108642578125, -8.03013801574707, -7.480166435241699, -6.9301958084106445, -6.380224704742432, -5.830253601074219, -5.280282497406006, -4.730311393737793, -4.18034029006958, -3.6303694248199463, -3.0803983211517334, -2.5304272174835205, -1.9804563522338867, -1.4304852485656738, -0.8805141448974609, -0.3305431008338928, 0.2194279432296753, 0.7693989276885986, 1.3193700313568115, 1.8693411350250244, 2.419312000274658, 2.969283103942871, 3.519254207611084, 4.069225311279297, 4.61919641494751, 5.169167518615723, 5.719138145446777, 6.269109725952148, 6.819080352783203, 7.369051456451416, 7.919022560119629, 8.468993186950684, 9.018964767456055, 9.56893539428711, 10.11890697479248, 10.668877601623535, 11.218849182128906, 11.768819808959961, 12.318790435791016, 12.86876106262207, 13.418732643127441, 13.968703269958496, 14.518674850463867, 15.068645477294922, 15.618616104125977, 16.16858673095703, 16.71855926513672]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 5.0, 6.0, 9.0, 6.0, 11.0, 11.0, 9.0, 15.0, 27.0, 28.0, 38.0, 33.0, 44.0, 49.0, 50.0, 50.0, 62.0, 51.0, 47.0, 59.0, 54.0, 39.0, 39.0, 40.0, 29.0, 31.0, 29.0, 20.0, 16.0, 11.0, 13.0, 10.0, 9.0, 11.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0], "bins": [-4.85911750793457, -4.733467102050781, -4.607816696166992, -4.482166290283203, -4.356515884399414, -4.230865478515625, -4.105215072631836, -3.979564666748047, -3.853914260864258, -3.7282638549804688, -3.6026134490966797, -3.4769630432128906, -3.3513126373291016, -3.2256622314453125, -3.1000118255615234, -2.9743614196777344, -2.8487110137939453, -2.7230606079101562, -2.597410202026367, -2.471759796142578, -2.346109390258789, -2.220458984375, -2.094808578491211, -1.9691581726074219, -1.8435077667236328, -1.7178573608398438, -1.5922069549560547, -1.4665565490722656, -1.3409061431884766, -1.2152557373046875, -1.0896053314208984, -0.9639549255371094, -0.8383049964904785, -0.7126545906066895, -0.5870041847229004, -0.46135377883911133, -0.33570337295532227, -0.2100529670715332, -0.08440256118774414, 0.04124784469604492, 0.16689825057983398, 0.29254865646362305, 0.4181990623474121, 0.5438494682312012, 0.6694998741149902, 0.7951502799987793, 0.9208006858825684, 1.0464510917663574, 1.1721014976501465, 1.2977519035339355, 1.4234023094177246, 1.5490527153015137, 1.6747031211853027, 1.8003535270690918, 1.9260039329528809, 2.05165433883667, 2.177304744720459, 2.302955150604248, 2.428605556488037, 2.554255962371826, 2.6799063682556152, 2.8055567741394043, 2.9312071800231934, 3.0568575859069824, 3.1825079917907715]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 5.0, 6.0, 3.0, 13.0, 6.0, 14.0, 11.0, 11.0, 15.0, 34.0, 48.0, 74.0, 99.0, 165.0, 284.0, 516.0, 824.0, 1455.0, 3198.0, 7884.0, 25760.0, 170495.0, 3578722.0, 347712.0, 38791.0, 10644.0, 3794.0, 1749.0, 861.0, 464.0, 244.0, 162.0, 79.0, 56.0, 31.0, 15.0, 12.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.56640625, -0.5513496398925781, -0.5362930297851562, -0.5212364196777344, -0.5061798095703125, -0.4911231994628906, -0.47606658935546875, -0.4610099792480469, -0.445953369140625, -0.4308967590332031, -0.41584014892578125, -0.4007835388183594, -0.3857269287109375, -0.3706703186035156, -0.35561370849609375, -0.3405570983886719, -0.32550048828125, -0.3104438781738281, -0.29538726806640625, -0.2803306579589844, -0.2652740478515625, -0.2502174377441406, -0.23516082763671875, -0.22010421752929688, -0.205047607421875, -0.18999099731445312, -0.17493438720703125, -0.15987777709960938, -0.1448211669921875, -0.12976455688476562, -0.11470794677734375, -0.09965133666992188, -0.0845947265625, -0.06953811645507812, -0.05448150634765625, -0.039424896240234375, -0.0243682861328125, -0.009311676025390625, 0.00574493408203125, 0.020801544189453125, 0.035858154296875, 0.050914764404296875, 0.06597137451171875, 0.08102798461914062, 0.0960845947265625, 0.11114120483398438, 0.12619781494140625, 0.14125442504882812, 0.15631103515625, 0.17136764526367188, 0.18642425537109375, 0.20148086547851562, 0.2165374755859375, 0.23159408569335938, 0.24665069580078125, 0.2617073059082031, 0.276763916015625, 0.2918205261230469, 0.30687713623046875, 0.3219337463378906, 0.3369903564453125, 0.3520469665527344, 0.36710357666015625, 0.3821601867675781, 0.397216796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 8.0, 10.0, 12.0, 19.0, 20.0, 46.0, 56.0, 70.0, 75.0, 85.0, 94.0, 95.0, 77.0, 76.0, 50.0, 47.0, 54.0, 33.0, 29.0, 12.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3583984375, -0.35002708435058594, -0.3416557312011719, -0.3332843780517578, -0.32491302490234375, -0.3165416717529297, -0.3081703186035156, -0.29979896545410156, -0.2914276123046875, -0.28305625915527344, -0.2746849060058594, -0.2663135528564453, -0.25794219970703125, -0.2495708465576172, -0.24119949340820312, -0.23282814025878906, -0.224456787109375, -0.21608543395996094, -0.20771408081054688, -0.1993427276611328, -0.19097137451171875, -0.1826000213623047, -0.17422866821289062, -0.16585731506347656, -0.1574859619140625, -0.14911460876464844, -0.14074325561523438, -0.1323719024658203, -0.12400054931640625, -0.11562919616699219, -0.10725784301757812, -0.09888648986816406, -0.09051513671875, -0.08214378356933594, -0.07377243041992188, -0.06540107727050781, -0.05702972412109375, -0.04865837097167969, -0.040287017822265625, -0.03191566467285156, -0.0235443115234375, -0.015172958374023438, -0.006801605224609375, 0.0015697479248046875, 0.00994110107421875, 0.018312454223632812, 0.026683807373046875, 0.03505516052246094, 0.043426513671875, 0.05179786682128906, 0.060169219970703125, 0.06854057312011719, 0.07691192626953125, 0.08528327941894531, 0.09365463256835938, 0.10202598571777344, 0.1103973388671875, 0.11876869201660156, 0.12714004516601562, 0.1355113983154297, 0.14388275146484375, 0.1522541046142578, 0.16062545776367188, 0.16899681091308594, 0.1773681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 4.0, 17.0, 15.0, 26.0, 46.0, 67.0, 122.0, 224.0, 425.0, 1032.0, 2828.0, 9604.0, 57120.0, 3151320.0, 924665.0, 35539.0, 7232.0, 2227.0, 858.0, 397.0, 195.0, 112.0, 66.0, 45.0, 26.0, 15.0, 15.0, 8.0, 7.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.802734375, -0.7783279418945312, -0.7539215087890625, -0.7295150756835938, -0.705108642578125, -0.6807022094726562, -0.6562957763671875, -0.6318893432617188, -0.60748291015625, -0.5830764770507812, -0.5586700439453125, -0.5342636108398438, -0.509857177734375, -0.48545074462890625, -0.4610443115234375, -0.43663787841796875, -0.4122314453125, -0.38782501220703125, -0.3634185791015625, -0.33901214599609375, -0.314605712890625, -0.29019927978515625, -0.2657928466796875, -0.24138641357421875, -0.21697998046875, -0.19257354736328125, -0.1681671142578125, -0.14376068115234375, -0.119354248046875, -0.09494781494140625, -0.0705413818359375, -0.04613494873046875, -0.021728515625, 0.00267791748046875, 0.0270843505859375, 0.05149078369140625, 0.075897216796875, 0.10030364990234375, 0.1247100830078125, 0.14911651611328125, 0.17352294921875, 0.19792938232421875, 0.2223358154296875, 0.24674224853515625, 0.271148681640625, 0.29555511474609375, 0.3199615478515625, 0.34436798095703125, 0.3687744140625, 0.39318084716796875, 0.4175872802734375, 0.44199371337890625, 0.466400146484375, 0.49080657958984375, 0.5152130126953125, 0.5396194458007812, 0.56402587890625, 0.5884323120117188, 0.6128387451171875, 0.6372451782226562, 0.661651611328125, 0.6860580444335938, 0.7104644775390625, 0.7348709106445312, 0.75927734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 3.0, 8.0, 13.0, 14.0, 19.0, 32.0, 54.0, 88.0, 168.0, 349.0, 971.0, 1362.0, 489.0, 214.0, 94.0, 75.0, 27.0, 21.0, 20.0, 12.0, 12.0, 5.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7548828125, -0.7327651977539062, -0.7106475830078125, -0.6885299682617188, -0.666412353515625, -0.6442947387695312, -0.6221771240234375, -0.6000595092773438, -0.57794189453125, -0.5558242797851562, -0.5337066650390625, -0.5115890502929688, -0.489471435546875, -0.46735382080078125, -0.4452362060546875, -0.42311859130859375, -0.4010009765625, -0.37888336181640625, -0.3567657470703125, -0.33464813232421875, -0.312530517578125, -0.29041290283203125, -0.2682952880859375, -0.24617767333984375, -0.22406005859375, -0.20194244384765625, -0.1798248291015625, -0.15770721435546875, -0.135589599609375, -0.11347198486328125, -0.0913543701171875, -0.06923675537109375, -0.047119140625, -0.02500152587890625, -0.0028839111328125, 0.01923370361328125, 0.041351318359375, 0.06346893310546875, 0.0855865478515625, 0.10770416259765625, 0.12982177734375, 0.15193939208984375, 0.1740570068359375, 0.19617462158203125, 0.218292236328125, 0.24040985107421875, 0.2625274658203125, 0.28464508056640625, 0.3067626953125, 0.32888031005859375, 0.3509979248046875, 0.37311553955078125, 0.395233154296875, 0.41735076904296875, 0.4394683837890625, 0.46158599853515625, 0.48370361328125, 0.5058212280273438, 0.5279388427734375, 0.5500564575195312, 0.572174072265625, 0.5942916870117188, 0.6164093017578125, 0.6385269165039062, 0.66064453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 22.0, 94.0, 288.0, 386.0, 148.0, 34.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.180972099304199, -6.842856407165527, -6.5047407150268555, -6.166625022888184, -5.828509330749512, -5.49039363861084, -5.15227746963501, -4.814161777496338, -4.476046085357666, -4.137930393218994, -3.7998147010803223, -3.4616987705230713, -3.1235830783843994, -2.7854673862457275, -2.4473514556884766, -2.1092357635498047, -1.7711200714111328, -1.433004379272461, -1.0948885679244995, -0.7567727565765381, -0.4186570644378662, -0.08054137229919434, 0.25757455825805664, 0.5956902503967285, 0.9338059425354004, 1.2719216346740723, 1.6100374460220337, 1.9481532573699951, 2.286268949508667, 2.624384641647339, 2.96250057220459, 3.3006162643432617, 3.638731002807617, 3.976846694946289, 4.314962387084961, 4.653078079223633, 4.991193771362305, 5.329309463500977, 5.667425632476807, 6.0055413246154785, 6.34365701675415, 6.681772708892822, 7.019888401031494, 7.358004570007324, 7.696120262145996, 8.034235954284668, 8.37235164642334, 8.710467338562012, 9.048583030700684, 9.386698722839355, 9.724814414978027, 10.0629301071167, 10.401045799255371, 10.739161491394043, 11.077278137207031, 11.415393829345703, 11.753509521484375, 12.091625213623047, 12.429740905761719, 12.76785659790039, 13.105972290039062, 13.444087982177734, 13.782203674316406, 14.120319366455078, 14.45843505859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 9.0, 12.0, 11.0, 14.0, 21.0, 19.0, 27.0, 31.0, 30.0, 49.0, 36.0, 27.0, 33.0, 45.0, 32.0, 49.0, 44.0, 50.0, 58.0, 43.0, 40.0, 37.0, 36.0, 24.0, 28.0, 20.0, 29.0, 26.0, 18.0, 18.0, 7.0, 14.0, 8.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.060170888900757, -1.991247296333313, -1.9223237037658691, -1.8534002304077148, -1.784476637840271, -1.7155530452728271, -1.6466295719146729, -1.577705979347229, -1.5087823867797852, -1.4398587942123413, -1.3709352016448975, -1.3020117282867432, -1.2330881357192993, -1.1641645431518555, -1.0952410697937012, -1.0263174772262573, -0.9573938846588135, -0.8884702920913696, -0.8195467591285706, -0.7506232261657715, -0.6816996335983276, -0.6127760410308838, -0.5438525080680847, -0.47492894530296326, -0.4060053825378418, -0.33708181977272034, -0.2681582570075989, -0.19923469424247742, -0.13031113147735596, -0.0613875687122345, 0.007535994052886963, 0.07645955681800842, 0.14538335800170898, 0.21430692076683044, 0.2832304835319519, 0.35215404629707336, 0.4210776090621948, 0.4900011718273163, 0.5589247345924377, 0.6278482675552368, 0.6967718601226807, 0.7656954526901245, 0.8346189856529236, 0.9035425186157227, 0.9724661111831665, 1.0413897037506104, 1.1103131771087646, 1.1792367696762085, 1.2481603622436523, 1.3170839548110962, 1.38600754737854, 1.4549310207366943, 1.5238546133041382, 1.592778205871582, 1.6617016792297363, 1.7306252717971802, 1.799548864364624, 1.8684724569320679, 1.9373960494995117, 2.006319522857666, 2.0752429962158203, 2.1441667079925537, 2.213090181350708, 2.2820138931274414, 2.3509373664855957]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 9.0, 19.0, 17.0, 33.0, 58.0, 96.0, 150.0, 241.0, 425.0, 773.0, 1536.0, 3157.0, 7367.0, 20199.0, 69340.0, 315976.0, 474402.0, 107676.0, 28874.0, 10054.0, 4095.0, 1875.0, 882.0, 546.0, 289.0, 159.0, 109.0, 65.0, 48.0, 25.0, 16.0, 7.0, 11.0, 7.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6328697204589844, -0.6158370971679688, -0.5988044738769531, -0.5817718505859375, -0.5647392272949219, -0.5477066040039062, -0.5306739807128906, -0.513641357421875, -0.4966087341308594, -0.47957611083984375, -0.4625434875488281, -0.4455108642578125, -0.4284782409667969, -0.41144561767578125, -0.3944129943847656, -0.37738037109375, -0.3603477478027344, -0.34331512451171875, -0.3262825012207031, -0.3092498779296875, -0.2922172546386719, -0.27518463134765625, -0.2581520080566406, -0.241119384765625, -0.22408676147460938, -0.20705413818359375, -0.19002151489257812, -0.1729888916015625, -0.15595626831054688, -0.13892364501953125, -0.12189102172851562, -0.1048583984375, -0.08782577514648438, -0.07079315185546875, -0.053760528564453125, -0.0367279052734375, -0.019695281982421875, -0.00266265869140625, 0.014369964599609375, 0.031402587890625, 0.048435211181640625, 0.06546783447265625, 0.08250045776367188, 0.0995330810546875, 0.11656570434570312, 0.13359832763671875, 0.15063095092773438, 0.16766357421875, 0.18469619750976562, 0.20172882080078125, 0.21876144409179688, 0.2357940673828125, 0.2528266906738281, 0.26985931396484375, 0.2868919372558594, 0.303924560546875, 0.3209571838378906, 0.33798980712890625, 0.3550224304199219, 0.3720550537109375, 0.3890876770019531, 0.40612030029296875, 0.4231529235839844, 0.440185546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 11.0, 21.0, 15.0, 27.0, 32.0, 60.0, 49.0, 65.0, 59.0, 76.0, 89.0, 69.0, 70.0, 67.0, 52.0, 49.0, 33.0, 35.0, 27.0, 29.0, 23.0, 4.0, 6.0, 6.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2538928985595703, -0.24655532836914062, -0.23921775817871094, -0.23188018798828125, -0.22454261779785156, -0.21720504760742188, -0.2098674774169922, -0.2025299072265625, -0.1951923370361328, -0.18785476684570312, -0.18051719665527344, -0.17317962646484375, -0.16584205627441406, -0.15850448608398438, -0.1511669158935547, -0.143829345703125, -0.1364917755126953, -0.12915420532226562, -0.12181663513183594, -0.11447906494140625, -0.10714149475097656, -0.09980392456054688, -0.09246635437011719, -0.0851287841796875, -0.07779121398925781, -0.07045364379882812, -0.06311607360839844, -0.05577850341796875, -0.04844093322753906, -0.041103363037109375, -0.03376579284667969, -0.02642822265625, -0.019090652465820312, -0.011753082275390625, -0.0044155120849609375, 0.00292205810546875, 0.010259628295898438, 0.017597198486328125, 0.024934768676757812, 0.0322723388671875, 0.03960990905761719, 0.046947479248046875, 0.05428504943847656, 0.06162261962890625, 0.06896018981933594, 0.07629776000976562, 0.08363533020019531, 0.090972900390625, 0.09831047058105469, 0.10564804077148438, 0.11298561096191406, 0.12032318115234375, 0.12766075134277344, 0.13499832153320312, 0.1423358917236328, 0.1496734619140625, 0.1570110321044922, 0.16434860229492188, 0.17168617248535156, 0.17902374267578125, 0.18636131286621094, 0.19369888305664062, 0.2010364532470703, 0.2083740234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 9.0, 17.0, 21.0, 28.0, 44.0, 65.0, 119.0, 199.0, 392.0, 955.0, 2641.0, 13089.0, 433675.0, 578056.0, 14616.0, 2718.0, 933.0, 437.0, 199.0, 125.0, 79.0, 28.0, 32.0, 13.0, 16.0, 7.0, 7.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1240234375, -1.0791015625, -1.0341796875, -0.9892578125, -0.9443359375, -0.8994140625, -0.8544921875, -0.8095703125, -0.7646484375, -0.7197265625, -0.6748046875, -0.6298828125, -0.5849609375, -0.5400390625, -0.4951171875, -0.4501953125, -0.4052734375, -0.3603515625, -0.3154296875, -0.2705078125, -0.2255859375, -0.1806640625, -0.1357421875, -0.0908203125, -0.0458984375, -0.0009765625, 0.0439453125, 0.0888671875, 0.1337890625, 0.1787109375, 0.2236328125, 0.2685546875, 0.3134765625, 0.3583984375, 0.4033203125, 0.4482421875, 0.4931640625, 0.5380859375, 0.5830078125, 0.6279296875, 0.6728515625, 0.7177734375, 0.7626953125, 0.8076171875, 0.8525390625, 0.8974609375, 0.9423828125, 0.9873046875, 1.0322265625, 1.0771484375, 1.1220703125, 1.1669921875, 1.2119140625, 1.2568359375, 1.3017578125, 1.3466796875, 1.3916015625, 1.4365234375, 1.4814453125, 1.5263671875, 1.5712890625, 1.6162109375, 1.6611328125, 1.7060546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 12.0, 9.0, 11.0, 18.0, 26.0, 19.0, 22.0, 32.0, 42.0, 51.0, 63.0, 52.0, 63.0, 86.0, 71.0, 58.0, 62.0, 57.0, 44.0, 42.0, 32.0, 25.0, 15.0, 27.0, 17.0, 17.0, 9.0, 8.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9064178466796875, -0.870452880859375, -0.8344879150390625, -0.79852294921875, -0.7625579833984375, -0.726593017578125, -0.6906280517578125, -0.6546630859375, -0.6186981201171875, -0.582733154296875, -0.5467681884765625, -0.51080322265625, -0.4748382568359375, -0.438873291015625, -0.4029083251953125, -0.366943359375, -0.3309783935546875, -0.295013427734375, -0.2590484619140625, -0.22308349609375, -0.1871185302734375, -0.151153564453125, -0.1151885986328125, -0.0792236328125, -0.0432586669921875, -0.007293701171875, 0.0286712646484375, 0.06463623046875, 0.1006011962890625, 0.136566162109375, 0.1725311279296875, 0.20849609375, 0.2444610595703125, 0.280426025390625, 0.3163909912109375, 0.35235595703125, 0.3883209228515625, 0.424285888671875, 0.4602508544921875, 0.4962158203125, 0.5321807861328125, 0.568145751953125, 0.6041107177734375, 0.64007568359375, 0.6760406494140625, 0.712005615234375, 0.7479705810546875, 0.783935546875, 0.8199005126953125, 0.855865478515625, 0.8918304443359375, 0.92779541015625, 0.9637603759765625, 0.999725341796875, 1.0356903076171875, 1.0716552734375, 1.1076202392578125, 1.143585205078125, 1.1795501708984375, 1.21551513671875, 1.2514801025390625, 1.287445068359375, 1.3234100341796875, 1.359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 12.0, 16.0, 7.0, 10.0, 34.0, 59.0, 111.0, 249.0, 663.0, 2142.0, 14385.0, 868329.0, 154152.0, 6203.0, 1287.0, 445.0, 181.0, 120.0, 51.0, 29.0, 24.0, 14.0, 5.0, 8.0, 1.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.7785797119140625, -0.749542236328125, -0.7205047607421875, -0.69146728515625, -0.6624298095703125, -0.633392333984375, -0.6043548583984375, -0.5753173828125, -0.5462799072265625, -0.517242431640625, -0.4882049560546875, -0.45916748046875, -0.4301300048828125, -0.401092529296875, -0.3720550537109375, -0.343017578125, -0.3139801025390625, -0.284942626953125, -0.2559051513671875, -0.22686767578125, -0.1978302001953125, -0.168792724609375, -0.1397552490234375, -0.1107177734375, -0.0816802978515625, -0.052642822265625, -0.0236053466796875, 0.00543212890625, 0.0344696044921875, 0.063507080078125, 0.0925445556640625, 0.12158203125, 0.1506195068359375, 0.179656982421875, 0.2086944580078125, 0.23773193359375, 0.2667694091796875, 0.295806884765625, 0.3248443603515625, 0.3538818359375, 0.3829193115234375, 0.411956787109375, 0.4409942626953125, 0.47003173828125, 0.4990692138671875, 0.528106689453125, 0.5571441650390625, 0.586181640625, 0.6152191162109375, 0.644256591796875, 0.6732940673828125, 0.70233154296875, 0.7313690185546875, 0.760406494140625, 0.7894439697265625, 0.8184814453125, 0.8475189208984375, 0.876556396484375, 0.9055938720703125, 0.93463134765625, 0.9636688232421875, 0.992706298828125, 1.0217437744140625, 1.05078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 17.0, 20.0, 40.0, 62.0, 86.0, 107.0, 146.0, 128.0, 104.0, 79.0, 60.0, 46.0, 25.0, 21.0, 10.0, 12.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021529197692871094, -0.00020461156964302063, -0.00019393116235733032, -0.00018325075507164001, -0.0001725703477859497, -0.0001618899405002594, -0.0001512095332145691, -0.00014052912592887878, -0.00012984871864318848, -0.00011916831135749817, -0.00010848790407180786, -9.780749678611755e-05, -8.712708950042725e-05, -7.644668221473694e-05, -6.576627492904663e-05, -5.508586764335632e-05, -4.4405460357666016e-05, -3.372505307197571e-05, -2.30446457862854e-05, -1.2364238500595093e-05, -1.6838312149047852e-06, 8.996576070785522e-06, 1.967698335647583e-05, 3.0357390642166138e-05, 4.1037797927856445e-05, 5.171820521354675e-05, 6.239861249923706e-05, 7.307901978492737e-05, 8.375942707061768e-05, 9.443983435630798e-05, 0.00010512024164199829, 0.0001158006489276886, 0.0001264810562133789, 0.00013716146349906921, 0.00014784187078475952, 0.00015852227807044983, 0.00016920268535614014, 0.00017988309264183044, 0.00019056349992752075, 0.00020124390721321106, 0.00021192431449890137, 0.00022260472178459167, 0.00023328512907028198, 0.0002439655363559723, 0.0002546459436416626, 0.0002653263509273529, 0.0002760067582130432, 0.0002866871654987335, 0.00029736757278442383, 0.00030804798007011414, 0.00031872838735580444, 0.00032940879464149475, 0.00034008920192718506, 0.00035076960921287537, 0.0003614500164985657, 0.000372130423784256, 0.0003828108310699463, 0.0003934912383556366, 0.0004041716456413269, 0.0004148520529270172, 0.0004255324602127075, 0.00043621286749839783, 0.00044689327478408813, 0.00045757368206977844, 0.00046825408935546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 4.0, 16.0, 23.0, 38.0, 37.0, 77.0, 90.0, 162.0, 270.0, 505.0, 1018.0, 2762.0, 13351.0, 219298.0, 773084.0, 30374.0, 4470.0, 1408.0, 700.0, 329.0, 186.0, 127.0, 62.0, 51.0, 30.0, 28.0, 13.0, 10.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5458984375, -0.52581787109375, -0.5057373046875, -0.48565673828125, -0.465576171875, -0.44549560546875, -0.4254150390625, -0.40533447265625, -0.38525390625, -0.36517333984375, -0.3450927734375, -0.32501220703125, -0.304931640625, -0.28485107421875, -0.2647705078125, -0.24468994140625, -0.224609375, -0.20452880859375, -0.1844482421875, -0.16436767578125, -0.144287109375, -0.12420654296875, -0.1041259765625, -0.08404541015625, -0.06396484375, -0.04388427734375, -0.0238037109375, -0.00372314453125, 0.016357421875, 0.03643798828125, 0.0565185546875, 0.07659912109375, 0.0966796875, 0.11676025390625, 0.1368408203125, 0.15692138671875, 0.177001953125, 0.19708251953125, 0.2171630859375, 0.23724365234375, 0.25732421875, 0.27740478515625, 0.2974853515625, 0.31756591796875, 0.337646484375, 0.35772705078125, 0.3778076171875, 0.39788818359375, 0.41796875, 0.43804931640625, 0.4581298828125, 0.47821044921875, 0.498291015625, 0.51837158203125, 0.5384521484375, 0.55853271484375, 0.57861328125, 0.59869384765625, 0.6187744140625, 0.63885498046875, 0.658935546875, 0.67901611328125, 0.6990966796875, 0.71917724609375, 0.7392578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 6.0, 8.0, 14.0, 8.0, 23.0, 34.0, 33.0, 48.0, 58.0, 63.0, 72.0, 98.0, 87.0, 78.0, 67.0, 67.0, 44.0, 47.0, 32.0, 26.0, 13.0, 10.0, 16.0, 9.0, 4.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32421875, -0.3105316162109375, -0.296844482421875, -0.2831573486328125, -0.26947021484375, -0.2557830810546875, -0.242095947265625, -0.2284088134765625, -0.2147216796875, -0.2010345458984375, -0.187347412109375, -0.1736602783203125, -0.15997314453125, -0.1462860107421875, -0.132598876953125, -0.1189117431640625, -0.105224609375, -0.0915374755859375, -0.077850341796875, -0.0641632080078125, -0.05047607421875, -0.0367889404296875, -0.023101806640625, -0.0094146728515625, 0.0042724609375, 0.0179595947265625, 0.031646728515625, 0.0453338623046875, 0.05902099609375, 0.0727081298828125, 0.086395263671875, 0.1000823974609375, 0.11376953125, 0.1274566650390625, 0.141143798828125, 0.1548309326171875, 0.16851806640625, 0.1822052001953125, 0.195892333984375, 0.2095794677734375, 0.2232666015625, 0.2369537353515625, 0.250640869140625, 0.2643280029296875, 0.27801513671875, 0.2917022705078125, 0.305389404296875, 0.3190765380859375, 0.332763671875, 0.3464508056640625, 0.360137939453125, 0.3738250732421875, 0.38751220703125, 0.4011993408203125, 0.414886474609375, 0.4285736083984375, 0.4422607421875, 0.4559478759765625, 0.469635009765625, 0.4833221435546875, 0.49700927734375, 0.5106964111328125, 0.524383544921875, 0.5380706787109375, 0.5517578125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 52.0, 164.0, 389.0, 244.0, 96.0, 26.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.409454345703125, -10.003876686096191, -9.598299026489258, -9.192720413208008, -8.787142753601074, -8.38156509399414, -7.975986957550049, -7.570408821105957, -7.164831161499023, -6.75925350189209, -6.353675365447998, -5.948097229003906, -5.542519569396973, -5.136941909790039, -4.731363773345947, -4.3257856369018555, -3.920207977294922, -3.514630079269409, -3.1090521812438965, -2.703474283218384, -2.297896385192871, -1.8923184871673584, -1.4867405891418457, -1.081162691116333, -0.6755847930908203, -0.2700068950653076, 0.13557100296020508, 0.5411489009857178, 0.9467267990112305, 1.3523046970367432, 1.7578825950622559, 2.1634604930877686, 2.5690383911132812, 2.974616289138794, 3.3801941871643066, 3.7857720851898193, 4.191349983215332, 4.596927642822266, 5.002505779266357, 5.408083915710449, 5.813661575317383, 6.219239234924316, 6.624817371368408, 7.0303955078125, 7.435973167419434, 7.841550827026367, 8.247129440307617, 8.65270709991455, 9.058284759521484, 9.463862419128418, 9.869440078735352, 10.275018692016602, 10.680596351623535, 11.086174011230469, 11.491752624511719, 11.897330284118652, 12.302907943725586, 12.70848560333252, 13.114063262939453, 13.519641876220703, 13.925219535827637, 14.33079719543457, 14.73637580871582, 15.141953468322754, 15.547531127929688]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 10.0, 4.0, 5.0, 14.0, 9.0, 15.0, 12.0, 24.0, 30.0, 27.0, 40.0, 38.0, 52.0, 49.0, 62.0, 60.0, 64.0, 61.0, 53.0, 47.0, 54.0, 54.0, 35.0, 29.0, 30.0, 26.0, 16.0, 14.0, 16.0, 12.0, 8.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-4.932521343231201, -4.801183223724365, -4.669845104217529, -4.538506984710693, -4.407168388366699, -4.275830268859863, -4.144492149353027, -4.013154029846191, -3.8818159103393555, -3.7504777908325195, -3.6191396713256836, -3.4878013134002686, -3.3564631938934326, -3.2251250743865967, -3.0937867164611816, -2.9624485969543457, -2.8311104774475098, -2.699772357940674, -2.568434238433838, -2.437095880508423, -2.305757761001587, -2.174419641494751, -2.043081283569336, -1.9117431640625, -1.780405044555664, -1.6490669250488281, -1.5177286863327026, -1.3863904476165771, -1.2550523281097412, -1.1237142086029053, -0.9923759698867798, -0.8610377907752991, -0.7296993732452393, -0.5983611941337585, -0.46702301502227783, -0.3356848359107971, -0.2043466567993164, -0.0730084776878357, 0.05832970142364502, 0.18966788053512573, 0.32100605964660645, 0.45234423875808716, 0.5836824178695679, 0.7150205969810486, 0.8463587760925293, 0.97769695520401, 1.1090351343154907, 1.2403733730316162, 1.3717114925384521, 1.503049612045288, 1.6343878507614136, 1.765726089477539, 1.897064208984375, 2.028402328491211, 2.159740447998047, 2.291078805923462, 2.422416925430298, 2.553755044937134, 2.685093402862549, 2.8164315223693848, 2.9477696418762207, 3.0791077613830566, 3.2104458808898926, 3.3417842388153076, 3.4731223583221436]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 13.0, 8.0, 10.0, 17.0, 16.0, 29.0, 34.0, 68.0, 140.0, 414.0, 4166860.0, 26001.0, 344.0, 153.0, 78.0, 35.0, 22.0, 12.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.23394775390625, -7.9835205078125, -7.73309326171875, -7.482666015625, -7.23223876953125, -6.9818115234375, -6.73138427734375, -6.48095703125, -6.23052978515625, -5.9801025390625, -5.72967529296875, -5.479248046875, -5.22882080078125, -4.9783935546875, -4.72796630859375, -4.4775390625, -4.22711181640625, -3.9766845703125, -3.72625732421875, -3.475830078125, -3.22540283203125, -2.9749755859375, -2.72454833984375, -2.47412109375, -2.22369384765625, -1.9732666015625, -1.72283935546875, -1.472412109375, -1.22198486328125, -0.9715576171875, -0.72113037109375, -0.470703125, -0.22027587890625, 0.0301513671875, 0.28057861328125, 0.531005859375, 0.78143310546875, 1.0318603515625, 1.28228759765625, 1.53271484375, 1.78314208984375, 2.0335693359375, 2.28399658203125, 2.534423828125, 2.78485107421875, 3.0352783203125, 3.28570556640625, 3.5361328125, 3.78656005859375, 4.0369873046875, 4.28741455078125, 4.537841796875, 4.78826904296875, 5.0386962890625, 5.28912353515625, 5.53955078125, 5.78997802734375, 6.0404052734375, 6.29083251953125, 6.541259765625, 6.79168701171875, 7.0421142578125, 7.29254150390625, 7.54296875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 10.0, 20.0, 16.0, 21.0, 39.0, 66.0, 77.0, 90.0, 108.0, 113.0, 88.0, 73.0, 67.0, 58.0, 46.0, 36.0, 17.0, 12.0, 8.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.45654296875, -0.4466590881347656, -0.43677520751953125, -0.4268913269042969, -0.4170074462890625, -0.4071235656738281, -0.39723968505859375, -0.3873558044433594, -0.377471923828125, -0.3675880432128906, -0.35770416259765625, -0.3478202819824219, -0.3379364013671875, -0.3280525207519531, -0.31816864013671875, -0.3082847595214844, -0.29840087890625, -0.2885169982910156, -0.27863311767578125, -0.2687492370605469, -0.2588653564453125, -0.24898147583007812, -0.23909759521484375, -0.22921371459960938, -0.219329833984375, -0.20944595336914062, -0.19956207275390625, -0.18967819213867188, -0.1797943115234375, -0.16991043090820312, -0.16002655029296875, -0.15014266967773438, -0.1402587890625, -0.13037490844726562, -0.12049102783203125, -0.11060714721679688, -0.1007232666015625, -0.09083938598632812, -0.08095550537109375, -0.07107162475585938, -0.061187744140625, -0.051303863525390625, -0.04141998291015625, -0.031536102294921875, -0.0216522216796875, -0.011768341064453125, -0.00188446044921875, 0.007999420166015625, 0.01788330078125, 0.027767181396484375, 0.03765106201171875, 0.047534942626953125, 0.0574188232421875, 0.06730270385742188, 0.07718658447265625, 0.08707046508789062, 0.096954345703125, 0.10683822631835938, 0.11672210693359375, 0.12660598754882812, 0.1364898681640625, 0.14637374877929688, 0.15625762939453125, 0.16614151000976562, 0.176025390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 13.0, 19.0, 27.0, 42.0, 62.0, 117.0, 182.0, 320.0, 583.0, 1057.0, 2172.0, 4560.0, 11104.0, 33615.0, 144002.0, 1693643.0, 2090298.0, 157754.0, 34820.0, 11418.0, 4292.0, 2041.0, 907.0, 484.0, 275.0, 154.0, 99.0, 51.0, 50.0, 23.0, 16.0, 21.0, 11.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.468017578125, -0.45571136474609375, -0.4434051513671875, -0.43109893798828125, -0.418792724609375, -0.40648651123046875, -0.3941802978515625, -0.38187408447265625, -0.36956787109375, -0.35726165771484375, -0.3449554443359375, -0.33264923095703125, -0.320343017578125, -0.30803680419921875, -0.2957305908203125, -0.28342437744140625, -0.2711181640625, -0.25881195068359375, -0.2465057373046875, -0.23419952392578125, -0.221893310546875, -0.20958709716796875, -0.1972808837890625, -0.18497467041015625, -0.17266845703125, -0.16036224365234375, -0.1480560302734375, -0.13574981689453125, -0.123443603515625, -0.11113739013671875, -0.0988311767578125, -0.08652496337890625, -0.07421875, -0.06191253662109375, -0.0496063232421875, -0.03730010986328125, -0.024993896484375, -0.01268768310546875, -0.0003814697265625, 0.01192474365234375, 0.02423095703125, 0.03653717041015625, 0.0488433837890625, 0.06114959716796875, 0.073455810546875, 0.08576202392578125, 0.0980682373046875, 0.11037445068359375, 0.1226806640625, 0.13498687744140625, 0.1472930908203125, 0.15959930419921875, 0.171905517578125, 0.18421173095703125, 0.1965179443359375, 0.20882415771484375, 0.22113037109375, 0.23343658447265625, 0.2457427978515625, 0.25804901123046875, 0.270355224609375, 0.28266143798828125, 0.2949676513671875, 0.30727386474609375, 0.319580078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 9.0, 17.0, 30.0, 23.0, 37.0, 58.0, 123.0, 218.0, 308.0, 668.0, 1123.0, 644.0, 361.0, 149.0, 105.0, 54.0, 46.0, 21.0, 15.0, 10.0, 4.0, 11.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.4444999694824219, -0.42830657958984375, -0.4121131896972656, -0.3959197998046875, -0.3797264099121094, -0.36353302001953125, -0.3473396301269531, -0.331146240234375, -0.3149528503417969, -0.29875946044921875, -0.2825660705566406, -0.2663726806640625, -0.2501792907714844, -0.23398590087890625, -0.21779251098632812, -0.20159912109375, -0.18540573120117188, -0.16921234130859375, -0.15301895141601562, -0.1368255615234375, -0.12063217163085938, -0.10443878173828125, -0.08824539184570312, -0.072052001953125, -0.055858612060546875, -0.03966522216796875, -0.023471832275390625, -0.0072784423828125, 0.008914947509765625, 0.02510833740234375, 0.041301727294921875, 0.0574951171875, 0.07368850708007812, 0.08988189697265625, 0.10607528686523438, 0.1222686767578125, 0.13846206665039062, 0.15465545654296875, 0.17084884643554688, 0.187042236328125, 0.20323562622070312, 0.21942901611328125, 0.23562240600585938, 0.2518157958984375, 0.2680091857910156, 0.28420257568359375, 0.3003959655761719, 0.31658935546875, 0.3327827453613281, 0.34897613525390625, 0.3651695251464844, 0.3813629150390625, 0.3975563049316406, 0.41374969482421875, 0.4299430847167969, 0.446136474609375, 0.4623298645019531, 0.47852325439453125, 0.4947166442871094, 0.5109100341796875, 0.5271034240722656, 0.5432968139648438, 0.5594902038574219, 0.57568359375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 4.0, 9.0, 8.0, 14.0, 63.0, 133.0, 269.0, 260.0, 153.0, 56.0, 11.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.224889755249023, -9.033588409423828, -8.842286109924316, -8.650983810424805, -8.45968246459961, -8.268381118774414, -8.077078819274902, -7.885776996612549, -7.694475173950195, -7.503173351287842, -7.311871528625488, -7.120569705963135, -6.929267883300781, -6.737966060638428, -6.546664237976074, -6.355362415313721, -6.164060592651367, -5.972758769989014, -5.78145694732666, -5.590155124664307, -5.398853302001953, -5.2075514793396, -5.016249656677246, -4.824947834014893, -4.633646011352539, -4.4423441886901855, -4.251042366027832, -4.0597405433654785, -3.868438720703125, -3.6771368980407715, -3.485835075378418, -3.2945332527160645, -3.10323166847229, -2.9119298458099365, -2.720628023147583, -2.5293262004852295, -2.338024377822876, -2.1467225551605225, -1.955420732498169, -1.7641189098358154, -1.572817087173462, -1.3815152645111084, -1.1902134418487549, -0.9989116191864014, -0.8076097965240479, -0.6163079738616943, -0.4250061511993408, -0.2337043285369873, -0.04240250587463379, 0.14889931678771973, 0.34020113945007324, 0.5315029621124268, 0.7228047847747803, 0.9141066074371338, 1.1054084300994873, 1.2967102527618408, 1.4880120754241943, 1.6793138980865479, 1.8706157207489014, 2.061917543411255, 2.2532193660736084, 2.444521188735962, 2.6358230113983154, 2.827124834060669, 3.0184266567230225]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 9.0, 13.0, 16.0, 14.0, 10.0, 27.0, 30.0, 27.0, 35.0, 42.0, 51.0, 48.0, 50.0, 57.0, 54.0, 51.0, 59.0, 54.0, 49.0, 42.0, 48.0, 32.0, 35.0, 28.0, 29.0, 20.0, 22.0, 13.0, 15.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1493704319000244, -2.072101593017578, -1.9948326349258423, -1.917563796043396, -1.8402948379516602, -1.7630259990692139, -1.6857571601867676, -1.6084883213043213, -1.5312193632125854, -1.4539505243301392, -1.3766815662384033, -1.299412727355957, -1.2221438884735107, -1.144874930381775, -1.0676060914993286, -0.9903371930122375, -0.9130682945251465, -0.8357993960380554, -0.7585304975509644, -0.6812616586685181, -0.603992760181427, -0.5267238616943359, -0.44945499300956726, -0.3721861243247986, -0.2949172258377075, -0.21764834225177765, -0.14037945866584778, -0.06311057507991791, 0.014158308506011963, 0.09142720699310303, 0.1686960756778717, 0.24596494436264038, 0.32323408126831055, 0.4005029797554016, 0.4777718484401703, 0.555040717124939, 0.63230961561203, 0.7095785140991211, 0.7868473529815674, 0.8641162514686584, 0.9413851499557495, 1.0186539888381958, 1.0959229469299316, 1.173191785812378, 1.2504606246948242, 1.32772958278656, 1.4049984216690063, 1.4822673797607422, 1.5595362186431885, 1.6368050575256348, 1.7140740156173706, 1.791342854499817, 1.8686118125915527, 1.945880651473999, 2.0231494903564453, 2.1004183292388916, 2.177687168121338, 2.254956007003784, 2.3322248458862305, 2.409493923187256, 2.486762762069702, 2.5640316009521484, 2.6413004398345947, 2.718569278717041, 2.7958383560180664]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 9.0, 9.0, 10.0, 17.0, 17.0, 41.0, 56.0, 86.0, 154.0, 226.0, 402.0, 742.0, 1244.0, 2476.0, 4875.0, 10753.0, 27938.0, 85719.0, 311572.0, 416518.0, 121543.0, 37714.0, 13917.0, 5928.0, 2880.0, 1535.0, 859.0, 494.0, 313.0, 185.0, 116.0, 65.0, 42.0, 36.0, 19.0, 17.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5107421875, -0.49620819091796875, -0.4816741943359375, -0.46714019775390625, -0.452606201171875, -0.43807220458984375, -0.4235382080078125, -0.40900421142578125, -0.39447021484375, -0.37993621826171875, -0.3654022216796875, -0.35086822509765625, -0.336334228515625, -0.32180023193359375, -0.3072662353515625, -0.29273223876953125, -0.2781982421875, -0.26366424560546875, -0.2491302490234375, -0.23459625244140625, -0.220062255859375, -0.20552825927734375, -0.1909942626953125, -0.17646026611328125, -0.16192626953125, -0.14739227294921875, -0.1328582763671875, -0.11832427978515625, -0.103790283203125, -0.08925628662109375, -0.0747222900390625, -0.06018829345703125, -0.045654296875, -0.03112030029296875, -0.0165863037109375, -0.00205230712890625, 0.012481689453125, 0.02701568603515625, 0.0415496826171875, 0.05608367919921875, 0.07061767578125, 0.08515167236328125, 0.0996856689453125, 0.11421966552734375, 0.128753662109375, 0.14328765869140625, 0.1578216552734375, 0.17235565185546875, 0.1868896484375, 0.20142364501953125, 0.2159576416015625, 0.23049163818359375, 0.245025634765625, 0.25955963134765625, 0.2740936279296875, 0.28862762451171875, 0.30316162109375, 0.31769561767578125, 0.3322296142578125, 0.34676361083984375, 0.361297607421875, 0.37583160400390625, 0.3903656005859375, 0.40489959716796875, 0.41943359375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 6.0, 5.0, 10.0, 15.0, 14.0, 15.0, 28.0, 40.0, 32.0, 41.0, 59.0, 37.0, 71.0, 73.0, 73.0, 79.0, 54.0, 54.0, 51.0, 44.0, 33.0, 30.0, 27.0, 22.0, 26.0, 10.0, 11.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24365234375, -0.2369537353515625, -0.230255126953125, -0.2235565185546875, -0.21685791015625, -0.2101593017578125, -0.203460693359375, -0.1967620849609375, -0.1900634765625, -0.1833648681640625, -0.176666259765625, -0.1699676513671875, -0.16326904296875, -0.1565704345703125, -0.149871826171875, -0.1431732177734375, -0.136474609375, -0.1297760009765625, -0.123077392578125, -0.1163787841796875, -0.10968017578125, -0.1029815673828125, -0.096282958984375, -0.0895843505859375, -0.0828857421875, -0.0761871337890625, -0.069488525390625, -0.0627899169921875, -0.05609130859375, -0.0493927001953125, -0.042694091796875, -0.0359954833984375, -0.029296875, -0.0225982666015625, -0.015899658203125, -0.0092010498046875, -0.00250244140625, 0.0041961669921875, 0.010894775390625, 0.0175933837890625, 0.0242919921875, 0.0309906005859375, 0.037689208984375, 0.0443878173828125, 0.05108642578125, 0.0577850341796875, 0.064483642578125, 0.0711822509765625, 0.077880859375, 0.0845794677734375, 0.091278076171875, 0.0979766845703125, 0.10467529296875, 0.1113739013671875, 0.118072509765625, 0.1247711181640625, 0.1314697265625, 0.1381683349609375, 0.144866943359375, 0.1515655517578125, 0.15826416015625, 0.1649627685546875, 0.171661376953125, 0.1783599853515625, 0.18505859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 9.0, 12.0, 19.0, 38.0, 54.0, 86.0, 119.0, 238.0, 501.0, 1154.0, 3395.0, 16267.0, 178315.0, 776068.0, 60576.0, 7893.0, 2134.0, 838.0, 387.0, 169.0, 107.0, 59.0, 36.0, 23.0, 13.0, 15.0, 5.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8017578125, -0.7700653076171875, -0.738372802734375, -0.7066802978515625, -0.67498779296875, -0.6432952880859375, -0.611602783203125, -0.5799102783203125, -0.5482177734375, -0.5165252685546875, -0.484832763671875, -0.4531402587890625, -0.42144775390625, -0.3897552490234375, -0.358062744140625, -0.3263702392578125, -0.294677734375, -0.2629852294921875, -0.231292724609375, -0.1996002197265625, -0.16790771484375, -0.1362152099609375, -0.104522705078125, -0.0728302001953125, -0.0411376953125, -0.0094451904296875, 0.022247314453125, 0.0539398193359375, 0.08563232421875, 0.1173248291015625, 0.149017333984375, 0.1807098388671875, 0.21240234375, 0.2440948486328125, 0.275787353515625, 0.3074798583984375, 0.33917236328125, 0.3708648681640625, 0.402557373046875, 0.4342498779296875, 0.4659423828125, 0.4976348876953125, 0.529327392578125, 0.5610198974609375, 0.59271240234375, 0.6244049072265625, 0.656097412109375, 0.6877899169921875, 0.719482421875, 0.7511749267578125, 0.782867431640625, 0.8145599365234375, 0.84625244140625, 0.8779449462890625, 0.909637451171875, 0.9413299560546875, 0.9730224609375, 1.0047149658203125, 1.036407470703125, 1.0680999755859375, 1.09979248046875, 1.1314849853515625, 1.163177490234375, 1.1948699951171875, 1.2265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 1.0, 4.0, 9.0, 5.0, 17.0, 19.0, 25.0, 28.0, 44.0, 46.0, 45.0, 53.0, 67.0, 67.0, 73.0, 60.0, 77.0, 50.0, 58.0, 46.0, 43.0, 43.0, 33.0, 29.0, 11.0, 13.0, 11.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7060546875, -0.672393798828125, -0.63873291015625, -0.605072021484375, -0.5714111328125, -0.537750244140625, -0.50408935546875, -0.470428466796875, -0.436767578125, -0.403106689453125, -0.36944580078125, -0.335784912109375, -0.3021240234375, -0.268463134765625, -0.23480224609375, -0.201141357421875, -0.16748046875, -0.133819580078125, -0.10015869140625, -0.066497802734375, -0.0328369140625, 0.000823974609375, 0.03448486328125, 0.068145751953125, 0.101806640625, 0.135467529296875, 0.16912841796875, 0.202789306640625, 0.2364501953125, 0.270111083984375, 0.30377197265625, 0.337432861328125, 0.37109375, 0.404754638671875, 0.43841552734375, 0.472076416015625, 0.5057373046875, 0.539398193359375, 0.57305908203125, 0.606719970703125, 0.640380859375, 0.674041748046875, 0.70770263671875, 0.741363525390625, 0.7750244140625, 0.808685302734375, 0.84234619140625, 0.876007080078125, 0.90966796875, 0.943328857421875, 0.97698974609375, 1.010650634765625, 1.0443115234375, 1.077972412109375, 1.11163330078125, 1.145294189453125, 1.178955078125, 1.212615966796875, 1.24627685546875, 1.279937744140625, 1.3135986328125, 1.347259521484375, 1.38092041015625, 1.414581298828125, 1.4482421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 9.0, 4.0, 8.0, 28.0, 20.0, 36.0, 69.0, 125.0, 218.0, 437.0, 1011.0, 3180.0, 20365.0, 833644.0, 177482.0, 8594.0, 1823.0, 724.0, 327.0, 167.0, 80.0, 70.0, 35.0, 22.0, 18.0, 16.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.8161392211914062, -0.7904815673828125, -0.7648239135742188, -0.739166259765625, -0.7135086059570312, -0.6878509521484375, -0.6621932983398438, -0.63653564453125, -0.6108779907226562, -0.5852203369140625, -0.5595626831054688, -0.533905029296875, -0.5082473754882812, -0.4825897216796875, -0.45693206787109375, -0.4312744140625, -0.40561676025390625, -0.3799591064453125, -0.35430145263671875, -0.328643798828125, -0.30298614501953125, -0.2773284912109375, -0.25167083740234375, -0.22601318359375, -0.20035552978515625, -0.1746978759765625, -0.14904022216796875, -0.123382568359375, -0.09772491455078125, -0.0720672607421875, -0.04640960693359375, -0.020751953125, 0.00490570068359375, 0.0305633544921875, 0.05622100830078125, 0.081878662109375, 0.10753631591796875, 0.1331939697265625, 0.15885162353515625, 0.18450927734375, 0.21016693115234375, 0.2358245849609375, 0.26148223876953125, 0.287139892578125, 0.31279754638671875, 0.3384552001953125, 0.36411285400390625, 0.3897705078125, 0.41542816162109375, 0.4410858154296875, 0.46674346923828125, 0.492401123046875, 0.5180587768554688, 0.5437164306640625, 0.5693740844726562, 0.59503173828125, 0.6206893920898438, 0.6463470458984375, 0.6720046997070312, 0.697662353515625, 0.7233200073242188, 0.7489776611328125, 0.7746353149414062, 0.80029296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 3.0, 11.0, 8.0, 18.0, 9.0, 23.0, 24.0, 28.0, 28.0, 37.0, 52.0, 81.0, 103.0, 119.0, 100.0, 88.0, 62.0, 43.0, 34.0, 24.0, 15.0, 16.0, 16.0, 7.0, 4.0, 4.0, 7.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013399124145507812, -0.0001301141455769539, -0.00012623704969882965, -0.00012235995382070541, -0.00011848285794258118, -0.00011460576206445694, -0.0001107286661863327, -0.00010685157030820847, -0.00010297447443008423, -9.909737855195999e-05, -9.522028267383575e-05, -9.134318679571152e-05, -8.746609091758728e-05, -8.358899503946304e-05, -7.97118991613388e-05, -7.583480328321457e-05, -7.195770740509033e-05, -6.80806115269661e-05, -6.420351564884186e-05, -6.032641977071762e-05, -5.6449323892593384e-05, -5.257222801446915e-05, -4.869513213634491e-05, -4.481803625822067e-05, -4.0940940380096436e-05, -3.70638445019722e-05, -3.318674862384796e-05, -2.9309652745723724e-05, -2.5432556867599487e-05, -2.155546098947525e-05, -1.7678365111351013e-05, -1.3801269233226776e-05, -9.924173355102539e-06, -6.047077476978302e-06, -2.169981598854065e-06, 1.7071142792701721e-06, 5.584210157394409e-06, 9.461306035518646e-06, 1.3338401913642883e-05, 1.721549779176712e-05, 2.1092593669891357e-05, 2.4969689548015594e-05, 2.884678542613983e-05, 3.272388130426407e-05, 3.6600977182388306e-05, 4.047807306051254e-05, 4.435516893863678e-05, 4.823226481676102e-05, 5.2109360694885254e-05, 5.598645657300949e-05, 5.986355245113373e-05, 6.374064832925797e-05, 6.76177442073822e-05, 7.149484008550644e-05, 7.537193596363068e-05, 7.924903184175491e-05, 8.312612771987915e-05, 8.700322359800339e-05, 9.088031947612762e-05, 9.475741535425186e-05, 9.86345112323761e-05, 0.00010251160711050034, 0.00010638870298862457, 0.00011026579886674881, 0.00011414289474487305]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 14.0, 17.0, 38.0, 41.0, 61.0, 85.0, 146.0, 285.0, 483.0, 1091.0, 3219.0, 14736.0, 229280.0, 762668.0, 28458.0, 4949.0, 1538.0, 613.0, 304.0, 190.0, 91.0, 63.0, 44.0, 40.0, 27.0, 9.0, 12.0, 10.0, 5.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6992568969726562, -0.6787872314453125, -0.6583175659179688, -0.637847900390625, -0.6173782348632812, -0.5969085693359375, -0.5764389038085938, -0.55596923828125, -0.5354995727539062, -0.5150299072265625, -0.49456024169921875, -0.474090576171875, -0.45362091064453125, -0.4331512451171875, -0.41268157958984375, -0.3922119140625, -0.37174224853515625, -0.3512725830078125, -0.33080291748046875, -0.310333251953125, -0.28986358642578125, -0.2693939208984375, -0.24892425537109375, -0.22845458984375, -0.20798492431640625, -0.1875152587890625, -0.16704559326171875, -0.146575927734375, -0.12610626220703125, -0.1056365966796875, -0.08516693115234375, -0.064697265625, -0.04422760009765625, -0.0237579345703125, -0.00328826904296875, 0.017181396484375, 0.03765106201171875, 0.0581207275390625, 0.07859039306640625, 0.09906005859375, 0.11952972412109375, 0.1399993896484375, 0.16046905517578125, 0.180938720703125, 0.20140838623046875, 0.2218780517578125, 0.24234771728515625, 0.2628173828125, 0.28328704833984375, 0.3037567138671875, 0.32422637939453125, 0.344696044921875, 0.36516571044921875, 0.3856353759765625, 0.40610504150390625, 0.42657470703125, 0.44704437255859375, 0.4675140380859375, 0.48798370361328125, 0.508453369140625, 0.5289230346679688, 0.5493927001953125, 0.5698623657226562, 0.59033203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 10.0, 11.0, 8.0, 11.0, 14.0, 18.0, 23.0, 38.0, 45.0, 80.0, 99.0, 125.0, 117.0, 123.0, 70.0, 41.0, 53.0, 21.0, 17.0, 19.0, 15.0, 4.0, 10.0, 7.0, 7.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5129890441894531, -0.49912261962890625, -0.4852561950683594, -0.4713897705078125, -0.4575233459472656, -0.44365692138671875, -0.4297904968261719, -0.415924072265625, -0.4020576477050781, -0.38819122314453125, -0.3743247985839844, -0.3604583740234375, -0.3465919494628906, -0.33272552490234375, -0.3188591003417969, -0.30499267578125, -0.2911262512207031, -0.27725982666015625, -0.2633934020996094, -0.2495269775390625, -0.23566055297851562, -0.22179412841796875, -0.20792770385742188, -0.194061279296875, -0.18019485473632812, -0.16632843017578125, -0.15246200561523438, -0.1385955810546875, -0.12472915649414062, -0.11086273193359375, -0.09699630737304688, -0.0831298828125, -0.06926345825195312, -0.05539703369140625, -0.041530609130859375, -0.0276641845703125, -0.013797760009765625, 6.866455078125e-05, 0.013935089111328125, 0.027801513671875, 0.041667938232421875, 0.05553436279296875, 0.06940078735351562, 0.0832672119140625, 0.09713363647460938, 0.11100006103515625, 0.12486648559570312, 0.13873291015625, 0.15259933471679688, 0.16646575927734375, 0.18033218383789062, 0.1941986083984375, 0.20806503295898438, 0.22193145751953125, 0.23579788208007812, 0.249664306640625, 0.2635307312011719, 0.27739715576171875, 0.2912635803222656, 0.3051300048828125, 0.3189964294433594, 0.33286285400390625, 0.3467292785644531, 0.360595703125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 8.0, 29.0, 66.0, 159.0, 274.0, 243.0, 125.0, 37.0, 23.0, 10.0, 8.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.0038423538208, -11.729766845703125, -11.45569133758545, -11.181615829467773, -10.907540321350098, -10.633464813232422, -10.359389305114746, -10.08531379699707, -9.811239242553711, -9.537163734436035, -9.26308822631836, -8.989012718200684, -8.714937210083008, -8.440861701965332, -8.166786193847656, -7.892711162567139, -7.618635177612305, -7.344559669494629, -7.070484161376953, -6.796408653259277, -6.522333145141602, -6.248257637023926, -5.974182605743408, -5.700107097625732, -5.426031589508057, -5.151956081390381, -4.877880573272705, -4.603805065155029, -4.329730033874512, -4.055654525756836, -3.78157901763916, -3.5075035095214844, -3.2334280014038086, -2.959352493286133, -2.685276985168457, -2.4112017154693604, -2.1371262073516846, -1.8630506992340088, -1.5889753103256226, -1.3148999214172363, -1.0408244132995605, -0.7667489647865295, -0.49267351627349854, -0.21859806776046753, 0.05547738075256348, 0.32955288887023926, 0.6036282777786255, 0.8777036666870117, 1.1517791748046875, 1.4258546829223633, 1.6999300718307495, 1.9740054607391357, 2.2480809688568115, 2.5221564769744873, 2.796231746673584, 3.0703072547912598, 3.3443827629089355, 3.6184582710266113, 3.892533779144287, 4.166609287261963, 4.4406843185424805, 4.714759826660156, 4.988835334777832, 5.262910842895508, 5.536986351013184]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 11.0, 7.0, 5.0, 9.0, 11.0, 11.0, 9.0, 22.0, 27.0, 23.0, 33.0, 38.0, 33.0, 32.0, 34.0, 57.0, 62.0, 57.0, 67.0, 61.0, 60.0, 50.0, 32.0, 37.0, 42.0, 19.0, 33.0, 20.0, 24.0, 13.0, 17.0, 11.0, 8.0, 10.0, 9.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.661123752593994, -3.5503969192504883, -3.4396703243255615, -3.3289434909820557, -3.21821665763855, -3.107490062713623, -2.996763229370117, -2.8860363960266113, -2.7753095626831055, -2.6645827293395996, -2.553856134414673, -2.443129301071167, -2.332402467727661, -2.2216758728027344, -2.1109490394592285, -2.0002222061157227, -1.8894954919815063, -1.77876877784729, -1.6680419445037842, -1.5573152303695679, -1.446588397026062, -1.3358616828918457, -1.2251348495483398, -1.1144081354141235, -1.0036814212799072, -0.8929546475410461, -0.7822278738021851, -0.6715011596679688, -0.5607743263244629, -0.4500476121902466, -0.3393208384513855, -0.22859406471252441, -0.11786723136901855, -0.007140465080738068, 0.10358630120754242, 0.2143130600452423, 0.3250398337841034, 0.4357665777206421, 0.5464933514595032, 0.6572201251983643, 0.7679468989372253, 0.8786736726760864, 0.9894004464149475, 1.1001272201538086, 1.210853934288025, 1.3215806484222412, 1.432307481765747, 1.543034315109253, 1.6537610292434692, 1.7644877433776855, 1.8752145767211914, 1.9859412908554077, 2.096668004989624, 2.20739483833313, 2.3181216716766357, 2.4288482666015625, 2.5395750999450684, 2.650301933288574, 2.761028528213501, 2.871755361557007, 2.9824821949005127, 3.0932087898254395, 3.2039356231689453, 3.314662456512451, 3.425389289855957]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 20.0, 17.0, 21.0, 28.0, 49.0, 74.0, 174.0, 620.0, 3348.0, 36471.0, 3619891.0, 518704.0, 12440.0, 1680.0, 383.0, 148.0, 71.0, 36.0, 32.0, 19.0, 14.0, 7.0, 7.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.904296875, -0.8775482177734375, -0.850799560546875, -0.8240509033203125, -0.79730224609375, -0.7705535888671875, -0.743804931640625, -0.7170562744140625, -0.6903076171875, -0.6635589599609375, -0.636810302734375, -0.6100616455078125, -0.58331298828125, -0.5565643310546875, -0.529815673828125, -0.5030670166015625, -0.476318359375, -0.4495697021484375, -0.422821044921875, -0.3960723876953125, -0.36932373046875, -0.3425750732421875, -0.315826416015625, -0.2890777587890625, -0.2623291015625, -0.2355804443359375, -0.208831787109375, -0.1820831298828125, -0.15533447265625, -0.1285858154296875, -0.101837158203125, -0.0750885009765625, -0.04833984375, -0.0215911865234375, 0.005157470703125, 0.0319061279296875, 0.05865478515625, 0.0854034423828125, 0.112152099609375, 0.1389007568359375, 0.1656494140625, 0.1923980712890625, 0.219146728515625, 0.2458953857421875, 0.27264404296875, 0.2993927001953125, 0.326141357421875, 0.3528900146484375, 0.379638671875, 0.4063873291015625, 0.433135986328125, 0.4598846435546875, 0.48663330078125, 0.5133819580078125, 0.540130615234375, 0.5668792724609375, 0.5936279296875, 0.6203765869140625, 0.647125244140625, 0.6738739013671875, 0.70062255859375, 0.7273712158203125, 0.754119873046875, 0.7808685302734375, 0.8076171875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 10.0, 5.0, 9.0, 8.0, 11.0, 14.0, 37.0, 46.0, 29.0, 49.0, 63.0, 59.0, 55.0, 75.0, 72.0, 65.0, 57.0, 55.0, 49.0, 44.0, 33.0, 29.0, 35.0, 16.0, 16.0, 12.0, 11.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201904296875, -0.1954517364501953, -0.18899917602539062, -0.18254661560058594, -0.17609405517578125, -0.16964149475097656, -0.16318893432617188, -0.1567363739013672, -0.1502838134765625, -0.1438312530517578, -0.13737869262695312, -0.13092613220214844, -0.12447357177734375, -0.11802101135253906, -0.11156845092773438, -0.10511589050292969, -0.098663330078125, -0.09221076965332031, -0.08575820922851562, -0.07930564880371094, -0.07285308837890625, -0.06640052795410156, -0.059947967529296875, -0.05349540710449219, -0.0470428466796875, -0.04059028625488281, -0.034137725830078125, -0.027685165405273438, -0.02123260498046875, -0.014780044555664062, -0.008327484130859375, -0.0018749237060546875, 0.00457763671875, 0.011030197143554688, 0.017482757568359375, 0.023935317993164062, 0.03038787841796875, 0.03684043884277344, 0.043292999267578125, 0.04974555969238281, 0.0561981201171875, 0.06265068054199219, 0.06910324096679688, 0.07555580139160156, 0.08200836181640625, 0.08846092224121094, 0.09491348266601562, 0.10136604309082031, 0.107818603515625, 0.11427116394042969, 0.12072372436523438, 0.12717628479003906, 0.13362884521484375, 0.14008140563964844, 0.14653396606445312, 0.1529865264892578, 0.1594390869140625, 0.1658916473388672, 0.17234420776367188, 0.17879676818847656, 0.18524932861328125, 0.19170188903808594, 0.19815444946289062, 0.2046070098876953, 0.2110595703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 1.0, 7.0, 5.0, 14.0, 9.0, 15.0, 20.0, 32.0, 51.0, 83.0, 136.0, 223.0, 380.0, 773.0, 1910.0, 5772.0, 21823.0, 136969.0, 2683311.0, 1242836.0, 79484.0, 14073.0, 3795.0, 1338.0, 534.0, 260.0, 160.0, 74.0, 63.0, 41.0, 15.0, 19.0, 16.0, 11.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43017578125, -0.415283203125, -0.400390625, -0.385498046875, -0.37060546875, -0.355712890625, -0.3408203125, -0.325927734375, -0.31103515625, -0.296142578125, -0.28125, -0.266357421875, -0.25146484375, -0.236572265625, -0.2216796875, -0.206787109375, -0.19189453125, -0.177001953125, -0.162109375, -0.147216796875, -0.13232421875, -0.117431640625, -0.1025390625, -0.087646484375, -0.07275390625, -0.057861328125, -0.04296875, -0.028076171875, -0.01318359375, 0.001708984375, 0.0166015625, 0.031494140625, 0.04638671875, 0.061279296875, 0.076171875, 0.091064453125, 0.10595703125, 0.120849609375, 0.1357421875, 0.150634765625, 0.16552734375, 0.180419921875, 0.1953125, 0.210205078125, 0.22509765625, 0.239990234375, 0.2548828125, 0.269775390625, 0.28466796875, 0.299560546875, 0.314453125, 0.329345703125, 0.34423828125, 0.359130859375, 0.3740234375, 0.388916015625, 0.40380859375, 0.418701171875, 0.43359375, 0.448486328125, 0.46337890625, 0.478271484375, 0.4931640625, 0.508056640625, 0.52294921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 12.0, 21.0, 28.0, 22.0, 30.0, 40.0, 47.0, 82.0, 165.0, 196.0, 260.0, 455.0, 641.0, 654.0, 489.0, 280.0, 177.0, 118.0, 98.0, 63.0, 36.0, 31.0, 30.0, 12.0, 12.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419921875, -0.4068260192871094, -0.39373016357421875, -0.3806343078613281, -0.3675384521484375, -0.3544425964355469, -0.34134674072265625, -0.3282508850097656, -0.315155029296875, -0.3020591735839844, -0.28896331787109375, -0.2758674621582031, -0.2627716064453125, -0.24967575073242188, -0.23657989501953125, -0.22348403930664062, -0.21038818359375, -0.19729232788085938, -0.18419647216796875, -0.17110061645507812, -0.1580047607421875, -0.14490890502929688, -0.13181304931640625, -0.11871719360351562, -0.105621337890625, -0.09252548217773438, -0.07942962646484375, -0.06633377075195312, -0.0532379150390625, -0.040142059326171875, -0.02704620361328125, -0.013950347900390625, -0.0008544921875, 0.012241363525390625, 0.02533721923828125, 0.038433074951171875, 0.0515289306640625, 0.06462478637695312, 0.07772064208984375, 0.09081649780273438, 0.103912353515625, 0.11700820922851562, 0.13010406494140625, 0.14319992065429688, 0.1562957763671875, 0.16939163208007812, 0.18248748779296875, 0.19558334350585938, 0.20867919921875, 0.22177505493164062, 0.23487091064453125, 0.24796676635742188, 0.2610626220703125, 0.2741584777832031, 0.28725433349609375, 0.3003501892089844, 0.313446044921875, 0.3265419006347656, 0.33963775634765625, 0.3527336120605469, 0.3658294677734375, 0.3789253234863281, 0.39202117919921875, 0.4051170349121094, 0.418212890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 12.0, 34.0, 150.0, 413.0, 301.0, 63.0, 14.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.2432918548584, -16.897762298583984, -16.55223274230957, -16.206703186035156, -15.861173629760742, -15.515644073486328, -15.170114517211914, -14.8245849609375, -14.479055404663086, -14.133525848388672, -13.787996292114258, -13.442466735839844, -13.09693717956543, -12.751407623291016, -12.405878067016602, -12.060348510742188, -11.714818954467773, -11.36928939819336, -11.023759841918945, -10.678230285644531, -10.332700729370117, -9.987171173095703, -9.641641616821289, -9.296112060546875, -8.950581550598145, -8.60505199432373, -8.259522438049316, -7.913992881774902, -7.568463325500488, -7.222933769226074, -6.87740421295166, -6.531874656677246, -6.186345100402832, -5.840815544128418, -5.495285987854004, -5.14975643157959, -4.804226875305176, -4.458697319030762, -4.113167762756348, -3.7676379680633545, -3.4221084117889404, -3.0765788555145264, -2.7310492992401123, -2.385519504547119, -2.039989948272705, -1.6944605112075806, -1.348930835723877, -1.003401279449463, -0.6578717231750488, -0.3123421370983124, 0.03318744897842407, 0.3787170648574829, 0.724246621131897, 1.069776177406311, 1.4153058528900146, 1.7608354091644287, 2.1063649654388428, 2.451894521713257, 2.797424077987671, 3.142953872680664, 3.488483428955078, 3.834012985229492, 4.179542541503906, 4.52507209777832, 4.870601654052734]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 5.0, 2.0, 4.0, 7.0, 7.0, 10.0, 10.0, 20.0, 21.0, 33.0, 22.0, 30.0, 24.0, 32.0, 43.0, 40.0, 27.0, 37.0, 44.0, 45.0, 52.0, 33.0, 52.0, 51.0, 44.0, 43.0, 33.0, 26.0, 33.0, 21.0, 21.0, 17.0, 17.0, 26.0, 9.0, 12.0, 8.0, 5.0, 7.0, 9.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.052689790725708, -1.9804867506027222, -1.9082838296890259, -1.83608078956604, -1.7638778686523438, -1.691674828529358, -1.619471788406372, -1.5472688674926758, -1.47506582736969, -1.402862787246704, -1.3306598663330078, -1.258456826210022, -1.1862537860870361, -1.1140508651733398, -1.041847825050354, -0.9696448445320129, -0.8974418640136719, -0.8252388834953308, -0.7530359029769897, -0.6808328628540039, -0.6086298823356628, -0.5364269018173218, -0.4642238914966583, -0.3920208811759949, -0.3198179006576538, -0.24761490523815155, -0.1754119098186493, -0.10320891439914703, -0.031005918979644775, 0.04119706153869629, 0.11340007185935974, 0.1856030821800232, 0.25780582427978516, 0.3300088047981262, 0.4022118151187897, 0.4744148254394531, 0.5466178059577942, 0.6188207864761353, 0.6910238265991211, 0.7632268071174622, 0.8354297876358032, 0.9076327681541443, 0.9798357486724854, 1.0520387887954712, 1.124241828918457, 1.1964447498321533, 1.2686477899551392, 1.340850830078125, 1.4130537509918213, 1.4852567911148071, 1.5574597120285034, 1.6296627521514893, 1.7018656730651855, 1.7740687131881714, 1.8462717533111572, 1.9184746742248535, 1.9906777143478394, 2.062880754470825, 2.1350836753845215, 2.2072865962982178, 2.279489755630493, 2.3516926765441895, 2.4238955974578857, 2.496098756790161, 2.5683016777038574]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 4.0, 8.0, 6.0, 23.0, 23.0, 32.0, 49.0, 61.0, 106.0, 166.0, 299.0, 516.0, 882.0, 1697.0, 3578.0, 8014.0, 19844.0, 52870.0, 151186.0, 385726.0, 271309.0, 94513.0, 33467.0, 12974.0, 5640.0, 2578.0, 1279.0, 648.0, 393.0, 225.0, 132.0, 88.0, 77.0, 44.0, 30.0, 22.0, 8.0, 12.0, 5.0, 3.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.35137939453125, -0.3382568359375, -0.32513427734375, -0.31201171875, -0.29888916015625, -0.2857666015625, -0.27264404296875, -0.259521484375, -0.24639892578125, -0.2332763671875, -0.22015380859375, -0.20703125, -0.19390869140625, -0.1807861328125, -0.16766357421875, -0.154541015625, -0.14141845703125, -0.1282958984375, -0.11517333984375, -0.10205078125, -0.08892822265625, -0.0758056640625, -0.06268310546875, -0.049560546875, -0.03643798828125, -0.0233154296875, -0.01019287109375, 0.0029296875, 0.01605224609375, 0.0291748046875, 0.04229736328125, 0.055419921875, 0.06854248046875, 0.0816650390625, 0.09478759765625, 0.10791015625, 0.12103271484375, 0.1341552734375, 0.14727783203125, 0.160400390625, 0.17352294921875, 0.1866455078125, 0.19976806640625, 0.212890625, 0.22601318359375, 0.2391357421875, 0.25225830078125, 0.265380859375, 0.27850341796875, 0.2916259765625, 0.30474853515625, 0.31787109375, 0.33099365234375, 0.3441162109375, 0.35723876953125, 0.370361328125, 0.38348388671875, 0.3966064453125, 0.40972900390625, 0.4228515625, 0.43597412109375, 0.4490966796875, 0.46221923828125, 0.475341796875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 2.0, 5.0, 3.0, 8.0, 10.0, 13.0, 10.0, 17.0, 31.0, 35.0, 32.0, 53.0, 53.0, 58.0, 69.0, 77.0, 61.0, 55.0, 42.0, 53.0, 56.0, 43.0, 39.0, 35.0, 30.0, 16.0, 26.0, 19.0, 7.0, 10.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.193603515625, -0.187255859375, -0.180908203125, -0.174560546875, -0.168212890625, -0.161865234375, -0.155517578125, -0.149169921875, -0.142822265625, -0.136474609375, -0.130126953125, -0.123779296875, -0.117431640625, -0.111083984375, -0.104736328125, -0.098388671875, -0.092041015625, -0.085693359375, -0.079345703125, -0.072998046875, -0.066650390625, -0.060302734375, -0.053955078125, -0.047607421875, -0.041259765625, -0.034912109375, -0.028564453125, -0.022216796875, -0.015869140625, -0.009521484375, -0.003173828125, 0.003173828125, 0.009521484375, 0.015869140625, 0.022216796875, 0.028564453125, 0.034912109375, 0.041259765625, 0.047607421875, 0.053955078125, 0.060302734375, 0.066650390625, 0.072998046875, 0.079345703125, 0.085693359375, 0.092041015625, 0.098388671875, 0.104736328125, 0.111083984375, 0.117431640625, 0.123779296875, 0.130126953125, 0.136474609375, 0.142822265625, 0.149169921875, 0.155517578125, 0.161865234375, 0.168212890625, 0.174560546875, 0.180908203125, 0.187255859375, 0.193603515625, 0.199951171875, 0.206298828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 18.0, 33.0, 44.0, 69.0, 144.0, 264.0, 531.0, 1187.0, 3430.0, 17867.0, 485431.0, 515788.0, 17827.0, 3453.0, 1271.0, 523.0, 277.0, 159.0, 94.0, 45.0, 29.0, 24.0, 12.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2138671875, -1.1720123291015625, -1.130157470703125, -1.0883026123046875, -1.04644775390625, -1.0045928955078125, -0.962738037109375, -0.9208831787109375, -0.8790283203125, -0.8371734619140625, -0.795318603515625, -0.7534637451171875, -0.71160888671875, -0.6697540283203125, -0.627899169921875, -0.5860443115234375, -0.544189453125, -0.5023345947265625, -0.460479736328125, -0.4186248779296875, -0.37677001953125, -0.3349151611328125, -0.293060302734375, -0.2512054443359375, -0.2093505859375, -0.1674957275390625, -0.125640869140625, -0.0837860107421875, -0.04193115234375, -7.62939453125e-05, 0.041778564453125, 0.0836334228515625, 0.12548828125, 0.1673431396484375, 0.209197998046875, 0.2510528564453125, 0.29290771484375, 0.3347625732421875, 0.376617431640625, 0.4184722900390625, 0.4603271484375, 0.5021820068359375, 0.544036865234375, 0.5858917236328125, 0.62774658203125, 0.6696014404296875, 0.711456298828125, 0.7533111572265625, 0.795166015625, 0.8370208740234375, 0.878875732421875, 0.9207305908203125, 0.96258544921875, 1.0044403076171875, 1.046295166015625, 1.0881500244140625, 1.1300048828125, 1.1718597412109375, 1.213714599609375, 1.2555694580078125, 1.29742431640625, 1.3392791748046875, 1.381134033203125, 1.4229888916015625, 1.46484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 13.0, 10.0, 15.0, 17.0, 21.0, 44.0, 52.0, 61.0, 54.0, 49.0, 52.0, 76.0, 75.0, 67.0, 79.0, 73.0, 50.0, 38.0, 30.0, 21.0, 24.0, 22.0, 11.0, 5.0, 6.0, 9.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.5966796875, -1.5577545166015625, -1.518829345703125, -1.4799041748046875, -1.44097900390625, -1.4020538330078125, -1.363128662109375, -1.3242034912109375, -1.2852783203125, -1.2463531494140625, -1.207427978515625, -1.1685028076171875, -1.12957763671875, -1.0906524658203125, -1.051727294921875, -1.0128021240234375, -0.973876953125, -0.9349517822265625, -0.896026611328125, -0.8571014404296875, -0.81817626953125, -0.7792510986328125, -0.740325927734375, -0.7014007568359375, -0.6624755859375, -0.6235504150390625, -0.584625244140625, -0.5457000732421875, -0.50677490234375, -0.4678497314453125, -0.428924560546875, -0.3899993896484375, -0.35107421875, -0.3121490478515625, -0.273223876953125, -0.2342987060546875, -0.19537353515625, -0.1564483642578125, -0.117523193359375, -0.0785980224609375, -0.0396728515625, -0.0007476806640625, 0.038177490234375, 0.0771026611328125, 0.11602783203125, 0.1549530029296875, 0.193878173828125, 0.2328033447265625, 0.271728515625, 0.3106536865234375, 0.349578857421875, 0.3885040283203125, 0.42742919921875, 0.4663543701171875, 0.505279541015625, 0.5442047119140625, 0.5831298828125, 0.6220550537109375, 0.660980224609375, 0.6999053955078125, 0.73883056640625, 0.7777557373046875, 0.816680908203125, 0.8556060791015625, 0.89453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 9.0, 4.0, 12.0, 19.0, 14.0, 32.0, 32.0, 65.0, 134.0, 225.0, 467.0, 1055.0, 3202.0, 15121.0, 174019.0, 800635.0, 43811.0, 6448.0, 1758.0, 695.0, 315.0, 190.0, 103.0, 63.0, 34.0, 29.0, 18.0, 11.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.609375, -0.591583251953125, -0.57379150390625, -0.555999755859375, -0.5382080078125, -0.520416259765625, -0.50262451171875, -0.484832763671875, -0.467041015625, -0.449249267578125, -0.43145751953125, -0.413665771484375, -0.3958740234375, -0.378082275390625, -0.36029052734375, -0.342498779296875, -0.32470703125, -0.306915283203125, -0.28912353515625, -0.271331787109375, -0.2535400390625, -0.235748291015625, -0.21795654296875, -0.200164794921875, -0.182373046875, -0.164581298828125, -0.14678955078125, -0.128997802734375, -0.1112060546875, -0.093414306640625, -0.07562255859375, -0.057830810546875, -0.0400390625, -0.022247314453125, -0.00445556640625, 0.013336181640625, 0.0311279296875, 0.048919677734375, 0.06671142578125, 0.084503173828125, 0.102294921875, 0.120086669921875, 0.13787841796875, 0.155670166015625, 0.1734619140625, 0.191253662109375, 0.20904541015625, 0.226837158203125, 0.24462890625, 0.262420654296875, 0.28021240234375, 0.298004150390625, 0.3157958984375, 0.333587646484375, 0.35137939453125, 0.369171142578125, 0.386962890625, 0.404754638671875, 0.42254638671875, 0.440338134765625, 0.4581298828125, 0.475921630859375, 0.49371337890625, 0.511505126953125, 0.529296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 5.0, 9.0, 5.0, 12.0, 8.0, 16.0, 15.0, 19.0, 21.0, 35.0, 30.0, 47.0, 44.0, 59.0, 71.0, 75.0, 77.0, 62.0, 70.0, 62.0, 56.0, 33.0, 29.0, 30.0, 23.0, 14.0, 16.0, 14.0, 15.0, 4.0, 9.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0001323223114013672, -0.0001287553459405899, -0.00012518838047981262, -0.00012162141501903534, -0.00011805444955825806, -0.00011448748409748077, -0.00011092051863670349, -0.00010735355317592621, -0.00010378658771514893, -0.00010021962225437164, -9.665265679359436e-05, -9.308569133281708e-05, -8.95187258720398e-05, -8.595176041126251e-05, -8.238479495048523e-05, -7.881782948970795e-05, -7.525086402893066e-05, -7.168389856815338e-05, -6.81169331073761e-05, -6.454996764659882e-05, -6.098300218582153e-05, -5.741603672504425e-05, -5.384907126426697e-05, -5.0282105803489685e-05, -4.67151403427124e-05, -4.314817488193512e-05, -3.958120942115784e-05, -3.6014243960380554e-05, -3.244727849960327e-05, -2.888031303882599e-05, -2.5313347578048706e-05, -2.1746382117271423e-05, -1.817941665649414e-05, -1.4612451195716858e-05, -1.1045485734939575e-05, -7.4785202741622925e-06, -3.91155481338501e-06, -3.4458935260772705e-07, 3.2223761081695557e-06, 6.789341568946838e-06, 1.0356307029724121e-05, 1.3923272490501404e-05, 1.7490237951278687e-05, 2.105720341205597e-05, 2.4624168872833252e-05, 2.8191134333610535e-05, 3.175809979438782e-05, 3.53250652551651e-05, 3.889203071594238e-05, 4.2458996176719666e-05, 4.602596163749695e-05, 4.959292709827423e-05, 5.3159892559051514e-05, 5.6726858019828796e-05, 6.029382348060608e-05, 6.386078894138336e-05, 6.742775440216064e-05, 7.099471986293793e-05, 7.456168532371521e-05, 7.812865078449249e-05, 8.169561624526978e-05, 8.526258170604706e-05, 8.882954716682434e-05, 9.239651262760162e-05, 9.59634780883789e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 0.0, 8.0, 8.0, 9.0, 10.0, 15.0, 32.0, 54.0, 83.0, 173.0, 257.0, 686.0, 2007.0, 8895.0, 135885.0, 870459.0, 24248.0, 3801.0, 1047.0, 425.0, 187.0, 97.0, 52.0, 38.0, 25.0, 19.0, 10.0, 9.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.87939453125, -0.8551254272460938, -0.8308563232421875, -0.8065872192382812, -0.782318115234375, -0.7580490112304688, -0.7337799072265625, -0.7095108032226562, -0.68524169921875, -0.6609725952148438, -0.6367034912109375, -0.6124343872070312, -0.588165283203125, -0.5638961791992188, -0.5396270751953125, -0.5153579711914062, -0.4910888671875, -0.46681976318359375, -0.4425506591796875, -0.41828155517578125, -0.394012451171875, -0.36974334716796875, -0.3454742431640625, -0.32120513916015625, -0.29693603515625, -0.27266693115234375, -0.2483978271484375, -0.22412872314453125, -0.199859619140625, -0.17559051513671875, -0.1513214111328125, -0.12705230712890625, -0.102783203125, -0.07851409912109375, -0.0542449951171875, -0.02997589111328125, -0.005706787109375, 0.01856231689453125, 0.0428314208984375, 0.06710052490234375, 0.09136962890625, 0.11563873291015625, 0.1399078369140625, 0.16417694091796875, 0.188446044921875, 0.21271514892578125, 0.2369842529296875, 0.26125335693359375, 0.2855224609375, 0.30979156494140625, 0.3340606689453125, 0.35832977294921875, 0.382598876953125, 0.40686798095703125, 0.4311370849609375, 0.45540618896484375, 0.47967529296875, 0.5039443969726562, 0.5282135009765625, 0.5524826049804688, 0.576751708984375, 0.6010208129882812, 0.6252899169921875, 0.6495590209960938, 0.673828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 13.0, 15.0, 22.0, 30.0, 34.0, 47.0, 61.0, 83.0, 108.0, 99.0, 105.0, 98.0, 78.0, 62.0, 37.0, 21.0, 13.0, 13.0, 9.0, 11.0, 8.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.54296875, -0.5287208557128906, -0.5144729614257812, -0.5002250671386719, -0.4859771728515625, -0.4717292785644531, -0.45748138427734375, -0.4432334899902344, -0.428985595703125, -0.4147377014160156, -0.40048980712890625, -0.3862419128417969, -0.3719940185546875, -0.3577461242675781, -0.34349822998046875, -0.3292503356933594, -0.31500244140625, -0.3007545471191406, -0.28650665283203125, -0.2722587585449219, -0.2580108642578125, -0.24376296997070312, -0.22951507568359375, -0.21526718139648438, -0.201019287109375, -0.18677139282226562, -0.17252349853515625, -0.15827560424804688, -0.1440277099609375, -0.12977981567382812, -0.11553192138671875, -0.10128402709960938, -0.0870361328125, -0.07278823852539062, -0.05854034423828125, -0.044292449951171875, -0.0300445556640625, -0.015796661376953125, -0.00154876708984375, 0.012699127197265625, 0.026947021484375, 0.041194915771484375, 0.05544281005859375, 0.06969070434570312, 0.0839385986328125, 0.09818649291992188, 0.11243438720703125, 0.12668228149414062, 0.14093017578125, 0.15517807006835938, 0.16942596435546875, 0.18367385864257812, 0.1979217529296875, 0.21216964721679688, 0.22641754150390625, 0.24066543579101562, 0.254913330078125, 0.2691612243652344, 0.28340911865234375, 0.2976570129394531, 0.3119049072265625, 0.3261528015136719, 0.34040069580078125, 0.3546485900878906, 0.368896484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 15.0, 31.0, 72.0, 110.0, 196.0, 250.0, 134.0, 75.0, 35.0, 25.0, 15.0, 9.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.048914909362793, -5.83397102355957, -5.619027137756348, -5.404083251953125, -5.189139366149902, -4.97419548034668, -4.759251594543457, -4.544307708740234, -4.329363822937012, -4.114419937133789, -3.8994760513305664, -3.6845321655273438, -3.469588279724121, -3.2546443939208984, -3.0397002696990967, -2.824756383895874, -2.6098122596740723, -2.3948683738708496, -2.179924488067627, -1.9649804830551147, -1.750036597251892, -1.5350927114486694, -1.3201487064361572, -1.1052048206329346, -0.8902609348297119, -0.6753170490264893, -0.4603731036186218, -0.2454291582107544, -0.03048527240753174, 0.18445861339569092, 0.3994026184082031, 0.6143465042114258, 0.8292899131774902, 1.044233798980713, 1.2591776847839355, 1.4741216897964478, 1.6890655755996704, 1.904009461402893, 2.1189534664154053, 2.333897352218628, 2.5488412380218506, 2.7637851238250732, 2.978729009628296, 3.1936731338500977, 3.4086170196533203, 3.623560905456543, 3.8385047912597656, 4.053448677062988, 4.268392562866211, 4.483336448669434, 4.698280334472656, 4.913224220275879, 5.128168106079102, 5.343111991882324, 5.558055877685547, 5.7729997634887695, 5.987943649291992, 6.202887535095215, 6.4178314208984375, 6.63277530670166, 6.847719192504883, 7.0626630783081055, 7.277606964111328, 7.492550849914551, 7.707495212554932]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 3.0, 4.0, 13.0, 5.0, 9.0, 21.0, 15.0, 19.0, 25.0, 25.0, 23.0, 34.0, 39.0, 40.0, 37.0, 42.0, 40.0, 57.0, 65.0, 56.0, 37.0, 54.0, 37.0, 29.0, 40.0, 39.0, 32.0, 20.0, 14.0, 20.0, 13.0, 15.0, 16.0, 15.0, 9.0, 9.0, 10.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.35766339302063, -3.2456111907958984, -3.133558988571167, -3.0215067863464355, -2.909454822540283, -2.7974026203155518, -2.6853504180908203, -2.573298215866089, -2.4612460136413574, -2.349193811416626, -2.2371416091918945, -2.125089645385742, -2.0130374431610107, -1.9009852409362793, -1.7889330387115479, -1.6768808364868164, -1.564828872680664, -1.4527766704559326, -1.3407245874404907, -1.2286723852157593, -1.1166203022003174, -1.004568099975586, -0.8925158977508545, -0.7804637551307678, -0.6684116125106812, -0.5563594698905945, -0.4443072974681854, -0.33225512504577637, -0.2202029824256897, -0.10815083980560303, 0.003901362419128418, 0.11595350503921509, 0.22800588607788086, 0.34005802869796753, 0.4521102011203766, 0.5641623735427856, 0.6762145161628723, 0.788266658782959, 0.9003188610076904, 1.0123710632324219, 1.1244231462478638, 1.2364753484725952, 1.348527431488037, 1.4605796337127686, 1.5726318359375, 1.684683918952942, 1.7967361211776733, 1.9087882041931152, 2.0208404064178467, 2.132892608642578, 2.2449448108673096, 2.356997013092041, 2.4690489768981934, 2.581101179122925, 2.6931533813476562, 2.8052055835723877, 2.917257785797119, 3.0293099880218506, 3.141362190246582, 3.2534141540527344, 3.365466356277466, 3.4775185585021973, 3.5895707607269287, 3.70162296295166, 3.8136749267578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 13.0, 13.0, 15.0, 29.0, 49.0, 79.0, 157.0, 317.0, 726.0, 1666.0, 4762.0, 17324.0, 111431.0, 2894953.0, 1092376.0, 54001.0, 10574.0, 3231.0, 1248.0, 573.0, 282.0, 196.0, 91.0, 47.0, 37.0, 14.0, 23.0, 14.0, 16.0, 3.0, 5.0, 1.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33251953125, -0.3191375732421875, -0.305755615234375, -0.2923736572265625, -0.27899169921875, -0.2656097412109375, -0.252227783203125, -0.2388458251953125, -0.2254638671875, -0.2120819091796875, -0.198699951171875, -0.1853179931640625, -0.17193603515625, -0.1585540771484375, -0.145172119140625, -0.1317901611328125, -0.118408203125, -0.1050262451171875, -0.091644287109375, -0.0782623291015625, -0.06488037109375, -0.0514984130859375, -0.038116455078125, -0.0247344970703125, -0.0113525390625, 0.0020294189453125, 0.015411376953125, 0.0287933349609375, 0.04217529296875, 0.0555572509765625, 0.068939208984375, 0.0823211669921875, 0.095703125, 0.1090850830078125, 0.122467041015625, 0.1358489990234375, 0.14923095703125, 0.1626129150390625, 0.175994873046875, 0.1893768310546875, 0.2027587890625, 0.2161407470703125, 0.229522705078125, 0.2429046630859375, 0.25628662109375, 0.2696685791015625, 0.283050537109375, 0.2964324951171875, 0.309814453125, 0.3231964111328125, 0.336578369140625, 0.3499603271484375, 0.36334228515625, 0.3767242431640625, 0.390106201171875, 0.4034881591796875, 0.4168701171875, 0.4302520751953125, 0.443634033203125, 0.4570159912109375, 0.47039794921875, 0.4837799072265625, 0.497161865234375, 0.5105438232421875, 0.52392578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 4.0, 4.0, 14.0, 13.0, 12.0, 16.0, 30.0, 30.0, 36.0, 49.0, 53.0, 53.0, 70.0, 62.0, 65.0, 55.0, 74.0, 65.0, 56.0, 37.0, 47.0, 31.0, 27.0, 25.0, 15.0, 15.0, 13.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.186279296875, -0.17932510375976562, -0.17237091064453125, -0.16541671752929688, -0.1584625244140625, -0.15150833129882812, -0.14455413818359375, -0.13759994506835938, -0.130645751953125, -0.12369155883789062, -0.11673736572265625, -0.10978317260742188, -0.1028289794921875, -0.09587478637695312, -0.08892059326171875, -0.08196640014648438, -0.07501220703125, -0.06805801391601562, -0.06110382080078125, -0.054149627685546875, -0.0471954345703125, -0.040241241455078125, -0.03328704833984375, -0.026332855224609375, -0.019378662109375, -0.012424468994140625, -0.00547027587890625, 0.001483917236328125, 0.0084381103515625, 0.015392303466796875, 0.02234649658203125, 0.029300689697265625, 0.0362548828125, 0.043209075927734375, 0.05016326904296875, 0.057117462158203125, 0.0640716552734375, 0.07102584838867188, 0.07798004150390625, 0.08493423461914062, 0.091888427734375, 0.09884262084960938, 0.10579681396484375, 0.11275100708007812, 0.1197052001953125, 0.12665939331054688, 0.13361358642578125, 0.14056777954101562, 0.14752197265625, 0.15447616577148438, 0.16143035888671875, 0.16838455200195312, 0.1753387451171875, 0.18229293823242188, 0.18924713134765625, 0.19620132446289062, 0.203155517578125, 0.21010971069335938, 0.21706390380859375, 0.22401809692382812, 0.2309722900390625, 0.23792648315429688, 0.24488067626953125, 0.2518348693847656, 0.2587890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 7.0, 15.0, 14.0, 34.0, 37.0, 64.0, 104.0, 144.0, 256.0, 497.0, 1019.0, 2422.0, 7580.0, 34120.0, 324734.0, 3518839.0, 265292.0, 29104.0, 6101.0, 1956.0, 816.0, 461.0, 241.0, 125.0, 110.0, 53.0, 32.0, 22.0, 16.0, 9.0, 10.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4140625, -0.39898681640625, -0.3839111328125, -0.36883544921875, -0.353759765625, -0.33868408203125, -0.3236083984375, -0.30853271484375, -0.29345703125, -0.27838134765625, -0.2633056640625, -0.24822998046875, -0.233154296875, -0.21807861328125, -0.2030029296875, -0.18792724609375, -0.1728515625, -0.15777587890625, -0.1427001953125, -0.12762451171875, -0.112548828125, -0.09747314453125, -0.0823974609375, -0.06732177734375, -0.05224609375, -0.03717041015625, -0.0220947265625, -0.00701904296875, 0.008056640625, 0.02313232421875, 0.0382080078125, 0.05328369140625, 0.068359375, 0.08343505859375, 0.0985107421875, 0.11358642578125, 0.128662109375, 0.14373779296875, 0.1588134765625, 0.17388916015625, 0.18896484375, 0.20404052734375, 0.2191162109375, 0.23419189453125, 0.249267578125, 0.26434326171875, 0.2794189453125, 0.29449462890625, 0.3095703125, 0.32464599609375, 0.3397216796875, 0.35479736328125, 0.369873046875, 0.38494873046875, 0.4000244140625, 0.41510009765625, 0.43017578125, 0.44525146484375, 0.4603271484375, 0.47540283203125, 0.490478515625, 0.50555419921875, 0.5206298828125, 0.53570556640625, 0.55078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 2.0, 6.0, 8.0, 14.0, 23.0, 38.0, 47.0, 76.0, 115.0, 215.0, 392.0, 913.0, 1033.0, 534.0, 272.0, 140.0, 71.0, 58.0, 34.0, 28.0, 20.0, 8.0, 10.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6413803100585938, -0.6226043701171875, -0.6038284301757812, -0.585052490234375, -0.5662765502929688, -0.5475006103515625, -0.5287246704101562, -0.50994873046875, -0.49117279052734375, -0.4723968505859375, -0.45362091064453125, -0.434844970703125, -0.41606903076171875, -0.3972930908203125, -0.37851715087890625, -0.3597412109375, -0.34096527099609375, -0.3221893310546875, -0.30341339111328125, -0.284637451171875, -0.26586151123046875, -0.2470855712890625, -0.22830963134765625, -0.20953369140625, -0.19075775146484375, -0.1719818115234375, -0.15320587158203125, -0.134429931640625, -0.11565399169921875, -0.0968780517578125, -0.07810211181640625, -0.059326171875, -0.04055023193359375, -0.0217742919921875, -0.00299835205078125, 0.015777587890625, 0.03455352783203125, 0.0533294677734375, 0.07210540771484375, 0.09088134765625, 0.10965728759765625, 0.1284332275390625, 0.14720916748046875, 0.165985107421875, 0.18476104736328125, 0.2035369873046875, 0.22231292724609375, 0.2410888671875, 0.25986480712890625, 0.2786407470703125, 0.29741668701171875, 0.316192626953125, 0.33496856689453125, 0.3537445068359375, 0.37252044677734375, 0.39129638671875, 0.41007232666015625, 0.4288482666015625, 0.44762420654296875, 0.466400146484375, 0.48517608642578125, 0.5039520263671875, 0.5227279663085938, 0.54150390625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 6.0, 26.0, 64.0, 161.0, 313.0, 258.0, 102.0, 31.0, 11.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21705961227417, -5.012783527374268, -4.808507919311523, -4.604231834411621, -4.399955749511719, -4.195680141448975, -3.9914040565490723, -3.787128210067749, -3.582852363586426, -3.3785765171051025, -3.1743004322052, -2.970024585723877, -2.7657487392425537, -2.5614728927612305, -2.357196807861328, -2.152920961380005, -1.9486448764801025, -1.7443689107894897, -1.5400930643081665, -1.3358170986175537, -1.1315412521362305, -0.9272652864456177, -0.7229893207550049, -0.5187134742736816, -0.31443750858306885, -0.11016158759593964, 0.09411433339118958, 0.29839026927948, 0.502666175365448, 0.706942081451416, 0.9112180471420288, 1.115493893623352, 1.3197698593139648, 1.5240458250045776, 1.7283216714859009, 1.9325976371765137, 2.136873483657837, 2.34114933013916, 2.5454254150390625, 2.7497012615203857, 2.953977108001709, 3.1582529544830322, 3.3625290393829346, 3.566804885864258, 3.771080732345581, 3.9753565788269043, 4.179632663726807, 4.383908271789551, 4.588184356689453, 4.7924604415893555, 4.9967360496521, 5.201012134552002, 5.405288219451904, 5.609563827514648, 5.813839912414551, 6.018115997314453, 6.2223920822143555, 6.426668167114258, 6.630943775177002, 6.835219860076904, 7.039495944976807, 7.243771553039551, 7.448047637939453, 7.6523237228393555, 7.8565993309021]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 8.0, 3.0, 8.0, 11.0, 10.0, 10.0, 15.0, 19.0, 17.0, 16.0, 25.0, 26.0, 34.0, 30.0, 37.0, 33.0, 45.0, 54.0, 42.0, 59.0, 49.0, 44.0, 38.0, 45.0, 43.0, 36.0, 39.0, 28.0, 32.0, 24.0, 25.0, 19.0, 16.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.229215621948242, -2.1623589992523193, -2.0955023765563965, -2.0286459922790527, -1.9617893695831299, -1.894932746887207, -1.8280762434005737, -1.7612197399139404, -1.6943631172180176, -1.6275064945220947, -1.5606499910354614, -1.4937934875488281, -1.4269368648529053, -1.3600802421569824, -1.2932237386703491, -1.2263672351837158, -1.159510612487793, -1.0926539897918701, -1.0257974863052368, -0.9589409232139587, -0.8920843601226807, -0.8252277970314026, -0.7583712339401245, -0.6915146708488464, -0.6246581077575684, -0.5578015446662903, -0.4909449815750122, -0.42408841848373413, -0.35723185539245605, -0.290375292301178, -0.2235187292098999, -0.15666216611862183, -0.08980584144592285, -0.022949278354644775, 0.0439072847366333, 0.11076384782791138, 0.17762041091918945, 0.24447697401046753, 0.3113335371017456, 0.3781901001930237, 0.44504666328430176, 0.5119032263755798, 0.5787597894668579, 0.645616352558136, 0.7124729156494141, 0.7793294787406921, 0.8461860418319702, 0.9130426049232483, 0.9798991680145264, 1.0467557907104492, 1.1136122941970825, 1.1804687976837158, 1.2473254203796387, 1.3141820430755615, 1.3810385465621948, 1.4478950500488281, 1.514751672744751, 1.5816082954406738, 1.6484647989273071, 1.7153213024139404, 1.7821779251098633, 1.8490345478057861, 1.9158910512924194, 1.9827475547790527, 2.0496041774749756]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 9.0, 20.0, 28.0, 47.0, 84.0, 131.0, 237.0, 472.0, 970.0, 2544.0, 6826.0, 23086.0, 99484.0, 492421.0, 334327.0, 63401.0, 15831.0, 5059.0, 1867.0, 799.0, 400.0, 208.0, 96.0, 66.0, 45.0, 21.0, 16.0, 13.0, 13.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5735626220703125, -0.554351806640625, -0.5351409912109375, -0.51593017578125, -0.4967193603515625, -0.477508544921875, -0.4582977294921875, -0.4390869140625, -0.4198760986328125, -0.400665283203125, -0.3814544677734375, -0.36224365234375, -0.3430328369140625, -0.323822021484375, -0.3046112060546875, -0.285400390625, -0.2661895751953125, -0.246978759765625, -0.2277679443359375, -0.20855712890625, -0.1893463134765625, -0.170135498046875, -0.1509246826171875, -0.1317138671875, -0.1125030517578125, -0.093292236328125, -0.0740814208984375, -0.05487060546875, -0.0356597900390625, -0.016448974609375, 0.0027618408203125, 0.02197265625, 0.0411834716796875, 0.060394287109375, 0.0796051025390625, 0.09881591796875, 0.1180267333984375, 0.137237548828125, 0.1564483642578125, 0.1756591796875, 0.1948699951171875, 0.214080810546875, 0.2332916259765625, 0.25250244140625, 0.2717132568359375, 0.290924072265625, 0.3101348876953125, 0.329345703125, 0.3485565185546875, 0.367767333984375, 0.3869781494140625, 0.40618896484375, 0.4253997802734375, 0.444610595703125, 0.4638214111328125, 0.4830322265625, 0.5022430419921875, 0.521453857421875, 0.5406646728515625, 0.55987548828125, 0.5790863037109375, 0.598297119140625, 0.6175079345703125, 0.63671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 3.0, 5.0, 4.0, 9.0, 18.0, 15.0, 22.0, 35.0, 36.0, 37.0, 51.0, 55.0, 62.0, 48.0, 62.0, 60.0, 75.0, 56.0, 68.0, 54.0, 44.0, 34.0, 33.0, 26.0, 17.0, 17.0, 15.0, 13.0, 7.0, 4.0, 7.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1907958984375, -0.18406295776367188, -0.17733001708984375, -0.17059707641601562, -0.1638641357421875, -0.15713119506835938, -0.15039825439453125, -0.14366531372070312, -0.136932373046875, -0.13019943237304688, -0.12346649169921875, -0.11673355102539062, -0.1100006103515625, -0.10326766967773438, -0.09653472900390625, -0.08980178833007812, -0.08306884765625, -0.07633590698242188, -0.06960296630859375, -0.06287002563476562, -0.0561370849609375, -0.049404144287109375, -0.04267120361328125, -0.035938262939453125, -0.029205322265625, -0.022472381591796875, -0.01573944091796875, -0.009006500244140625, -0.0022735595703125, 0.004459381103515625, 0.01119232177734375, 0.017925262451171875, 0.024658203125, 0.031391143798828125, 0.03812408447265625, 0.044857025146484375, 0.0515899658203125, 0.058322906494140625, 0.06505584716796875, 0.07178878784179688, 0.078521728515625, 0.08525466918945312, 0.09198760986328125, 0.09872055053710938, 0.1054534912109375, 0.11218643188476562, 0.11891937255859375, 0.12565231323242188, 0.13238525390625, 0.13911819458007812, 0.14585113525390625, 0.15258407592773438, 0.1593170166015625, 0.16604995727539062, 0.17278289794921875, 0.17951583862304688, 0.186248779296875, 0.19298171997070312, 0.19971466064453125, 0.20644760131835938, 0.2131805419921875, 0.21991348266601562, 0.22664642333984375, 0.23337936401367188, 0.2401123046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 15.0, 4.0, 26.0, 26.0, 55.0, 87.0, 138.0, 270.0, 604.0, 1554.0, 6946.0, 88050.0, 904599.0, 39638.0, 4354.0, 1174.0, 490.0, 189.0, 121.0, 68.0, 50.0, 22.0, 24.0, 11.0, 10.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.5316162109375, -1.487060546875, -1.4425048828125, -1.39794921875, -1.3533935546875, -1.308837890625, -1.2642822265625, -1.2197265625, -1.1751708984375, -1.130615234375, -1.0860595703125, -1.04150390625, -0.9969482421875, -0.952392578125, -0.9078369140625, -0.86328125, -0.8187255859375, -0.774169921875, -0.7296142578125, -0.68505859375, -0.6405029296875, -0.595947265625, -0.5513916015625, -0.5068359375, -0.4622802734375, -0.417724609375, -0.3731689453125, -0.32861328125, -0.2840576171875, -0.239501953125, -0.1949462890625, -0.150390625, -0.1058349609375, -0.061279296875, -0.0167236328125, 0.02783203125, 0.0723876953125, 0.116943359375, 0.1614990234375, 0.2060546875, 0.2506103515625, 0.295166015625, 0.3397216796875, 0.38427734375, 0.4288330078125, 0.473388671875, 0.5179443359375, 0.5625, 0.6070556640625, 0.651611328125, 0.6961669921875, 0.74072265625, 0.7852783203125, 0.829833984375, 0.8743896484375, 0.9189453125, 0.9635009765625, 1.008056640625, 1.0526123046875, 1.09716796875, 1.1417236328125, 1.186279296875, 1.2308349609375, 1.275390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 5.0, 4.0, 4.0, 9.0, 11.0, 6.0, 11.0, 15.0, 17.0, 28.0, 31.0, 44.0, 44.0, 45.0, 54.0, 73.0, 74.0, 61.0, 79.0, 43.0, 63.0, 48.0, 40.0, 40.0, 33.0, 28.0, 12.0, 20.0, 6.0, 10.0, 12.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0185546875, -0.9913482666015625, -0.964141845703125, -0.9369354248046875, -0.90972900390625, -0.8825225830078125, -0.855316162109375, -0.8281097412109375, -0.8009033203125, -0.7736968994140625, -0.746490478515625, -0.7192840576171875, -0.69207763671875, -0.6648712158203125, -0.637664794921875, -0.6104583740234375, -0.583251953125, -0.5560455322265625, -0.528839111328125, -0.5016326904296875, -0.47442626953125, -0.4472198486328125, -0.420013427734375, -0.3928070068359375, -0.3656005859375, -0.3383941650390625, -0.311187744140625, -0.2839813232421875, -0.25677490234375, -0.2295684814453125, -0.202362060546875, -0.1751556396484375, -0.14794921875, -0.1207427978515625, -0.093536376953125, -0.0663299560546875, -0.03912353515625, -0.0119171142578125, 0.015289306640625, 0.0424957275390625, 0.0697021484375, 0.0969085693359375, 0.124114990234375, 0.1513214111328125, 0.17852783203125, 0.2057342529296875, 0.232940673828125, 0.2601470947265625, 0.287353515625, 0.3145599365234375, 0.341766357421875, 0.3689727783203125, 0.39617919921875, 0.4233856201171875, 0.450592041015625, 0.4777984619140625, 0.5050048828125, 0.5322113037109375, 0.559417724609375, 0.5866241455078125, 0.61383056640625, 0.6410369873046875, 0.668243408203125, 0.6954498291015625, 0.72265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 5.0, 8.0, 15.0, 19.0, 35.0, 47.0, 81.0, 157.0, 377.0, 1017.0, 4009.0, 40631.0, 920899.0, 73268.0, 5811.0, 1293.0, 453.0, 174.0, 98.0, 57.0, 33.0, 24.0, 11.0, 3.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66064453125, -0.6397323608398438, -0.6188201904296875, -0.5979080200195312, -0.576995849609375, -0.5560836791992188, -0.5351715087890625, -0.5142593383789062, -0.49334716796875, -0.47243499755859375, -0.4515228271484375, -0.43061065673828125, -0.409698486328125, -0.38878631591796875, -0.3678741455078125, -0.34696197509765625, -0.3260498046875, -0.30513763427734375, -0.2842254638671875, -0.26331329345703125, -0.242401123046875, -0.22148895263671875, -0.2005767822265625, -0.17966461181640625, -0.15875244140625, -0.13784027099609375, -0.1169281005859375, -0.09601593017578125, -0.075103759765625, -0.05419158935546875, -0.0332794189453125, -0.01236724853515625, 0.008544921875, 0.02945709228515625, 0.0503692626953125, 0.07128143310546875, 0.092193603515625, 0.11310577392578125, 0.1340179443359375, 0.15493011474609375, 0.17584228515625, 0.19675445556640625, 0.2176666259765625, 0.23857879638671875, 0.259490966796875, 0.28040313720703125, 0.3013153076171875, 0.32222747802734375, 0.3431396484375, 0.36405181884765625, 0.3849639892578125, 0.40587615966796875, 0.426788330078125, 0.44770050048828125, 0.4686126708984375, 0.48952484130859375, 0.51043701171875, 0.5313491821289062, 0.5522613525390625, 0.5731735229492188, 0.594085693359375, 0.6149978637695312, 0.6359100341796875, 0.6568222045898438, 0.677734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 6.0, 9.0, 6.0, 13.0, 16.0, 17.0, 23.0, 37.0, 39.0, 53.0, 70.0, 117.0, 144.0, 142.0, 76.0, 54.0, 36.0, 29.0, 20.0, 16.0, 17.0, 12.0, 11.0, 6.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.910894393920898e-05, -8.535105735063553e-05, -8.159317076206207e-05, -7.783528417348862e-05, -7.407739758491516e-05, -7.03195109963417e-05, -6.656162440776825e-05, -6.28037378191948e-05, -5.904585123062134e-05, -5.528796464204788e-05, -5.1530078053474426e-05, -4.777219146490097e-05, -4.4014304876327515e-05, -4.025641828775406e-05, -3.64985316991806e-05, -3.274064511060715e-05, -2.898275852203369e-05, -2.5224871933460236e-05, -2.146698534488678e-05, -1.7709098756313324e-05, -1.3951212167739868e-05, -1.0193325579166412e-05, -6.4354389905929565e-06, -2.6775524020195007e-06, 1.080334186553955e-06, 4.838220775127411e-06, 8.596107363700867e-06, 1.2353993952274323e-05, 1.611188054084778e-05, 1.9869767129421234e-05, 2.362765371799469e-05, 2.7385540306568146e-05, 3.11434268951416e-05, 3.490131348371506e-05, 3.865920007228851e-05, 4.241708666086197e-05, 4.6174973249435425e-05, 4.993285983800888e-05, 5.3690746426582336e-05, 5.744863301515579e-05, 6.120651960372925e-05, 6.49644061923027e-05, 6.872229278087616e-05, 7.248017936944962e-05, 7.623806595802307e-05, 7.999595254659653e-05, 8.375383913516998e-05, 8.751172572374344e-05, 9.12696123123169e-05, 9.502749890089035e-05, 9.87853854894638e-05, 0.00010254327207803726, 0.00010630115866661072, 0.00011005904525518417, 0.00011381693184375763, 0.00011757481843233109, 0.00012133270502090454, 0.000125090591609478, 0.00012884847819805145, 0.0001326063647866249, 0.00013636425137519836, 0.00014012213796377182, 0.00014388002455234528, 0.00014763791114091873, 0.0001513957977294922]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 7.0, 18.0, 25.0, 41.0, 67.0, 106.0, 229.0, 407.0, 978.0, 3479.0, 19025.0, 522602.0, 477111.0, 19075.0, 3493.0, 964.0, 431.0, 221.0, 107.0, 51.0, 36.0, 20.0, 14.0, 8.0, 9.0, 6.0, 8.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64404296875, -0.625640869140625, -0.60723876953125, -0.588836669921875, -0.5704345703125, -0.552032470703125, -0.53363037109375, -0.515228271484375, -0.496826171875, -0.478424072265625, -0.46002197265625, -0.441619873046875, -0.4232177734375, -0.404815673828125, -0.38641357421875, -0.368011474609375, -0.349609375, -0.331207275390625, -0.31280517578125, -0.294403076171875, -0.2760009765625, -0.257598876953125, -0.23919677734375, -0.220794677734375, -0.202392578125, -0.183990478515625, -0.16558837890625, -0.147186279296875, -0.1287841796875, -0.110382080078125, -0.09197998046875, -0.073577880859375, -0.05517578125, -0.036773681640625, -0.01837158203125, 3.0517578125e-05, 0.0184326171875, 0.036834716796875, 0.05523681640625, 0.073638916015625, 0.092041015625, 0.110443115234375, 0.12884521484375, 0.147247314453125, 0.1656494140625, 0.184051513671875, 0.20245361328125, 0.220855712890625, 0.2392578125, 0.257659912109375, 0.27606201171875, 0.294464111328125, 0.3128662109375, 0.331268310546875, 0.34967041015625, 0.368072509765625, 0.386474609375, 0.404876708984375, 0.42327880859375, 0.441680908203125, 0.4600830078125, 0.478485107421875, 0.49688720703125, 0.515289306640625, 0.53369140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 6.0, 10.0, 8.0, 14.0, 13.0, 9.0, 21.0, 30.0, 39.0, 54.0, 81.0, 106.0, 136.0, 121.0, 92.0, 77.0, 46.0, 23.0, 23.0, 22.0, 13.0, 10.0, 9.0, 5.0, 6.0, 3.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.3099098205566406, -0.29779815673828125, -0.2856864929199219, -0.2735748291015625, -0.2614631652832031, -0.24935150146484375, -0.23723983764648438, -0.225128173828125, -0.21301651000976562, -0.20090484619140625, -0.18879318237304688, -0.1766815185546875, -0.16456985473632812, -0.15245819091796875, -0.14034652709960938, -0.12823486328125, -0.11612319946289062, -0.10401153564453125, -0.09189987182617188, -0.0797882080078125, -0.06767654418945312, -0.05556488037109375, -0.043453216552734375, -0.031341552734375, -0.019229888916015625, -0.00711822509765625, 0.004993438720703125, 0.0171051025390625, 0.029216766357421875, 0.04132843017578125, 0.053440093994140625, 0.0655517578125, 0.07766342163085938, 0.08977508544921875, 0.10188674926757812, 0.1139984130859375, 0.12611007690429688, 0.13822174072265625, 0.15033340454101562, 0.162445068359375, 0.17455673217773438, 0.18666839599609375, 0.19878005981445312, 0.2108917236328125, 0.22300338745117188, 0.23511505126953125, 0.24722671508789062, 0.25933837890625, 0.2714500427246094, 0.28356170654296875, 0.2956733703613281, 0.3077850341796875, 0.3198966979980469, 0.33200836181640625, 0.3441200256347656, 0.356231689453125, 0.3683433532714844, 0.38045501708984375, 0.3925666809082031, 0.4046783447265625, 0.4167900085449219, 0.42890167236328125, 0.4410133361816406, 0.453125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 8.0, 17.0, 43.0, 66.0, 119.0, 197.0, 251.0, 156.0, 70.0, 28.0, 15.0, 9.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.248492240905762, -7.053330421447754, -6.858168125152588, -6.66300630569458, -6.467844009399414, -6.272682189941406, -6.077520370483398, -5.882358551025391, -5.687196254730225, -5.492034435272217, -5.296872138977051, -5.101710319519043, -4.906548500061035, -4.711386203765869, -4.516224384307861, -4.321062088012695, -4.1259002685546875, -3.9307382106781006, -3.7355761528015137, -3.540414333343506, -3.345252275466919, -3.150090217590332, -2.954928398132324, -2.7597663402557373, -2.5646042823791504, -2.3694422245025635, -2.1742801666259766, -1.9791183471679688, -1.7839562892913818, -1.588794231414795, -1.3936322927474976, -1.1984703540802002, -1.0033082962036133, -0.8081462979316711, -0.612984299659729, -0.41782230138778687, -0.22266030311584473, -0.027498304843902588, 0.16766369342803955, 0.3628256320953369, 0.5579876899719238, 0.753149688243866, 0.9483116865158081, 1.1434736251831055, 1.3386356830596924, 1.5337977409362793, 1.7289596796035767, 1.924121618270874, 2.119283676147461, 2.314445734024048, 2.5096077919006348, 2.7047696113586426, 2.8999316692352295, 3.0950937271118164, 3.290255546569824, 3.485417604446411, 3.680579662322998, 3.875741720199585, 4.070903778076172, 4.26606559753418, 4.4612274169921875, 4.6563897132873535, 4.851551532745361, 5.046713829040527, 5.241875648498535]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 13.0, 6.0, 13.0, 10.0, 10.0, 20.0, 35.0, 32.0, 36.0, 43.0, 41.0, 69.0, 80.0, 66.0, 61.0, 72.0, 60.0, 46.0, 46.0, 28.0, 39.0, 34.0, 28.0, 22.0, 18.0, 17.0, 12.0, 5.0, 12.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5050852298736572, -3.396188735961914, -3.287292242050171, -3.1783957481384277, -3.0694992542266846, -2.9606027603149414, -2.8517065048217773, -2.742809772491455, -2.633913516998291, -2.525017023086548, -2.4161205291748047, -2.3072240352630615, -2.1983275413513184, -2.089431047439575, -1.9805346727371216, -1.8716381788253784, -1.7627415657043457, -1.6538450717926025, -1.5449485778808594, -1.4360520839691162, -1.327155590057373, -1.2182590961456299, -1.1093627214431763, -1.000466227531433, -0.8915697336196899, -0.7826732397079468, -0.6737767457962036, -0.5648803114891052, -0.45598381757736206, -0.3470873236656189, -0.2381908893585205, -0.12929439544677734, -0.020397663116455078, 0.08849881589412689, 0.19739529490470886, 0.30629175901412964, 0.4151882529258728, 0.524084746837616, 0.6329811811447144, 0.7418776750564575, 0.8507741689682007, 0.9596706628799438, 1.068567156791687, 1.1774635314941406, 1.2863600254058838, 1.395256519317627, 1.5041530132293701, 1.6130495071411133, 1.7219460010528564, 1.8308424949645996, 1.9397389888763428, 2.048635482788086, 2.157531976699829, 2.2664284706115723, 2.3753247261047363, 2.4842214584350586, 2.5931177139282227, 2.702014207839966, 2.810910701751709, 2.919807195663452, 3.0287036895751953, 3.1376001834869385, 3.2464966773986816, 3.3553929328918457, 3.464289665222168]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 10.0, 17.0, 14.0, 23.0, 48.0, 71.0, 117.0, 250.0, 512.0, 1323.0, 3936.0, 17400.0, 344443.0, 3757122.0, 56495.0, 8276.0, 2429.0, 902.0, 398.0, 168.0, 107.0, 66.0, 41.0, 20.0, 28.0, 12.0, 11.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552734375, -0.5338516235351562, -0.5149688720703125, -0.49608612060546875, -0.477203369140625, -0.45832061767578125, -0.4394378662109375, -0.42055511474609375, -0.40167236328125, -0.38278961181640625, -0.3639068603515625, -0.34502410888671875, -0.326141357421875, -0.30725860595703125, -0.2883758544921875, -0.26949310302734375, -0.2506103515625, -0.23172760009765625, -0.2128448486328125, -0.19396209716796875, -0.175079345703125, -0.15619659423828125, -0.1373138427734375, -0.11843109130859375, -0.09954833984375, -0.08066558837890625, -0.0617828369140625, -0.04290008544921875, -0.024017333984375, -0.00513458251953125, 0.0137481689453125, 0.03263092041015625, 0.051513671875, 0.07039642333984375, 0.0892791748046875, 0.10816192626953125, 0.127044677734375, 0.14592742919921875, 0.1648101806640625, 0.18369293212890625, 0.20257568359375, 0.22145843505859375, 0.2403411865234375, 0.25922393798828125, 0.278106689453125, 0.29698944091796875, 0.3158721923828125, 0.33475494384765625, 0.3536376953125, 0.37252044677734375, 0.3914031982421875, 0.41028594970703125, 0.429168701171875, 0.44805145263671875, 0.4669342041015625, 0.48581695556640625, 0.50469970703125, 0.5235824584960938, 0.5424652099609375, 0.5613479614257812, 0.580230712890625, 0.5991134643554688, 0.6179962158203125, 0.6368789672851562, 0.65576171875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 13.0, 23.0, 31.0, 52.0, 63.0, 73.0, 97.0, 96.0, 89.0, 112.0, 103.0, 66.0, 55.0, 46.0, 41.0, 12.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396484375, -0.3861656188964844, -0.37584686279296875, -0.3655281066894531, -0.3552093505859375, -0.3448905944824219, -0.33457183837890625, -0.3242530822753906, -0.313934326171875, -0.3036155700683594, -0.29329681396484375, -0.2829780578613281, -0.2726593017578125, -0.2623405456542969, -0.25202178955078125, -0.24170303344726562, -0.23138427734375, -0.22106552124023438, -0.21074676513671875, -0.20042800903320312, -0.1901092529296875, -0.17979049682617188, -0.16947174072265625, -0.15915298461914062, -0.148834228515625, -0.13851547241210938, -0.12819671630859375, -0.11787796020507812, -0.1075592041015625, -0.09724044799804688, -0.08692169189453125, -0.07660293579101562, -0.0662841796875, -0.055965423583984375, -0.04564666748046875, -0.035327911376953125, -0.0250091552734375, -0.014690399169921875, -0.00437164306640625, 0.005947113037109375, 0.016265869140625, 0.026584625244140625, 0.03690338134765625, 0.047222137451171875, 0.0575408935546875, 0.06785964965820312, 0.07817840576171875, 0.08849716186523438, 0.09881591796875, 0.10913467407226562, 0.11945343017578125, 0.12977218627929688, 0.1400909423828125, 0.15040969848632812, 0.16072845458984375, 0.17104721069335938, 0.181365966796875, 0.19168472290039062, 0.20200347900390625, 0.21232223510742188, 0.2226409912109375, 0.23295974731445312, 0.24327850341796875, 0.2535972595214844, 0.263916015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 11.0, 4.0, 8.0, 18.0, 24.0, 17.0, 36.0, 30.0, 58.0, 80.0, 114.0, 196.0, 264.0, 448.0, 799.0, 1565.0, 3700.0, 11946.0, 62166.0, 1745370.0, 2281030.0, 66937.0, 12028.0, 3646.0, 1708.0, 822.0, 423.0, 268.0, 164.0, 128.0, 87.0, 45.0, 42.0, 27.0, 9.0, 22.0, 12.0, 5.0, 8.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.5068359375, -0.4919395446777344, -0.47704315185546875, -0.4621467590332031, -0.4472503662109375, -0.4323539733886719, -0.41745758056640625, -0.4025611877441406, -0.387664794921875, -0.3727684020996094, -0.35787200927734375, -0.3429756164550781, -0.3280792236328125, -0.3131828308105469, -0.29828643798828125, -0.2833900451660156, -0.26849365234375, -0.2535972595214844, -0.23870086669921875, -0.22380447387695312, -0.2089080810546875, -0.19401168823242188, -0.17911529541015625, -0.16421890258789062, -0.149322509765625, -0.13442611694335938, -0.11952972412109375, -0.10463333129882812, -0.0897369384765625, -0.07484054565429688, -0.05994415283203125, -0.045047760009765625, -0.0301513671875, -0.015254974365234375, -0.00035858154296875, 0.014537811279296875, 0.0294342041015625, 0.044330596923828125, 0.05922698974609375, 0.07412338256835938, 0.089019775390625, 0.10391616821289062, 0.11881256103515625, 0.13370895385742188, 0.1486053466796875, 0.16350173950195312, 0.17839813232421875, 0.19329452514648438, 0.20819091796875, 0.22308731079101562, 0.23798370361328125, 0.2528800964355469, 0.2677764892578125, 0.2826728820800781, 0.29756927490234375, 0.3124656677246094, 0.327362060546875, 0.3422584533691406, 0.35715484619140625, 0.3720512390136719, 0.3869476318359375, 0.4018440246582031, 0.41674041748046875, 0.4316368103027344, 0.446533203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 9.0, 12.0, 12.0, 18.0, 23.0, 53.0, 45.0, 87.0, 99.0, 199.0, 502.0, 1024.0, 980.0, 433.0, 203.0, 116.0, 72.0, 53.0, 33.0, 28.0, 12.0, 8.0, 15.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.43750762939453125, -0.4233551025390625, -0.40920257568359375, -0.395050048828125, -0.38089752197265625, -0.3667449951171875, -0.35259246826171875, -0.33843994140625, -0.32428741455078125, -0.3101348876953125, -0.29598236083984375, -0.281829833984375, -0.26767730712890625, -0.2535247802734375, -0.23937225341796875, -0.2252197265625, -0.21106719970703125, -0.1969146728515625, -0.18276214599609375, -0.168609619140625, -0.15445709228515625, -0.1403045654296875, -0.12615203857421875, -0.11199951171875, -0.09784698486328125, -0.0836944580078125, -0.06954193115234375, -0.055389404296875, -0.04123687744140625, -0.0270843505859375, -0.01293182373046875, 0.001220703125, 0.01537322998046875, 0.0295257568359375, 0.04367828369140625, 0.057830810546875, 0.07198333740234375, 0.0861358642578125, 0.10028839111328125, 0.11444091796875, 0.12859344482421875, 0.1427459716796875, 0.15689849853515625, 0.171051025390625, 0.18520355224609375, 0.1993560791015625, 0.21350860595703125, 0.2276611328125, 0.24181365966796875, 0.2559661865234375, 0.27011871337890625, 0.284271240234375, 0.29842376708984375, 0.3125762939453125, 0.32672882080078125, 0.34088134765625, 0.35503387451171875, 0.3691864013671875, 0.38333892822265625, 0.397491455078125, 0.41164398193359375, 0.4257965087890625, 0.43994903564453125, 0.4541015625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 10.0, 16.0, 49.0, 135.0, 283.0, 304.0, 122.0, 47.0, 14.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.207853317260742, -6.019106388092041, -5.83035945892334, -5.6416120529174805, -5.452865123748779, -5.264118194580078, -5.075370788574219, -4.886623859405518, -4.697876930236816, -4.509130001068115, -4.320383071899414, -4.131635665893555, -3.9428887367248535, -3.7541418075561523, -3.565394639968872, -3.376647472381592, -3.1879005432128906, -2.9991536140441895, -2.810406446456909, -2.621659278869629, -2.4329123497009277, -2.2441654205322266, -2.0554182529449463, -1.8666712045669556, -1.6779241561889648, -1.4891771078109741, -1.3004300594329834, -1.1116830110549927, -0.922935962677002, -0.7341889142990112, -0.5454418659210205, -0.3566948175430298, -0.16794776916503906, 0.02079927921295166, 0.20954632759094238, 0.3982933759689331, 0.5870404243469238, 0.7757874727249146, 0.9645345211029053, 1.153281569480896, 1.3420286178588867, 1.5307756662368774, 1.7195227146148682, 1.9082697629928589, 2.0970168113708496, 2.285763740539551, 2.474510908126831, 2.6632580757141113, 2.8520050048828125, 3.0407519340515137, 3.229499101638794, 3.418246269226074, 3.6069931983947754, 3.7957401275634766, 3.984487295150757, 4.173234462738037, 4.361981391906738, 4.5507283210754395, 4.739475250244141, 4.92822265625, 5.116969585418701, 5.305716514587402, 5.494463920593262, 5.683210849761963, 5.871957778930664]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 12.0, 10.0, 11.0, 15.0, 21.0, 16.0, 32.0, 32.0, 15.0, 31.0, 36.0, 37.0, 45.0, 37.0, 47.0, 43.0, 41.0, 54.0, 46.0, 35.0, 43.0, 33.0, 29.0, 42.0, 36.0, 34.0, 22.0, 23.0, 16.0, 14.0, 16.0, 8.0, 14.0, 4.0, 8.0, 7.0, 2.0, 3.0, 0.0, 3.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5050184726715088, -1.4553773403167725, -1.4057360887527466, -1.3560948371887207, -1.3064537048339844, -1.256812572479248, -1.2071713209152222, -1.1575300693511963, -1.10788893699646, -1.0582478046417236, -1.0086065530776978, -0.9589653611183167, -0.9093241691589355, -0.8596829771995544, -0.8100417852401733, -0.7604005932807922, -0.7107594013214111, -0.66111820936203, -0.6114770174026489, -0.5618358254432678, -0.5121946334838867, -0.4625534415245056, -0.4129122495651245, -0.3632710576057434, -0.3136298656463623, -0.2639886736869812, -0.2143474817276001, -0.164706289768219, -0.11506509780883789, -0.06542390584945679, -0.015782713890075684, 0.03385847806930542, 0.08349967002868652, 0.13314086198806763, 0.18278205394744873, 0.23242324590682983, 0.28206443786621094, 0.33170562982559204, 0.38134682178497314, 0.43098801374435425, 0.48062920570373535, 0.5302703976631165, 0.5799115896224976, 0.6295527815818787, 0.6791939735412598, 0.7288351655006409, 0.778476357460022, 0.8281175494194031, 0.8777587413787842, 0.9273999333381653, 0.9770411252975464, 1.0266823768615723, 1.0763235092163086, 1.125964641571045, 1.1756058931350708, 1.2252471446990967, 1.274888277053833, 1.3245294094085693, 1.3741706609725952, 1.423811912536621, 1.4734530448913574, 1.5230941772460938, 1.5727354288101196, 1.6223766803741455, 1.6720178127288818]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 8.0, 7.0, 13.0, 30.0, 36.0, 58.0, 102.0, 201.0, 444.0, 1398.0, 5727.0, 45333.0, 669596.0, 300414.0, 20293.0, 3228.0, 926.0, 341.0, 165.0, 101.0, 35.0, 29.0, 24.0, 11.0, 11.0, 8.0, 7.0, 5.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.712890625, -0.6863174438476562, -0.6597442626953125, -0.6331710815429688, -0.606597900390625, -0.5800247192382812, -0.5534515380859375, -0.5268783569335938, -0.50030517578125, -0.47373199462890625, -0.4471588134765625, -0.42058563232421875, -0.394012451171875, -0.36743927001953125, -0.3408660888671875, -0.31429290771484375, -0.2877197265625, -0.26114654541015625, -0.2345733642578125, -0.20800018310546875, -0.181427001953125, -0.15485382080078125, -0.1282806396484375, -0.10170745849609375, -0.07513427734375, -0.04856109619140625, -0.0219879150390625, 0.00458526611328125, 0.031158447265625, 0.05773162841796875, 0.0843048095703125, 0.11087799072265625, 0.137451171875, 0.16402435302734375, 0.1905975341796875, 0.21717071533203125, 0.243743896484375, 0.27031707763671875, 0.2968902587890625, 0.32346343994140625, 0.35003662109375, 0.37660980224609375, 0.4031829833984375, 0.42975616455078125, 0.456329345703125, 0.48290252685546875, 0.5094757080078125, 0.5360488891601562, 0.5626220703125, 0.5891952514648438, 0.6157684326171875, 0.6423416137695312, 0.668914794921875, 0.6954879760742188, 0.7220611572265625, 0.7486343383789062, 0.77520751953125, 0.8017807006835938, 0.8283538818359375, 0.8549270629882812, 0.881500244140625, 0.9080734252929688, 0.9346466064453125, 0.9612197875976562, 0.98779296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 11.0, 14.0, 21.0, 29.0, 48.0, 59.0, 82.0, 87.0, 109.0, 107.0, 82.0, 78.0, 73.0, 71.0, 42.0, 31.0, 27.0, 9.0, 12.0, 6.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376708984375, -0.366668701171875, -0.35662841796875, -0.346588134765625, -0.3365478515625, -0.326507568359375, -0.31646728515625, -0.306427001953125, -0.29638671875, -0.286346435546875, -0.27630615234375, -0.266265869140625, -0.2562255859375, -0.246185302734375, -0.23614501953125, -0.226104736328125, -0.216064453125, -0.206024169921875, -0.19598388671875, -0.185943603515625, -0.1759033203125, -0.165863037109375, -0.15582275390625, -0.145782470703125, -0.1357421875, -0.125701904296875, -0.11566162109375, -0.105621337890625, -0.0955810546875, -0.085540771484375, -0.07550048828125, -0.065460205078125, -0.055419921875, -0.045379638671875, -0.03533935546875, -0.025299072265625, -0.0152587890625, -0.005218505859375, 0.00482177734375, 0.014862060546875, 0.02490234375, 0.034942626953125, 0.04498291015625, 0.055023193359375, 0.0650634765625, 0.075103759765625, 0.08514404296875, 0.095184326171875, 0.105224609375, 0.115264892578125, 0.12530517578125, 0.135345458984375, 0.1453857421875, 0.155426025390625, 0.16546630859375, 0.175506591796875, 0.185546875, 0.195587158203125, 0.20562744140625, 0.215667724609375, 0.2257080078125, 0.235748291015625, 0.24578857421875, 0.255828857421875, 0.265869140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 5.0, 9.0, 12.0, 12.0, 13.0, 25.0, 38.0, 56.0, 71.0, 114.0, 155.0, 333.0, 784.0, 2113.0, 7827.0, 53837.0, 703657.0, 248922.0, 23514.0, 4439.0, 1371.0, 551.0, 224.0, 167.0, 67.0, 64.0, 38.0, 31.0, 25.0, 15.0, 12.0, 8.0, 11.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7236328125, -0.7039718627929688, -0.6843109130859375, -0.6646499633789062, -0.644989013671875, -0.6253280639648438, -0.6056671142578125, -0.5860061645507812, -0.56634521484375, -0.5466842651367188, -0.5270233154296875, -0.5073623657226562, -0.487701416015625, -0.46804046630859375, -0.4483795166015625, -0.42871856689453125, -0.4090576171875, -0.38939666748046875, -0.3697357177734375, -0.35007476806640625, -0.330413818359375, -0.31075286865234375, -0.2910919189453125, -0.27143096923828125, -0.25177001953125, -0.23210906982421875, -0.2124481201171875, -0.19278717041015625, -0.173126220703125, -0.15346527099609375, -0.1338043212890625, -0.11414337158203125, -0.094482421875, -0.07482147216796875, -0.0551605224609375, -0.03549957275390625, -0.015838623046875, 0.00382232666015625, 0.0234832763671875, 0.04314422607421875, 0.06280517578125, 0.08246612548828125, 0.1021270751953125, 0.12178802490234375, 0.141448974609375, 0.16110992431640625, 0.1807708740234375, 0.20043182373046875, 0.2200927734375, 0.23975372314453125, 0.2594146728515625, 0.27907562255859375, 0.298736572265625, 0.31839752197265625, 0.3380584716796875, 0.35771942138671875, 0.37738037109375, 0.39704132080078125, 0.4167022705078125, 0.43636322021484375, 0.456024169921875, 0.47568511962890625, 0.4953460693359375, 0.5150070190429688, 0.53466796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 11.0, 21.0, 29.0, 43.0, 46.0, 47.0, 54.0, 65.0, 66.0, 72.0, 78.0, 77.0, 62.0, 74.0, 53.0, 47.0, 42.0, 28.0, 21.0, 20.0, 12.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93603515625, -0.9078140258789062, -0.8795928955078125, -0.8513717651367188, -0.823150634765625, -0.7949295043945312, -0.7667083740234375, -0.7384872436523438, -0.71026611328125, -0.6820449829101562, -0.6538238525390625, -0.6256027221679688, -0.597381591796875, -0.5691604614257812, -0.5409393310546875, -0.5127182006835938, -0.4844970703125, -0.45627593994140625, -0.4280548095703125, -0.39983367919921875, -0.371612548828125, -0.34339141845703125, -0.3151702880859375, -0.28694915771484375, -0.25872802734375, -0.23050689697265625, -0.2022857666015625, -0.17406463623046875, -0.145843505859375, -0.11762237548828125, -0.0894012451171875, -0.06118011474609375, -0.032958984375, -0.00473785400390625, 0.0234832763671875, 0.05170440673828125, 0.079925537109375, 0.10814666748046875, 0.1363677978515625, 0.16458892822265625, 0.19281005859375, 0.22103118896484375, 0.2492523193359375, 0.27747344970703125, 0.305694580078125, 0.33391571044921875, 0.3621368408203125, 0.39035797119140625, 0.4185791015625, 0.44680023193359375, 0.4750213623046875, 0.5032424926757812, 0.531463623046875, 0.5596847534179688, 0.5879058837890625, 0.6161270141601562, 0.64434814453125, 0.6725692749023438, 0.7007904052734375, 0.7290115356445312, 0.757232666015625, 0.7854537963867188, 0.8136749267578125, 0.8418960571289062, 0.8701171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 9.0, 14.0, 17.0, 44.0, 80.0, 178.0, 474.0, 1778.0, 10743.0, 142688.0, 850764.0, 35758.0, 4511.0, 911.0, 325.0, 109.0, 47.0, 26.0, 21.0, 16.0, 10.0, 10.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3798828125, -0.3684654235839844, -0.35704803466796875, -0.3456306457519531, -0.3342132568359375, -0.3227958679199219, -0.31137847900390625, -0.2999610900878906, -0.288543701171875, -0.2771263122558594, -0.26570892333984375, -0.2542915344238281, -0.2428741455078125, -0.23145675659179688, -0.22003936767578125, -0.20862197875976562, -0.19720458984375, -0.18578720092773438, -0.17436981201171875, -0.16295242309570312, -0.1515350341796875, -0.14011764526367188, -0.12870025634765625, -0.11728286743164062, -0.105865478515625, -0.09444808959960938, -0.08303070068359375, -0.07161331176757812, -0.0601959228515625, -0.048778533935546875, -0.03736114501953125, -0.025943756103515625, -0.0145263671875, -0.003108978271484375, 0.00830841064453125, 0.019725799560546875, 0.0311431884765625, 0.042560577392578125, 0.05397796630859375, 0.06539535522460938, 0.076812744140625, 0.08823013305664062, 0.09964752197265625, 0.11106491088867188, 0.1224822998046875, 0.13389968872070312, 0.14531707763671875, 0.15673446655273438, 0.16815185546875, 0.17956924438476562, 0.19098663330078125, 0.20240402221679688, 0.2138214111328125, 0.22523880004882812, 0.23665618896484375, 0.24807357788085938, 0.259490966796875, 0.2709083557128906, 0.28232574462890625, 0.2937431335449219, 0.3051605224609375, 0.3165779113769531, 0.32799530029296875, 0.3394126892089844, 0.350830078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 6.0, 7.0, 2.0, 10.0, 11.0, 19.0, 31.0, 58.0, 74.0, 101.0, 114.0, 153.0, 136.0, 75.0, 59.0, 32.0, 24.0, 24.0, 17.0, 8.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010478496551513672, -0.00010211393237113953, -9.944289922714233e-05, -9.677186608314514e-05, -9.410083293914795e-05, -9.142979979515076e-05, -8.875876665115356e-05, -8.608773350715637e-05, -8.341670036315918e-05, -8.074566721916199e-05, -7.80746340751648e-05, -7.54036009311676e-05, -7.273256778717041e-05, -7.006153464317322e-05, -6.739050149917603e-05, -6.471946835517883e-05, -6.204843521118164e-05, -5.937740206718445e-05, -5.6706368923187256e-05, -5.4035335779190063e-05, -5.136430263519287e-05, -4.869326949119568e-05, -4.6022236347198486e-05, -4.3351203203201294e-05, -4.06801700592041e-05, -3.800913691520691e-05, -3.533810377120972e-05, -3.2667070627212524e-05, -2.9996037483215332e-05, -2.732500433921814e-05, -2.4653971195220947e-05, -2.1982938051223755e-05, -1.9311904907226562e-05, -1.664087176322937e-05, -1.3969838619232178e-05, -1.1298805475234985e-05, -8.627772331237793e-06, -5.956739187240601e-06, -3.285706043243408e-06, -6.146728992462158e-07, 2.0563602447509766e-06, 4.727393388748169e-06, 7.398426532745361e-06, 1.0069459676742554e-05, 1.2740492820739746e-05, 1.541152596473694e-05, 1.808255910873413e-05, 2.0753592252731323e-05, 2.3424625396728516e-05, 2.6095658540725708e-05, 2.87666916847229e-05, 3.143772482872009e-05, 3.4108757972717285e-05, 3.677979111671448e-05, 3.945082426071167e-05, 4.212185740470886e-05, 4.4792890548706055e-05, 4.746392369270325e-05, 5.013495683670044e-05, 5.280598998069763e-05, 5.5477023124694824e-05, 5.8148056268692017e-05, 6.081908941268921e-05, 6.34901225566864e-05, 6.61611557006836e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 5.0, 6.0, 11.0, 16.0, 39.0, 54.0, 167.0, 571.0, 2757.0, 25498.0, 920559.0, 92083.0, 5431.0, 926.0, 252.0, 81.0, 38.0, 25.0, 9.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.373779296875, -0.3579978942871094, -0.34221649169921875, -0.3264350891113281, -0.3106536865234375, -0.2948722839355469, -0.27909088134765625, -0.2633094787597656, -0.247528076171875, -0.23174667358398438, -0.21596527099609375, -0.20018386840820312, -0.1844024658203125, -0.16862106323242188, -0.15283966064453125, -0.13705825805664062, -0.12127685546875, -0.10549545288085938, -0.08971405029296875, -0.07393264770507812, -0.0581512451171875, -0.042369842529296875, -0.02658843994140625, -0.010807037353515625, 0.004974365234375, 0.020755767822265625, 0.03653717041015625, 0.052318572998046875, 0.0680999755859375, 0.08388137817382812, 0.09966278076171875, 0.11544418334960938, 0.1312255859375, 0.14700698852539062, 0.16278839111328125, 0.17856979370117188, 0.1943511962890625, 0.21013259887695312, 0.22591400146484375, 0.24169540405273438, 0.257476806640625, 0.2732582092285156, 0.28903961181640625, 0.3048210144042969, 0.3206024169921875, 0.3363838195800781, 0.35216522216796875, 0.3679466247558594, 0.38372802734375, 0.3995094299316406, 0.41529083251953125, 0.4310722351074219, 0.4468536376953125, 0.4626350402832031, 0.47841644287109375, 0.4941978454589844, 0.509979248046875, 0.5257606506347656, 0.5415420532226562, 0.5573234558105469, 0.5731048583984375, 0.5888862609863281, 0.6046676635742188, 0.6204490661621094, 0.63623046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 7.0, 8.0, 7.0, 19.0, 28.0, 44.0, 45.0, 107.0, 125.0, 132.0, 145.0, 114.0, 72.0, 28.0, 39.0, 20.0, 16.0, 10.0, 7.0, 1.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315185546875, -0.30636024475097656, -0.2975349426269531, -0.2887096405029297, -0.27988433837890625, -0.2710590362548828, -0.2622337341308594, -0.25340843200683594, -0.2445831298828125, -0.23575782775878906, -0.22693252563476562, -0.2181072235107422, -0.20928192138671875, -0.2004566192626953, -0.19163131713867188, -0.18280601501464844, -0.173980712890625, -0.16515541076660156, -0.15633010864257812, -0.1475048065185547, -0.13867950439453125, -0.1298542022705078, -0.12102890014648438, -0.11220359802246094, -0.1033782958984375, -0.09455299377441406, -0.08572769165039062, -0.07690238952636719, -0.06807708740234375, -0.05925178527832031, -0.050426483154296875, -0.04160118103027344, -0.03277587890625, -0.023950576782226562, -0.015125274658203125, -0.0062999725341796875, 0.00252532958984375, 0.011350631713867188, 0.020175933837890625, 0.029001235961914062, 0.0378265380859375, 0.04665184020996094, 0.055477142333984375, 0.06430244445800781, 0.07312774658203125, 0.08195304870605469, 0.09077835083007812, 0.09960365295410156, 0.108428955078125, 0.11725425720214844, 0.12607955932617188, 0.1349048614501953, 0.14373016357421875, 0.1525554656982422, 0.16138076782226562, 0.17020606994628906, 0.1790313720703125, 0.18785667419433594, 0.19668197631835938, 0.2055072784423828, 0.21433258056640625, 0.2231578826904297, 0.23198318481445312, 0.24080848693847656, 0.2496337890625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 10.0, 5.0, 10.0, 18.0, 30.0, 68.0, 105.0, 145.0, 202.0, 144.0, 98.0, 64.0, 34.0, 22.0, 14.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.164175033569336, -3.0608623027801514, -2.9575493335723877, -2.854236602783203, -2.7509236335754395, -2.647610902786255, -2.5442981719970703, -2.4409852027893066, -2.337672472000122, -2.2343597412109375, -2.131046772003174, -2.0277340412139893, -1.9244211912155151, -1.821108341217041, -1.7177956104278564, -1.6144827604293823, -1.5111699104309082, -1.407857060432434, -1.30454421043396, -1.2012314796447754, -1.0979186296463013, -0.9946057796478271, -0.8912929892539978, -0.7879801988601685, -0.6846673488616943, -0.5813544988632202, -0.47804170846939087, -0.37472888827323914, -0.2714160680770874, -0.16810321807861328, -0.06479042768478394, 0.03852236270904541, 0.14183497428894043, 0.24514779448509216, 0.3484606146812439, 0.45177343487739563, 0.5550862550735474, 0.6583991050720215, 0.7617118954658508, 0.8650246858596802, 0.9683375358581543, 1.0716503858566284, 1.1749632358551025, 1.278275966644287, 1.3815888166427612, 1.4849016666412354, 1.58821439743042, 1.691527247428894, 1.7948400974273682, 1.8981529474258423, 2.0014657974243164, 2.104778528213501, 2.2080912590026855, 2.311404228210449, 2.414716958999634, 2.5180296897888184, 2.621342658996582, 2.7246553897857666, 2.8279683589935303, 2.931281089782715, 3.0345940589904785, 3.137906789779663, 3.2412195205688477, 3.3445324897766113, 3.447845220565796]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 6.0, 3.0, 11.0, 7.0, 20.0, 15.0, 15.0, 23.0, 28.0, 21.0, 38.0, 35.0, 54.0, 50.0, 61.0, 66.0, 74.0, 62.0, 61.0, 46.0, 41.0, 31.0, 22.0, 30.0, 38.0, 22.0, 16.0, 16.0, 19.0, 16.0, 9.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.1785826683044434, -3.0959415435791016, -3.0133001804351807, -2.930659055709839, -2.848017692565918, -2.765376567840576, -2.6827352046966553, -2.6000940799713135, -2.5174527168273926, -2.434811592102051, -2.35217022895813, -2.269529104232788, -2.186887741088867, -2.1042466163635254, -2.0216052532196045, -1.9389641284942627, -1.856323003768921, -1.7736817598342896, -1.6910405158996582, -1.6083992719650269, -1.5257580280303955, -1.4431169033050537, -1.3604756593704224, -1.277834415435791, -1.1951931715011597, -1.1125519275665283, -1.029910683631897, -0.9472694993019104, -0.864628255367279, -0.7819870114326477, -0.6993458271026611, -0.6167045831680298, -0.5340631008148193, -0.451421856880188, -0.36878064274787903, -0.28613942861557007, -0.20349818468093872, -0.12085694074630737, -0.03821572661399841, 0.04442548751831055, 0.1270667314529419, 0.20970796048641205, 0.2923491895198822, 0.37499040365219116, 0.4576316475868225, 0.5402728915214539, 0.6229140758514404, 0.7055553197860718, 0.7881965637207031, 0.8708378076553345, 0.9534790515899658, 1.0361202955245972, 1.1187615394592285, 1.2014026641845703, 1.2840439081192017, 1.366685152053833, 1.4493263959884644, 1.5319676399230957, 1.614608883857727, 1.6972501277923584, 1.7798912525177002, 1.862532615661621, 1.945173740386963, 2.0278148651123047, 2.1104562282562256]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 12.0, 10.0, 7.0, 18.0, 34.0, 40.0, 63.0, 93.0, 171.0, 318.0, 674.0, 1662.0, 4597.0, 16369.0, 115491.0, 3390179.0, 613094.0, 37682.0, 8345.0, 2914.0, 1220.0, 521.0, 289.0, 177.0, 79.0, 64.0, 51.0, 24.0, 18.0, 12.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.359130859375, -0.3478202819824219, -0.33650970458984375, -0.3251991271972656, -0.3138885498046875, -0.3025779724121094, -0.29126739501953125, -0.2799568176269531, -0.268646240234375, -0.2573356628417969, -0.24602508544921875, -0.23471450805664062, -0.2234039306640625, -0.21209335327148438, -0.20078277587890625, -0.18947219848632812, -0.17816162109375, -0.16685104370117188, -0.15554046630859375, -0.14422988891601562, -0.1329193115234375, -0.12160873413085938, -0.11029815673828125, -0.09898757934570312, -0.087677001953125, -0.07636642456054688, -0.06505584716796875, -0.053745269775390625, -0.0424346923828125, -0.031124114990234375, -0.01981353759765625, -0.008502960205078125, 0.0028076171875, 0.014118194580078125, 0.02542877197265625, 0.036739349365234375, 0.0480499267578125, 0.059360504150390625, 0.07067108154296875, 0.08198165893554688, 0.093292236328125, 0.10460281372070312, 0.11591339111328125, 0.12722396850585938, 0.1385345458984375, 0.14984512329101562, 0.16115570068359375, 0.17246627807617188, 0.18377685546875, 0.19508743286132812, 0.20639801025390625, 0.21770858764648438, 0.2290191650390625, 0.24032974243164062, 0.25164031982421875, 0.2629508972167969, 0.274261474609375, 0.2855720520019531, 0.29688262939453125, 0.3081932067871094, 0.3195037841796875, 0.3308143615722656, 0.34212493896484375, 0.3534355163574219, 0.36474609375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 18.0, 23.0, 40.0, 57.0, 86.0, 93.0, 112.0, 117.0, 89.0, 79.0, 71.0, 62.0, 53.0, 28.0, 27.0, 12.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382080078125, -0.3721656799316406, -0.36225128173828125, -0.3523368835449219, -0.3424224853515625, -0.3325080871582031, -0.32259368896484375, -0.3126792907714844, -0.302764892578125, -0.2928504943847656, -0.28293609619140625, -0.2730216979980469, -0.2631072998046875, -0.2531929016113281, -0.24327850341796875, -0.23336410522460938, -0.22344970703125, -0.21353530883789062, -0.20362091064453125, -0.19370651245117188, -0.1837921142578125, -0.17387771606445312, -0.16396331787109375, -0.15404891967773438, -0.144134521484375, -0.13422012329101562, -0.12430572509765625, -0.11439132690429688, -0.1044769287109375, -0.09456253051757812, -0.08464813232421875, -0.07473373413085938, -0.0648193359375, -0.054904937744140625, -0.04499053955078125, -0.035076141357421875, -0.0251617431640625, -0.015247344970703125, -0.00533294677734375, 0.004581451416015625, 0.014495849609375, 0.024410247802734375, 0.03432464599609375, 0.044239044189453125, 0.0541534423828125, 0.06406784057617188, 0.07398223876953125, 0.08389663696289062, 0.09381103515625, 0.10372543334960938, 0.11363983154296875, 0.12355422973632812, 0.1334686279296875, 0.14338302612304688, 0.15329742431640625, 0.16321182250976562, 0.173126220703125, 0.18304061889648438, 0.19295501708984375, 0.20286941528320312, 0.2127838134765625, 0.22269821166992188, 0.23261260986328125, 0.24252700805664062, 0.25244140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 16.0, 17.0, 38.0, 51.0, 87.0, 144.0, 232.0, 535.0, 1763.0, 13596.0, 349777.0, 3777382.0, 44856.0, 4156.0, 861.0, 335.0, 179.0, 92.0, 52.0, 33.0, 26.0, 21.0, 14.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.712890625, -0.691436767578125, -0.66998291015625, -0.648529052734375, -0.6270751953125, -0.605621337890625, -0.58416748046875, -0.562713623046875, -0.541259765625, -0.519805908203125, -0.49835205078125, -0.476898193359375, -0.4554443359375, -0.433990478515625, -0.41253662109375, -0.391082763671875, -0.36962890625, -0.348175048828125, -0.32672119140625, -0.305267333984375, -0.2838134765625, -0.262359619140625, -0.24090576171875, -0.219451904296875, -0.197998046875, -0.176544189453125, -0.15509033203125, -0.133636474609375, -0.1121826171875, -0.090728759765625, -0.06927490234375, -0.047821044921875, -0.0263671875, -0.004913330078125, 0.01654052734375, 0.037994384765625, 0.0594482421875, 0.080902099609375, 0.10235595703125, 0.123809814453125, 0.145263671875, 0.166717529296875, 0.18817138671875, 0.209625244140625, 0.2310791015625, 0.252532958984375, 0.27398681640625, 0.295440673828125, 0.31689453125, 0.338348388671875, 0.35980224609375, 0.381256103515625, 0.4027099609375, 0.424163818359375, 0.44561767578125, 0.467071533203125, 0.488525390625, 0.509979248046875, 0.53143310546875, 0.552886962890625, 0.5743408203125, 0.595794677734375, 0.61724853515625, 0.638702392578125, 0.66015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 15.0, 12.0, 19.0, 23.0, 31.0, 38.0, 63.0, 120.0, 210.0, 411.0, 1007.0, 1075.0, 503.0, 184.0, 121.0, 62.0, 41.0, 39.0, 29.0, 13.0, 10.0, 10.0, 8.0, 2.0, 2.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.433837890625, -0.421112060546875, -0.40838623046875, -0.395660400390625, -0.3829345703125, -0.370208740234375, -0.35748291015625, -0.344757080078125, -0.33203125, -0.319305419921875, -0.30657958984375, -0.293853759765625, -0.2811279296875, -0.268402099609375, -0.25567626953125, -0.242950439453125, -0.230224609375, -0.217498779296875, -0.20477294921875, -0.192047119140625, -0.1793212890625, -0.166595458984375, -0.15386962890625, -0.141143798828125, -0.12841796875, -0.115692138671875, -0.10296630859375, -0.090240478515625, -0.0775146484375, -0.064788818359375, -0.05206298828125, -0.039337158203125, -0.026611328125, -0.013885498046875, -0.00115966796875, 0.011566162109375, 0.0242919921875, 0.037017822265625, 0.04974365234375, 0.062469482421875, 0.0751953125, 0.087921142578125, 0.10064697265625, 0.113372802734375, 0.1260986328125, 0.138824462890625, 0.15155029296875, 0.164276123046875, 0.177001953125, 0.189727783203125, 0.20245361328125, 0.215179443359375, 0.2279052734375, 0.240631103515625, 0.25335693359375, 0.266082763671875, 0.27880859375, 0.291534423828125, 0.30426025390625, 0.316986083984375, 0.3297119140625, 0.342437744140625, 0.35516357421875, 0.367889404296875, 0.380615234375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 16.0, 31.0, 67.0, 138.0, 206.0, 206.0, 154.0, 91.0, 40.0, 15.0, 10.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.637744188308716, -3.5208239555358887, -3.4039037227630615, -3.2869834899902344, -3.1700632572174072, -3.05314302444458, -2.936222553253174, -2.819302558898926, -2.7023820877075195, -2.5854618549346924, -2.4685416221618652, -2.351621389389038, -2.234701156616211, -2.117780923843384, -2.0008606910705566, -1.88394033908844, -1.7670202255249023, -1.6500999927520752, -1.533179759979248, -1.416259527206421, -1.2993392944335938, -1.1824190616607666, -1.06549870967865, -0.9485784769058228, -0.8316582441329956, -0.7147380113601685, -0.5978177785873413, -0.4808974862098694, -0.36397725343704224, -0.2470570206642151, -0.13013672828674316, -0.013216495513916016, 0.10370397567749023, 0.22062422335147858, 0.3375444710254669, 0.45446473360061646, 0.5713849663734436, 0.6883051991462708, 0.8052254915237427, 0.9221457242965698, 1.039065957069397, 1.1559861898422241, 1.2729064226150513, 1.389826774597168, 1.5067470073699951, 1.6236672401428223, 1.7405874729156494, 1.8575077056884766, 1.9744279384613037, 2.091348171234131, 2.208268404006958, 2.325188636779785, 2.4421088695526123, 2.5590291023254395, 2.6759495735168457, 2.7928695678710938, 2.9097900390625, 3.026710271835327, 3.1436305046081543, 3.2605507373809814, 3.3774709701538086, 3.4943912029266357, 3.611311435699463, 3.728231906890869, 3.845151901245117]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 3.0, 6.0, 6.0, 9.0, 5.0, 9.0, 11.0, 21.0, 20.0, 17.0, 23.0, 22.0, 37.0, 26.0, 38.0, 31.0, 41.0, 39.0, 43.0, 46.0, 44.0, 45.0, 58.0, 42.0, 29.0, 30.0, 43.0, 33.0, 36.0, 28.0, 21.0, 15.0, 23.0, 13.0, 14.0, 16.0, 11.0, 9.0, 10.0, 6.0, 12.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1957745552062988, -1.1551610231399536, -1.1145474910736084, -1.0739339590072632, -1.033320426940918, -0.9927068948745728, -0.9520934224128723, -0.9114798903465271, -0.8708663582801819, -0.8302528262138367, -0.7896392941474915, -0.7490257620811462, -0.7084122896194458, -0.6677987575531006, -0.6271852254867554, -0.5865716934204102, -0.5459581613540649, -0.5053446292877197, -0.4647310972213745, -0.4241175949573517, -0.38350406289100647, -0.34289053082466125, -0.3022770285606384, -0.2616634964942932, -0.221049964427948, -0.18043643236160278, -0.13982291519641876, -0.09920939058065414, -0.058595865964889526, -0.01798233389854431, 0.02263118326663971, 0.06324470043182373, 0.10385823249816895, 0.14447176456451416, 0.18508528172969818, 0.2256987988948822, 0.2663123309612274, 0.30692586302757263, 0.34753936529159546, 0.3881528973579407, 0.4287664294242859, 0.4693799614906311, 0.5099934935569763, 0.5506070256233215, 0.591220498085022, 0.6318340301513672, 0.6724475622177124, 0.7130610942840576, 0.7536746263504028, 0.794288158416748, 0.8349016904830933, 0.8755152225494385, 0.9161287546157837, 0.9567422866821289, 0.9973557591438293, 1.0379693508148193, 1.078582763671875, 1.1191962957382202, 1.1598098278045654, 1.2004233598709106, 1.2410368919372559, 1.281650424003601, 1.3222639560699463, 1.362877368927002, 1.4034910202026367]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 20.0, 20.0, 47.0, 88.0, 141.0, 320.0, 867.0, 3034.0, 16633.0, 177840.0, 741914.0, 93769.0, 10408.0, 2171.0, 687.0, 283.0, 139.0, 75.0, 35.0, 15.0, 13.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84814453125, -0.8271408081054688, -0.8061370849609375, -0.7851333618164062, -0.764129638671875, -0.7431259155273438, -0.7221221923828125, -0.7011184692382812, -0.68011474609375, -0.6591110229492188, -0.6381072998046875, -0.6171035766601562, -0.596099853515625, -0.5750961303710938, -0.5540924072265625, -0.5330886840820312, -0.5120849609375, -0.49108123779296875, -0.4700775146484375, -0.44907379150390625, -0.428070068359375, -0.40706634521484375, -0.3860626220703125, -0.36505889892578125, -0.34405517578125, -0.32305145263671875, -0.3020477294921875, -0.28104400634765625, -0.260040283203125, -0.23903656005859375, -0.2180328369140625, -0.19702911376953125, -0.176025390625, -0.15502166748046875, -0.1340179443359375, -0.11301422119140625, -0.092010498046875, -0.07100677490234375, -0.0500030517578125, -0.02899932861328125, -0.00799560546875, 0.01300811767578125, 0.0340118408203125, 0.05501556396484375, 0.076019287109375, 0.09702301025390625, 0.1180267333984375, 0.13903045654296875, 0.1600341796875, 0.18103790283203125, 0.2020416259765625, 0.22304534912109375, 0.244049072265625, 0.26505279541015625, 0.2860565185546875, 0.30706024169921875, 0.32806396484375, 0.34906768798828125, 0.3700714111328125, 0.39107513427734375, 0.412078857421875, 0.43308258056640625, 0.4540863037109375, 0.47509002685546875, 0.49609375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 11.0, 11.0, 17.0, 30.0, 47.0, 65.0, 71.0, 92.0, 104.0, 96.0, 100.0, 79.0, 76.0, 62.0, 45.0, 29.0, 22.0, 23.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380859375, -0.3709678649902344, -0.36107635498046875, -0.3511848449707031, -0.3412933349609375, -0.3314018249511719, -0.32151031494140625, -0.3116188049316406, -0.301727294921875, -0.2918357849121094, -0.28194427490234375, -0.2720527648925781, -0.2621612548828125, -0.2522697448730469, -0.24237823486328125, -0.23248672485351562, -0.22259521484375, -0.21270370483398438, -0.20281219482421875, -0.19292068481445312, -0.1830291748046875, -0.17313766479492188, -0.16324615478515625, -0.15335464477539062, -0.143463134765625, -0.13357162475585938, -0.12368011474609375, -0.11378860473632812, -0.1038970947265625, -0.09400558471679688, -0.08411407470703125, -0.07422256469726562, -0.0643310546875, -0.054439544677734375, -0.04454803466796875, -0.034656524658203125, -0.0247650146484375, -0.014873504638671875, -0.00498199462890625, 0.004909515380859375, 0.014801025390625, 0.024692535400390625, 0.03458404541015625, 0.044475555419921875, 0.0543670654296875, 0.06425857543945312, 0.07415008544921875, 0.08404159545898438, 0.09393310546875, 0.10382461547851562, 0.11371612548828125, 0.12360763549804688, 0.1334991455078125, 0.14339065551757812, 0.15328216552734375, 0.16317367553710938, 0.173065185546875, 0.18295669555664062, 0.19284820556640625, 0.20273971557617188, 0.2126312255859375, 0.22252273559570312, 0.23241424560546875, 0.24230575561523438, 0.252197265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 7.0, 17.0, 15.0, 32.0, 50.0, 53.0, 98.0, 161.0, 286.0, 656.0, 1777.0, 7553.0, 64893.0, 862603.0, 97198.0, 9488.0, 2082.0, 736.0, 322.0, 172.0, 101.0, 64.0, 64.0, 35.0, 17.0, 15.0, 10.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6810684204101562, -0.6580352783203125, -0.6350021362304688, -0.611968994140625, -0.5889358520507812, -0.5659027099609375, -0.5428695678710938, -0.51983642578125, -0.49680328369140625, -0.4737701416015625, -0.45073699951171875, -0.427703857421875, -0.40467071533203125, -0.3816375732421875, -0.35860443115234375, -0.3355712890625, -0.31253814697265625, -0.2895050048828125, -0.26647186279296875, -0.243438720703125, -0.22040557861328125, -0.1973724365234375, -0.17433929443359375, -0.15130615234375, -0.12827301025390625, -0.1052398681640625, -0.08220672607421875, -0.059173583984375, -0.03614044189453125, -0.0131072998046875, 0.00992584228515625, 0.032958984375, 0.05599212646484375, 0.0790252685546875, 0.10205841064453125, 0.125091552734375, 0.14812469482421875, 0.1711578369140625, 0.19419097900390625, 0.21722412109375, 0.24025726318359375, 0.2632904052734375, 0.28632354736328125, 0.309356689453125, 0.33238983154296875, 0.3554229736328125, 0.37845611572265625, 0.4014892578125, 0.42452239990234375, 0.4475555419921875, 0.47058868408203125, 0.493621826171875, 0.5166549682617188, 0.5396881103515625, 0.5627212524414062, 0.58575439453125, 0.6087875366210938, 0.6318206787109375, 0.6548538208007812, 0.677886962890625, 0.7009201049804688, 0.7239532470703125, 0.7469863891601562, 0.77001953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 5.0, 1.0, 4.0, 9.0, 8.0, 6.0, 14.0, 22.0, 25.0, 42.0, 39.0, 45.0, 59.0, 44.0, 74.0, 65.0, 73.0, 78.0, 66.0, 60.0, 43.0, 53.0, 28.0, 29.0, 23.0, 21.0, 9.0, 8.0, 9.0, 6.0, 3.0, 5.0, 3.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.71435546875, -0.6890487670898438, -0.6637420654296875, -0.6384353637695312, -0.613128662109375, -0.5878219604492188, -0.5625152587890625, -0.5372085571289062, -0.51190185546875, -0.48659515380859375, -0.4612884521484375, -0.43598175048828125, -0.410675048828125, -0.38536834716796875, -0.3600616455078125, -0.33475494384765625, -0.3094482421875, -0.28414154052734375, -0.2588348388671875, -0.23352813720703125, -0.208221435546875, -0.18291473388671875, -0.1576080322265625, -0.13230133056640625, -0.10699462890625, -0.08168792724609375, -0.0563812255859375, -0.03107452392578125, -0.005767822265625, 0.01953887939453125, 0.0448455810546875, 0.07015228271484375, 0.095458984375, 0.12076568603515625, 0.1460723876953125, 0.17137908935546875, 0.196685791015625, 0.22199249267578125, 0.2472991943359375, 0.27260589599609375, 0.29791259765625, 0.32321929931640625, 0.3485260009765625, 0.37383270263671875, 0.399139404296875, 0.42444610595703125, 0.4497528076171875, 0.47505950927734375, 0.5003662109375, 0.5256729125976562, 0.5509796142578125, 0.5762863159179688, 0.601593017578125, 0.6268997192382812, 0.6522064208984375, 0.6775131225585938, 0.70281982421875, 0.7281265258789062, 0.7534332275390625, 0.7787399291992188, 0.804046630859375, 0.8293533325195312, 0.8546600341796875, 0.8799667358398438, 0.9052734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 11.0, 7.0, 19.0, 19.0, 30.0, 60.0, 92.0, 180.0, 415.0, 1041.0, 3900.0, 19236.0, 286148.0, 705022.0, 25461.0, 4679.0, 1293.0, 460.0, 194.0, 110.0, 55.0, 42.0, 21.0, 12.0, 14.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2261962890625, -0.21751976013183594, -0.20884323120117188, -0.2001667022705078, -0.19149017333984375, -0.1828136444091797, -0.17413711547851562, -0.16546058654785156, -0.1567840576171875, -0.14810752868652344, -0.13943099975585938, -0.1307544708251953, -0.12207794189453125, -0.11340141296386719, -0.10472488403320312, -0.09604835510253906, -0.087371826171875, -0.07869529724121094, -0.07001876831054688, -0.06134223937988281, -0.05266571044921875, -0.04398918151855469, -0.035312652587890625, -0.026636123657226562, -0.0179595947265625, -0.009283065795898438, -0.000606536865234375, 0.008069992065429688, 0.01674652099609375, 0.025423049926757812, 0.034099578857421875, 0.04277610778808594, 0.05145263671875, 0.06012916564941406, 0.06880569458007812, 0.07748222351074219, 0.08615875244140625, 0.09483528137207031, 0.10351181030273438, 0.11218833923339844, 0.1208648681640625, 0.12954139709472656, 0.13821792602539062, 0.1468944549560547, 0.15557098388671875, 0.1642475128173828, 0.17292404174804688, 0.18160057067871094, 0.190277099609375, 0.19895362854003906, 0.20763015747070312, 0.2163066864013672, 0.22498321533203125, 0.2336597442626953, 0.24233627319335938, 0.25101280212402344, 0.2596893310546875, 0.26836585998535156, 0.2770423889160156, 0.2857189178466797, 0.29439544677734375, 0.3030719757080078, 0.3117485046386719, 0.32042503356933594, 0.3291015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 8.0, 15.0, 11.0, 14.0, 24.0, 30.0, 39.0, 65.0, 68.0, 106.0, 131.0, 128.0, 100.0, 45.0, 53.0, 32.0, 20.0, 19.0, 16.0, 14.0, 7.0, 7.0, 7.0, 7.0, 3.0, 0.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3882598876953125e-05, -5.207117646932602e-05, -5.0259754061698914e-05, -4.844833165407181e-05, -4.66369092464447e-05, -4.4825486838817596e-05, -4.301406443119049e-05, -4.1202642023563385e-05, -3.939121961593628e-05, -3.7579797208309174e-05, -3.576837480068207e-05, -3.395695239305496e-05, -3.2145529985427856e-05, -3.033410757780075e-05, -2.8522685170173645e-05, -2.671126276254654e-05, -2.4899840354919434e-05, -2.3088417947292328e-05, -2.1276995539665222e-05, -1.9465573132038116e-05, -1.765415072441101e-05, -1.5842728316783905e-05, -1.40313059091568e-05, -1.2219883501529694e-05, -1.0408461093902588e-05, -8.597038686275482e-06, -6.7856162786483765e-06, -4.974193871021271e-06, -3.162771463394165e-06, -1.3513490557670593e-06, 4.600733518600464e-07, 2.271495759487152e-06, 4.082918167114258e-06, 5.8943405747413635e-06, 7.70576298236847e-06, 9.517185389995575e-06, 1.132860779762268e-05, 1.3140030205249786e-05, 1.4951452612876892e-05, 1.6762875020503998e-05, 1.8574297428131104e-05, 2.038571983575821e-05, 2.2197142243385315e-05, 2.400856465101242e-05, 2.5819987058639526e-05, 2.7631409466266632e-05, 2.9442831873893738e-05, 3.1254254281520844e-05, 3.306567668914795e-05, 3.4877099096775055e-05, 3.668852150440216e-05, 3.8499943912029266e-05, 4.031136631965637e-05, 4.212278872728348e-05, 4.3934211134910583e-05, 4.574563354253769e-05, 4.7557055950164795e-05, 4.93684783577919e-05, 5.1179900765419006e-05, 5.299132317304611e-05, 5.480274558067322e-05, 5.6614167988300323e-05, 5.842559039592743e-05, 6.0237012803554535e-05, 6.204843521118164e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 9.0, 11.0, 12.0, 16.0, 38.0, 30.0, 65.0, 68.0, 117.0, 203.0, 355.0, 747.0, 1546.0, 4044.0, 12658.0, 51933.0, 656707.0, 267466.0, 36784.0, 9591.0, 3272.0, 1322.0, 710.0, 337.0, 181.0, 103.0, 82.0, 52.0, 23.0, 13.0, 15.0, 8.0, 7.0, 9.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.1324939727783203, -0.12717056274414062, -0.12184715270996094, -0.11652374267578125, -0.11120033264160156, -0.10587692260742188, -0.10055351257324219, -0.0952301025390625, -0.08990669250488281, -0.08458328247070312, -0.07925987243652344, -0.07393646240234375, -0.06861305236816406, -0.06328964233398438, -0.05796623229980469, -0.052642822265625, -0.04731941223144531, -0.041996002197265625, -0.03667259216308594, -0.03134918212890625, -0.026025772094726562, -0.020702362060546875, -0.015378952026367188, -0.0100555419921875, -0.0047321319580078125, 0.000591278076171875, 0.0059146881103515625, 0.01123809814453125, 0.016561508178710938, 0.021884918212890625, 0.027208328247070312, 0.03253173828125, 0.03785514831542969, 0.043178558349609375, 0.04850196838378906, 0.05382537841796875, 0.05914878845214844, 0.06447219848632812, 0.06979560852050781, 0.0751190185546875, 0.08044242858886719, 0.08576583862304688, 0.09108924865722656, 0.09641265869140625, 0.10173606872558594, 0.10705947875976562, 0.11238288879394531, 0.117706298828125, 0.12302970886230469, 0.12835311889648438, 0.13367652893066406, 0.13899993896484375, 0.14432334899902344, 0.14964675903320312, 0.1549701690673828, 0.1602935791015625, 0.1656169891357422, 0.17094039916992188, 0.17626380920410156, 0.18158721923828125, 0.18691062927246094, 0.19223403930664062, 0.1975574493408203, 0.202880859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 8.0, 12.0, 15.0, 17.0, 26.0, 35.0, 45.0, 57.0, 97.0, 108.0, 117.0, 124.0, 82.0, 53.0, 39.0, 35.0, 14.0, 17.0, 15.0, 24.0, 6.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127197265625, -0.12171554565429688, -0.11623382568359375, -0.11075210571289062, -0.1052703857421875, -0.09978866577148438, -0.09430694580078125, -0.08882522583007812, -0.083343505859375, -0.07786178588867188, -0.07238006591796875, -0.06689834594726562, -0.0614166259765625, -0.055934906005859375, -0.05045318603515625, -0.044971466064453125, -0.03948974609375, -0.034008026123046875, -0.02852630615234375, -0.023044586181640625, -0.0175628662109375, -0.012081146240234375, -0.00659942626953125, -0.001117706298828125, 0.004364013671875, 0.009845733642578125, 0.01532745361328125, 0.020809173583984375, 0.0262908935546875, 0.031772613525390625, 0.03725433349609375, 0.042736053466796875, 0.0482177734375, 0.053699493408203125, 0.05918121337890625, 0.06466293334960938, 0.0701446533203125, 0.07562637329101562, 0.08110809326171875, 0.08658981323242188, 0.092071533203125, 0.09755325317382812, 0.10303497314453125, 0.10851669311523438, 0.1139984130859375, 0.11948013305664062, 0.12496185302734375, 0.13044357299804688, 0.13592529296875, 0.14140701293945312, 0.14688873291015625, 0.15237045288085938, 0.1578521728515625, 0.16333389282226562, 0.16881561279296875, 0.17429733276367188, 0.179779052734375, 0.18526077270507812, 0.19074249267578125, 0.19622421264648438, 0.2017059326171875, 0.20718765258789062, 0.21266937255859375, 0.21815109252929688, 0.2236328125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 14.0, 44.0, 141.0, 446.0, 219.0, 81.0, 17.0, 15.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.024956703186035, -8.797606468200684, -8.570255279541016, -8.342905044555664, -8.115553855895996, -7.888203144073486, -7.660852432250977, -7.433501720428467, -7.206151008605957, -6.978800296783447, -6.7514495849609375, -6.524098873138428, -6.296748161315918, -6.069397449493408, -5.842046737670898, -5.614696025848389, -5.387345314025879, -5.159994602203369, -4.932643890380859, -4.70529317855835, -4.47794246673584, -4.25059175491333, -4.02324104309082, -3.7958903312683105, -3.568540096282959, -3.341189384460449, -3.1138386726379395, -2.8864879608154297, -2.65913724899292, -2.43178653717041, -2.2044358253479004, -1.9770852327346802, -1.7497344017028809, -1.522383689880371, -1.2950329780578613, -1.0676822662353516, -0.8403316140174866, -0.6129809617996216, -0.3856302499771118, -0.15827953815460205, 0.06907117366790771, 0.2964218854904175, 0.5237725973129272, 0.7511232495307922, 0.978473961353302, 1.205824613571167, 1.4331753253936768, 1.6605260372161865, 1.8878767490386963, 2.115227460861206, 2.342578172683716, 2.5699288845062256, 2.7972795963287354, 3.024630069732666, 3.251980781555176, 3.4793314933776855, 3.7066822052001953, 3.934032917022705, 4.161383628845215, 4.388734340667725, 4.616085052490234, 4.843435764312744, 5.070786476135254, 5.298137187957764, 5.525487899780273]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 12.0, 3.0, 13.0, 10.0, 9.0, 18.0, 14.0, 19.0, 21.0, 27.0, 26.0, 37.0, 40.0, 41.0, 43.0, 60.0, 67.0, 85.0, 71.0, 50.0, 55.0, 36.0, 21.0, 25.0, 26.0, 31.0, 27.0, 15.0, 16.0, 11.0, 8.0, 11.0, 12.0, 11.0, 4.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.055661201477051, -1.980941891670227, -1.9062225818634033, -1.8315033912658691, -1.7567840814590454, -1.6820647716522217, -1.6073455810546875, -1.5326262712478638, -1.45790696144104, -1.3831876516342163, -1.3084683418273926, -1.2337491512298584, -1.1590298414230347, -1.084310531616211, -1.0095913410186768, -0.934872031211853, -0.8601527214050293, -0.7854334115982056, -0.7107141613960266, -0.6359949111938477, -0.5612756013870239, -0.4865563213825226, -0.41183704137802124, -0.3371177911758423, -0.26239848136901855, -0.1876792013645172, -0.11295992136001587, -0.038240641355514526, 0.036478638648986816, 0.11119791865348816, 0.1859171986579895, 0.26063644886016846, 0.3353555202484131, 0.41007480025291443, 0.48479408025741577, 0.5595133304595947, 0.6342326402664185, 0.7089519500732422, 0.7836712002754211, 0.8583904504776001, 0.9331097602844238, 1.0078290700912476, 1.0825483798980713, 1.1572675704956055, 1.2319868803024292, 1.306706190109253, 1.381425380706787, 1.4561446905136108, 1.5308640003204346, 1.6055833101272583, 1.680302619934082, 1.7550218105316162, 1.82974112033844, 1.9044604301452637, 1.9791796207427979, 2.053898811340332, 2.1286182403564453, 2.2033374309539795, 2.2780568599700928, 2.352776050567627, 2.4274954795837402, 2.5022146701812744, 2.5769338607788086, 2.651653289794922, 2.726372480392456]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 13.0, 9.0, 22.0, 39.0, 48.0, 83.0, 123.0, 232.0, 476.0, 829.0, 1833.0, 4947.0, 15595.0, 78996.0, 1862591.0, 2121040.0, 81630.0, 16362.0, 5117.0, 2055.0, 948.0, 505.0, 286.0, 152.0, 112.0, 68.0, 49.0, 22.0, 19.0, 12.0, 15.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.3469886779785156, -0.33460235595703125, -0.3222160339355469, -0.3098297119140625, -0.2974433898925781, -0.28505706787109375, -0.2726707458496094, -0.260284423828125, -0.24789810180664062, -0.23551177978515625, -0.22312545776367188, -0.2107391357421875, -0.19835281372070312, -0.18596649169921875, -0.17358016967773438, -0.16119384765625, -0.14880752563476562, -0.13642120361328125, -0.12403488159179688, -0.1116485595703125, -0.09926223754882812, -0.08687591552734375, -0.07448959350585938, -0.062103271484375, -0.049716949462890625, -0.03733062744140625, -0.024944305419921875, -0.0125579833984375, -0.000171661376953125, 0.01221466064453125, 0.024600982666015625, 0.0369873046875, 0.049373626708984375, 0.06175994873046875, 0.07414627075195312, 0.0865325927734375, 0.09891891479492188, 0.11130523681640625, 0.12369155883789062, 0.136077880859375, 0.14846420288085938, 0.16085052490234375, 0.17323684692382812, 0.1856231689453125, 0.19800949096679688, 0.21039581298828125, 0.22278213500976562, 0.23516845703125, 0.24755477905273438, 0.25994110107421875, 0.2723274230957031, 0.2847137451171875, 0.2971000671386719, 0.30948638916015625, 0.3218727111816406, 0.334259033203125, 0.3466453552246094, 0.35903167724609375, 0.3714179992675781, 0.3838043212890625, 0.3961906433105469, 0.40857696533203125, 0.4209632873535156, 0.433349609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 10.0, 9.0, 14.0, 24.0, 31.0, 32.0, 51.0, 58.0, 55.0, 78.0, 100.0, 95.0, 90.0, 56.0, 65.0, 59.0, 46.0, 33.0, 24.0, 23.0, 19.0, 13.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.282958984375, -0.2747344970703125, -0.266510009765625, -0.2582855224609375, -0.25006103515625, -0.2418365478515625, -0.233612060546875, -0.2253875732421875, -0.2171630859375, -0.2089385986328125, -0.200714111328125, -0.1924896240234375, -0.18426513671875, -0.1760406494140625, -0.167816162109375, -0.1595916748046875, -0.1513671875, -0.1431427001953125, -0.134918212890625, -0.1266937255859375, -0.11846923828125, -0.1102447509765625, -0.102020263671875, -0.0937957763671875, -0.0855712890625, -0.0773468017578125, -0.069122314453125, -0.0608978271484375, -0.05267333984375, -0.0444488525390625, -0.036224365234375, -0.0279998779296875, -0.019775390625, -0.0115509033203125, -0.003326416015625, 0.0048980712890625, 0.01312255859375, 0.0213470458984375, 0.029571533203125, 0.0377960205078125, 0.0460205078125, 0.0542449951171875, 0.062469482421875, 0.0706939697265625, 0.07891845703125, 0.0871429443359375, 0.095367431640625, 0.1035919189453125, 0.11181640625, 0.1200408935546875, 0.128265380859375, 0.1364898681640625, 0.14471435546875, 0.1529388427734375, 0.161163330078125, 0.1693878173828125, 0.1776123046875, 0.1858367919921875, 0.194061279296875, 0.2022857666015625, 0.21051025390625, 0.2187347412109375, 0.226959228515625, 0.2351837158203125, 0.243408203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 10.0, 18.0, 20.0, 23.0, 29.0, 55.0, 88.0, 102.0, 207.0, 395.0, 982.0, 3606.0, 19123.0, 223546.0, 3786054.0, 140549.0, 14654.0, 2971.0, 918.0, 346.0, 192.0, 114.0, 79.0, 44.0, 33.0, 27.0, 15.0, 17.0, 14.0, 12.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478515625, -0.52984619140625, -0.5118408203125, -0.49383544921875, -0.475830078125, -0.45782470703125, -0.4398193359375, -0.42181396484375, -0.40380859375, -0.38580322265625, -0.3677978515625, -0.34979248046875, -0.331787109375, -0.31378173828125, -0.2957763671875, -0.27777099609375, -0.259765625, -0.24176025390625, -0.2237548828125, -0.20574951171875, -0.187744140625, -0.16973876953125, -0.1517333984375, -0.13372802734375, -0.11572265625, -0.09771728515625, -0.0797119140625, -0.06170654296875, -0.043701171875, -0.02569580078125, -0.0076904296875, 0.01031494140625, 0.0283203125, 0.04632568359375, 0.0643310546875, 0.08233642578125, 0.100341796875, 0.11834716796875, 0.1363525390625, 0.15435791015625, 0.17236328125, 0.19036865234375, 0.2083740234375, 0.22637939453125, 0.244384765625, 0.26239013671875, 0.2803955078125, 0.29840087890625, 0.31640625, 0.33441162109375, 0.3524169921875, 0.37042236328125, 0.388427734375, 0.40643310546875, 0.4244384765625, 0.44244384765625, 0.46044921875, 0.47845458984375, 0.4964599609375, 0.51446533203125, 0.532470703125, 0.55047607421875, 0.5684814453125, 0.58648681640625, 0.6044921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 5.0, 6.0, 6.0, 11.0, 8.0, 19.0, 25.0, 35.0, 42.0, 46.0, 82.0, 108.0, 226.0, 387.0, 707.0, 912.0, 579.0, 306.0, 187.0, 81.0, 79.0, 53.0, 31.0, 36.0, 15.0, 13.0, 13.0, 10.0, 3.0, 5.0, 6.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32177734375, -0.3099822998046875, -0.298187255859375, -0.2863922119140625, -0.27459716796875, -0.2628021240234375, -0.251007080078125, -0.2392120361328125, -0.2274169921875, -0.2156219482421875, -0.203826904296875, -0.1920318603515625, -0.18023681640625, -0.1684417724609375, -0.156646728515625, -0.1448516845703125, -0.133056640625, -0.1212615966796875, -0.109466552734375, -0.0976715087890625, -0.08587646484375, -0.0740814208984375, -0.062286376953125, -0.0504913330078125, -0.0386962890625, -0.0269012451171875, -0.015106201171875, -0.0033111572265625, 0.00848388671875, 0.0202789306640625, 0.032073974609375, 0.0438690185546875, 0.0556640625, 0.0674591064453125, 0.079254150390625, 0.0910491943359375, 0.10284423828125, 0.1146392822265625, 0.126434326171875, 0.1382293701171875, 0.1500244140625, 0.1618194580078125, 0.173614501953125, 0.1854095458984375, 0.19720458984375, 0.2089996337890625, 0.220794677734375, 0.2325897216796875, 0.244384765625, 0.2561798095703125, 0.267974853515625, 0.2797698974609375, 0.29156494140625, 0.3033599853515625, 0.315155029296875, 0.3269500732421875, 0.3387451171875, 0.3505401611328125, 0.362335205078125, 0.3741302490234375, 0.38592529296875, 0.3977203369140625, 0.409515380859375, 0.4213104248046875, 0.43310546875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 9.0, 31.0, 58.0, 156.0, 205.0, 197.0, 147.0, 92.0, 38.0, 23.0, 13.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564911365509033, -2.437615394592285, -2.310319185256958, -2.183022975921631, -2.055727005004883, -1.9284309148788452, -1.8011348247528076, -1.67383873462677, -1.5465426445007324, -1.4192465543746948, -1.2919504642486572, -1.1646543741226196, -1.037358283996582, -0.9100621938705444, -0.7827661037445068, -0.6554700136184692, -0.5281739234924316, -0.40087783336639404, -0.27358174324035645, -0.14628565311431885, -0.01898956298828125, 0.10830652713775635, 0.23560261726379395, 0.36289870738983154, 0.49019479751586914, 0.6174908876419067, 0.7447869777679443, 0.8720830678939819, 0.9993791580200195, 1.1266752481460571, 1.2539713382720947, 1.3812674283981323, 1.50856351852417, 1.6358596086502075, 1.7631556987762451, 1.8904517889022827, 2.0177478790283203, 2.1450438499450684, 2.2723400592803955, 2.3996362686157227, 2.5269322395324707, 2.6542282104492188, 2.781524419784546, 2.908820629119873, 3.036116600036621, 3.163412570953369, 3.2907087802886963, 3.4180049896240234, 3.5453009605407715, 3.6725969314575195, 3.7998931407928467, 3.927189350128174, 4.054485321044922, 4.18178129196167, 4.309077262878418, 4.436373710632324, 4.563669681549072, 4.69096565246582, 4.818262100219727, 4.945558071136475, 5.072854042053223, 5.200150012969971, 5.327445983886719, 5.454742431640625, 5.582038402557373]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 18.0, 20.0, 17.0, 18.0, 28.0, 25.0, 30.0, 37.0, 38.0, 37.0, 45.0, 51.0, 52.0, 50.0, 53.0, 60.0, 46.0, 36.0, 32.0, 45.0, 23.0, 26.0, 25.0, 21.0, 23.0, 13.0, 18.0, 19.0, 16.0, 5.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-1.9096438884735107, -1.860107183456421, -1.8105703592300415, -1.7610336542129517, -1.7114969491958618, -1.661960244178772, -1.6124234199523926, -1.5628867149353027, -1.513350009918213, -1.463813304901123, -1.4142764806747437, -1.3647397756576538, -1.315203070640564, -1.2656663656234741, -1.2161295413970947, -1.1665928363800049, -1.117056131362915, -1.0675194263458252, -1.0179826021194458, -0.968445897102356, -0.9189091920852661, -0.8693724274635315, -0.8198356628417969, -0.770298957824707, -0.7207621335983276, -0.671225368976593, -0.6216886639595032, -0.5721518993377686, -0.5226151943206787, -0.4730784296989441, -0.42354169487953186, -0.37400496006011963, -0.3244682550430298, -0.27493152022361755, -0.22539478540420532, -0.1758580356836319, -0.12632130086421967, -0.07678456604480743, -0.02724781632423401, 0.022288918495178223, 0.07182565331459045, 0.12136238813400269, 0.17089912295341492, 0.22043587267398834, 0.26997262239456177, 0.3195093274116516, 0.36904609203338623, 0.41858282685279846, 0.4681195616722107, 0.5176563262939453, 0.5671930313110352, 0.6167297959327698, 0.6662665009498596, 0.7158032655715942, 0.7653399705886841, 0.8148767352104187, 0.8644134998321533, 0.9139502644538879, 0.9634869694709778, 1.0130237340927124, 1.0625604391098022, 1.112097144126892, 1.1616339683532715, 1.2111706733703613, 1.2607073783874512]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 16.0, 17.0, 27.0, 40.0, 63.0, 121.0, 211.0, 382.0, 730.0, 1748.0, 4312.0, 13260.0, 49967.0, 262569.0, 557631.0, 118241.0, 26329.0, 7650.0, 2839.0, 1185.0, 519.0, 257.0, 157.0, 83.0, 53.0, 38.0, 27.0, 16.0, 13.0, 10.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.55908203125, -0.5432319641113281, -0.5273818969726562, -0.5115318298339844, -0.4956817626953125, -0.4798316955566406, -0.46398162841796875, -0.4481315612792969, -0.432281494140625, -0.4164314270019531, -0.40058135986328125, -0.3847312927246094, -0.3688812255859375, -0.3530311584472656, -0.33718109130859375, -0.3213310241699219, -0.30548095703125, -0.2896308898925781, -0.27378082275390625, -0.2579307556152344, -0.2420806884765625, -0.22623062133789062, -0.21038055419921875, -0.19453048706054688, -0.178680419921875, -0.16283035278320312, -0.14698028564453125, -0.13113021850585938, -0.1152801513671875, -0.09943008422851562, -0.08358001708984375, -0.06772994995117188, -0.0518798828125, -0.036029815673828125, -0.02017974853515625, -0.004329681396484375, 0.0115203857421875, 0.027370452880859375, 0.04322052001953125, 0.059070587158203125, 0.074920654296875, 0.09077072143554688, 0.10662078857421875, 0.12247085571289062, 0.1383209228515625, 0.15417098999023438, 0.17002105712890625, 0.18587112426757812, 0.20172119140625, 0.21757125854492188, 0.23342132568359375, 0.24927139282226562, 0.2651214599609375, 0.2809715270996094, 0.29682159423828125, 0.3126716613769531, 0.328521728515625, 0.3443717956542969, 0.36022186279296875, 0.3760719299316406, 0.3919219970703125, 0.4077720642089844, 0.42362213134765625, 0.4394721984863281, 0.455322265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 10.0, 6.0, 25.0, 26.0, 31.0, 27.0, 56.0, 57.0, 71.0, 73.0, 74.0, 93.0, 85.0, 66.0, 60.0, 44.0, 42.0, 38.0, 40.0, 25.0, 20.0, 17.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2745037078857422, -0.2662925720214844, -0.25808143615722656, -0.24987030029296875, -0.24165916442871094, -0.23344802856445312, -0.2252368927001953, -0.2170257568359375, -0.2088146209716797, -0.20060348510742188, -0.19239234924316406, -0.18418121337890625, -0.17597007751464844, -0.16775894165039062, -0.1595478057861328, -0.151336669921875, -0.1431255340576172, -0.13491439819335938, -0.12670326232910156, -0.11849212646484375, -0.11028099060058594, -0.10206985473632812, -0.09385871887207031, -0.0856475830078125, -0.07743644714355469, -0.06922531127929688, -0.06101417541503906, -0.05280303955078125, -0.04459190368652344, -0.036380767822265625, -0.028169631958007812, -0.01995849609375, -0.011747360229492188, -0.003536224365234375, 0.0046749114990234375, 0.01288604736328125, 0.021097183227539062, 0.029308319091796875, 0.03751945495605469, 0.0457305908203125, 0.05394172668457031, 0.062152862548828125, 0.07036399841308594, 0.07857513427734375, 0.08678627014160156, 0.09499740600585938, 0.10320854187011719, 0.111419677734375, 0.11963081359863281, 0.12784194946289062, 0.13605308532714844, 0.14426422119140625, 0.15247535705566406, 0.16068649291992188, 0.1688976287841797, 0.1771087646484375, 0.1853199005126953, 0.19353103637695312, 0.20174217224121094, 0.20995330810546875, 0.21816444396972656, 0.22637557983398438, 0.2345867156982422, 0.2427978515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 9.0, 7.0, 11.0, 15.0, 26.0, 23.0, 42.0, 83.0, 136.0, 250.0, 541.0, 1324.0, 3884.0, 16296.0, 171782.0, 803394.0, 40124.0, 6954.0, 1986.0, 787.0, 374.0, 200.0, 95.0, 70.0, 39.0, 29.0, 17.0, 11.0, 10.0, 5.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.79931640625, -0.7759628295898438, -0.7526092529296875, -0.7292556762695312, -0.705902099609375, -0.6825485229492188, -0.6591949462890625, -0.6358413696289062, -0.61248779296875, -0.5891342163085938, -0.5657806396484375, -0.5424270629882812, -0.519073486328125, -0.49571990966796875, -0.4723663330078125, -0.44901275634765625, -0.4256591796875, -0.40230560302734375, -0.3789520263671875, -0.35559844970703125, -0.332244873046875, -0.30889129638671875, -0.2855377197265625, -0.26218414306640625, -0.23883056640625, -0.21547698974609375, -0.1921234130859375, -0.16876983642578125, -0.145416259765625, -0.12206268310546875, -0.0987091064453125, -0.07535552978515625, -0.052001953125, -0.02864837646484375, -0.0052947998046875, 0.01805877685546875, 0.041412353515625, 0.06476593017578125, 0.0881195068359375, 0.11147308349609375, 0.13482666015625, 0.15818023681640625, 0.1815338134765625, 0.20488739013671875, 0.228240966796875, 0.25159454345703125, 0.2749481201171875, 0.29830169677734375, 0.3216552734375, 0.34500885009765625, 0.3683624267578125, 0.39171600341796875, 0.415069580078125, 0.43842315673828125, 0.4617767333984375, 0.48513031005859375, 0.50848388671875, 0.5318374633789062, 0.5551910400390625, 0.5785446166992188, 0.601898193359375, 0.6252517700195312, 0.6486053466796875, 0.6719589233398438, 0.6953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 9.0, 6.0, 8.0, 14.0, 18.0, 23.0, 36.0, 26.0, 27.0, 48.0, 52.0, 54.0, 60.0, 68.0, 67.0, 72.0, 69.0, 56.0, 51.0, 47.0, 35.0, 27.0, 25.0, 17.0, 13.0, 16.0, 11.0, 9.0, 3.0, 5.0, 2.0, 3.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.73974609375, -0.7147140502929688, -0.6896820068359375, -0.6646499633789062, -0.639617919921875, -0.6145858764648438, -0.5895538330078125, -0.5645217895507812, -0.53948974609375, -0.5144577026367188, -0.4894256591796875, -0.46439361572265625, -0.439361572265625, -0.41432952880859375, -0.3892974853515625, -0.36426544189453125, -0.3392333984375, -0.31420135498046875, -0.2891693115234375, -0.26413726806640625, -0.239105224609375, -0.21407318115234375, -0.1890411376953125, -0.16400909423828125, -0.13897705078125, -0.11394500732421875, -0.0889129638671875, -0.06388092041015625, -0.038848876953125, -0.01381683349609375, 0.0112152099609375, 0.03624725341796875, 0.061279296875, 0.08631134033203125, 0.1113433837890625, 0.13637542724609375, 0.161407470703125, 0.18643951416015625, 0.2114715576171875, 0.23650360107421875, 0.26153564453125, 0.28656768798828125, 0.3115997314453125, 0.33663177490234375, 0.361663818359375, 0.38669586181640625, 0.4117279052734375, 0.43675994873046875, 0.4617919921875, 0.48682403564453125, 0.5118560791015625, 0.5368881225585938, 0.561920166015625, 0.5869522094726562, 0.6119842529296875, 0.6370162963867188, 0.66204833984375, 0.6870803833007812, 0.7121124267578125, 0.7371444702148438, 0.762176513671875, 0.7872085571289062, 0.8122406005859375, 0.8372726440429688, 0.8623046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 6.0, 7.0, 3.0, 14.0, 16.0, 19.0, 30.0, 53.0, 103.0, 212.0, 497.0, 1451.0, 5098.0, 33994.0, 946305.0, 51821.0, 6161.0, 1601.0, 624.0, 219.0, 107.0, 55.0, 42.0, 19.0, 14.0, 11.0, 11.0, 7.0, 8.0, 6.0, 3.0, 1.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.351806640625, -0.3390464782714844, -0.32628631591796875, -0.3135261535644531, -0.3007659912109375, -0.2880058288574219, -0.27524566650390625, -0.2624855041503906, -0.249725341796875, -0.23696517944335938, -0.22420501708984375, -0.21144485473632812, -0.1986846923828125, -0.18592453002929688, -0.17316436767578125, -0.16040420532226562, -0.14764404296875, -0.13488388061523438, -0.12212371826171875, -0.10936355590820312, -0.0966033935546875, -0.08384323120117188, -0.07108306884765625, -0.058322906494140625, -0.045562744140625, -0.032802581787109375, -0.02004241943359375, -0.007282257080078125, 0.0054779052734375, 0.018238067626953125, 0.03099822998046875, 0.043758392333984375, 0.0565185546875, 0.06927871704101562, 0.08203887939453125, 0.09479904174804688, 0.1075592041015625, 0.12031936645507812, 0.13307952880859375, 0.14583969116210938, 0.158599853515625, 0.17136001586914062, 0.18412017822265625, 0.19688034057617188, 0.2096405029296875, 0.22240066528320312, 0.23516082763671875, 0.24792098999023438, 0.26068115234375, 0.2734413146972656, 0.28620147705078125, 0.2989616394042969, 0.3117218017578125, 0.3244819641113281, 0.33724212646484375, 0.3500022888183594, 0.362762451171875, 0.3755226135253906, 0.38828277587890625, 0.4010429382324219, 0.4138031005859375, 0.4265632629394531, 0.43932342529296875, 0.4520835876464844, 0.46484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 9.0, 10.0, 8.0, 15.0, 18.0, 14.0, 25.0, 23.0, 29.0, 23.0, 41.0, 69.0, 76.0, 97.0, 105.0, 90.0, 71.0, 44.0, 34.0, 35.0, 23.0, 20.0, 19.0, 14.0, 11.0, 11.0, 12.0, 8.0, 13.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.61611557006836e-05, -6.39650970697403e-05, -6.1769038438797e-05, -5.95729798078537e-05, -5.73769211769104e-05, -5.51808625459671e-05, -5.2984803915023804e-05, -5.0788745284080505e-05, -4.859268665313721e-05, -4.639662802219391e-05, -4.420056939125061e-05, -4.200451076030731e-05, -3.9808452129364014e-05, -3.7612393498420715e-05, -3.541633486747742e-05, -3.322027623653412e-05, -3.102421760559082e-05, -2.8828158974647522e-05, -2.6632100343704224e-05, -2.4436041712760925e-05, -2.2239983081817627e-05, -2.004392445087433e-05, -1.784786581993103e-05, -1.5651807188987732e-05, -1.3455748558044434e-05, -1.1259689927101135e-05, -9.063631296157837e-06, -6.8675726652145386e-06, -4.67151403427124e-06, -2.475455403327942e-06, -2.7939677238464355e-07, 1.9166618585586548e-06, 4.112720489501953e-06, 6.3087791204452515e-06, 8.50483775138855e-06, 1.0700896382331848e-05, 1.2896955013275146e-05, 1.5093013644218445e-05, 1.7289072275161743e-05, 1.948513090610504e-05, 2.168118953704834e-05, 2.3877248167991638e-05, 2.6073306798934937e-05, 2.8269365429878235e-05, 3.0465424060821533e-05, 3.266148269176483e-05, 3.485754132270813e-05, 3.705359995365143e-05, 3.9249658584594727e-05, 4.1445717215538025e-05, 4.364177584648132e-05, 4.583783447742462e-05, 4.803389310836792e-05, 5.022995173931122e-05, 5.2426010370254517e-05, 5.4622069001197815e-05, 5.681812763214111e-05, 5.901418626308441e-05, 6.121024489402771e-05, 6.340630352497101e-05, 6.56023621559143e-05, 6.77984207868576e-05, 6.99944794178009e-05, 7.21905380487442e-05, 7.43865966796875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 2.0, 8.0, 9.0, 11.0, 20.0, 29.0, 33.0, 46.0, 61.0, 92.0, 137.0, 213.0, 390.0, 713.0, 1347.0, 2838.0, 8134.0, 51867.0, 906066.0, 61419.0, 8757.0, 3008.0, 1469.0, 716.0, 409.0, 229.0, 148.0, 104.0, 53.0, 66.0, 34.0, 21.0, 16.0, 13.0, 9.0, 11.0, 12.0, 6.0, 1.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.334228515625, -0.3242607116699219, -0.31429290771484375, -0.3043251037597656, -0.2943572998046875, -0.2843894958496094, -0.27442169189453125, -0.2644538879394531, -0.254486083984375, -0.24451828002929688, -0.23455047607421875, -0.22458267211914062, -0.2146148681640625, -0.20464706420898438, -0.19467926025390625, -0.18471145629882812, -0.17474365234375, -0.16477584838867188, -0.15480804443359375, -0.14484024047851562, -0.1348724365234375, -0.12490463256835938, -0.11493682861328125, -0.10496902465820312, -0.095001220703125, -0.08503341674804688, -0.07506561279296875, -0.06509780883789062, -0.0551300048828125, -0.045162200927734375, -0.03519439697265625, -0.025226593017578125, -0.0152587890625, -0.005290985107421875, 0.00467681884765625, 0.014644622802734375, 0.0246124267578125, 0.034580230712890625, 0.04454803466796875, 0.054515838623046875, 0.064483642578125, 0.07445144653320312, 0.08441925048828125, 0.09438705444335938, 0.1043548583984375, 0.11432266235351562, 0.12429046630859375, 0.13425827026367188, 0.14422607421875, 0.15419387817382812, 0.16416168212890625, 0.17412948608398438, 0.1840972900390625, 0.19406509399414062, 0.20403289794921875, 0.21400070190429688, 0.223968505859375, 0.23393630981445312, 0.24390411376953125, 0.2538719177246094, 0.2638397216796875, 0.2738075256347656, 0.28377532958984375, 0.2937431335449219, 0.3037109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 8.0, 13.0, 17.0, 33.0, 50.0, 114.0, 218.0, 233.0, 127.0, 73.0, 36.0, 16.0, 15.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.3840599060058594, -0.37212371826171875, -0.3601875305175781, -0.3482513427734375, -0.3363151550292969, -0.32437896728515625, -0.3124427795410156, -0.300506591796875, -0.2885704040527344, -0.27663421630859375, -0.2646980285644531, -0.2527618408203125, -0.24082565307617188, -0.22888946533203125, -0.21695327758789062, -0.20501708984375, -0.19308090209960938, -0.18114471435546875, -0.16920852661132812, -0.1572723388671875, -0.14533615112304688, -0.13339996337890625, -0.12146377563476562, -0.109527587890625, -0.09759140014648438, -0.08565521240234375, -0.07371902465820312, -0.0617828369140625, -0.049846649169921875, -0.03791046142578125, -0.025974273681640625, -0.0140380859375, -0.002101898193359375, 0.00983428955078125, 0.021770477294921875, 0.0337066650390625, 0.045642852783203125, 0.05757904052734375, 0.06951522827148438, 0.081451416015625, 0.09338760375976562, 0.10532379150390625, 0.11725997924804688, 0.1291961669921875, 0.14113235473632812, 0.15306854248046875, 0.16500473022460938, 0.17694091796875, 0.18887710571289062, 0.20081329345703125, 0.21274948120117188, 0.2246856689453125, 0.23662185668945312, 0.24855804443359375, 0.2604942321777344, 0.272430419921875, 0.2843666076660156, 0.29630279541015625, 0.3082389831542969, 0.3201751708984375, 0.3321113586425781, 0.34404754638671875, 0.3559837341308594, 0.367919921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 4.0, 17.0, 73.0, 295.0, 436.0, 120.0, 26.0, 10.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.787864685058594, -11.461349487304688, -11.134834289550781, -10.808319091796875, -10.481803894042969, -10.155288696289062, -9.828773498535156, -9.50225830078125, -9.175743103027344, -8.849227905273438, -8.522712707519531, -8.196197509765625, -7.869682312011719, -7.5431671142578125, -7.2166523933410645, -6.890137195587158, -6.56362247467041, -6.237107276916504, -5.910592079162598, -5.584076881408691, -5.257561683654785, -4.931046485900879, -4.604531764984131, -4.278016567230225, -3.9515013694763184, -3.624986171722412, -3.298470973968506, -2.9719560146331787, -2.6454408168792725, -2.318925619125366, -1.9924105405807495, -1.6658954620361328, -1.3393802642822266, -1.0128650665283203, -0.6863499879837036, -0.35983484983444214, -0.033319711685180664, 0.2931954860687256, 0.6197105646133423, 0.946225643157959, 1.2727408409118652, 1.5992560386657715, 1.9257711172103882, 2.252286195755005, 2.578801393508911, 2.9053165912628174, 3.2318315505981445, 3.558346748352051, 3.884861946105957, 4.211377143859863, 4.5378923416137695, 4.864407539367676, 5.190922737121582, 5.517437934875488, 5.843952655792236, 6.170467853546143, 6.496983051300049, 6.823498249053955, 7.150013446807861, 7.476528644561768, 7.803043365478516, 8.129558563232422, 8.456073760986328, 8.782588958740234, 9.10910415649414]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 15.0, 9.0, 17.0, 27.0, 26.0, 29.0, 28.0, 46.0, 56.0, 57.0, 84.0, 130.0, 106.0, 81.0, 55.0, 42.0, 32.0, 29.0, 32.0, 24.0, 14.0, 10.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1053006649017334, -2.9970927238464355, -2.8888845443725586, -2.7806766033172607, -2.672468423843384, -2.564260482788086, -2.456052303314209, -2.347844362258911, -2.2396364212036133, -2.1314284801483154, -2.0232203006744385, -1.9150123596191406, -1.8068042993545532, -1.6985962390899658, -1.5903881788253784, -1.482180118560791, -1.3739720582962036, -1.2657639980316162, -1.1575559377670288, -1.0493478775024414, -0.9411399364471436, -0.8329318761825562, -0.7247238159179688, -0.6165158152580261, -0.5083077549934387, -0.4000997245311737, -0.2918916940689087, -0.1836836338043213, -0.07547560334205627, 0.03273242712020874, 0.14094048738479614, 0.24914848804473877, 0.35735654830932617, 0.4655645787715912, 0.5737726092338562, 0.6819806694984436, 0.7901886701583862, 0.8983967304229736, 1.006604790687561, 1.1148128509521484, 1.2230207920074463, 1.3312288522720337, 1.439436912536621, 1.547644853591919, 1.6558529138565063, 1.7640609741210938, 1.8722690343856812, 1.9804770946502686, 2.0886850357055664, 2.1968929767608643, 2.305101156234741, 2.413309097290039, 2.521517276763916, 2.629725217819214, 2.7379331588745117, 2.8461413383483887, 2.9543495178222656, 3.0625574588775635, 3.1707656383514404, 3.2789735794067383, 3.3871817588806152, 3.495389699935913, 3.603597640991211, 3.711805820465088, 3.8200137615203857]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 8.0, 2.0, 4.0, 6.0, 7.0, 21.0, 12.0, 32.0, 53.0, 81.0, 159.0, 286.0, 649.0, 1619.0, 5699.0, 30079.0, 479366.0, 3471106.0, 180894.0, 17869.0, 3916.0, 1294.0, 530.0, 258.0, 128.0, 68.0, 46.0, 33.0, 26.0, 11.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89111328125, -0.8651809692382812, -0.8392486572265625, -0.8133163452148438, -0.787384033203125, -0.7614517211914062, -0.7355194091796875, -0.7095870971679688, -0.68365478515625, -0.6577224731445312, -0.6317901611328125, -0.6058578491210938, -0.579925537109375, -0.5539932250976562, -0.5280609130859375, -0.5021286010742188, -0.4761962890625, -0.45026397705078125, -0.4243316650390625, -0.39839935302734375, -0.372467041015625, -0.34653472900390625, -0.3206024169921875, -0.29467010498046875, -0.26873779296875, -0.24280548095703125, -0.2168731689453125, -0.19094085693359375, -0.165008544921875, -0.13907623291015625, -0.1131439208984375, -0.08721160888671875, -0.061279296875, -0.03534698486328125, -0.0094146728515625, 0.01651763916015625, 0.042449951171875, 0.06838226318359375, 0.0943145751953125, 0.12024688720703125, 0.14617919921875, 0.17211151123046875, 0.1980438232421875, 0.22397613525390625, 0.249908447265625, 0.27584075927734375, 0.3017730712890625, 0.32770538330078125, 0.3536376953125, 0.37957000732421875, 0.4055023193359375, 0.43143463134765625, 0.457366943359375, 0.48329925537109375, 0.5092315673828125, 0.5351638793945312, 0.56109619140625, 0.5870285034179688, 0.6129608154296875, 0.6388931274414062, 0.664825439453125, 0.6907577514648438, 0.7166900634765625, 0.7426223754882812, 0.7685546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 10.0, 11.0, 18.0, 29.0, 21.0, 19.0, 32.0, 41.0, 50.0, 57.0, 62.0, 78.0, 62.0, 74.0, 74.0, 56.0, 47.0, 58.0, 34.0, 37.0, 35.0, 22.0, 22.0, 14.0, 13.0, 12.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15185546875, -0.1450042724609375, -0.138153076171875, -0.1313018798828125, -0.12445068359375, -0.1175994873046875, -0.110748291015625, -0.1038970947265625, -0.0970458984375, -0.0901947021484375, -0.083343505859375, -0.0764923095703125, -0.06964111328125, -0.0627899169921875, -0.055938720703125, -0.0490875244140625, -0.042236328125, -0.0353851318359375, -0.028533935546875, -0.0216827392578125, -0.01483154296875, -0.0079803466796875, -0.001129150390625, 0.0057220458984375, 0.0125732421875, 0.0194244384765625, 0.026275634765625, 0.0331268310546875, 0.03997802734375, 0.0468292236328125, 0.053680419921875, 0.0605316162109375, 0.0673828125, 0.0742340087890625, 0.081085205078125, 0.0879364013671875, 0.09478759765625, 0.1016387939453125, 0.108489990234375, 0.1153411865234375, 0.1221923828125, 0.1290435791015625, 0.135894775390625, 0.1427459716796875, 0.14959716796875, 0.1564483642578125, 0.163299560546875, 0.1701507568359375, 0.177001953125, 0.1838531494140625, 0.190704345703125, 0.1975555419921875, 0.20440673828125, 0.2112579345703125, 0.218109130859375, 0.2249603271484375, 0.2318115234375, 0.2386627197265625, 0.245513916015625, 0.2523651123046875, 0.25921630859375, 0.2660675048828125, 0.272918701171875, 0.2797698974609375, 0.28662109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 11.0, 8.0, 16.0, 11.0, 33.0, 37.0, 68.0, 126.0, 190.0, 354.0, 730.0, 1801.0, 4852.0, 27935.0, 2342841.0, 1780808.0, 26325.0, 4745.0, 1677.0, 797.0, 357.0, 199.0, 103.0, 76.0, 42.0, 22.0, 17.0, 15.0, 12.0, 10.0, 10.0, 4.0, 7.0, 4.0, 1.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3681640625, -1.3290557861328125, -1.289947509765625, -1.2508392333984375, -1.21173095703125, -1.1726226806640625, -1.133514404296875, -1.0944061279296875, -1.0552978515625, -1.0161895751953125, -0.977081298828125, -0.9379730224609375, -0.89886474609375, -0.8597564697265625, -0.820648193359375, -0.7815399169921875, -0.742431640625, -0.7033233642578125, -0.664215087890625, -0.6251068115234375, -0.58599853515625, -0.5468902587890625, -0.507781982421875, -0.4686737060546875, -0.4295654296875, -0.3904571533203125, -0.351348876953125, -0.3122406005859375, -0.27313232421875, -0.2340240478515625, -0.194915771484375, -0.1558074951171875, -0.11669921875, -0.0775909423828125, -0.038482666015625, 0.0006256103515625, 0.03973388671875, 0.0788421630859375, 0.117950439453125, 0.1570587158203125, 0.1961669921875, 0.2352752685546875, 0.274383544921875, 0.3134918212890625, 0.35260009765625, 0.3917083740234375, 0.430816650390625, 0.4699249267578125, 0.509033203125, 0.5481414794921875, 0.587249755859375, 0.6263580322265625, 0.66546630859375, 0.7045745849609375, 0.743682861328125, 0.7827911376953125, 0.8218994140625, 0.8610076904296875, 0.900115966796875, 0.9392242431640625, 0.97833251953125, 1.0174407958984375, 1.056549072265625, 1.0956573486328125, 1.134765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 4.0, 7.0, 22.0, 22.0, 44.0, 74.0, 118.0, 207.0, 425.0, 787.0, 998.0, 607.0, 322.0, 176.0, 113.0, 48.0, 36.0, 15.0, 10.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89697265625, -0.8599014282226562, -0.8228302001953125, -0.7857589721679688, -0.748687744140625, -0.7116165161132812, -0.6745452880859375, -0.6374740600585938, -0.60040283203125, -0.5633316040039062, -0.5262603759765625, -0.48918914794921875, -0.452117919921875, -0.41504669189453125, -0.3779754638671875, -0.34090423583984375, -0.3038330078125, -0.26676177978515625, -0.2296905517578125, -0.19261932373046875, -0.155548095703125, -0.11847686767578125, -0.0814056396484375, -0.04433441162109375, -0.00726318359375, 0.02980804443359375, 0.0668792724609375, 0.10395050048828125, 0.141021728515625, 0.17809295654296875, 0.2151641845703125, 0.25223541259765625, 0.289306640625, 0.32637786865234375, 0.3634490966796875, 0.40052032470703125, 0.437591552734375, 0.47466278076171875, 0.5117340087890625, 0.5488052368164062, 0.58587646484375, 0.6229476928710938, 0.6600189208984375, 0.6970901489257812, 0.734161376953125, 0.7712326049804688, 0.8083038330078125, 0.8453750610351562, 0.8824462890625, 0.9195175170898438, 0.9565887451171875, 0.9936599731445312, 1.030731201171875, 1.0678024291992188, 1.1048736572265625, 1.1419448852539062, 1.17901611328125, 1.2160873413085938, 1.2531585693359375, 1.2902297973632812, 1.327301025390625, 1.3643722534179688, 1.4014434814453125, 1.4385147094726562, 1.4755859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 10.0, 13.0, 35.0, 48.0, 151.0, 269.0, 233.0, 117.0, 54.0, 27.0, 8.0, 9.0, 2.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.487607955932617, -14.043328285217285, -13.599048614501953, -13.154767990112305, -12.710488319396973, -12.26620864868164, -11.821928977966309, -11.377649307250977, -10.933368682861328, -10.489089012145996, -10.044809341430664, -9.600528717041016, -9.156249046325684, -8.711969375610352, -8.26768970489502, -7.8234100341796875, -7.3791303634643555, -6.934850692749023, -6.490570545196533, -6.046290874481201, -5.602010726928711, -5.157731056213379, -4.713451385498047, -4.269171714782715, -3.8248915672302246, -3.3806116580963135, -2.9363317489624023, -2.4920520782470703, -2.047772169113159, -1.603492259979248, -1.159212589263916, -0.7149326801300049, -0.27065181732177734, 0.173628032207489, 0.6179078817367554, 1.062187671661377, 1.506467580795288, 1.9507474899291992, 2.3950271606445312, 2.8393070697784424, 3.2835869789123535, 3.7278668880462646, 4.172146797180176, 4.616426467895508, 5.06070613861084, 5.50498628616333, 5.949265956878662, 6.393546104431152, 6.837825775146484, 7.282105445861816, 7.726385593414307, 8.170665740966797, 8.614945411682129, 9.059225082397461, 9.503504753112793, 9.947784423828125, 10.392065048217773, 10.836344718933105, 11.280624389648438, 11.724905014038086, 12.169184684753418, 12.61346435546875, 13.057744026184082, 13.502023696899414, 13.946303367614746]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 3.0, 12.0, 17.0, 19.0, 22.0, 24.0, 43.0, 45.0, 54.0, 70.0, 72.0, 87.0, 87.0, 91.0, 77.0, 70.0, 53.0, 38.0, 31.0, 25.0, 14.0, 20.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.083523750305176, -7.839505672454834, -7.595487117767334, -7.351469039916992, -7.10745096206665, -6.863432884216309, -6.619414329528809, -6.375396251678467, -6.131378173828125, -5.887360095977783, -5.643341541290283, -5.399323463439941, -5.1553053855896, -4.911287307739258, -4.667268753051758, -4.423250675201416, -4.179232120513916, -3.935213804244995, -3.6911957263946533, -3.4471774101257324, -3.2031593322753906, -2.9591410160064697, -2.715122699737549, -2.471104621887207, -2.227086305618286, -1.9830681085586548, -1.7390499114990234, -1.4950315952301025, -1.2510133981704712, -1.0069952011108398, -0.762976884841919, -0.5189586877822876, -0.27494049072265625, -0.030922263860702515, 0.21309596300125122, 0.45711421966552734, 0.7011324167251587, 0.94515061378479, 1.189168930053711, 1.4331871271133423, 1.6772053241729736, 1.921223521232605, 2.1652417182922363, 2.4092600345611572, 2.653278350830078, 2.89729642868042, 3.141314744949341, 3.3853330612182617, 3.6293511390686035, 3.8733694553375244, 4.117387771606445, 4.361405849456787, 4.605423927307129, 4.849442481994629, 5.093460559844971, 5.3374786376953125, 5.5814971923828125, 5.825515270233154, 6.069533824920654, 6.313551902770996, 6.557569980621338, 6.80158805847168, 7.04560661315918, 7.2896246910095215, 7.533642768859863]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 17.0, 17.0, 30.0, 26.0, 44.0, 77.0, 160.0, 210.0, 353.0, 740.0, 1579.0, 3722.0, 11115.0, 41219.0, 243979.0, 604639.0, 106388.0, 22605.0, 6593.0, 2595.0, 1139.0, 550.0, 303.0, 158.0, 107.0, 56.0, 32.0, 24.0, 23.0, 18.0, 9.0, 10.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.40256500244140625, -0.3908233642578125, -0.37908172607421875, -0.367340087890625, -0.35559844970703125, -0.3438568115234375, -0.33211517333984375, -0.32037353515625, -0.30863189697265625, -0.2968902587890625, -0.28514862060546875, -0.273406982421875, -0.26166534423828125, -0.2499237060546875, -0.23818206787109375, -0.2264404296875, -0.21469879150390625, -0.2029571533203125, -0.19121551513671875, -0.179473876953125, -0.16773223876953125, -0.1559906005859375, -0.14424896240234375, -0.13250732421875, -0.12076568603515625, -0.1090240478515625, -0.09728240966796875, -0.085540771484375, -0.07379913330078125, -0.0620574951171875, -0.05031585693359375, -0.03857421875, -0.02683258056640625, -0.0150909423828125, -0.00334930419921875, 0.008392333984375, 0.02013397216796875, 0.0318756103515625, 0.04361724853515625, 0.05535888671875, 0.06710052490234375, 0.0788421630859375, 0.09058380126953125, 0.102325439453125, 0.11406707763671875, 0.1258087158203125, 0.13755035400390625, 0.1492919921875, 0.16103363037109375, 0.1727752685546875, 0.18451690673828125, 0.196258544921875, 0.20800018310546875, 0.2197418212890625, 0.23148345947265625, 0.24322509765625, 0.25496673583984375, 0.2667083740234375, 0.27845001220703125, 0.290191650390625, 0.30193328857421875, 0.3136749267578125, 0.32541656494140625, 0.337158203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 9.0, 9.0, 20.0, 24.0, 34.0, 52.0, 50.0, 69.0, 81.0, 73.0, 73.0, 110.0, 96.0, 67.0, 64.0, 52.0, 34.0, 31.0, 20.0, 16.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.34853363037109375, -0.3359832763671875, -0.32343292236328125, -0.310882568359375, -0.29833221435546875, -0.2857818603515625, -0.27323150634765625, -0.26068115234375, -0.24813079833984375, -0.2355804443359375, -0.22303009033203125, -0.210479736328125, -0.19792938232421875, -0.1853790283203125, -0.17282867431640625, -0.1602783203125, -0.14772796630859375, -0.1351776123046875, -0.12262725830078125, -0.110076904296875, -0.09752655029296875, -0.0849761962890625, -0.07242584228515625, -0.05987548828125, -0.04732513427734375, -0.0347747802734375, -0.02222442626953125, -0.009674072265625, 0.00287628173828125, 0.0154266357421875, 0.02797698974609375, 0.04052734375, 0.05307769775390625, 0.0656280517578125, 0.07817840576171875, 0.090728759765625, 0.10327911376953125, 0.1158294677734375, 0.12837982177734375, 0.14093017578125, 0.15348052978515625, 0.1660308837890625, 0.17858123779296875, 0.191131591796875, 0.20368194580078125, 0.2162322998046875, 0.22878265380859375, 0.2413330078125, 0.25388336181640625, 0.2664337158203125, 0.27898406982421875, 0.291534423828125, 0.30408477783203125, 0.3166351318359375, 0.32918548583984375, 0.34173583984375, 0.35428619384765625, 0.3668365478515625, 0.37938690185546875, 0.391937255859375, 0.40448760986328125, 0.4170379638671875, 0.42958831787109375, 0.442138671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 9.0, 5.0, 11.0, 18.0, 21.0, 57.0, 65.0, 111.0, 217.0, 494.0, 1269.0, 4957.0, 41759.0, 927159.0, 63294.0, 6406.0, 1576.0, 532.0, 257.0, 125.0, 68.0, 54.0, 27.0, 20.0, 15.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6595535278320312, -0.6399078369140625, -0.6202621459960938, -0.600616455078125, -0.5809707641601562, -0.5613250732421875, -0.5416793823242188, -0.52203369140625, -0.5023880004882812, -0.4827423095703125, -0.46309661865234375, -0.443450927734375, -0.42380523681640625, -0.4041595458984375, -0.38451385498046875, -0.3648681640625, -0.34522247314453125, -0.3255767822265625, -0.30593109130859375, -0.286285400390625, -0.26663970947265625, -0.2469940185546875, -0.22734832763671875, -0.20770263671875, -0.18805694580078125, -0.1684112548828125, -0.14876556396484375, -0.129119873046875, -0.10947418212890625, -0.0898284912109375, -0.07018280029296875, -0.050537109375, -0.03089141845703125, -0.0112457275390625, 0.00839996337890625, 0.028045654296875, 0.04769134521484375, 0.0673370361328125, 0.08698272705078125, 0.10662841796875, 0.12627410888671875, 0.1459197998046875, 0.16556549072265625, 0.185211181640625, 0.20485687255859375, 0.2245025634765625, 0.24414825439453125, 0.2637939453125, 0.28343963623046875, 0.3030853271484375, 0.32273101806640625, 0.342376708984375, 0.36202239990234375, 0.3816680908203125, 0.40131378173828125, 0.42095947265625, 0.44060516357421875, 0.4602508544921875, 0.47989654541015625, 0.499542236328125, 0.5191879272460938, 0.5388336181640625, 0.5584793090820312, 0.578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 11.0, 5.0, 4.0, 10.0, 14.0, 26.0, 29.0, 33.0, 28.0, 43.0, 80.0, 86.0, 109.0, 120.0, 83.0, 90.0, 54.0, 46.0, 32.0, 27.0, 21.0, 11.0, 10.0, 14.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.44403076171875, -1.3978271484375, -1.35162353515625, -1.305419921875, -1.25921630859375, -1.2130126953125, -1.16680908203125, -1.12060546875, -1.07440185546875, -1.0281982421875, -0.98199462890625, -0.935791015625, -0.88958740234375, -0.8433837890625, -0.79718017578125, -0.7509765625, -0.70477294921875, -0.6585693359375, -0.61236572265625, -0.566162109375, -0.51995849609375, -0.4737548828125, -0.42755126953125, -0.38134765625, -0.33514404296875, -0.2889404296875, -0.24273681640625, -0.196533203125, -0.15032958984375, -0.1041259765625, -0.05792236328125, -0.01171875, 0.03448486328125, 0.0806884765625, 0.12689208984375, 0.173095703125, 0.21929931640625, 0.2655029296875, 0.31170654296875, 0.35791015625, 0.40411376953125, 0.4503173828125, 0.49652099609375, 0.542724609375, 0.58892822265625, 0.6351318359375, 0.68133544921875, 0.7275390625, 0.77374267578125, 0.8199462890625, 0.86614990234375, 0.912353515625, 0.95855712890625, 1.0047607421875, 1.05096435546875, 1.09716796875, 1.14337158203125, 1.1895751953125, 1.23577880859375, 1.281982421875, 1.32818603515625, 1.3743896484375, 1.42059326171875, 1.466796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 11.0, 14.0, 15.0, 24.0, 43.0, 31.0, 63.0, 89.0, 149.0, 223.0, 389.0, 735.0, 1512.0, 3619.0, 9903.0, 39305.0, 779845.0, 175079.0, 24639.0, 7394.0, 2721.0, 1173.0, 594.0, 361.0, 202.0, 138.0, 69.0, 51.0, 42.0, 33.0, 20.0, 6.0, 13.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06195068359375, -0.05987548828125, -0.05780029296875, -0.05572509765625, -0.05364990234375, -0.05157470703125, -0.04949951171875, -0.04742431640625, -0.04534912109375, -0.04327392578125, -0.04119873046875, -0.03912353515625, -0.03704833984375, -0.03497314453125, -0.03289794921875, -0.03082275390625, -0.02874755859375, -0.02667236328125, -0.02459716796875, -0.02252197265625, -0.02044677734375, -0.01837158203125, -0.01629638671875, -0.01422119140625, -0.01214599609375, -0.01007080078125, -0.00799560546875, -0.00592041015625, -0.00384521484375, -0.00177001953125, 0.00030517578125, 0.00238037109375, 0.00445556640625, 0.00653076171875, 0.00860595703125, 0.01068115234375, 0.01275634765625, 0.01483154296875, 0.01690673828125, 0.01898193359375, 0.02105712890625, 0.02313232421875, 0.02520751953125, 0.02728271484375, 0.02935791015625, 0.03143310546875, 0.03350830078125, 0.03558349609375, 0.03765869140625, 0.03973388671875, 0.04180908203125, 0.04388427734375, 0.04595947265625, 0.04803466796875, 0.05010986328125, 0.05218505859375, 0.05426025390625, 0.05633544921875, 0.05841064453125, 0.06048583984375, 0.06256103515625, 0.06463623046875, 0.06671142578125, 0.06878662109375, 0.07086181640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 5.0, 4.0, 8.0, 5.0, 14.0, 14.0, 20.0, 27.0, 33.0, 59.0, 73.0, 87.0, 92.0, 87.0, 95.0, 89.0, 58.0, 51.0, 29.0, 30.0, 16.0, 14.0, 18.0, 9.0, 9.0, 9.0, 8.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3543834686279297e-05, -2.2739171981811523e-05, -2.193450927734375e-05, -2.1129846572875977e-05, -2.0325183868408203e-05, -1.952052116394043e-05, -1.8715858459472656e-05, -1.7911195755004883e-05, -1.710653305053711e-05, -1.6301870346069336e-05, -1.5497207641601562e-05, -1.4692544937133789e-05, -1.3887882232666016e-05, -1.3083219528198242e-05, -1.2278556823730469e-05, -1.1473894119262695e-05, -1.0669231414794922e-05, -9.864568710327148e-06, -9.059906005859375e-06, -8.255243301391602e-06, -7.450580596923828e-06, -6.645917892456055e-06, -5.841255187988281e-06, -5.036592483520508e-06, -4.231929779052734e-06, -3.427267074584961e-06, -2.6226043701171875e-06, -1.817941665649414e-06, -1.0132789611816406e-06, -2.086162567138672e-07, 5.960464477539062e-07, 1.4007091522216797e-06, 2.205371856689453e-06, 3.0100345611572266e-06, 3.814697265625e-06, 4.6193599700927734e-06, 5.424022674560547e-06, 6.22868537902832e-06, 7.033348083496094e-06, 7.838010787963867e-06, 8.64267349243164e-06, 9.447336196899414e-06, 1.0251998901367188e-05, 1.1056661605834961e-05, 1.1861324310302734e-05, 1.2665987014770508e-05, 1.3470649719238281e-05, 1.4275312423706055e-05, 1.5079975128173828e-05, 1.58846378326416e-05, 1.6689300537109375e-05, 1.749396324157715e-05, 1.8298625946044922e-05, 1.9103288650512695e-05, 1.990795135498047e-05, 2.0712614059448242e-05, 2.1517276763916016e-05, 2.232193946838379e-05, 2.3126602172851562e-05, 2.3931264877319336e-05, 2.473592758178711e-05, 2.5540590286254883e-05, 2.6345252990722656e-05, 2.714991569519043e-05, 2.7954578399658203e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 15.0, 12.0, 22.0, 32.0, 47.0, 76.0, 122.0, 217.0, 323.0, 697.0, 1242.0, 2780.0, 6594.0, 20306.0, 93633.0, 819907.0, 73873.0, 17553.0, 6072.0, 2501.0, 1131.0, 586.0, 305.0, 177.0, 106.0, 69.0, 41.0, 20.0, 20.0, 14.0, 11.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07025146484375, -0.06815052032470703, -0.06604957580566406, -0.0639486312866211, -0.061847686767578125, -0.059746742248535156, -0.05764579772949219, -0.05554485321044922, -0.05344390869140625, -0.05134296417236328, -0.04924201965332031, -0.047141075134277344, -0.045040130615234375, -0.042939186096191406, -0.04083824157714844, -0.03873729705810547, -0.0366363525390625, -0.03453540802001953, -0.03243446350097656, -0.030333518981933594, -0.028232574462890625, -0.026131629943847656, -0.024030685424804688, -0.02192974090576172, -0.01982879638671875, -0.01772785186767578, -0.015626907348632812, -0.013525962829589844, -0.011425018310546875, -0.009324073791503906, -0.0072231292724609375, -0.005122184753417969, -0.003021240234375, -0.0009202957153320312, 0.0011806488037109375, 0.0032815933227539062, 0.005382537841796875, 0.007483482360839844, 0.009584426879882812, 0.011685371398925781, 0.01378631591796875, 0.01588726043701172, 0.017988204956054688, 0.020089149475097656, 0.022190093994140625, 0.024291038513183594, 0.026391983032226562, 0.02849292755126953, 0.0305938720703125, 0.03269481658935547, 0.03479576110839844, 0.036896705627441406, 0.038997650146484375, 0.041098594665527344, 0.04319953918457031, 0.04530048370361328, 0.04740142822265625, 0.04950237274169922, 0.05160331726074219, 0.053704261779785156, 0.055805206298828125, 0.057906150817871094, 0.06000709533691406, 0.06210803985595703, 0.064208984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 5.0, 4.0, 11.0, 11.0, 9.0, 16.0, 22.0, 33.0, 38.0, 60.0, 123.0, 168.0, 156.0, 114.0, 68.0, 45.0, 26.0, 23.0, 13.0, 18.0, 4.0, 8.0, 4.0, 3.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1302051544189453, -0.12613296508789062, -0.12206077575683594, -0.11798858642578125, -0.11391639709472656, -0.10984420776367188, -0.10577201843261719, -0.1016998291015625, -0.09762763977050781, -0.09355545043945312, -0.08948326110839844, -0.08541107177734375, -0.08133888244628906, -0.07726669311523438, -0.07319450378417969, -0.069122314453125, -0.06505012512207031, -0.060977935791015625, -0.05690574645996094, -0.05283355712890625, -0.04876136779785156, -0.044689178466796875, -0.04061698913574219, -0.0365447998046875, -0.03247261047363281, -0.028400421142578125, -0.024328231811523438, -0.02025604248046875, -0.016183853149414062, -0.012111663818359375, -0.008039474487304688, -0.00396728515625, 0.0001049041748046875, 0.004177093505859375, 0.008249282836914062, 0.01232147216796875, 0.016393661499023438, 0.020465850830078125, 0.024538040161132812, 0.0286102294921875, 0.03268241882324219, 0.036754608154296875, 0.04082679748535156, 0.04489898681640625, 0.04897117614746094, 0.053043365478515625, 0.05711555480957031, 0.061187744140625, 0.06525993347167969, 0.06933212280273438, 0.07340431213378906, 0.07747650146484375, 0.08154869079589844, 0.08562088012695312, 0.08969306945800781, 0.0937652587890625, 0.09783744812011719, 0.10190963745117188, 0.10598182678222656, 0.11005401611328125, 0.11412620544433594, 0.11819839477539062, 0.12227058410644531, 0.1263427734375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 15.0, 32.0, 70.0, 232.0, 488.0, 104.0, 32.0, 10.0, 9.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5393590927124023, -3.2913997173309326, -3.043440341949463, -2.7954812049865723, -2.5475218296051025, -2.299562454223633, -2.051603317260742, -1.8036439418792725, -1.5556845664978027, -1.307725191116333, -1.0597659349441528, -0.8118066191673279, -0.5638473033905029, -0.3158879280090332, -0.06792867183685303, 0.18003058433532715, 0.4279899597167969, 0.6759492754936218, 0.9239085912704468, 1.171867847442627, 1.4198272228240967, 1.6677865982055664, 1.9157458543777466, 2.1637051105499268, 2.4116644859313965, 2.659623861312866, 2.907583236694336, 3.1555423736572266, 3.4035017490386963, 3.651461124420166, 3.8994202613830566, 4.1473798751831055, 4.395339012145996, 4.643298149108887, 4.8912577629089355, 5.139216899871826, 5.387176513671875, 5.635135650634766, 5.883094787597656, 6.131053924560547, 6.379013538360596, 6.626972675323486, 6.874932289123535, 7.122891426086426, 7.370850563049316, 7.618810176849365, 7.866769313812256, 8.114728927612305, 8.362688064575195, 8.610647201538086, 8.858606338500977, 9.106566429138184, 9.354525566101074, 9.602484703063965, 9.850443840026855, 10.098402976989746, 10.346363067626953, 10.594322204589844, 10.842281341552734, 11.090241432189941, 11.338200569152832, 11.586159706115723, 11.834118843078613, 12.082077980041504, 12.330037117004395]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 27.0, 22.0, 37.0, 33.0, 47.0, 88.0, 137.0, 181.0, 170.0, 65.0, 51.0, 24.0, 18.0, 15.0, 16.0, 10.0, 14.0, 12.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.862760543823242, -3.698683738708496, -3.53460693359375, -3.370530128479004, -3.206453323364258, -3.0423765182495117, -2.8782994747161865, -2.7142226696014404, -2.5501458644866943, -2.3860690593719482, -2.221992254257202, -2.057915449142456, -1.8938385248184204, -1.7297617197036743, -1.5656847953796387, -1.4016079902648926, -1.2375311851501465, -1.0734543800354004, -0.9093775153160095, -0.7453006505966187, -0.5812238454818726, -0.41714704036712646, -0.2530701756477356, -0.08899331092834473, 0.07508349418640137, 0.23916032910346985, 0.40323716402053833, 0.5673140287399292, 0.7313908338546753, 0.8954676389694214, 1.059544563293457, 1.2236213684082031, 1.3876981735229492, 1.5517749786376953, 1.7158517837524414, 1.879928708076477, 2.0440053939819336, 2.2080821990966797, 2.372159242630005, 2.536236047744751, 2.700312852859497, 2.864389657974243, 3.0284664630889893, 3.1925432682037354, 3.3566203117370605, 3.5206971168518066, 3.6847739219665527, 3.848850727081299, 4.012927532196045, 4.177004337310791, 4.341081142425537, 4.505157947540283, 4.669234752655029, 4.833311557769775, 4.9973883628845215, 5.161465644836426, 5.325542449951172, 5.489619255065918, 5.653696060180664, 5.81777286529541, 5.981849670410156, 6.145926475524902, 6.310003280639648, 6.4740800857543945, 6.638156890869141]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 12.0, 12.0, 9.0, 20.0, 26.0, 27.0, 42.0, 49.0, 55.0, 193.0, 260.0, 63.0, 48.0, 49.0, 43.0, 19.0, 18.0, 12.0, 18.0, 11.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4104042053222656, -0.39868927001953125, -0.3869743347167969, -0.3752593994140625, -0.3635444641113281, -0.35182952880859375, -0.3401145935058594, -0.328399658203125, -0.3166847229003906, -0.30496978759765625, -0.2932548522949219, -0.2815399169921875, -0.2698249816894531, -0.25811004638671875, -0.24639511108398438, -0.23468017578125, -0.22296524047851562, -0.21125030517578125, -0.19953536987304688, -0.1878204345703125, -0.17610549926757812, -0.16439056396484375, -0.15267562866210938, -0.140960693359375, -0.12924575805664062, -0.11753082275390625, -0.10581588745117188, -0.0941009521484375, -0.08238601684570312, -0.07067108154296875, -0.058956146240234375, -0.0472412109375, -0.035526275634765625, -0.02381134033203125, -0.012096405029296875, -0.0003814697265625, 0.011333465576171875, 0.02304840087890625, 0.034763336181640625, 0.046478271484375, 0.058193206787109375, 0.06990814208984375, 0.08162307739257812, 0.0933380126953125, 0.10505294799804688, 0.11676788330078125, 0.12848281860351562, 0.14019775390625, 0.15191268920898438, 0.16362762451171875, 0.17534255981445312, 0.1870574951171875, 0.19877243041992188, 0.21048736572265625, 0.22220230102539062, 0.233917236328125, 0.24563217163085938, 0.25734710693359375, 0.2690620422363281, 0.2807769775390625, 0.2924919128417969, 0.30420684814453125, 0.3159217834472656, 0.32763671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 6.0, 20.0, 22.0, 47.0, 50.0, 94.0, 205.0, 469.0, 1528.0, 7696.0, 8334815.0, 38486.0, 3495.0, 904.0, 330.0, 151.0, 89.0, 56.0, 32.0, 23.0, 18.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.9818265438079834, -3.879146099090576, -3.77646541595459, -3.6737849712371826, -3.5711042881011963, -3.468423843383789, -3.3657431602478027, -3.2630627155303955, -3.1603822708129883, -3.057701826095581, -2.9550211429595947, -2.8523406982421875, -2.749660015106201, -2.646979570388794, -2.5442991256713867, -2.4416184425354004, -2.338937759399414, -2.236257314682007, -2.1335766315460205, -2.0308961868286133, -1.9282156229019165, -1.8255350589752197, -1.722854495048523, -1.6201739311218262, -1.517493486404419, -1.4148129224777222, -1.3121323585510254, -1.2094519138336182, -1.1067713499069214, -1.0040907859802246, -0.9014102220535278, -0.7987297177314758, -0.6960492134094238, -0.593368649482727, -0.49068814516067505, -0.38800758123397827, -0.2853270471096039, -0.1826465129852295, -0.07996594905853271, 0.022714555263519287, 0.12539511919021606, 0.22807565331459045, 0.33075618743896484, 0.4334367513656616, 0.5361173152923584, 0.6387978196144104, 0.7414783835411072, 0.8441588878631592, 0.946839451789856, 1.0495200157165527, 1.1522005796432495, 1.2548811435699463, 1.3575615882873535, 1.4602421522140503, 1.562922716140747, 1.6656031608581543, 1.7682838439941406, 1.8709644079208374, 1.9736449718475342, 2.0763254165649414, 2.1790060997009277, 2.281686544418335, 2.384366989135742, 2.4870476722717285, 2.5897281169891357]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 1.0, 1.0, 3.0, 8.0, 1.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.363250732421875, -4.21594762802124, -4.068645000457764, -3.921341896057129, -3.7740390300750732, -3.6267361640930176, -3.479433059692383, -3.332130193710327, -3.1848273277282715, -3.037524461746216, -2.89022159576416, -2.7429184913635254, -2.5956156253814697, -2.448312759399414, -2.3010096549987793, -2.1537067890167236, -2.006403923034668, -1.8591010570526123, -1.711798071861267, -1.5644950866699219, -1.4171922206878662, -1.2698893547058105, -1.1225863695144653, -0.9752833843231201, -0.8279805183410645, -0.680677592754364, -0.5333746671676636, -0.38607174158096313, -0.2387688159942627, -0.09146589040756226, 0.055837035179138184, 0.2031400203704834, 0.35044240951538086, 0.4977453351020813, 0.6450482606887817, 0.7923511862754822, 0.9396541118621826, 1.0869569778442383, 1.2342599630355835, 1.3815629482269287, 1.5288658142089844, 1.67616868019104, 1.8234716653823853, 1.9707746505737305, 2.118077516555786, 2.265380382537842, 2.4126834869384766, 2.5599863529205322, 2.707289218902588, 2.8545920848846436, 3.001894950866699, 3.149198055267334, 3.2965009212493896, 3.4438037872314453, 3.59110689163208, 3.7384097576141357, 3.8857126235961914, 4.033015727996826, 4.180318355560303, 4.3276214599609375, 4.474924087524414, 4.622227191925049, 4.769530296325684, 4.91683292388916, 5.064136028289795]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 18.0, 18.0, 33.0, 38.0, 74.0, 104.0, 136.0, 238.0, 417.0, 679.0, 1239.0, 2526.0, 5244.0, 11636.0, 25904.0, 58287.0, 122839.0, 148148.0, 80688.0, 35853.0, 15720.0, 7145.0, 3309.0, 1691.0, 896.0, 474.0, 289.0, 180.0, 108.0, 85.0, 46.0, 37.0, 38.0, 22.0, 23.0, 15.0, 14.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.3087158203125, -1.263916015625, -1.2191162109375, -1.17431640625, -1.1295166015625, -1.084716796875, -1.0399169921875, -0.9951171875, -0.9503173828125, -0.905517578125, -0.8607177734375, -0.81591796875, -0.7711181640625, -0.726318359375, -0.6815185546875, -0.63671875, -0.5919189453125, -0.547119140625, -0.5023193359375, -0.45751953125, -0.4127197265625, -0.367919921875, -0.3231201171875, -0.2783203125, -0.2335205078125, -0.188720703125, -0.1439208984375, -0.09912109375, -0.0543212890625, -0.009521484375, 0.0352783203125, 0.080078125, 0.1248779296875, 0.169677734375, 0.2144775390625, 0.25927734375, 0.3040771484375, 0.348876953125, 0.3936767578125, 0.4384765625, 0.4832763671875, 0.528076171875, 0.5728759765625, 0.61767578125, 0.6624755859375, 0.707275390625, 0.7520751953125, 0.796875, 0.8416748046875, 0.886474609375, 0.9312744140625, 0.97607421875, 1.0208740234375, 1.065673828125, 1.1104736328125, 1.1552734375, 1.2000732421875, 1.244873046875, 1.2896728515625, 1.33447265625, 1.3792724609375, 1.424072265625, 1.4688720703125, 1.513671875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 9.0, 25.0, 27.0, 43.0, 65.0, 116.0, 99.0, 120.0, 144.0, 89.0, 78.0, 55.0, 34.0, 28.0, 26.0, 12.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67041015625, -0.652801513671875, -0.63519287109375, -0.617584228515625, -0.5999755859375, -0.582366943359375, -0.56475830078125, -0.547149658203125, -0.529541015625, -0.511932373046875, -0.49432373046875, -0.476715087890625, -0.4591064453125, -0.441497802734375, -0.42388916015625, -0.406280517578125, -0.388671875, -0.371063232421875, -0.35345458984375, -0.335845947265625, -0.3182373046875, -0.300628662109375, -0.28302001953125, -0.265411376953125, -0.247802734375, -0.230194091796875, -0.21258544921875, -0.194976806640625, -0.1773681640625, -0.159759521484375, -0.14215087890625, -0.124542236328125, -0.10693359375, -0.089324951171875, -0.07171630859375, -0.054107666015625, -0.0364990234375, -0.018890380859375, -0.00128173828125, 0.016326904296875, 0.033935546875, 0.051544189453125, 0.06915283203125, 0.086761474609375, 0.1043701171875, 0.121978759765625, 0.13958740234375, 0.157196044921875, 0.1748046875, 0.192413330078125, 0.21002197265625, 0.227630615234375, 0.2452392578125, 0.262847900390625, 0.28045654296875, 0.298065185546875, 0.315673828125, 0.333282470703125, 0.35089111328125, 0.368499755859375, 0.3861083984375, 0.403717041015625, 0.42132568359375, 0.438934326171875, 0.45654296875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 19.0, 25.0, 63.0, 84.0, 109.0, 62.0, 32.0, 29.0, 16.0, 16.0, 8.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640334129333496, -4.501906394958496, -4.363478183746338, -4.225050449371338, -4.086622714996338, -3.948194742202759, -3.8097667694091797, -3.6713390350341797, -3.5329113006591797, -3.3944833278656006, -3.2560555934906006, -3.1176276206970215, -2.9791998863220215, -2.8407719135284424, -2.7023439407348633, -2.5639162063598633, -2.425488233566284, -2.287060260772705, -2.148632526397705, -2.010204553604126, -1.871776819229126, -1.7333488464355469, -1.5949209928512573, -1.4564931392669678, -1.3180652856826782, -1.1796374320983887, -1.0412095785140991, -0.9027816653251648, -0.7643538117408752, -0.6259259581565857, -0.48749804496765137, -0.3490701913833618, -0.21064233779907227, -0.07221446931362152, 0.06621339917182922, 0.20464128255844116, 0.3430691361427307, 0.48149698972702026, 0.6199249029159546, 0.7583527565002441, 0.8967806100845337, 1.0352084636688232, 1.1736363172531128, 1.3120641708374023, 1.4504921436309814, 1.5889198780059814, 1.7273478507995605, 1.86577570438385, 2.0042035579681396, 2.1426315307617188, 2.2810592651367188, 2.419487237930298, 2.557914972305298, 2.696342945098877, 2.834770679473877, 2.973198652267456, 3.111626625061035, 3.2500545978546143, 3.3884823322296143, 3.5269103050231934, 3.6653380393981934, 3.8037660121917725, 3.9421939849853516, 4.080621719360352, 4.219049453735352]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 1.0, 7.0, 8.0, 19.0, 15.0, 28.0, 32.0, 32.0, 52.0, 45.0, 42.0, 51.0, 33.0, 23.0, 17.0, 17.0, 13.0, 11.0, 10.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310678005218506, -3.2163918018341064, -3.122105598449707, -3.0278191566467285, -2.933532953262329, -2.8392467498779297, -2.7449605464935303, -2.650674343109131, -2.5563879013061523, -2.462101697921753, -2.3678154945373535, -2.273529052734375, -2.1792428493499756, -2.084956645965576, -1.9906704425811768, -1.8963841199874878, -1.8020979166030884, -1.707811713218689, -1.613525390625, -1.5192391872406006, -1.4249528646469116, -1.3306666612625122, -1.2363803386688232, -1.1420941352844238, -1.0478079319000244, -0.9535216689109802, -0.859235405921936, -0.7649492025375366, -0.6706628799438477, -0.5763766765594482, -0.48209041357040405, -0.38780415058135986, -0.2935178279876709, -0.1992315649986267, -0.10494531691074371, -0.010659068822860718, 0.08362719416618347, 0.17791345715522766, 0.27219969034194946, 0.36648595333099365, 0.46077221632003784, 0.555058479309082, 0.6493447422981262, 0.7436310052871704, 0.8379172086715698, 0.9322035312652588, 1.0264897346496582, 1.1207759380340576, 1.2150622606277466, 1.309348464012146, 1.403634786605835, 1.4979209899902344, 1.5922073125839233, 1.6864935159683228, 1.7807798385620117, 1.8750660419464111, 1.9693522453308105, 2.06363844871521, 2.1579246520996094, 2.252211093902588, 2.3464972972869873, 2.4407835006713867, 2.535069704055786, 2.6293559074401855, 2.723642349243164]}, "eval/loss": 4.82772970199585, "eval/wer": 2.4284212614042047, "eval/runtime": 1118.0617, "eval/samples_per_second": 2.363, "eval/steps_per_second": 0.296, "train/train_runtime": 6324.9374, "train/train_samples_per_second": 4.512, "train/train_steps_per_second": 0.141, "train/total_flos": 0.0, "train/train_loss": 4.944881099221952} \ No newline at end of file +{"train/loss": 4.2487, "train/learning_rate": 5.102040816326531e-06, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 7749, "_timestamp": 1646286542, "_step": 894, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 51.0, 788.0, 154.0, 11.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-157.27684020996094, -143.8236541748047, -130.37045288085938, -116.91726684570312, -103.46407318115234, -90.01087951660156, -76.55769348144531, -63.10449981689453, -49.65130615234375, -36.19811248779297, -22.744922637939453, -9.291732788085938, 4.161460876464844, 17.614654541015625, 31.067840576171875, 44.521034240722656, 57.97422790527344, 71.42742156982422, 84.880615234375, 98.33380126953125, 111.78699493408203, 125.24018859863281, 138.69337463378906, 152.14657592773438, 165.59976196289062, 179.05294799804688, 192.5061492919922, 205.95933532714844, 219.41253662109375, 232.86572265625, 246.31890869140625, 259.7720947265625, 273.22528076171875, 286.678466796875, 300.13165283203125, 313.5848388671875, 327.0380554199219, 340.4912414550781, 353.9444274902344, 367.3976135253906, 380.850830078125, 394.30401611328125, 407.7572021484375, 421.21038818359375, 434.6636047363281, 448.1167907714844, 461.5699768066406, 475.0231628417969, 488.4763488769531, 501.9295349121094, 515.3827514648438, 528.8359375, 542.2891235351562, 555.7423095703125, 569.1954956054688, 582.648681640625, 596.1018676757812, 609.5550537109375, 623.0082397460938, 636.46142578125, 649.9146118164062, 663.3677978515625, 676.821044921875, 690.2742309570312, 703.7274169921875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 0.0, 3.0, 9.0, 7.0, 7.0, 16.0, 23.0, 39.0, 34.0, 65.0, 107.0, 155.0, 167.0, 125.0, 93.0, 52.0, 31.0, 23.0, 12.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-367.9178161621094, -358.02044677734375, -348.12310791015625, -338.2257385253906, -328.3283996582031, -318.4310302734375, -308.53369140625, -298.6363220214844, -288.73895263671875, -278.8415832519531, -268.9442443847656, -259.046875, -249.14952087402344, -239.25216674804688, -229.3548126220703, -219.45745849609375, -209.5601043701172, -199.66275024414062, -189.76539611816406, -179.8680419921875, -169.97067260742188, -160.0733184814453, -150.17596435546875, -140.27859497070312, -130.38125610351562, -120.48390197753906, -110.58654022216797, -100.6891860961914, -90.79182434082031, -80.89447021484375, -70.99711608886719, -61.099754333496094, -51.202392578125, -41.30503463745117, -31.407678604125977, -21.51032257080078, -11.612964630126953, -1.715606689453125, 8.181747436523438, 18.07910919189453, 27.976463317871094, 37.87382125854492, 47.77117919921875, 57.66853332519531, 67.56588745117188, 77.46324920654297, 87.36060333251953, 97.25796508789062, 107.15531921386719, 117.05267333984375, 126.95003509521484, 136.84738159179688, 146.7447509765625, 156.64210510253906, 166.53945922851562, 176.43682861328125, 186.33416748046875, 196.2315216064453, 206.12887573242188, 216.0262451171875, 225.92359924316406, 235.82095336914062, 245.7183074951172, 255.61566162109375, 265.5130310058594]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 9.0, 7.0, 11.0, 17.0, 25.0, 38.0, 30.0, 72.0, 96.0, 131.0, 152.0, 130.0, 93.0, 59.0, 45.0, 28.0, 17.0, 8.0, 11.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4296875, -5.28729248046875, -5.1448974609375, -5.00250244140625, -4.860107421875, -4.71771240234375, -4.5753173828125, -4.43292236328125, -4.29052734375, -4.14813232421875, -4.0057373046875, -3.86334228515625, -3.720947265625, -3.57855224609375, -3.4361572265625, -3.29376220703125, -3.1513671875, -3.00897216796875, -2.8665771484375, -2.72418212890625, -2.581787109375, -2.43939208984375, -2.2969970703125, -2.15460205078125, -2.01220703125, -1.86981201171875, -1.7274169921875, -1.58502197265625, -1.442626953125, -1.30023193359375, -1.1578369140625, -1.01544189453125, -0.873046875, -0.73065185546875, -0.5882568359375, -0.44586181640625, -0.303466796875, -0.16107177734375, -0.0186767578125, 0.12371826171875, 0.26611328125, 0.40850830078125, 0.5509033203125, 0.69329833984375, 0.835693359375, 0.97808837890625, 1.1204833984375, 1.26287841796875, 1.4052734375, 1.54766845703125, 1.6900634765625, 1.83245849609375, 1.974853515625, 2.11724853515625, 2.2596435546875, 2.40203857421875, 2.54443359375, 2.68682861328125, 2.8292236328125, 2.97161865234375, 3.114013671875, 3.25640869140625, 3.3988037109375, 3.54119873046875, 3.68359375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 17.0, 23.0, 17.0, 19.0, 36.0, 71.0, 92.0, 125.0, 210.0, 343.0, 642.0, 1381.0, 3303.0, 14395.0, 4000953.0, 161666.0, 7076.0, 2043.0, 852.0, 372.0, 248.0, 113.0, 84.0, 59.0, 28.0, 23.0, 25.0, 13.0, 6.0, 6.0, 8.0, 8.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-46.40625, -45.1787109375, -43.951171875, -42.7236328125, -41.49609375, -40.2685546875, -39.041015625, -37.8134765625, -36.5859375, -35.3583984375, -34.130859375, -32.9033203125, -31.67578125, -30.4482421875, -29.220703125, -27.9931640625, -26.765625, -25.5380859375, -24.310546875, -23.0830078125, -21.85546875, -20.6279296875, -19.400390625, -18.1728515625, -16.9453125, -15.7177734375, -14.490234375, -13.2626953125, -12.03515625, -10.8076171875, -9.580078125, -8.3525390625, -7.125, -5.8974609375, -4.669921875, -3.4423828125, -2.21484375, -0.9873046875, 0.240234375, 1.4677734375, 2.6953125, 3.9228515625, 5.150390625, 6.3779296875, 7.60546875, 8.8330078125, 10.060546875, 11.2880859375, 12.515625, 13.7431640625, 14.970703125, 16.1982421875, 17.42578125, 18.6533203125, 19.880859375, 21.1083984375, 22.3359375, 23.5634765625, 24.791015625, 26.0185546875, 27.24609375, 28.4736328125, 29.701171875, 30.9287109375, 32.15625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 14.0, 14.0, 16.0, 29.0, 28.0, 35.0, 65.0, 97.0, 169.0, 298.0, 640.0, 1029.0, 687.0, 371.0, 194.0, 111.0, 72.0, 54.0, 38.0, 27.0, 17.0, 12.0, 14.0, 9.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.387939453125, -9.03369140625, -8.679443359375, -8.3251953125, -7.970947265625, -7.61669921875, -7.262451171875, -6.908203125, -6.553955078125, -6.19970703125, -5.845458984375, -5.4912109375, -5.136962890625, -4.78271484375, -4.428466796875, -4.07421875, -3.719970703125, -3.36572265625, -3.011474609375, -2.6572265625, -2.302978515625, -1.94873046875, -1.594482421875, -1.240234375, -0.885986328125, -0.53173828125, -0.177490234375, 0.1767578125, 0.531005859375, 0.88525390625, 1.239501953125, 1.59375, 1.947998046875, 2.30224609375, 2.656494140625, 3.0107421875, 3.364990234375, 3.71923828125, 4.073486328125, 4.427734375, 4.781982421875, 5.13623046875, 5.490478515625, 5.8447265625, 6.198974609375, 6.55322265625, 6.907470703125, 7.26171875, 7.615966796875, 7.97021484375, 8.324462890625, 8.6787109375, 9.032958984375, 9.38720703125, 9.741455078125, 10.095703125, 10.449951171875, 10.80419921875, 11.158447265625, 11.5126953125, 11.866943359375, 12.22119140625, 12.575439453125, 12.9296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 11.0, 21.0, 19.0, 25.0, 42.0, 61.0, 81.0, 121.0, 177.0, 320.0, 1004.0, 6191.0, 151149.0, 3984397.0, 45848.0, 3317.0, 701.0, 284.0, 157.0, 97.0, 57.0, 66.0, 38.0, 25.0, 20.0, 15.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.53125, -35.5263671875, -34.521484375, -33.5166015625, -32.51171875, -31.5068359375, -30.501953125, -29.4970703125, -28.4921875, -27.4873046875, -26.482421875, -25.4775390625, -24.47265625, -23.4677734375, -22.462890625, -21.4580078125, -20.453125, -19.4482421875, -18.443359375, -17.4384765625, -16.43359375, -15.4287109375, -14.423828125, -13.4189453125, -12.4140625, -11.4091796875, -10.404296875, -9.3994140625, -8.39453125, -7.3896484375, -6.384765625, -5.3798828125, -4.375, -3.3701171875, -2.365234375, -1.3603515625, -0.35546875, 0.6494140625, 1.654296875, 2.6591796875, 3.6640625, 4.6689453125, 5.673828125, 6.6787109375, 7.68359375, 8.6884765625, 9.693359375, 10.6982421875, 11.703125, 12.7080078125, 13.712890625, 14.7177734375, 15.72265625, 16.7275390625, 17.732421875, 18.7373046875, 19.7421875, 20.7470703125, 21.751953125, 22.7568359375, 23.76171875, 24.7666015625, 25.771484375, 26.7763671875, 27.78125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 52.0, 218.0, 463.0, 201.0, 59.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.93682098388672, -117.5113754272461, -115.0859375, -112.66049194335938, -110.23505401611328, -107.80960845947266, -105.38417053222656, -102.95872497558594, -100.53327941894531, -98.10783386230469, -95.6823959350586, -93.25695037841797, -90.83151245117188, -88.40606689453125, -85.98062133789062, -83.55518341064453, -81.12974548339844, -78.70429992675781, -76.27886199951172, -73.8534164428711, -71.427978515625, -69.00253295898438, -66.57708740234375, -64.15164947509766, -61.72620391845703, -59.30076217651367, -56.87532043457031, -54.44987487792969, -52.02443313598633, -49.59899139404297, -47.17354965209961, -44.74810791015625, -42.32265853881836, -39.897216796875, -37.47177505493164, -35.04633331298828, -32.620887756347656, -30.195446014404297, -27.770004272460938, -25.344560623168945, -22.919118881225586, -20.493677139282227, -18.068233489990234, -15.642791748046875, -13.2173490524292, -10.791906356811523, -8.366464614868164, -5.941020965576172, -3.5155792236328125, -1.0901367664337158, 1.3353056907653809, 3.7607479095458984, 6.186190605163574, 8.61163330078125, 11.03707504272461, 13.462518692016602, 15.887960433959961, 18.31340217590332, 20.738845825195312, 23.164287567138672, 25.58972930908203, 28.015172958374023, 30.440614700317383, 32.866058349609375, 35.291500091552734]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 12.0, 9.0, 17.0, 13.0, 19.0, 21.0, 30.0, 21.0, 32.0, 32.0, 33.0, 46.0, 40.0, 42.0, 40.0, 49.0, 42.0, 44.0, 41.0, 39.0, 47.0, 38.0, 38.0, 40.0, 26.0, 25.0, 32.0, 23.0, 16.0, 15.0, 12.0, 14.0, 8.0, 5.0, 3.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.84715270996094, -32.708274841308594, -31.56939697265625, -30.430519104003906, -29.291641235351562, -28.15276336669922, -27.013885498046875, -25.87500762939453, -24.736129760742188, -23.597251892089844, -22.4583740234375, -21.319496154785156, -20.180618286132812, -19.04174041748047, -17.902862548828125, -16.76398468017578, -15.625104904174805, -14.486227035522461, -13.347349166870117, -12.208471298217773, -11.06959342956543, -9.930715560913086, -8.791836738586426, -7.652958869934082, -6.514081001281738, -5.3752031326293945, -4.236325263977051, -3.097446918487549, -1.958569049835205, -0.8196911811828613, 0.3191871643066406, 1.4580650329589844, 2.596942901611328, 3.735820770263672, 4.874698638916016, 6.013576984405518, 7.152454853057861, 8.291332244873047, 9.430211067199707, 10.56908893585205, 11.707966804504395, 12.846844673156738, 13.985722541809082, 15.124601364135742, 16.263479232788086, 17.40235710144043, 18.541234970092773, 19.680112838745117, 20.81899070739746, 21.957868576049805, 23.09674644470215, 24.235624313354492, 25.374502182006836, 26.51338005065918, 27.652259826660156, 28.7911376953125, 29.930015563964844, 31.068893432617188, 32.20777130126953, 33.346649169921875, 34.48552703857422, 35.62440490722656, 36.763282775878906, 37.90216064453125, 39.041038513183594]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 14.0, 10.0, 28.0, 29.0, 42.0, 50.0, 83.0, 106.0, 125.0, 157.0, 104.0, 76.0, 56.0, 36.0, 27.0, 13.0, 10.0, 7.0, 1.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.91290283203125, -4.7789306640625, -4.64495849609375, -4.510986328125, -4.37701416015625, -4.2430419921875, -4.10906982421875, -3.97509765625, -3.84112548828125, -3.7071533203125, -3.57318115234375, -3.439208984375, -3.30523681640625, -3.1712646484375, -3.03729248046875, -2.9033203125, -2.76934814453125, -2.6353759765625, -2.50140380859375, -2.367431640625, -2.23345947265625, -2.0994873046875, -1.96551513671875, -1.83154296875, -1.69757080078125, -1.5635986328125, -1.42962646484375, -1.295654296875, -1.16168212890625, -1.0277099609375, -0.89373779296875, -0.759765625, -0.62579345703125, -0.4918212890625, -0.35784912109375, -0.223876953125, -0.08990478515625, 0.0440673828125, 0.17803955078125, 0.31201171875, 0.44598388671875, 0.5799560546875, 0.71392822265625, 0.847900390625, 0.98187255859375, 1.1158447265625, 1.24981689453125, 1.3837890625, 1.51776123046875, 1.6517333984375, 1.78570556640625, 1.919677734375, 2.05364990234375, 2.1876220703125, 2.32159423828125, 2.45556640625, 2.58953857421875, 2.7235107421875, 2.85748291015625, 2.991455078125, 3.12542724609375, 3.2593994140625, 3.39337158203125, 3.52734375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 11.0, 5.0, 12.0, 10.0, 17.0, 19.0, 30.0, 37.0, 57.0, 77.0, 121.0, 180.0, 262.0, 416.0, 633.0, 993.0, 1474.0, 2513.0, 4484.0, 8982.0, 21978.0, 71196.0, 434702.0, 391400.0, 68229.0, 20756.0, 9021.0, 4418.0, 2397.0, 1447.0, 944.0, 583.0, 373.0, 238.0, 151.0, 125.0, 70.0, 58.0, 36.0, 30.0, 20.0, 11.0, 15.0, 4.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2352294921875, -0.22763633728027344, -0.22004318237304688, -0.2124500274658203, -0.20485687255859375, -0.1972637176513672, -0.18967056274414062, -0.18207740783691406, -0.1744842529296875, -0.16689109802246094, -0.15929794311523438, -0.1517047882080078, -0.14411163330078125, -0.1365184783935547, -0.12892532348632812, -0.12133216857910156, -0.113739013671875, -0.10614585876464844, -0.09855270385742188, -0.09095954895019531, -0.08336639404296875, -0.07577323913574219, -0.06818008422851562, -0.06058692932128906, -0.0529937744140625, -0.04540061950683594, -0.037807464599609375, -0.030214309692382812, -0.02262115478515625, -0.015027999877929688, -0.007434844970703125, 0.0001583099365234375, 0.00775146484375, 0.015344619750976562, 0.022937774658203125, 0.030530929565429688, 0.03812408447265625, 0.04571723937988281, 0.053310394287109375, 0.06090354919433594, 0.0684967041015625, 0.07608985900878906, 0.08368301391601562, 0.09127616882324219, 0.09886932373046875, 0.10646247863769531, 0.11405563354492188, 0.12164878845214844, 0.129241943359375, 0.13683509826660156, 0.14442825317382812, 0.1520214080810547, 0.15961456298828125, 0.1672077178955078, 0.17480087280273438, 0.18239402770996094, 0.1899871826171875, 0.19758033752441406, 0.20517349243164062, 0.2127666473388672, 0.22035980224609375, 0.2279529571533203, 0.23554611206054688, 0.24313926696777344, 0.250732421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 4.0, 8.0, 12.0, 16.0, 24.0, 24.0, 28.0, 25.0, 33.0, 33.0, 27.0, 29.0, 39.0, 50.0, 44.0, 50.0, 1064.0, 62.0, 48.0, 59.0, 36.0, 49.0, 38.0, 34.0, 24.0, 27.0, 23.0, 18.0, 25.0, 16.0, 10.0, 14.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0546875, -2.952239990234375, -2.84979248046875, -2.747344970703125, -2.6448974609375, -2.542449951171875, -2.44000244140625, -2.337554931640625, -2.235107421875, -2.132659912109375, -2.03021240234375, -1.927764892578125, -1.8253173828125, -1.722869873046875, -1.62042236328125, -1.517974853515625, -1.41552734375, -1.313079833984375, -1.21063232421875, -1.108184814453125, -1.0057373046875, -0.903289794921875, -0.80084228515625, -0.698394775390625, -0.595947265625, -0.493499755859375, -0.39105224609375, -0.288604736328125, -0.1861572265625, -0.083709716796875, 0.01873779296875, 0.121185302734375, 0.2236328125, 0.326080322265625, 0.42852783203125, 0.530975341796875, 0.6334228515625, 0.735870361328125, 0.83831787109375, 0.940765380859375, 1.043212890625, 1.145660400390625, 1.24810791015625, 1.350555419921875, 1.4530029296875, 1.555450439453125, 1.65789794921875, 1.760345458984375, 1.86279296875, 1.965240478515625, 2.06768798828125, 2.170135498046875, 2.2725830078125, 2.375030517578125, 2.47747802734375, 2.579925537109375, 2.682373046875, 2.784820556640625, 2.88726806640625, 2.989715576171875, 3.0921630859375, 3.194610595703125, 3.29705810546875, 3.399505615234375, 3.501953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 10.0, 10.0, 12.0, 31.0, 32.0, 44.0, 77.0, 125.0, 156.0, 244.0, 444.0, 616.0, 1009.0, 1529.0, 2345.0, 3568.0, 5616.0, 8782.0, 14055.0, 22371.0, 36501.0, 61429.0, 111638.0, 1282345.0, 290438.0, 103776.0, 57655.0, 34439.0, 21122.0, 13204.0, 8499.0, 5444.0, 3410.0, 2157.0, 1433.0, 869.0, 593.0, 387.0, 269.0, 149.0, 105.0, 80.0, 39.0, 31.0, 14.0, 13.0, 7.0, 4.0, 7.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.08544921875, -0.082855224609375, -0.08026123046875, -0.077667236328125, -0.0750732421875, -0.072479248046875, -0.06988525390625, -0.067291259765625, -0.064697265625, -0.062103271484375, -0.05950927734375, -0.056915283203125, -0.0543212890625, -0.051727294921875, -0.04913330078125, -0.046539306640625, -0.0439453125, -0.041351318359375, -0.03875732421875, -0.036163330078125, -0.0335693359375, -0.030975341796875, -0.02838134765625, -0.025787353515625, -0.023193359375, -0.020599365234375, -0.01800537109375, -0.015411376953125, -0.0128173828125, -0.010223388671875, -0.00762939453125, -0.005035400390625, -0.00244140625, 0.000152587890625, 0.00274658203125, 0.005340576171875, 0.0079345703125, 0.010528564453125, 0.01312255859375, 0.015716552734375, 0.018310546875, 0.020904541015625, 0.02349853515625, 0.026092529296875, 0.0286865234375, 0.031280517578125, 0.03387451171875, 0.036468505859375, 0.0390625, 0.041656494140625, 0.04425048828125, 0.046844482421875, 0.0494384765625, 0.052032470703125, 0.05462646484375, 0.057220458984375, 0.059814453125, 0.062408447265625, 0.06500244140625, 0.067596435546875, 0.0701904296875, 0.072784423828125, 0.07537841796875, 0.077972412109375, 0.08056640625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 4.0, 9.0, 15.0, 14.0, 12.0, 14.0, 30.0, 30.0, 29.0, 47.0, 38.0, 49.0, 65.0, 74.0, 79.0, 85.0, 49.0, 59.0, 35.0, 40.0, 32.0, 31.0, 38.0, 15.0, 25.0, 17.0, 10.0, 11.0, 8.0, 7.0, 6.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006933212280273438, -0.0006714761257171631, -0.0006496310234069824, -0.0006277859210968018, -0.0006059408187866211, -0.0005840957164764404, -0.0005622506141662598, -0.0005404055118560791, -0.0005185604095458984, -0.0004967153072357178, -0.0004748702049255371, -0.00045302510261535645, -0.0004311800003051758, -0.0004093348979949951, -0.00038748979568481445, -0.0003656446933746338, -0.0003437995910644531, -0.00032195448875427246, -0.0003001093864440918, -0.00027826428413391113, -0.00025641918182373047, -0.0002345740795135498, -0.00021272897720336914, -0.00019088387489318848, -0.0001690387725830078, -0.00014719367027282715, -0.00012534856796264648, -0.00010350346565246582, -8.165836334228516e-05, -5.981326103210449e-05, -3.796815872192383e-05, -1.6123056411743164e-05, 5.7220458984375e-06, 2.7567148208618164e-05, 4.941225051879883e-05, 7.125735282897949e-05, 9.310245513916016e-05, 0.00011494755744934082, 0.00013679265975952148, 0.00015863776206970215, 0.0001804828643798828, 0.00020232796669006348, 0.00022417306900024414, 0.0002460181713104248, 0.00026786327362060547, 0.00028970837593078613, 0.0003115534782409668, 0.00033339858055114746, 0.0003552436828613281, 0.0003770887851715088, 0.00039893388748168945, 0.0004207789897918701, 0.0004426240921020508, 0.00046446919441223145, 0.0004863142967224121, 0.0005081593990325928, 0.0005300045013427734, 0.0005518496036529541, 0.0005736947059631348, 0.0005955398082733154, 0.0006173849105834961, 0.0006392300128936768, 0.0006610751152038574, 0.0006829202175140381, 0.0007047653198242188]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 8.0, 11.0, 11.0, 15.0, 16.0, 24.0, 34.0, 50.0, 62.0, 72.0, 88.0, 127.0, 133.0, 217.0, 227.0, 366.0, 27533.0, 1017823.0, 448.0, 309.0, 193.0, 151.0, 156.0, 98.0, 94.0, 73.0, 40.0, 37.0, 34.0, 25.0, 15.0, 12.0, 14.0, 5.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0141448974609375, -0.013705253601074219, -0.013265609741210938, -0.012825965881347656, -0.012386322021484375, -0.011946678161621094, -0.011507034301757812, -0.011067390441894531, -0.01062774658203125, -0.010188102722167969, -0.009748458862304688, -0.009308815002441406, -0.008869171142578125, -0.008429527282714844, -0.007989883422851562, -0.007550239562988281, -0.007110595703125, -0.006670951843261719, -0.0062313079833984375, -0.005791664123535156, -0.005352020263671875, -0.004912376403808594, -0.0044727325439453125, -0.004033088684082031, -0.00359344482421875, -0.0031538009643554688, -0.0027141571044921875, -0.0022745132446289062, -0.001834869384765625, -0.0013952255249023438, -0.0009555816650390625, -0.0005159378051757812, -7.62939453125e-05, 0.00036334991455078125, 0.0008029937744140625, 0.0012426376342773438, 0.001682281494140625, 0.0021219253540039062, 0.0025615692138671875, 0.0030012130737304688, 0.00344085693359375, 0.0038805007934570312, 0.0043201446533203125, 0.004759788513183594, 0.005199432373046875, 0.005639076232910156, 0.0060787200927734375, 0.006518363952636719, 0.0069580078125, 0.007397651672363281, 0.007837295532226562, 0.008276939392089844, 0.008716583251953125, 0.009156227111816406, 0.009595870971679688, 0.010035514831542969, 0.01047515869140625, 0.010914802551269531, 0.011354446411132812, 0.011794090270996094, 0.012233734130859375, 0.012673377990722656, 0.013113021850585938, 0.013552665710449219, 0.0139923095703125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1010.0, 4.0], "bins": [-0.01571698673069477, -0.015465534292161465, -0.015214082784950733, -0.014962630346417427, -0.014711177907884121, -0.014459725469350815, -0.014208273962140083, -0.013956821523606777, -0.013705369085073471, -0.013453916646540165, -0.013202465139329433, -0.012951012700796127, -0.012699560262262821, -0.012448107823729515, -0.012196656316518784, -0.011945203877985477, -0.011693752370774746, -0.01144229993224144, -0.011190848425030708, -0.010939395986497402, -0.010687943547964096, -0.010436492040753365, -0.010185039602220058, -0.009933587163686752, -0.00968213565647602, -0.009430683217942715, -0.009179231710731983, -0.008927779272198677, -0.008676326833665371, -0.008424874395132065, -0.008173422887921333, -0.007921970449388027, -0.0076705170795321465, -0.007419065106660128, -0.0071676126681268215, -0.006916160695254803, -0.006664708256721497, -0.006413256283849478, -0.006161804310977459, -0.005910351872444153, -0.005658899899572134, -0.005407447926700115, -0.005155995488166809, -0.00490454351529479, -0.0046530915424227715, -0.004401639103889465, -0.0041501871310174465, -0.003898734925314784, -0.0036472827196121216, -0.003395830513909459, -0.0031443783082067966, -0.002892926335334778, -0.0026414741296321154, -0.002390021923929453, -0.002138569951057434, -0.0018871177453547716, -0.001635665656067431, -0.0013842135667800903, -0.0011327613610774279, -0.0008813092135824263, -0.0006298570660874248, -0.0003784048603847623, -0.00012695277109742165, 0.000124499318189919, 0.0003759515529964119]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 19.0, 17.0, 21.0, 24.0, 33.0, 25.0, 36.0, 58.0, 48.0, 53.0, 68.0, 67.0, 60.0, 60.0, 61.0, 56.0, 43.0, 46.0, 44.0, 29.0, 35.0, 24.0, 14.0, 19.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006846189498901367, -0.0006620734930038452, -0.0006395280361175537, -0.0006169825792312622, -0.0005944371223449707, -0.0005718916654586792, -0.0005493462085723877, -0.0005268007516860962, -0.0005042552947998047, -0.0004817098379135132, -0.0004591643810272217, -0.0004366189241409302, -0.00041407346725463867, -0.00039152801036834717, -0.00036898255348205566, -0.00034643709659576416, -0.00032389163970947266, -0.00030134618282318115, -0.00027880072593688965, -0.00025625526905059814, -0.00023370981216430664, -0.00021116435527801514, -0.00018861889839172363, -0.00016607344150543213, -0.00014352798461914062, -0.00012098252773284912, -9.843707084655762e-05, -7.589161396026611e-05, -5.334615707397461e-05, -3.0800700187683105e-05, -8.255243301391602e-06, 1.4290213584899902e-05, 3.6835670471191406e-05, 5.938112735748291e-05, 8.192658424377441e-05, 0.00010447204113006592, 0.00012701749801635742, 0.00014956295490264893, 0.00017210841178894043, 0.00019465386867523193, 0.00021719932556152344, 0.00023974478244781494, 0.00026229023933410645, 0.00028483569622039795, 0.00030738115310668945, 0.00032992660999298096, 0.00035247206687927246, 0.00037501752376556396, 0.00039756298065185547, 0.00042010843753814697, 0.0004426538944244385, 0.00046519935131073, 0.0004877448081970215, 0.000510290265083313, 0.0005328357219696045, 0.000555381178855896, 0.0005779266357421875, 0.000600472092628479, 0.0006230175495147705, 0.000645563006401062, 0.0006681084632873535, 0.000690653920173645, 0.0007131993770599365, 0.000735744833946228, 0.0007582902908325195]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 2.0, 8.0, 14.0, 10.0, 28.0, 29.0, 42.0, 50.0, 83.0, 106.0, 125.0, 157.0, 104.0, 76.0, 56.0, 36.0, 27.0, 13.0, 10.0, 7.0, 1.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.046875, -4.91290283203125, -4.7789306640625, -4.64495849609375, -4.510986328125, -4.37701416015625, -4.2430419921875, -4.10906982421875, -3.97509765625, -3.84112548828125, -3.7071533203125, -3.57318115234375, -3.439208984375, -3.30523681640625, -3.1712646484375, -3.03729248046875, -2.9033203125, -2.76934814453125, -2.6353759765625, -2.50140380859375, -2.367431640625, -2.23345947265625, -2.0994873046875, -1.96551513671875, -1.83154296875, -1.69757080078125, -1.5635986328125, -1.42962646484375, -1.295654296875, -1.16168212890625, -1.0277099609375, -0.89373779296875, -0.759765625, -0.62579345703125, -0.4918212890625, -0.35784912109375, -0.223876953125, -0.08990478515625, 0.0440673828125, 0.17803955078125, 0.31201171875, 0.44598388671875, 0.5799560546875, 0.71392822265625, 0.847900390625, 0.98187255859375, 1.1158447265625, 1.24981689453125, 1.3837890625, 1.51776123046875, 1.6517333984375, 1.78570556640625, 1.919677734375, 2.05364990234375, 2.1876220703125, 2.32159423828125, 2.45556640625, 2.58953857421875, 2.7235107421875, 2.85748291015625, 2.991455078125, 3.12542724609375, 3.2593994140625, 3.39337158203125, 3.52734375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 6.0, 11.0, 16.0, 29.0, 32.0, 56.0, 89.0, 94.0, 165.0, 250.0, 486.0, 955.0, 1974.0, 5367.0, 28971.0, 923839.0, 73186.0, 7823.0, 2549.0, 1160.0, 610.0, 312.0, 184.0, 114.0, 79.0, 51.0, 50.0, 28.0, 12.0, 11.0, 9.0, 12.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.328125, -26.515869140625, -25.70361328125, -24.891357421875, -24.0791015625, -23.266845703125, -22.45458984375, -21.642333984375, -20.830078125, -20.017822265625, -19.20556640625, -18.393310546875, -17.5810546875, -16.768798828125, -15.95654296875, -15.144287109375, -14.33203125, -13.519775390625, -12.70751953125, -11.895263671875, -11.0830078125, -10.270751953125, -9.45849609375, -8.646240234375, -7.833984375, -7.021728515625, -6.20947265625, -5.397216796875, -4.5849609375, -3.772705078125, -2.96044921875, -2.148193359375, -1.3359375, -0.523681640625, 0.28857421875, 1.100830078125, 1.9130859375, 2.725341796875, 3.53759765625, 4.349853515625, 5.162109375, 5.974365234375, 6.78662109375, 7.598876953125, 8.4111328125, 9.223388671875, 10.03564453125, 10.847900390625, 11.66015625, 12.472412109375, 13.28466796875, 14.096923828125, 14.9091796875, 15.721435546875, 16.53369140625, 17.345947265625, 18.158203125, 18.970458984375, 19.78271484375, 20.594970703125, 21.4072265625, 22.219482421875, 23.03173828125, 23.843994140625, 24.65625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 8.0, 7.0, 12.0, 11.0, 18.0, 19.0, 14.0, 28.0, 26.0, 18.0, 37.0, 33.0, 39.0, 51.0, 55.0, 59.0, 96.0, 192.0, 1520.0, 226.0, 100.0, 87.0, 63.0, 28.0, 43.0, 39.0, 24.0, 25.0, 29.0, 21.0, 18.0, 16.0, 11.0, 11.0, 12.0, 7.0, 12.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69921875, -6.47332763671875, -6.2474365234375, -6.02154541015625, -5.795654296875, -5.56976318359375, -5.3438720703125, -5.11798095703125, -4.89208984375, -4.66619873046875, -4.4403076171875, -4.21441650390625, -3.988525390625, -3.76263427734375, -3.5367431640625, -3.31085205078125, -3.0849609375, -2.85906982421875, -2.6331787109375, -2.40728759765625, -2.181396484375, -1.95550537109375, -1.7296142578125, -1.50372314453125, -1.27783203125, -1.05194091796875, -0.8260498046875, -0.60015869140625, -0.374267578125, -0.14837646484375, 0.0775146484375, 0.30340576171875, 0.529296875, 0.75518798828125, 0.9810791015625, 1.20697021484375, 1.432861328125, 1.65875244140625, 1.8846435546875, 2.11053466796875, 2.33642578125, 2.56231689453125, 2.7882080078125, 3.01409912109375, 3.239990234375, 3.46588134765625, 3.6917724609375, 3.91766357421875, 4.1435546875, 4.36944580078125, 4.5953369140625, 4.82122802734375, 5.047119140625, 5.27301025390625, 5.4989013671875, 5.72479248046875, 5.95068359375, 6.17657470703125, 6.4024658203125, 6.62835693359375, 6.854248046875, 7.08013916015625, 7.3060302734375, 7.53192138671875, 7.7578125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 10.0, 6.0, 12.0, 16.0, 11.0, 22.0, 28.0, 23.0, 32.0, 42.0, 50.0, 81.0, 166.0, 335.0, 1262.0, 24451.0, 3090122.0, 26731.0, 1307.0, 384.0, 164.0, 95.0, 59.0, 45.0, 40.0, 25.0, 27.0, 21.0, 18.0, 23.0, 16.0, 6.0, 11.0, 12.0, 5.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.25, -29.319580078125, -28.38916015625, -27.458740234375, -26.5283203125, -25.597900390625, -24.66748046875, -23.737060546875, -22.806640625, -21.876220703125, -20.94580078125, -20.015380859375, -19.0849609375, -18.154541015625, -17.22412109375, -16.293701171875, -15.36328125, -14.432861328125, -13.50244140625, -12.572021484375, -11.6416015625, -10.711181640625, -9.78076171875, -8.850341796875, -7.919921875, -6.989501953125, -6.05908203125, -5.128662109375, -4.1982421875, -3.267822265625, -2.33740234375, -1.406982421875, -0.4765625, 0.453857421875, 1.38427734375, 2.314697265625, 3.2451171875, 4.175537109375, 5.10595703125, 6.036376953125, 6.966796875, 7.897216796875, 8.82763671875, 9.758056640625, 10.6884765625, 11.618896484375, 12.54931640625, 13.479736328125, 14.41015625, 15.340576171875, 16.27099609375, 17.201416015625, 18.1318359375, 19.062255859375, 19.99267578125, 20.923095703125, 21.853515625, 22.783935546875, 23.71435546875, 24.644775390625, 25.5751953125, 26.505615234375, 27.43603515625, 28.366455078125, 29.296875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 15.0, 219.0, 633.0, 135.0, 15.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.684745788574219, -5.3429388999938965, -3.001132011413574, -0.659325122833252, 1.6824817657470703, 4.024288177490234, 6.366095542907715, 8.707902908325195, 11.04970932006836, 13.391515731811523, 15.733323097229004, 18.075130462646484, 20.41693687438965, 22.758743286132812, 25.10055160522461, 27.442358016967773, 29.784164428710938, 32.125972747802734, 34.467777252197266, 36.80958557128906, 39.151390075683594, 41.49319839477539, 43.83500671386719, 46.17681121826172, 48.518619537353516, 50.86042785644531, 53.202232360839844, 55.54404067993164, 57.88584899902344, 60.22765350341797, 62.569461822509766, 64.91127014160156, 67.25308227539062, 69.59488677978516, 71.93669891357422, 74.27850341796875, 76.62030792236328, 78.96211242675781, 81.30392456054688, 83.6457290649414, 85.98753356933594, 88.32933807373047, 90.67115020751953, 93.01295471191406, 95.3547592163086, 97.69656372070312, 100.03837585449219, 102.38018035888672, 104.72199249267578, 107.06379699707031, 109.40560913085938, 111.7474136352539, 114.08921813964844, 116.4310302734375, 118.77283477783203, 121.11463928222656, 123.45645141601562, 125.79825592041016, 128.1400604248047, 130.48187255859375, 132.8236846923828, 135.1654815673828, 137.50729370117188, 139.84910583496094, 142.19090270996094]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 7.0, 5.0, 8.0, 5.0, 14.0, 26.0, 16.0, 16.0, 21.0, 23.0, 30.0, 31.0, 37.0, 44.0, 23.0, 37.0, 48.0, 32.0, 48.0, 37.0, 48.0, 35.0, 38.0, 47.0, 42.0, 29.0, 37.0, 28.0, 28.0, 29.0, 24.0, 22.0, 9.0, 11.0, 14.0, 12.0, 5.0, 4.0, 10.0, 14.0, 6.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0], "bins": [-27.12782096862793, -26.352937698364258, -25.578054428100586, -24.80316925048828, -24.02828598022461, -23.253402709960938, -22.478519439697266, -21.703636169433594, -20.928752899169922, -20.15386962890625, -19.378986358642578, -18.604103088378906, -17.8292179107666, -17.05433464050293, -16.279451370239258, -15.504568099975586, -14.729682922363281, -13.95479965209961, -13.179915428161621, -12.40503215789795, -11.630147933959961, -10.855264663696289, -10.080381393432617, -9.305498123168945, -8.530613899230957, -7.755730152130127, -6.980846405029297, -6.205963134765625, -5.431079387664795, -4.656195640563965, -3.881312370300293, -3.106428623199463, -2.3315467834472656, -1.556663155555725, -0.7817795276641846, -0.006896018981933594, 0.7679877281188965, 1.5428714752197266, 2.3177547454833984, 3.0926384925842285, 3.8675222396850586, 4.642405986785889, 5.417289733886719, 6.192173004150391, 6.967056751251221, 7.741940498352051, 8.516823768615723, 9.291707992553711, 10.066591262817383, 10.841474533081055, 11.616358757019043, 12.391242027282715, 13.166126251220703, 13.941009521484375, 14.715892791748047, 15.490776062011719, 16.26565933227539, 17.040542602539062, 17.815425872802734, 18.590309143066406, 19.36519432067871, 20.140077590942383, 20.914960861206055, 21.689844131469727, 22.46472930908203]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 2.0, 8.0, 14.0, 11.0, 28.0, 36.0, 40.0, 58.0, 91.0, 113.0, 116.0, 138.0, 102.0, 79.0, 57.0, 34.0, 22.0, 18.0, 10.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.10546875, -4.969482421875, -4.83349609375, -4.697509765625, -4.5615234375, -4.425537109375, -4.28955078125, -4.153564453125, -4.017578125, -3.881591796875, -3.74560546875, -3.609619140625, -3.4736328125, -3.337646484375, -3.20166015625, -3.065673828125, -2.9296875, -2.793701171875, -2.65771484375, -2.521728515625, -2.3857421875, -2.249755859375, -2.11376953125, -1.977783203125, -1.841796875, -1.705810546875, -1.56982421875, -1.433837890625, -1.2978515625, -1.161865234375, -1.02587890625, -0.889892578125, -0.75390625, -0.617919921875, -0.48193359375, -0.345947265625, -0.2099609375, -0.073974609375, 0.06201171875, 0.197998046875, 0.333984375, 0.469970703125, 0.60595703125, 0.741943359375, 0.8779296875, 1.013916015625, 1.14990234375, 1.285888671875, 1.421875, 1.557861328125, 1.69384765625, 1.829833984375, 1.9658203125, 2.101806640625, 2.23779296875, 2.373779296875, 2.509765625, 2.645751953125, 2.78173828125, 2.917724609375, 3.0537109375, 3.189697265625, 3.32568359375, 3.461669921875, 3.59765625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 11.0, 9.0, 12.0, 27.0, 28.0, 59.0, 92.0, 158.0, 212.0, 540.0, 1289.0, 4332.0, 61982.0, 4104052.0, 17378.0, 2580.0, 780.0, 328.0, 160.0, 89.0, 53.0, 37.0, 18.0, 9.0, 14.0, 7.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.75, -41.60498046875, -40.4599609375, -39.31494140625, -38.169921875, -37.02490234375, -35.8798828125, -34.73486328125, -33.58984375, -32.44482421875, -31.2998046875, -30.15478515625, -29.009765625, -27.86474609375, -26.7197265625, -25.57470703125, -24.4296875, -23.28466796875, -22.1396484375, -20.99462890625, -19.849609375, -18.70458984375, -17.5595703125, -16.41455078125, -15.26953125, -14.12451171875, -12.9794921875, -11.83447265625, -10.689453125, -9.54443359375, -8.3994140625, -7.25439453125, -6.109375, -4.96435546875, -3.8193359375, -2.67431640625, -1.529296875, -0.38427734375, 0.7607421875, 1.90576171875, 3.05078125, 4.19580078125, 5.3408203125, 6.48583984375, 7.630859375, 8.77587890625, 9.9208984375, 11.06591796875, 12.2109375, 13.35595703125, 14.5009765625, 15.64599609375, 16.791015625, 17.93603515625, 19.0810546875, 20.22607421875, 21.37109375, 22.51611328125, 23.6611328125, 24.80615234375, 25.951171875, 27.09619140625, 28.2412109375, 29.38623046875, 30.53125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 6.0, 13.0, 8.0, 15.0, 19.0, 25.0, 32.0, 48.0, 98.0, 107.0, 210.0, 304.0, 550.0, 799.0, 665.0, 399.0, 251.0, 162.0, 105.0, 60.0, 46.0, 30.0, 24.0, 18.0, 7.0, 12.0, 8.0, 7.0, 10.0, 3.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.890625, -7.6336669921875, -7.376708984375, -7.1197509765625, -6.86279296875, -6.6058349609375, -6.348876953125, -6.0919189453125, -5.8349609375, -5.5780029296875, -5.321044921875, -5.0640869140625, -4.80712890625, -4.5501708984375, -4.293212890625, -4.0362548828125, -3.779296875, -3.5223388671875, -3.265380859375, -3.0084228515625, -2.75146484375, -2.4945068359375, -2.237548828125, -1.9805908203125, -1.7236328125, -1.4666748046875, -1.209716796875, -0.9527587890625, -0.69580078125, -0.4388427734375, -0.181884765625, 0.0750732421875, 0.33203125, 0.5889892578125, 0.845947265625, 1.1029052734375, 1.35986328125, 1.6168212890625, 1.873779296875, 2.1307373046875, 2.3876953125, 2.6446533203125, 2.901611328125, 3.1585693359375, 3.41552734375, 3.6724853515625, 3.929443359375, 4.1864013671875, 4.443359375, 4.7003173828125, 4.957275390625, 5.2142333984375, 5.47119140625, 5.7281494140625, 5.985107421875, 6.2420654296875, 6.4990234375, 6.7559814453125, 7.012939453125, 7.2698974609375, 7.52685546875, 7.7838134765625, 8.040771484375, 8.2977294921875, 8.5546875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 6.0, 15.0, 17.0, 18.0, 56.0, 74.0, 113.0, 178.0, 335.0, 525.0, 942.0, 1678.0, 3245.0, 6484.0, 14236.0, 38563.0, 151931.0, 1371988.0, 2287519.0, 232318.0, 50384.0, 17758.0, 7684.0, 3695.0, 1892.0, 1073.0, 614.0, 354.0, 224.0, 119.0, 92.0, 42.0, 31.0, 22.0, 17.0, 16.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.5859375, -11.236083984375, -10.88623046875, -10.536376953125, -10.1865234375, -9.836669921875, -9.48681640625, -9.136962890625, -8.787109375, -8.437255859375, -8.08740234375, -7.737548828125, -7.3876953125, -7.037841796875, -6.68798828125, -6.338134765625, -5.98828125, -5.638427734375, -5.28857421875, -4.938720703125, -4.5888671875, -4.239013671875, -3.88916015625, -3.539306640625, -3.189453125, -2.839599609375, -2.48974609375, -2.139892578125, -1.7900390625, -1.440185546875, -1.09033203125, -0.740478515625, -0.390625, -0.040771484375, 0.30908203125, 0.658935546875, 1.0087890625, 1.358642578125, 1.70849609375, 2.058349609375, 2.408203125, 2.758056640625, 3.10791015625, 3.457763671875, 3.8076171875, 4.157470703125, 4.50732421875, 4.857177734375, 5.20703125, 5.556884765625, 5.90673828125, 6.256591796875, 6.6064453125, 6.956298828125, 7.30615234375, 7.656005859375, 8.005859375, 8.355712890625, 8.70556640625, 9.055419921875, 9.4052734375, 9.755126953125, 10.10498046875, 10.454833984375, 10.8046875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 22.0, 74.0, 284.0, 400.0, 175.0, 45.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.34567642211914, -32.80447769165039, -29.263277053833008, -25.722076416015625, -22.180877685546875, -18.639678955078125, -15.098478317260742, -11.55727767944336, -8.01607894897461, -4.474879264831543, -0.9336795806884766, 2.60752010345459, 6.148719787597656, 9.689918518066406, 13.231119155883789, 16.772319793701172, 20.313518524169922, 23.854717254638672, 27.395917892456055, 30.937118530273438, 34.47831726074219, 38.01951599121094, 41.56071472167969, 45.1019172668457, 48.64311599731445, 52.1843147277832, 55.72551727294922, 59.26671600341797, 62.80791473388672, 66.34911346435547, 69.89031219482422, 73.4315185546875, 76.97271728515625, 80.513916015625, 84.05511474609375, 87.5963134765625, 91.13751220703125, 94.6787109375, 98.21991729736328, 101.76111602783203, 105.30231475830078, 108.84351348876953, 112.38471221923828, 115.92591094970703, 119.46711730957031, 123.00831604003906, 126.54951477050781, 130.09071350097656, 133.6319122314453, 137.17311096191406, 140.7143096923828, 144.25550842285156, 147.7967071533203, 151.33790588378906, 154.8791046142578, 158.42031860351562, 161.96151733398438, 165.50271606445312, 169.04391479492188, 172.58511352539062, 176.12631225585938, 179.66751098632812, 183.20870971679688, 186.74990844726562, 190.29110717773438]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 5.0, 3.0, 6.0, 3.0, 12.0, 13.0, 12.0, 14.0, 18.0, 17.0, 31.0, 26.0, 28.0, 31.0, 24.0, 28.0, 39.0, 27.0, 36.0, 43.0, 30.0, 38.0, 47.0, 35.0, 39.0, 32.0, 35.0, 36.0, 28.0, 28.0, 27.0, 22.0, 23.0, 24.0, 15.0, 22.0, 14.0, 23.0, 13.0, 8.0, 15.0, 8.0, 2.0, 6.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 4.0], "bins": [-26.044818878173828, -25.298988342285156, -24.553159713745117, -23.807329177856445, -23.061498641967773, -22.315670013427734, -21.569839477539062, -20.82400894165039, -20.07818031311035, -19.33234977722168, -18.58652114868164, -17.84069061279297, -17.094860076904297, -16.349031448364258, -15.603200912475586, -14.85737133026123, -14.111540794372559, -13.365711212158203, -12.619880676269531, -11.874051094055176, -11.12822151184082, -10.382390975952148, -9.636561393737793, -8.890731811523438, -8.144901275634766, -7.399071216583252, -6.6532416343688965, -5.907411575317383, -5.161581993103027, -4.415751934051514, -3.669921875, -2.9240922927856445, -2.178262710571289, -1.4324328899383545, -0.6866029500961304, 0.05922698974609375, 0.8050568103790283, 1.550886631011963, 2.2967166900634766, 3.042546272277832, 3.7883763313293457, 4.534206390380859, 5.280035972595215, 6.0258660316467285, 6.771696090698242, 7.517525672912598, 8.263355255126953, 9.009185791015625, 9.75501537322998, 10.500844955444336, 11.246675491333008, 11.992505073547363, 12.738334655761719, 13.48416519165039, 14.229994773864746, 14.975824356079102, 15.721654891967773, 16.467485427856445, 17.213314056396484, 17.959144592285156, 18.704975128173828, 19.450803756713867, 20.19663429260254, 20.942462921142578, 21.68829345703125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 8.0, 20.0, 22.0, 22.0, 39.0, 62.0, 83.0, 88.0, 123.0, 103.0, 115.0, 90.0, 57.0, 66.0, 29.0, 25.0, 12.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8046875, -4.675201416015625, -4.54571533203125, -4.416229248046875, -4.2867431640625, -4.157257080078125, -4.02777099609375, -3.898284912109375, -3.768798828125, -3.639312744140625, -3.50982666015625, -3.380340576171875, -3.2508544921875, -3.121368408203125, -2.99188232421875, -2.862396240234375, -2.73291015625, -2.603424072265625, -2.47393798828125, -2.344451904296875, -2.2149658203125, -2.085479736328125, -1.95599365234375, -1.826507568359375, -1.697021484375, -1.567535400390625, -1.43804931640625, -1.308563232421875, -1.1790771484375, -1.049591064453125, -0.92010498046875, -0.790618896484375, -0.6611328125, -0.531646728515625, -0.40216064453125, -0.272674560546875, -0.1431884765625, -0.013702392578125, 0.11578369140625, 0.245269775390625, 0.374755859375, 0.504241943359375, 0.63372802734375, 0.763214111328125, 0.8927001953125, 1.022186279296875, 1.15167236328125, 1.281158447265625, 1.41064453125, 1.540130615234375, 1.66961669921875, 1.799102783203125, 1.9285888671875, 2.058074951171875, 2.18756103515625, 2.317047119140625, 2.446533203125, 2.576019287109375, 2.70550537109375, 2.834991455078125, 2.9644775390625, 3.093963623046875, 3.22344970703125, 3.352935791015625, 3.482421875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 6.0, 4.0, 8.0, 15.0, 9.0, 32.0, 42.0, 51.0, 52.0, 82.0, 103.0, 151.0, 267.0, 367.0, 525.0, 797.0, 1349.0, 2198.0, 3827.0, 7414.0, 16832.0, 46359.0, 181476.0, 588692.0, 131660.0, 36997.0, 13984.0, 6540.0, 3306.0, 1903.0, 1133.0, 780.0, 534.0, 324.0, 199.0, 143.0, 103.0, 68.0, 62.0, 35.0, 30.0, 24.0, 14.0, 14.0, 13.0, 9.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2049560546875, -0.1982135772705078, -0.19147109985351562, -0.18472862243652344, -0.17798614501953125, -0.17124366760253906, -0.16450119018554688, -0.1577587127685547, -0.1510162353515625, -0.1442737579345703, -0.13753128051757812, -0.13078880310058594, -0.12404632568359375, -0.11730384826660156, -0.11056137084960938, -0.10381889343261719, -0.097076416015625, -0.09033393859863281, -0.08359146118164062, -0.07684898376464844, -0.07010650634765625, -0.06336402893066406, -0.056621551513671875, -0.04987907409667969, -0.0431365966796875, -0.03639411926269531, -0.029651641845703125, -0.022909164428710938, -0.01616668701171875, -0.009424209594726562, -0.002681732177734375, 0.0040607452392578125, 0.01080322265625, 0.017545700073242188, 0.024288177490234375, 0.031030654907226562, 0.03777313232421875, 0.04451560974121094, 0.051258087158203125, 0.05800056457519531, 0.0647430419921875, 0.07148551940917969, 0.07822799682617188, 0.08497047424316406, 0.09171295166015625, 0.09845542907714844, 0.10519790649414062, 0.11194038391113281, 0.118682861328125, 0.1254253387451172, 0.13216781616210938, 0.13891029357910156, 0.14565277099609375, 0.15239524841308594, 0.15913772583007812, 0.1658802032470703, 0.1726226806640625, 0.1793651580810547, 0.18610763549804688, 0.19285011291503906, 0.19959259033203125, 0.20633506774902344, 0.21307754516601562, 0.2198200225830078, 0.2265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 13.0, 12.0, 12.0, 18.0, 20.0, 20.0, 26.0, 22.0, 20.0, 35.0, 31.0, 32.0, 37.0, 37.0, 39.0, 38.0, 32.0, 1060.0, 32.0, 32.0, 35.0, 33.0, 27.0, 38.0, 44.0, 34.0, 37.0, 20.0, 20.0, 27.0, 18.0, 22.0, 18.0, 9.0, 12.0, 9.0, 10.0, 5.0, 7.0, 3.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.376953125, -2.306732177734375, -2.23651123046875, -2.166290283203125, -2.0960693359375, -2.025848388671875, -1.95562744140625, -1.885406494140625, -1.815185546875, -1.744964599609375, -1.67474365234375, -1.604522705078125, -1.5343017578125, -1.464080810546875, -1.39385986328125, -1.323638916015625, -1.25341796875, -1.183197021484375, -1.11297607421875, -1.042755126953125, -0.9725341796875, -0.902313232421875, -0.83209228515625, -0.761871337890625, -0.691650390625, -0.621429443359375, -0.55120849609375, -0.480987548828125, -0.4107666015625, -0.340545654296875, -0.27032470703125, -0.200103759765625, -0.1298828125, -0.059661865234375, 0.01055908203125, 0.080780029296875, 0.1510009765625, 0.221221923828125, 0.29144287109375, 0.361663818359375, 0.431884765625, 0.502105712890625, 0.57232666015625, 0.642547607421875, 0.7127685546875, 0.782989501953125, 0.85321044921875, 0.923431396484375, 0.99365234375, 1.063873291015625, 1.13409423828125, 1.204315185546875, 1.2745361328125, 1.344757080078125, 1.41497802734375, 1.485198974609375, 1.555419921875, 1.625640869140625, 1.69586181640625, 1.766082763671875, 1.8363037109375, 1.906524658203125, 1.97674560546875, 2.046966552734375, 2.1171875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 13.0, 10.0, 10.0, 21.0, 43.0, 41.0, 62.0, 109.0, 139.0, 199.0, 345.0, 461.0, 657.0, 936.0, 1271.0, 1833.0, 2761.0, 3935.0, 5677.0, 8311.0, 12076.0, 18168.0, 27051.0, 41447.0, 65742.0, 110464.0, 1106326.0, 395159.0, 107412.0, 64158.0, 40583.0, 26325.0, 17551.0, 11885.0, 8118.0, 5376.0, 3782.0, 2649.0, 1794.0, 1311.0, 882.0, 623.0, 402.0, 307.0, 214.0, 156.0, 104.0, 80.0, 52.0, 28.0, 34.0, 20.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.057098388671875, -0.05525493621826172, -0.05341148376464844, -0.051568031311035156, -0.049724578857421875, -0.047881126403808594, -0.04603767395019531, -0.04419422149658203, -0.04235076904296875, -0.04050731658935547, -0.03866386413574219, -0.036820411682128906, -0.034976959228515625, -0.033133506774902344, -0.03129005432128906, -0.02944660186767578, -0.0276031494140625, -0.02575969696044922, -0.023916244506835938, -0.022072792053222656, -0.020229339599609375, -0.018385887145996094, -0.016542434692382812, -0.014698982238769531, -0.01285552978515625, -0.011012077331542969, -0.009168624877929688, -0.007325172424316406, -0.005481719970703125, -0.0036382675170898438, -0.0017948150634765625, 4.863739013671875e-05, 0.00189208984375, 0.0037355422973632812, 0.0055789947509765625, 0.007422447204589844, 0.009265899658203125, 0.011109352111816406, 0.012952804565429688, 0.014796257019042969, 0.01663970947265625, 0.01848316192626953, 0.020326614379882812, 0.022170066833496094, 0.024013519287109375, 0.025856971740722656, 0.027700424194335938, 0.02954387664794922, 0.0313873291015625, 0.03323078155517578, 0.03507423400878906, 0.036917686462402344, 0.038761138916015625, 0.040604591369628906, 0.04244804382324219, 0.04429149627685547, 0.04613494873046875, 0.04797840118408203, 0.04982185363769531, 0.051665306091308594, 0.053508758544921875, 0.055352210998535156, 0.05719566345214844, 0.05903911590576172, 0.060882568359375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 9.0, 4.0, 9.0, 13.0, 15.0, 6.0, 18.0, 21.0, 24.0, 28.0, 29.0, 38.0, 42.0, 56.0, 60.0, 57.0, 66.0, 51.0, 59.0, 48.0, 50.0, 53.0, 46.0, 34.0, 29.0, 25.0, 14.0, 20.0, 12.0, 12.0, 8.0, 13.0, 4.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003948211669921875, -0.0003816261887550354, -0.0003684312105178833, -0.0003552362322807312, -0.0003420412540435791, -0.000328846275806427, -0.0003156512975692749, -0.0003024563193321228, -0.0002892613410949707, -0.0002760663628578186, -0.0002628713846206665, -0.0002496764063835144, -0.0002364814281463623, -0.0002232864499092102, -0.0002100914716720581, -0.000196896493434906, -0.0001837015151977539, -0.0001705065369606018, -0.0001573115587234497, -0.0001441165804862976, -0.0001309216022491455, -0.00011772662401199341, -0.00010453164577484131, -9.133666753768921e-05, -7.814168930053711e-05, -6.494671106338501e-05, -5.175173282623291e-05, -3.855675458908081e-05, -2.536177635192871e-05, -1.2166798114776611e-05, 1.0281801223754883e-06, 1.4223158359527588e-05, 2.7418136596679688e-05, 4.061311483383179e-05, 5.380809307098389e-05, 6.700307130813599e-05, 8.019804954528809e-05, 9.339302778244019e-05, 0.00010658800601959229, 0.00011978298425674438, 0.00013297796249389648, 0.00014617294073104858, 0.00015936791896820068, 0.00017256289720535278, 0.00018575787544250488, 0.00019895285367965698, 0.00021214783191680908, 0.00022534281015396118, 0.00023853778839111328, 0.0002517327666282654, 0.0002649277448654175, 0.0002781227231025696, 0.0002913177013397217, 0.0003045126795768738, 0.0003177076578140259, 0.000330902636051178, 0.0003440976142883301, 0.0003572925925254822, 0.0003704875707626343, 0.0003836825489997864, 0.0003968775272369385, 0.0004100725054740906, 0.0004232674837112427, 0.0004364624619483948, 0.0004496574401855469]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 3.0, 3.0, 5.0, 7.0, 13.0, 14.0, 22.0, 22.0, 29.0, 37.0, 44.0, 42.0, 46.0, 80.0, 91.0, 97.0, 120.0, 149.0, 168.0, 417.0, 8932.0, 842230.0, 191900.0, 2847.0, 244.0, 193.0, 144.0, 124.0, 91.0, 82.0, 59.0, 52.0, 47.0, 37.0, 38.0, 27.0, 16.0, 27.0, 13.0, 9.0, 5.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006885528564453125, -0.006669342517852783, -0.006453156471252441, -0.0062369704246521, -0.006020784378051758, -0.005804598331451416, -0.005588412284851074, -0.005372226238250732, -0.005156040191650391, -0.004939854145050049, -0.004723668098449707, -0.004507482051849365, -0.0042912960052490234, -0.004075109958648682, -0.00385892391204834, -0.003642737865447998, -0.0034265518188476562, -0.0032103657722473145, -0.0029941797256469727, -0.002777993679046631, -0.002561807632446289, -0.0023456215858459473, -0.0021294355392456055, -0.0019132494926452637, -0.0016970634460449219, -0.00148087739944458, -0.0012646913528442383, -0.0010485053062438965, -0.0008323192596435547, -0.0006161332130432129, -0.0003999471664428711, -0.0001837611198425293, 3.24249267578125e-05, 0.0002486109733581543, 0.0004647970199584961, 0.0006809830665588379, 0.0008971691131591797, 0.0011133551597595215, 0.0013295412063598633, 0.001545727252960205, 0.0017619132995605469, 0.0019780993461608887, 0.0021942853927612305, 0.0024104714393615723, 0.002626657485961914, 0.002842843532562256, 0.0030590295791625977, 0.0032752156257629395, 0.0034914016723632812, 0.003707587718963623, 0.003923773765563965, 0.004139959812164307, 0.0043561458587646484, 0.00457233190536499, 0.004788517951965332, 0.005004703998565674, 0.005220890045166016, 0.005437076091766357, 0.005653262138366699, 0.005869448184967041, 0.006085634231567383, 0.006301820278167725, 0.006518006324768066, 0.006734192371368408, 0.00695037841796875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 96.0, 858.0, 56.0, 2.0, 0.0, 1.0], "bins": [-0.007806016132235527, -0.007674674037843943, -0.007543331943452358, -0.007411989849060774, -0.0072806477546691895, -0.007149305660277605, -0.007017963565886021, -0.006886621471494436, -0.006755279377102852, -0.0066239372827112675, -0.006492595188319683, -0.006361253093928099, -0.006229910999536514, -0.00609856890514493, -0.0059672268107533455, -0.005835884716361761, -0.005704542621970177, -0.005573200527578592, -0.005441858433187008, -0.0053105163387954235, -0.005179174244403839, -0.005047832150012255, -0.00491649005562067, -0.004785147961229086, -0.004653806332498789, -0.0045224642381072044, -0.00439112214371562, -0.004259780049324036, -0.004128437954932451, -0.003997095860540867, -0.0038657537661492825, -0.003734411671757698, -0.0036030698101967573, -0.003471727715805173, -0.0033403856214135885, -0.003209043527022004, -0.0030777014326304197, -0.0029463593382388353, -0.0028150174766778946, -0.00268367538228631, -0.002552333287894726, -0.0024209911935031414, -0.002289649099111557, -0.0021583070047199726, -0.002026964910328388, -0.0018956228159368038, -0.0017642808379605412, -0.0016329387435689569, -0.0015015965327620506, -0.0013702544383704662, -0.0012389123439788818, -0.0011075702495872974, -0.000976228213403374, -0.0008448861190117896, -0.0007135440828278661, -0.0005822019884362817, -0.0004508599522523582, -0.0003195178578607738, -0.00018817579257301986, -5.683372728526592e-05, 7.450836710631847e-05, 0.00020585046149790287, 0.00033719249768182635, 0.00046853459207341075, 0.0005998766864649951]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 5.0, 8.0, 16.0, 11.0, 17.0, 22.0, 29.0, 36.0, 29.0, 43.0, 30.0, 45.0, 43.0, 58.0, 41.0, 47.0, 49.0, 56.0, 53.0, 50.0, 38.0, 43.0, 32.0, 32.0, 30.0, 23.0, 20.0, 20.0, 18.0, 12.0, 6.0, 8.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0004892349243164062, -0.0004763184115290642, -0.0004634018987417221, -0.00045048538595438004, -0.00043756887316703796, -0.0004246523603796959, -0.0004117358475923538, -0.00039881933480501175, -0.0003859028220176697, -0.0003729863092303276, -0.00036006979644298553, -0.00034715328365564346, -0.0003342367708683014, -0.0003213202580809593, -0.00030840374529361725, -0.0002954872325062752, -0.0002825707197189331, -0.00026965420693159103, -0.00025673769414424896, -0.0002438211813569069, -0.00023090466856956482, -0.00021798815578222275, -0.00020507164299488068, -0.0001921551302075386, -0.00017923861742019653, -0.00016632210463285446, -0.0001534055918455124, -0.00014048907905817032, -0.00012757256627082825, -0.00011465605348348618, -0.0001017395406961441, -8.882302790880203e-05, -7.590651512145996e-05, -6.299000233411789e-05, -5.007348954677582e-05, -3.7156976759433746e-05, -2.4240463972091675e-05, -1.1323951184749603e-05, 1.5925616025924683e-06, 1.450907438993454e-05, 2.742558717727661e-05, 4.034209996461868e-05, 5.3258612751960754e-05, 6.617512553930283e-05, 7.90916383266449e-05, 9.200815111398697e-05, 0.00010492466390132904, 0.00011784117668867111, 0.00013075768947601318, 0.00014367420226335526, 0.00015659071505069733, 0.0001695072278380394, 0.00018242374062538147, 0.00019534025341272354, 0.0002082567662000656, 0.00022117327898740768, 0.00023408979177474976, 0.00024700630456209183, 0.0002599228173494339, 0.00027283933013677597, 0.00028575584292411804, 0.0002986723557114601, 0.0003115888684988022, 0.00032450538128614426, 0.00033742189407348633]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 8.0, 20.0, 22.0, 22.0, 39.0, 62.0, 83.0, 88.0, 123.0, 103.0, 115.0, 90.0, 57.0, 66.0, 29.0, 25.0, 12.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8046875, -4.675201416015625, -4.54571533203125, -4.416229248046875, -4.2867431640625, -4.157257080078125, -4.02777099609375, -3.898284912109375, -3.768798828125, -3.639312744140625, -3.50982666015625, -3.380340576171875, -3.2508544921875, -3.121368408203125, -2.99188232421875, -2.862396240234375, -2.73291015625, -2.603424072265625, -2.47393798828125, -2.344451904296875, -2.2149658203125, -2.085479736328125, -1.95599365234375, -1.826507568359375, -1.697021484375, -1.567535400390625, -1.43804931640625, -1.308563232421875, -1.1790771484375, -1.049591064453125, -0.92010498046875, -0.790618896484375, -0.6611328125, -0.531646728515625, -0.40216064453125, -0.272674560546875, -0.1431884765625, -0.013702392578125, 0.11578369140625, 0.245269775390625, 0.374755859375, 0.504241943359375, 0.63372802734375, 0.763214111328125, 0.8927001953125, 1.022186279296875, 1.15167236328125, 1.281158447265625, 1.41064453125, 1.540130615234375, 1.66961669921875, 1.799102783203125, 1.9285888671875, 2.058074951171875, 2.18756103515625, 2.317047119140625, 2.446533203125, 2.576019287109375, 2.70550537109375, 2.834991455078125, 2.9644775390625, 3.093963623046875, 3.22344970703125, 3.352935791015625, 3.482421875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 7.0, 8.0, 11.0, 11.0, 11.0, 45.0, 61.0, 61.0, 125.0, 196.0, 331.0, 654.0, 1557.0, 4678.0, 19406.0, 111546.0, 588540.0, 267183.0, 40857.0, 8664.0, 2588.0, 955.0, 444.0, 209.0, 130.0, 79.0, 53.0, 36.0, 25.0, 23.0, 13.0, 8.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.1328125, -4.9891357421875, -4.845458984375, -4.7017822265625, -4.55810546875, -4.4144287109375, -4.270751953125, -4.1270751953125, -3.9833984375, -3.8397216796875, -3.696044921875, -3.5523681640625, -3.40869140625, -3.2650146484375, -3.121337890625, -2.9776611328125, -2.833984375, -2.6903076171875, -2.546630859375, -2.4029541015625, -2.25927734375, -2.1156005859375, -1.971923828125, -1.8282470703125, -1.6845703125, -1.5408935546875, -1.397216796875, -1.2535400390625, -1.10986328125, -0.9661865234375, -0.822509765625, -0.6788330078125, -0.53515625, -0.3914794921875, -0.247802734375, -0.1041259765625, 0.03955078125, 0.1832275390625, 0.326904296875, 0.4705810546875, 0.6142578125, 0.7579345703125, 0.901611328125, 1.0452880859375, 1.18896484375, 1.3326416015625, 1.476318359375, 1.6199951171875, 1.763671875, 1.9073486328125, 2.051025390625, 2.1947021484375, 2.33837890625, 2.4820556640625, 2.625732421875, 2.7694091796875, 2.9130859375, 3.0567626953125, 3.200439453125, 3.3441162109375, 3.48779296875, 3.6314697265625, 3.775146484375, 3.9188232421875, 4.0625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 9.0, 9.0, 12.0, 23.0, 19.0, 20.0, 23.0, 20.0, 29.0, 28.0, 33.0, 30.0, 34.0, 48.0, 48.0, 99.0, 239.0, 1621.0, 217.0, 71.0, 53.0, 46.0, 43.0, 36.0, 25.0, 32.0, 37.0, 22.0, 16.0, 26.0, 16.0, 19.0, 11.0, 8.0, 6.0, 8.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.7109375, -8.4652099609375, -8.219482421875, -7.9737548828125, -7.72802734375, -7.4822998046875, -7.236572265625, -6.9908447265625, -6.7451171875, -6.4993896484375, -6.253662109375, -6.0079345703125, -5.76220703125, -5.5164794921875, -5.270751953125, -5.0250244140625, -4.779296875, -4.5335693359375, -4.287841796875, -4.0421142578125, -3.79638671875, -3.5506591796875, -3.304931640625, -3.0592041015625, -2.8134765625, -2.5677490234375, -2.322021484375, -2.0762939453125, -1.83056640625, -1.5848388671875, -1.339111328125, -1.0933837890625, -0.84765625, -0.6019287109375, -0.356201171875, -0.1104736328125, 0.13525390625, 0.3809814453125, 0.626708984375, 0.8724365234375, 1.1181640625, 1.3638916015625, 1.609619140625, 1.8553466796875, 2.10107421875, 2.3468017578125, 2.592529296875, 2.8382568359375, 3.083984375, 3.3297119140625, 3.575439453125, 3.8211669921875, 4.06689453125, 4.3126220703125, 4.558349609375, 4.8040771484375, 5.0498046875, 5.2955322265625, 5.541259765625, 5.7869873046875, 6.03271484375, 6.2784423828125, 6.524169921875, 6.7698974609375, 7.015625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 7.0, 9.0, 11.0, 18.0, 20.0, 10.0, 25.0, 31.0, 30.0, 46.0, 35.0, 64.0, 92.0, 155.0, 321.0, 925.0, 17596.0, 3073751.0, 50268.0, 1298.0, 371.0, 184.0, 94.0, 79.0, 46.0, 33.0, 27.0, 28.0, 22.0, 21.0, 20.0, 15.0, 15.0, 13.0, 9.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.8797607421875, -13.376708984375, -12.8736572265625, -12.37060546875, -11.8675537109375, -11.364501953125, -10.8614501953125, -10.3583984375, -9.8553466796875, -9.352294921875, -8.8492431640625, -8.34619140625, -7.8431396484375, -7.340087890625, -6.8370361328125, -6.333984375, -5.8309326171875, -5.327880859375, -4.8248291015625, -4.32177734375, -3.8187255859375, -3.315673828125, -2.8126220703125, -2.3095703125, -1.8065185546875, -1.303466796875, -0.8004150390625, -0.29736328125, 0.2056884765625, 0.708740234375, 1.2117919921875, 1.71484375, 2.2178955078125, 2.720947265625, 3.2239990234375, 3.72705078125, 4.2301025390625, 4.733154296875, 5.2362060546875, 5.7392578125, 6.2423095703125, 6.745361328125, 7.2484130859375, 7.75146484375, 8.2545166015625, 8.757568359375, 9.2606201171875, 9.763671875, 10.2667236328125, 10.769775390625, 11.2728271484375, 11.77587890625, 12.2789306640625, 12.781982421875, 13.2850341796875, 13.7880859375, 14.2911376953125, 14.794189453125, 15.2972412109375, 15.80029296875, 16.3033447265625, 16.806396484375, 17.3094482421875, 17.8125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 8.0, 1004.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.908605575561523, -8.04853630065918, -2.1884679794311523, 3.671600341796875, 9.531669616699219, 15.391738891601562, 21.251806259155273, 27.111875534057617, 32.971946716308594, 38.83201599121094, 44.69208526611328, 50.552154541015625, 56.41222381591797, 62.27229309082031, 68.13235473632812, 73.992431640625, 79.85249328613281, 85.71256256103516, 91.5726318359375, 97.43270111083984, 103.29277038574219, 109.15283966064453, 115.01290893554688, 120.87297058105469, 126.73304748535156, 132.59310913085938, 138.45318603515625, 144.31324768066406, 150.17332458496094, 156.03338623046875, 161.89346313476562, 167.75352478027344, 173.6136016845703, 179.47366333007812, 185.333740234375, 191.1938018798828, 197.0538787841797, 202.9139404296875, 208.77401733398438, 214.6340789794922, 220.49415588378906, 226.35421752929688, 232.21429443359375, 238.07435607910156, 243.93443298339844, 249.79449462890625, 255.65457153320312, 261.5146484375, 267.37469482421875, 273.2347717285156, 279.0948181152344, 284.95489501953125, 290.8149719238281, 296.675048828125, 302.53509521484375, 308.3951721191406, 314.2552490234375, 320.1153259277344, 325.9753723144531, 331.83544921875, 337.6955261230469, 343.55560302734375, 349.4156494140625, 355.2757263183594, 361.13580322265625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 6.0, 8.0, 3.0, 9.0, 16.0, 16.0, 20.0, 22.0, 27.0, 37.0, 36.0, 34.0, 38.0, 27.0, 32.0, 51.0, 35.0, 49.0, 53.0, 45.0, 45.0, 38.0, 39.0, 38.0, 35.0, 46.0, 30.0, 25.0, 19.0, 21.0, 18.0, 19.0, 11.0, 12.0, 6.0, 5.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-28.132755279541016, -27.32994842529297, -26.527141571044922, -25.724334716796875, -24.921525955200195, -24.11871910095215, -23.3159122467041, -22.513105392456055, -21.710298538208008, -20.90749168395996, -20.104684829711914, -19.301876068115234, -18.499069213867188, -17.69626235961914, -16.893455505371094, -16.090648651123047, -15.287840843200684, -14.485033988952637, -13.682226181030273, -12.879419326782227, -12.07661247253418, -11.273805618286133, -10.47099781036377, -9.668190956115723, -8.86538314819336, -8.062576293945312, -7.259768962860107, -6.456961631774902, -5.6541547775268555, -4.85134744644165, -4.048540115356445, -3.2457332611083984, -2.4429264068603516, -1.6401193141937256, -0.8373121023178101, -0.03450489044189453, 0.7683022022247314, 1.5711092948913574, 2.3739166259765625, 3.1767234802246094, 3.9795308113098145, 4.7823381423950195, 5.585144996643066, 6.3879523277282715, 7.190759658813477, 7.993566513061523, 8.79637336730957, 9.599180221557617, 10.40198802947998, 11.204794883728027, 12.00760269165039, 12.810409545898438, 13.613216400146484, 14.416023254394531, 15.218831062316895, 16.021636962890625, 16.824445724487305, 17.62725257873535, 18.4300594329834, 19.232868194580078, 20.035675048828125, 20.838481903076172, 21.64128875732422, 22.444095611572266, 23.246902465820312]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 4.0, 4.0, 11.0, 16.0, 25.0, 26.0, 43.0, 63.0, 77.0, 87.0, 123.0, 99.0, 114.0, 94.0, 59.0, 60.0, 34.0, 19.0, 15.0, 11.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8125, -4.682647705078125, -4.55279541015625, -4.422943115234375, -4.2930908203125, -4.163238525390625, -4.03338623046875, -3.903533935546875, -3.773681640625, -3.643829345703125, -3.51397705078125, -3.384124755859375, -3.2542724609375, -3.124420166015625, -2.99456787109375, -2.864715576171875, -2.73486328125, -2.605010986328125, -2.47515869140625, -2.345306396484375, -2.2154541015625, -2.085601806640625, -1.95574951171875, -1.825897216796875, -1.696044921875, -1.566192626953125, -1.43634033203125, -1.306488037109375, -1.1766357421875, -1.046783447265625, -0.91693115234375, -0.787078857421875, -0.6572265625, -0.527374267578125, -0.39752197265625, -0.267669677734375, -0.1378173828125, -0.007965087890625, 0.12188720703125, 0.251739501953125, 0.381591796875, 0.511444091796875, 0.64129638671875, 0.771148681640625, 0.9010009765625, 1.030853271484375, 1.16070556640625, 1.290557861328125, 1.42041015625, 1.550262451171875, 1.68011474609375, 1.809967041015625, 1.9398193359375, 2.069671630859375, 2.19952392578125, 2.329376220703125, 2.459228515625, 2.589080810546875, 2.71893310546875, 2.848785400390625, 2.9786376953125, 3.108489990234375, 3.23834228515625, 3.368194580078125, 3.498046875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 10.0, 20.0, 13.0, 29.0, 35.0, 80.0, 107.0, 159.0, 347.0, 645.0, 1277.0, 3636.0, 18283.0, 2704388.0, 1444805.0, 15338.0, 3023.0, 1042.0, 471.0, 221.0, 150.0, 73.0, 35.0, 31.0, 23.0, 13.0, 5.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.875, -24.201904296875, -23.52880859375, -22.855712890625, -22.1826171875, -21.509521484375, -20.83642578125, -20.163330078125, -19.490234375, -18.817138671875, -18.14404296875, -17.470947265625, -16.7978515625, -16.124755859375, -15.45166015625, -14.778564453125, -14.10546875, -13.432373046875, -12.75927734375, -12.086181640625, -11.4130859375, -10.739990234375, -10.06689453125, -9.393798828125, -8.720703125, -8.047607421875, -7.37451171875, -6.701416015625, -6.0283203125, -5.355224609375, -4.68212890625, -4.009033203125, -3.3359375, -2.662841796875, -1.98974609375, -1.316650390625, -0.6435546875, 0.029541015625, 0.70263671875, 1.375732421875, 2.048828125, 2.721923828125, 3.39501953125, 4.068115234375, 4.7412109375, 5.414306640625, 6.08740234375, 6.760498046875, 7.43359375, 8.106689453125, 8.77978515625, 9.452880859375, 10.1259765625, 10.799072265625, 11.47216796875, 12.145263671875, 12.818359375, 13.491455078125, 14.16455078125, 14.837646484375, 15.5107421875, 16.183837890625, 16.85693359375, 17.530029296875, 18.203125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 14.0, 2.0, 16.0, 19.0, 11.0, 33.0, 39.0, 70.0, 71.0, 137.0, 223.0, 339.0, 498.0, 715.0, 627.0, 420.0, 288.0, 170.0, 116.0, 68.0, 54.0, 33.0, 26.0, 16.0, 14.0, 9.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1015625, -6.8629150390625, -6.624267578125, -6.3856201171875, -6.14697265625, -5.9083251953125, -5.669677734375, -5.4310302734375, -5.1923828125, -4.9537353515625, -4.715087890625, -4.4764404296875, -4.23779296875, -3.9991455078125, -3.760498046875, -3.5218505859375, -3.283203125, -3.0445556640625, -2.805908203125, -2.5672607421875, -2.32861328125, -2.0899658203125, -1.851318359375, -1.6126708984375, -1.3740234375, -1.1353759765625, -0.896728515625, -0.6580810546875, -0.41943359375, -0.1807861328125, 0.057861328125, 0.2965087890625, 0.53515625, 0.7738037109375, 1.012451171875, 1.2510986328125, 1.48974609375, 1.7283935546875, 1.967041015625, 2.2056884765625, 2.4443359375, 2.6829833984375, 2.921630859375, 3.1602783203125, 3.39892578125, 3.6375732421875, 3.876220703125, 4.1148681640625, 4.353515625, 4.5921630859375, 4.830810546875, 5.0694580078125, 5.30810546875, 5.5467529296875, 5.785400390625, 6.0240478515625, 6.2626953125, 6.5013427734375, 6.739990234375, 6.9786376953125, 7.21728515625, 7.4559326171875, 7.694580078125, 7.9332275390625, 8.171875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 5.0, 12.0, 26.0, 31.0, 41.0, 57.0, 86.0, 153.0, 287.0, 448.0, 851.0, 1699.0, 3508.0, 8250.0, 22829.0, 82200.0, 555135.0, 2847407.0, 550748.0, 82273.0, 22762.0, 8288.0, 3512.0, 1684.0, 832.0, 438.0, 258.0, 161.0, 86.0, 83.0, 43.0, 29.0, 22.0, 9.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-12.3125, -11.9449462890625, -11.577392578125, -11.2098388671875, -10.84228515625, -10.4747314453125, -10.107177734375, -9.7396240234375, -9.3720703125, -9.0045166015625, -8.636962890625, -8.2694091796875, -7.90185546875, -7.5343017578125, -7.166748046875, -6.7991943359375, -6.431640625, -6.0640869140625, -5.696533203125, -5.3289794921875, -4.96142578125, -4.5938720703125, -4.226318359375, -3.8587646484375, -3.4912109375, -3.1236572265625, -2.756103515625, -2.3885498046875, -2.02099609375, -1.6534423828125, -1.285888671875, -0.9183349609375, -0.55078125, -0.1832275390625, 0.184326171875, 0.5518798828125, 0.91943359375, 1.2869873046875, 1.654541015625, 2.0220947265625, 2.3896484375, 2.7572021484375, 3.124755859375, 3.4923095703125, 3.85986328125, 4.2274169921875, 4.594970703125, 4.9625244140625, 5.330078125, 5.6976318359375, 6.065185546875, 6.4327392578125, 6.80029296875, 7.1678466796875, 7.535400390625, 7.9029541015625, 8.2705078125, 8.6380615234375, 9.005615234375, 9.3731689453125, 9.74072265625, 10.1082763671875, 10.475830078125, 10.8433837890625, 11.2109375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 8.0, 25.0, 59.0, 145.0, 269.0, 278.0, 140.0, 67.0, 16.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.68810272216797, -21.9373779296875, -19.18665313720703, -16.43592643737793, -13.685201644897461, -10.934476852416992, -8.18375015258789, -5.433025360107422, -2.682300567626953, 0.06842470169067383, 2.819149971008301, 5.569875717163086, 8.320600509643555, 11.071325302124023, 13.822052001953125, 16.572776794433594, 19.323501586914062, 22.07422637939453, 24.824951171875, 27.5756778717041, 30.32640266418457, 33.077125549316406, 35.82785415649414, 38.57857894897461, 41.32930374145508, 44.08002853393555, 46.830753326416016, 49.58148193359375, 52.33220672607422, 55.08293151855469, 57.833656311035156, 60.584381103515625, 63.33509826660156, 66.08582305908203, 68.8365478515625, 71.58727264404297, 74.33799743652344, 77.0887222290039, 79.83944702148438, 82.59017944335938, 85.34089660644531, 88.09162139892578, 90.84234619140625, 93.59307098388672, 96.34379577636719, 99.09452056884766, 101.84524536132812, 104.59597778320312, 107.3467025756836, 110.09742736816406, 112.84815216064453, 115.598876953125, 118.34960174560547, 121.10032653808594, 123.85105895996094, 126.60177612304688, 129.35250854492188, 132.10324096679688, 134.8539581298828, 137.6046905517578, 140.35540771484375, 143.10614013671875, 145.8568572998047, 148.6075897216797, 151.35830688476562]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 4.0, 4.0, 10.0, 5.0, 4.0, 13.0, 15.0, 17.0, 18.0, 23.0, 26.0, 28.0, 34.0, 26.0, 29.0, 39.0, 38.0, 38.0, 40.0, 54.0, 34.0, 53.0, 47.0, 37.0, 43.0, 34.0, 38.0, 34.0, 34.0, 34.0, 19.0, 13.0, 28.0, 18.0, 14.0, 10.0, 14.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.430870056152344, -23.666580200195312, -22.90228843688965, -22.137998580932617, -21.373706817626953, -20.609416961669922, -19.84512710571289, -19.080835342407227, -18.316545486450195, -17.552255630493164, -16.7879638671875, -16.02367401123047, -15.259383201599121, -14.495092391967773, -13.730801582336426, -12.966510772705078, -12.20221996307373, -11.437929153442383, -10.673638343811035, -9.909347534179688, -9.145057678222656, -8.380766868591309, -7.616476058959961, -6.8521857261657715, -6.087894916534424, -5.323604106903076, -4.559313774108887, -3.795022964477539, -3.0307323932647705, -2.266441822052002, -1.5021510124206543, -0.7378606796264648, 0.026430130004882812, 0.7907207608222961, 1.5550113916397095, 2.3193020820617676, 3.083592653274536, 3.8478832244873047, 4.612174034118652, 5.376464366912842, 6.1407551765441895, 6.905045986175537, 7.669336318969727, 8.433627128601074, 9.197917938232422, 9.962207794189453, 10.726499557495117, 11.490789413452148, 12.255080223083496, 13.019371032714844, 13.783661842346191, 14.547952651977539, 15.31224250793457, 16.076534271240234, 16.840824127197266, 17.605113983154297, 18.36940574645996, 19.133695602416992, 19.897987365722656, 20.662277221679688, 21.42656898498535, 22.190858840942383, 22.955150604248047, 23.719440460205078, 24.48373031616211]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 27.0, 18.0, 45.0, 58.0, 53.0, 82.0, 88.0, 82.0, 114.0, 94.0, 81.0, 60.0, 55.0, 41.0, 22.0, 15.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.475860595703125, -4.35406494140625, -4.232269287109375, -4.1104736328125, -3.988677978515625, -3.86688232421875, -3.745086669921875, -3.623291015625, -3.501495361328125, -3.37969970703125, -3.257904052734375, -3.1361083984375, -3.014312744140625, -2.89251708984375, -2.770721435546875, -2.64892578125, -2.527130126953125, -2.40533447265625, -2.283538818359375, -2.1617431640625, -2.039947509765625, -1.91815185546875, -1.796356201171875, -1.674560546875, -1.552764892578125, -1.43096923828125, -1.309173583984375, -1.1873779296875, -1.065582275390625, -0.94378662109375, -0.821990966796875, -0.7001953125, -0.578399658203125, -0.45660400390625, -0.334808349609375, -0.2130126953125, -0.091217041015625, 0.03057861328125, 0.152374267578125, 0.274169921875, 0.395965576171875, 0.51776123046875, 0.639556884765625, 0.7613525390625, 0.883148193359375, 1.00494384765625, 1.126739501953125, 1.24853515625, 1.370330810546875, 1.49212646484375, 1.613922119140625, 1.7357177734375, 1.857513427734375, 1.97930908203125, 2.101104736328125, 2.222900390625, 2.344696044921875, 2.46649169921875, 2.588287353515625, 2.7100830078125, 2.831878662109375, 2.95367431640625, 3.075469970703125, 3.197265625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 5.0, 4.0, 15.0, 16.0, 27.0, 29.0, 42.0, 39.0, 67.0, 85.0, 149.0, 222.0, 292.0, 477.0, 731.0, 1197.0, 2001.0, 3578.0, 6876.0, 14968.0, 39481.0, 127508.0, 562265.0, 195822.0, 54302.0, 19796.0, 8379.0, 4176.0, 2291.0, 1286.0, 846.0, 498.0, 337.0, 236.0, 149.0, 97.0, 69.0, 55.0, 34.0, 25.0, 21.0, 20.0, 14.0, 5.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.215087890625, -0.20806884765625, -0.2010498046875, -0.19403076171875, -0.18701171875, -0.17999267578125, -0.1729736328125, -0.16595458984375, -0.158935546875, -0.15191650390625, -0.1448974609375, -0.13787841796875, -0.130859375, -0.12384033203125, -0.1168212890625, -0.10980224609375, -0.102783203125, -0.09576416015625, -0.0887451171875, -0.08172607421875, -0.07470703125, -0.06768798828125, -0.0606689453125, -0.05364990234375, -0.046630859375, -0.03961181640625, -0.0325927734375, -0.02557373046875, -0.0185546875, -0.01153564453125, -0.0045166015625, 0.00250244140625, 0.009521484375, 0.01654052734375, 0.0235595703125, 0.03057861328125, 0.03759765625, 0.04461669921875, 0.0516357421875, 0.05865478515625, 0.065673828125, 0.07269287109375, 0.0797119140625, 0.08673095703125, 0.09375, 0.10076904296875, 0.1077880859375, 0.11480712890625, 0.121826171875, 0.12884521484375, 0.1358642578125, 0.14288330078125, 0.14990234375, 0.15692138671875, 0.1639404296875, 0.17095947265625, 0.177978515625, 0.18499755859375, 0.1920166015625, 0.19903564453125, 0.2060546875, 0.21307373046875, 0.2200927734375, 0.22711181640625, 0.234130859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 3.0, 10.0, 8.0, 8.0, 15.0, 16.0, 17.0, 23.0, 25.0, 34.0, 24.0, 23.0, 35.0, 44.0, 36.0, 48.0, 39.0, 59.0, 1070.0, 34.0, 42.0, 26.0, 45.0, 45.0, 36.0, 36.0, 27.0, 32.0, 25.0, 26.0, 20.0, 21.0, 16.0, 17.0, 9.0, 6.0, 8.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.875, -2.797149658203125, -2.71929931640625, -2.641448974609375, -2.5635986328125, -2.485748291015625, -2.40789794921875, -2.330047607421875, -2.252197265625, -2.174346923828125, -2.09649658203125, -2.018646240234375, -1.9407958984375, -1.862945556640625, -1.78509521484375, -1.707244873046875, -1.62939453125, -1.551544189453125, -1.47369384765625, -1.395843505859375, -1.3179931640625, -1.240142822265625, -1.16229248046875, -1.084442138671875, -1.006591796875, -0.928741455078125, -0.85089111328125, -0.773040771484375, -0.6951904296875, -0.617340087890625, -0.53948974609375, -0.461639404296875, -0.3837890625, -0.305938720703125, -0.22808837890625, -0.150238037109375, -0.0723876953125, 0.005462646484375, 0.08331298828125, 0.161163330078125, 0.239013671875, 0.316864013671875, 0.39471435546875, 0.472564697265625, 0.5504150390625, 0.628265380859375, 0.70611572265625, 0.783966064453125, 0.86181640625, 0.939666748046875, 1.01751708984375, 1.095367431640625, 1.1732177734375, 1.251068115234375, 1.32891845703125, 1.406768798828125, 1.484619140625, 1.562469482421875, 1.64031982421875, 1.718170166015625, 1.7960205078125, 1.873870849609375, 1.95172119140625, 2.029571533203125, 2.107421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 11.0, 27.0, 32.0, 53.0, 82.0, 170.0, 213.0, 347.0, 576.0, 900.0, 1385.0, 2148.0, 3448.0, 5425.0, 8555.0, 13523.0, 21553.0, 35825.0, 60720.0, 111932.0, 1036662.0, 530396.0, 109881.0, 60367.0, 34968.0, 21682.0, 13417.0, 8378.0, 5206.0, 3355.0, 2162.0, 1371.0, 843.0, 542.0, 354.0, 220.0, 119.0, 102.0, 70.0, 38.0, 15.0, 25.0, 6.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06503105163574219, -0.06286239624023438, -0.06069374084472656, -0.05852508544921875, -0.05635643005371094, -0.054187774658203125, -0.05201911926269531, -0.0498504638671875, -0.04768180847167969, -0.045513153076171875, -0.04334449768066406, -0.04117584228515625, -0.03900718688964844, -0.036838531494140625, -0.03466987609863281, -0.032501220703125, -0.030332565307617188, -0.028163909912109375, -0.025995254516601562, -0.02382659912109375, -0.021657943725585938, -0.019489288330078125, -0.017320632934570312, -0.0151519775390625, -0.012983322143554688, -0.010814666748046875, -0.008646011352539062, -0.00647735595703125, -0.0043087005615234375, -0.002140045166015625, 2.86102294921875e-05, 0.002197265625, 0.0043659210205078125, 0.006534576416015625, 0.008703231811523438, 0.01087188720703125, 0.013040542602539062, 0.015209197998046875, 0.017377853393554688, 0.0195465087890625, 0.021715164184570312, 0.023883819580078125, 0.026052474975585938, 0.02822113037109375, 0.030389785766601562, 0.032558441162109375, 0.03472709655761719, 0.036895751953125, 0.03906440734863281, 0.041233062744140625, 0.04340171813964844, 0.04557037353515625, 0.04773902893066406, 0.049907684326171875, 0.05207633972167969, 0.0542449951171875, 0.05641365051269531, 0.058582305908203125, 0.06075096130371094, 0.06291961669921875, 0.06508827209472656, 0.06725692749023438, 0.06942558288574219, 0.07159423828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 7.0, 9.0, 2.0, 11.0, 8.0, 17.0, 14.0, 34.0, 36.0, 34.0, 64.0, 46.0, 79.0, 73.0, 91.0, 81.0, 69.0, 59.0, 69.0, 37.0, 34.0, 21.0, 24.0, 15.0, 22.0, 6.0, 13.0, 9.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007200241088867188, -0.0007008612155914307, -0.0006816983222961426, -0.0006625354290008545, -0.0006433725357055664, -0.0006242096424102783, -0.0006050467491149902, -0.0005858838558197021, -0.0005667209625244141, -0.000547558069229126, -0.0005283951759338379, -0.0005092322826385498, -0.0004900693893432617, -0.00047090649604797363, -0.00045174360275268555, -0.00043258070945739746, -0.0004134178161621094, -0.0003942549228668213, -0.0003750920295715332, -0.0003559291362762451, -0.00033676624298095703, -0.00031760334968566895, -0.00029844045639038086, -0.0002792775630950928, -0.0002601146697998047, -0.0002409517765045166, -0.00022178888320922852, -0.00020262598991394043, -0.00018346309661865234, -0.00016430020332336426, -0.00014513731002807617, -0.00012597441673278809, -0.0001068115234375, -8.764863014221191e-05, -6.848573684692383e-05, -4.932284355163574e-05, -3.0159950256347656e-05, -1.099705696105957e-05, 8.165836334228516e-06, 2.73287296295166e-05, 4.649162292480469e-05, 6.565451622009277e-05, 8.481740951538086e-05, 0.00010398030281066895, 0.00012314319610595703, 0.00014230608940124512, 0.0001614689826965332, 0.0001806318759918213, 0.00019979476928710938, 0.00021895766258239746, 0.00023812055587768555, 0.00025728344917297363, 0.0002764463424682617, 0.0002956092357635498, 0.0003147721290588379, 0.000333935022354126, 0.00035309791564941406, 0.00037226080894470215, 0.00039142370223999023, 0.0004105865955352783, 0.0004297494888305664, 0.0004489123821258545, 0.0004680752754211426, 0.00048723816871643066, 0.0005064010620117188]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 8.0, 11.0, 16.0, 22.0, 19.0, 40.0, 40.0, 48.0, 67.0, 91.0, 131.0, 207.0, 361.0, 2757.0, 116888.0, 910897.0, 15287.0, 811.0, 252.0, 146.0, 112.0, 83.0, 71.0, 48.0, 38.0, 23.0, 20.0, 13.0, 10.0, 11.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00897979736328125, -0.008672833442687988, -0.008365869522094727, -0.008058905601501465, -0.007751941680908203, -0.007444977760314941, -0.00713801383972168, -0.006831049919128418, -0.006524085998535156, -0.0062171220779418945, -0.005910158157348633, -0.005603194236755371, -0.005296230316162109, -0.004989266395568848, -0.004682302474975586, -0.004375338554382324, -0.0040683746337890625, -0.0037614107131958008, -0.003454446792602539, -0.0031474828720092773, -0.0028405189514160156, -0.002533555030822754, -0.002226591110229492, -0.0019196271896362305, -0.0016126632690429688, -0.001305699348449707, -0.0009987354278564453, -0.0006917715072631836, -0.0003848075866699219, -7.784366607666016e-05, 0.00022912025451660156, 0.0005360841751098633, 0.000843048095703125, 0.0011500120162963867, 0.0014569759368896484, 0.0017639398574829102, 0.002070903778076172, 0.0023778676986694336, 0.0026848316192626953, 0.002991795539855957, 0.0032987594604492188, 0.0036057233810424805, 0.003912687301635742, 0.004219651222229004, 0.004526615142822266, 0.004833579063415527, 0.005140542984008789, 0.005447506904602051, 0.0057544708251953125, 0.006061434745788574, 0.006368398666381836, 0.006675362586975098, 0.006982326507568359, 0.007289290428161621, 0.007596254348754883, 0.007903218269348145, 0.008210182189941406, 0.008517146110534668, 0.00882411003112793, 0.009131073951721191, 0.009438037872314453, 0.009745001792907715, 0.010051965713500977, 0.010358929634094238, 0.0106658935546875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 25.0, 124.0, 718.0, 132.0, 17.0, 2.0], "bins": [-0.009489239193499088, -0.00933240819722414, -0.009175577200949192, -0.009018746204674244, -0.008861915208399296, -0.008705084212124348, -0.0085482532158494, -0.008391422219574451, -0.008234591223299503, -0.008077760227024555, -0.007920929230749607, -0.007764098234474659, -0.007607267238199711, -0.007450436241924763, -0.007293605245649815, -0.0071367742493748665, -0.006979943253099918, -0.00682311225682497, -0.006666281260550022, -0.006509450264275074, -0.006352619268000126, -0.006195788271725178, -0.00603895727545023, -0.0058821262791752815, -0.005725294817239046, -0.005568463820964098, -0.00541163282468915, -0.005254801828414202, -0.005097970832139254, -0.0049411398358643055, -0.004784308839589357, -0.004627477843314409, -0.004470646381378174, -0.004313815385103226, -0.004156984388828278, -0.0040001533925533295, -0.0038433223962783813, -0.0036864914000034332, -0.003529660403728485, -0.003372829407453537, -0.003215998411178589, -0.0030591674149036407, -0.0029023364186286926, -0.0027455054223537445, -0.0025886744260787964, -0.0024318434298038483, -0.0022750124335289, -0.002118181437253952, -0.001961350440979004, -0.0018045194447040558, -0.0016476884484291077, -0.0014908574521541595, -0.0013340264558792114, -0.0011771954596042633, -0.0010203643469139934, -0.0008635333506390452, -0.0007067023543640971, -0.000549871358089149, -0.0003930403327103704, -0.00023620930733159184, -7.937831105664372e-05, 7.74526852183044e-05, 0.00023428373970091343, 0.00039111473597586155, 0.0005479457322508097]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 9.0, 8.0, 14.0, 13.0, 26.0, 22.0, 32.0, 35.0, 41.0, 47.0, 47.0, 39.0, 44.0, 54.0, 73.0, 45.0, 37.0, 49.0, 49.0, 50.0, 42.0, 39.0, 33.0, 35.0, 20.0, 18.0, 20.0, 11.0, 11.0, 11.0, 10.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0007194876670837402, -0.0007006833329796791, -0.000681878998875618, -0.0006630746647715569, -0.0006442703306674957, -0.0006254659965634346, -0.0006066616624593735, -0.0005878573283553123, -0.0005690529942512512, -0.0005502486601471901, -0.000531444326043129, -0.0005126399919390678, -0.0004938356578350067, -0.0004750313237309456, -0.00045622698962688446, -0.00043742265552282333, -0.0004186183214187622, -0.0003998139873147011, -0.00038100965321063995, -0.0003622053191065788, -0.0003434009850025177, -0.0003245966508984566, -0.00030579231679439545, -0.0002869879826903343, -0.0002681836485862732, -0.00024937931448221207, -0.00023057498037815094, -0.0002117706462740898, -0.0001929663121700287, -0.00017416197806596756, -0.00015535764396190643, -0.0001365533098578453, -0.00011774897575378418, -9.894464164972305e-05, -8.014030754566193e-05, -6.13359734416008e-05, -4.253163933753967e-05, -2.3727305233478546e-05, -4.9229711294174194e-06, 1.3881362974643707e-05, 3.2685697078704834e-05, 5.149003118276596e-05, 7.029436528682709e-05, 8.909869939088821e-05, 0.00010790303349494934, 0.00012670736759901047, 0.0001455117017030716, 0.00016431603580713272, 0.00018312036991119385, 0.00020192470401525497, 0.0002207290381193161, 0.00023953337222337723, 0.00025833770632743835, 0.0002771420404314995, 0.0002959463745355606, 0.00031475070863962173, 0.00033355504274368286, 0.000352359376847744, 0.0003711637109518051, 0.00038996804505586624, 0.00040877237915992737, 0.0004275767132639885, 0.0004463810473680496, 0.00046518538147211075, 0.0004839897155761719]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 27.0, 18.0, 45.0, 58.0, 53.0, 82.0, 88.0, 82.0, 114.0, 93.0, 82.0, 60.0, 55.0, 41.0, 22.0, 15.0, 12.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.475860595703125, -4.35406494140625, -4.232269287109375, -4.1104736328125, -3.988677978515625, -3.86688232421875, -3.745086669921875, -3.623291015625, -3.501495361328125, -3.37969970703125, -3.257904052734375, -3.1361083984375, -3.014312744140625, -2.89251708984375, -2.770721435546875, -2.64892578125, -2.527130126953125, -2.40533447265625, -2.283538818359375, -2.1617431640625, -2.039947509765625, -1.91815185546875, -1.796356201171875, -1.674560546875, -1.552764892578125, -1.43096923828125, -1.309173583984375, -1.1873779296875, -1.065582275390625, -0.94378662109375, -0.821990966796875, -0.7001953125, -0.578399658203125, -0.45660400390625, -0.334808349609375, -0.2130126953125, -0.091217041015625, 0.03057861328125, 0.152374267578125, 0.274169921875, 0.395965576171875, 0.51776123046875, 0.639556884765625, 0.7613525390625, 0.883148193359375, 1.00494384765625, 1.126739501953125, 1.24853515625, 1.370330810546875, 1.49212646484375, 1.613922119140625, 1.7357177734375, 1.857513427734375, 1.97930908203125, 2.101104736328125, 2.222900390625, 2.344696044921875, 2.46649169921875, 2.588287353515625, 2.7100830078125, 2.831878662109375, 2.95367431640625, 3.075469970703125, 3.197265625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 7.0, 10.0, 16.0, 20.0, 29.0, 39.0, 61.0, 67.0, 118.0, 193.0, 337.0, 631.0, 1442.0, 4534.0, 30392.0, 963706.0, 38597.0, 5169.0, 1607.0, 677.0, 311.0, 209.0, 121.0, 74.0, 65.0, 34.0, 21.0, 16.0, 13.0, 15.0, 2.0, 7.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.3125, -19.66845703125, -19.0244140625, -18.38037109375, -17.736328125, -17.09228515625, -16.4482421875, -15.80419921875, -15.16015625, -14.51611328125, -13.8720703125, -13.22802734375, -12.583984375, -11.93994140625, -11.2958984375, -10.65185546875, -10.0078125, -9.36376953125, -8.7197265625, -8.07568359375, -7.431640625, -6.78759765625, -6.1435546875, -5.49951171875, -4.85546875, -4.21142578125, -3.5673828125, -2.92333984375, -2.279296875, -1.63525390625, -0.9912109375, -0.34716796875, 0.296875, 0.94091796875, 1.5849609375, 2.22900390625, 2.873046875, 3.51708984375, 4.1611328125, 4.80517578125, 5.44921875, 6.09326171875, 6.7373046875, 7.38134765625, 8.025390625, 8.66943359375, 9.3134765625, 9.95751953125, 10.6015625, 11.24560546875, 11.8896484375, 12.53369140625, 13.177734375, 13.82177734375, 14.4658203125, 15.10986328125, 15.75390625, 16.39794921875, 17.0419921875, 17.68603515625, 18.330078125, 18.97412109375, 19.6181640625, 20.26220703125, 20.90625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 11.0, 15.0, 19.0, 24.0, 27.0, 32.0, 39.0, 39.0, 40.0, 55.0, 53.0, 68.0, 115.0, 1525.0, 428.0, 94.0, 73.0, 53.0, 43.0, 31.0, 38.0, 32.0, 37.0, 29.0, 31.0, 17.0, 15.0, 6.0, 9.0, 6.0, 4.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.263916015625, -7.95751953125, -7.651123046875, -7.3447265625, -7.038330078125, -6.73193359375, -6.425537109375, -6.119140625, -5.812744140625, -5.50634765625, -5.199951171875, -4.8935546875, -4.587158203125, -4.28076171875, -3.974365234375, -3.66796875, -3.361572265625, -3.05517578125, -2.748779296875, -2.4423828125, -2.135986328125, -1.82958984375, -1.523193359375, -1.216796875, -0.910400390625, -0.60400390625, -0.297607421875, 0.0087890625, 0.315185546875, 0.62158203125, 0.927978515625, 1.234375, 1.540771484375, 1.84716796875, 2.153564453125, 2.4599609375, 2.766357421875, 3.07275390625, 3.379150390625, 3.685546875, 3.991943359375, 4.29833984375, 4.604736328125, 4.9111328125, 5.217529296875, 5.52392578125, 5.830322265625, 6.13671875, 6.443115234375, 6.74951171875, 7.055908203125, 7.3623046875, 7.668701171875, 7.97509765625, 8.281494140625, 8.587890625, 8.894287109375, 9.20068359375, 9.507080078125, 9.8134765625, 10.119873046875, 10.42626953125, 10.732666015625, 11.0390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 9.0, 15.0, 29.0, 25.0, 38.0, 51.0, 95.0, 114.0, 152.0, 227.0, 322.0, 481.0, 793.0, 1115.0, 1794.0, 3169.0, 5695.0, 11830.0, 34838.0, 1505155.0, 1519298.0, 34436.0, 12048.0, 5615.0, 3086.0, 1868.0, 1133.0, 743.0, 476.0, 325.0, 214.0, 143.0, 102.0, 86.0, 41.0, 28.0, 27.0, 20.0, 15.0, 17.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.7109375, -14.2205810546875, -13.730224609375, -13.2398681640625, -12.74951171875, -12.2591552734375, -11.768798828125, -11.2784423828125, -10.7880859375, -10.2977294921875, -9.807373046875, -9.3170166015625, -8.82666015625, -8.3363037109375, -7.845947265625, -7.3555908203125, -6.865234375, -6.3748779296875, -5.884521484375, -5.3941650390625, -4.90380859375, -4.4134521484375, -3.923095703125, -3.4327392578125, -2.9423828125, -2.4520263671875, -1.961669921875, -1.4713134765625, -0.98095703125, -0.4906005859375, -0.000244140625, 0.4901123046875, 0.98046875, 1.4708251953125, 1.961181640625, 2.4515380859375, 2.94189453125, 3.4322509765625, 3.922607421875, 4.4129638671875, 4.9033203125, 5.3936767578125, 5.884033203125, 6.3743896484375, 6.86474609375, 7.3551025390625, 7.845458984375, 8.3358154296875, 8.826171875, 9.3165283203125, 9.806884765625, 10.2972412109375, 10.78759765625, 11.2779541015625, 11.768310546875, 12.2586669921875, 12.7490234375, 13.2393798828125, 13.729736328125, 14.2200927734375, 14.71044921875, 15.2008056640625, 15.691162109375, 16.1815185546875, 16.671875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 11.0, 19.0, 31.0, 42.0, 80.0, 133.0, 134.0, 154.0, 144.0, 96.0, 64.0, 43.0, 17.0, 11.0, 12.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.64273452758789, -54.412296295166016, -53.18185806274414, -51.951419830322266, -50.72098159790039, -49.490543365478516, -48.26010513305664, -47.0296630859375, -45.799224853515625, -44.56878662109375, -43.338348388671875, -42.10791015625, -40.877471923828125, -39.64703369140625, -38.416595458984375, -37.1861572265625, -35.955718994140625, -34.72528076171875, -33.494842529296875, -32.264404296875, -31.033966064453125, -29.80352783203125, -28.573087692260742, -27.342649459838867, -26.112211227416992, -24.881772994995117, -23.651334762573242, -22.420896530151367, -21.19045639038086, -19.960018157958984, -18.72957992553711, -17.499141693115234, -16.268707275390625, -15.03826904296875, -13.807830810546875, -12.577391624450684, -11.346953392028809, -10.116515159606934, -8.886075973510742, -7.655637741088867, -6.425199508666992, -5.194761276245117, -3.964322566986084, -2.73388409614563, -1.5034456253051758, -0.2730073928833008, 0.9574313163757324, 2.1878700256347656, 3.4183082580566406, 4.648746490478516, 5.879185199737549, 7.109623908996582, 8.340062141418457, 9.570500373840332, 10.800939559936523, 12.031377792358398, 13.261816024780273, 14.492254257202148, 15.722692489624023, 16.9531307220459, 18.183570861816406, 19.41400909423828, 20.644447326660156, 21.87488555908203, 23.105323791503906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 6.0, 8.0, 13.0, 15.0, 13.0, 16.0, 17.0, 26.0, 21.0, 26.0, 33.0, 27.0, 39.0, 41.0, 51.0, 48.0, 43.0, 46.0, 51.0, 41.0, 46.0, 42.0, 41.0, 41.0, 40.0, 31.0, 25.0, 28.0, 26.0, 18.0, 17.0, 13.0, 7.0, 10.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.903656005859375, -33.89384078979492, -32.88402557373047, -31.874210357666016, -30.864395141601562, -29.85457992553711, -28.844764709472656, -27.834949493408203, -26.82513427734375, -25.815319061279297, -24.805503845214844, -23.79568862915039, -22.785873413085938, -21.776058197021484, -20.76624298095703, -19.756427764892578, -18.746612548828125, -17.736797332763672, -16.72698211669922, -15.717166900634766, -14.707351684570312, -13.69753646850586, -12.687721252441406, -11.677906036376953, -10.6680908203125, -9.658275604248047, -8.648460388183594, -7.638645172119141, -6.6288299560546875, -5.619014739990234, -4.609199523925781, -3.599384307861328, -2.5895729064941406, -1.5797576904296875, -0.5699424743652344, 0.43987274169921875, 1.4496879577636719, 2.459503173828125, 3.469318389892578, 4.479133605957031, 5.488948822021484, 6.4987640380859375, 7.508579254150391, 8.518394470214844, 9.528209686279297, 10.53802490234375, 11.547840118408203, 12.557655334472656, 13.56747055053711, 14.577285766601562, 15.587100982666016, 16.59691619873047, 17.606731414794922, 18.616546630859375, 19.626361846923828, 20.63617706298828, 21.645992279052734, 22.655807495117188, 23.66562271118164, 24.675437927246094, 25.685253143310547, 26.695068359375, 27.704883575439453, 28.714698791503906, 29.72451400756836]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 2.0, 4.0, 3.0, 14.0, 15.0, 16.0, 25.0, 39.0, 61.0, 65.0, 66.0, 76.0, 93.0, 95.0, 105.0, 78.0, 57.0, 57.0, 43.0, 32.0, 22.0, 13.0, 4.0, 10.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.69921875, -4.575408935546875, -4.45159912109375, -4.327789306640625, -4.2039794921875, -4.080169677734375, -3.95635986328125, -3.832550048828125, -3.708740234375, -3.584930419921875, -3.46112060546875, -3.337310791015625, -3.2135009765625, -3.089691162109375, -2.96588134765625, -2.842071533203125, -2.71826171875, -2.594451904296875, -2.47064208984375, -2.346832275390625, -2.2230224609375, -2.099212646484375, -1.97540283203125, -1.851593017578125, -1.727783203125, -1.603973388671875, -1.48016357421875, -1.356353759765625, -1.2325439453125, -1.108734130859375, -0.98492431640625, -0.861114501953125, -0.7373046875, -0.613494873046875, -0.48968505859375, -0.365875244140625, -0.2420654296875, -0.118255615234375, 0.00555419921875, 0.129364013671875, 0.253173828125, 0.376983642578125, 0.50079345703125, 0.624603271484375, 0.7484130859375, 0.872222900390625, 0.99603271484375, 1.119842529296875, 1.24365234375, 1.367462158203125, 1.49127197265625, 1.615081787109375, 1.7388916015625, 1.862701416015625, 1.98651123046875, 2.110321044921875, 2.234130859375, 2.357940673828125, 2.48175048828125, 2.605560302734375, 2.7293701171875, 2.853179931640625, 2.97698974609375, 3.100799560546875, 3.224609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 7.0, 7.0, 14.0, 13.0, 17.0, 37.0, 61.0, 83.0, 159.0, 299.0, 699.0, 1837.0, 6508.0, 96907.0, 4005432.0, 74292.0, 5363.0, 1507.0, 524.0, 249.0, 117.0, 47.0, 28.0, 24.0, 12.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.90625, -24.241455078125, -23.57666015625, -22.911865234375, -22.2470703125, -21.582275390625, -20.91748046875, -20.252685546875, -19.587890625, -18.923095703125, -18.25830078125, -17.593505859375, -16.9287109375, -16.263916015625, -15.59912109375, -14.934326171875, -14.26953125, -13.604736328125, -12.93994140625, -12.275146484375, -11.6103515625, -10.945556640625, -10.28076171875, -9.615966796875, -8.951171875, -8.286376953125, -7.62158203125, -6.956787109375, -6.2919921875, -5.627197265625, -4.96240234375, -4.297607421875, -3.6328125, -2.968017578125, -2.30322265625, -1.638427734375, -0.9736328125, -0.308837890625, 0.35595703125, 1.020751953125, 1.685546875, 2.350341796875, 3.01513671875, 3.679931640625, 4.3447265625, 5.009521484375, 5.67431640625, 6.339111328125, 7.00390625, 7.668701171875, 8.33349609375, 8.998291015625, 9.6630859375, 10.327880859375, 10.99267578125, 11.657470703125, 12.322265625, 12.987060546875, 13.65185546875, 14.316650390625, 14.9814453125, 15.646240234375, 16.31103515625, 16.975830078125, 17.640625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 10.0, 7.0, 14.0, 25.0, 33.0, 55.0, 85.0, 135.0, 247.0, 431.0, 693.0, 856.0, 612.0, 347.0, 170.0, 133.0, 59.0, 42.0, 28.0, 26.0, 12.0, 13.0, 9.0, 4.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.8828125, -10.5828857421875, -10.282958984375, -9.9830322265625, -9.68310546875, -9.3831787109375, -9.083251953125, -8.7833251953125, -8.4833984375, -8.1834716796875, -7.883544921875, -7.5836181640625, -7.28369140625, -6.9837646484375, -6.683837890625, -6.3839111328125, -6.083984375, -5.7840576171875, -5.484130859375, -5.1842041015625, -4.88427734375, -4.5843505859375, -4.284423828125, -3.9844970703125, -3.6845703125, -3.3846435546875, -3.084716796875, -2.7847900390625, -2.48486328125, -2.1849365234375, -1.885009765625, -1.5850830078125, -1.28515625, -0.9852294921875, -0.685302734375, -0.3853759765625, -0.08544921875, 0.2144775390625, 0.514404296875, 0.8143310546875, 1.1142578125, 1.4141845703125, 1.714111328125, 2.0140380859375, 2.31396484375, 2.6138916015625, 2.913818359375, 3.2137451171875, 3.513671875, 3.8135986328125, 4.113525390625, 4.4134521484375, 4.71337890625, 5.0133056640625, 5.313232421875, 5.6131591796875, 5.9130859375, 6.2130126953125, 6.512939453125, 6.8128662109375, 7.11279296875, 7.4127197265625, 7.712646484375, 8.0125732421875, 8.3125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 6.0, 18.0, 38.0, 51.0, 107.0, 183.0, 437.0, 1020.0, 3145.0, 13224.0, 94850.0, 3195490.0, 835558.0, 39554.0, 7246.0, 1990.0, 740.0, 286.0, 163.0, 71.0, 44.0, 19.0, 14.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.88330078125, -19.1416015625, -18.39990234375, -17.658203125, -16.91650390625, -16.1748046875, -15.43310546875, -14.69140625, -13.94970703125, -13.2080078125, -12.46630859375, -11.724609375, -10.98291015625, -10.2412109375, -9.49951171875, -8.7578125, -8.01611328125, -7.2744140625, -6.53271484375, -5.791015625, -5.04931640625, -4.3076171875, -3.56591796875, -2.82421875, -2.08251953125, -1.3408203125, -0.59912109375, 0.142578125, 0.88427734375, 1.6259765625, 2.36767578125, 3.109375, 3.85107421875, 4.5927734375, 5.33447265625, 6.076171875, 6.81787109375, 7.5595703125, 8.30126953125, 9.04296875, 9.78466796875, 10.5263671875, 11.26806640625, 12.009765625, 12.75146484375, 13.4931640625, 14.23486328125, 14.9765625, 15.71826171875, 16.4599609375, 17.20166015625, 17.943359375, 18.68505859375, 19.4267578125, 20.16845703125, 20.91015625, 21.65185546875, 22.3935546875, 23.13525390625, 23.876953125, 24.61865234375, 25.3603515625, 26.10205078125, 26.84375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 13.0, 13.0, 30.0, 58.0, 76.0, 124.0, 184.0, 156.0, 114.0, 94.0, 61.0, 34.0, 23.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-84.50379943847656, -82.74308776855469, -80.98237609863281, -79.22166442871094, -77.46095275878906, -75.70024108886719, -73.93952941894531, -72.17881774902344, -70.41810607910156, -68.65739440917969, -66.89668273925781, -65.13597106933594, -63.37525939941406, -61.61454772949219, -59.85383605957031, -58.09312438964844, -56.33241653442383, -54.57170486450195, -52.81099319458008, -51.0502815246582, -49.28956985473633, -47.52885818481445, -45.768150329589844, -44.00743865966797, -42.246726989746094, -40.48601531982422, -38.725303649902344, -36.96459197998047, -35.203880310058594, -33.44316864013672, -31.682458877563477, -29.9217472076416, -28.16103744506836, -26.400325775146484, -24.63961410522461, -22.878902435302734, -21.11819076538086, -19.357479095458984, -17.596769332885742, -15.836057662963867, -14.075345993041992, -12.314634323120117, -10.553922653198242, -8.793211936950684, -7.032500267028809, -5.271788597106934, -3.511077880859375, -1.7503662109375, 0.010345458984375, 1.771056890487671, 3.531768321990967, 5.292479515075684, 7.053191184997559, 8.813902854919434, 10.574613571166992, 12.335325241088867, 14.096036911010742, 15.856748580932617, 17.617460250854492, 19.378170013427734, 21.13888168334961, 22.899593353271484, 24.66030502319336, 26.421016693115234, 28.18172836303711]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 7.0, 7.0, 4.0, 14.0, 7.0, 11.0, 6.0, 18.0, 22.0, 15.0, 20.0, 29.0, 22.0, 26.0, 27.0, 32.0, 37.0, 41.0, 38.0, 27.0, 43.0, 35.0, 40.0, 43.0, 37.0, 34.0, 34.0, 29.0, 31.0, 33.0, 25.0, 27.0, 24.0, 24.0, 26.0, 14.0, 15.0, 13.0, 11.0, 7.0, 7.0, 4.0, 3.0, 5.0, 5.0, 6.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-21.42793083190918, -20.758066177368164, -20.08820343017578, -19.418338775634766, -18.74847412109375, -18.078609466552734, -17.40874481201172, -16.738882064819336, -16.06901741027832, -15.399152755737305, -14.729289054870605, -14.059425354003906, -13.38956069946289, -12.719696044921875, -12.049832344055176, -11.379968643188477, -10.710103988647461, -10.040239334106445, -9.370375633239746, -8.700511932373047, -8.030647277832031, -7.360783100128174, -6.690918922424316, -6.021054744720459, -5.351190567016602, -4.681326389312744, -4.011462211608887, -3.3415980339050293, -2.671733856201172, -2.0018696784973145, -1.332005500793457, -0.6621413230895996, 0.007724761962890625, 0.677588939666748, 1.3474531173706055, 2.017317295074463, 2.6871814727783203, 3.3570456504821777, 4.026909828186035, 4.696774005889893, 5.36663818359375, 6.036502361297607, 6.706366539001465, 7.376230716705322, 8.04609489440918, 8.715959548950195, 9.385823249816895, 10.055686950683594, 10.72555160522461, 11.395416259765625, 12.065279960632324, 12.735143661499023, 13.405008316040039, 14.074872970581055, 14.744736671447754, 15.414600372314453, 16.08446502685547, 16.754329681396484, 17.4241943359375, 18.094057083129883, 18.7639217376709, 19.433786392211914, 20.103649139404297, 20.773513793945312, 21.443378448486328]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 7.0, 15.0, 24.0, 24.0, 32.0, 40.0, 58.0, 72.0, 59.0, 76.0, 90.0, 94.0, 97.0, 83.0, 46.0, 46.0, 40.0, 39.0, 17.0, 18.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.411529541015625, -4.28790283203125, -4.164276123046875, -4.0406494140625, -3.917022705078125, -3.79339599609375, -3.669769287109375, -3.546142578125, -3.422515869140625, -3.29888916015625, -3.175262451171875, -3.0516357421875, -2.928009033203125, -2.80438232421875, -2.680755615234375, -2.55712890625, -2.433502197265625, -2.30987548828125, -2.186248779296875, -2.0626220703125, -1.938995361328125, -1.81536865234375, -1.691741943359375, -1.568115234375, -1.444488525390625, -1.32086181640625, -1.197235107421875, -1.0736083984375, -0.949981689453125, -0.82635498046875, -0.702728271484375, -0.5791015625, -0.455474853515625, -0.33184814453125, -0.208221435546875, -0.0845947265625, 0.039031982421875, 0.16265869140625, 0.286285400390625, 0.409912109375, 0.533538818359375, 0.65716552734375, 0.780792236328125, 0.9044189453125, 1.028045654296875, 1.15167236328125, 1.275299072265625, 1.39892578125, 1.522552490234375, 1.64617919921875, 1.769805908203125, 1.8934326171875, 2.017059326171875, 2.14068603515625, 2.264312744140625, 2.387939453125, 2.511566162109375, 2.63519287109375, 2.758819580078125, 2.8824462890625, 3.006072998046875, 3.12969970703125, 3.253326416015625, 3.376953125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 9.0, 3.0, 10.0, 20.0, 21.0, 25.0, 29.0, 57.0, 53.0, 88.0, 124.0, 179.0, 279.0, 403.0, 671.0, 1225.0, 2010.0, 3796.0, 7847.0, 17281.0, 44677.0, 138797.0, 525159.0, 203253.0, 59786.0, 22540.0, 9532.0, 4663.0, 2418.0, 1393.0, 772.0, 495.0, 290.0, 182.0, 139.0, 89.0, 64.0, 40.0, 36.0, 23.0, 18.0, 13.0, 14.0, 9.0, 4.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.240478515625, -0.23332977294921875, -0.2261810302734375, -0.21903228759765625, -0.211883544921875, -0.20473480224609375, -0.1975860595703125, -0.19043731689453125, -0.18328857421875, -0.17613983154296875, -0.1689910888671875, -0.16184234619140625, -0.154693603515625, -0.14754486083984375, -0.1403961181640625, -0.13324737548828125, -0.1260986328125, -0.11894989013671875, -0.1118011474609375, -0.10465240478515625, -0.097503662109375, -0.09035491943359375, -0.0832061767578125, -0.07605743408203125, -0.06890869140625, -0.06175994873046875, -0.0546112060546875, -0.04746246337890625, -0.040313720703125, -0.03316497802734375, -0.0260162353515625, -0.01886749267578125, -0.01171875, -0.00457000732421875, 0.0025787353515625, 0.00972747802734375, 0.016876220703125, 0.02402496337890625, 0.0311737060546875, 0.03832244873046875, 0.04547119140625, 0.05261993408203125, 0.0597686767578125, 0.06691741943359375, 0.074066162109375, 0.08121490478515625, 0.0883636474609375, 0.09551239013671875, 0.1026611328125, 0.10980987548828125, 0.1169586181640625, 0.12410736083984375, 0.131256103515625, 0.13840484619140625, 0.1455535888671875, 0.15270233154296875, 0.15985107421875, 0.16699981689453125, 0.1741485595703125, 0.18129730224609375, 0.188446044921875, 0.19559478759765625, 0.2027435302734375, 0.20989227294921875, 0.217041015625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 6.0, 7.0, 5.0, 12.0, 12.0, 10.0, 15.0, 20.0, 29.0, 17.0, 21.0, 25.0, 33.0, 31.0, 43.0, 39.0, 30.0, 44.0, 37.0, 37.0, 1065.0, 43.0, 36.0, 27.0, 41.0, 29.0, 33.0, 26.0, 37.0, 30.0, 31.0, 20.0, 14.0, 14.0, 12.0, 16.0, 19.0, 8.0, 11.0, 7.0, 8.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 3.0], "bins": [-2.37109375, -2.306365966796875, -2.24163818359375, -2.176910400390625, -2.1121826171875, -2.047454833984375, -1.98272705078125, -1.917999267578125, -1.853271484375, -1.788543701171875, -1.72381591796875, -1.659088134765625, -1.5943603515625, -1.529632568359375, -1.46490478515625, -1.400177001953125, -1.33544921875, -1.270721435546875, -1.20599365234375, -1.141265869140625, -1.0765380859375, -1.011810302734375, -0.94708251953125, -0.882354736328125, -0.817626953125, -0.752899169921875, -0.68817138671875, -0.623443603515625, -0.5587158203125, -0.493988037109375, -0.42926025390625, -0.364532470703125, -0.2998046875, -0.235076904296875, -0.17034912109375, -0.105621337890625, -0.0408935546875, 0.023834228515625, 0.08856201171875, 0.153289794921875, 0.218017578125, 0.282745361328125, 0.34747314453125, 0.412200927734375, 0.4769287109375, 0.541656494140625, 0.60638427734375, 0.671112060546875, 0.73583984375, 0.800567626953125, 0.86529541015625, 0.930023193359375, 0.9947509765625, 1.059478759765625, 1.12420654296875, 1.188934326171875, 1.253662109375, 1.318389892578125, 1.38311767578125, 1.447845458984375, 1.5125732421875, 1.577301025390625, 1.64202880859375, 1.706756591796875, 1.771484375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 21.0, 26.0, 46.0, 62.0, 86.0, 154.0, 187.0, 273.0, 386.0, 636.0, 856.0, 1265.0, 1759.0, 2592.0, 3679.0, 5478.0, 7793.0, 11582.0, 17032.0, 25270.0, 38769.0, 61189.0, 106291.0, 500531.0, 1020267.0, 108500.0, 62384.0, 39418.0, 25781.0, 17375.0, 11576.0, 8016.0, 5388.0, 3788.0, 2669.0, 1837.0, 1277.0, 905.0, 613.0, 433.0, 275.0, 220.0, 131.0, 112.0, 69.0, 48.0, 32.0, 17.0, 10.0, 8.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04815673828125, -0.046604156494140625, -0.04505157470703125, -0.043498992919921875, -0.0419464111328125, -0.040393829345703125, -0.03884124755859375, -0.037288665771484375, -0.035736083984375, -0.034183502197265625, -0.03263092041015625, -0.031078338623046875, -0.0295257568359375, -0.027973175048828125, -0.02642059326171875, -0.024868011474609375, -0.0233154296875, -0.021762847900390625, -0.02021026611328125, -0.018657684326171875, -0.0171051025390625, -0.015552520751953125, -0.01399993896484375, -0.012447357177734375, -0.010894775390625, -0.009342193603515625, -0.00778961181640625, -0.006237030029296875, -0.0046844482421875, -0.003131866455078125, -0.00157928466796875, -2.6702880859375e-05, 0.00152587890625, 0.003078460693359375, 0.00463104248046875, 0.006183624267578125, 0.0077362060546875, 0.009288787841796875, 0.01084136962890625, 0.012393951416015625, 0.013946533203125, 0.015499114990234375, 0.01705169677734375, 0.018604278564453125, 0.0201568603515625, 0.021709442138671875, 0.02326202392578125, 0.024814605712890625, 0.0263671875, 0.027919769287109375, 0.02947235107421875, 0.031024932861328125, 0.0325775146484375, 0.034130096435546875, 0.03568267822265625, 0.037235260009765625, 0.038787841796875, 0.040340423583984375, 0.04189300537109375, 0.043445587158203125, 0.0449981689453125, 0.046550750732421875, 0.04810333251953125, 0.049655914306640625, 0.05120849609375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 6.0, 6.0, 14.0, 13.0, 18.0, 14.0, 19.0, 27.0, 42.0, 51.0, 47.0, 64.0, 73.0, 104.0, 91.0, 72.0, 50.0, 40.0, 32.0, 25.0, 19.0, 22.0, 17.0, 12.0, 12.0, 6.0, 8.0, 9.0, 9.0, 3.0, 2.0, 8.0, 4.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002772808074951172, -0.00026794523000717163, -0.0002586096525192261, -0.0002492740750312805, -0.00023993849754333496, -0.0002306029200553894, -0.00022126734256744385, -0.0002119317650794983, -0.00020259618759155273, -0.00019326061010360718, -0.00018392503261566162, -0.00017458945512771606, -0.0001652538776397705, -0.00015591830015182495, -0.0001465827226638794, -0.00013724714517593384, -0.00012791156768798828, -0.00011857599020004272, -0.00010924041271209717, -9.990483522415161e-05, -9.056925773620605e-05, -8.12336802482605e-05, -7.189810276031494e-05, -6.256252527236938e-05, -5.322694778442383e-05, -4.389137029647827e-05, -3.4555792808532715e-05, -2.5220215320587158e-05, -1.58846378326416e-05, -6.549060344696045e-06, 2.7865171432495117e-06, 1.2122094631195068e-05, 2.1457672119140625e-05, 3.079324960708618e-05, 4.012882709503174e-05, 4.9464404582977295e-05, 5.879998207092285e-05, 6.813555955886841e-05, 7.747113704681396e-05, 8.680671453475952e-05, 9.614229202270508e-05, 0.00010547786951065063, 0.00011481344699859619, 0.00012414902448654175, 0.0001334846019744873, 0.00014282017946243286, 0.00015215575695037842, 0.00016149133443832397, 0.00017082691192626953, 0.0001801624894142151, 0.00018949806690216064, 0.0001988336443901062, 0.00020816922187805176, 0.00021750479936599731, 0.00022684037685394287, 0.00023617595434188843, 0.000245511531829834, 0.00025484710931777954, 0.0002641826868057251, 0.00027351826429367065, 0.0002828538417816162, 0.00029218941926956177, 0.0003015249967575073, 0.0003108605742454529, 0.00032019615173339844]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 8.0, 4.0, 4.0, 10.0, 3.0, 11.0, 9.0, 13.0, 18.0, 26.0, 23.0, 27.0, 30.0, 59.0, 58.0, 83.0, 139.0, 451.0, 2049.0, 12369.0, 102900.0, 801416.0, 112272.0, 13293.0, 2185.0, 511.0, 163.0, 95.0, 62.0, 42.0, 37.0, 34.0, 31.0, 23.0, 20.0, 14.0, 14.0, 12.0, 6.0, 7.0, 7.0, 2.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.005462646484375, -0.005304396152496338, -0.005146145820617676, -0.004987895488739014, -0.0048296451568603516, -0.0046713948249816895, -0.004513144493103027, -0.004354894161224365, -0.004196643829345703, -0.004038393497467041, -0.003880143165588379, -0.003721892833709717, -0.0035636425018310547, -0.0034053921699523926, -0.0032471418380737305, -0.0030888915061950684, -0.0029306411743164062, -0.002772390842437744, -0.002614140510559082, -0.00245589017868042, -0.002297639846801758, -0.0021393895149230957, -0.0019811391830444336, -0.0018228888511657715, -0.0016646385192871094, -0.0015063881874084473, -0.0013481378555297852, -0.001189887523651123, -0.001031637191772461, -0.0008733868598937988, -0.0007151365280151367, -0.0005568861961364746, -0.0003986358642578125, -0.0002403855323791504, -8.213520050048828e-05, 7.611513137817383e-05, 0.00023436546325683594, 0.00039261579513549805, 0.0005508661270141602, 0.0007091164588928223, 0.0008673667907714844, 0.0010256171226501465, 0.0011838674545288086, 0.0013421177864074707, 0.0015003681182861328, 0.001658618450164795, 0.001816868782043457, 0.001975119113922119, 0.0021333694458007812, 0.0022916197776794434, 0.0024498701095581055, 0.0026081204414367676, 0.0027663707733154297, 0.002924621105194092, 0.003082871437072754, 0.003241121768951416, 0.003399372100830078, 0.0035576224327087402, 0.0037158727645874023, 0.0038741230964660645, 0.0040323734283447266, 0.004190623760223389, 0.004348874092102051, 0.004507124423980713, 0.004665374755859375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 22.0, 95.0, 614.0, 234.0, 36.0, 9.0], "bins": [-0.008506637066602707, -0.008366578258574009, -0.008226520381867886, -0.008086461573839188, -0.00794640276581049, -0.007806344889104366, -0.007666286081075668, -0.007526227738708258, -0.007386169396340847, -0.007246111053973436, -0.007106052245944738, -0.006965993903577328, -0.006825935561209917, -0.006685877218842506, -0.0065458184108138084, -0.006405760068446398, -0.006265701726078987, -0.0061256433837115765, -0.0059855845756828785, -0.005845526233315468, -0.005705467890948057, -0.0055654095485806465, -0.0054253507405519485, -0.005285292398184538, -0.00514523359015584, -0.005005175247788429, -0.004865116439759731, -0.004725058097392321, -0.00458499975502491, -0.004444941412657499, -0.004304882604628801, -0.004164824262261391, -0.004024765454232693, -0.0038847068790346384, -0.0037446485366672277, -0.0036045899614691734, -0.0034645316191017628, -0.0033244730439037085, -0.003184414468705654, -0.0030443561263382435, -0.002904297783970833, -0.0027642392087727785, -0.002624180866405368, -0.0024841222912073135, -0.002344063948839903, -0.0022040053736418486, -0.0020639467984437943, -0.0019238884560763836, -0.001783830113708973, -0.0016437716549262404, -0.001503713196143508, -0.0013636546209454536, -0.001223596278578043, -0.0010835377033799887, -0.0009434792445972562, -0.0008034207858145237, -0.0006633622688241303, -0.0005233038100413978, -0.00038324532215483487, -0.00024318683426827192, -0.00010312837548553944, 3.693008329719305e-05, 0.00017698860028758645, 0.00031704705907031894, 0.0004571055178530514]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 7.0, 11.0, 9.0, 11.0, 17.0, 23.0, 30.0, 31.0, 39.0, 40.0, 53.0, 39.0, 57.0, 60.0, 59.0, 47.0, 60.0, 47.0, 51.0, 51.0, 40.0, 34.0, 38.0, 33.0, 24.0, 17.0, 17.0, 11.0, 11.0, 10.0, 6.0, 4.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042742490768432617, -0.00041339173913002014, -0.0003993585705757141, -0.0003853254020214081, -0.00037129223346710205, -0.000357259064912796, -0.00034322589635849, -0.00032919272780418396, -0.00031515955924987793, -0.0003011263906955719, -0.00028709322214126587, -0.00027306005358695984, -0.0002590268850326538, -0.0002449937164783478, -0.00023096054792404175, -0.00021692737936973572, -0.0002028942108154297, -0.00018886104226112366, -0.00017482787370681763, -0.0001607947051525116, -0.00014676153659820557, -0.00013272836804389954, -0.0001186951994895935, -0.00010466203093528748, -9.062886238098145e-05, -7.659569382667542e-05, -6.256252527236938e-05, -4.8529356718063354e-05, -3.4496188163757324e-05, -2.0463019609451294e-05, -6.429851055145264e-06, 7.603317499160767e-06, 2.1636486053466797e-05, 3.566965460777283e-05, 4.970282316207886e-05, 6.373599171638489e-05, 7.776916027069092e-05, 9.180232882499695e-05, 0.00010583549737930298, 0.00011986866593360901, 0.00013390183448791504, 0.00014793500304222107, 0.0001619681715965271, 0.00017600134015083313, 0.00019003450870513916, 0.0002040676772594452, 0.00021810084581375122, 0.00023213401436805725, 0.0002461671829223633, 0.0002602003514766693, 0.00027423352003097534, 0.00028826668858528137, 0.0003022998571395874, 0.00031633302569389343, 0.00033036619424819946, 0.0003443993628025055, 0.0003584325313568115, 0.00037246569991111755, 0.0003864988684654236, 0.0004005320370197296, 0.00041456520557403564, 0.0004285983741283417, 0.0004426315426826477, 0.00045666471123695374, 0.00047069787979125977]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 1.0, 5.0, 7.0, 15.0, 24.0, 24.0, 32.0, 40.0, 58.0, 72.0, 59.0, 76.0, 90.0, 94.0, 96.0, 84.0, 46.0, 46.0, 40.0, 39.0, 17.0, 18.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.411529541015625, -4.28790283203125, -4.164276123046875, -4.0406494140625, -3.917022705078125, -3.79339599609375, -3.669769287109375, -3.546142578125, -3.422515869140625, -3.29888916015625, -3.175262451171875, -3.0516357421875, -2.928009033203125, -2.80438232421875, -2.680755615234375, -2.55712890625, -2.433502197265625, -2.30987548828125, -2.186248779296875, -2.0626220703125, -1.938995361328125, -1.81536865234375, -1.691741943359375, -1.568115234375, -1.444488525390625, -1.32086181640625, -1.197235107421875, -1.0736083984375, -0.949981689453125, -0.82635498046875, -0.702728271484375, -0.5791015625, -0.455474853515625, -0.33184814453125, -0.208221435546875, -0.0845947265625, 0.039031982421875, 0.16265869140625, 0.286285400390625, 0.409912109375, 0.533538818359375, 0.65716552734375, 0.780792236328125, 0.9044189453125, 1.028045654296875, 1.15167236328125, 1.275299072265625, 1.39892578125, 1.522552490234375, 1.64617919921875, 1.769805908203125, 1.8934326171875, 2.017059326171875, 2.14068603515625, 2.264312744140625, 2.387939453125, 2.511566162109375, 2.63519287109375, 2.758819580078125, 2.8824462890625, 3.006072998046875, 3.12969970703125, 3.253326416015625, 3.376953125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 9.0, 7.0, 15.0, 21.0, 32.0, 54.0, 85.0, 179.0, 295.0, 718.0, 1860.0, 5351.0, 17245.0, 62183.0, 316640.0, 513875.0, 93705.0, 24646.0, 7389.0, 2457.0, 916.0, 392.0, 206.0, 105.0, 54.0, 37.0, 24.0, 15.0, 13.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.83734130859375, -3.7215576171875, -3.60577392578125, -3.489990234375, -3.37420654296875, -3.2584228515625, -3.14263916015625, -3.02685546875, -2.91107177734375, -2.7952880859375, -2.67950439453125, -2.563720703125, -2.44793701171875, -2.3321533203125, -2.21636962890625, -2.1005859375, -1.98480224609375, -1.8690185546875, -1.75323486328125, -1.637451171875, -1.52166748046875, -1.4058837890625, -1.29010009765625, -1.17431640625, -1.05853271484375, -0.9427490234375, -0.82696533203125, -0.711181640625, -0.59539794921875, -0.4796142578125, -0.36383056640625, -0.248046875, -0.13226318359375, -0.0164794921875, 0.09930419921875, 0.215087890625, 0.33087158203125, 0.4466552734375, 0.56243896484375, 0.67822265625, 0.79400634765625, 0.9097900390625, 1.02557373046875, 1.141357421875, 1.25714111328125, 1.3729248046875, 1.48870849609375, 1.6044921875, 1.72027587890625, 1.8360595703125, 1.95184326171875, 2.067626953125, 2.18341064453125, 2.2991943359375, 2.41497802734375, 2.53076171875, 2.64654541015625, 2.7623291015625, 2.87811279296875, 2.993896484375, 3.10968017578125, 3.2254638671875, 3.34124755859375, 3.45703125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 4.0, 9.0, 15.0, 15.0, 13.0, 18.0, 20.0, 14.0, 29.0, 30.0, 30.0, 33.0, 42.0, 34.0, 51.0, 64.0, 74.0, 183.0, 1624.0, 203.0, 108.0, 60.0, 56.0, 35.0, 32.0, 48.0, 28.0, 25.0, 25.0, 23.0, 20.0, 13.0, 14.0, 17.0, 5.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.238525390625, -7.96923828125, -7.699951171875, -7.4306640625, -7.161376953125, -6.89208984375, -6.622802734375, -6.353515625, -6.084228515625, -5.81494140625, -5.545654296875, -5.2763671875, -5.007080078125, -4.73779296875, -4.468505859375, -4.19921875, -3.929931640625, -3.66064453125, -3.391357421875, -3.1220703125, -2.852783203125, -2.58349609375, -2.314208984375, -2.044921875, -1.775634765625, -1.50634765625, -1.237060546875, -0.9677734375, -0.698486328125, -0.42919921875, -0.159912109375, 0.109375, 0.378662109375, 0.64794921875, 0.917236328125, 1.1865234375, 1.455810546875, 1.72509765625, 1.994384765625, 2.263671875, 2.532958984375, 2.80224609375, 3.071533203125, 3.3408203125, 3.610107421875, 3.87939453125, 4.148681640625, 4.41796875, 4.687255859375, 4.95654296875, 5.225830078125, 5.4951171875, 5.764404296875, 6.03369140625, 6.302978515625, 6.572265625, 6.841552734375, 7.11083984375, 7.380126953125, 7.6494140625, 7.918701171875, 8.18798828125, 8.457275390625, 8.7265625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 12.0, 18.0, 20.0, 30.0, 27.0, 27.0, 41.0, 63.0, 103.0, 236.0, 503.0, 1141.0, 3422.0, 19290.0, 520523.0, 2549225.0, 42533.0, 5497.0, 1652.0, 585.0, 244.0, 146.0, 81.0, 53.0, 43.0, 28.0, 21.0, 19.0, 21.0, 15.0, 16.0, 11.0, 12.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.6343994140625, -11.260986328125, -10.8875732421875, -10.51416015625, -10.1407470703125, -9.767333984375, -9.3939208984375, -9.0205078125, -8.6470947265625, -8.273681640625, -7.9002685546875, -7.52685546875, -7.1534423828125, -6.780029296875, -6.4066162109375, -6.033203125, -5.6597900390625, -5.286376953125, -4.9129638671875, -4.53955078125, -4.1661376953125, -3.792724609375, -3.4193115234375, -3.0458984375, -2.6724853515625, -2.299072265625, -1.9256591796875, -1.55224609375, -1.1788330078125, -0.805419921875, -0.4320068359375, -0.05859375, 0.3148193359375, 0.688232421875, 1.0616455078125, 1.43505859375, 1.8084716796875, 2.181884765625, 2.5552978515625, 2.9287109375, 3.3021240234375, 3.675537109375, 4.0489501953125, 4.42236328125, 4.7957763671875, 5.169189453125, 5.5426025390625, 5.916015625, 6.2894287109375, 6.662841796875, 7.0362548828125, 7.40966796875, 7.7830810546875, 8.156494140625, 8.5299072265625, 8.9033203125, 9.2767333984375, 9.650146484375, 10.0235595703125, 10.39697265625, 10.7703857421875, 11.143798828125, 11.5172119140625, 11.890625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 16.0, 38.0, 78.0, 155.0, 170.0, 205.0, 147.0, 108.0, 58.0, 20.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.738855361938477, -27.924104690551758, -27.10935401916504, -26.29460334777832, -25.4798526763916, -24.665102005004883, -23.85034942626953, -23.035598754882812, -22.220848083496094, -21.406097412109375, -20.591346740722656, -19.776596069335938, -18.96184539794922, -18.1470947265625, -17.33234405517578, -16.517593383789062, -15.702842712402344, -14.888092041015625, -14.073341369628906, -13.258590698242188, -12.443840026855469, -11.62908935546875, -10.814337730407715, -9.999587059020996, -9.184836387634277, -8.370085716247559, -7.55533504486084, -6.740583896636963, -5.925833225250244, -5.111082553863525, -4.296331405639648, -3.4815807342529297, -2.6668319702148438, -1.8520811796188354, -1.0373303890228271, -0.2225794792175293, 0.5921711921691895, 1.4069218635559082, 2.221673011779785, 3.036423683166504, 3.8511743545532227, 4.665925025939941, 5.48067569732666, 6.295426845550537, 7.110177516937256, 7.924928188323975, 8.739679336547852, 9.55443000793457, 10.369180679321289, 11.183931350708008, 11.998682022094727, 12.813432693481445, 13.628183364868164, 14.442934036254883, 15.257685661315918, 16.072437286376953, 16.887187957763672, 17.70193862915039, 18.51668930053711, 19.331439971923828, 20.146190643310547, 20.960941314697266, 21.775691986083984, 22.590442657470703, 23.405193328857422]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 6.0, 12.0, 8.0, 13.0, 14.0, 18.0, 22.0, 22.0, 19.0, 20.0, 33.0, 29.0, 36.0, 38.0, 44.0, 35.0, 27.0, 35.0, 26.0, 36.0, 27.0, 31.0, 37.0, 42.0, 37.0, 37.0, 39.0, 35.0, 22.0, 22.0, 15.0, 20.0, 21.0, 21.0, 13.0, 9.0, 15.0, 8.0, 13.0, 4.0, 7.0, 7.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-29.035263061523438, -28.222087860107422, -27.408910751342773, -26.595735549926758, -25.78255844116211, -24.969383239746094, -24.156208038330078, -23.34303092956543, -22.52985382080078, -21.716678619384766, -20.903501510620117, -20.0903263092041, -19.277149200439453, -18.463973999023438, -17.650798797607422, -16.837621688842773, -16.024446487426758, -15.211270332336426, -14.398094177246094, -13.584918975830078, -12.77174186706543, -11.958566665649414, -11.145390510559082, -10.33221435546875, -9.519038200378418, -8.705862045288086, -7.892685890197754, -7.07951021194458, -6.266334056854248, -5.453157901763916, -4.639982223510742, -3.82680606842041, -3.013629913330078, -2.200453758239746, -1.3872778415679932, -0.5741019248962402, 0.2390742301940918, 1.0522503852844238, 1.8654260635375977, 2.6786022186279297, 3.4917783737182617, 4.304954528808594, 5.118130683898926, 5.9313063621521, 6.744482517242432, 7.557658672332764, 8.370834350585938, 9.18401050567627, 9.997186660766602, 10.810362815856934, 11.623538970947266, 12.436714172363281, 13.24989128112793, 14.063066482543945, 14.876242637634277, 15.68941879272461, 16.502593994140625, 17.31576919555664, 18.12894630432129, 18.942121505737305, 19.755298614501953, 20.56847381591797, 21.381649017333984, 22.194826126098633, 23.00800323486328]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 1.0, 2.0, 3.0, 16.0, 13.0, 30.0, 21.0, 38.0, 53.0, 59.0, 62.0, 65.0, 78.0, 93.0, 100.0, 77.0, 71.0, 48.0, 45.0, 36.0, 41.0, 21.0, 11.0, 7.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4375, -4.3154296875, -4.193359375, -4.0712890625, -3.94921875, -3.8271484375, -3.705078125, -3.5830078125, -3.4609375, -3.3388671875, -3.216796875, -3.0947265625, -2.97265625, -2.8505859375, -2.728515625, -2.6064453125, -2.484375, -2.3623046875, -2.240234375, -2.1181640625, -1.99609375, -1.8740234375, -1.751953125, -1.6298828125, -1.5078125, -1.3857421875, -1.263671875, -1.1416015625, -1.01953125, -0.8974609375, -0.775390625, -0.6533203125, -0.53125, -0.4091796875, -0.287109375, -0.1650390625, -0.04296875, 0.0791015625, 0.201171875, 0.3232421875, 0.4453125, 0.5673828125, 0.689453125, 0.8115234375, 0.93359375, 1.0556640625, 1.177734375, 1.2998046875, 1.421875, 1.5439453125, 1.666015625, 1.7880859375, 1.91015625, 2.0322265625, 2.154296875, 2.2763671875, 2.3984375, 2.5205078125, 2.642578125, 2.7646484375, 2.88671875, 3.0087890625, 3.130859375, 3.2529296875, 3.375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 18.0, 14.0, 36.0, 35.0, 62.0, 88.0, 163.0, 310.0, 680.0, 1563.0, 5208.0, 39891.0, 3849853.0, 282621.0, 9928.0, 2313.0, 776.0, 351.0, 140.0, 78.0, 38.0, 37.0, 17.0, 10.0, 7.0, 6.0, 9.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -24.306640625, -23.64453125, -22.982421875, -22.3203125, -21.658203125, -20.99609375, -20.333984375, -19.671875, -19.009765625, -18.34765625, -17.685546875, -17.0234375, -16.361328125, -15.69921875, -15.037109375, -14.375, -13.712890625, -13.05078125, -12.388671875, -11.7265625, -11.064453125, -10.40234375, -9.740234375, -9.078125, -8.416015625, -7.75390625, -7.091796875, -6.4296875, -5.767578125, -5.10546875, -4.443359375, -3.78125, -3.119140625, -2.45703125, -1.794921875, -1.1328125, -0.470703125, 0.19140625, 0.853515625, 1.515625, 2.177734375, 2.83984375, 3.501953125, 4.1640625, 4.826171875, 5.48828125, 6.150390625, 6.8125, 7.474609375, 8.13671875, 8.798828125, 9.4609375, 10.123046875, 10.78515625, 11.447265625, 12.109375, 12.771484375, 13.43359375, 14.095703125, 14.7578125, 15.419921875, 16.08203125, 16.744140625, 17.40625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 7.0, 5.0, 5.0, 10.0, 18.0, 15.0, 34.0, 50.0, 46.0, 96.0, 117.0, 237.0, 334.0, 473.0, 627.0, 629.0, 455.0, 342.0, 185.0, 109.0, 63.0, 46.0, 42.0, 26.0, 24.0, 22.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.51953125, -7.290283203125, -7.06103515625, -6.831787109375, -6.6025390625, -6.373291015625, -6.14404296875, -5.914794921875, -5.685546875, -5.456298828125, -5.22705078125, -4.997802734375, -4.7685546875, -4.539306640625, -4.31005859375, -4.080810546875, -3.8515625, -3.622314453125, -3.39306640625, -3.163818359375, -2.9345703125, -2.705322265625, -2.47607421875, -2.246826171875, -2.017578125, -1.788330078125, -1.55908203125, -1.329833984375, -1.1005859375, -0.871337890625, -0.64208984375, -0.412841796875, -0.18359375, 0.045654296875, 0.27490234375, 0.504150390625, 0.7333984375, 0.962646484375, 1.19189453125, 1.421142578125, 1.650390625, 1.879638671875, 2.10888671875, 2.338134765625, 2.5673828125, 2.796630859375, 3.02587890625, 3.255126953125, 3.484375, 3.713623046875, 3.94287109375, 4.172119140625, 4.4013671875, 4.630615234375, 4.85986328125, 5.089111328125, 5.318359375, 5.547607421875, 5.77685546875, 6.006103515625, 6.2353515625, 6.464599609375, 6.69384765625, 6.923095703125, 7.15234375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 13.0, 18.0, 21.0, 42.0, 64.0, 107.0, 198.0, 276.0, 520.0, 995.0, 1585.0, 2913.0, 5787.0, 12732.0, 34248.0, 138317.0, 1094385.0, 2462918.0, 340120.0, 62008.0, 19850.0, 8273.0, 3974.0, 2024.0, 1181.0, 673.0, 421.0, 229.0, 145.0, 99.0, 53.0, 29.0, 22.0, 12.0, 7.0, 10.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.875, -10.52685546875, -10.1787109375, -9.83056640625, -9.482421875, -9.13427734375, -8.7861328125, -8.43798828125, -8.08984375, -7.74169921875, -7.3935546875, -7.04541015625, -6.697265625, -6.34912109375, -6.0009765625, -5.65283203125, -5.3046875, -4.95654296875, -4.6083984375, -4.26025390625, -3.912109375, -3.56396484375, -3.2158203125, -2.86767578125, -2.51953125, -2.17138671875, -1.8232421875, -1.47509765625, -1.126953125, -0.77880859375, -0.4306640625, -0.08251953125, 0.265625, 0.61376953125, 0.9619140625, 1.31005859375, 1.658203125, 2.00634765625, 2.3544921875, 2.70263671875, 3.05078125, 3.39892578125, 3.7470703125, 4.09521484375, 4.443359375, 4.79150390625, 5.1396484375, 5.48779296875, 5.8359375, 6.18408203125, 6.5322265625, 6.88037109375, 7.228515625, 7.57666015625, 7.9248046875, 8.27294921875, 8.62109375, 8.96923828125, 9.3173828125, 9.66552734375, 10.013671875, 10.36181640625, 10.7099609375, 11.05810546875, 11.40625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 23.0, 27.0, 60.0, 86.0, 121.0, 162.0, 128.0, 139.0, 91.0, 60.0, 41.0, 27.0, 14.0, 5.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.423763275146484, -59.6796760559082, -57.93558883666992, -56.19150161743164, -54.447410583496094, -52.70332336425781, -50.95923614501953, -49.21514892578125, -47.47106170654297, -45.72697448730469, -43.982887268066406, -42.238800048828125, -40.494712829589844, -38.75062561035156, -37.006534576416016, -35.262447357177734, -33.51836013793945, -31.774272918701172, -30.03018569946289, -28.286096572875977, -26.542009353637695, -24.797922134399414, -23.0538330078125, -21.30974578857422, -19.565658569335938, -17.821571350097656, -16.077484130859375, -14.333395004272461, -12.58930778503418, -10.845220565795898, -9.1011323928833, -7.357044219970703, -5.612953186035156, -3.868865489959717, -2.1247777938842773, -0.3806900978088379, 1.3633975982666016, 3.107484817504883, 4.8515729904174805, 6.595661163330078, 8.33974838256836, 10.08383560180664, 11.827923774719238, 13.572011947631836, 15.316099166870117, 17.0601863861084, 18.804275512695312, 20.548362731933594, 22.292449951171875, 24.036537170410156, 25.780624389648438, 27.52471351623535, 29.268800735473633, 31.012887954711914, 32.75697708129883, 34.50106430053711, 36.24515151977539, 37.98923873901367, 39.73332595825195, 41.477413177490234, 43.22150421142578, 44.96559143066406, 46.709678649902344, 48.453765869140625, 50.197853088378906]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 0.0, 3.0, 2.0, 3.0, 8.0, 0.0, 5.0, 6.0, 5.0, 13.0, 6.0, 13.0, 18.0, 15.0, 24.0, 20.0, 16.0, 19.0, 30.0, 31.0, 20.0, 41.0, 39.0, 39.0, 40.0, 37.0, 30.0, 53.0, 36.0, 37.0, 24.0, 53.0, 35.0, 33.0, 36.0, 31.0, 34.0, 22.0, 17.0, 18.0, 14.0, 13.0, 11.0, 12.0, 7.0, 8.0, 11.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.55889129638672, -18.92671775817871, -18.294546127319336, -17.662372589111328, -17.03019905090332, -16.398025512695312, -15.765853881835938, -15.13368034362793, -14.501507759094238, -13.869335174560547, -13.237161636352539, -12.604989051818848, -11.972816467285156, -11.340642929077148, -10.708470344543457, -10.076297760009766, -9.444124221801758, -8.811951637268066, -8.179778099060059, -7.547605514526367, -6.915432453155518, -6.283259391784668, -5.651086807250977, -5.018913745880127, -4.386740684509277, -3.7545676231384277, -3.1223948001861572, -2.4902219772338867, -1.858048915863037, -1.2258758544921875, -0.593703031539917, 0.038469791412353516, 0.6706409454345703, 1.3028138875961304, 1.9349868297576904, 2.567159652709961, 3.1993327140808105, 3.83150577545166, 4.463678359985352, 5.095851421356201, 5.728024482727051, 6.3601975440979, 6.99237060546875, 7.624543190002441, 8.256715774536133, 8.88888931274414, 9.521061897277832, 10.153234481811523, 10.785408020019531, 11.417580604553223, 12.04975414276123, 12.681926727294922, 13.31410026550293, 13.946272850036621, 14.578445434570312, 15.21061897277832, 15.842791557312012, 16.474964141845703, 17.10713768005371, 17.73931121826172, 18.371482849121094, 19.0036563873291, 19.63582992553711, 20.268001556396484, 20.900175094604492]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 11.0, 9.0, 16.0, 23.0, 31.0, 39.0, 49.0, 51.0, 49.0, 67.0, 73.0, 83.0, 82.0, 77.0, 78.0, 64.0, 47.0, 39.0, 29.0, 23.0, 22.0, 13.0, 10.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.18353271484375, -4.0662841796875, -3.94903564453125, -3.831787109375, -3.71453857421875, -3.5972900390625, -3.48004150390625, -3.36279296875, -3.24554443359375, -3.1282958984375, -3.01104736328125, -2.893798828125, -2.77655029296875, -2.6593017578125, -2.54205322265625, -2.4248046875, -2.30755615234375, -2.1903076171875, -2.07305908203125, -1.955810546875, -1.83856201171875, -1.7213134765625, -1.60406494140625, -1.48681640625, -1.36956787109375, -1.2523193359375, -1.13507080078125, -1.017822265625, -0.90057373046875, -0.7833251953125, -0.66607666015625, -0.548828125, -0.43157958984375, -0.3143310546875, -0.19708251953125, -0.079833984375, 0.03741455078125, 0.1546630859375, 0.27191162109375, 0.38916015625, 0.50640869140625, 0.6236572265625, 0.74090576171875, 0.858154296875, 0.97540283203125, 1.0926513671875, 1.20989990234375, 1.3271484375, 1.44439697265625, 1.5616455078125, 1.67889404296875, 1.796142578125, 1.91339111328125, 2.0306396484375, 2.14788818359375, 2.26513671875, 2.38238525390625, 2.4996337890625, 2.61688232421875, 2.734130859375, 2.85137939453125, 2.9686279296875, 3.08587646484375, 3.203125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 5.0, 8.0, 15.0, 23.0, 22.0, 53.0, 43.0, 64.0, 111.0, 141.0, 231.0, 354.0, 592.0, 1121.0, 1933.0, 3581.0, 6898.0, 13938.0, 32444.0, 83191.0, 281711.0, 430056.0, 113770.0, 42163.0, 18028.0, 8326.0, 4300.0, 2235.0, 1268.0, 661.0, 397.0, 278.0, 186.0, 118.0, 77.0, 57.0, 46.0, 31.0, 20.0, 19.0, 7.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.220703125, -0.21361732482910156, -0.20653152465820312, -0.1994457244873047, -0.19235992431640625, -0.1852741241455078, -0.17818832397460938, -0.17110252380371094, -0.1640167236328125, -0.15693092346191406, -0.14984512329101562, -0.1427593231201172, -0.13567352294921875, -0.1285877227783203, -0.12150192260742188, -0.11441612243652344, -0.107330322265625, -0.10024452209472656, -0.09315872192382812, -0.08607292175292969, -0.07898712158203125, -0.07190132141113281, -0.06481552124023438, -0.05772972106933594, -0.0506439208984375, -0.04355812072753906, -0.036472320556640625, -0.029386520385742188, -0.02230072021484375, -0.015214920043945312, -0.008129119873046875, -0.0010433197021484375, 0.00604248046875, 0.013128280639648438, 0.020214080810546875, 0.027299880981445312, 0.03438568115234375, 0.04147148132324219, 0.048557281494140625, 0.05564308166503906, 0.0627288818359375, 0.06981468200683594, 0.07690048217773438, 0.08398628234863281, 0.09107208251953125, 0.09815788269042969, 0.10524368286132812, 0.11232948303222656, 0.119415283203125, 0.12650108337402344, 0.13358688354492188, 0.1406726837158203, 0.14775848388671875, 0.1548442840576172, 0.16193008422851562, 0.16901588439941406, 0.1761016845703125, 0.18318748474121094, 0.19027328491210938, 0.1973590850830078, 0.20444488525390625, 0.2115306854248047, 0.21861648559570312, 0.22570228576660156, 0.2327880859375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 3.0, 3.0, 12.0, 5.0, 10.0, 13.0, 20.0, 25.0, 18.0, 23.0, 22.0, 23.0, 28.0, 27.0, 33.0, 26.0, 35.0, 32.0, 35.0, 49.0, 46.0, 1064.0, 41.0, 26.0, 40.0, 26.0, 36.0, 45.0, 25.0, 27.0, 30.0, 20.0, 19.0, 15.0, 22.0, 16.0, 12.0, 13.0, 6.0, 8.0, 11.0, 8.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.75390625, -1.6923828125, -1.630859375, -1.5693359375, -1.5078125, -1.4462890625, -1.384765625, -1.3232421875, -1.26171875, -1.2001953125, -1.138671875, -1.0771484375, -1.015625, -0.9541015625, -0.892578125, -0.8310546875, -0.76953125, -0.7080078125, -0.646484375, -0.5849609375, -0.5234375, -0.4619140625, -0.400390625, -0.3388671875, -0.27734375, -0.2158203125, -0.154296875, -0.0927734375, -0.03125, 0.0302734375, 0.091796875, 0.1533203125, 0.21484375, 0.2763671875, 0.337890625, 0.3994140625, 0.4609375, 0.5224609375, 0.583984375, 0.6455078125, 0.70703125, 0.7685546875, 0.830078125, 0.8916015625, 0.953125, 1.0146484375, 1.076171875, 1.1376953125, 1.19921875, 1.2607421875, 1.322265625, 1.3837890625, 1.4453125, 1.5068359375, 1.568359375, 1.6298828125, 1.69140625, 1.7529296875, 1.814453125, 1.8759765625, 1.9375, 1.9990234375, 2.060546875, 2.1220703125, 2.18359375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 6.0, 5.0, 8.0, 17.0, 20.0, 23.0, 26.0, 62.0, 61.0, 102.0, 148.0, 197.0, 267.0, 378.0, 563.0, 667.0, 927.0, 1296.0, 1818.0, 2533.0, 3623.0, 5171.0, 7089.0, 10240.0, 14920.0, 21567.0, 32635.0, 49898.0, 81573.0, 152216.0, 1317566.0, 154009.0, 81820.0, 50179.0, 32756.0, 21974.0, 15061.0, 10414.0, 7319.0, 5150.0, 3673.0, 2563.0, 1957.0, 1348.0, 968.0, 687.0, 444.0, 368.0, 223.0, 182.0, 115.0, 89.0, 60.0, 50.0, 30.0, 33.0, 18.0, 9.0, 11.0, 7.0, 4.0, 4.0], "bins": [-0.043121337890625, -0.041794776916503906, -0.04046821594238281, -0.03914165496826172, -0.037815093994140625, -0.03648853302001953, -0.03516197204589844, -0.033835411071777344, -0.03250885009765625, -0.031182289123535156, -0.029855728149414062, -0.02852916717529297, -0.027202606201171875, -0.02587604522705078, -0.024549484252929688, -0.023222923278808594, -0.0218963623046875, -0.020569801330566406, -0.019243240356445312, -0.01791667938232422, -0.016590118408203125, -0.015263557434082031, -0.013936996459960938, -0.012610435485839844, -0.01128387451171875, -0.009957313537597656, -0.008630752563476562, -0.007304191589355469, -0.005977630615234375, -0.004651069641113281, -0.0033245086669921875, -0.0019979476928710938, -0.00067138671875, 0.0006551742553710938, 0.0019817352294921875, 0.0033082962036132812, 0.004634857177734375, 0.005961418151855469, 0.0072879791259765625, 0.008614540100097656, 0.00994110107421875, 0.011267662048339844, 0.012594223022460938, 0.013920783996582031, 0.015247344970703125, 0.01657390594482422, 0.017900466918945312, 0.019227027893066406, 0.0205535888671875, 0.021880149841308594, 0.023206710815429688, 0.02453327178955078, 0.025859832763671875, 0.02718639373779297, 0.028512954711914062, 0.029839515686035156, 0.03116607666015625, 0.032492637634277344, 0.03381919860839844, 0.03514575958251953, 0.036472320556640625, 0.03779888153076172, 0.03912544250488281, 0.040452003479003906, 0.041778564453125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 6.0, 8.0, 15.0, 14.0, 17.0, 16.0, 14.0, 17.0, 24.0, 42.0, 32.0, 50.0, 77.0, 103.0, 111.0, 100.0, 88.0, 48.0, 40.0, 31.0, 31.0, 22.0, 15.0, 20.0, 5.0, 12.0, 4.0, 10.0, 4.0, 2.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005235671997070312, -0.0005052238702774048, -0.0004868805408477783, -0.00046853721141815186, -0.0004501938819885254, -0.0004318505525588989, -0.00041350722312927246, -0.000395163893699646, -0.00037682056427001953, -0.00035847723484039307, -0.0003401339054107666, -0.00032179057598114014, -0.00030344724655151367, -0.0002851039171218872, -0.00026676058769226074, -0.0002484172582626343, -0.0002300739288330078, -0.00021173059940338135, -0.00019338726997375488, -0.00017504394054412842, -0.00015670061111450195, -0.0001383572816848755, -0.00012001395225524902, -0.00010167062282562256, -8.33272933959961e-05, -6.498396396636963e-05, -4.6640634536743164e-05, -2.82973051071167e-05, -9.953975677490234e-06, 8.38935375213623e-06, 2.6732683181762695e-05, 4.507601261138916e-05, 6.341934204101562e-05, 8.176267147064209e-05, 0.00010010600090026855, 0.00011844933032989502, 0.00013679265975952148, 0.00015513598918914795, 0.00017347931861877441, 0.00019182264804840088, 0.00021016597747802734, 0.0002285093069076538, 0.0002468526363372803, 0.00026519596576690674, 0.0002835392951965332, 0.00030188262462615967, 0.00032022595405578613, 0.0003385692834854126, 0.00035691261291503906, 0.00037525594234466553, 0.000393599271774292, 0.00041194260120391846, 0.0004302859306335449, 0.0004486292600631714, 0.00046697258949279785, 0.0004853159189224243, 0.0005036592483520508, 0.0005220025777816772, 0.0005403459072113037, 0.0005586892366409302, 0.0005770325660705566, 0.0005953758955001831, 0.0006137192249298096, 0.000632062554359436, 0.0006504058837890625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 7.0, 9.0, 13.0, 21.0, 21.0, 29.0, 57.0, 67.0, 96.0, 126.0, 210.0, 886.0, 8087.0, 155497.0, 844419.0, 35458.0, 2582.0, 418.0, 177.0, 99.0, 64.0, 35.0, 38.0, 31.0, 24.0, 18.0, 12.0, 9.0, 13.0, 6.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01025390625, -0.009963154792785645, -0.009672403335571289, -0.009381651878356934, -0.009090900421142578, -0.008800148963928223, -0.008509397506713867, -0.008218646049499512, -0.007927894592285156, -0.007637143135070801, -0.007346391677856445, -0.00705564022064209, -0.006764888763427734, -0.006474137306213379, -0.0061833858489990234, -0.005892634391784668, -0.0056018829345703125, -0.005311131477355957, -0.0050203800201416016, -0.004729628562927246, -0.004438877105712891, -0.004148125648498535, -0.0038573741912841797, -0.0035666227340698242, -0.0032758712768554688, -0.0029851198196411133, -0.002694368362426758, -0.0024036169052124023, -0.002112865447998047, -0.0018221139907836914, -0.001531362533569336, -0.0012406110763549805, -0.000949859619140625, -0.0006591081619262695, -0.00036835670471191406, -7.76052474975586e-05, 0.00021314620971679688, 0.0005038976669311523, 0.0007946491241455078, 0.0010854005813598633, 0.0013761520385742188, 0.0016669034957885742, 0.0019576549530029297, 0.002248406410217285, 0.0025391578674316406, 0.002829909324645996, 0.0031206607818603516, 0.003411412239074707, 0.0037021636962890625, 0.003992915153503418, 0.0042836666107177734, 0.004574418067932129, 0.004865169525146484, 0.00515592098236084, 0.005446672439575195, 0.005737423896789551, 0.006028175354003906, 0.006318926811218262, 0.006609678268432617, 0.006900429725646973, 0.007191181182861328, 0.007481932640075684, 0.007772684097290039, 0.008063435554504395, 0.00835418701171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 11.0, 51.0, 607.0, 323.0, 24.0], "bins": [-0.013291134499013424, -0.013076398521661758, -0.012861662544310093, -0.012646926566958427, -0.012432190589606762, -0.012217454612255096, -0.012002719566226006, -0.01178798358887434, -0.011573247611522675, -0.011358511634171009, -0.011143775656819344, -0.010929039679467678, -0.010714303702116013, -0.010499568656086922, -0.010284831747412682, -0.01007009670138359, -0.00985535979270935, -0.009640623815357685, -0.00942588783800602, -0.009211151860654354, -0.008996415883302689, -0.008781680837273598, -0.008566943928599358, -0.008352208882570267, -0.008137472905218601, -0.007922736927866936, -0.00770800095051527, -0.007493264973163605, -0.0072785294614732265, -0.007063793484121561, -0.0068490575067698956, -0.00663432152941823, -0.0064195855520665646, -0.006204849574714899, -0.0059901135973632336, -0.005775378085672855, -0.00556064210832119, -0.005345906130969524, -0.005131170153617859, -0.004916434176266193, -0.004701698198914528, -0.004486962221562862, -0.004272226244211197, -0.004057490266859531, -0.003842754755169153, -0.0036280187778174877, -0.0034132828004658222, -0.0031985468231141567, -0.0029838113114237785, -0.002769075334072113, -0.002554339589551091, -0.0023396036121994257, -0.002124867867678404, -0.0019101318903267384, -0.0016953959129750729, -0.0014806600520387292, -0.0012659241911023855, -0.0010511883301660419, -0.0008364524110220373, -0.0006217164918780327, -0.000406980630941689, -0.00019224477000534534, 2.2491207346320152e-05, 0.00023722706828266382, 0.0004519629292190075]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 14.0, 15.0, 21.0, 36.0, 26.0, 46.0, 43.0, 48.0, 64.0, 55.0, 64.0, 59.0, 70.0, 61.0, 62.0, 53.0, 52.0, 42.0, 31.0, 26.0, 25.0, 21.0, 19.0, 13.0, 6.0, 12.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005148649215698242, -0.0004944652318954468, -0.00047406554222106934, -0.0004536658525466919, -0.00043326616287231445, -0.000412866473197937, -0.00039246678352355957, -0.00037206709384918213, -0.0003516674041748047, -0.00033126771450042725, -0.0003108680248260498, -0.00029046833515167236, -0.0002700686454772949, -0.0002496689558029175, -0.00022926926612854004, -0.0002088695764541626, -0.00018846988677978516, -0.00016807019710540771, -0.00014767050743103027, -0.00012727081775665283, -0.00010687112808227539, -8.647143840789795e-05, -6.607174873352051e-05, -4.5672059059143066e-05, -2.5272369384765625e-05, -4.872679710388184e-06, 1.5527009963989258e-05, 3.59266996383667e-05, 5.632638931274414e-05, 7.672607898712158e-05, 9.712576866149902e-05, 0.00011752545833587646, 0.0001379251480102539, 0.00015832483768463135, 0.0001787245273590088, 0.00019912421703338623, 0.00021952390670776367, 0.0002399235963821411, 0.00026032328605651855, 0.000280722975730896, 0.00030112266540527344, 0.0003215223550796509, 0.0003419220447540283, 0.00036232173442840576, 0.0003827214241027832, 0.00040312111377716064, 0.0004235208034515381, 0.00044392049312591553, 0.00046432018280029297, 0.0004847198724746704, 0.0005051195621490479, 0.0005255192518234253, 0.0005459189414978027, 0.0005663186311721802, 0.0005867183208465576, 0.0006071180105209351, 0.0006275177001953125, 0.0006479173898696899, 0.0006683170795440674, 0.0006887167692184448, 0.0007091164588928223, 0.0007295161485671997, 0.0007499158382415771, 0.0007703155279159546, 0.000790715217590332]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 11.0, 9.0, 16.0, 23.0, 31.0, 39.0, 49.0, 51.0, 49.0, 67.0, 73.0, 83.0, 82.0, 77.0, 78.0, 64.0, 47.0, 39.0, 29.0, 23.0, 22.0, 13.0, 10.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.30078125, -4.18353271484375, -4.0662841796875, -3.94903564453125, -3.831787109375, -3.71453857421875, -3.5972900390625, -3.48004150390625, -3.36279296875, -3.24554443359375, -3.1282958984375, -3.01104736328125, -2.893798828125, -2.77655029296875, -2.6593017578125, -2.54205322265625, -2.4248046875, -2.30755615234375, -2.1903076171875, -2.07305908203125, -1.955810546875, -1.83856201171875, -1.7213134765625, -1.60406494140625, -1.48681640625, -1.36956787109375, -1.2523193359375, -1.13507080078125, -1.017822265625, -0.90057373046875, -0.7833251953125, -0.66607666015625, -0.548828125, -0.43157958984375, -0.3143310546875, -0.19708251953125, -0.079833984375, 0.03741455078125, 0.1546630859375, 0.27191162109375, 0.38916015625, 0.50640869140625, 0.6236572265625, 0.74090576171875, 0.858154296875, 0.97540283203125, 1.0926513671875, 1.20989990234375, 1.3271484375, 1.44439697265625, 1.5616455078125, 1.67889404296875, 1.796142578125, 1.91339111328125, 2.0306396484375, 2.14788818359375, 2.26513671875, 2.38238525390625, 2.4996337890625, 2.61688232421875, 2.734130859375, 2.85137939453125, 2.9686279296875, 3.08587646484375, 3.203125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 8.0, 9.0, 11.0, 21.0, 21.0, 46.0, 73.0, 127.0, 209.0, 501.0, 1128.0, 3242.0, 13089.0, 91205.0, 814384.0, 104808.0, 13904.0, 3544.0, 1207.0, 488.0, 224.0, 120.0, 63.0, 44.0, 32.0, 15.0, 13.0, 12.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2578125, -10.9219970703125, -10.586181640625, -10.2503662109375, -9.91455078125, -9.5787353515625, -9.242919921875, -8.9071044921875, -8.5712890625, -8.2354736328125, -7.899658203125, -7.5638427734375, -7.22802734375, -6.8922119140625, -6.556396484375, -6.2205810546875, -5.884765625, -5.5489501953125, -5.213134765625, -4.8773193359375, -4.54150390625, -4.2056884765625, -3.869873046875, -3.5340576171875, -3.1982421875, -2.8624267578125, -2.526611328125, -2.1907958984375, -1.85498046875, -1.5191650390625, -1.183349609375, -0.8475341796875, -0.51171875, -0.1759033203125, 0.159912109375, 0.4957275390625, 0.83154296875, 1.1673583984375, 1.503173828125, 1.8389892578125, 2.1748046875, 2.5106201171875, 2.846435546875, 3.1822509765625, 3.51806640625, 3.8538818359375, 4.189697265625, 4.5255126953125, 4.861328125, 5.1971435546875, 5.532958984375, 5.8687744140625, 6.20458984375, 6.5404052734375, 6.876220703125, 7.2120361328125, 7.5478515625, 7.8836669921875, 8.219482421875, 8.5552978515625, 8.89111328125, 9.2269287109375, 9.562744140625, 9.8985595703125, 10.234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 10.0, 4.0, 5.0, 5.0, 7.0, 5.0, 7.0, 15.0, 15.0, 25.0, 21.0, 24.0, 25.0, 23.0, 48.0, 33.0, 19.0, 39.0, 46.0, 58.0, 64.0, 110.0, 190.0, 1367.0, 236.0, 120.0, 52.0, 53.0, 43.0, 43.0, 43.0, 32.0, 26.0, 17.0, 34.0, 24.0, 20.0, 28.0, 18.0, 15.0, 13.0, 8.0, 11.0, 9.0, 10.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.86328125, -6.6466064453125, -6.429931640625, -6.2132568359375, -5.99658203125, -5.7799072265625, -5.563232421875, -5.3465576171875, -5.1298828125, -4.9132080078125, -4.696533203125, -4.4798583984375, -4.26318359375, -4.0465087890625, -3.829833984375, -3.6131591796875, -3.396484375, -3.1798095703125, -2.963134765625, -2.7464599609375, -2.52978515625, -2.3131103515625, -2.096435546875, -1.8797607421875, -1.6630859375, -1.4464111328125, -1.229736328125, -1.0130615234375, -0.79638671875, -0.5797119140625, -0.363037109375, -0.1463623046875, 0.0703125, 0.2869873046875, 0.503662109375, 0.7203369140625, 0.93701171875, 1.1536865234375, 1.370361328125, 1.5870361328125, 1.8037109375, 2.0203857421875, 2.237060546875, 2.4537353515625, 2.67041015625, 2.8870849609375, 3.103759765625, 3.3204345703125, 3.537109375, 3.7537841796875, 3.970458984375, 4.1871337890625, 4.40380859375, 4.6204833984375, 4.837158203125, 5.0538330078125, 5.2705078125, 5.4871826171875, 5.703857421875, 5.9205322265625, 6.13720703125, 6.3538818359375, 6.570556640625, 6.7872314453125, 7.00390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 12.0, 21.0, 12.0, 14.0, 17.0, 28.0, 42.0, 53.0, 59.0, 124.0, 173.0, 227.0, 423.0, 740.0, 1421.0, 2856.0, 6097.0, 14951.0, 46549.0, 355342.0, 2486689.0, 174935.0, 33365.0, 11538.0, 4935.0, 2216.0, 1134.0, 636.0, 341.0, 232.0, 136.0, 85.0, 75.0, 47.0, 42.0, 20.0, 24.0, 14.0, 13.0, 8.0, 13.0, 8.0, 4.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-10.9765625, -10.637451171875, -10.29833984375, -9.959228515625, -9.6201171875, -9.281005859375, -8.94189453125, -8.602783203125, -8.263671875, -7.924560546875, -7.58544921875, -7.246337890625, -6.9072265625, -6.568115234375, -6.22900390625, -5.889892578125, -5.55078125, -5.211669921875, -4.87255859375, -4.533447265625, -4.1943359375, -3.855224609375, -3.51611328125, -3.177001953125, -2.837890625, -2.498779296875, -2.15966796875, -1.820556640625, -1.4814453125, -1.142333984375, -0.80322265625, -0.464111328125, -0.125, 0.214111328125, 0.55322265625, 0.892333984375, 1.2314453125, 1.570556640625, 1.90966796875, 2.248779296875, 2.587890625, 2.927001953125, 3.26611328125, 3.605224609375, 3.9443359375, 4.283447265625, 4.62255859375, 4.961669921875, 5.30078125, 5.639892578125, 5.97900390625, 6.318115234375, 6.6572265625, 6.996337890625, 7.33544921875, 7.674560546875, 8.013671875, 8.352783203125, 8.69189453125, 9.031005859375, 9.3701171875, 9.709228515625, 10.04833984375, 10.387451171875, 10.7265625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [4.0, 140.0, 809.0, 65.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.585744857788086, -10.903063774108887, -3.2203826904296875, 4.462297439575195, 12.144979476928711, 19.827661514282227, 27.510339736938477, 35.193023681640625, 42.875701904296875, 50.55838394165039, 58.241065979003906, 65.92374420166016, 73.60643005371094, 81.28910827636719, 88.97178649902344, 96.65446472167969, 104.33715057373047, 112.01982879638672, 119.7025146484375, 127.38519287109375, 135.06787109375, 142.75054931640625, 150.4332275390625, 158.1159210205078, 165.79859924316406, 173.4812774658203, 181.16395568847656, 188.84664916992188, 196.52932739257812, 204.21200561523438, 211.89468383789062, 219.57736206054688, 227.26004028320312, 234.94271850585938, 242.62539672851562, 250.30807495117188, 257.9907531738281, 265.6734619140625, 273.35614013671875, 281.038818359375, 288.72149658203125, 296.4041748046875, 304.08685302734375, 311.76953125, 319.45220947265625, 327.1348876953125, 334.81756591796875, 342.5002746582031, 350.18292236328125, 357.8656005859375, 365.54827880859375, 373.23095703125, 380.91363525390625, 388.5963134765625, 396.27899169921875, 403.9617004394531, 411.6443786621094, 419.3270568847656, 427.0097351074219, 434.6924133300781, 442.3750915527344, 450.05780029296875, 457.740478515625, 465.42315673828125, 473.1058349609375]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 5.0, 12.0, 8.0, 15.0, 22.0, 19.0, 20.0, 25.0, 18.0, 34.0, 30.0, 28.0, 27.0, 33.0, 56.0, 37.0, 35.0, 33.0, 36.0, 35.0, 45.0, 49.0, 34.0, 40.0, 38.0, 38.0, 28.0, 17.0, 21.0, 24.0, 16.0, 20.0, 18.0, 17.0, 8.0, 8.0, 4.0, 7.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.87702751159668, -28.988431930541992, -28.099836349487305, -27.211238861083984, -26.322643280029297, -25.43404769897461, -24.545452117919922, -23.656856536865234, -22.768260955810547, -21.87966537475586, -20.991069793701172, -20.102474212646484, -19.213876724243164, -18.325281143188477, -17.43668556213379, -16.5480899810791, -15.659492492675781, -14.770896911621094, -13.88230037689209, -12.993704795837402, -12.105108261108398, -11.216512680053711, -10.327917098999023, -9.439321517944336, -8.550724983215332, -7.662128925323486, -6.773532867431641, -5.884937286376953, -4.996341228485107, -4.107745170593262, -3.219149589538574, -2.3305535316467285, -1.4419574737548828, -0.5533615350723267, 0.3352344036102295, 1.223830223083496, 2.112426280975342, 3.0010223388671875, 3.889617919921875, 4.778213977813721, 5.666810035705566, 6.555406093597412, 7.444002151489258, 8.332597732543945, 9.221193313598633, 10.109789848327637, 10.998385429382324, 11.886981964111328, 12.775577545166016, 13.664173126220703, 14.552769660949707, 15.441365242004395, 16.3299617767334, 17.218557357788086, 18.107152938842773, 18.99574851989746, 19.88434600830078, 20.77294158935547, 21.661537170410156, 22.550132751464844, 23.438730239868164, 24.32732582092285, 25.21592140197754, 26.104516983032227, 26.993112564086914]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 14.0, 10.0, 16.0, 37.0, 31.0, 34.0, 46.0, 53.0, 42.0, 59.0, 63.0, 86.0, 83.0, 58.0, 77.0, 67.0, 37.0, 46.0, 35.0, 24.0, 25.0, 19.0, 12.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1171875, -4.005035400390625, -3.89288330078125, -3.780731201171875, -3.6685791015625, -3.556427001953125, -3.44427490234375, -3.332122802734375, -3.219970703125, -3.107818603515625, -2.99566650390625, -2.883514404296875, -2.7713623046875, -2.659210205078125, -2.54705810546875, -2.434906005859375, -2.32275390625, -2.210601806640625, -2.09844970703125, -1.986297607421875, -1.8741455078125, -1.761993408203125, -1.64984130859375, -1.537689208984375, -1.425537109375, -1.313385009765625, -1.20123291015625, -1.089080810546875, -0.9769287109375, -0.864776611328125, -0.75262451171875, -0.640472412109375, -0.5283203125, -0.416168212890625, -0.30401611328125, -0.191864013671875, -0.0797119140625, 0.032440185546875, 0.14459228515625, 0.256744384765625, 0.368896484375, 0.481048583984375, 0.59320068359375, 0.705352783203125, 0.8175048828125, 0.929656982421875, 1.04180908203125, 1.153961181640625, 1.26611328125, 1.378265380859375, 1.49041748046875, 1.602569580078125, 1.7147216796875, 1.826873779296875, 1.93902587890625, 2.051177978515625, 2.163330078125, 2.275482177734375, 2.38763427734375, 2.499786376953125, 2.6119384765625, 2.724090576171875, 2.83624267578125, 2.948394775390625, 3.060546875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 12.0, 12.0, 23.0, 23.0, 20.0, 48.0, 45.0, 102.0, 163.0, 273.0, 494.0, 918.0, 1918.0, 5519.0, 21902.0, 458838.0, 3565933.0, 119277.0, 12673.0, 3553.0, 1277.0, 566.0, 284.0, 150.0, 99.0, 66.0, 28.0, 12.0, 13.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.374755859375, -16.92138671875, -16.468017578125, -16.0146484375, -15.561279296875, -15.10791015625, -14.654541015625, -14.201171875, -13.747802734375, -13.29443359375, -12.841064453125, -12.3876953125, -11.934326171875, -11.48095703125, -11.027587890625, -10.57421875, -10.120849609375, -9.66748046875, -9.214111328125, -8.7607421875, -8.307373046875, -7.85400390625, -7.400634765625, -6.947265625, -6.493896484375, -6.04052734375, -5.587158203125, -5.1337890625, -4.680419921875, -4.22705078125, -3.773681640625, -3.3203125, -2.866943359375, -2.41357421875, -1.960205078125, -1.5068359375, -1.053466796875, -0.60009765625, -0.146728515625, 0.306640625, 0.760009765625, 1.21337890625, 1.666748046875, 2.1201171875, 2.573486328125, 3.02685546875, 3.480224609375, 3.93359375, 4.386962890625, 4.84033203125, 5.293701171875, 5.7470703125, 6.200439453125, 6.65380859375, 7.107177734375, 7.560546875, 8.013916015625, 8.46728515625, 8.920654296875, 9.3740234375, 9.827392578125, 10.28076171875, 10.734130859375, 11.1875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 10.0, 16.0, 15.0, 19.0, 44.0, 73.0, 93.0, 144.0, 274.0, 439.0, 654.0, 779.0, 582.0, 364.0, 202.0, 111.0, 97.0, 52.0, 25.0, 18.0, 15.0, 8.0, 11.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.3380126953125, -8.043212890625, -7.7484130859375, -7.45361328125, -7.1588134765625, -6.864013671875, -6.5692138671875, -6.2744140625, -5.9796142578125, -5.684814453125, -5.3900146484375, -5.09521484375, -4.8004150390625, -4.505615234375, -4.2108154296875, -3.916015625, -3.6212158203125, -3.326416015625, -3.0316162109375, -2.73681640625, -2.4420166015625, -2.147216796875, -1.8524169921875, -1.5576171875, -1.2628173828125, -0.968017578125, -0.6732177734375, -0.37841796875, -0.0836181640625, 0.211181640625, 0.5059814453125, 0.80078125, 1.0955810546875, 1.390380859375, 1.6851806640625, 1.97998046875, 2.2747802734375, 2.569580078125, 2.8643798828125, 3.1591796875, 3.4539794921875, 3.748779296875, 4.0435791015625, 4.33837890625, 4.6331787109375, 4.927978515625, 5.2227783203125, 5.517578125, 5.8123779296875, 6.107177734375, 6.4019775390625, 6.69677734375, 6.9915771484375, 7.286376953125, 7.5811767578125, 7.8759765625, 8.1707763671875, 8.465576171875, 8.7603759765625, 9.05517578125, 9.3499755859375, 9.644775390625, 9.9395751953125, 10.234375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 14.0, 32.0, 37.0, 65.0, 127.0, 234.0, 454.0, 811.0, 1663.0, 3733.0, 9589.0, 31475.0, 162612.0, 1705515.0, 2030701.0, 193676.0, 35183.0, 10605.0, 4009.0, 1839.0, 881.0, 459.0, 243.0, 152.0, 77.0, 46.0, 19.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.9296875, -13.5205078125, -13.111328125, -12.7021484375, -12.29296875, -11.8837890625, -11.474609375, -11.0654296875, -10.65625, -10.2470703125, -9.837890625, -9.4287109375, -9.01953125, -8.6103515625, -8.201171875, -7.7919921875, -7.3828125, -6.9736328125, -6.564453125, -6.1552734375, -5.74609375, -5.3369140625, -4.927734375, -4.5185546875, -4.109375, -3.7001953125, -3.291015625, -2.8818359375, -2.47265625, -2.0634765625, -1.654296875, -1.2451171875, -0.8359375, -0.4267578125, -0.017578125, 0.3916015625, 0.80078125, 1.2099609375, 1.619140625, 2.0283203125, 2.4375, 2.8466796875, 3.255859375, 3.6650390625, 4.07421875, 4.4833984375, 4.892578125, 5.3017578125, 5.7109375, 6.1201171875, 6.529296875, 6.9384765625, 7.34765625, 7.7568359375, 8.166015625, 8.5751953125, 8.984375, 9.3935546875, 9.802734375, 10.2119140625, 10.62109375, 11.0302734375, 11.439453125, 11.8486328125, 12.2578125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 8.0, 39.0, 61.0, 114.0, 191.0, 186.0, 163.0, 99.0, 85.0, 27.0, 20.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-100.6738510131836, -98.3565444946289, -96.03923797607422, -93.72193145751953, -91.40461730957031, -89.08731079101562, -86.77000427246094, -84.45269775390625, -82.13539123535156, -79.81808471679688, -77.50077819824219, -75.1834716796875, -72.86616516113281, -70.5488510131836, -68.2315444946289, -65.91423797607422, -63.59693145751953, -61.279624938964844, -58.962318420410156, -56.6450080871582, -54.327701568603516, -52.01039505004883, -49.693084716796875, -47.37577819824219, -45.0584716796875, -42.74116516113281, -40.423858642578125, -38.10654830932617, -35.789241790771484, -33.4719352722168, -31.154626846313477, -28.837318420410156, -26.520004272460938, -24.20269775390625, -21.88538932800293, -19.56808090209961, -17.250774383544922, -14.933466911315918, -12.616159439086914, -10.298851013183594, -7.981544494628906, -5.664237022399902, -3.3469295501708984, -1.0296220779418945, 1.2876853942871094, 3.6049928665161133, 5.922300338745117, 8.239608764648438, 10.556915283203125, 12.874222755432129, 15.191530227661133, 17.508838653564453, 19.82614517211914, 22.143451690673828, 24.46076011657715, 26.77806854248047, 29.095375061035156, 31.412681579589844, 33.72998809814453, 36.047298431396484, 38.36460494995117, 40.68191146850586, 42.99922180175781, 45.3165283203125, 47.63383483886719]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 6.0, 4.0, 5.0, 9.0, 12.0, 12.0, 12.0, 17.0, 32.0, 27.0, 35.0, 31.0, 46.0, 30.0, 36.0, 50.0, 46.0, 34.0, 41.0, 43.0, 62.0, 45.0, 42.0, 41.0, 32.0, 47.0, 27.0, 21.0, 27.0, 20.0, 22.0, 19.0, 10.0, 12.0, 8.0, 7.0, 7.0, 5.0, 10.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.952232360839844, -20.172441482543945, -19.392650604248047, -18.61285972595215, -17.83306884765625, -17.053279876708984, -16.273487091064453, -15.493698120117188, -14.713907241821289, -13.93411636352539, -13.154325485229492, -12.374534606933594, -11.594744682312012, -10.814953804016113, -10.035162925720215, -9.255373001098633, -8.475581169128418, -7.6957902908325195, -6.915999889373779, -6.136209011077881, -5.356418609619141, -4.576627731323242, -3.7968368530273438, -3.0170464515686035, -2.237255573272705, -1.4574649333953857, -0.6776741743087769, 0.10211658477783203, 0.8819072246551514, 1.6616978645324707, 2.441488742828369, 3.2212791442871094, 4.001070022583008, 4.780860900878906, 5.5606513023376465, 6.340442180633545, 7.120232582092285, 7.900023460388184, 8.679814338684082, 9.459604263305664, 10.239395141601562, 11.019186019897461, 11.79897689819336, 12.578767776489258, 13.35855770111084, 14.138348579406738, 14.918139457702637, 15.697929382324219, 16.47772216796875, 17.25751304626465, 18.037303924560547, 18.817094802856445, 19.596885681152344, 20.37667465209961, 21.15646743774414, 21.936256408691406, 22.716047286987305, 23.495838165283203, 24.2756290435791, 25.055419921875, 25.8352108001709, 26.615001678466797, 27.394790649414062, 28.17458152770996, 28.95437240600586]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 9.0, 18.0, 15.0, 23.0, 32.0, 41.0, 37.0, 32.0, 45.0, 68.0, 67.0, 73.0, 67.0, 67.0, 59.0, 64.0, 49.0, 35.0, 46.0, 30.0, 30.0, 17.0, 19.0, 15.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.76171875, -3.657684326171875, -3.55364990234375, -3.449615478515625, -3.3455810546875, -3.241546630859375, -3.13751220703125, -3.033477783203125, -2.929443359375, -2.825408935546875, -2.72137451171875, -2.617340087890625, -2.5133056640625, -2.409271240234375, -2.30523681640625, -2.201202392578125, -2.09716796875, -1.993133544921875, -1.88909912109375, -1.785064697265625, -1.6810302734375, -1.576995849609375, -1.47296142578125, -1.368927001953125, -1.264892578125, -1.160858154296875, -1.05682373046875, -0.952789306640625, -0.8487548828125, -0.744720458984375, -0.64068603515625, -0.536651611328125, -0.4326171875, -0.328582763671875, -0.22454833984375, -0.120513916015625, -0.0164794921875, 0.087554931640625, 0.19158935546875, 0.295623779296875, 0.399658203125, 0.503692626953125, 0.60772705078125, 0.711761474609375, 0.8157958984375, 0.919830322265625, 1.02386474609375, 1.127899169921875, 1.23193359375, 1.335968017578125, 1.44000244140625, 1.544036865234375, 1.6480712890625, 1.752105712890625, 1.85614013671875, 1.960174560546875, 2.064208984375, 2.168243408203125, 2.27227783203125, 2.376312255859375, 2.4803466796875, 2.584381103515625, 2.68841552734375, 2.792449951171875, 2.896484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 14.0, 7.0, 23.0, 33.0, 33.0, 46.0, 55.0, 93.0, 130.0, 188.0, 302.0, 452.0, 733.0, 1250.0, 2136.0, 3787.0, 6835.0, 13023.0, 24878.0, 50062.0, 111770.0, 359635.0, 284134.0, 96445.0, 44268.0, 21939.0, 11440.0, 6279.0, 3438.0, 1953.0, 1146.0, 666.0, 450.0, 293.0, 185.0, 110.0, 90.0, 60.0, 53.0, 30.0, 18.0, 13.0, 17.0, 11.0, 13.0, 5.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0], "bins": [-0.1978759765625, -0.19204139709472656, -0.18620681762695312, -0.1803722381591797, -0.17453765869140625, -0.1687030792236328, -0.16286849975585938, -0.15703392028808594, -0.1511993408203125, -0.14536476135253906, -0.13953018188476562, -0.1336956024169922, -0.12786102294921875, -0.12202644348144531, -0.11619186401367188, -0.11035728454589844, -0.104522705078125, -0.09868812561035156, -0.09285354614257812, -0.08701896667480469, -0.08118438720703125, -0.07534980773925781, -0.06951522827148438, -0.06368064880371094, -0.0578460693359375, -0.05201148986816406, -0.046176910400390625, -0.04034233093261719, -0.03450775146484375, -0.028673171997070312, -0.022838592529296875, -0.017004013061523438, -0.01116943359375, -0.0053348541259765625, 0.000499725341796875, 0.0063343048095703125, 0.01216888427734375, 0.018003463745117188, 0.023838043212890625, 0.029672622680664062, 0.0355072021484375, 0.04134178161621094, 0.047176361083984375, 0.05301094055175781, 0.05884552001953125, 0.06468009948730469, 0.07051467895507812, 0.07634925842285156, 0.082183837890625, 0.08801841735839844, 0.09385299682617188, 0.09968757629394531, 0.10552215576171875, 0.11135673522949219, 0.11719131469726562, 0.12302589416503906, 0.1288604736328125, 0.13469505310058594, 0.14052963256835938, 0.1463642120361328, 0.15219879150390625, 0.1580333709716797, 0.16386795043945312, 0.16970252990722656, 0.175537109375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 9.0, 10.0, 7.0, 7.0, 8.0, 14.0, 6.0, 7.0, 20.0, 20.0, 24.0, 22.0, 22.0, 27.0, 24.0, 29.0, 45.0, 38.0, 32.0, 45.0, 48.0, 1059.0, 27.0, 42.0, 45.0, 38.0, 36.0, 36.0, 33.0, 39.0, 34.0, 26.0, 28.0, 20.0, 13.0, 10.0, 21.0, 4.0, 11.0, 13.0, 8.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9501953125, -1.8871002197265625, -1.824005126953125, -1.7609100341796875, -1.69781494140625, -1.6347198486328125, -1.571624755859375, -1.5085296630859375, -1.4454345703125, -1.3823394775390625, -1.319244384765625, -1.2561492919921875, -1.19305419921875, -1.1299591064453125, -1.066864013671875, -1.0037689208984375, -0.940673828125, -0.8775787353515625, -0.814483642578125, -0.7513885498046875, -0.68829345703125, -0.6251983642578125, -0.562103271484375, -0.4990081787109375, -0.4359130859375, -0.3728179931640625, -0.309722900390625, -0.2466278076171875, -0.18353271484375, -0.1204376220703125, -0.057342529296875, 0.0057525634765625, 0.06884765625, 0.1319427490234375, 0.195037841796875, 0.2581329345703125, 0.32122802734375, 0.3843231201171875, 0.447418212890625, 0.5105133056640625, 0.5736083984375, 0.6367034912109375, 0.699798583984375, 0.7628936767578125, 0.82598876953125, 0.8890838623046875, 0.952178955078125, 1.0152740478515625, 1.078369140625, 1.1414642333984375, 1.204559326171875, 1.2676544189453125, 1.33074951171875, 1.3938446044921875, 1.456939697265625, 1.5200347900390625, 1.5831298828125, 1.6462249755859375, 1.709320068359375, 1.7724151611328125, 1.83551025390625, 1.8986053466796875, 1.961700439453125, 2.0247955322265625, 2.087890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 8.0, 7.0, 13.0, 18.0, 31.0, 42.0, 57.0, 85.0, 127.0, 167.0, 223.0, 324.0, 475.0, 649.0, 886.0, 1265.0, 1787.0, 2500.0, 3505.0, 4984.0, 7190.0, 10328.0, 14731.0, 21608.0, 32597.0, 50173.0, 81698.0, 154147.0, 1314405.0, 155298.0, 82748.0, 50588.0, 32942.0, 22042.0, 14770.0, 10280.0, 7088.0, 4970.0, 3580.0, 2469.0, 1886.0, 1295.0, 915.0, 654.0, 475.0, 314.0, 237.0, 157.0, 125.0, 89.0, 62.0, 45.0, 25.0, 15.0, 17.0, 8.0, 10.0, 3.0, 2.0, 3.0], "bins": [-0.044769287109375, -0.043392181396484375, -0.04201507568359375, -0.040637969970703125, -0.0392608642578125, -0.037883758544921875, -0.03650665283203125, -0.035129547119140625, -0.03375244140625, -0.032375335693359375, -0.03099822998046875, -0.029621124267578125, -0.0282440185546875, -0.026866912841796875, -0.02548980712890625, -0.024112701416015625, -0.022735595703125, -0.021358489990234375, -0.01998138427734375, -0.018604278564453125, -0.0172271728515625, -0.015850067138671875, -0.01447296142578125, -0.013095855712890625, -0.01171875, -0.010341644287109375, -0.00896453857421875, -0.007587432861328125, -0.0062103271484375, -0.004833221435546875, -0.00345611572265625, -0.002079010009765625, -0.000701904296875, 0.000675201416015625, 0.00205230712890625, 0.003429412841796875, 0.0048065185546875, 0.006183624267578125, 0.00756072998046875, 0.008937835693359375, 0.01031494140625, 0.011692047119140625, 0.01306915283203125, 0.014446258544921875, 0.0158233642578125, 0.017200469970703125, 0.01857757568359375, 0.019954681396484375, 0.021331787109375, 0.022708892822265625, 0.02408599853515625, 0.025463104248046875, 0.0268402099609375, 0.028217315673828125, 0.02959442138671875, 0.030971527099609375, 0.0323486328125, 0.033725738525390625, 0.03510284423828125, 0.036479949951171875, 0.0378570556640625, 0.039234161376953125, 0.04061126708984375, 0.041988372802734375, 0.043365478515625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 7.0, 16.0, 6.0, 12.0, 17.0, 34.0, 39.0, 37.0, 46.0, 53.0, 102.0, 116.0, 113.0, 73.0, 55.0, 52.0, 42.0, 31.0, 24.0, 20.0, 18.0, 11.0, 6.0, 11.0, 10.0, 4.0, 9.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004665851593017578, -0.00045050308108329773, -0.00043442100286483765, -0.00041833892464637756, -0.0004022568464279175, -0.0003861747682094574, -0.0003700926899909973, -0.00035401061177253723, -0.00033792853355407715, -0.00032184645533561707, -0.000305764377117157, -0.0002896822988986969, -0.0002736002206802368, -0.00025751814246177673, -0.00024143606424331665, -0.00022535398602485657, -0.00020927190780639648, -0.0001931898295879364, -0.00017710775136947632, -0.00016102567315101624, -0.00014494359493255615, -0.00012886151671409607, -0.00011277943849563599, -9.66973602771759e-05, -8.061528205871582e-05, -6.453320384025574e-05, -4.8451125621795654e-05, -3.236904740333557e-05, -1.6286969184875488e-05, -2.0489096641540527e-07, 1.5877187252044678e-05, 3.195926547050476e-05, 4.8041343688964844e-05, 6.412342190742493e-05, 8.020550012588501e-05, 9.628757834434509e-05, 0.00011236965656280518, 0.00012845173478126526, 0.00014453381299972534, 0.00016061589121818542, 0.0001766979694366455, 0.0001927800476551056, 0.00020886212587356567, 0.00022494420409202576, 0.00024102628231048584, 0.0002571083605289459, 0.000273190438747406, 0.0002892725169658661, 0.00030535459518432617, 0.00032143667340278625, 0.00033751875162124634, 0.0003536008298397064, 0.0003696829080581665, 0.0003857649862766266, 0.00040184706449508667, 0.00041792914271354675, 0.00043401122093200684, 0.0004500932991504669, 0.000466175377368927, 0.0004822574555873871, 0.0004983395338058472, 0.0005144216120243073, 0.0005305036902427673, 0.0005465857684612274, 0.0005626678466796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 1.0, 4.0, 7.0, 10.0, 15.0, 12.0, 19.0, 24.0, 25.0, 45.0, 67.0, 104.0, 194.0, 636.0, 3560.0, 31048.0, 657582.0, 330538.0, 20987.0, 2624.0, 524.0, 179.0, 99.0, 70.0, 43.0, 35.0, 23.0, 13.0, 15.0, 6.0, 14.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0091552734375, -0.008893072605133057, -0.008630871772766113, -0.00836867094039917, -0.008106470108032227, -0.007844269275665283, -0.00758206844329834, -0.0073198676109313965, -0.007057666778564453, -0.00679546594619751, -0.006533265113830566, -0.006271064281463623, -0.00600886344909668, -0.005746662616729736, -0.005484461784362793, -0.00522226095199585, -0.004960060119628906, -0.004697859287261963, -0.0044356584548950195, -0.004173457622528076, -0.003911256790161133, -0.0036490559577941895, -0.003386855125427246, -0.0031246542930603027, -0.0028624534606933594, -0.002600252628326416, -0.0023380517959594727, -0.0020758509635925293, -0.001813650131225586, -0.0015514492988586426, -0.0012892484664916992, -0.0010270476341247559, -0.0007648468017578125, -0.0005026459693908691, -0.00024044513702392578, 2.1755695343017578e-05, 0.00028395652770996094, 0.0005461573600769043, 0.0008083581924438477, 0.001070559024810791, 0.0013327598571777344, 0.0015949606895446777, 0.001857161521911621, 0.0021193623542785645, 0.002381563186645508, 0.002643764019012451, 0.0029059648513793945, 0.003168165683746338, 0.0034303665161132812, 0.0036925673484802246, 0.003954768180847168, 0.004216969013214111, 0.004479169845581055, 0.004741370677947998, 0.005003571510314941, 0.005265772342681885, 0.005527973175048828, 0.0057901740074157715, 0.006052374839782715, 0.006314575672149658, 0.0065767765045166016, 0.006838977336883545, 0.007101178169250488, 0.007363379001617432, 0.007625579833984375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 33.0, 377.0, 556.0, 37.0, 8.0], "bins": [-0.013181163929402828, -0.012965384870767593, -0.012749604880809784, -0.012533825822174549, -0.012318046763539314, -0.012102266773581505, -0.01188648771494627, -0.011670708656311035, -0.0114549295976758, -0.011239150539040565, -0.011023370549082756, -0.010807591490447521, -0.010591812431812286, -0.010376032441854477, -0.010160253383219242, -0.009944474324584007, -0.009728694334626198, -0.009512915275990963, -0.009297135286033154, -0.009081356227397919, -0.008865577168762684, -0.008649798110127449, -0.00843401812016964, -0.008218239061534405, -0.00800246000289917, -0.007786680478602648, -0.007570901419967413, -0.007355121895670891, -0.007139342837035656, -0.006923563312739134, -0.006707783788442612, -0.006492004729807377, -0.006276224739849567, -0.006060445215553045, -0.0058446661569178104, -0.005628886632621288, -0.0054131075739860535, -0.005197328049689531, -0.004981548525393009, -0.004765769466757774, -0.0045499904081225395, -0.004334210883826017, -0.0041184318251907825, -0.0039026523008942604, -0.003686873009428382, -0.0034710937179625034, -0.003255314426496625, -0.0030395351350307465, -0.0028237556107342243, -0.002607976319268346, -0.0023921970278024673, -0.002176417503505945, -0.0019606382120400667, -0.0017448589205741882, -0.0015290796291083097, -0.0013133002212271094, -0.001097520929761231, -0.0008817415800876915, -0.0006659622304141521, -0.00045018293894827366, -0.00023440358927473426, -1.862423960119486e-05, 0.00019715505186468363, 0.00041293445974588394, 0.0006287137512117624]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 12.0, 19.0, 17.0, 23.0, 25.0, 49.0, 46.0, 52.0, 70.0, 53.0, 60.0, 73.0, 73.0, 80.0, 50.0, 48.0, 45.0, 38.0, 47.0, 29.0, 25.0, 19.0, 10.0, 12.0, 12.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004439353942871094, -0.00042630359530448914, -0.0004086717963218689, -0.00039103999733924866, -0.0003734081983566284, -0.0003557763993740082, -0.00033814460039138794, -0.0003205128014087677, -0.00030288100242614746, -0.0002852492034435272, -0.000267617404460907, -0.00024998560547828674, -0.0002323538064956665, -0.00021472200751304626, -0.00019709020853042603, -0.00017945840954780579, -0.00016182661056518555, -0.0001441948115825653, -0.00012656301259994507, -0.00010893121361732483, -9.129941463470459e-05, -7.366761565208435e-05, -5.603581666946411e-05, -3.840401768684387e-05, -2.0772218704223633e-05, -3.1404197216033936e-06, 1.4491379261016846e-05, 3.2123178243637085e-05, 4.9754977226257324e-05, 6.738677620887756e-05, 8.50185751914978e-05, 0.00010265037417411804, 0.00012028217315673828, 0.00013791397213935852, 0.00015554577112197876, 0.000173177570104599, 0.00019080936908721924, 0.00020844116806983948, 0.00022607296705245972, 0.00024370476603507996, 0.0002613365650177002, 0.00027896836400032043, 0.0002966001629829407, 0.0003142319619655609, 0.00033186376094818115, 0.0003494955599308014, 0.00036712735891342163, 0.00038475915789604187, 0.0004023909568786621, 0.00042002275586128235, 0.0004376545548439026, 0.00045528635382652283, 0.00047291815280914307, 0.0004905499517917633, 0.0005081817507743835, 0.0005258135497570038, 0.000543445348739624, 0.0005610771477222443, 0.0005787089467048645, 0.0005963407456874847, 0.000613972544670105, 0.0006316043436527252, 0.0006492361426353455, 0.0006668679416179657, 0.0006844997406005859]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 9.0, 18.0, 14.0, 23.0, 33.0, 41.0, 37.0, 32.0, 45.0, 68.0, 66.0, 74.0, 66.0, 68.0, 59.0, 64.0, 49.0, 34.0, 47.0, 29.0, 31.0, 17.0, 19.0, 15.0, 11.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.763671875, -3.65960693359375, -3.5555419921875, -3.45147705078125, -3.347412109375, -3.24334716796875, -3.1392822265625, -3.03521728515625, -2.93115234375, -2.82708740234375, -2.7230224609375, -2.61895751953125, -2.514892578125, -2.41082763671875, -2.3067626953125, -2.20269775390625, -2.0986328125, -1.99456787109375, -1.8905029296875, -1.78643798828125, -1.682373046875, -1.57830810546875, -1.4742431640625, -1.37017822265625, -1.26611328125, -1.16204833984375, -1.0579833984375, -0.95391845703125, -0.849853515625, -0.74578857421875, -0.6417236328125, -0.53765869140625, -0.43359375, -0.32952880859375, -0.2254638671875, -0.12139892578125, -0.017333984375, 0.08673095703125, 0.1907958984375, 0.29486083984375, 0.39892578125, 0.50299072265625, 0.6070556640625, 0.71112060546875, 0.815185546875, 0.91925048828125, 1.0233154296875, 1.12738037109375, 1.2314453125, 1.33551025390625, 1.4395751953125, 1.54364013671875, 1.647705078125, 1.75177001953125, 1.8558349609375, 1.95989990234375, 2.06396484375, 2.16802978515625, 2.2720947265625, 2.37615966796875, 2.480224609375, 2.58428955078125, 2.6883544921875, 2.79241943359375, 2.896484375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 13.0, 23.0, 38.0, 56.0, 105.0, 148.0, 300.0, 714.0, 1873.0, 5846.0, 26141.0, 622019.0, 362127.0, 21150.0, 4979.0, 1660.0, 649.0, 318.0, 163.0, 94.0, 43.0, 27.0, 11.0, 15.0, 8.0, 10.0, 11.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.1639404296875, -11.695068359375, -11.2261962890625, -10.75732421875, -10.2884521484375, -9.819580078125, -9.3507080078125, -8.8818359375, -8.4129638671875, -7.944091796875, -7.4752197265625, -7.00634765625, -6.5374755859375, -6.068603515625, -5.5997314453125, -5.130859375, -4.6619873046875, -4.193115234375, -3.7242431640625, -3.25537109375, -2.7864990234375, -2.317626953125, -1.8487548828125, -1.3798828125, -0.9110107421875, -0.442138671875, 0.0267333984375, 0.49560546875, 0.9644775390625, 1.433349609375, 1.9022216796875, 2.37109375, 2.8399658203125, 3.308837890625, 3.7777099609375, 4.24658203125, 4.7154541015625, 5.184326171875, 5.6531982421875, 6.1220703125, 6.5909423828125, 7.059814453125, 7.5286865234375, 7.99755859375, 8.4664306640625, 8.935302734375, 9.4041748046875, 9.873046875, 10.3419189453125, 10.810791015625, 11.2796630859375, 11.74853515625, 12.2174072265625, 12.686279296875, 13.1551513671875, 13.6240234375, 14.0928955078125, 14.561767578125, 15.0306396484375, 15.49951171875, 15.9683837890625, 16.437255859375, 16.9061279296875, 17.375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 7.0, 8.0, 15.0, 16.0, 12.0, 10.0, 21.0, 27.0, 26.0, 26.0, 29.0, 28.0, 39.0, 41.0, 43.0, 67.0, 86.0, 126.0, 244.0, 1408.0, 158.0, 94.0, 87.0, 58.0, 50.0, 43.0, 30.0, 31.0, 24.0, 25.0, 19.0, 20.0, 16.0, 15.0, 15.0, 17.0, 7.0, 8.0, 5.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-7.125, -6.90362548828125, -6.6822509765625, -6.46087646484375, -6.239501953125, -6.01812744140625, -5.7967529296875, -5.57537841796875, -5.35400390625, -5.13262939453125, -4.9112548828125, -4.68988037109375, -4.468505859375, -4.24713134765625, -4.0257568359375, -3.80438232421875, -3.5830078125, -3.36163330078125, -3.1402587890625, -2.91888427734375, -2.697509765625, -2.47613525390625, -2.2547607421875, -2.03338623046875, -1.81201171875, -1.59063720703125, -1.3692626953125, -1.14788818359375, -0.926513671875, -0.70513916015625, -0.4837646484375, -0.26239013671875, -0.041015625, 0.18035888671875, 0.4017333984375, 0.62310791015625, 0.844482421875, 1.06585693359375, 1.2872314453125, 1.50860595703125, 1.72998046875, 1.95135498046875, 2.1727294921875, 2.39410400390625, 2.615478515625, 2.83685302734375, 3.0582275390625, 3.27960205078125, 3.5009765625, 3.72235107421875, 3.9437255859375, 4.16510009765625, 4.386474609375, 4.60784912109375, 4.8292236328125, 5.05059814453125, 5.27197265625, 5.49334716796875, 5.7147216796875, 5.93609619140625, 6.157470703125, 6.37884521484375, 6.6002197265625, 6.82159423828125, 7.04296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 7.0, 11.0, 10.0, 23.0, 23.0, 23.0, 28.0, 44.0, 59.0, 64.0, 153.0, 245.0, 479.0, 840.0, 2035.0, 5015.0, 15814.0, 105030.0, 2362323.0, 597527.0, 40466.0, 9261.0, 3223.0, 1389.0, 655.0, 323.0, 187.0, 115.0, 65.0, 69.0, 48.0, 17.0, 19.0, 17.0, 22.0, 14.0, 14.0, 8.0, 5.0, 10.0, 8.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.0859375, -10.7371826171875, -10.388427734375, -10.0396728515625, -9.69091796875, -9.3421630859375, -8.993408203125, -8.6446533203125, -8.2958984375, -7.9471435546875, -7.598388671875, -7.2496337890625, -6.90087890625, -6.5521240234375, -6.203369140625, -5.8546142578125, -5.505859375, -5.1571044921875, -4.808349609375, -4.4595947265625, -4.11083984375, -3.7620849609375, -3.413330078125, -3.0645751953125, -2.7158203125, -2.3670654296875, -2.018310546875, -1.6695556640625, -1.32080078125, -0.9720458984375, -0.623291015625, -0.2745361328125, 0.07421875, 0.4229736328125, 0.771728515625, 1.1204833984375, 1.46923828125, 1.8179931640625, 2.166748046875, 2.5155029296875, 2.8642578125, 3.2130126953125, 3.561767578125, 3.9105224609375, 4.25927734375, 4.6080322265625, 4.956787109375, 5.3055419921875, 5.654296875, 6.0030517578125, 6.351806640625, 6.7005615234375, 7.04931640625, 7.3980712890625, 7.746826171875, 8.0955810546875, 8.4443359375, 8.7930908203125, 9.141845703125, 9.4906005859375, 9.83935546875, 10.1881103515625, 10.536865234375, 10.8856201171875, 11.234375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 123.0, 610.0, 265.0, 17.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53078842163086, -25.123645782470703, -20.716503143310547, -16.309358596801758, -11.902215957641602, -7.495073318481445, -3.0879287719726562, 1.3192138671875, 5.726356506347656, 10.133499145507812, 14.540642738342285, 18.947786331176758, 23.354928970336914, 27.76207160949707, 32.16921615600586, 36.576358795166016, 40.98350143432617, 45.39064407348633, 49.797786712646484, 54.204933166503906, 58.61207580566406, 63.01921844482422, 67.42636108398438, 71.83350372314453, 76.24064636230469, 80.64778900146484, 85.054931640625, 89.46207427978516, 93.86921691894531, 98.27635955810547, 102.68350219726562, 107.09065246582031, 111.497802734375, 115.90494537353516, 120.31208801269531, 124.71923065185547, 129.12637329101562, 133.5335235595703, 137.94065856933594, 142.34780883789062, 146.75494384765625, 151.16209411621094, 155.56922912597656, 159.97637939453125, 164.38351440429688, 168.79066467285156, 173.1977996826172, 177.60494995117188, 182.0120849609375, 186.4192352294922, 190.8263702392578, 195.2335205078125, 199.64065551757812, 204.0478057861328, 208.45494079589844, 212.86209106445312, 217.2692413330078, 221.6763916015625, 226.08352661132812, 230.4906768798828, 234.89781188964844, 239.30496215820312, 243.71209716796875, 248.11924743652344, 252.52638244628906]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 5.0, 13.0, 4.0, 8.0, 16.0, 18.0, 18.0, 15.0, 25.0, 25.0, 32.0, 24.0, 32.0, 34.0, 26.0, 32.0, 39.0, 40.0, 47.0, 43.0, 41.0, 42.0, 38.0, 44.0, 41.0, 36.0, 34.0, 31.0, 40.0, 27.0, 26.0, 23.0, 20.0, 12.0, 9.0, 8.0, 10.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.002681732177734, -27.202951431274414, -26.403223037719727, -25.603492736816406, -24.803762435913086, -24.004032135009766, -23.204303741455078, -22.404573440551758, -21.604843139648438, -20.805112838745117, -20.00538444519043, -19.20565414428711, -18.40592384338379, -17.60619354248047, -16.80646514892578, -16.00673484802246, -15.207006454467773, -14.40727710723877, -13.60754680633545, -12.807817459106445, -12.008087158203125, -11.208357810974121, -10.408628463745117, -9.608898162841797, -8.809168815612793, -8.009439468383789, -7.209709167480469, -6.409979820251465, -5.610249996185303, -4.810520172119141, -4.010790824890137, -3.2110610008239746, -2.4113311767578125, -1.61160147190094, -0.8118717670440674, -0.012142181396484375, 0.7875876426696777, 1.5873174667358398, 2.3870468139648438, 3.186776638031006, 3.986506462097168, 4.78623628616333, 5.585966110229492, 6.385695457458496, 7.185425281524658, 7.98515510559082, 8.784884452819824, 9.584613800048828, 10.384344100952148, 11.184073448181152, 11.983803749084473, 12.783533096313477, 13.583263397216797, 14.3829927444458, 15.182722091674805, 15.982452392578125, 16.782180786132812, 17.581911087036133, 18.38163948059082, 19.18136978149414, 19.98110008239746, 20.78083038330078, 21.58055877685547, 22.38028907775879, 23.18001937866211]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 6.0, 11.0, 10.0, 10.0, 23.0, 15.0, 28.0, 38.0, 41.0, 37.0, 44.0, 49.0, 59.0, 69.0, 65.0, 64.0, 59.0, 62.0, 50.0, 55.0, 38.0, 42.0, 33.0, 24.0, 17.0, 21.0, 10.0, 8.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.744140625, -3.639495849609375, -3.53485107421875, -3.430206298828125, -3.3255615234375, -3.220916748046875, -3.11627197265625, -3.011627197265625, -2.906982421875, -2.802337646484375, -2.69769287109375, -2.593048095703125, -2.4884033203125, -2.383758544921875, -2.27911376953125, -2.174468994140625, -2.06982421875, -1.965179443359375, -1.86053466796875, -1.755889892578125, -1.6512451171875, -1.546600341796875, -1.44195556640625, -1.337310791015625, -1.232666015625, -1.128021240234375, -1.02337646484375, -0.918731689453125, -0.8140869140625, -0.709442138671875, -0.60479736328125, -0.500152587890625, -0.3955078125, -0.290863037109375, -0.18621826171875, -0.081573486328125, 0.0230712890625, 0.127716064453125, 0.23236083984375, 0.337005615234375, 0.441650390625, 0.546295166015625, 0.65093994140625, 0.755584716796875, 0.8602294921875, 0.964874267578125, 1.06951904296875, 1.174163818359375, 1.27880859375, 1.383453369140625, 1.48809814453125, 1.592742919921875, 1.6973876953125, 1.802032470703125, 1.90667724609375, 2.011322021484375, 2.115966796875, 2.220611572265625, 2.32525634765625, 2.429901123046875, 2.5345458984375, 2.639190673828125, 2.74383544921875, 2.848480224609375, 2.953125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 14.0, 13.0, 18.0, 30.0, 23.0, 42.0, 58.0, 91.0, 146.0, 231.0, 337.0, 618.0, 1044.0, 2002.0, 4180.0, 10924.0, 43867.0, 447295.0, 3076650.0, 533544.0, 52369.0, 12286.0, 4413.0, 1958.0, 951.0, 450.0, 269.0, 149.0, 110.0, 57.0, 46.0, 29.0, 15.0, 10.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-10.96875, -10.6981201171875, -10.427490234375, -10.1568603515625, -9.88623046875, -9.6156005859375, -9.344970703125, -9.0743408203125, -8.8037109375, -8.5330810546875, -8.262451171875, -7.9918212890625, -7.72119140625, -7.4505615234375, -7.179931640625, -6.9093017578125, -6.638671875, -6.3680419921875, -6.097412109375, -5.8267822265625, -5.55615234375, -5.2855224609375, -5.014892578125, -4.7442626953125, -4.4736328125, -4.2030029296875, -3.932373046875, -3.6617431640625, -3.39111328125, -3.1204833984375, -2.849853515625, -2.5792236328125, -2.30859375, -2.0379638671875, -1.767333984375, -1.4967041015625, -1.22607421875, -0.9554443359375, -0.684814453125, -0.4141845703125, -0.1435546875, 0.1270751953125, 0.397705078125, 0.6683349609375, 0.93896484375, 1.2095947265625, 1.480224609375, 1.7508544921875, 2.021484375, 2.2921142578125, 2.562744140625, 2.8333740234375, 3.10400390625, 3.3746337890625, 3.645263671875, 3.9158935546875, 4.1865234375, 4.4571533203125, 4.727783203125, 4.9984130859375, 5.26904296875, 5.5396728515625, 5.810302734375, 6.0809326171875, 6.3515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 3.0, 6.0, 8.0, 6.0, 8.0, 15.0, 19.0, 23.0, 36.0, 61.0, 74.0, 108.0, 178.0, 284.0, 410.0, 557.0, 610.0, 520.0, 380.0, 249.0, 168.0, 96.0, 67.0, 40.0, 34.0, 29.0, 23.0, 20.0, 10.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.84375, -7.6151123046875, -7.386474609375, -7.1578369140625, -6.92919921875, -6.7005615234375, -6.471923828125, -6.2432861328125, -6.0146484375, -5.7860107421875, -5.557373046875, -5.3287353515625, -5.10009765625, -4.8714599609375, -4.642822265625, -4.4141845703125, -4.185546875, -3.9569091796875, -3.728271484375, -3.4996337890625, -3.27099609375, -3.0423583984375, -2.813720703125, -2.5850830078125, -2.3564453125, -2.1278076171875, -1.899169921875, -1.6705322265625, -1.44189453125, -1.2132568359375, -0.984619140625, -0.7559814453125, -0.52734375, -0.2987060546875, -0.070068359375, 0.1585693359375, 0.38720703125, 0.6158447265625, 0.844482421875, 1.0731201171875, 1.3017578125, 1.5303955078125, 1.759033203125, 1.9876708984375, 2.21630859375, 2.4449462890625, 2.673583984375, 2.9022216796875, 3.130859375, 3.3594970703125, 3.588134765625, 3.8167724609375, 4.04541015625, 4.2740478515625, 4.502685546875, 4.7313232421875, 4.9599609375, 5.1885986328125, 5.417236328125, 5.6458740234375, 5.87451171875, 6.1031494140625, 6.331787109375, 6.5604248046875, 6.7890625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 12.0, 6.0, 16.0, 13.0, 22.0, 37.0, 53.0, 88.0, 142.0, 238.0, 350.0, 509.0, 991.0, 1620.0, 2960.0, 5593.0, 11994.0, 30629.0, 107764.0, 563199.0, 2313327.0, 920573.0, 162601.0, 41484.0, 15036.0, 6843.0, 3403.0, 1930.0, 1126.0, 631.0, 367.0, 230.0, 197.0, 103.0, 55.0, 49.0, 22.0, 13.0, 16.0, 12.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.59375, -8.313232421875, -8.03271484375, -7.752197265625, -7.4716796875, -7.191162109375, -6.91064453125, -6.630126953125, -6.349609375, -6.069091796875, -5.78857421875, -5.508056640625, -5.2275390625, -4.947021484375, -4.66650390625, -4.385986328125, -4.10546875, -3.824951171875, -3.54443359375, -3.263916015625, -2.9833984375, -2.702880859375, -2.42236328125, -2.141845703125, -1.861328125, -1.580810546875, -1.30029296875, -1.019775390625, -0.7392578125, -0.458740234375, -0.17822265625, 0.102294921875, 0.3828125, 0.663330078125, 0.94384765625, 1.224365234375, 1.5048828125, 1.785400390625, 2.06591796875, 2.346435546875, 2.626953125, 2.907470703125, 3.18798828125, 3.468505859375, 3.7490234375, 4.029541015625, 4.31005859375, 4.590576171875, 4.87109375, 5.151611328125, 5.43212890625, 5.712646484375, 5.9931640625, 6.273681640625, 6.55419921875, 6.834716796875, 7.115234375, 7.395751953125, 7.67626953125, 7.956787109375, 8.2373046875, 8.517822265625, 8.79833984375, 9.078857421875, 9.359375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 17.0, 22.0, 43.0, 62.0, 93.0, 117.0, 119.0, 137.0, 102.0, 105.0, 67.0, 36.0, 29.0, 16.0, 16.0, 5.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.916015625, -45.53499221801758, -44.153968811035156, -42.77294158935547, -41.39191818237305, -40.010894775390625, -38.6298713684082, -37.24884796142578, -35.867820739746094, -34.48679733276367, -33.10577392578125, -31.724748611450195, -30.34372329711914, -28.96269989013672, -27.581676483154297, -26.200653076171875, -24.819629669189453, -23.43860626220703, -22.057580947875977, -20.676557540893555, -19.2955322265625, -17.914508819580078, -16.533485412597656, -15.152461051940918, -13.77143669128418, -12.390412330627441, -11.009387969970703, -9.628364562988281, -8.247340202331543, -6.866315841674805, -5.485292434692383, -4.1042680740356445, -2.723247528076172, -1.3422234058380127, 0.038800716400146484, 1.4198246002197266, 2.800848960876465, 4.181873321533203, 5.562896728515625, 6.943921089172363, 8.324945449829102, 9.70596981048584, 11.086994171142578, 12.468017578125, 13.849041938781738, 15.230066299438477, 16.6110897064209, 17.992115020751953, 19.373138427734375, 20.754161834716797, 22.13518714904785, 23.516210556030273, 24.897235870361328, 26.27825927734375, 27.659282684326172, 29.040306091308594, 30.42133140563965, 31.80235481262207, 33.183380126953125, 34.56440353393555, 35.94542694091797, 37.326454162597656, 38.70747375488281, 40.0885009765625, 41.46952438354492]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 13.0, 5.0, 5.0, 8.0, 14.0, 16.0, 20.0, 15.0, 16.0, 22.0, 25.0, 22.0, 22.0, 25.0, 30.0, 36.0, 36.0, 44.0, 44.0, 33.0, 37.0, 34.0, 39.0, 44.0, 36.0, 40.0, 35.0, 46.0, 49.0, 27.0, 24.0, 25.0, 30.0, 11.0, 11.0, 14.0, 10.0, 10.0, 5.0, 7.0, 3.0, 7.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.16278839111328, -19.51471710205078, -18.86664581298828, -18.21857452392578, -17.57050323486328, -16.92243003845215, -16.27435874938965, -15.626287460327148, -14.978216171264648, -14.330144882202148, -13.682073593139648, -13.034001350402832, -12.385930061340332, -11.737858772277832, -11.089786529541016, -10.441715240478516, -9.793643951416016, -9.145572662353516, -8.497501373291016, -7.849429130554199, -7.201357841491699, -6.553286552429199, -5.905214786529541, -5.257143020629883, -4.609071731567383, -3.9610002040863037, -3.3129286766052246, -2.6648571491241455, -2.0167856216430664, -1.3687140941619873, -0.7206425666809082, -0.07257080078125, 0.57550048828125, 1.223572015762329, 1.8716435432434082, 2.5197150707244873, 3.1677865982055664, 3.8158581256866455, 4.463929653167725, 5.112001419067383, 5.760072708129883, 6.408143997192383, 7.056215763092041, 7.704287528991699, 8.3523588180542, 9.0004301071167, 9.648502349853516, 10.296573638916016, 10.944644927978516, 11.592716217041016, 12.240787506103516, 12.888859748840332, 13.536931037902832, 14.185002326965332, 14.833074569702148, 15.481145858764648, 16.12921714782715, 16.77728843688965, 17.42535972595215, 18.07343101501465, 18.72150421142578, 19.36957550048828, 20.01764678955078, 20.66571807861328, 21.31378936767578]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 9.0, 18.0, 23.0, 26.0, 32.0, 42.0, 38.0, 50.0, 44.0, 44.0, 70.0, 77.0, 50.0, 71.0, 54.0, 63.0, 48.0, 37.0, 34.0, 31.0, 29.0, 16.0, 14.0, 20.0, 12.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.46875, -3.366546630859375, -3.26434326171875, -3.162139892578125, -3.0599365234375, -2.957733154296875, -2.85552978515625, -2.753326416015625, -2.651123046875, -2.548919677734375, -2.44671630859375, -2.344512939453125, -2.2423095703125, -2.140106201171875, -2.03790283203125, -1.935699462890625, -1.83349609375, -1.731292724609375, -1.62908935546875, -1.526885986328125, -1.4246826171875, -1.322479248046875, -1.22027587890625, -1.118072509765625, -1.015869140625, -0.913665771484375, -0.81146240234375, -0.709259033203125, -0.6070556640625, -0.504852294921875, -0.40264892578125, -0.300445556640625, -0.1982421875, -0.096038818359375, 0.00616455078125, 0.108367919921875, 0.2105712890625, 0.312774658203125, 0.41497802734375, 0.517181396484375, 0.619384765625, 0.721588134765625, 0.82379150390625, 0.925994873046875, 1.0281982421875, 1.130401611328125, 1.23260498046875, 1.334808349609375, 1.43701171875, 1.539215087890625, 1.64141845703125, 1.743621826171875, 1.8458251953125, 1.948028564453125, 2.05023193359375, 2.152435302734375, 2.254638671875, 2.356842041015625, 2.45904541015625, 2.561248779296875, 2.6634521484375, 2.765655517578125, 2.86785888671875, 2.970062255859375, 3.072265625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 6.0, 8.0, 12.0, 8.0, 26.0, 31.0, 50.0, 64.0, 80.0, 116.0, 191.0, 283.0, 447.0, 752.0, 1123.0, 1870.0, 3150.0, 5411.0, 9506.0, 17487.0, 33640.0, 67951.0, 156767.0, 413716.0, 179595.0, 75082.0, 36941.0, 19340.0, 10426.0, 5838.0, 3354.0, 1949.0, 1209.0, 743.0, 445.0, 300.0, 204.0, 129.0, 98.0, 63.0, 53.0, 20.0, 19.0, 15.0, 15.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.200439453125, -0.1940898895263672, -0.18774032592773438, -0.18139076232910156, -0.17504119873046875, -0.16869163513183594, -0.16234207153320312, -0.1559925079345703, -0.1496429443359375, -0.1432933807373047, -0.13694381713867188, -0.13059425354003906, -0.12424468994140625, -0.11789512634277344, -0.11154556274414062, -0.10519599914550781, -0.098846435546875, -0.09249687194824219, -0.08614730834960938, -0.07979774475097656, -0.07344818115234375, -0.06709861755371094, -0.060749053955078125, -0.05439949035644531, -0.0480499267578125, -0.04170036315917969, -0.035350799560546875, -0.029001235961914062, -0.02265167236328125, -0.016302108764648438, -0.009952545166015625, -0.0036029815673828125, 0.00274658203125, 0.009096145629882812, 0.015445709228515625, 0.021795272827148438, 0.02814483642578125, 0.03449440002441406, 0.040843963623046875, 0.04719352722167969, 0.0535430908203125, 0.05989265441894531, 0.06624221801757812, 0.07259178161621094, 0.07894134521484375, 0.08529090881347656, 0.09164047241210938, 0.09799003601074219, 0.104339599609375, 0.11068916320800781, 0.11703872680664062, 0.12338829040527344, 0.12973785400390625, 0.13608741760253906, 0.14243698120117188, 0.1487865447998047, 0.1551361083984375, 0.1614856719970703, 0.16783523559570312, 0.17418479919433594, 0.18053436279296875, 0.18688392639160156, 0.19323348999023438, 0.1995830535888672, 0.2059326171875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 5.0, 10.0, 8.0, 12.0, 10.0, 12.0, 15.0, 27.0, 23.0, 23.0, 22.0, 18.0, 37.0, 31.0, 36.0, 37.0, 46.0, 45.0, 37.0, 35.0, 1064.0, 48.0, 46.0, 37.0, 39.0, 29.0, 33.0, 30.0, 19.0, 31.0, 26.0, 21.0, 23.0, 19.0, 16.0, 10.0, 10.0, 14.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.404296875, -2.33380126953125, -2.2633056640625, -2.19281005859375, -2.122314453125, -2.05181884765625, -1.9813232421875, -1.91082763671875, -1.84033203125, -1.76983642578125, -1.6993408203125, -1.62884521484375, -1.558349609375, -1.48785400390625, -1.4173583984375, -1.34686279296875, -1.2763671875, -1.20587158203125, -1.1353759765625, -1.06488037109375, -0.994384765625, -0.92388916015625, -0.8533935546875, -0.78289794921875, -0.71240234375, -0.64190673828125, -0.5714111328125, -0.50091552734375, -0.430419921875, -0.35992431640625, -0.2894287109375, -0.21893310546875, -0.1484375, -0.07794189453125, -0.0074462890625, 0.06304931640625, 0.133544921875, 0.20404052734375, 0.2745361328125, 0.34503173828125, 0.41552734375, 0.48602294921875, 0.5565185546875, 0.62701416015625, 0.697509765625, 0.76800537109375, 0.8385009765625, 0.90899658203125, 0.9794921875, 1.04998779296875, 1.1204833984375, 1.19097900390625, 1.261474609375, 1.33197021484375, 1.4024658203125, 1.47296142578125, 1.54345703125, 1.61395263671875, 1.6844482421875, 1.75494384765625, 1.825439453125, 1.89593505859375, 1.9664306640625, 2.03692626953125, 2.107421875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 10.0, 18.0, 24.0, 32.0, 51.0, 77.0, 110.0, 149.0, 216.0, 324.0, 473.0, 671.0, 1032.0, 1545.0, 2330.0, 3279.0, 4763.0, 7101.0, 10474.0, 16130.0, 24501.0, 38090.0, 60583.0, 101898.0, 293096.0, 1226912.0, 115609.0, 66605.0, 41446.0, 26529.0, 17327.0, 11643.0, 7685.0, 5165.0, 3542.0, 2333.0, 1670.0, 1116.0, 773.0, 594.0, 387.0, 265.0, 176.0, 125.0, 85.0, 53.0, 44.0, 22.0, 15.0, 11.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.05377197265625, -0.05214738845825195, -0.050522804260253906, -0.04889822006225586, -0.04727363586425781, -0.045649051666259766, -0.04402446746826172, -0.04239988327026367, -0.040775299072265625, -0.03915071487426758, -0.03752613067626953, -0.035901546478271484, -0.03427696228027344, -0.03265237808227539, -0.031027793884277344, -0.029403209686279297, -0.02777862548828125, -0.026154041290283203, -0.024529457092285156, -0.02290487289428711, -0.021280288696289062, -0.019655704498291016, -0.01803112030029297, -0.016406536102294922, -0.014781951904296875, -0.013157367706298828, -0.011532783508300781, -0.009908199310302734, -0.008283615112304688, -0.006659030914306641, -0.005034446716308594, -0.003409862518310547, -0.0017852783203125, -0.00016069412231445312, 0.0014638900756835938, 0.0030884742736816406, 0.0047130584716796875, 0.006337642669677734, 0.007962226867675781, 0.009586811065673828, 0.011211395263671875, 0.012835979461669922, 0.014460563659667969, 0.016085147857666016, 0.017709732055664062, 0.01933431625366211, 0.020958900451660156, 0.022583484649658203, 0.02420806884765625, 0.025832653045654297, 0.027457237243652344, 0.02908182144165039, 0.030706405639648438, 0.032330989837646484, 0.03395557403564453, 0.03558015823364258, 0.037204742431640625, 0.03882932662963867, 0.04045391082763672, 0.042078495025634766, 0.04370307922363281, 0.04532766342163086, 0.046952247619628906, 0.04857683181762695, 0.050201416015625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 8.0, 7.0, 8.0, 22.0, 23.0, 30.0, 29.0, 33.0, 54.0, 62.0, 79.0, 103.0, 125.0, 96.0, 65.0, 45.0, 39.0, 31.0, 24.0, 18.0, 21.0, 14.0, 14.0, 8.0, 5.0, 3.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004258155822753906, -0.0004117041826248169, -0.00039759278297424316, -0.00038348138332366943, -0.0003693699836730957, -0.00035525858402252197, -0.00034114718437194824, -0.0003270357847213745, -0.0003129243850708008, -0.00029881298542022705, -0.0002847015857696533, -0.0002705901861190796, -0.00025647878646850586, -0.00024236738681793213, -0.0002282559871673584, -0.00021414458751678467, -0.00020003318786621094, -0.0001859217882156372, -0.00017181038856506348, -0.00015769898891448975, -0.00014358758926391602, -0.00012947618961334229, -0.00011536478996276855, -0.00010125339031219482, -8.71419906616211e-05, -7.303059101104736e-05, -5.891919136047363e-05, -4.48077917098999e-05, -3.069639205932617e-05, -1.658499240875244e-05, -2.473592758178711e-06, 1.163780689239502e-05, 2.574920654296875e-05, 3.986060619354248e-05, 5.397200584411621e-05, 6.808340549468994e-05, 8.219480514526367e-05, 9.63062047958374e-05, 0.00011041760444641113, 0.00012452900409698486, 0.0001386404037475586, 0.00015275180339813232, 0.00016686320304870605, 0.00018097460269927979, 0.00019508600234985352, 0.00020919740200042725, 0.00022330880165100098, 0.0002374202013015747, 0.00025153160095214844, 0.00026564300060272217, 0.0002797544002532959, 0.00029386579990386963, 0.00030797719955444336, 0.0003220885992050171, 0.0003361999988555908, 0.00035031139850616455, 0.0003644227981567383, 0.000378534197807312, 0.00039264559745788574, 0.00040675699710845947, 0.0004208683967590332, 0.00043497979640960693, 0.00044909119606018066, 0.0004632025957107544, 0.0004773139953613281]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 2.0, 13.0, 10.0, 22.0, 32.0, 47.0, 68.0, 127.0, 224.0, 502.0, 1012.0, 2730.0, 7495.0, 22073.0, 76060.0, 497217.0, 347652.0, 63470.0, 18871.0, 6555.0, 2432.0, 983.0, 411.0, 162.0, 117.0, 85.0, 56.0, 23.0, 27.0, 21.0, 11.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0084991455078125, -0.008248686790466309, -0.007998228073120117, -0.007747769355773926, -0.007497310638427734, -0.007246851921081543, -0.0069963932037353516, -0.00674593448638916, -0.006495475769042969, -0.006245017051696777, -0.005994558334350586, -0.0057440996170043945, -0.005493640899658203, -0.005243182182312012, -0.00499272346496582, -0.004742264747619629, -0.0044918060302734375, -0.004241347312927246, -0.003990888595581055, -0.0037404298782348633, -0.003489971160888672, -0.0032395124435424805, -0.002989053726196289, -0.0027385950088500977, -0.0024881362915039062, -0.002237677574157715, -0.0019872188568115234, -0.001736760139465332, -0.0014863014221191406, -0.0012358427047729492, -0.0009853839874267578, -0.0007349252700805664, -0.000484466552734375, -0.0002340078353881836, 1.6450881958007812e-05, 0.0002669095993041992, 0.0005173683166503906, 0.000767827033996582, 0.0010182857513427734, 0.0012687444686889648, 0.0015192031860351562, 0.0017696619033813477, 0.002020120620727539, 0.0022705793380737305, 0.002521038055419922, 0.0027714967727661133, 0.0030219554901123047, 0.003272414207458496, 0.0035228729248046875, 0.003773331642150879, 0.00402379035949707, 0.004274249076843262, 0.004524707794189453, 0.0047751665115356445, 0.005025625228881836, 0.005276083946228027, 0.005526542663574219, 0.00577700138092041, 0.0060274600982666016, 0.006277918815612793, 0.006528377532958984, 0.006778836250305176, 0.007029294967651367, 0.007279753684997559, 0.00753021240234375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 31.0, 94.0, 480.0, 283.0, 73.0, 19.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011955345049500465, -0.011669577099382877, -0.01138380914926529, -0.011098040267825127, -0.010812272317707539, -0.01052650436758995, -0.010240736417472363, -0.009954968467354774, -0.009669199585914612, -0.009383431635797024, -0.009097663685679436, -0.008811894804239273, -0.008526126854121685, -0.008240358904004097, -0.007954590953886509, -0.007668822538107634, -0.0073830545879900455, -0.0070972866378724575, -0.006811518222093582, -0.006525750271975994, -0.006239981856197119, -0.005954213906079531, -0.005668445490300655, -0.005382677540183067, -0.005096909590065479, -0.004811141639947891, -0.004525373224169016, -0.004239605274051428, -0.0039538368582725525, -0.0036680689081549644, -0.0033823007252067327, -0.003096532542258501, -0.0028107636608183384, -0.0025249954778701067, -0.002239227294921875, -0.001953459344804287, -0.0016676910454407334, -0.0013819228624925017, -0.0010961547959595919, -0.0008103866130113602, -0.0005246184300631285, -0.00023885027621872723, 4.691787762567401e-05, 0.0003326860023662448, 0.0006184541853144765, 0.0009042223682627082, 0.001189990434795618, 0.0014757586177438498, 0.0017615268006920815, 0.002047294983640313, 0.002333063166588545, 0.002618831116706133, 0.0029045995324850082, 0.0031903674826025963, 0.003476135665550828, 0.0037619038484990597, 0.004047672264277935, 0.004333440214395523, 0.004619208630174398, 0.0049049765802919865, 0.005190744996070862, 0.00547651294618845, 0.005762280896306038, 0.006048049312084913, 0.006333817262202501]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 5.0, 6.0, 3.0, 19.0, 20.0, 18.0, 25.0, 40.0, 36.0, 50.0, 54.0, 64.0, 49.0, 72.0, 82.0, 59.0, 59.0, 61.0, 62.0, 50.0, 37.0, 24.0, 27.0, 24.0, 14.0, 9.0, 10.0, 5.0, 7.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041168928146362305, -0.00039730407297611237, -0.0003829188644886017, -0.000368533656001091, -0.0003541484475135803, -0.00033976323902606964, -0.00032537803053855896, -0.0003109928220510483, -0.0002966076135635376, -0.0002822224050760269, -0.00026783719658851624, -0.00025345198810100555, -0.00023906677961349487, -0.0002246815711259842, -0.0002102963626384735, -0.00019591115415096283, -0.00018152594566345215, -0.00016714073717594147, -0.00015275552868843079, -0.0001383703202009201, -0.00012398511171340942, -0.00010959990322589874, -9.521469473838806e-05, -8.082948625087738e-05, -6.64442777633667e-05, -5.205906927585602e-05, -3.767386078834534e-05, -2.3288652300834656e-05, -8.903443813323975e-06, 5.4817646741867065e-06, 1.9866973161697388e-05, 3.425218164920807e-05, 4.863739013671875e-05, 6.302259862422943e-05, 7.740780711174011e-05, 9.17930155992508e-05, 0.00010617822408676147, 0.00012056343257427216, 0.00013494864106178284, 0.00014933384954929352, 0.0001637190580368042, 0.00017810426652431488, 0.00019248947501182556, 0.00020687468349933624, 0.00022125989198684692, 0.0002356451004743576, 0.0002500303089618683, 0.00026441551744937897, 0.00027880072593688965, 0.00029318593442440033, 0.000307571142911911, 0.0003219563513994217, 0.0003363415598869324, 0.00035072676837444305, 0.00036511197686195374, 0.0003794971853494644, 0.0003938823938369751, 0.0004082676023244858, 0.00042265281081199646, 0.00043703801929950714, 0.0004514232277870178, 0.0004658084362745285, 0.0004801936447620392, 0.0004945788532495499, 0.0005089640617370605]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 11.0, 9.0, 18.0, 23.0, 26.0, 32.0, 41.0, 39.0, 50.0, 44.0, 44.0, 70.0, 77.0, 50.0, 71.0, 55.0, 62.0, 48.0, 37.0, 34.0, 31.0, 29.0, 16.0, 14.0, 20.0, 12.0, 9.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.46875, -3.366546630859375, -3.26434326171875, -3.162139892578125, -3.0599365234375, -2.957733154296875, -2.85552978515625, -2.753326416015625, -2.651123046875, -2.548919677734375, -2.44671630859375, -2.344512939453125, -2.2423095703125, -2.140106201171875, -2.03790283203125, -1.935699462890625, -1.83349609375, -1.731292724609375, -1.62908935546875, -1.526885986328125, -1.4246826171875, -1.322479248046875, -1.22027587890625, -1.118072509765625, -1.015869140625, -0.913665771484375, -0.81146240234375, -0.709259033203125, -0.6070556640625, -0.504852294921875, -0.40264892578125, -0.300445556640625, -0.1982421875, -0.096038818359375, 0.00616455078125, 0.108367919921875, 0.2105712890625, 0.312774658203125, 0.41497802734375, 0.517181396484375, 0.619384765625, 0.721588134765625, 0.82379150390625, 0.925994873046875, 1.0281982421875, 1.130401611328125, 1.23260498046875, 1.334808349609375, 1.43701171875, 1.539215087890625, 1.64141845703125, 1.743621826171875, 1.8458251953125, 1.948028564453125, 2.05023193359375, 2.152435302734375, 2.254638671875, 2.356842041015625, 2.45904541015625, 2.561248779296875, 2.6634521484375, 2.765655517578125, 2.86785888671875, 2.970062255859375, 3.072265625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 12.0, 11.0, 17.0, 38.0, 47.0, 56.0, 119.0, 210.0, 359.0, 723.0, 1440.0, 3097.0, 7990.0, 29927.0, 213577.0, 681614.0, 83676.0, 16091.0, 5143.0, 2130.0, 1023.0, 536.0, 312.0, 153.0, 88.0, 56.0, 33.0, 28.0, 18.0, 7.0, 5.0, 3.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.34576416015625, -7.0860595703125, -6.82635498046875, -6.566650390625, -6.30694580078125, -6.0472412109375, -5.78753662109375, -5.52783203125, -5.26812744140625, -5.0084228515625, -4.74871826171875, -4.489013671875, -4.22930908203125, -3.9696044921875, -3.70989990234375, -3.4501953125, -3.19049072265625, -2.9307861328125, -2.67108154296875, -2.411376953125, -2.15167236328125, -1.8919677734375, -1.63226318359375, -1.37255859375, -1.11285400390625, -0.8531494140625, -0.59344482421875, -0.333740234375, -0.07403564453125, 0.1856689453125, 0.44537353515625, 0.705078125, 0.96478271484375, 1.2244873046875, 1.48419189453125, 1.743896484375, 2.00360107421875, 2.2633056640625, 2.52301025390625, 2.78271484375, 3.04241943359375, 3.3021240234375, 3.56182861328125, 3.821533203125, 4.08123779296875, 4.3409423828125, 4.60064697265625, 4.8603515625, 5.12005615234375, 5.3797607421875, 5.63946533203125, 5.899169921875, 6.15887451171875, 6.4185791015625, 6.67828369140625, 6.93798828125, 7.19769287109375, 7.4573974609375, 7.71710205078125, 7.976806640625, 8.23651123046875, 8.4962158203125, 8.75592041015625, 9.015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 3.0, 8.0, 11.0, 11.0, 8.0, 21.0, 17.0, 18.0, 19.0, 20.0, 26.0, 30.0, 34.0, 46.0, 53.0, 57.0, 80.0, 107.0, 215.0, 1438.0, 200.0, 129.0, 72.0, 60.0, 54.0, 53.0, 38.0, 36.0, 32.0, 22.0, 13.0, 26.0, 13.0, 7.0, 13.0, 13.0, 4.0, 9.0, 3.0, 3.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9375, -7.68505859375, -7.4326171875, -7.18017578125, -6.927734375, -6.67529296875, -6.4228515625, -6.17041015625, -5.91796875, -5.66552734375, -5.4130859375, -5.16064453125, -4.908203125, -4.65576171875, -4.4033203125, -4.15087890625, -3.8984375, -3.64599609375, -3.3935546875, -3.14111328125, -2.888671875, -2.63623046875, -2.3837890625, -2.13134765625, -1.87890625, -1.62646484375, -1.3740234375, -1.12158203125, -0.869140625, -0.61669921875, -0.3642578125, -0.11181640625, 0.140625, 0.39306640625, 0.6455078125, 0.89794921875, 1.150390625, 1.40283203125, 1.6552734375, 1.90771484375, 2.16015625, 2.41259765625, 2.6650390625, 2.91748046875, 3.169921875, 3.42236328125, 3.6748046875, 3.92724609375, 4.1796875, 4.43212890625, 4.6845703125, 4.93701171875, 5.189453125, 5.44189453125, 5.6943359375, 5.94677734375, 6.19921875, 6.45166015625, 6.7041015625, 6.95654296875, 7.208984375, 7.46142578125, 7.7138671875, 7.96630859375, 8.21875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 5.0, 8.0, 10.0, 13.0, 9.0, 16.0, 20.0, 30.0, 29.0, 38.0, 50.0, 73.0, 127.0, 212.0, 313.0, 702.0, 2246.0, 9510.0, 92946.0, 2484608.0, 521254.0, 26629.0, 4299.0, 1269.0, 498.0, 233.0, 135.0, 92.0, 78.0, 51.0, 29.0, 25.0, 26.0, 22.0, 10.0, 14.0, 15.0, 13.0, 10.0, 4.0, 3.0, 4.0, 6.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.375, -11.97265625, -11.5703125, -11.16796875, -10.765625, -10.36328125, -9.9609375, -9.55859375, -9.15625, -8.75390625, -8.3515625, -7.94921875, -7.546875, -7.14453125, -6.7421875, -6.33984375, -5.9375, -5.53515625, -5.1328125, -4.73046875, -4.328125, -3.92578125, -3.5234375, -3.12109375, -2.71875, -2.31640625, -1.9140625, -1.51171875, -1.109375, -0.70703125, -0.3046875, 0.09765625, 0.5, 0.90234375, 1.3046875, 1.70703125, 2.109375, 2.51171875, 2.9140625, 3.31640625, 3.71875, 4.12109375, 4.5234375, 4.92578125, 5.328125, 5.73046875, 6.1328125, 6.53515625, 6.9375, 7.33984375, 7.7421875, 8.14453125, 8.546875, 8.94921875, 9.3515625, 9.75390625, 10.15625, 10.55859375, 10.9609375, 11.36328125, 11.765625, 12.16796875, 12.5703125, 12.97265625, 13.375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 9.0, 11.0, 41.0, 67.0, 118.0, 157.0, 165.0, 187.0, 124.0, 60.0, 45.0, 15.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.619930267333984, -33.673526763916016, -32.72712707519531, -31.780723571777344, -30.834320068359375, -29.88791847229004, -28.941516876220703, -27.995113372802734, -27.0487117767334, -26.102310180664062, -25.155906677246094, -24.209505081176758, -23.26310157775879, -22.316699981689453, -21.370296478271484, -20.42389488220215, -19.477493286132812, -18.531091690063477, -17.584688186645508, -16.638286590576172, -15.69188404083252, -14.745481491088867, -13.799078941345215, -12.852676391601562, -11.906272888183594, -10.959870338439941, -10.013467788696289, -9.067066192626953, -8.1206636428833, -7.174261093139648, -6.227858543395996, -5.281456470489502, -4.335054397583008, -3.3886520862579346, -2.4422497749328613, -1.495847225189209, -0.5494449138641357, 0.3969573974609375, 1.3433599472045898, 2.289762020111084, 3.2361645698547363, 4.182567119598389, 5.128969192504883, 6.075371742248535, 7.0217742919921875, 7.968176364898682, 8.914579391479492, 9.860980987548828, 10.80738353729248, 11.753786087036133, 12.700188636779785, 13.646591186523438, 14.592992782592773, 15.539395332336426, 16.485797882080078, 17.432199478149414, 18.378602981567383, 19.32500457763672, 20.271408081054688, 21.217809677124023, 22.164213180541992, 23.110614776611328, 24.057018280029297, 25.003419876098633, 25.94982147216797]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 6.0, 12.0, 21.0, 16.0, 13.0, 19.0, 30.0, 26.0, 37.0, 35.0, 31.0, 34.0, 41.0, 48.0, 54.0, 53.0, 45.0, 48.0, 42.0, 44.0, 41.0, 67.0, 34.0, 34.0, 35.0, 18.0, 26.0, 21.0, 15.0, 18.0, 9.0, 5.0, 9.0, 1.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-33.14874267578125, -32.308895111083984, -31.469051361083984, -30.62920379638672, -29.789358139038086, -28.949512481689453, -28.109664916992188, -27.269819259643555, -26.429973602294922, -25.59012794494629, -24.750282287597656, -23.91043472290039, -23.070589065551758, -22.230743408203125, -21.39089584350586, -20.551050186157227, -19.711204528808594, -18.87135887145996, -18.031513214111328, -17.191665649414062, -16.35181999206543, -15.511974334716797, -14.672127723693848, -13.832281112670898, -12.992435455322266, -12.152589797973633, -11.312743186950684, -10.472896575927734, -9.633050918579102, -8.793205261230469, -7.9533586502075195, -7.1135125160217285, -6.27366828918457, -5.433822154998779, -4.593976020812988, -3.7541298866271973, -2.9142837524414062, -2.0744376182556152, -1.2345914840698242, -0.3947453498840332, 0.4451007843017578, 1.2849469184875488, 2.12479305267334, 2.964639186859131, 3.804485321044922, 4.644331455230713, 5.484177589416504, 6.324023723602295, 7.163869857788086, 8.003715515136719, 8.843562126159668, 9.683408737182617, 10.52325439453125, 11.363100051879883, 12.202946662902832, 13.042793273925781, 13.882638931274414, 14.722484588623047, 15.562331199645996, 16.402177810668945, 17.242023468017578, 18.08186912536621, 18.921714782714844, 19.76156234741211, 20.601408004760742]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 6.0, 6.0, 11.0, 10.0, 20.0, 23.0, 29.0, 34.0, 37.0, 40.0, 45.0, 50.0, 55.0, 51.0, 77.0, 48.0, 65.0, 59.0, 56.0, 45.0, 42.0, 30.0, 29.0, 38.0, 16.0, 16.0, 17.0, 15.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.439453125, -3.338043212890625, -3.23663330078125, -3.135223388671875, -3.0338134765625, -2.932403564453125, -2.83099365234375, -2.729583740234375, -2.628173828125, -2.526763916015625, -2.42535400390625, -2.323944091796875, -2.2225341796875, -2.121124267578125, -2.01971435546875, -1.918304443359375, -1.81689453125, -1.715484619140625, -1.61407470703125, -1.512664794921875, -1.4112548828125, -1.309844970703125, -1.20843505859375, -1.107025146484375, -1.005615234375, -0.904205322265625, -0.80279541015625, -0.701385498046875, -0.5999755859375, -0.498565673828125, -0.39715576171875, -0.295745849609375, -0.1943359375, -0.092926025390625, 0.00848388671875, 0.109893798828125, 0.2113037109375, 0.312713623046875, 0.41412353515625, 0.515533447265625, 0.616943359375, 0.718353271484375, 0.81976318359375, 0.921173095703125, 1.0225830078125, 1.123992919921875, 1.22540283203125, 1.326812744140625, 1.42822265625, 1.529632568359375, 1.63104248046875, 1.732452392578125, 1.8338623046875, 1.935272216796875, 2.03668212890625, 2.138092041015625, 2.239501953125, 2.340911865234375, 2.44232177734375, 2.543731689453125, 2.6451416015625, 2.746551513671875, 2.84796142578125, 2.949371337890625, 3.05078125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 1.0, 7.0, 6.0, 6.0, 7.0, 11.0, 10.0, 29.0, 22.0, 42.0, 76.0, 91.0, 149.0, 238.0, 352.0, 620.0, 1002.0, 1915.0, 3732.0, 9306.0, 33895.0, 306256.0, 2941836.0, 803864.0, 66576.0, 14207.0, 5083.0, 2302.0, 1095.0, 583.0, 365.0, 196.0, 135.0, 89.0, 60.0, 32.0, 29.0, 18.0, 10.0, 10.0, 4.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-10.4296875, -10.15283203125, -9.8759765625, -9.59912109375, -9.322265625, -9.04541015625, -8.7685546875, -8.49169921875, -8.21484375, -7.93798828125, -7.6611328125, -7.38427734375, -7.107421875, -6.83056640625, -6.5537109375, -6.27685546875, -6.0, -5.72314453125, -5.4462890625, -5.16943359375, -4.892578125, -4.61572265625, -4.3388671875, -4.06201171875, -3.78515625, -3.50830078125, -3.2314453125, -2.95458984375, -2.677734375, -2.40087890625, -2.1240234375, -1.84716796875, -1.5703125, -1.29345703125, -1.0166015625, -0.73974609375, -0.462890625, -0.18603515625, 0.0908203125, 0.36767578125, 0.64453125, 0.92138671875, 1.1982421875, 1.47509765625, 1.751953125, 2.02880859375, 2.3056640625, 2.58251953125, 2.859375, 3.13623046875, 3.4130859375, 3.68994140625, 3.966796875, 4.24365234375, 4.5205078125, 4.79736328125, 5.07421875, 5.35107421875, 5.6279296875, 5.90478515625, 6.181640625, 6.45849609375, 6.7353515625, 7.01220703125, 7.2890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 15.0, 12.0, 24.0, 50.0, 48.0, 103.0, 181.0, 265.0, 402.0, 669.0, 741.0, 593.0, 353.0, 215.0, 136.0, 84.0, 53.0, 37.0, 18.0, 18.0, 9.0, 8.0, 5.0, 6.0, 8.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4453125, -9.1614990234375, -8.877685546875, -8.5938720703125, -8.31005859375, -8.0262451171875, -7.742431640625, -7.4586181640625, -7.1748046875, -6.8909912109375, -6.607177734375, -6.3233642578125, -6.03955078125, -5.7557373046875, -5.471923828125, -5.1881103515625, -4.904296875, -4.6204833984375, -4.336669921875, -4.0528564453125, -3.76904296875, -3.4852294921875, -3.201416015625, -2.9176025390625, -2.6337890625, -2.3499755859375, -2.066162109375, -1.7823486328125, -1.49853515625, -1.2147216796875, -0.930908203125, -0.6470947265625, -0.36328125, -0.0794677734375, 0.204345703125, 0.4881591796875, 0.77197265625, 1.0557861328125, 1.339599609375, 1.6234130859375, 1.9072265625, 2.1910400390625, 2.474853515625, 2.7586669921875, 3.04248046875, 3.3262939453125, 3.610107421875, 3.8939208984375, 4.177734375, 4.4615478515625, 4.745361328125, 5.0291748046875, 5.31298828125, 5.5968017578125, 5.880615234375, 6.1644287109375, 6.4482421875, 6.7320556640625, 7.015869140625, 7.2996826171875, 7.58349609375, 7.8673095703125, 8.151123046875, 8.4349365234375, 8.71875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 6.0, 3.0, 13.0, 9.0, 16.0, 27.0, 55.0, 84.0, 148.0, 321.0, 792.0, 2448.0, 10601.0, 93374.0, 3260176.0, 788317.0, 30016.0, 5358.0, 1477.0, 550.0, 224.0, 110.0, 73.0, 31.0, 19.0, 12.0, 10.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.134033203125, -20.42431640625, -19.714599609375, -19.0048828125, -18.295166015625, -17.58544921875, -16.875732421875, -16.166015625, -15.456298828125, -14.74658203125, -14.036865234375, -13.3271484375, -12.617431640625, -11.90771484375, -11.197998046875, -10.48828125, -9.778564453125, -9.06884765625, -8.359130859375, -7.6494140625, -6.939697265625, -6.22998046875, -5.520263671875, -4.810546875, -4.100830078125, -3.39111328125, -2.681396484375, -1.9716796875, -1.261962890625, -0.55224609375, 0.157470703125, 0.8671875, 1.576904296875, 2.28662109375, 2.996337890625, 3.7060546875, 4.415771484375, 5.12548828125, 5.835205078125, 6.544921875, 7.254638671875, 7.96435546875, 8.674072265625, 9.3837890625, 10.093505859375, 10.80322265625, 11.512939453125, 12.22265625, 12.932373046875, 13.64208984375, 14.351806640625, 15.0615234375, 15.771240234375, 16.48095703125, 17.190673828125, 17.900390625, 18.610107421875, 19.31982421875, 20.029541015625, 20.7392578125, 21.448974609375, 22.15869140625, 22.868408203125, 23.578125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 12.0, 29.0, 29.0, 50.0, 55.0, 98.0, 109.0, 110.0, 133.0, 108.0, 92.0, 63.0, 34.0, 38.0, 11.0, 15.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-67.41304016113281, -65.94137573242188, -64.46971130371094, -62.998046875, -61.52638244628906, -60.054718017578125, -58.58305358886719, -57.11138916015625, -55.63972473144531, -54.168060302734375, -52.69639587402344, -51.2247314453125, -49.75306701660156, -48.281402587890625, -46.80973815917969, -45.33807373046875, -43.86641311645508, -42.39474868774414, -40.9230842590332, -39.451419830322266, -37.97975540161133, -36.50809097290039, -35.03643035888672, -33.56476593017578, -32.093101501464844, -30.621437072753906, -29.14977264404297, -27.67810821533203, -26.206443786621094, -24.734779357910156, -23.26311683654785, -21.791452407836914, -20.319787979125977, -18.84812355041504, -17.3764591217041, -15.90479564666748, -14.433131217956543, -12.961466789245605, -11.489803314208984, -10.018138885498047, -8.54647445678711, -7.074810028076172, -5.603146076202393, -4.131482124328613, -2.659817695617676, -1.1881532669067383, 0.2835102081298828, 1.7551746368408203, 3.226839065551758, 4.698503494262695, 6.170167446136475, 7.641831398010254, 9.113495826721191, 10.585160255432129, 12.05682373046875, 13.528488159179688, 15.000152587890625, 16.471817016601562, 17.9434814453125, 19.415145874023438, 20.886810302734375, 22.358474731445312, 23.830137252807617, 25.301801681518555, 26.773466110229492]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 4.0, 3.0, 4.0, 6.0, 7.0, 13.0, 3.0, 8.0, 14.0, 17.0, 11.0, 22.0, 19.0, 20.0, 25.0, 29.0, 24.0, 29.0, 40.0, 37.0, 40.0, 38.0, 32.0, 36.0, 31.0, 41.0, 37.0, 36.0, 33.0, 32.0, 30.0, 28.0, 34.0, 35.0, 24.0, 24.0, 19.0, 13.0, 16.0, 20.0, 9.0, 10.0, 14.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.286697387695312, -19.62721061706543, -18.967721939086914, -18.30823516845703, -17.648746490478516, -16.989259719848633, -16.32977294921875, -15.670284271240234, -15.010797500610352, -14.351309776306152, -13.691822052001953, -13.03233528137207, -12.372847557067871, -11.713359832763672, -11.053872108459473, -10.394384384155273, -9.734896659851074, -9.075408935546875, -8.415921211242676, -7.756433963775635, -7.096946716308594, -6.4374589920043945, -5.777971267700195, -5.118484020233154, -4.458996295928955, -3.799508810043335, -3.140021324157715, -2.4805335998535156, -1.8210461139678955, -1.1615586280822754, -0.5020709037780762, 0.15741634368896484, 0.8169040679931641, 1.4763915538787842, 2.1358790397644043, 2.7953667640686035, 3.4548542499542236, 4.114341735839844, 4.773829460144043, 5.433316707611084, 6.092804431915283, 6.752292156219482, 7.411779403686523, 8.071267127990723, 8.730754852294922, 9.390241622924805, 10.04973030090332, 10.709217071533203, 11.368704795837402, 12.028192520141602, 12.6876802444458, 13.34716796875, 14.006654739379883, 14.666142463684082, 15.325630187988281, 15.985116958618164, 16.64460563659668, 17.304092407226562, 17.963581085205078, 18.62306785583496, 19.282556533813477, 19.94204330444336, 20.601531982421875, 21.261018753051758, 21.92050552368164]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 10.0, 13.0, 6.0, 12.0, 20.0, 15.0, 24.0, 28.0, 47.0, 33.0, 32.0, 53.0, 47.0, 59.0, 64.0, 48.0, 52.0, 56.0, 63.0, 49.0, 49.0, 27.0, 44.0, 34.0, 22.0, 19.0, 11.0, 14.0, 10.0, 14.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.3046875, -3.20623779296875, -3.1077880859375, -3.00933837890625, -2.910888671875, -2.81243896484375, -2.7139892578125, -2.61553955078125, -2.51708984375, -2.41864013671875, -2.3201904296875, -2.22174072265625, -2.123291015625, -2.02484130859375, -1.9263916015625, -1.82794189453125, -1.7294921875, -1.63104248046875, -1.5325927734375, -1.43414306640625, -1.335693359375, -1.23724365234375, -1.1387939453125, -1.04034423828125, -0.94189453125, -0.84344482421875, -0.7449951171875, -0.64654541015625, -0.548095703125, -0.44964599609375, -0.3511962890625, -0.25274658203125, -0.154296875, -0.05584716796875, 0.0426025390625, 0.14105224609375, 0.239501953125, 0.33795166015625, 0.4364013671875, 0.53485107421875, 0.63330078125, 0.73175048828125, 0.8302001953125, 0.92864990234375, 1.027099609375, 1.12554931640625, 1.2239990234375, 1.32244873046875, 1.4208984375, 1.51934814453125, 1.6177978515625, 1.71624755859375, 1.814697265625, 1.91314697265625, 2.0115966796875, 2.11004638671875, 2.20849609375, 2.30694580078125, 2.4053955078125, 2.50384521484375, 2.602294921875, 2.70074462890625, 2.7991943359375, 2.89764404296875, 2.99609375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 7.0, 7.0, 2.0, 15.0, 8.0, 19.0, 34.0, 33.0, 53.0, 76.0, 119.0, 177.0, 249.0, 379.0, 625.0, 968.0, 1508.0, 2437.0, 4030.0, 6729.0, 11533.0, 20448.0, 37486.0, 73295.0, 155196.0, 373173.0, 181514.0, 82641.0, 41850.0, 22304.0, 12552.0, 7411.0, 4412.0, 2672.0, 1632.0, 1037.0, 648.0, 414.0, 291.0, 165.0, 131.0, 89.0, 62.0, 37.0, 28.0, 19.0, 17.0, 12.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.15379905700683594, -0.14841842651367188, -0.1430377960205078, -0.13765716552734375, -0.1322765350341797, -0.12689590454101562, -0.12151527404785156, -0.1161346435546875, -0.11075401306152344, -0.10537338256835938, -0.09999275207519531, -0.09461212158203125, -0.08923149108886719, -0.08385086059570312, -0.07847023010253906, -0.073089599609375, -0.06770896911621094, -0.062328338623046875, -0.05694770812988281, -0.05156707763671875, -0.04618644714355469, -0.040805816650390625, -0.03542518615722656, -0.0300445556640625, -0.024663925170898438, -0.019283294677734375, -0.013902664184570312, -0.00852203369140625, -0.0031414031982421875, 0.002239227294921875, 0.0076198577880859375, 0.01300048828125, 0.018381118774414062, 0.023761749267578125, 0.029142379760742188, 0.03452301025390625, 0.03990364074707031, 0.045284271240234375, 0.05066490173339844, 0.0560455322265625, 0.06142616271972656, 0.06680679321289062, 0.07218742370605469, 0.07756805419921875, 0.08294868469238281, 0.08832931518554688, 0.09370994567871094, 0.099090576171875, 0.10447120666503906, 0.10985183715820312, 0.11523246765136719, 0.12061309814453125, 0.1259937286376953, 0.13137435913085938, 0.13675498962402344, 0.1421356201171875, 0.14751625061035156, 0.15289688110351562, 0.1582775115966797, 0.16365814208984375, 0.1690387725830078, 0.17441940307617188, 0.17980003356933594, 0.1851806640625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 7.0, 7.0, 16.0, 17.0, 10.0, 14.0, 21.0, 24.0, 15.0, 24.0, 30.0, 49.0, 39.0, 29.0, 33.0, 38.0, 36.0, 43.0, 1056.0, 34.0, 53.0, 42.0, 34.0, 43.0, 36.0, 27.0, 34.0, 35.0, 23.0, 29.0, 20.0, 14.0, 18.0, 16.0, 8.0, 11.0, 8.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.37890625, -2.306121826171875, -2.23333740234375, -2.160552978515625, -2.0877685546875, -2.014984130859375, -1.94219970703125, -1.869415283203125, -1.796630859375, -1.723846435546875, -1.65106201171875, -1.578277587890625, -1.5054931640625, -1.432708740234375, -1.35992431640625, -1.287139892578125, -1.21435546875, -1.141571044921875, -1.06878662109375, -0.996002197265625, -0.9232177734375, -0.850433349609375, -0.77764892578125, -0.704864501953125, -0.632080078125, -0.559295654296875, -0.48651123046875, -0.413726806640625, -0.3409423828125, -0.268157958984375, -0.19537353515625, -0.122589111328125, -0.0498046875, 0.022979736328125, 0.09576416015625, 0.168548583984375, 0.2413330078125, 0.314117431640625, 0.38690185546875, 0.459686279296875, 0.532470703125, 0.605255126953125, 0.67803955078125, 0.750823974609375, 0.8236083984375, 0.896392822265625, 0.96917724609375, 1.041961669921875, 1.11474609375, 1.187530517578125, 1.26031494140625, 1.333099365234375, 1.4058837890625, 1.478668212890625, 1.55145263671875, 1.624237060546875, 1.697021484375, 1.769805908203125, 1.84259033203125, 1.915374755859375, 1.9881591796875, 2.060943603515625, 2.13372802734375, 2.206512451171875, 2.279296875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 3.0, 11.0, 19.0, 25.0, 37.0, 48.0, 59.0, 107.0, 146.0, 248.0, 372.0, 609.0, 928.0, 1504.0, 2485.0, 4064.0, 6667.0, 11110.0, 19128.0, 33240.0, 59091.0, 112393.0, 463412.0, 1120311.0, 116002.0, 61607.0, 34550.0, 19844.0, 11503.0, 6859.0, 4009.0, 2436.0, 1550.0, 958.0, 630.0, 402.0, 254.0, 182.0, 94.0, 88.0, 54.0, 29.0, 24.0, 13.0, 8.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.06866455078125, -0.06658554077148438, -0.06450653076171875, -0.062427520751953125, -0.0603485107421875, -0.058269500732421875, -0.05619049072265625, -0.054111480712890625, -0.052032470703125, -0.049953460693359375, -0.04787445068359375, -0.045795440673828125, -0.0437164306640625, -0.041637420654296875, -0.03955841064453125, -0.037479400634765625, -0.035400390625, -0.033321380615234375, -0.03124237060546875, -0.029163360595703125, -0.0270843505859375, -0.025005340576171875, -0.02292633056640625, -0.020847320556640625, -0.018768310546875, -0.016689300537109375, -0.01461029052734375, -0.012531280517578125, -0.0104522705078125, -0.008373260498046875, -0.00629425048828125, -0.004215240478515625, -0.00213623046875, -5.7220458984375e-05, 0.00202178955078125, 0.004100799560546875, 0.0061798095703125, 0.008258819580078125, 0.01033782958984375, 0.012416839599609375, 0.014495849609375, 0.016574859619140625, 0.01865386962890625, 0.020732879638671875, 0.0228118896484375, 0.024890899658203125, 0.02696990966796875, 0.029048919677734375, 0.0311279296875, 0.033206939697265625, 0.03528594970703125, 0.037364959716796875, 0.0394439697265625, 0.041522979736328125, 0.04360198974609375, 0.045680999755859375, 0.047760009765625, 0.049839019775390625, 0.05191802978515625, 0.053997039794921875, 0.0560760498046875, 0.058155059814453125, 0.06023406982421875, 0.062313079833984375, 0.06439208984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 13.0, 8.0, 19.0, 27.0, 14.0, 25.0, 27.0, 33.0, 57.0, 98.0, 135.0, 141.0, 106.0, 64.0, 44.0, 33.0, 25.0, 20.0, 17.0, 13.0, 11.0, 12.0, 5.0, 9.0, 6.0, 13.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0], "bins": [-0.0008792877197265625, -0.0008589327335357666, -0.0008385777473449707, -0.0008182227611541748, -0.0007978677749633789, -0.000777512788772583, -0.0007571578025817871, -0.0007368028163909912, -0.0007164478302001953, -0.0006960928440093994, -0.0006757378578186035, -0.0006553828716278076, -0.0006350278854370117, -0.0006146728992462158, -0.0005943179130554199, -0.000573962926864624, -0.0005536079406738281, -0.0005332529544830322, -0.0005128979682922363, -0.0004925429821014404, -0.00047218799591064453, -0.00045183300971984863, -0.00043147802352905273, -0.00041112303733825684, -0.00039076805114746094, -0.00037041306495666504, -0.00035005807876586914, -0.00032970309257507324, -0.00030934810638427734, -0.00028899312019348145, -0.00026863813400268555, -0.00024828314781188965, -0.00022792816162109375, -0.00020757317543029785, -0.00018721818923950195, -0.00016686320304870605, -0.00014650821685791016, -0.00012615323066711426, -0.00010579824447631836, -8.544325828552246e-05, -6.508827209472656e-05, -4.4733285903930664e-05, -2.4378299713134766e-05, -4.023313522338867e-06, 1.633167266845703e-05, 3.668665885925293e-05, 5.704164505004883e-05, 7.739663124084473e-05, 9.775161743164062e-05, 0.00011810660362243652, 0.00013846158981323242, 0.00015881657600402832, 0.00017917156219482422, 0.00019952654838562012, 0.00021988153457641602, 0.00024023652076721191, 0.0002605915069580078, 0.0002809464931488037, 0.0003013014793395996, 0.0003216564655303955, 0.0003420114517211914, 0.0003623664379119873, 0.0003827214241027832, 0.0004030764102935791, 0.000423431396484375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 5.0, 5.0, 8.0, 19.0, 22.0, 39.0, 57.0, 77.0, 147.0, 395.0, 1437.0, 6725.0, 45574.0, 692586.0, 269826.0, 25807.0, 4216.0, 968.0, 294.0, 134.0, 78.0, 39.0, 21.0, 20.0, 16.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00806427001953125, -0.007739901542663574, -0.0074155330657958984, -0.007091164588928223, -0.006766796112060547, -0.006442427635192871, -0.006118059158325195, -0.0057936906814575195, -0.005469322204589844, -0.005144953727722168, -0.004820585250854492, -0.004496216773986816, -0.004171848297119141, -0.003847479820251465, -0.003523111343383789, -0.0031987428665161133, -0.0028743743896484375, -0.0025500059127807617, -0.002225637435913086, -0.0019012689590454102, -0.0015769004821777344, -0.0012525320053100586, -0.0009281635284423828, -0.000603795051574707, -0.00027942657470703125, 4.494190216064453e-05, 0.0003693103790283203, 0.0006936788558959961, 0.0010180473327636719, 0.0013424158096313477, 0.0016667842864990234, 0.0019911527633666992, 0.002315521240234375, 0.0026398897171020508, 0.0029642581939697266, 0.0032886266708374023, 0.003612995147705078, 0.003937363624572754, 0.00426173210144043, 0.0045861005783081055, 0.004910469055175781, 0.005234837532043457, 0.005559206008911133, 0.005883574485778809, 0.006207942962646484, 0.00653231143951416, 0.006856679916381836, 0.007181048393249512, 0.0075054168701171875, 0.007829785346984863, 0.008154153823852539, 0.008478522300720215, 0.00880289077758789, 0.009127259254455566, 0.009451627731323242, 0.009775996208190918, 0.010100364685058594, 0.01042473316192627, 0.010749101638793945, 0.011073470115661621, 0.011397838592529297, 0.011722207069396973, 0.012046575546264648, 0.012370944023132324, 0.0126953125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 11.0, 33.0, 86.0, 282.0, 413.0, 106.0, 49.0, 14.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004466247744858265, -0.004313251003623009, -0.0041602542623877525, -0.004007257521152496, -0.0038542605470865965, -0.0037012638058513403, -0.0035482668317854404, -0.0033952700905501842, -0.003242273349314928, -0.003089276608079672, -0.0029362798668444157, -0.002783282892778516, -0.0026302861515432596, -0.0024772894103080034, -0.0023242924362421036, -0.0021712956950068474, -0.002018298953771591, -0.001865302212536335, -0.001712305354885757, -0.001559308497235179, -0.0014063117559999228, -0.0012533150147646666, -0.0011003181571140885, -0.0009473212994635105, -0.0007943245582282543, -0.0006413277587853372, -0.0004883309593424201, -0.000335334159899503, -0.00018233736045658588, -2.9340561013668776e-05, 0.00012365623842924833, 0.00027665309607982635, 0.00042965030297636986, 0.000582647102419287, 0.0007356439018622041, 0.0008886407013051212, 0.0010416375007480383, 0.0011946342419832945, 0.0013476310996338725, 0.0015006279572844505, 0.0016536246985197067, 0.001806621439754963, 0.001959618180990219, 0.002112615155056119, 0.002265611896291375, 0.0024186086375266314, 0.002571605611592531, 0.0027246023528277874, 0.0028775990940630436, 0.0030305958352983, 0.003183592576533556, 0.003336589550599456, 0.003489586291834712, 0.0036425830330699682, 0.003795580007135868, 0.003948576748371124, 0.0041015734896063805, 0.004254570230841637, 0.004407566972076893, 0.004560563713312149, 0.004713560454547405, 0.004866557661443949, 0.005019554402679205, 0.005172551143914461, 0.005325547885149717]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 11.0, 9.0, 21.0, 16.0, 16.0, 38.0, 35.0, 34.0, 39.0, 43.0, 56.0, 54.0, 59.0, 55.0, 59.0, 55.0, 68.0, 59.0, 66.0, 34.0, 25.0, 39.0, 28.0, 20.0, 16.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005463361740112305, -0.0005301665514707565, -0.0005139969289302826, -0.0004978273063898087, -0.0004816576838493347, -0.0004654880613088608, -0.00044931843876838684, -0.0004331488162279129, -0.00041697919368743896, -0.000400809571146965, -0.0003846399486064911, -0.00036847032606601715, -0.0003523007035255432, -0.0003361310809850693, -0.00031996145844459534, -0.0003037918359041214, -0.00028762221336364746, -0.0002714525908231735, -0.0002552829682826996, -0.00023911334574222565, -0.0002229437232017517, -0.00020677410066127777, -0.00019060447812080383, -0.0001744348555803299, -0.00015826523303985596, -0.00014209561049938202, -0.00012592598795890808, -0.00010975636541843414, -9.35867428779602e-05, -7.741712033748627e-05, -6.124749779701233e-05, -4.507787525653839e-05, -2.8908252716064453e-05, -1.2738630175590515e-05, 3.430992364883423e-06, 1.960061490535736e-05, 3.57702374458313e-05, 5.193985998630524e-05, 6.810948252677917e-05, 8.427910506725311e-05, 0.00010044872760772705, 0.00011661835014820099, 0.00013278797268867493, 0.00014895759522914886, 0.0001651272177696228, 0.00018129684031009674, 0.00019746646285057068, 0.00021363608539104462, 0.00022980570793151855, 0.0002459753304719925, 0.00026214495301246643, 0.00027831457555294037, 0.0002944841980934143, 0.00031065382063388824, 0.0003268234431743622, 0.0003429930657148361, 0.00035916268825531006, 0.000375332310795784, 0.00039150193333625793, 0.00040767155587673187, 0.0004238411784172058, 0.00044001080095767975, 0.0004561804234981537, 0.0004723500460386276, 0.0004885196685791016]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 10.0, 13.0, 6.0, 12.0, 20.0, 15.0, 24.0, 28.0, 47.0, 33.0, 33.0, 52.0, 47.0, 59.0, 64.0, 47.0, 53.0, 56.0, 63.0, 49.0, 49.0, 27.0, 44.0, 34.0, 22.0, 19.0, 11.0, 14.0, 10.0, 14.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.3046875, -3.20623779296875, -3.1077880859375, -3.00933837890625, -2.910888671875, -2.81243896484375, -2.7139892578125, -2.61553955078125, -2.51708984375, -2.41864013671875, -2.3201904296875, -2.22174072265625, -2.123291015625, -2.02484130859375, -1.9263916015625, -1.82794189453125, -1.7294921875, -1.63104248046875, -1.5325927734375, -1.43414306640625, -1.335693359375, -1.23724365234375, -1.1387939453125, -1.04034423828125, -0.94189453125, -0.84344482421875, -0.7449951171875, -0.64654541015625, -0.548095703125, -0.44964599609375, -0.3511962890625, -0.25274658203125, -0.154296875, -0.05584716796875, 0.0426025390625, 0.14105224609375, 0.239501953125, 0.33795166015625, 0.4364013671875, 0.53485107421875, 0.63330078125, 0.73175048828125, 0.8302001953125, 0.92864990234375, 1.027099609375, 1.12554931640625, 1.2239990234375, 1.32244873046875, 1.4208984375, 1.51934814453125, 1.6177978515625, 1.71624755859375, 1.814697265625, 1.91314697265625, 2.0115966796875, 2.11004638671875, 2.20849609375, 2.30694580078125, 2.4053955078125, 2.50384521484375, 2.602294921875, 2.70074462890625, 2.7991943359375, 2.89764404296875, 2.99609375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 6.0, 9.0, 13.0, 35.0, 50.0, 69.0, 113.0, 160.0, 347.0, 595.0, 1296.0, 3053.0, 10474.0, 70561.0, 746907.0, 184006.0, 22405.0, 4790.0, 1797.0, 824.0, 453.0, 212.0, 147.0, 69.0, 53.0, 40.0, 17.0, 14.0, 12.0, 7.0, 4.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.279052734375, -10.88623046875, -10.493408203125, -10.1005859375, -9.707763671875, -9.31494140625, -8.922119140625, -8.529296875, -8.136474609375, -7.74365234375, -7.350830078125, -6.9580078125, -6.565185546875, -6.17236328125, -5.779541015625, -5.38671875, -4.993896484375, -4.60107421875, -4.208251953125, -3.8154296875, -3.422607421875, -3.02978515625, -2.636962890625, -2.244140625, -1.851318359375, -1.45849609375, -1.065673828125, -0.6728515625, -0.280029296875, 0.11279296875, 0.505615234375, 0.8984375, 1.291259765625, 1.68408203125, 2.076904296875, 2.4697265625, 2.862548828125, 3.25537109375, 3.648193359375, 4.041015625, 4.433837890625, 4.82666015625, 5.219482421875, 5.6123046875, 6.005126953125, 6.39794921875, 6.790771484375, 7.18359375, 7.576416015625, 7.96923828125, 8.362060546875, 8.7548828125, 9.147705078125, 9.54052734375, 9.933349609375, 10.326171875, 10.718994140625, 11.11181640625, 11.504638671875, 11.8974609375, 12.290283203125, 12.68310546875, 13.075927734375, 13.46875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 4.0, 10.0, 12.0, 8.0, 23.0, 26.0, 30.0, 22.0, 25.0, 34.0, 41.0, 35.0, 50.0, 71.0, 112.0, 175.0, 1374.0, 304.0, 136.0, 114.0, 79.0, 50.0, 53.0, 30.0, 34.0, 44.0, 32.0, 24.0, 19.0, 11.0, 7.0, 9.0, 1.0, 10.0, 6.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.265625, -9.97998046875, -9.6943359375, -9.40869140625, -9.123046875, -8.83740234375, -8.5517578125, -8.26611328125, -7.98046875, -7.69482421875, -7.4091796875, -7.12353515625, -6.837890625, -6.55224609375, -6.2666015625, -5.98095703125, -5.6953125, -5.40966796875, -5.1240234375, -4.83837890625, -4.552734375, -4.26708984375, -3.9814453125, -3.69580078125, -3.41015625, -3.12451171875, -2.8388671875, -2.55322265625, -2.267578125, -1.98193359375, -1.6962890625, -1.41064453125, -1.125, -0.83935546875, -0.5537109375, -0.26806640625, 0.017578125, 0.30322265625, 0.5888671875, 0.87451171875, 1.16015625, 1.44580078125, 1.7314453125, 2.01708984375, 2.302734375, 2.58837890625, 2.8740234375, 3.15966796875, 3.4453125, 3.73095703125, 4.0166015625, 4.30224609375, 4.587890625, 4.87353515625, 5.1591796875, 5.44482421875, 5.73046875, 6.01611328125, 6.3017578125, 6.58740234375, 6.873046875, 7.15869140625, 7.4443359375, 7.72998046875, 8.015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 16.0, 18.0, 25.0, 39.0, 49.0, 59.0, 112.0, 149.0, 283.0, 540.0, 1309.0, 3753.0, 15662.0, 153515.0, 2514400.0, 415897.0, 30652.0, 5751.0, 1806.0, 693.0, 333.0, 180.0, 120.0, 76.0, 53.0, 44.0, 33.0, 21.0, 24.0, 10.0, 7.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.46875, -12.0338134765625, -11.598876953125, -11.1639404296875, -10.72900390625, -10.2940673828125, -9.859130859375, -9.4241943359375, -8.9892578125, -8.5543212890625, -8.119384765625, -7.6844482421875, -7.24951171875, -6.8145751953125, -6.379638671875, -5.9447021484375, -5.509765625, -5.0748291015625, -4.639892578125, -4.2049560546875, -3.77001953125, -3.3350830078125, -2.900146484375, -2.4652099609375, -2.0302734375, -1.5953369140625, -1.160400390625, -0.7254638671875, -0.29052734375, 0.1444091796875, 0.579345703125, 1.0142822265625, 1.44921875, 1.8841552734375, 2.319091796875, 2.7540283203125, 3.18896484375, 3.6239013671875, 4.058837890625, 4.4937744140625, 4.9287109375, 5.3636474609375, 5.798583984375, 6.2335205078125, 6.66845703125, 7.1033935546875, 7.538330078125, 7.9732666015625, 8.408203125, 8.8431396484375, 9.278076171875, 9.7130126953125, 10.14794921875, 10.5828857421875, 11.017822265625, 11.4527587890625, 11.8876953125, 12.3226318359375, 12.757568359375, 13.1925048828125, 13.62744140625, 14.0623779296875, 14.497314453125, 14.9322509765625, 15.3671875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [4.0, 27.0, 181.0, 427.0, 304.0, 63.0, 9.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.46053695678711, -9.165708541870117, -5.870879173278809, -2.5760498046875, 0.7187786102294922, 4.013607025146484, 7.308437347412109, 10.603265762329102, 13.898094177246094, 17.192922592163086, 20.487751007080078, 23.782581329345703, 27.077409744262695, 30.372238159179688, 33.66706848144531, 36.96189880371094, 40.2567253112793, 43.55155563354492, 46.84638214111328, 50.141212463378906, 53.43604278564453, 56.73086929321289, 60.025699615478516, 63.320526123046875, 66.6153564453125, 69.91018676757812, 73.20501708984375, 76.49984741210938, 79.79467010498047, 83.0895004272461, 86.38433074951172, 89.67916107177734, 92.97398376464844, 96.26881408691406, 99.56364440917969, 102.85847473144531, 106.1532974243164, 109.44812774658203, 112.74295806884766, 116.03778839111328, 119.33261108398438, 122.62744140625, 125.92227172851562, 129.21710205078125, 132.51193237304688, 135.8067626953125, 139.10159301757812, 142.3964080810547, 145.69125366210938, 148.986083984375, 152.28091430664062, 155.57574462890625, 158.87057495117188, 162.1654052734375, 165.46023559570312, 168.7550506591797, 172.0498809814453, 175.34471130371094, 178.63954162597656, 181.9343719482422, 185.2292022705078, 188.52401733398438, 191.81884765625, 195.11367797851562, 198.40850830078125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 9.0, 6.0, 10.0, 7.0, 16.0, 20.0, 24.0, 22.0, 26.0, 17.0, 29.0, 31.0, 43.0, 50.0, 47.0, 44.0, 47.0, 40.0, 38.0, 46.0, 42.0, 34.0, 36.0, 36.0, 43.0, 30.0, 29.0, 35.0, 24.0, 18.0, 15.0, 17.0, 13.0, 18.0, 12.0, 8.0, 5.0, 11.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.645442962646484, -30.732877731323242, -29.8203125, -28.907747268676758, -27.995182037353516, -27.082618713378906, -26.170053482055664, -25.257488250732422, -24.34492301940918, -23.432357788085938, -22.519792556762695, -21.607227325439453, -20.694664001464844, -19.78209686279297, -18.86953353881836, -17.956968307495117, -17.044403076171875, -16.131837844848633, -15.21927261352539, -14.306708335876465, -13.394143104553223, -12.48157787322998, -11.569013595581055, -10.656448364257812, -9.74388313293457, -8.831317901611328, -7.918753147125244, -7.00618839263916, -6.093623161315918, -5.181057929992676, -4.268493175506592, -3.355928421020508, -2.4433631896972656, -1.5307981967926025, -0.6182332038879395, 0.29433178901672363, 1.2068967819213867, 2.119462013244629, 3.032026767730713, 3.944591522216797, 4.857156753540039, 5.769721984863281, 6.682286739349365, 7.594851493835449, 8.507416725158691, 9.419981956481934, 10.33254623413086, 11.245111465454102, 12.157676696777344, 13.070241928100586, 13.982807159423828, 14.895371437072754, 15.807936668395996, 16.720500946044922, 17.633066177368164, 18.545631408691406, 19.45819664001465, 20.37076187133789, 21.283327102661133, 22.195892333984375, 23.108455657958984, 24.02102279663086, 24.93358612060547, 25.84615135192871, 26.758716583251953]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 8.0, 5.0, 8.0, 5.0, 11.0, 13.0, 18.0, 15.0, 14.0, 23.0, 32.0, 31.0, 39.0, 37.0, 49.0, 54.0, 54.0, 42.0, 44.0, 45.0, 54.0, 54.0, 47.0, 43.0, 44.0, 37.0, 33.0, 30.0, 22.0, 25.0, 12.0, 10.0, 9.0, 10.0, 10.0, 3.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.158203125, -3.06463623046875, -2.9710693359375, -2.87750244140625, -2.783935546875, -2.69036865234375, -2.5968017578125, -2.50323486328125, -2.40966796875, -2.31610107421875, -2.2225341796875, -2.12896728515625, -2.035400390625, -1.94183349609375, -1.8482666015625, -1.75469970703125, -1.6611328125, -1.56756591796875, -1.4739990234375, -1.38043212890625, -1.286865234375, -1.19329833984375, -1.0997314453125, -1.00616455078125, -0.91259765625, -0.81903076171875, -0.7254638671875, -0.63189697265625, -0.538330078125, -0.44476318359375, -0.3511962890625, -0.25762939453125, -0.1640625, -0.07049560546875, 0.0230712890625, 0.11663818359375, 0.210205078125, 0.30377197265625, 0.3973388671875, 0.49090576171875, 0.58447265625, 0.67803955078125, 0.7716064453125, 0.86517333984375, 0.958740234375, 1.05230712890625, 1.1458740234375, 1.23944091796875, 1.3330078125, 1.42657470703125, 1.5201416015625, 1.61370849609375, 1.707275390625, 1.80084228515625, 1.8944091796875, 1.98797607421875, 2.08154296875, 2.17510986328125, 2.2686767578125, 2.36224365234375, 2.455810546875, 2.54937744140625, 2.6429443359375, 2.73651123046875, 2.830078125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 10.0, 12.0, 14.0, 17.0, 20.0, 44.0, 52.0, 72.0, 132.0, 202.0, 356.0, 673.0, 1202.0, 2249.0, 4815.0, 13016.0, 59945.0, 760413.0, 2964925.0, 333489.0, 35741.0, 9542.0, 3712.0, 1695.0, 868.0, 429.0, 229.0, 153.0, 68.0, 54.0, 52.0, 25.0, 21.0, 8.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.15625, -10.8653564453125, -10.574462890625, -10.2835693359375, -9.99267578125, -9.7017822265625, -9.410888671875, -9.1199951171875, -8.8291015625, -8.5382080078125, -8.247314453125, -7.9564208984375, -7.66552734375, -7.3746337890625, -7.083740234375, -6.7928466796875, -6.501953125, -6.2110595703125, -5.920166015625, -5.6292724609375, -5.33837890625, -5.0474853515625, -4.756591796875, -4.4656982421875, -4.1748046875, -3.8839111328125, -3.593017578125, -3.3021240234375, -3.01123046875, -2.7203369140625, -2.429443359375, -2.1385498046875, -1.84765625, -1.5567626953125, -1.265869140625, -0.9749755859375, -0.68408203125, -0.3931884765625, -0.102294921875, 0.1885986328125, 0.4794921875, 0.7703857421875, 1.061279296875, 1.3521728515625, 1.64306640625, 1.9339599609375, 2.224853515625, 2.5157470703125, 2.806640625, 3.0975341796875, 3.388427734375, 3.6793212890625, 3.97021484375, 4.2611083984375, 4.552001953125, 4.8428955078125, 5.1337890625, 5.4246826171875, 5.715576171875, 6.0064697265625, 6.29736328125, 6.5882568359375, 6.879150390625, 7.1700439453125, 7.4609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 9.0, 11.0, 11.0, 18.0, 26.0, 26.0, 38.0, 55.0, 78.0, 102.0, 157.0, 283.0, 364.0, 546.0, 593.0, 548.0, 377.0, 258.0, 165.0, 131.0, 74.0, 65.0, 37.0, 23.0, 13.0, 15.0, 14.0, 4.0, 6.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.4376220703125, -6.203369140625, -5.9691162109375, -5.73486328125, -5.5006103515625, -5.266357421875, -5.0321044921875, -4.7978515625, -4.5635986328125, -4.329345703125, -4.0950927734375, -3.86083984375, -3.6265869140625, -3.392333984375, -3.1580810546875, -2.923828125, -2.6895751953125, -2.455322265625, -2.2210693359375, -1.98681640625, -1.7525634765625, -1.518310546875, -1.2840576171875, -1.0498046875, -0.8155517578125, -0.581298828125, -0.3470458984375, -0.11279296875, 0.1214599609375, 0.355712890625, 0.5899658203125, 0.82421875, 1.0584716796875, 1.292724609375, 1.5269775390625, 1.76123046875, 1.9954833984375, 2.229736328125, 2.4639892578125, 2.6982421875, 2.9324951171875, 3.166748046875, 3.4010009765625, 3.63525390625, 3.8695068359375, 4.103759765625, 4.3380126953125, 4.572265625, 4.8065185546875, 5.040771484375, 5.2750244140625, 5.50927734375, 5.7435302734375, 5.977783203125, 6.2120361328125, 6.4462890625, 6.6805419921875, 6.914794921875, 7.1490478515625, 7.38330078125, 7.6175537109375, 7.851806640625, 8.0860595703125, 8.3203125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 13.0, 13.0, 20.0, 15.0, 19.0, 34.0, 48.0, 80.0, 166.0, 313.0, 687.0, 1563.0, 3959.0, 11786.0, 57401.0, 721762.0, 3055904.0, 294480.0, 32574.0, 8256.0, 2824.0, 1164.0, 557.0, 244.0, 139.0, 83.0, 47.0, 32.0, 26.0, 18.0, 20.0, 11.0, 7.0, 5.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.703125, -17.241455078125, -16.77978515625, -16.318115234375, -15.8564453125, -15.394775390625, -14.93310546875, -14.471435546875, -14.009765625, -13.548095703125, -13.08642578125, -12.624755859375, -12.1630859375, -11.701416015625, -11.23974609375, -10.778076171875, -10.31640625, -9.854736328125, -9.39306640625, -8.931396484375, -8.4697265625, -8.008056640625, -7.54638671875, -7.084716796875, -6.623046875, -6.161376953125, -5.69970703125, -5.238037109375, -4.7763671875, -4.314697265625, -3.85302734375, -3.391357421875, -2.9296875, -2.468017578125, -2.00634765625, -1.544677734375, -1.0830078125, -0.621337890625, -0.15966796875, 0.302001953125, 0.763671875, 1.225341796875, 1.68701171875, 2.148681640625, 2.6103515625, 3.072021484375, 3.53369140625, 3.995361328125, 4.45703125, 4.918701171875, 5.38037109375, 5.842041015625, 6.3037109375, 6.765380859375, 7.22705078125, 7.688720703125, 8.150390625, 8.612060546875, 9.07373046875, 9.535400390625, 9.9970703125, 10.458740234375, 10.92041015625, 11.382080078125, 11.84375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 7.0, 8.0, 15.0, 11.0, 18.0, 29.0, 20.0, 27.0, 28.0, 37.0, 47.0, 49.0, 53.0, 56.0, 60.0, 65.0, 59.0, 52.0, 61.0, 48.0, 41.0, 47.0, 27.0, 32.0, 17.0, 18.0, 14.0, 9.0, 15.0, 4.0, 7.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.93575096130371, -19.27741050720215, -18.619068145751953, -17.96072769165039, -17.302387237548828, -16.644046783447266, -15.985705375671387, -15.327363967895508, -14.669023513793945, -14.010683059692383, -13.352341651916504, -12.694000244140625, -12.035659790039062, -11.3773193359375, -10.718977928161621, -10.060636520385742, -9.40229606628418, -8.743955612182617, -8.085614204406738, -7.427273273468018, -6.768932342529297, -6.110591411590576, -5.4522504806518555, -4.793909549713135, -4.135568618774414, -3.4772276878356934, -2.8188867568969727, -2.160545825958252, -1.5022048950195312, -0.8438639640808105, -0.18552303314208984, 0.47281789779663086, 1.1311607360839844, 1.789501667022705, 2.447842597961426, 3.1061835289001465, 3.764524459838867, 4.422865390777588, 5.081206321716309, 5.739547252655029, 6.39788818359375, 7.056229114532471, 7.714570045471191, 8.37291145324707, 9.031251907348633, 9.689592361450195, 10.347933769226074, 11.006275177001953, 11.664615631103516, 12.322956085205078, 12.981297492980957, 13.639638900756836, 14.297979354858398, 14.956319808959961, 15.61466121673584, 16.27300262451172, 16.93134307861328, 17.589683532714844, 18.248023986816406, 18.9063663482666, 19.564706802368164, 20.223047256469727, 20.881389617919922, 21.539730072021484, 22.198070526123047]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 1.0, 5.0, 3.0, 9.0, 4.0, 10.0, 16.0, 14.0, 20.0, 21.0, 25.0, 27.0, 24.0, 32.0, 25.0, 27.0, 40.0, 37.0, 39.0, 31.0, 45.0, 41.0, 35.0, 36.0, 35.0, 47.0, 29.0, 44.0, 26.0, 24.0, 38.0, 27.0, 24.0, 22.0, 10.0, 16.0, 14.0, 16.0, 11.0, 9.0, 9.0, 8.0, 4.0, 7.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-21.031719207763672, -20.40998649597168, -19.788253784179688, -19.166521072387695, -18.544788360595703, -17.92305564880371, -17.30132293701172, -16.67959213256836, -16.057857513427734, -15.436124801635742, -14.81439208984375, -14.192659378051758, -13.570926666259766, -12.949193954467773, -12.327462196350098, -11.705729484558105, -11.08399772644043, -10.462265014648438, -9.840532302856445, -9.218799591064453, -8.597066879272461, -7.975334644317627, -7.353602409362793, -6.731869697570801, -6.110136985778809, -5.488404273986816, -4.866671562194824, -4.24493932723999, -3.623206615447998, -3.001473903656006, -2.3797414302825928, -1.7580089569091797, -1.1362743377685547, -0.514541745185852, 0.10719084739685059, 0.7289234399795532, 1.3506560325622559, 1.972388744354248, 2.594121217727661, 3.215853691101074, 3.8375864028930664, 4.459319114685059, 5.081051826477051, 5.702784061431885, 6.324516773223877, 6.946249485015869, 7.567981719970703, 8.189714431762695, 8.811447143554688, 9.43317985534668, 10.054912567138672, 10.676645278930664, 11.298377990722656, 11.920110702514648, 12.541842460632324, 13.163575172424316, 13.785307884216309, 14.4070405960083, 15.028773307800293, 15.650506019592285, 16.27223777770996, 16.893970489501953, 17.515703201293945, 18.137435913085938, 18.75916862487793]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 3.0, 6.0, 12.0, 6.0, 9.0, 13.0, 19.0, 19.0, 12.0, 25.0, 35.0, 23.0, 40.0, 49.0, 40.0, 41.0, 41.0, 50.0, 49.0, 53.0, 49.0, 42.0, 49.0, 55.0, 31.0, 47.0, 28.0, 29.0, 20.0, 16.0, 13.0, 20.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.95703125, -2.86669921875, -2.7763671875, -2.68603515625, -2.595703125, -2.50537109375, -2.4150390625, -2.32470703125, -2.234375, -2.14404296875, -2.0537109375, -1.96337890625, -1.873046875, -1.78271484375, -1.6923828125, -1.60205078125, -1.51171875, -1.42138671875, -1.3310546875, -1.24072265625, -1.150390625, -1.06005859375, -0.9697265625, -0.87939453125, -0.7890625, -0.69873046875, -0.6083984375, -0.51806640625, -0.427734375, -0.33740234375, -0.2470703125, -0.15673828125, -0.06640625, 0.02392578125, 0.1142578125, 0.20458984375, 0.294921875, 0.38525390625, 0.4755859375, 0.56591796875, 0.65625, 0.74658203125, 0.8369140625, 0.92724609375, 1.017578125, 1.10791015625, 1.1982421875, 1.28857421875, 1.37890625, 1.46923828125, 1.5595703125, 1.64990234375, 1.740234375, 1.83056640625, 1.9208984375, 2.01123046875, 2.1015625, 2.19189453125, 2.2822265625, 2.37255859375, 2.462890625, 2.55322265625, 2.6435546875, 2.73388671875, 2.82421875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 12.0, 7.0, 15.0, 17.0, 30.0, 49.0, 65.0, 101.0, 149.0, 229.0, 376.0, 557.0, 866.0, 1365.0, 2314.0, 3994.0, 6857.0, 11509.0, 19493.0, 33936.0, 61561.0, 124931.0, 333465.0, 232021.0, 96360.0, 50166.0, 28173.0, 16219.0, 9584.0, 5660.0, 3263.0, 1896.0, 1250.0, 742.0, 444.0, 313.0, 186.0, 131.0, 75.0, 60.0, 44.0, 19.0, 18.0, 11.0, 11.0, 3.0, 8.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1634521484375, -0.1579723358154297, -0.15249252319335938, -0.14701271057128906, -0.14153289794921875, -0.13605308532714844, -0.13057327270507812, -0.1250934600830078, -0.1196136474609375, -0.11413383483886719, -0.10865402221679688, -0.10317420959472656, -0.09769439697265625, -0.09221458435058594, -0.08673477172851562, -0.08125495910644531, -0.075775146484375, -0.07029533386230469, -0.06481552124023438, -0.05933570861816406, -0.05385589599609375, -0.04837608337402344, -0.042896270751953125, -0.03741645812988281, -0.0319366455078125, -0.026456832885742188, -0.020977020263671875, -0.015497207641601562, -0.01001739501953125, -0.0045375823974609375, 0.000942230224609375, 0.0064220428466796875, 0.01190185546875, 0.017381668090820312, 0.022861480712890625, 0.028341293334960938, 0.03382110595703125, 0.03930091857910156, 0.044780731201171875, 0.05026054382324219, 0.0557403564453125, 0.06122016906738281, 0.06669998168945312, 0.07217979431152344, 0.07765960693359375, 0.08313941955566406, 0.08861923217773438, 0.09409904479980469, 0.099578857421875, 0.10505867004394531, 0.11053848266601562, 0.11601829528808594, 0.12149810791015625, 0.12697792053222656, 0.13245773315429688, 0.1379375457763672, 0.1434173583984375, 0.1488971710205078, 0.15437698364257812, 0.15985679626464844, 0.16533660888671875, 0.17081642150878906, 0.17629623413085938, 0.1817760467529297, 0.187255859375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 7.0, 4.0, 7.0, 10.0, 15.0, 15.0, 21.0, 16.0, 18.0, 28.0, 37.0, 29.0, 40.0, 38.0, 34.0, 42.0, 37.0, 42.0, 39.0, 1071.0, 41.0, 26.0, 42.0, 39.0, 41.0, 37.0, 33.0, 32.0, 39.0, 23.0, 20.0, 16.0, 16.0, 11.0, 4.0, 11.0, 7.0, 6.0, 11.0, 4.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08203125, -2.00799560546875, -1.9339599609375, -1.85992431640625, -1.785888671875, -1.71185302734375, -1.6378173828125, -1.56378173828125, -1.48974609375, -1.41571044921875, -1.3416748046875, -1.26763916015625, -1.193603515625, -1.11956787109375, -1.0455322265625, -0.97149658203125, -0.8974609375, -0.82342529296875, -0.7493896484375, -0.67535400390625, -0.601318359375, -0.52728271484375, -0.4532470703125, -0.37921142578125, -0.30517578125, -0.23114013671875, -0.1571044921875, -0.08306884765625, -0.009033203125, 0.06500244140625, 0.1390380859375, 0.21307373046875, 0.287109375, 0.36114501953125, 0.4351806640625, 0.50921630859375, 0.583251953125, 0.65728759765625, 0.7313232421875, 0.80535888671875, 0.87939453125, 0.95343017578125, 1.0274658203125, 1.10150146484375, 1.175537109375, 1.24957275390625, 1.3236083984375, 1.39764404296875, 1.4716796875, 1.54571533203125, 1.6197509765625, 1.69378662109375, 1.767822265625, 1.84185791015625, 1.9158935546875, 1.98992919921875, 2.06396484375, 2.13800048828125, 2.2120361328125, 2.28607177734375, 2.360107421875, 2.43414306640625, 2.5081787109375, 2.58221435546875, 2.65625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 8.0, 10.0, 14.0, 16.0, 21.0, 56.0, 55.0, 89.0, 95.0, 170.0, 247.0, 325.0, 495.0, 669.0, 992.0, 1345.0, 1897.0, 2919.0, 4197.0, 6206.0, 9213.0, 13656.0, 21210.0, 32872.0, 52543.0, 89270.0, 176638.0, 1325719.0, 145373.0, 77093.0, 46556.0, 29290.0, 18946.0, 12559.0, 8279.0, 5605.0, 3774.0, 2583.0, 1900.0, 1265.0, 891.0, 598.0, 439.0, 291.0, 233.0, 164.0, 98.0, 79.0, 55.0, 39.0, 29.0, 15.0, 14.0, 6.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.0496826171875, -0.04809904098510742, -0.046515464782714844, -0.044931888580322266, -0.04334831237792969, -0.04176473617553711, -0.04018115997314453, -0.03859758377075195, -0.037014007568359375, -0.0354304313659668, -0.03384685516357422, -0.03226327896118164, -0.030679702758789062, -0.029096126556396484, -0.027512550354003906, -0.025928974151611328, -0.02434539794921875, -0.022761821746826172, -0.021178245544433594, -0.019594669342041016, -0.018011093139648438, -0.01642751693725586, -0.014843940734863281, -0.013260364532470703, -0.011676788330078125, -0.010093212127685547, -0.008509635925292969, -0.006926059722900391, -0.0053424835205078125, -0.0037589073181152344, -0.0021753311157226562, -0.0005917549133300781, 0.0009918212890625, 0.002575397491455078, 0.004158973693847656, 0.005742549896240234, 0.0073261260986328125, 0.00890970230102539, 0.010493278503417969, 0.012076854705810547, 0.013660430908203125, 0.015244007110595703, 0.01682758331298828, 0.01841115951538086, 0.019994735717773438, 0.021578311920166016, 0.023161888122558594, 0.024745464324951172, 0.02632904052734375, 0.027912616729736328, 0.029496192932128906, 0.031079769134521484, 0.03266334533691406, 0.03424692153930664, 0.03583049774169922, 0.0374140739440918, 0.038997650146484375, 0.04058122634887695, 0.04216480255126953, 0.04374837875366211, 0.04533195495605469, 0.046915531158447266, 0.048499107360839844, 0.05008268356323242, 0.051666259765625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 6.0, 11.0, 8.0, 10.0, 12.0, 16.0, 15.0, 29.0, 23.0, 28.0, 37.0, 45.0, 69.0, 85.0, 114.0, 101.0, 78.0, 54.0, 57.0, 42.0, 25.0, 30.0, 25.0, 17.0, 17.0, 6.0, 6.0, 4.0, 4.0, 10.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.000667572021484375, -0.0006489977240562439, -0.0006304234266281128, -0.0006118491291999817, -0.0005932748317718506, -0.0005747005343437195, -0.0005561262369155884, -0.0005375519394874573, -0.0005189776420593262, -0.0005004033446311951, -0.00048182904720306396, -0.00046325474977493286, -0.00044468045234680176, -0.00042610615491867065, -0.00040753185749053955, -0.00038895756006240845, -0.00037038326263427734, -0.00035180896520614624, -0.00033323466777801514, -0.00031466037034988403, -0.00029608607292175293, -0.0002775117754936218, -0.0002589374780654907, -0.00024036318063735962, -0.00022178888320922852, -0.0002032145857810974, -0.0001846402883529663, -0.0001660659909248352, -0.0001474916934967041, -0.000128917396068573, -0.0001103430986404419, -9.176880121231079e-05, -7.319450378417969e-05, -5.4620206356048584e-05, -3.604590892791748e-05, -1.7471611499786377e-05, 1.1026859283447266e-06, 1.967698335647583e-05, 3.8251280784606934e-05, 5.682557821273804e-05, 7.539987564086914e-05, 9.397417306900024e-05, 0.00011254847049713135, 0.00013112276792526245, 0.00014969706535339355, 0.00016827136278152466, 0.00018684566020965576, 0.00020541995763778687, 0.00022399425506591797, 0.00024256855249404907, 0.0002611428499221802, 0.0002797171473503113, 0.0002982914447784424, 0.0003168657422065735, 0.0003354400396347046, 0.0003540143370628357, 0.0003725886344909668, 0.0003911629319190979, 0.000409737229347229, 0.0004283115267753601, 0.0004468858242034912, 0.0004654601216316223, 0.0004840344190597534, 0.0005026087164878845, 0.0005211830139160156]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 7.0, 6.0, 8.0, 6.0, 8.0, 22.0, 33.0, 40.0, 94.0, 168.0, 528.0, 2030.0, 9373.0, 55418.0, 637948.0, 300296.0, 34427.0, 6069.0, 1368.0, 364.0, 134.0, 66.0, 42.0, 24.0, 18.0, 15.0, 8.0, 9.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00795745849609375, -0.007681846618652344, -0.0074062347412109375, -0.007130622863769531, -0.006855010986328125, -0.006579399108886719, -0.0063037872314453125, -0.006028175354003906, -0.0057525634765625, -0.005476951599121094, -0.0052013397216796875, -0.004925727844238281, -0.004650115966796875, -0.004374504089355469, -0.0040988922119140625, -0.0038232803344726562, -0.00354766845703125, -0.0032720565795898438, -0.0029964447021484375, -0.0027208328247070312, -0.002445220947265625, -0.0021696090698242188, -0.0018939971923828125, -0.0016183853149414062, -0.0013427734375, -0.0010671615600585938, -0.0007915496826171875, -0.0005159378051757812, -0.000240325927734375, 3.528594970703125e-05, 0.0003108978271484375, 0.0005865097045898438, 0.00086212158203125, 0.0011377334594726562, 0.0014133453369140625, 0.0016889572143554688, 0.001964569091796875, 0.0022401809692382812, 0.0025157928466796875, 0.0027914047241210938, 0.0030670166015625, 0.0033426284790039062, 0.0036182403564453125, 0.0038938522338867188, 0.004169464111328125, 0.004445075988769531, 0.0047206878662109375, 0.004996299743652344, 0.00527191162109375, 0.005547523498535156, 0.0058231353759765625, 0.006098747253417969, 0.006374359130859375, 0.006649971008300781, 0.0069255828857421875, 0.007201194763183594, 0.007476806640625, 0.007752418518066406, 0.008028030395507812, 0.008303642272949219, 0.008579254150390625, 0.008854866027832031, 0.009130477905273438, 0.009406089782714844, 0.00968170166015625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 12.0, 134.0, 750.0, 104.0, 13.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002684985753148794, -0.0023683321196585894, -0.0020516784861683846, -0.0017350249690935016, -0.0014183713356032968, -0.001101717702113092, -0.000785064185038209, -0.00046841055154800415, -0.00015175691805779934, 0.00016489668632857502, 0.00048155029071494937, 0.0007982038659974933, 0.001114857499487698, 0.0014315111329779029, 0.0017481646500527859, 0.0020648182835429907, 0.0023814719170331955, 0.0026981255505234003, 0.003014779184013605, 0.0033314325846731663, 0.0036480864509940147, 0.003964739851653576, 0.004281393252313137, 0.0045980471186339855, 0.004914700984954834, 0.005231354385614395, 0.005548008251935244, 0.005864661652594805, 0.006181315518915653, 0.006497968919575214, 0.0068146223202347755, 0.007131276186555624, 0.007447929121553898, 0.007764582522213459, 0.00808123592287302, 0.008397890254855156, 0.008714543655514717, 0.009031197056174278, 0.00934785045683384, 0.0096645038574934, 0.009981158189475536, 0.010297811590135098, 0.010614464990794659, 0.010931119322776794, 0.011247772723436356, 0.011564426124095917, 0.011881079524755478, 0.012197732925415039, 0.0125143863260746, 0.012831039726734161, 0.013147693127393723, 0.013464347459375858, 0.01378100086003542, 0.01409765426069498, 0.014414307661354542, 0.014730961993336678, 0.015047615393996239, 0.0153642687946558, 0.01568092219531536, 0.015997575595974922, 0.016314228996634483, 0.016630884259939194, 0.016947537660598755, 0.017264191061258316, 0.017580844461917877]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 5.0, 24.0, 30.0, 38.0, 67.0, 76.0, 93.0, 99.0, 89.0, 97.0, 86.0, 62.0, 80.0, 49.0, 46.0, 28.0, 12.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013107657432556152, -0.0012807315215468407, -0.001250697299838066, -0.0012206630781292915, -0.001190628856420517, -0.0011605946347117424, -0.0011305604130029678, -0.0011005261912941933, -0.0010704919695854187, -0.0010404577478766441, -0.0010104235261678696, -0.000980389304459095, -0.0009503550827503204, -0.0009203208610415459, -0.0008902866393327713, -0.0008602524176239967, -0.0008302181959152222, -0.0008001839742064476, -0.000770149752497673, -0.0007401155307888985, -0.0007100813090801239, -0.0006800470873713493, -0.0006500128656625748, -0.0006199786439538002, -0.0005899444222450256, -0.0005599102005362511, -0.0005298759788274765, -0.0004998417571187019, -0.00046980753540992737, -0.0004397733137011528, -0.00040973909199237823, -0.00037970487028360367, -0.0003496706485748291, -0.00031963642686605453, -0.00028960220515727997, -0.0002595679834485054, -0.00022953376173973083, -0.00019949954003095627, -0.0001694653183221817, -0.00013943109661340714, -0.00010939687490463257, -7.9362653195858e-05, -4.9328431487083435e-05, -1.929420977830887e-05, 1.0740011930465698e-05, 4.0774233639240265e-05, 7.080845534801483e-05, 0.0001008426770567894, 0.00013087689876556396, 0.00016091112047433853, 0.0001909453421831131, 0.00022097956389188766, 0.00025101378560066223, 0.0002810480073094368, 0.00031108222901821136, 0.00034111645072698593, 0.0003711506724357605, 0.00040118489414453506, 0.00043121911585330963, 0.0004612533375620842, 0.0004912875592708588, 0.0005213217809796333, 0.0005513560026884079, 0.0005813902243971825, 0.000611424446105957]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 5.0, 3.0, 6.0, 12.0, 6.0, 9.0, 13.0, 19.0, 19.0, 12.0, 25.0, 35.0, 23.0, 40.0, 49.0, 40.0, 41.0, 41.0, 50.0, 49.0, 53.0, 49.0, 42.0, 49.0, 55.0, 31.0, 47.0, 28.0, 29.0, 20.0, 16.0, 13.0, 20.0, 10.0, 11.0, 6.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.95703125, -2.86669921875, -2.7763671875, -2.68603515625, -2.595703125, -2.50537109375, -2.4150390625, -2.32470703125, -2.234375, -2.14404296875, -2.0537109375, -1.96337890625, -1.873046875, -1.78271484375, -1.6923828125, -1.60205078125, -1.51171875, -1.42138671875, -1.3310546875, -1.24072265625, -1.150390625, -1.06005859375, -0.9697265625, -0.87939453125, -0.7890625, -0.69873046875, -0.6083984375, -0.51806640625, -0.427734375, -0.33740234375, -0.2470703125, -0.15673828125, -0.06640625, 0.02392578125, 0.1142578125, 0.20458984375, 0.294921875, 0.38525390625, 0.4755859375, 0.56591796875, 0.65625, 0.74658203125, 0.8369140625, 0.92724609375, 1.017578125, 1.10791015625, 1.1982421875, 1.28857421875, 1.37890625, 1.46923828125, 1.5595703125, 1.64990234375, 1.740234375, 1.83056640625, 1.9208984375, 2.01123046875, 2.1015625, 2.19189453125, 2.2822265625, 2.37255859375, 2.462890625, 2.55322265625, 2.6435546875, 2.73388671875, 2.82421875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 19.0, 17.0, 28.0, 38.0, 63.0, 162.0, 249.0, 480.0, 899.0, 1973.0, 4716.0, 13274.0, 43096.0, 156933.0, 510335.0, 226207.0, 61059.0, 17963.0, 6265.0, 2467.0, 1052.0, 565.0, 296.0, 142.0, 92.0, 63.0, 23.0, 20.0, 14.0, 8.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.578125, -7.37127685546875, -7.1644287109375, -6.95758056640625, -6.750732421875, -6.54388427734375, -6.3370361328125, -6.13018798828125, -5.92333984375, -5.71649169921875, -5.5096435546875, -5.30279541015625, -5.095947265625, -4.88909912109375, -4.6822509765625, -4.47540283203125, -4.2685546875, -4.06170654296875, -3.8548583984375, -3.64801025390625, -3.441162109375, -3.23431396484375, -3.0274658203125, -2.82061767578125, -2.61376953125, -2.40692138671875, -2.2000732421875, -1.99322509765625, -1.786376953125, -1.57952880859375, -1.3726806640625, -1.16583251953125, -0.958984375, -0.75213623046875, -0.5452880859375, -0.33843994140625, -0.131591796875, 0.07525634765625, 0.2821044921875, 0.48895263671875, 0.69580078125, 0.90264892578125, 1.1094970703125, 1.31634521484375, 1.523193359375, 1.73004150390625, 1.9368896484375, 2.14373779296875, 2.3505859375, 2.55743408203125, 2.7642822265625, 2.97113037109375, 3.177978515625, 3.38482666015625, 3.5916748046875, 3.79852294921875, 4.00537109375, 4.21221923828125, 4.4190673828125, 4.62591552734375, 4.832763671875, 5.03961181640625, 5.2464599609375, 5.45330810546875, 5.66015625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 1.0, 5.0, 6.0, 8.0, 4.0, 12.0, 10.0, 9.0, 27.0, 23.0, 23.0, 39.0, 28.0, 34.0, 43.0, 49.0, 60.0, 85.0, 127.0, 185.0, 1352.0, 230.0, 117.0, 100.0, 66.0, 57.0, 59.0, 31.0, 27.0, 45.0, 30.0, 23.0, 19.0, 22.0, 22.0, 13.0, 14.0, 12.0, 9.0, 6.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.53125, -8.2431640625, -7.955078125, -7.6669921875, -7.37890625, -7.0908203125, -6.802734375, -6.5146484375, -6.2265625, -5.9384765625, -5.650390625, -5.3623046875, -5.07421875, -4.7861328125, -4.498046875, -4.2099609375, -3.921875, -3.6337890625, -3.345703125, -3.0576171875, -2.76953125, -2.4814453125, -2.193359375, -1.9052734375, -1.6171875, -1.3291015625, -1.041015625, -0.7529296875, -0.46484375, -0.1767578125, 0.111328125, 0.3994140625, 0.6875, 0.9755859375, 1.263671875, 1.5517578125, 1.83984375, 2.1279296875, 2.416015625, 2.7041015625, 2.9921875, 3.2802734375, 3.568359375, 3.8564453125, 4.14453125, 4.4326171875, 4.720703125, 5.0087890625, 5.296875, 5.5849609375, 5.873046875, 6.1611328125, 6.44921875, 6.7373046875, 7.025390625, 7.3134765625, 7.6015625, 7.8896484375, 8.177734375, 8.4658203125, 8.75390625, 9.0419921875, 9.330078125, 9.6181640625, 9.90625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 10.0, 10.0, 24.0, 28.0, 34.0, 61.0, 68.0, 95.0, 185.0, 258.0, 457.0, 884.0, 2135.0, 6456.0, 33891.0, 471554.0, 2475907.0, 131024.0, 15443.0, 3858.0, 1504.0, 753.0, 380.0, 217.0, 143.0, 98.0, 47.0, 42.0, 29.0, 16.0, 15.0, 17.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-18.515625, -17.990966796875, -17.46630859375, -16.941650390625, -16.4169921875, -15.892333984375, -15.36767578125, -14.843017578125, -14.318359375, -13.793701171875, -13.26904296875, -12.744384765625, -12.2197265625, -11.695068359375, -11.17041015625, -10.645751953125, -10.12109375, -9.596435546875, -9.07177734375, -8.547119140625, -8.0224609375, -7.497802734375, -6.97314453125, -6.448486328125, -5.923828125, -5.399169921875, -4.87451171875, -4.349853515625, -3.8251953125, -3.300537109375, -2.77587890625, -2.251220703125, -1.7265625, -1.201904296875, -0.67724609375, -0.152587890625, 0.3720703125, 0.896728515625, 1.42138671875, 1.946044921875, 2.470703125, 2.995361328125, 3.52001953125, 4.044677734375, 4.5693359375, 5.093994140625, 5.61865234375, 6.143310546875, 6.66796875, 7.192626953125, 7.71728515625, 8.241943359375, 8.7666015625, 9.291259765625, 9.81591796875, 10.340576171875, 10.865234375, 11.389892578125, 11.91455078125, 12.439208984375, 12.9638671875, 13.488525390625, 14.01318359375, 14.537841796875, 15.0625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 14.0, 45.0, 83.0, 262.0, 267.0, 217.0, 89.0, 19.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.848533630371094, -31.134279251098633, -28.420024871826172, -25.705772399902344, -22.991518020629883, -20.277263641357422, -17.563011169433594, -14.848756790161133, -12.134502410888672, -9.420248031616211, -6.705994606018066, -3.991741180419922, -1.277486801147461, 1.436767578125, 4.151020050048828, 6.865274429321289, 9.57952880859375, 12.293783187866211, 15.008036613464355, 17.7222900390625, 20.43654441833496, 23.150798797607422, 25.86505126953125, 28.57930564880371, 31.293560028076172, 34.0078125, 36.722068786621094, 39.43632125854492, 42.15057373046875, 44.864830017089844, 47.57908248901367, 50.2933349609375, 53.007598876953125, 55.72185134887695, 58.43610763549805, 61.150360107421875, 63.86461639404297, 66.57887268066406, 69.29312133789062, 72.00737762451172, 74.72163391113281, 77.4358901977539, 80.15013885498047, 82.86439514160156, 85.57865142822266, 88.29290771484375, 91.00715637207031, 93.7214126586914, 96.43566131591797, 99.14991760253906, 101.86416625976562, 104.57842254638672, 107.29267883300781, 110.00692749023438, 112.72118377685547, 115.43544006347656, 118.14968872070312, 120.86394500732422, 123.57819366455078, 126.29244995117188, 129.00669860839844, 131.72096252441406, 134.43521118164062, 137.1494598388672, 139.8637237548828]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 3.0, 6.0, 9.0, 9.0, 8.0, 15.0, 13.0, 19.0, 19.0, 23.0, 23.0, 25.0, 29.0, 32.0, 34.0, 31.0, 23.0, 40.0, 41.0, 48.0, 39.0, 37.0, 36.0, 38.0, 30.0, 36.0, 36.0, 20.0, 32.0, 26.0, 25.0, 19.0, 24.0, 21.0, 16.0, 17.0, 20.0, 7.0, 12.0, 11.0, 6.0, 3.0, 8.0, 7.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.35373306274414, -24.54157257080078, -23.72941017150879, -22.91724967956543, -22.105087280273438, -21.292926788330078, -20.48076629638672, -19.668603897094727, -18.856443405151367, -18.044282913208008, -17.232120513916016, -16.419960021972656, -15.60779857635498, -14.795637130737305, -13.983475685119629, -13.171314239501953, -12.359152793884277, -11.546991348266602, -10.734829902648926, -9.92266845703125, -9.11050796508789, -8.298346519470215, -7.486185073852539, -6.6740241050720215, -5.861862659454346, -5.04970121383667, -4.237540245056152, -3.4253787994384766, -2.61321759223938, -1.8010563850402832, -0.9888949394226074, -0.17673397064208984, 0.6354274749755859, 1.4475886821746826, 2.2597498893737793, 3.071911334991455, 3.8840725421905518, 4.696233749389648, 5.508395195007324, 6.320556163787842, 7.132717609405518, 7.944879055023193, 8.757040023803711, 9.569201469421387, 10.381362915039062, 11.193523406982422, 12.005685806274414, 12.817846298217773, 13.63000774383545, 14.442169189453125, 15.2543306350708, 16.066492080688477, 16.878652572631836, 17.690814971923828, 18.502975463867188, 19.315135955810547, 20.12729835510254, 20.9394588470459, 21.75162124633789, 22.56378173828125, 23.375944137573242, 24.1881046295166, 25.000267028808594, 25.812427520751953, 26.624588012695312]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 12.0, 12.0, 17.0, 16.0, 19.0, 30.0, 27.0, 27.0, 28.0, 44.0, 38.0, 45.0, 48.0, 49.0, 55.0, 44.0, 54.0, 47.0, 37.0, 41.0, 35.0, 35.0, 36.0, 30.0, 31.0, 20.0, 11.0, 18.0, 12.0, 11.0, 7.0, 11.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.138671875, -3.043243408203125, -2.94781494140625, -2.852386474609375, -2.7569580078125, -2.661529541015625, -2.56610107421875, -2.470672607421875, -2.375244140625, -2.279815673828125, -2.18438720703125, -2.088958740234375, -1.9935302734375, -1.898101806640625, -1.80267333984375, -1.707244873046875, -1.61181640625, -1.516387939453125, -1.42095947265625, -1.325531005859375, -1.2301025390625, -1.134674072265625, -1.03924560546875, -0.943817138671875, -0.848388671875, -0.752960205078125, -0.65753173828125, -0.562103271484375, -0.4666748046875, -0.371246337890625, -0.27581787109375, -0.180389404296875, -0.0849609375, 0.010467529296875, 0.10589599609375, 0.201324462890625, 0.2967529296875, 0.392181396484375, 0.48760986328125, 0.583038330078125, 0.678466796875, 0.773895263671875, 0.86932373046875, 0.964752197265625, 1.0601806640625, 1.155609130859375, 1.25103759765625, 1.346466064453125, 1.44189453125, 1.537322998046875, 1.63275146484375, 1.728179931640625, 1.8236083984375, 1.919036865234375, 2.01446533203125, 2.109893798828125, 2.205322265625, 2.300750732421875, 2.39617919921875, 2.491607666015625, 2.5870361328125, 2.682464599609375, 2.77789306640625, 2.873321533203125, 2.96875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 10.0, 25.0, 23.0, 26.0, 47.0, 95.0, 107.0, 167.0, 293.0, 417.0, 679.0, 1202.0, 2217.0, 4334.0, 9773.0, 27206.0, 139078.0, 1457781.0, 2247907.0, 241964.0, 38458.0, 12147.0, 5058.0, 2364.0, 1172.0, 674.0, 368.0, 236.0, 151.0, 90.0, 74.0, 31.0, 27.0, 17.0, 11.0, 11.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.2890625, -10.00421142578125, -9.7193603515625, -9.43450927734375, -9.149658203125, -8.86480712890625, -8.5799560546875, -8.29510498046875, -8.01025390625, -7.72540283203125, -7.4405517578125, -7.15570068359375, -6.870849609375, -6.58599853515625, -6.3011474609375, -6.01629638671875, -5.7314453125, -5.44659423828125, -5.1617431640625, -4.87689208984375, -4.592041015625, -4.30718994140625, -4.0223388671875, -3.73748779296875, -3.45263671875, -3.16778564453125, -2.8829345703125, -2.59808349609375, -2.313232421875, -2.02838134765625, -1.7435302734375, -1.45867919921875, -1.173828125, -0.88897705078125, -0.6041259765625, -0.31927490234375, -0.034423828125, 0.25042724609375, 0.5352783203125, 0.82012939453125, 1.10498046875, 1.38983154296875, 1.6746826171875, 1.95953369140625, 2.244384765625, 2.52923583984375, 2.8140869140625, 3.09893798828125, 3.3837890625, 3.66864013671875, 3.9534912109375, 4.23834228515625, 4.523193359375, 4.80804443359375, 5.0928955078125, 5.37774658203125, 5.66259765625, 5.94744873046875, 6.2322998046875, 6.51715087890625, 6.802001953125, 7.08685302734375, 7.3717041015625, 7.65655517578125, 7.94140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 6.0, 9.0, 5.0, 16.0, 13.0, 22.0, 28.0, 35.0, 70.0, 112.0, 169.0, 242.0, 363.0, 493.0, 621.0, 538.0, 409.0, 303.0, 190.0, 135.0, 70.0, 63.0, 44.0, 26.0, 20.0, 14.0, 10.0, 11.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.2890625, -7.035400390625, -6.78173828125, -6.528076171875, -6.2744140625, -6.020751953125, -5.76708984375, -5.513427734375, -5.259765625, -5.006103515625, -4.75244140625, -4.498779296875, -4.2451171875, -3.991455078125, -3.73779296875, -3.484130859375, -3.23046875, -2.976806640625, -2.72314453125, -2.469482421875, -2.2158203125, -1.962158203125, -1.70849609375, -1.454833984375, -1.201171875, -0.947509765625, -0.69384765625, -0.440185546875, -0.1865234375, 0.067138671875, 0.32080078125, 0.574462890625, 0.828125, 1.081787109375, 1.33544921875, 1.589111328125, 1.8427734375, 2.096435546875, 2.35009765625, 2.603759765625, 2.857421875, 3.111083984375, 3.36474609375, 3.618408203125, 3.8720703125, 4.125732421875, 4.37939453125, 4.633056640625, 4.88671875, 5.140380859375, 5.39404296875, 5.647705078125, 5.9013671875, 6.155029296875, 6.40869140625, 6.662353515625, 6.916015625, 7.169677734375, 7.42333984375, 7.677001953125, 7.9306640625, 8.184326171875, 8.43798828125, 8.691650390625, 8.9453125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 6.0, 5.0, 13.0, 12.0, 13.0, 35.0, 48.0, 56.0, 95.0, 184.0, 342.0, 626.0, 1453.0, 3699.0, 11632.0, 60272.0, 994363.0, 2912691.0, 176357.0, 22148.0, 6103.0, 2173.0, 931.0, 428.0, 216.0, 131.0, 72.0, 43.0, 34.0, 31.0, 16.0, 14.0, 11.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.8704833984375, -18.319091796875, -17.7677001953125, -17.21630859375, -16.6649169921875, -16.113525390625, -15.5621337890625, -15.0107421875, -14.4593505859375, -13.907958984375, -13.3565673828125, -12.80517578125, -12.2537841796875, -11.702392578125, -11.1510009765625, -10.599609375, -10.0482177734375, -9.496826171875, -8.9454345703125, -8.39404296875, -7.8426513671875, -7.291259765625, -6.7398681640625, -6.1884765625, -5.6370849609375, -5.085693359375, -4.5343017578125, -3.98291015625, -3.4315185546875, -2.880126953125, -2.3287353515625, -1.77734375, -1.2259521484375, -0.674560546875, -0.1231689453125, 0.42822265625, 0.9796142578125, 1.531005859375, 2.0823974609375, 2.6337890625, 3.1851806640625, 3.736572265625, 4.2879638671875, 4.83935546875, 5.3907470703125, 5.942138671875, 6.4935302734375, 7.044921875, 7.5963134765625, 8.147705078125, 8.6990966796875, 9.25048828125, 9.8018798828125, 10.353271484375, 10.9046630859375, 11.4560546875, 12.0074462890625, 12.558837890625, 13.1102294921875, 13.66162109375, 14.2130126953125, 14.764404296875, 15.3157958984375, 15.8671875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 15.0, 10.0, 33.0, 43.0, 66.0, 78.0, 100.0, 103.0, 106.0, 114.0, 93.0, 65.0, 51.0, 45.0, 25.0, 17.0, 9.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.406036376953125, -48.03774642944336, -46.66946029663086, -45.301170349121094, -43.932884216308594, -42.56459426879883, -41.19630432128906, -39.82801818847656, -38.4597282409668, -37.09143829345703, -35.72315216064453, -34.354862213134766, -32.986572265625, -31.6182861328125, -30.249996185302734, -28.8817081451416, -27.51342010498047, -26.145132064819336, -24.776844024658203, -23.408554077148438, -22.040266036987305, -20.671977996826172, -19.303688049316406, -17.935400009155273, -16.56711196899414, -15.198823928833008, -13.830534934997559, -12.46224594116211, -11.093957901000977, -9.725669860839844, -8.357380867004395, -6.989091873168945, -5.620807647705078, -4.252519130706787, -2.884230613708496, -1.515942096710205, -0.14765357971191406, 1.220634937286377, 2.588923454284668, 3.957212448120117, 5.32550048828125, 6.693789005279541, 8.062077522277832, 9.430366516113281, 10.798654556274414, 12.166942596435547, 13.535231590270996, 14.903520584106445, 16.271808624267578, 17.64009666442871, 19.008384704589844, 20.37667465209961, 21.744962692260742, 23.113250732421875, 24.48154067993164, 25.849828720092773, 27.218116760253906, 28.58640480041504, 29.954692840576172, 31.322982788085938, 32.69126892089844, 34.0595588684082, 35.42784881591797, 36.79613494873047, 38.164424896240234]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 14.0, 10.0, 9.0, 17.0, 15.0, 18.0, 17.0, 15.0, 21.0, 24.0, 24.0, 33.0, 36.0, 29.0, 33.0, 43.0, 40.0, 32.0, 28.0, 35.0, 32.0, 37.0, 40.0, 37.0, 46.0, 32.0, 39.0, 29.0, 24.0, 28.0, 24.0, 20.0, 19.0, 10.0, 14.0, 9.0, 13.0, 16.0, 11.0, 9.0, 8.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.156085968017578, -25.404306411743164, -24.652524948120117, -23.900745391845703, -23.14896583557129, -22.397184371948242, -21.645404815673828, -20.89362335205078, -20.141843795776367, -19.390064239501953, -18.638282775878906, -17.886503219604492, -17.134723663330078, -16.38294219970703, -15.631162643432617, -14.879382133483887, -14.127602577209473, -13.375822067260742, -12.624042510986328, -11.872262001037598, -11.120481491088867, -10.368701934814453, -9.616921424865723, -8.865140914916992, -8.113361358642578, -7.361581325531006, -6.609800815582275, -5.858020782470703, -5.106240272521973, -4.3544602394104, -3.602680206298828, -2.8508996963500977, -2.099119186401367, -1.3473389148712158, -0.595558762550354, 0.1562213897705078, 0.9080016613006592, 1.6597819328308105, 2.411561965942383, 3.1633424758911133, 3.9151225090026855, 4.666902542114258, 5.418683052062988, 6.1704630851745605, 6.922243118286133, 7.674023628234863, 8.425804138183594, 9.177583694458008, 9.929364204406738, 10.681144714355469, 11.432924270629883, 12.184704780578613, 12.936485290527344, 13.688264846801758, 14.440045356750488, 15.191825866699219, 15.943605422973633, 16.695384979248047, 17.447166442871094, 18.198945999145508, 18.950725555419922, 19.70250701904297, 20.454286575317383, 21.206066131591797, 21.957847595214844]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0, 8.0, 5.0, 1.0, 5.0, 11.0, 14.0, 12.0, 19.0, 22.0, 23.0, 27.0, 31.0, 42.0, 29.0, 40.0, 43.0, 37.0, 60.0, 54.0, 46.0, 35.0, 42.0, 61.0, 36.0, 49.0, 32.0, 49.0, 25.0, 24.0, 20.0, 26.0, 11.0, 19.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.107421875, -3.0081787109375, -2.908935546875, -2.8096923828125, -2.71044921875, -2.6112060546875, -2.511962890625, -2.4127197265625, -2.3134765625, -2.2142333984375, -2.114990234375, -2.0157470703125, -1.91650390625, -1.8172607421875, -1.718017578125, -1.6187744140625, -1.51953125, -1.4202880859375, -1.321044921875, -1.2218017578125, -1.12255859375, -1.0233154296875, -0.924072265625, -0.8248291015625, -0.7255859375, -0.6263427734375, -0.527099609375, -0.4278564453125, -0.32861328125, -0.2293701171875, -0.130126953125, -0.0308837890625, 0.068359375, 0.1676025390625, 0.266845703125, 0.3660888671875, 0.46533203125, 0.5645751953125, 0.663818359375, 0.7630615234375, 0.8623046875, 0.9615478515625, 1.060791015625, 1.1600341796875, 1.25927734375, 1.3585205078125, 1.457763671875, 1.5570068359375, 1.65625, 1.7554931640625, 1.854736328125, 1.9539794921875, 2.05322265625, 2.1524658203125, 2.251708984375, 2.3509521484375, 2.4501953125, 2.5494384765625, 2.648681640625, 2.7479248046875, 2.84716796875, 2.9464111328125, 3.045654296875, 3.1448974609375, 3.244140625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 13.0, 19.0, 20.0, 52.0, 68.0, 93.0, 128.0, 208.0, 307.0, 483.0, 693.0, 1033.0, 1606.0, 2451.0, 3652.0, 5676.0, 8713.0, 13744.0, 21105.0, 33493.0, 56761.0, 101764.0, 241199.0, 279582.0, 113250.0, 61446.0, 36416.0, 22868.0, 14570.0, 9430.0, 6098.0, 3970.0, 2603.0, 1708.0, 1114.0, 718.0, 512.0, 320.0, 230.0, 142.0, 95.0, 71.0, 46.0, 24.0, 19.0, 14.0, 13.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1541748046875, -0.14965057373046875, -0.1451263427734375, -0.14060211181640625, -0.136077880859375, -0.13155364990234375, -0.1270294189453125, -0.12250518798828125, -0.11798095703125, -0.11345672607421875, -0.1089324951171875, -0.10440826416015625, -0.099884033203125, -0.09535980224609375, -0.0908355712890625, -0.08631134033203125, -0.081787109375, -0.07726287841796875, -0.0727386474609375, -0.06821441650390625, -0.063690185546875, -0.05916595458984375, -0.0546417236328125, -0.05011749267578125, -0.04559326171875, -0.04106903076171875, -0.0365447998046875, -0.03202056884765625, -0.027496337890625, -0.02297210693359375, -0.0184478759765625, -0.01392364501953125, -0.0093994140625, -0.00487518310546875, -0.0003509521484375, 0.00417327880859375, 0.008697509765625, 0.01322174072265625, 0.0177459716796875, 0.02227020263671875, 0.02679443359375, 0.03131866455078125, 0.0358428955078125, 0.04036712646484375, 0.044891357421875, 0.04941558837890625, 0.0539398193359375, 0.05846405029296875, 0.06298828125, 0.06751251220703125, 0.0720367431640625, 0.07656097412109375, 0.081085205078125, 0.08560943603515625, 0.0901336669921875, 0.09465789794921875, 0.09918212890625, 0.10370635986328125, 0.1082305908203125, 0.11275482177734375, 0.117279052734375, 0.12180328369140625, 0.1263275146484375, 0.13085174560546875, 0.1353759765625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 2.0, 8.0, 7.0, 11.0, 16.0, 15.0, 8.0, 16.0, 17.0, 32.0, 19.0, 26.0, 25.0, 40.0, 43.0, 29.0, 36.0, 43.0, 34.0, 37.0, 1066.0, 42.0, 38.0, 50.0, 41.0, 29.0, 40.0, 36.0, 39.0, 24.0, 22.0, 14.0, 21.0, 11.0, 12.0, 11.0, 15.0, 7.0, 7.0, 7.0, 4.0, 7.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.298828125, -2.22186279296875, -2.1448974609375, -2.06793212890625, -1.990966796875, -1.91400146484375, -1.8370361328125, -1.76007080078125, -1.68310546875, -1.60614013671875, -1.5291748046875, -1.45220947265625, -1.375244140625, -1.29827880859375, -1.2213134765625, -1.14434814453125, -1.0673828125, -0.99041748046875, -0.9134521484375, -0.83648681640625, -0.759521484375, -0.68255615234375, -0.6055908203125, -0.52862548828125, -0.45166015625, -0.37469482421875, -0.2977294921875, -0.22076416015625, -0.143798828125, -0.06683349609375, 0.0101318359375, 0.08709716796875, 0.1640625, 0.24102783203125, 0.3179931640625, 0.39495849609375, 0.471923828125, 0.54888916015625, 0.6258544921875, 0.70281982421875, 0.77978515625, 0.85675048828125, 0.9337158203125, 1.01068115234375, 1.087646484375, 1.16461181640625, 1.2415771484375, 1.31854248046875, 1.3955078125, 1.47247314453125, 1.5494384765625, 1.62640380859375, 1.703369140625, 1.78033447265625, 1.8572998046875, 1.93426513671875, 2.01123046875, 2.08819580078125, 2.1651611328125, 2.24212646484375, 2.319091796875, 2.39605712890625, 2.4730224609375, 2.54998779296875, 2.626953125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 10.0, 22.0, 18.0, 19.0, 25.0, 53.0, 60.0, 103.0, 142.0, 147.0, 235.0, 322.0, 464.0, 619.0, 923.0, 1232.0, 1923.0, 2685.0, 3877.0, 5452.0, 7873.0, 12008.0, 17751.0, 26737.0, 40833.0, 65781.0, 116257.0, 1170532.0, 334786.0, 107504.0, 61664.0, 38815.0, 25357.0, 16509.0, 11107.0, 7859.0, 5189.0, 3595.0, 2455.0, 1743.0, 1256.0, 896.0, 686.0, 469.0, 327.0, 254.0, 149.0, 125.0, 90.0, 55.0, 32.0, 35.0, 26.0, 14.0, 10.0, 9.0, 9.0, 7.0, 4.0], "bins": [-0.05206298828125, -0.05048227310180664, -0.04890155792236328, -0.04732084274291992, -0.04574012756347656, -0.0441594123840332, -0.042578697204589844, -0.040997982025146484, -0.039417266845703125, -0.037836551666259766, -0.036255836486816406, -0.03467512130737305, -0.03309440612792969, -0.03151369094848633, -0.02993297576904297, -0.02835226058959961, -0.02677154541015625, -0.02519083023071289, -0.02361011505126953, -0.022029399871826172, -0.020448684692382812, -0.018867969512939453, -0.017287254333496094, -0.015706539154052734, -0.014125823974609375, -0.012545108795166016, -0.010964393615722656, -0.009383678436279297, -0.0078029632568359375, -0.006222248077392578, -0.004641532897949219, -0.0030608177185058594, -0.0014801025390625, 0.00010061264038085938, 0.0016813278198242188, 0.003262042999267578, 0.0048427581787109375, 0.006423473358154297, 0.008004188537597656, 0.009584903717041016, 0.011165618896484375, 0.012746334075927734, 0.014327049255371094, 0.015907764434814453, 0.017488479614257812, 0.019069194793701172, 0.02064990997314453, 0.02223062515258789, 0.02381134033203125, 0.02539205551147461, 0.02697277069091797, 0.028553485870361328, 0.030134201049804688, 0.03171491622924805, 0.033295631408691406, 0.034876346588134766, 0.036457061767578125, 0.038037776947021484, 0.039618492126464844, 0.0411992073059082, 0.04277992248535156, 0.04436063766479492, 0.04594135284423828, 0.04752206802368164, 0.049102783203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 6.0, 13.0, 15.0, 7.0, 9.0, 27.0, 13.0, 27.0, 41.0, 42.0, 39.0, 46.0, 74.0, 118.0, 120.0, 73.0, 51.0, 37.0, 43.0, 35.0, 25.0, 23.0, 27.0, 22.0, 11.0, 12.0, 6.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00070953369140625, -0.000684201717376709, -0.000658869743347168, -0.000633537769317627, -0.0006082057952880859, -0.0005828738212585449, -0.0005575418472290039, -0.0005322098731994629, -0.0005068778991699219, -0.00048154592514038086, -0.00045621395111083984, -0.00043088197708129883, -0.0004055500030517578, -0.0003802180290222168, -0.0003548860549926758, -0.00032955408096313477, -0.00030422210693359375, -0.00027889013290405273, -0.0002535581588745117, -0.0002282261848449707, -0.0002028942108154297, -0.00017756223678588867, -0.00015223026275634766, -0.00012689828872680664, -0.00010156631469726562, -7.623434066772461e-05, -5.0902366638183594e-05, -2.5570392608642578e-05, -2.384185791015625e-07, 2.5093555450439453e-05, 5.042552947998047e-05, 7.575750350952148e-05, 0.0001010894775390625, 0.00012642145156860352, 0.00015175342559814453, 0.00017708539962768555, 0.00020241737365722656, 0.00022774934768676758, 0.0002530813217163086, 0.0002784132957458496, 0.0003037452697753906, 0.00032907724380493164, 0.00035440921783447266, 0.00037974119186401367, 0.0004050731658935547, 0.0004304051399230957, 0.0004557371139526367, 0.00048106908798217773, 0.0005064010620117188, 0.0005317330360412598, 0.0005570650100708008, 0.0005823969841003418, 0.0006077289581298828, 0.0006330609321594238, 0.0006583929061889648, 0.0006837248802185059, 0.0007090568542480469, 0.0007343888282775879, 0.0007597208023071289, 0.0007850527763366699, 0.0008103847503662109, 0.000835716724395752, 0.000861048698425293, 0.000886380672454834, 0.000911712646484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 8.0, 12.0, 5.0, 14.0, 20.0, 26.0, 32.0, 32.0, 57.0, 102.0, 175.0, 671.0, 8313.0, 449726.0, 578541.0, 9465.0, 793.0, 227.0, 100.0, 64.0, 43.0, 20.0, 25.0, 12.0, 12.0, 14.0, 10.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0154571533203125, -0.015027999877929688, -0.014598846435546875, -0.014169692993164062, -0.01374053955078125, -0.013311386108398438, -0.012882232666015625, -0.012453079223632812, -0.01202392578125, -0.011594772338867188, -0.011165618896484375, -0.010736465454101562, -0.01030731201171875, -0.009878158569335938, -0.009449005126953125, -0.009019851684570312, -0.0085906982421875, -0.008161544799804688, -0.007732391357421875, -0.0073032379150390625, -0.00687408447265625, -0.0064449310302734375, -0.006015777587890625, -0.0055866241455078125, -0.005157470703125, -0.0047283172607421875, -0.004299163818359375, -0.0038700103759765625, -0.00344085693359375, -0.0030117034912109375, -0.002582550048828125, -0.0021533966064453125, -0.0017242431640625, -0.0012950897216796875, -0.000865936279296875, -0.0004367828369140625, -7.62939453125e-06, 0.0004215240478515625, 0.000850677490234375, 0.0012798309326171875, 0.001708984375, 0.0021381378173828125, 0.002567291259765625, 0.0029964447021484375, 0.00342559814453125, 0.0038547515869140625, 0.004283905029296875, 0.0047130584716796875, 0.0051422119140625, 0.0055713653564453125, 0.006000518798828125, 0.0064296722412109375, 0.00685882568359375, 0.0072879791259765625, 0.007717132568359375, 0.008146286010742188, 0.008575439453125, 0.009004592895507812, 0.009433746337890625, 0.009862899780273438, 0.01029205322265625, 0.010721206665039062, 0.011150360107421875, 0.011579513549804688, 0.0120086669921875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 12.0, 485.0, 503.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022504893131554127, -0.001876032561995089, -0.0015015758108347654, -0.00112711894325912, -0.0007526621920987964, -0.00037820544093847275, -3.748573362827301e-06, 0.0003707080613821745, 0.0007451649289578199, 0.0011196216801181436, 0.0014940784312784672, 0.0018685352988541126, 0.002242992166429758, 0.00261744880117476, 0.0029919056687504053, 0.003366362303495407, 0.0037408191710710526, 0.004115276038646698, 0.0044897329062223434, 0.004864189773797989, 0.005238646175712347, 0.0056131030432879925, 0.005987559910863638, 0.006362016312777996, 0.0067364731803536415, 0.007110930047929287, 0.007485386915504932, 0.007859843783080578, 0.008234300650656223, 0.008608756586909294, 0.00898321345448494, 0.009357670322060585, 0.009732128120958805, 0.01010658498853445, 0.010481041856110096, 0.010855498723685741, 0.011229955591261387, 0.011604411527514458, 0.011978868395090103, 0.012353325262665749, 0.012727782130241394, 0.01310223899781704, 0.013476695865392685, 0.01385115273296833, 0.014225609600543976, 0.014600066468119621, 0.014974523335695267, 0.015348979271948338, 0.015723437070846558, 0.016097893938422203, 0.01647235080599785, 0.016846807673573494, 0.01722126454114914, 0.017595721408724785, 0.01797017827630043, 0.018344635143876076, 0.018719090148806572, 0.019093547016382217, 0.019468003883957863, 0.01984246075153351, 0.020216917619109154, 0.0205913744866848, 0.020965831354260445, 0.02134028822183609, 0.021714745089411736]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 5.0, 8.0, 9.0, 18.0, 19.0, 32.0, 38.0, 50.0, 47.0, 65.0, 65.0, 76.0, 59.0, 71.0, 78.0, 89.0, 61.0, 47.0, 42.0, 36.0, 18.0, 19.0, 19.0, 15.0, 6.0, 10.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001292884349822998, -0.0012626098468899727, -0.0012323353439569473, -0.001202060841023922, -0.0011717863380908966, -0.0011415118351578712, -0.0011112373322248459, -0.0010809628292918205, -0.0010506883263587952, -0.0010204138234257698, -0.0009901393204927444, -0.0009598648175597191, -0.0009295903146266937, -0.0008993158116936684, -0.000869041308760643, -0.0008387668058276176, -0.0008084923028945923, -0.0007782177999615669, -0.0007479432970285416, -0.0007176687940955162, -0.0006873942911624908, -0.0006571197882294655, -0.0006268452852964401, -0.0005965707823634148, -0.0005662962794303894, -0.000536021776497364, -0.0005057472735643387, -0.0004754727706313133, -0.00044519826769828796, -0.0004149237647652626, -0.00038464926183223724, -0.0003543747588992119, -0.0003241002559661865, -0.00029382575303316116, -0.0002635512501001358, -0.00023327674716711044, -0.00020300224423408508, -0.00017272774130105972, -0.00014245323836803436, -0.000112178735435009, -8.190423250198364e-05, -5.162972956895828e-05, -2.1355226635932922e-05, 8.919276297092438e-06, 3.91937792301178e-05, 6.946828216314316e-05, 9.974278509616852e-05, 0.00013001728802919388, 0.00016029179096221924, 0.0001905662938952446, 0.00022084079682826996, 0.0002511152997612953, 0.0002813898026943207, 0.00031166430562734604, 0.0003419388085603714, 0.00037221331149339676, 0.0004024878144264221, 0.0004327623173594475, 0.00046303682029247284, 0.0004933113232254982, 0.0005235858261585236, 0.0005538603290915489, 0.0005841348320245743, 0.0006144093349575996, 0.000644683837890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0, 8.0, 5.0, 1.0, 5.0, 11.0, 14.0, 12.0, 19.0, 22.0, 24.0, 26.0, 31.0, 42.0, 29.0, 40.0, 43.0, 37.0, 60.0, 54.0, 46.0, 35.0, 42.0, 61.0, 36.0, 49.0, 32.0, 49.0, 25.0, 24.0, 20.0, 26.0, 11.0, 19.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.107421875, -3.0081787109375, -2.908935546875, -2.8096923828125, -2.71044921875, -2.6112060546875, -2.511962890625, -2.4127197265625, -2.3134765625, -2.2142333984375, -2.114990234375, -2.0157470703125, -1.91650390625, -1.8172607421875, -1.718017578125, -1.6187744140625, -1.51953125, -1.4202880859375, -1.321044921875, -1.2218017578125, -1.12255859375, -1.0233154296875, -0.924072265625, -0.8248291015625, -0.7255859375, -0.6263427734375, -0.527099609375, -0.4278564453125, -0.32861328125, -0.2293701171875, -0.130126953125, -0.0308837890625, 0.068359375, 0.1676025390625, 0.266845703125, 0.3660888671875, 0.46533203125, 0.5645751953125, 0.663818359375, 0.7630615234375, 0.8623046875, 0.9615478515625, 1.060791015625, 1.1600341796875, 1.25927734375, 1.3585205078125, 1.457763671875, 1.5570068359375, 1.65625, 1.7554931640625, 1.854736328125, 1.9539794921875, 2.05322265625, 2.1524658203125, 2.251708984375, 2.3509521484375, 2.4501953125, 2.5494384765625, 2.648681640625, 2.7479248046875, 2.84716796875, 2.9464111328125, 3.045654296875, 3.1448974609375, 3.244140625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 9.0, 10.0, 11.0, 17.0, 39.0, 46.0, 81.0, 115.0, 202.0, 367.0, 691.0, 1319.0, 2844.0, 6723.0, 19350.0, 75653.0, 466056.0, 383934.0, 63006.0, 16792.0, 6000.0, 2576.0, 1236.0, 621.0, 321.0, 200.0, 121.0, 86.0, 32.0, 29.0, 19.0, 17.0, 13.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.2568359375, -10.880859375, -10.5048828125, -10.12890625, -9.7529296875, -9.376953125, -9.0009765625, -8.625, -8.2490234375, -7.873046875, -7.4970703125, -7.12109375, -6.7451171875, -6.369140625, -5.9931640625, -5.6171875, -5.2412109375, -4.865234375, -4.4892578125, -4.11328125, -3.7373046875, -3.361328125, -2.9853515625, -2.609375, -2.2333984375, -1.857421875, -1.4814453125, -1.10546875, -0.7294921875, -0.353515625, 0.0224609375, 0.3984375, 0.7744140625, 1.150390625, 1.5263671875, 1.90234375, 2.2783203125, 2.654296875, 3.0302734375, 3.40625, 3.7822265625, 4.158203125, 4.5341796875, 4.91015625, 5.2861328125, 5.662109375, 6.0380859375, 6.4140625, 6.7900390625, 7.166015625, 7.5419921875, 7.91796875, 8.2939453125, 8.669921875, 9.0458984375, 9.421875, 9.7978515625, 10.173828125, 10.5498046875, 10.92578125, 11.3017578125, 11.677734375, 12.0537109375, 12.4296875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 6.0, 13.0, 15.0, 13.0, 11.0, 22.0, 12.0, 33.0, 43.0, 32.0, 41.0, 45.0, 60.0, 101.0, 138.0, 208.0, 1313.0, 249.0, 177.0, 98.0, 74.0, 60.0, 40.0, 40.0, 34.0, 32.0, 23.0, 8.0, 19.0, 20.0, 10.0, 11.0, 13.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.20654296875, -8.8974609375, -8.58837890625, -8.279296875, -7.97021484375, -7.6611328125, -7.35205078125, -7.04296875, -6.73388671875, -6.4248046875, -6.11572265625, -5.806640625, -5.49755859375, -5.1884765625, -4.87939453125, -4.5703125, -4.26123046875, -3.9521484375, -3.64306640625, -3.333984375, -3.02490234375, -2.7158203125, -2.40673828125, -2.09765625, -1.78857421875, -1.4794921875, -1.17041015625, -0.861328125, -0.55224609375, -0.2431640625, 0.06591796875, 0.375, 0.68408203125, 0.9931640625, 1.30224609375, 1.611328125, 1.92041015625, 2.2294921875, 2.53857421875, 2.84765625, 3.15673828125, 3.4658203125, 3.77490234375, 4.083984375, 4.39306640625, 4.7021484375, 5.01123046875, 5.3203125, 5.62939453125, 5.9384765625, 6.24755859375, 6.556640625, 6.86572265625, 7.1748046875, 7.48388671875, 7.79296875, 8.10205078125, 8.4111328125, 8.72021484375, 9.029296875, 9.33837890625, 9.6474609375, 9.95654296875, 10.265625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 9.0, 15.0, 8.0, 14.0, 13.0, 21.0, 29.0, 31.0, 41.0, 61.0, 101.0, 169.0, 293.0, 629.0, 1467.0, 4089.0, 13232.0, 74066.0, 1477895.0, 1478421.0, 74509.0, 13687.0, 4047.0, 1478.0, 605.0, 288.0, 132.0, 97.0, 62.0, 46.0, 33.0, 21.0, 13.0, 17.0, 11.0, 12.0, 9.0, 5.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.234375, -15.72705078125, -15.2197265625, -14.71240234375, -14.205078125, -13.69775390625, -13.1904296875, -12.68310546875, -12.17578125, -11.66845703125, -11.1611328125, -10.65380859375, -10.146484375, -9.63916015625, -9.1318359375, -8.62451171875, -8.1171875, -7.60986328125, -7.1025390625, -6.59521484375, -6.087890625, -5.58056640625, -5.0732421875, -4.56591796875, -4.05859375, -3.55126953125, -3.0439453125, -2.53662109375, -2.029296875, -1.52197265625, -1.0146484375, -0.50732421875, 0.0, 0.50732421875, 1.0146484375, 1.52197265625, 2.029296875, 2.53662109375, 3.0439453125, 3.55126953125, 4.05859375, 4.56591796875, 5.0732421875, 5.58056640625, 6.087890625, 6.59521484375, 7.1025390625, 7.60986328125, 8.1171875, 8.62451171875, 9.1318359375, 9.63916015625, 10.146484375, 10.65380859375, 11.1611328125, 11.66845703125, 12.17578125, 12.68310546875, 13.1904296875, 13.69775390625, 14.205078125, 14.71240234375, 15.2197265625, 15.72705078125, 16.234375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 15.0, 20.0, 40.0, 68.0, 100.0, 125.0, 147.0, 134.0, 132.0, 82.0, 54.0, 45.0, 19.0, 12.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.56389045715332, -15.25368881225586, -13.943486213684082, -12.633284568786621, -11.323081970214844, -10.012880325317383, -8.702678680419922, -7.3924760818481445, -6.082274436950684, -4.7720723152160645, -3.4618704319000244, -2.1516685485839844, -0.8414664268493652, 0.4687356948852539, 1.7789373397827148, 3.089139938354492, 4.399341583251953, 5.709543704986572, 7.019745826721191, 8.329947471618652, 9.64015007019043, 10.95035171508789, 12.260553359985352, 13.570755958557129, 14.88095760345459, 16.191160202026367, 17.501361846923828, 18.81156349182129, 20.12176513671875, 21.431968688964844, 22.742168426513672, 24.052371978759766, 25.36257553100586, 26.67277717590332, 27.98297882080078, 29.293182373046875, 30.603384017944336, 31.913585662841797, 33.223785400390625, 34.53398895263672, 35.84419250488281, 37.154396057128906, 38.464595794677734, 39.77479934692383, 41.084999084472656, 42.39520263671875, 43.705406188964844, 45.01560592651367, 46.3258056640625, 47.636009216308594, 48.94620895385742, 50.256412506103516, 51.566612243652344, 52.87681579589844, 54.18701934814453, 55.49721908569336, 56.80742263793945, 58.11762619018555, 59.427825927734375, 60.73802947998047, 62.0482292175293, 63.35843276977539, 64.66863250732422, 65.97883605957031, 67.2890396118164]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 9.0, 11.0, 17.0, 14.0, 14.0, 23.0, 27.0, 27.0, 25.0, 24.0, 26.0, 30.0, 37.0, 47.0, 47.0, 45.0, 46.0, 40.0, 43.0, 48.0, 36.0, 48.0, 30.0, 40.0, 32.0, 20.0, 31.0, 26.0, 18.0, 16.0, 13.0, 11.0, 9.0, 13.0, 8.0, 12.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.860036849975586, -28.899385452270508, -27.93873405456543, -26.97808074951172, -26.01742935180664, -25.056777954101562, -24.096126556396484, -23.135475158691406, -22.174823760986328, -21.21417236328125, -20.253520965576172, -19.292869567871094, -18.332216262817383, -17.371564865112305, -16.410913467407227, -15.450262069702148, -14.489608764648438, -13.52895736694336, -12.568305015563965, -11.607653617858887, -10.647001266479492, -9.686349868774414, -8.725698471069336, -7.7650465965271, -6.804394721984863, -5.843742847442627, -4.883090972900391, -3.9224395751953125, -2.961787700653076, -2.00113582611084, -1.0404844284057617, -0.07983255386352539, 0.8808174133300781, 1.841469168663025, 2.8021209239959717, 3.762772560119629, 4.723424434661865, 5.684076309204102, 6.64472770690918, 7.605379581451416, 8.566031455993652, 9.52668285369873, 10.487335205078125, 11.447986602783203, 12.408638000488281, 13.369290351867676, 14.329941749572754, 15.290594100952148, 16.251245498657227, 17.211896896362305, 18.172548294067383, 19.133201599121094, 20.093852996826172, 21.05450439453125, 22.015155792236328, 22.975807189941406, 23.936458587646484, 24.897109985351562, 25.85776138305664, 26.81841278076172, 27.77906608581543, 28.739717483520508, 29.700368881225586, 30.661020278930664, 31.621673583984375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 1.0, 6.0, 15.0, 23.0, 17.0, 19.0, 22.0, 22.0, 50.0, 21.0, 35.0, 32.0, 40.0, 38.0, 49.0, 53.0, 49.0, 38.0, 46.0, 37.0, 50.0, 48.0, 36.0, 39.0, 37.0, 30.0, 24.0, 20.0, 19.0, 7.0, 13.0, 9.0, 8.0, 8.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.486328125, -3.382415771484375, -3.27850341796875, -3.174591064453125, -3.0706787109375, -2.966766357421875, -2.86285400390625, -2.758941650390625, -2.655029296875, -2.551116943359375, -2.44720458984375, -2.343292236328125, -2.2393798828125, -2.135467529296875, -2.03155517578125, -1.927642822265625, -1.82373046875, -1.719818115234375, -1.61590576171875, -1.511993408203125, -1.4080810546875, -1.304168701171875, -1.20025634765625, -1.096343994140625, -0.992431640625, -0.888519287109375, -0.78460693359375, -0.680694580078125, -0.5767822265625, -0.472869873046875, -0.36895751953125, -0.265045166015625, -0.1611328125, -0.057220458984375, 0.04669189453125, 0.150604248046875, 0.2545166015625, 0.358428955078125, 0.46234130859375, 0.566253662109375, 0.670166015625, 0.774078369140625, 0.87799072265625, 0.981903076171875, 1.0858154296875, 1.189727783203125, 1.29364013671875, 1.397552490234375, 1.50146484375, 1.605377197265625, 1.70928955078125, 1.813201904296875, 1.9171142578125, 2.021026611328125, 2.12493896484375, 2.228851318359375, 2.332763671875, 2.436676025390625, 2.54058837890625, 2.644500732421875, 2.7484130859375, 2.852325439453125, 2.95623779296875, 3.060150146484375, 3.1640625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 8.0, 4.0, 9.0, 7.0, 25.0, 24.0, 40.0, 49.0, 108.0, 158.0, 272.0, 455.0, 771.0, 1500.0, 3344.0, 8105.0, 26570.0, 199498.0, 2623301.0, 1221508.0, 82779.0, 15952.0, 5244.0, 2146.0, 1069.0, 549.0, 311.0, 172.0, 114.0, 67.0, 42.0, 33.0, 14.0, 11.0, 13.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4921875, -11.1419677734375, -10.791748046875, -10.4415283203125, -10.09130859375, -9.7410888671875, -9.390869140625, -9.0406494140625, -8.6904296875, -8.3402099609375, -7.989990234375, -7.6397705078125, -7.28955078125, -6.9393310546875, -6.589111328125, -6.2388916015625, -5.888671875, -5.5384521484375, -5.188232421875, -4.8380126953125, -4.48779296875, -4.1375732421875, -3.787353515625, -3.4371337890625, -3.0869140625, -2.7366943359375, -2.386474609375, -2.0362548828125, -1.68603515625, -1.3358154296875, -0.985595703125, -0.6353759765625, -0.28515625, 0.0650634765625, 0.415283203125, 0.7655029296875, 1.11572265625, 1.4659423828125, 1.816162109375, 2.1663818359375, 2.5166015625, 2.8668212890625, 3.217041015625, 3.5672607421875, 3.91748046875, 4.2677001953125, 4.617919921875, 4.9681396484375, 5.318359375, 5.6685791015625, 6.018798828125, 6.3690185546875, 6.71923828125, 7.0694580078125, 7.419677734375, 7.7698974609375, 8.1201171875, 8.4703369140625, 8.820556640625, 9.1707763671875, 9.52099609375, 9.8712158203125, 10.221435546875, 10.5716552734375, 10.921875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 5.0, 2.0, 7.0, 9.0, 11.0, 12.0, 25.0, 25.0, 38.0, 52.0, 69.0, 96.0, 114.0, 155.0, 241.0, 302.0, 389.0, 458.0, 482.0, 428.0, 304.0, 220.0, 182.0, 134.0, 82.0, 47.0, 44.0, 33.0, 13.0, 16.0, 14.0, 15.0, 13.0, 4.0, 8.0, 3.0, 10.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.28125, -6.07208251953125, -5.8629150390625, -5.65374755859375, -5.444580078125, -5.23541259765625, -5.0262451171875, -4.81707763671875, -4.60791015625, -4.39874267578125, -4.1895751953125, -3.98040771484375, -3.771240234375, -3.56207275390625, -3.3529052734375, -3.14373779296875, -2.9345703125, -2.72540283203125, -2.5162353515625, -2.30706787109375, -2.097900390625, -1.88873291015625, -1.6795654296875, -1.47039794921875, -1.26123046875, -1.05206298828125, -0.8428955078125, -0.63372802734375, -0.424560546875, -0.21539306640625, -0.0062255859375, 0.20294189453125, 0.412109375, 0.62127685546875, 0.8304443359375, 1.03961181640625, 1.248779296875, 1.45794677734375, 1.6671142578125, 1.87628173828125, 2.08544921875, 2.29461669921875, 2.5037841796875, 2.71295166015625, 2.922119140625, 3.13128662109375, 3.3404541015625, 3.54962158203125, 3.7587890625, 3.96795654296875, 4.1771240234375, 4.38629150390625, 4.595458984375, 4.80462646484375, 5.0137939453125, 5.22296142578125, 5.43212890625, 5.64129638671875, 5.8504638671875, 6.05963134765625, 6.268798828125, 6.47796630859375, 6.6871337890625, 6.89630126953125, 7.10546875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 13.0, 6.0, 18.0, 19.0, 23.0, 24.0, 32.0, 53.0, 88.0, 143.0, 270.0, 711.0, 1902.0, 7106.0, 56316.0, 2241944.0, 1828059.0, 47723.0, 6559.0, 1820.0, 634.0, 307.0, 159.0, 111.0, 66.0, 38.0, 28.0, 26.0, 15.0, 18.0, 4.0, 4.0, 10.0, 2.0, 5.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.375, -22.666015625, -21.95703125, -21.248046875, -20.5390625, -19.830078125, -19.12109375, -18.412109375, -17.703125, -16.994140625, -16.28515625, -15.576171875, -14.8671875, -14.158203125, -13.44921875, -12.740234375, -12.03125, -11.322265625, -10.61328125, -9.904296875, -9.1953125, -8.486328125, -7.77734375, -7.068359375, -6.359375, -5.650390625, -4.94140625, -4.232421875, -3.5234375, -2.814453125, -2.10546875, -1.396484375, -0.6875, 0.021484375, 0.73046875, 1.439453125, 2.1484375, 2.857421875, 3.56640625, 4.275390625, 4.984375, 5.693359375, 6.40234375, 7.111328125, 7.8203125, 8.529296875, 9.23828125, 9.947265625, 10.65625, 11.365234375, 12.07421875, 12.783203125, 13.4921875, 14.201171875, 14.91015625, 15.619140625, 16.328125, 17.037109375, 17.74609375, 18.455078125, 19.1640625, 19.873046875, 20.58203125, 21.291015625, 22.0]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 16.0, 29.0, 86.0, 143.0, 184.0, 229.0, 151.0, 95.0, 46.0, 14.0, 9.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.230268478393555, -17.723499298095703, -15.216730117797852, -12.709961891174316, -10.203192710876465, -7.696423530578613, -5.189655303955078, -2.6828861236572266, -0.176116943359375, 2.3306519985198975, 4.83742094039917, 7.344189643859863, 9.850958824157715, 12.357728004455566, 14.864496231079102, 17.371265411376953, 19.878034591674805, 22.384803771972656, 24.891572952270508, 27.39834213256836, 29.905109405517578, 32.41188049316406, 34.91864776611328, 37.4254150390625, 39.932186126708984, 42.4389533996582, 44.94572448730469, 47.452491760253906, 49.95926284790039, 52.46603012084961, 54.972801208496094, 57.47956848144531, 59.98633575439453, 62.49310302734375, 64.99987030029297, 67.50664520263672, 70.01341247558594, 72.52017974853516, 75.02694702148438, 77.53372192382812, 80.04048919677734, 82.54725646972656, 85.05402374267578, 87.56079864501953, 90.06756591796875, 92.57433319091797, 95.08110046386719, 97.58787536621094, 100.09463500976562, 102.60140228271484, 105.10816955566406, 107.61494445800781, 110.12171173095703, 112.62847900390625, 115.13524627685547, 117.64201354980469, 120.14878845214844, 122.65555572509766, 125.16232299804688, 127.66909790039062, 130.1758575439453, 132.68263244628906, 135.1894073486328, 137.6961669921875, 140.20294189453125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 4.0, 5.0, 10.0, 8.0, 11.0, 14.0, 18.0, 16.0, 21.0, 16.0, 37.0, 30.0, 38.0, 29.0, 33.0, 41.0, 44.0, 50.0, 39.0, 50.0, 49.0, 53.0, 44.0, 45.0, 36.0, 25.0, 21.0, 22.0, 31.0, 26.0, 19.0, 22.0, 18.0, 18.0, 12.0, 8.0, 6.0, 10.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.2144832611084, -24.47092628479004, -23.727367401123047, -22.983810424804688, -22.240253448486328, -21.49669647216797, -20.75313949584961, -20.009580612182617, -19.266023635864258, -18.5224666595459, -17.778907775878906, -17.035350799560547, -16.291793823242188, -15.548236846923828, -14.804678916931152, -14.061120986938477, -13.317564010620117, -12.574007034301758, -11.830449104309082, -11.086891174316406, -10.343334197998047, -9.599777221679688, -8.856219291687012, -8.112661361694336, -7.369104385375977, -6.625546932220459, -5.881989479064941, -5.138432025909424, -4.394874572753906, -3.6513171195983887, -2.907759666442871, -2.1642022132873535, -1.4206466674804688, -0.6770892143249512, 0.0664682388305664, 0.810025691986084, 1.5535831451416016, 2.297140598297119, 3.0406980514526367, 3.7842555046081543, 4.527812957763672, 5.2713704109191895, 6.014927864074707, 6.758485317230225, 7.502042770385742, 8.245599746704102, 8.989157676696777, 9.732715606689453, 10.476272583007812, 11.219829559326172, 11.963387489318848, 12.706945419311523, 13.450502395629883, 14.194059371948242, 14.937617301940918, 15.681175231933594, 16.424732208251953, 17.168289184570312, 17.911846160888672, 18.655405044555664, 19.398962020874023, 20.142518997192383, 20.886077880859375, 21.629634857177734, 22.373191833496094]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 6.0, 11.0, 10.0, 15.0, 14.0, 19.0, 30.0, 29.0, 30.0, 22.0, 28.0, 39.0, 53.0, 35.0, 44.0, 47.0, 42.0, 40.0, 50.0, 39.0, 45.0, 43.0, 37.0, 40.0, 42.0, 32.0, 27.0, 17.0, 18.0, 18.0, 12.0, 19.0, 8.0, 7.0, 6.0, 4.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.013580322265625, -2.90997314453125, -2.806365966796875, -2.7027587890625, -2.599151611328125, -2.49554443359375, -2.391937255859375, -2.288330078125, -2.184722900390625, -2.08111572265625, -1.977508544921875, -1.8739013671875, -1.770294189453125, -1.66668701171875, -1.563079833984375, -1.45947265625, -1.355865478515625, -1.25225830078125, -1.148651123046875, -1.0450439453125, -0.941436767578125, -0.83782958984375, -0.734222412109375, -0.630615234375, -0.527008056640625, -0.42340087890625, -0.319793701171875, -0.2161865234375, -0.112579345703125, -0.00897216796875, 0.094635009765625, 0.1982421875, 0.301849365234375, 0.40545654296875, 0.509063720703125, 0.6126708984375, 0.716278076171875, 0.81988525390625, 0.923492431640625, 1.027099609375, 1.130706787109375, 1.23431396484375, 1.337921142578125, 1.4415283203125, 1.545135498046875, 1.64874267578125, 1.752349853515625, 1.85595703125, 1.959564208984375, 2.06317138671875, 2.166778564453125, 2.2703857421875, 2.373992919921875, 2.47760009765625, 2.581207275390625, 2.684814453125, 2.788421630859375, 2.89202880859375, 2.995635986328125, 3.0992431640625, 3.202850341796875, 3.30645751953125, 3.410064697265625, 3.513671875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 18.0, 13.0, 21.0, 43.0, 59.0, 81.0, 149.0, 153.0, 291.0, 399.0, 654.0, 1037.0, 1585.0, 2429.0, 3767.0, 5756.0, 9417.0, 15253.0, 25505.0, 44359.0, 81679.0, 169423.0, 325170.0, 168612.0, 81923.0, 44404.0, 25564.0, 15045.0, 9259.0, 5881.0, 3776.0, 2366.0, 1475.0, 1020.0, 661.0, 433.0, 300.0, 195.0, 122.0, 92.0, 49.0, 37.0, 22.0, 21.0, 17.0, 10.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166015625, -0.16057205200195312, -0.15512847900390625, -0.14968490600585938, -0.1442413330078125, -0.13879776000976562, -0.13335418701171875, -0.12791061401367188, -0.122467041015625, -0.11702346801757812, -0.11157989501953125, -0.10613632202148438, -0.1006927490234375, -0.09524917602539062, -0.08980560302734375, -0.08436203002929688, -0.07891845703125, -0.07347488403320312, -0.06803131103515625, -0.06258773803710938, -0.0571441650390625, -0.051700592041015625, -0.04625701904296875, -0.040813446044921875, -0.035369873046875, -0.029926300048828125, -0.02448272705078125, -0.019039154052734375, -0.0135955810546875, -0.008152008056640625, -0.00270843505859375, 0.002735137939453125, 0.0081787109375, 0.013622283935546875, 0.01906585693359375, 0.024509429931640625, 0.0299530029296875, 0.035396575927734375, 0.04084014892578125, 0.046283721923828125, 0.051727294921875, 0.057170867919921875, 0.06261444091796875, 0.06805801391601562, 0.0735015869140625, 0.07894515991210938, 0.08438873291015625, 0.08983230590820312, 0.09527587890625, 0.10071945190429688, 0.10616302490234375, 0.11160659790039062, 0.1170501708984375, 0.12249374389648438, 0.12793731689453125, 0.13338088989257812, 0.138824462890625, 0.14426803588867188, 0.14971160888671875, 0.15515518188476562, 0.1605987548828125, 0.16604232788085938, 0.17148590087890625, 0.17692947387695312, 0.182373046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 7.0, 12.0, 7.0, 12.0, 13.0, 16.0, 16.0, 21.0, 16.0, 17.0, 28.0, 26.0, 26.0, 26.0, 42.0, 35.0, 33.0, 44.0, 36.0, 38.0, 1064.0, 39.0, 36.0, 39.0, 38.0, 26.0, 36.0, 28.0, 31.0, 31.0, 33.0, 22.0, 18.0, 21.0, 12.0, 16.0, 11.0, 13.0, 7.0, 5.0, 6.0, 9.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.615234375, -2.535308837890625, -2.45538330078125, -2.375457763671875, -2.2955322265625, -2.215606689453125, -2.13568115234375, -2.055755615234375, -1.975830078125, -1.895904541015625, -1.81597900390625, -1.736053466796875, -1.6561279296875, -1.576202392578125, -1.49627685546875, -1.416351318359375, -1.33642578125, -1.256500244140625, -1.17657470703125, -1.096649169921875, -1.0167236328125, -0.936798095703125, -0.85687255859375, -0.776947021484375, -0.697021484375, -0.617095947265625, -0.53717041015625, -0.457244873046875, -0.3773193359375, -0.297393798828125, -0.21746826171875, -0.137542724609375, -0.0576171875, 0.022308349609375, 0.10223388671875, 0.182159423828125, 0.2620849609375, 0.342010498046875, 0.42193603515625, 0.501861572265625, 0.581787109375, 0.661712646484375, 0.74163818359375, 0.821563720703125, 0.9014892578125, 0.981414794921875, 1.06134033203125, 1.141265869140625, 1.22119140625, 1.301116943359375, 1.38104248046875, 1.460968017578125, 1.5408935546875, 1.620819091796875, 1.70074462890625, 1.780670166015625, 1.860595703125, 1.940521240234375, 2.02044677734375, 2.100372314453125, 2.1802978515625, 2.260223388671875, 2.34014892578125, 2.420074462890625, 2.5]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 7.0, 10.0, 17.0, 13.0, 31.0, 33.0, 45.0, 72.0, 87.0, 126.0, 181.0, 299.0, 385.0, 518.0, 712.0, 1051.0, 1457.0, 1978.0, 2709.0, 3980.0, 5565.0, 7791.0, 11214.0, 15667.0, 23360.0, 34812.0, 53961.0, 89851.0, 170040.0, 1300163.0, 141790.0, 78705.0, 48532.0, 31463.0, 20914.0, 14568.0, 10081.0, 7094.0, 5098.0, 3584.0, 2611.0, 1898.0, 1280.0, 967.0, 684.0, 477.0, 369.0, 258.0, 203.0, 127.0, 81.0, 70.0, 46.0, 40.0, 19.0, 21.0, 12.0, 11.0, 1.0, 5.0, 2.0, 1.0], "bins": [-0.050750732421875, -0.04913330078125, -0.047515869140625, -0.0458984375, -0.044281005859375, -0.04266357421875, -0.041046142578125, -0.0394287109375, -0.037811279296875, -0.03619384765625, -0.034576416015625, -0.032958984375, -0.031341552734375, -0.02972412109375, -0.028106689453125, -0.0264892578125, -0.024871826171875, -0.02325439453125, -0.021636962890625, -0.02001953125, -0.018402099609375, -0.01678466796875, -0.015167236328125, -0.0135498046875, -0.011932373046875, -0.01031494140625, -0.008697509765625, -0.007080078125, -0.005462646484375, -0.00384521484375, -0.002227783203125, -0.0006103515625, 0.001007080078125, 0.00262451171875, 0.004241943359375, 0.005859375, 0.007476806640625, 0.00909423828125, 0.010711669921875, 0.0123291015625, 0.013946533203125, 0.01556396484375, 0.017181396484375, 0.018798828125, 0.020416259765625, 0.02203369140625, 0.023651123046875, 0.0252685546875, 0.026885986328125, 0.02850341796875, 0.030120849609375, 0.03173828125, 0.033355712890625, 0.03497314453125, 0.036590576171875, 0.0382080078125, 0.039825439453125, 0.04144287109375, 0.043060302734375, 0.044677734375, 0.046295166015625, 0.04791259765625, 0.049530029296875, 0.0511474609375, 0.052764892578125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 1.0, 7.0, 7.0, 6.0, 8.0, 8.0, 7.0, 19.0, 24.0, 30.0, 27.0, 36.0, 54.0, 58.0, 73.0, 126.0, 125.0, 83.0, 47.0, 44.0, 31.0, 32.0, 27.0, 18.0, 11.0, 15.0, 5.0, 9.0, 12.0, 6.0, 7.0, 1.0, 5.0, 2.0, 8.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0009245872497558594, -0.0008936896920204163, -0.0008627921342849731, -0.00083189457654953, -0.0008009970188140869, -0.0007700994610786438, -0.0007392019033432007, -0.0007083043456077576, -0.0006774067878723145, -0.0006465092301368713, -0.0006156116724014282, -0.0005847141146659851, -0.000553816556930542, -0.0005229189991950989, -0.0004920214414596558, -0.00046112388372421265, -0.00043022632598876953, -0.0003993287682533264, -0.0003684312105178833, -0.0003375336527824402, -0.00030663609504699707, -0.00027573853731155396, -0.00024484097957611084, -0.00021394342184066772, -0.0001830458641052246, -0.0001521483063697815, -0.00012125074863433838, -9.035319089889526e-05, -5.945563316345215e-05, -2.8558075428009033e-05, 2.339482307434082e-06, 3.32370400428772e-05, 6.413459777832031e-05, 9.503215551376343e-05, 0.00012592971324920654, 0.00015682727098464966, 0.00018772482872009277, 0.0002186223864555359, 0.000249519944190979, 0.0002804175019264221, 0.00031131505966186523, 0.00034221261739730835, 0.00037311017513275146, 0.0004040077328681946, 0.0004349052906036377, 0.0004658028483390808, 0.0004967004060745239, 0.000527597963809967, 0.0005584955215454102, 0.0005893930792808533, 0.0006202906370162964, 0.0006511881947517395, 0.0006820857524871826, 0.0007129833102226257, 0.0007438808679580688, 0.000774778425693512, 0.0008056759834289551, 0.0008365735411643982, 0.0008674710988998413, 0.0008983686566352844, 0.0009292662143707275, 0.0009601637721061707, 0.0009910613298416138, 0.0010219588875770569, 0.0010528564453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 10.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 13.0, 5.0, 11.0, 15.0, 17.0, 35.0, 40.0, 72.0, 102.0, 283.0, 1278.0, 31318.0, 979370.0, 33975.0, 1363.0, 251.0, 116.0, 58.0, 51.0, 37.0, 27.0, 16.0, 9.0, 11.0, 7.0, 6.0, 6.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.019622802734375, -0.019054174423217773, -0.018485546112060547, -0.01791691780090332, -0.017348289489746094, -0.016779661178588867, -0.01621103286743164, -0.015642404556274414, -0.015073776245117188, -0.014505147933959961, -0.013936519622802734, -0.013367891311645508, -0.012799263000488281, -0.012230634689331055, -0.011662006378173828, -0.011093378067016602, -0.010524749755859375, -0.009956121444702148, -0.009387493133544922, -0.008818864822387695, -0.008250236511230469, -0.007681608200073242, -0.007112979888916016, -0.006544351577758789, -0.0059757232666015625, -0.005407094955444336, -0.004838466644287109, -0.004269838333129883, -0.0037012100219726562, -0.0031325817108154297, -0.002563953399658203, -0.0019953250885009766, -0.00142669677734375, -0.0008580684661865234, -0.0002894401550292969, 0.0002791881561279297, 0.0008478164672851562, 0.0014164447784423828, 0.0019850730895996094, 0.002553701400756836, 0.0031223297119140625, 0.003690958023071289, 0.004259586334228516, 0.004828214645385742, 0.005396842956542969, 0.005965471267700195, 0.006534099578857422, 0.0071027278900146484, 0.007671356201171875, 0.008239984512329102, 0.008808612823486328, 0.009377241134643555, 0.009945869445800781, 0.010514497756958008, 0.011083126068115234, 0.011651754379272461, 0.012220382690429688, 0.012789011001586914, 0.01335763931274414, 0.013926267623901367, 0.014494895935058594, 0.01506352424621582, 0.015632152557373047, 0.016200780868530273, 0.0167694091796875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 653.0, 359.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018341382965445518, -0.001212620292790234, -0.0005911022890359163, 3.0415714718401432e-05, 0.0006519337184727192, 0.0012734518386423588, 0.0018949697259813547, 0.0025164876133203506, 0.0031380057334899902, 0.00375952385365963, 0.004381041973829269, 0.005002559628337622, 0.005624077748507261, 0.006245595868676901, 0.006867113523185253, 0.007488631643354893, 0.008110149763524532, 0.008731667883694172, 0.009353186003863811, 0.009974704124033451, 0.010596221312880516, 0.011217739433050156, 0.011839257553219795, 0.012460775673389435, 0.013082293793559074, 0.013703811913728714, 0.014325330033898354, 0.014946848154067993, 0.015568366274237633, 0.016189884394407272, 0.016811402514576912, 0.01743292063474655, 0.018054436892271042, 0.01867595501244068, 0.01929747313261032, 0.01991899125277996, 0.0205405093729496, 0.02116202749311924, 0.02178354561328888, 0.02240506187081337, 0.02302658185362816, 0.023648099973797798, 0.024269618093967438, 0.024891136214137077, 0.025512654334306717, 0.026134172454476357, 0.026755690574645996, 0.027377206832170486, 0.027998724952340126, 0.028620243072509766, 0.029241761192679405, 0.029863279312849045, 0.030484797433018684, 0.031106315553188324, 0.031727831810712814, 0.0323493517935276, 0.032970868051052094, 0.033592384308576584, 0.03421390429139137, 0.03483542054891586, 0.03545694053173065, 0.03607845678925514, 0.03669997677206993, 0.03732149302959442, 0.03794301301240921]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 9.0, 7.0, 13.0, 29.0, 30.0, 30.0, 46.0, 55.0, 50.0, 84.0, 73.0, 79.0, 108.0, 66.0, 85.0, 63.0, 53.0, 42.0, 35.0, 24.0, 10.0, 3.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.002049744129180908, -0.002006715163588524, -0.0019636861979961395, -0.0019206572324037552, -0.0018776282668113708, -0.0018345993012189865, -0.0017915703356266022, -0.0017485413700342178, -0.0017055124044418335, -0.0016624834388494492, -0.0016194544732570648, -0.0015764255076646805, -0.0015333965420722961, -0.0014903675764799118, -0.0014473386108875275, -0.0014043096452951431, -0.0013612806797027588, -0.0013182517141103745, -0.0012752227485179901, -0.0012321937829256058, -0.0011891648173332214, -0.001146135851740837, -0.0011031068861484528, -0.0010600779205560684, -0.001017048954963684, -0.0009740199893712997, -0.0009309910237789154, -0.0008879620581865311, -0.0008449330925941467, -0.0008019041270017624, -0.000758875161409378, -0.0007158461958169937, -0.0006728172302246094, -0.000629788264632225, -0.0005867592990398407, -0.0005437303334474564, -0.000500701367855072, -0.0004576724022626877, -0.00041464343667030334, -0.000371614471077919, -0.00032858550548553467, -0.00028555653989315033, -0.000242527574300766, -0.00019949860870838165, -0.00015646964311599731, -0.00011344067752361298, -7.041171193122864e-05, -2.73827463388443e-05, 1.564621925354004e-05, 5.867518484592438e-05, 0.00010170415043830872, 0.00014473311603069305, 0.0001877620816230774, 0.00023079104721546173, 0.00027382001280784607, 0.0003168489784002304, 0.00035987794399261475, 0.0004029069095849991, 0.0004459358751773834, 0.0004889648407697678, 0.0005319938063621521, 0.0005750227719545364, 0.0006180517375469208, 0.0006610807031393051, 0.0007041096687316895]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 7.0, 4.0, 5.0, 6.0, 11.0, 10.0, 15.0, 14.0, 19.0, 30.0, 29.0, 30.0, 22.0, 28.0, 39.0, 53.0, 35.0, 44.0, 47.0, 42.0, 40.0, 50.0, 39.0, 45.0, 43.0, 37.0, 40.0, 42.0, 32.0, 27.0, 17.0, 18.0, 18.0, 12.0, 19.0, 8.0, 7.0, 6.0, 4.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1171875, -3.013580322265625, -2.90997314453125, -2.806365966796875, -2.7027587890625, -2.599151611328125, -2.49554443359375, -2.391937255859375, -2.288330078125, -2.184722900390625, -2.08111572265625, -1.977508544921875, -1.8739013671875, -1.770294189453125, -1.66668701171875, -1.563079833984375, -1.45947265625, -1.355865478515625, -1.25225830078125, -1.148651123046875, -1.0450439453125, -0.941436767578125, -0.83782958984375, -0.734222412109375, -0.630615234375, -0.527008056640625, -0.42340087890625, -0.319793701171875, -0.2161865234375, -0.112579345703125, -0.00897216796875, 0.094635009765625, 0.1982421875, 0.301849365234375, 0.40545654296875, 0.509063720703125, 0.6126708984375, 0.716278076171875, 0.81988525390625, 0.923492431640625, 1.027099609375, 1.130706787109375, 1.23431396484375, 1.337921142578125, 1.4415283203125, 1.545135498046875, 1.64874267578125, 1.752349853515625, 1.85595703125, 1.959564208984375, 2.06317138671875, 2.166778564453125, 2.2703857421875, 2.373992919921875, 2.47760009765625, 2.581207275390625, 2.684814453125, 2.788421630859375, 2.89202880859375, 2.995635986328125, 3.0992431640625, 3.202850341796875, 3.30645751953125, 3.410064697265625, 3.513671875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 12.0, 8.0, 19.0, 21.0, 43.0, 61.0, 118.0, 154.0, 265.0, 454.0, 751.0, 1355.0, 2515.0, 4702.0, 9846.0, 22616.0, 57395.0, 176433.0, 428822.0, 223002.0, 69928.0, 26697.0, 11492.0, 5494.0, 2769.0, 1478.0, 782.0, 526.0, 282.0, 178.0, 116.0, 62.0, 56.0, 32.0, 22.0, 18.0, 9.0, 9.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.91058349609375, -5.7235107421875, -5.53643798828125, -5.349365234375, -5.16229248046875, -4.9752197265625, -4.78814697265625, -4.60107421875, -4.41400146484375, -4.2269287109375, -4.03985595703125, -3.852783203125, -3.66571044921875, -3.4786376953125, -3.29156494140625, -3.1044921875, -2.91741943359375, -2.7303466796875, -2.54327392578125, -2.356201171875, -2.16912841796875, -1.9820556640625, -1.79498291015625, -1.60791015625, -1.42083740234375, -1.2337646484375, -1.04669189453125, -0.859619140625, -0.67254638671875, -0.4854736328125, -0.29840087890625, -0.111328125, 0.07574462890625, 0.2628173828125, 0.44989013671875, 0.636962890625, 0.82403564453125, 1.0111083984375, 1.19818115234375, 1.38525390625, 1.57232666015625, 1.7593994140625, 1.94647216796875, 2.133544921875, 2.32061767578125, 2.5076904296875, 2.69476318359375, 2.8818359375, 3.06890869140625, 3.2559814453125, 3.44305419921875, 3.630126953125, 3.81719970703125, 4.0042724609375, 4.19134521484375, 4.37841796875, 4.56549072265625, 4.7525634765625, 4.93963623046875, 5.126708984375, 5.31378173828125, 5.5008544921875, 5.68792724609375, 5.875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 8.0, 9.0, 15.0, 12.0, 13.0, 16.0, 24.0, 28.0, 23.0, 34.0, 43.0, 51.0, 52.0, 73.0, 119.0, 171.0, 1339.0, 330.0, 175.0, 111.0, 70.0, 61.0, 42.0, 41.0, 20.0, 32.0, 28.0, 18.0, 12.0, 20.0, 13.0, 7.0, 8.0, 8.0, 2.0, 6.0, 0.0, 2.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9466552734375, -10.604248046875, -10.2618408203125, -9.91943359375, -9.5770263671875, -9.234619140625, -8.8922119140625, -8.5498046875, -8.2073974609375, -7.864990234375, -7.5225830078125, -7.18017578125, -6.8377685546875, -6.495361328125, -6.1529541015625, -5.810546875, -5.4681396484375, -5.125732421875, -4.7833251953125, -4.44091796875, -4.0985107421875, -3.756103515625, -3.4136962890625, -3.0712890625, -2.7288818359375, -2.386474609375, -2.0440673828125, -1.70166015625, -1.3592529296875, -1.016845703125, -0.6744384765625, -0.33203125, 0.0103759765625, 0.352783203125, 0.6951904296875, 1.03759765625, 1.3800048828125, 1.722412109375, 2.0648193359375, 2.4072265625, 2.7496337890625, 3.092041015625, 3.4344482421875, 3.77685546875, 4.1192626953125, 4.461669921875, 4.8040771484375, 5.146484375, 5.4888916015625, 5.831298828125, 6.1737060546875, 6.51611328125, 6.8585205078125, 7.200927734375, 7.5433349609375, 7.8857421875, 8.2281494140625, 8.570556640625, 8.9129638671875, 9.25537109375, 9.5977783203125, 9.940185546875, 10.2825927734375, 10.625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 11.0, 11.0, 4.0, 14.0, 22.0, 28.0, 41.0, 38.0, 54.0, 71.0, 107.0, 165.0, 228.0, 463.0, 1219.0, 3885.0, 25041.0, 782205.0, 2262337.0, 60165.0, 6404.0, 1626.0, 618.0, 306.0, 183.0, 120.0, 73.0, 65.0, 44.0, 35.0, 19.0, 22.0, 21.0, 14.0, 13.0, 9.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.07373046875, -15.5224609375, -14.97119140625, -14.419921875, -13.86865234375, -13.3173828125, -12.76611328125, -12.21484375, -11.66357421875, -11.1123046875, -10.56103515625, -10.009765625, -9.45849609375, -8.9072265625, -8.35595703125, -7.8046875, -7.25341796875, -6.7021484375, -6.15087890625, -5.599609375, -5.04833984375, -4.4970703125, -3.94580078125, -3.39453125, -2.84326171875, -2.2919921875, -1.74072265625, -1.189453125, -0.63818359375, -0.0869140625, 0.46435546875, 1.015625, 1.56689453125, 2.1181640625, 2.66943359375, 3.220703125, 3.77197265625, 4.3232421875, 4.87451171875, 5.42578125, 5.97705078125, 6.5283203125, 7.07958984375, 7.630859375, 8.18212890625, 8.7333984375, 9.28466796875, 9.8359375, 10.38720703125, 10.9384765625, 11.48974609375, 12.041015625, 12.59228515625, 13.1435546875, 13.69482421875, 14.24609375, 14.79736328125, 15.3486328125, 15.89990234375, 16.451171875, 17.00244140625, 17.5537109375, 18.10498046875, 18.65625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 13.0, 325.0, 639.0, 42.0, 1.0], "bins": [-458.5304870605469, -451.0351867675781, -443.5398864746094, -436.0445556640625, -428.54925537109375, -421.053955078125, -413.55865478515625, -406.0633239746094, -398.5680236816406, -391.0727233886719, -383.5774230957031, -376.08209228515625, -368.5867919921875, -361.09149169921875, -353.59619140625, -346.1008605957031, -338.6055603027344, -331.1102600097656, -323.6149597167969, -316.11962890625, -308.62432861328125, -301.1290283203125, -293.63372802734375, -286.1383972167969, -278.6430969238281, -271.1477966308594, -263.6524963378906, -256.15716552734375, -248.661865234375, -241.16656494140625, -233.67124938964844, -226.1759490966797, -218.68063354492188, -211.18533325195312, -203.6900177001953, -196.19471740722656, -188.69940185546875, -181.2041015625, -173.7087860107422, -166.21348571777344, -158.7181854248047, -151.22288513183594, -143.72756958007812, -136.23226928710938, -128.73695373535156, -121.24165344238281, -113.746337890625, -106.25103759765625, -98.75572204589844, -91.26041412353516, -83.76510620117188, -76.2697982788086, -68.77449035644531, -61.2791862487793, -53.783878326416016, -46.288570404052734, -38.79326248168945, -31.297954559326172, -23.80264663696289, -16.307340621948242, -8.812032699584961, -1.3167266845703125, 6.178581237792969, 13.67388916015625, 21.16919708251953]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 8.0, 5.0, 12.0, 18.0, 16.0, 17.0, 18.0, 20.0, 19.0, 33.0, 37.0, 38.0, 39.0, 45.0, 41.0, 58.0, 40.0, 45.0, 38.0, 39.0, 33.0, 51.0, 32.0, 32.0, 31.0, 30.0, 25.0, 27.0, 23.0, 32.0, 18.0, 12.0, 17.0, 11.0, 9.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.43394470214844, -32.4145393371582, -31.395137786865234, -30.375734329223633, -29.35633087158203, -28.336925506591797, -27.317522048950195, -26.298118591308594, -25.278715133666992, -24.25931167602539, -23.23990821838379, -22.220504760742188, -21.201099395751953, -20.181697845458984, -19.16229248046875, -18.14288902282715, -17.123485565185547, -16.104082107543945, -15.084678649902344, -14.065274238586426, -13.045870780944824, -12.026467323303223, -11.007062911987305, -9.987659454345703, -8.968255996704102, -7.9488525390625, -6.92944860458374, -5.9100446701049805, -4.890641212463379, -3.8712377548217773, -2.8518338203430176, -1.8324298858642578, -0.8130302429199219, 0.2063734531402588, 1.2257771492004395, 2.24518084526062, 3.264584541320801, 4.283987998962402, 5.303391933441162, 6.322795867919922, 7.342199325561523, 8.361602783203125, 9.381006240844727, 10.400410652160645, 11.419814109802246, 12.439217567443848, 13.458621978759766, 14.478025436401367, 15.497428894042969, 16.51683235168457, 17.536235809326172, 18.555639266967773, 19.575042724609375, 20.59444808959961, 21.61385154724121, 22.633255004882812, 23.652658462524414, 24.672061920166016, 25.691465377807617, 26.71086883544922, 27.730274200439453, 28.749675750732422, 29.769081115722656, 30.788484573364258, 31.80788803100586]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 4.0, 9.0, 11.0, 6.0, 6.0, 15.0, 12.0, 20.0, 17.0, 22.0, 28.0, 27.0, 30.0, 38.0, 25.0, 40.0, 45.0, 44.0, 51.0, 45.0, 36.0, 39.0, 51.0, 46.0, 36.0, 35.0, 41.0, 38.0, 37.0, 26.0, 20.0, 18.0, 17.0, 13.0, 12.0, 10.0, 7.0, 6.0, 10.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.404296875, -3.298065185546875, -3.19183349609375, -3.085601806640625, -2.9793701171875, -2.873138427734375, -2.76690673828125, -2.660675048828125, -2.554443359375, -2.448211669921875, -2.34197998046875, -2.235748291015625, -2.1295166015625, -2.023284912109375, -1.91705322265625, -1.810821533203125, -1.70458984375, -1.598358154296875, -1.49212646484375, -1.385894775390625, -1.2796630859375, -1.173431396484375, -1.06719970703125, -0.960968017578125, -0.854736328125, -0.748504638671875, -0.64227294921875, -0.536041259765625, -0.4298095703125, -0.323577880859375, -0.21734619140625, -0.111114501953125, -0.0048828125, 0.101348876953125, 0.20758056640625, 0.313812255859375, 0.4200439453125, 0.526275634765625, 0.63250732421875, 0.738739013671875, 0.844970703125, 0.951202392578125, 1.05743408203125, 1.163665771484375, 1.2698974609375, 1.376129150390625, 1.48236083984375, 1.588592529296875, 1.69482421875, 1.801055908203125, 1.90728759765625, 2.013519287109375, 2.1197509765625, 2.225982666015625, 2.33221435546875, 2.438446044921875, 2.544677734375, 2.650909423828125, 2.75714111328125, 2.863372802734375, 2.9696044921875, 3.075836181640625, 3.18206787109375, 3.288299560546875, 3.39453125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 6.0, 9.0, 12.0, 24.0, 47.0, 56.0, 97.0, 169.0, 234.0, 452.0, 883.0, 1849.0, 3893.0, 10331.0, 37207.0, 369706.0, 2999431.0, 692840.0, 55603.0, 12653.0, 4565.0, 2034.0, 1001.0, 489.0, 259.0, 153.0, 95.0, 67.0, 29.0, 28.0, 17.0, 17.0, 5.0, 7.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53125, -11.1776123046875, -10.823974609375, -10.4703369140625, -10.11669921875, -9.7630615234375, -9.409423828125, -9.0557861328125, -8.7021484375, -8.3485107421875, -7.994873046875, -7.6412353515625, -7.28759765625, -6.9339599609375, -6.580322265625, -6.2266845703125, -5.873046875, -5.5194091796875, -5.165771484375, -4.8121337890625, -4.45849609375, -4.1048583984375, -3.751220703125, -3.3975830078125, -3.0439453125, -2.6903076171875, -2.336669921875, -1.9830322265625, -1.62939453125, -1.2757568359375, -0.922119140625, -0.5684814453125, -0.21484375, 0.1387939453125, 0.492431640625, 0.8460693359375, 1.19970703125, 1.5533447265625, 1.906982421875, 2.2606201171875, 2.6142578125, 2.9678955078125, 3.321533203125, 3.6751708984375, 4.02880859375, 4.3824462890625, 4.736083984375, 5.0897216796875, 5.443359375, 5.7969970703125, 6.150634765625, 6.5042724609375, 6.85791015625, 7.2115478515625, 7.565185546875, 7.9188232421875, 8.2724609375, 8.6260986328125, 8.979736328125, 9.3333740234375, 9.68701171875, 10.0406494140625, 10.394287109375, 10.7479248046875, 11.1015625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 12.0, 20.0, 31.0, 40.0, 64.0, 123.0, 151.0, 277.0, 453.0, 713.0, 794.0, 557.0, 358.0, 201.0, 105.0, 63.0, 41.0, 17.0, 23.0, 11.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.203125, -11.845703125, -11.48828125, -11.130859375, -10.7734375, -10.416015625, -10.05859375, -9.701171875, -9.34375, -8.986328125, -8.62890625, -8.271484375, -7.9140625, -7.556640625, -7.19921875, -6.841796875, -6.484375, -6.126953125, -5.76953125, -5.412109375, -5.0546875, -4.697265625, -4.33984375, -3.982421875, -3.625, -3.267578125, -2.91015625, -2.552734375, -2.1953125, -1.837890625, -1.48046875, -1.123046875, -0.765625, -0.408203125, -0.05078125, 0.306640625, 0.6640625, 1.021484375, 1.37890625, 1.736328125, 2.09375, 2.451171875, 2.80859375, 3.166015625, 3.5234375, 3.880859375, 4.23828125, 4.595703125, 4.953125, 5.310546875, 5.66796875, 6.025390625, 6.3828125, 6.740234375, 7.09765625, 7.455078125, 7.8125, 8.169921875, 8.52734375, 8.884765625, 9.2421875, 9.599609375, 9.95703125, 10.314453125, 10.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 20.0, 25.0, 38.0, 67.0, 159.0, 255.0, 792.0, 2887.0, 28037.0, 3335165.0, 811808.0, 12016.0, 1859.0, 553.0, 277.0, 126.0, 69.0, 45.0, 27.0, 13.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.9375, -31.7958984375, -30.654296875, -29.5126953125, -28.37109375, -27.2294921875, -26.087890625, -24.9462890625, -23.8046875, -22.6630859375, -21.521484375, -20.3798828125, -19.23828125, -18.0966796875, -16.955078125, -15.8134765625, -14.671875, -13.5302734375, -12.388671875, -11.2470703125, -10.10546875, -8.9638671875, -7.822265625, -6.6806640625, -5.5390625, -4.3974609375, -3.255859375, -2.1142578125, -0.97265625, 0.1689453125, 1.310546875, 2.4521484375, 3.59375, 4.7353515625, 5.876953125, 7.0185546875, 8.16015625, 9.3017578125, 10.443359375, 11.5849609375, 12.7265625, 13.8681640625, 15.009765625, 16.1513671875, 17.29296875, 18.4345703125, 19.576171875, 20.7177734375, 21.859375, 23.0009765625, 24.142578125, 25.2841796875, 26.42578125, 27.5673828125, 28.708984375, 29.8505859375, 30.9921875, 32.1337890625, 33.275390625, 34.4169921875, 35.55859375, 36.7001953125, 37.841796875, 38.9833984375, 40.125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 10.0, 16.0, 20.0, 25.0, 38.0, 54.0, 76.0, 95.0, 108.0, 113.0, 90.0, 90.0, 73.0, 61.0, 35.0, 34.0, 17.0, 13.0, 8.0, 13.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.78776168823242, -36.51385498046875, -35.23994445800781, -33.96603775024414, -32.69213104248047, -31.418222427368164, -30.14431381225586, -28.870407104492188, -27.596500396728516, -26.32259178161621, -25.04868507385254, -23.774776458740234, -22.500869750976562, -21.226961135864258, -19.953052520751953, -18.67914581298828, -17.405237197875977, -16.131328582763672, -14.857421875, -13.583513259887695, -12.309606552124023, -11.035697937011719, -9.76179027557373, -8.487882614135742, -7.213974952697754, -5.940067291259766, -4.666159629821777, -3.392251491546631, -2.1183438301086426, -0.8444361686706543, 0.4294719696044922, 1.7033796310424805, 2.9772872924804688, 4.251194953918457, 5.525102615356445, 6.799010753631592, 8.072917938232422, 9.346826553344727, 10.620734214782715, 11.894641876220703, 13.168549537658691, 14.44245719909668, 15.716364860534668, 16.990272521972656, 18.26418113708496, 19.538087844848633, 20.811996459960938, 22.08590316772461, 23.359811782836914, 24.63372039794922, 25.90762710571289, 27.181535720825195, 28.455442428588867, 29.729351043701172, 31.003257751464844, 32.27716827392578, 33.55107498168945, 34.824981689453125, 36.09889221191406, 37.372798919677734, 38.646705627441406, 39.92061233520508, 41.194522857666016, 42.46842956542969, 43.74233627319336]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 5.0, 7.0, 15.0, 6.0, 15.0, 13.0, 22.0, 18.0, 28.0, 28.0, 21.0, 25.0, 28.0, 35.0, 25.0, 46.0, 35.0, 33.0, 33.0, 47.0, 39.0, 30.0, 34.0, 30.0, 32.0, 35.0, 37.0, 32.0, 31.0, 26.0, 28.0, 17.0, 22.0, 18.0, 13.0, 7.0, 18.0, 10.0, 13.0, 7.0, 6.0, 6.0, 3.0, 4.0, 3.0, 5.0, 6.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-20.617080688476562, -19.964778900146484, -19.312477111816406, -18.660175323486328, -18.00787353515625, -17.355571746826172, -16.703269958496094, -16.050968170166016, -15.398666381835938, -14.74636459350586, -14.094062805175781, -13.441761016845703, -12.789459228515625, -12.137157440185547, -11.484855651855469, -10.83255386352539, -10.180252075195312, -9.527950286865234, -8.875648498535156, -8.223346710205078, -7.571044921875, -6.918743133544922, -6.266441345214844, -5.614139556884766, -4.9618377685546875, -4.309535980224609, -3.6572341918945312, -3.004932403564453, -2.352630615234375, -1.7003288269042969, -1.0480270385742188, -0.3957252502441406, 0.2565765380859375, 0.9088783264160156, 1.5611801147460938, 2.213481903076172, 2.86578369140625, 3.518085479736328, 4.170387268066406, 4.822689056396484, 5.4749908447265625, 6.127292633056641, 6.779594421386719, 7.431896209716797, 8.084197998046875, 8.736499786376953, 9.388801574707031, 10.04110336303711, 10.693405151367188, 11.345706939697266, 11.998008728027344, 12.650310516357422, 13.3026123046875, 13.954914093017578, 14.607215881347656, 15.259517669677734, 15.911819458007812, 16.56412124633789, 17.21642303466797, 17.868724822998047, 18.521026611328125, 19.173328399658203, 19.82563018798828, 20.47793197631836, 21.130233764648438]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 5.0, 7.0, 3.0, 12.0, 5.0, 10.0, 9.0, 14.0, 14.0, 18.0, 18.0, 28.0, 26.0, 30.0, 30.0, 37.0, 37.0, 39.0, 38.0, 54.0, 38.0, 39.0, 44.0, 47.0, 38.0, 41.0, 38.0, 33.0, 36.0, 35.0, 28.0, 28.0, 23.0, 13.0, 15.0, 17.0, 13.0, 9.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.5078125, -3.403350830078125, -3.29888916015625, -3.194427490234375, -3.0899658203125, -2.985504150390625, -2.88104248046875, -2.776580810546875, -2.672119140625, -2.567657470703125, -2.46319580078125, -2.358734130859375, -2.2542724609375, -2.149810791015625, -2.04534912109375, -1.940887451171875, -1.83642578125, -1.731964111328125, -1.62750244140625, -1.523040771484375, -1.4185791015625, -1.314117431640625, -1.20965576171875, -1.105194091796875, -1.000732421875, -0.896270751953125, -0.79180908203125, -0.687347412109375, -0.5828857421875, -0.478424072265625, -0.37396240234375, -0.269500732421875, -0.1650390625, -0.060577392578125, 0.04388427734375, 0.148345947265625, 0.2528076171875, 0.357269287109375, 0.46173095703125, 0.566192626953125, 0.670654296875, 0.775115966796875, 0.87957763671875, 0.984039306640625, 1.0885009765625, 1.192962646484375, 1.29742431640625, 1.401885986328125, 1.50634765625, 1.610809326171875, 1.71527099609375, 1.819732666015625, 1.9241943359375, 2.028656005859375, 2.13311767578125, 2.237579345703125, 2.342041015625, 2.446502685546875, 2.55096435546875, 2.655426025390625, 2.7598876953125, 2.864349365234375, 2.96881103515625, 3.073272705078125, 3.177734375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 12.0, 16.0, 37.0, 44.0, 65.0, 65.0, 139.0, 199.0, 267.0, 428.0, 615.0, 857.0, 1327.0, 2132.0, 3340.0, 5147.0, 8506.0, 13864.0, 23269.0, 40812.0, 74616.0, 159974.0, 372954.0, 162192.0, 75524.0, 41149.0, 23777.0, 13865.0, 8476.0, 5177.0, 3396.0, 2109.0, 1424.0, 939.0, 560.0, 405.0, 310.0, 178.0, 105.0, 100.0, 63.0, 34.0, 34.0, 19.0, 14.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19729995727539062, -0.19123077392578125, -0.18516159057617188, -0.1790924072265625, -0.17302322387695312, -0.16695404052734375, -0.16088485717773438, -0.154815673828125, -0.14874649047851562, -0.14267730712890625, -0.13660812377929688, -0.1305389404296875, -0.12446975708007812, -0.11840057373046875, -0.11233139038085938, -0.10626220703125, -0.10019302368164062, -0.09412384033203125, -0.08805465698242188, -0.0819854736328125, -0.07591629028320312, -0.06984710693359375, -0.06377792358398438, -0.057708740234375, -0.051639556884765625, -0.04557037353515625, -0.039501190185546875, -0.0334320068359375, -0.027362823486328125, -0.02129364013671875, -0.015224456787109375, -0.0091552734375, -0.003086090087890625, 0.00298309326171875, 0.009052276611328125, 0.0151214599609375, 0.021190643310546875, 0.02725982666015625, 0.033329010009765625, 0.039398193359375, 0.045467376708984375, 0.05153656005859375, 0.057605743408203125, 0.0636749267578125, 0.06974411010742188, 0.07581329345703125, 0.08188247680664062, 0.08795166015625, 0.09402084350585938, 0.10009002685546875, 0.10615921020507812, 0.1122283935546875, 0.11829757690429688, 0.12436676025390625, 0.13043594360351562, 0.136505126953125, 0.14257431030273438, 0.14864349365234375, 0.15471267700195312, 0.1607818603515625, 0.16685104370117188, 0.17292022705078125, 0.17898941040039062, 0.18505859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 10.0, 4.0, 11.0, 7.0, 19.0, 16.0, 23.0, 27.0, 20.0, 22.0, 31.0, 30.0, 28.0, 33.0, 32.0, 31.0, 44.0, 31.0, 39.0, 1070.0, 44.0, 51.0, 33.0, 43.0, 40.0, 35.0, 29.0, 30.0, 34.0, 27.0, 19.0, 15.0, 15.0, 14.0, 9.0, 15.0, 12.0, 6.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.811279296875, -2.72412109375, -2.636962890625, -2.5498046875, -2.462646484375, -2.37548828125, -2.288330078125, -2.201171875, -2.114013671875, -2.02685546875, -1.939697265625, -1.8525390625, -1.765380859375, -1.67822265625, -1.591064453125, -1.50390625, -1.416748046875, -1.32958984375, -1.242431640625, -1.1552734375, -1.068115234375, -0.98095703125, -0.893798828125, -0.806640625, -0.719482421875, -0.63232421875, -0.545166015625, -0.4580078125, -0.370849609375, -0.28369140625, -0.196533203125, -0.109375, -0.022216796875, 0.06494140625, 0.152099609375, 0.2392578125, 0.326416015625, 0.41357421875, 0.500732421875, 0.587890625, 0.675048828125, 0.76220703125, 0.849365234375, 0.9365234375, 1.023681640625, 1.11083984375, 1.197998046875, 1.28515625, 1.372314453125, 1.45947265625, 1.546630859375, 1.6337890625, 1.720947265625, 1.80810546875, 1.895263671875, 1.982421875, 2.069580078125, 2.15673828125, 2.243896484375, 2.3310546875, 2.418212890625, 2.50537109375, 2.592529296875, 2.6796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 2.0, 10.0, 6.0, 14.0, 20.0, 36.0, 46.0, 58.0, 92.0, 107.0, 200.0, 283.0, 372.0, 569.0, 801.0, 1213.0, 1775.0, 2722.0, 4082.0, 6403.0, 9795.0, 15047.0, 23948.0, 37636.0, 62233.0, 113683.0, 520384.0, 1008119.0, 116570.0, 63608.0, 38210.0, 24113.0, 15651.0, 9924.0, 6619.0, 4262.0, 2808.0, 1921.0, 1191.0, 820.0, 547.0, 394.0, 261.0, 184.0, 124.0, 85.0, 64.0, 29.0, 30.0, 20.0, 19.0, 9.0, 10.0, 3.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.06573486328125, -0.06374406814575195, -0.061753273010253906, -0.05976247787475586, -0.05777168273925781, -0.055780887603759766, -0.05379009246826172, -0.05179929733276367, -0.049808502197265625, -0.04781770706176758, -0.04582691192626953, -0.043836116790771484, -0.04184532165527344, -0.03985452651977539, -0.037863731384277344, -0.0358729362487793, -0.03388214111328125, -0.0318913459777832, -0.029900550842285156, -0.02790975570678711, -0.025918960571289062, -0.023928165435791016, -0.02193737030029297, -0.019946575164794922, -0.017955780029296875, -0.015964984893798828, -0.013974189758300781, -0.011983394622802734, -0.009992599487304688, -0.00800180435180664, -0.006011009216308594, -0.004020214080810547, -0.0020294189453125, -3.8623809814453125e-05, 0.0019521713256835938, 0.003942966461181641, 0.0059337615966796875, 0.007924556732177734, 0.009915351867675781, 0.011906147003173828, 0.013896942138671875, 0.015887737274169922, 0.01787853240966797, 0.019869327545166016, 0.021860122680664062, 0.02385091781616211, 0.025841712951660156, 0.027832508087158203, 0.02982330322265625, 0.0318140983581543, 0.033804893493652344, 0.03579568862915039, 0.03778648376464844, 0.039777278900146484, 0.04176807403564453, 0.04375886917114258, 0.045749664306640625, 0.04774045944213867, 0.04973125457763672, 0.051722049713134766, 0.05371284484863281, 0.05570363998413086, 0.057694435119628906, 0.05968523025512695, 0.061676025390625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 6.0, 8.0, 18.0, 15.0, 19.0, 24.0, 19.0, 32.0, 30.0, 59.0, 29.0, 50.0, 66.0, 106.0, 79.0, 65.0, 50.0, 43.0, 44.0, 36.0, 34.0, 26.0, 22.0, 20.0, 12.0, 9.0, 12.0, 3.0, 7.0, 3.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007395744323730469, -0.0007162019610404968, -0.0006928294897079468, -0.0006694570183753967, -0.0006460845470428467, -0.0006227120757102966, -0.0005993396043777466, -0.0005759671330451965, -0.0005525946617126465, -0.0005292221903800964, -0.0005058497190475464, -0.00048247724771499634, -0.0004591047763824463, -0.00043573230504989624, -0.0004123598337173462, -0.00038898736238479614, -0.0003656148910522461, -0.00034224241971969604, -0.000318869948387146, -0.00029549747705459595, -0.0002721250057220459, -0.00024875253438949585, -0.0002253800630569458, -0.00020200759172439575, -0.0001786351203918457, -0.00015526264905929565, -0.0001318901777267456, -0.00010851770639419556, -8.514523506164551e-05, -6.177276372909546e-05, -3.840029239654541e-05, -1.5027821063995361e-05, 8.344650268554688e-06, 3.1717121601104736e-05, 5.5089592933654785e-05, 7.846206426620483e-05, 0.00010183453559875488, 0.00012520700693130493, 0.00014857947826385498, 0.00017195194959640503, 0.00019532442092895508, 0.00021869689226150513, 0.00024206936359405518, 0.0002654418349266052, 0.0002888143062591553, 0.0003121867775917053, 0.00033555924892425537, 0.0003589317202568054, 0.00038230419158935547, 0.0004056766629219055, 0.00042904913425445557, 0.0004524216055870056, 0.00047579407691955566, 0.0004991665482521057, 0.0005225390195846558, 0.0005459114909172058, 0.0005692839622497559, 0.0005926564335823059, 0.000616028904914856, 0.000639401376247406, 0.0006627738475799561, 0.0006861463189125061, 0.0007095187902450562, 0.0007328912615776062, 0.0007562637329101562]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 9.0, 2.0, 3.0, 1.0, 4.0, 6.0, 6.0, 10.0, 12.0, 29.0, 33.0, 39.0, 49.0, 74.0, 105.0, 185.0, 581.0, 4876.0, 102722.0, 905777.0, 31211.0, 2026.0, 346.0, 146.0, 75.0, 62.0, 40.0, 28.0, 20.0, 16.0, 11.0, 10.0, 4.0, 12.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.0151519775390625, -0.014683246612548828, -0.014214515686035156, -0.013745784759521484, -0.013277053833007812, -0.01280832290649414, -0.012339591979980469, -0.011870861053466797, -0.011402130126953125, -0.010933399200439453, -0.010464668273925781, -0.00999593734741211, -0.009527206420898438, -0.009058475494384766, -0.008589744567871094, -0.008121013641357422, -0.00765228271484375, -0.007183551788330078, -0.006714820861816406, -0.006246089935302734, -0.0057773590087890625, -0.005308628082275391, -0.004839897155761719, -0.004371166229248047, -0.003902435302734375, -0.003433704376220703, -0.0029649734497070312, -0.0024962425231933594, -0.0020275115966796875, -0.0015587806701660156, -0.0010900497436523438, -0.0006213188171386719, -0.000152587890625, 0.0003161430358886719, 0.0007848739624023438, 0.0012536048889160156, 0.0017223358154296875, 0.0021910667419433594, 0.0026597976684570312, 0.003128528594970703, 0.003597259521484375, 0.004065990447998047, 0.004534721374511719, 0.005003452301025391, 0.0054721832275390625, 0.005940914154052734, 0.006409645080566406, 0.006878376007080078, 0.00734710693359375, 0.007815837860107422, 0.008284568786621094, 0.008753299713134766, 0.009222030639648438, 0.00969076156616211, 0.010159492492675781, 0.010628223419189453, 0.011096954345703125, 0.011565685272216797, 0.012034416198730469, 0.01250314712524414, 0.012971878051757812, 0.013440608978271484, 0.013909339904785156, 0.014378070831298828, 0.0148468017578125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 58.0, 937.0, 21.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020125017035752535, -0.0014199453871697187, -0.0008273891871795058, -0.0002348329871892929, 0.00035772332921624184, 0.0009502796456217766, 0.0015428357291966677, 0.0021353920456022024, 0.002727948362007737, 0.003320504678413272, 0.003913060761988163, 0.004505617078393698, 0.0050981733947992325, 0.005690729711204767, 0.006283286027610302, 0.006875841878354549, 0.0074683986604213715, 0.008060954511165619, 0.008653511293232441, 0.009246067143976688, 0.00983862392604351, 0.010431179776787758, 0.011023735627532005, 0.011616292409598827, 0.012208848260343075, 0.012801404111087322, 0.013393960893154144, 0.013986516743898392, 0.014579073525965214, 0.015171629376709461, 0.015764186158776283, 0.01635674200952053, 0.016949297860264778, 0.017541853711009026, 0.018134409561753273, 0.01872696727514267, 0.019319523125886917, 0.019912078976631165, 0.020504634827375412, 0.02109719067811966, 0.021689748391509056, 0.022282304242253304, 0.02287486009299755, 0.023467417806386948, 0.024059973657131195, 0.024652529507875443, 0.02524508535861969, 0.025837641209363937, 0.026430197060108185, 0.027022752910852432, 0.02761530876159668, 0.028207866474986076, 0.028800422325730324, 0.02939297817647457, 0.02998553402721882, 0.030578091740608215, 0.031170647591352463, 0.03176320344209671, 0.03235575929284096, 0.032948315143585205, 0.03354087099432945, 0.034133430570364, 0.034725986421108246, 0.03531854227185249, 0.03591109812259674]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 6.0, 11.0, 22.0, 25.0, 40.0, 59.0, 79.0, 65.0, 105.0, 103.0, 84.0, 94.0, 88.0, 64.0, 49.0, 52.0, 21.0, 15.0, 7.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018720626831054688, -0.0018301485106348991, -0.0017882343381643295, -0.00174632016569376, -0.0017044059932231903, -0.0016624918207526207, -0.001620577648282051, -0.0015786634758114815, -0.0015367493033409119, -0.0014948351308703423, -0.0014529209583997726, -0.001411006785929203, -0.0013690926134586334, -0.0013271784409880638, -0.0012852642685174942, -0.0012433500960469246, -0.001201435923576355, -0.0011595217511057854, -0.0011176075786352158, -0.0010756934061646461, -0.0010337792336940765, -0.000991865061223507, -0.0009499508887529373, -0.0009080367162823677, -0.0008661225438117981, -0.0008242083713412285, -0.0007822941988706589, -0.0007403800264000893, -0.0006984658539295197, -0.00065655168145895, -0.0006146375089883804, -0.0005727233365178108, -0.0005308091640472412, -0.0004888949915766716, -0.000446980819106102, -0.0004050666466355324, -0.00036315247416496277, -0.00032123830169439316, -0.00027932412922382355, -0.00023740995675325394, -0.00019549578428268433, -0.00015358161181211472, -0.0001116674393415451, -6.97532668709755e-05, -2.7839094400405884e-05, 1.4075078070163727e-05, 5.598925054073334e-05, 9.790342301130295e-05, 0.00013981759548187256, 0.00018173176795244217, 0.00022364594042301178, 0.0002655601128935814, 0.000307474285364151, 0.0003493884578347206, 0.0003913026303052902, 0.00043321680277585983, 0.00047513097524642944, 0.000517045147716999, 0.0005589593201875687, 0.0006008734926581383, 0.0006427876651287079, 0.0006847018375992775, 0.0007266160100698471, 0.0007685301825404167, 0.0008104443550109863]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 5.0, 7.0, 4.0, 11.0, 5.0, 10.0, 9.0, 14.0, 14.0, 18.0, 18.0, 28.0, 26.0, 30.0, 30.0, 37.0, 37.0, 39.0, 38.0, 54.0, 38.0, 39.0, 44.0, 47.0, 38.0, 41.0, 38.0, 33.0, 36.0, 35.0, 28.0, 28.0, 23.0, 13.0, 15.0, 17.0, 13.0, 9.0, 8.0, 5.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.5078125, -3.403350830078125, -3.29888916015625, -3.194427490234375, -3.0899658203125, -2.985504150390625, -2.88104248046875, -2.776580810546875, -2.672119140625, -2.567657470703125, -2.46319580078125, -2.358734130859375, -2.2542724609375, -2.149810791015625, -2.04534912109375, -1.940887451171875, -1.83642578125, -1.731964111328125, -1.62750244140625, -1.523040771484375, -1.4185791015625, -1.314117431640625, -1.20965576171875, -1.105194091796875, -1.000732421875, -0.896270751953125, -0.79180908203125, -0.687347412109375, -0.5828857421875, -0.478424072265625, -0.37396240234375, -0.269500732421875, -0.1650390625, -0.060577392578125, 0.04388427734375, 0.148345947265625, 0.2528076171875, 0.357269287109375, 0.46173095703125, 0.566192626953125, 0.670654296875, 0.775115966796875, 0.87957763671875, 0.984039306640625, 1.0885009765625, 1.192962646484375, 1.29742431640625, 1.401885986328125, 1.50634765625, 1.610809326171875, 1.71527099609375, 1.819732666015625, 1.9241943359375, 2.028656005859375, 2.13311767578125, 2.237579345703125, 2.342041015625, 2.446502685546875, 2.55096435546875, 2.655426025390625, 2.7598876953125, 2.864349365234375, 2.96881103515625, 3.073272705078125, 3.177734375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 13.0, 10.0, 15.0, 25.0, 27.0, 56.0, 80.0, 112.0, 186.0, 278.0, 418.0, 680.0, 1120.0, 1896.0, 3546.0, 6606.0, 14382.0, 34509.0, 93444.0, 308098.0, 389377.0, 117773.0, 41652.0, 16943.0, 7741.0, 3997.0, 2230.0, 1212.0, 776.0, 471.0, 304.0, 183.0, 121.0, 90.0, 61.0, 40.0, 30.0, 15.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.84765625, -6.62750244140625, -6.4073486328125, -6.18719482421875, -5.967041015625, -5.74688720703125, -5.5267333984375, -5.30657958984375, -5.08642578125, -4.86627197265625, -4.6461181640625, -4.42596435546875, -4.205810546875, -3.98565673828125, -3.7655029296875, -3.54534912109375, -3.3251953125, -3.10504150390625, -2.8848876953125, -2.66473388671875, -2.444580078125, -2.22442626953125, -2.0042724609375, -1.78411865234375, -1.56396484375, -1.34381103515625, -1.1236572265625, -0.90350341796875, -0.683349609375, -0.46319580078125, -0.2430419921875, -0.02288818359375, 0.197265625, 0.41741943359375, 0.6375732421875, 0.85772705078125, 1.077880859375, 1.29803466796875, 1.5181884765625, 1.73834228515625, 1.95849609375, 2.17864990234375, 2.3988037109375, 2.61895751953125, 2.839111328125, 3.05926513671875, 3.2794189453125, 3.49957275390625, 3.7197265625, 3.93988037109375, 4.1600341796875, 4.38018798828125, 4.600341796875, 4.82049560546875, 5.0406494140625, 5.26080322265625, 5.48095703125, 5.70111083984375, 5.9212646484375, 6.14141845703125, 6.361572265625, 6.58172607421875, 6.8018798828125, 7.02203369140625, 7.2421875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 7.0, 10.0, 6.0, 9.0, 8.0, 14.0, 17.0, 12.0, 24.0, 22.0, 29.0, 37.0, 20.0, 45.0, 41.0, 52.0, 61.0, 98.0, 135.0, 200.0, 1294.0, 218.0, 152.0, 94.0, 72.0, 55.0, 49.0, 41.0, 40.0, 30.0, 26.0, 29.0, 23.0, 16.0, 12.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-11.1796875, -10.85693359375, -10.5341796875, -10.21142578125, -9.888671875, -9.56591796875, -9.2431640625, -8.92041015625, -8.59765625, -8.27490234375, -7.9521484375, -7.62939453125, -7.306640625, -6.98388671875, -6.6611328125, -6.33837890625, -6.015625, -5.69287109375, -5.3701171875, -5.04736328125, -4.724609375, -4.40185546875, -4.0791015625, -3.75634765625, -3.43359375, -3.11083984375, -2.7880859375, -2.46533203125, -2.142578125, -1.81982421875, -1.4970703125, -1.17431640625, -0.8515625, -0.52880859375, -0.2060546875, 0.11669921875, 0.439453125, 0.76220703125, 1.0849609375, 1.40771484375, 1.73046875, 2.05322265625, 2.3759765625, 2.69873046875, 3.021484375, 3.34423828125, 3.6669921875, 3.98974609375, 4.3125, 4.63525390625, 4.9580078125, 5.28076171875, 5.603515625, 5.92626953125, 6.2490234375, 6.57177734375, 6.89453125, 7.21728515625, 7.5400390625, 7.86279296875, 8.185546875, 8.50830078125, 8.8310546875, 9.15380859375, 9.4765625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 4.0, 8.0, 9.0, 7.0, 4.0, 11.0, 17.0, 20.0, 23.0, 40.0, 56.0, 78.0, 102.0, 142.0, 233.0, 433.0, 933.0, 2373.0, 7585.0, 43016.0, 724148.0, 2235220.0, 110875.0, 13990.0, 3539.0, 1356.0, 566.0, 278.0, 183.0, 103.0, 82.0, 67.0, 44.0, 39.0, 25.0, 19.0, 20.0, 11.0, 9.0, 6.0, 10.0, 3.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.115966796875, -15.54443359375, -14.972900390625, -14.4013671875, -13.829833984375, -13.25830078125, -12.686767578125, -12.115234375, -11.543701171875, -10.97216796875, -10.400634765625, -9.8291015625, -9.257568359375, -8.68603515625, -8.114501953125, -7.54296875, -6.971435546875, -6.39990234375, -5.828369140625, -5.2568359375, -4.685302734375, -4.11376953125, -3.542236328125, -2.970703125, -2.399169921875, -1.82763671875, -1.256103515625, -0.6845703125, -0.113037109375, 0.45849609375, 1.030029296875, 1.6015625, 2.173095703125, 2.74462890625, 3.316162109375, 3.8876953125, 4.459228515625, 5.03076171875, 5.602294921875, 6.173828125, 6.745361328125, 7.31689453125, 7.888427734375, 8.4599609375, 9.031494140625, 9.60302734375, 10.174560546875, 10.74609375, 11.317626953125, 11.88916015625, 12.460693359375, 13.0322265625, 13.603759765625, 14.17529296875, 14.746826171875, 15.318359375, 15.889892578125, 16.46142578125, 17.032958984375, 17.6044921875, 18.176025390625, 18.74755859375, 19.319091796875, 19.890625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 12.0, 34.0, 75.0, 212.0, 287.0, 246.0, 97.0, 34.0, 16.0, 3.0, 3.0], "bins": [-139.24452209472656, -136.82455444335938, -134.40460205078125, -131.98464965820312, -129.56468200683594, -127.14472198486328, -124.72476196289062, -122.30480194091797, -119.88484191894531, -117.46488189697266, -115.044921875, -112.62496185302734, -110.20500183105469, -107.78504180908203, -105.36508178710938, -102.94512176513672, -100.52516174316406, -98.1052017211914, -95.68524169921875, -93.2652816772461, -90.84532165527344, -88.42536163330078, -86.00540161132812, -83.58544158935547, -81.16548156738281, -78.74552154541016, -76.3255615234375, -73.90560150146484, -71.48564147949219, -69.06568145751953, -66.64572143554688, -64.22576141357422, -61.80579376220703, -59.385833740234375, -56.96587371826172, -54.54591369628906, -52.125953674316406, -49.70599365234375, -47.286033630371094, -44.86607360839844, -42.44611358642578, -40.026153564453125, -37.60619354248047, -35.18623352050781, -32.766273498535156, -30.3463134765625, -27.926353454589844, -25.506393432617188, -23.086435317993164, -20.666475296020508, -18.24651527404785, -15.826555252075195, -13.406595230102539, -10.986635208129883, -8.566675186157227, -6.14671516418457, -3.726755142211914, -1.3067951202392578, 1.1131649017333984, 3.5331249237060547, 5.953084945678711, 8.373044967651367, 10.793004989624023, 13.21296501159668, 15.632925033569336]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 8.0, 4.0, 13.0, 13.0, 22.0, 20.0, 23.0, 22.0, 31.0, 23.0, 29.0, 30.0, 37.0, 44.0, 48.0, 50.0, 39.0, 39.0, 48.0, 42.0, 35.0, 37.0, 34.0, 43.0, 36.0, 31.0, 25.0, 28.0, 15.0, 22.0, 17.0, 19.0, 17.0, 14.0, 5.0, 7.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.509851455688477, -27.478479385375977, -26.447107315063477, -25.415735244750977, -24.384363174438477, -23.352991104125977, -22.321619033813477, -21.290246963500977, -20.258874893188477, -19.227502822875977, -18.196130752563477, -17.164758682250977, -16.133386611938477, -15.102014541625977, -14.070642471313477, -13.039270401000977, -12.007898330688477, -10.976526260375977, -9.945154190063477, -8.913782119750977, -7.882410049438477, -6.851037979125977, -5.819665908813477, -4.788293838500977, -3.7569217681884766, -2.7255496978759766, -1.6941776275634766, -0.6628055572509766, 0.36856651306152344, 1.3999385833740234, 2.4313106536865234, 3.4626827239990234, 4.494052886962891, 5.525424957275391, 6.556797027587891, 7.588169097900391, 8.61954116821289, 9.65091323852539, 10.68228530883789, 11.71365737915039, 12.74502944946289, 13.77640151977539, 14.80777359008789, 15.83914566040039, 16.87051773071289, 17.90188980102539, 18.93326187133789, 19.96463394165039, 20.99600601196289, 22.02737808227539, 23.05875015258789, 24.09012222290039, 25.12149429321289, 26.15286636352539, 27.18423843383789, 28.21561050415039, 29.24698257446289, 30.27835464477539, 31.30972671508789, 32.34109878540039, 33.37247085571289, 34.40384292602539, 35.43521499633789, 36.46658706665039, 37.49795913696289]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 4.0, 8.0, 5.0, 10.0, 6.0, 13.0, 18.0, 17.0, 17.0, 21.0, 22.0, 32.0, 33.0, 27.0, 32.0, 28.0, 44.0, 47.0, 44.0, 34.0, 46.0, 49.0, 39.0, 39.0, 44.0, 49.0, 31.0, 28.0, 28.0, 25.0, 28.0, 17.0, 25.0, 9.0, 9.0, 12.0, 18.0, 2.0, 9.0, 4.0, 3.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5546875, -3.44476318359375, -3.3348388671875, -3.22491455078125, -3.114990234375, -3.00506591796875, -2.8951416015625, -2.78521728515625, -2.67529296875, -2.56536865234375, -2.4554443359375, -2.34552001953125, -2.235595703125, -2.12567138671875, -2.0157470703125, -1.90582275390625, -1.7958984375, -1.68597412109375, -1.5760498046875, -1.46612548828125, -1.356201171875, -1.24627685546875, -1.1363525390625, -1.02642822265625, -0.91650390625, -0.80657958984375, -0.6966552734375, -0.58673095703125, -0.476806640625, -0.36688232421875, -0.2569580078125, -0.14703369140625, -0.037109375, 0.07281494140625, 0.1827392578125, 0.29266357421875, 0.402587890625, 0.51251220703125, 0.6224365234375, 0.73236083984375, 0.84228515625, 0.95220947265625, 1.0621337890625, 1.17205810546875, 1.281982421875, 1.39190673828125, 1.5018310546875, 1.61175537109375, 1.7216796875, 1.83160400390625, 1.9415283203125, 2.05145263671875, 2.161376953125, 2.27130126953125, 2.3812255859375, 2.49114990234375, 2.60107421875, 2.71099853515625, 2.8209228515625, 2.93084716796875, 3.040771484375, 3.15069580078125, 3.2606201171875, 3.37054443359375, 3.48046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 16.0, 24.0, 42.0, 70.0, 90.0, 144.0, 246.0, 448.0, 914.0, 1681.0, 3807.0, 9888.0, 37363.0, 320521.0, 2743810.0, 967320.0, 80734.0, 16426.0, 5712.0, 2459.0, 1115.0, 587.0, 292.0, 205.0, 105.0, 77.0, 54.0, 43.0, 20.0, 17.0, 10.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.3394775390625, -9.991455078125, -9.6434326171875, -9.29541015625, -8.9473876953125, -8.599365234375, -8.2513427734375, -7.9033203125, -7.5552978515625, -7.207275390625, -6.8592529296875, -6.51123046875, -6.1632080078125, -5.815185546875, -5.4671630859375, -5.119140625, -4.7711181640625, -4.423095703125, -4.0750732421875, -3.72705078125, -3.3790283203125, -3.031005859375, -2.6829833984375, -2.3349609375, -1.9869384765625, -1.638916015625, -1.2908935546875, -0.94287109375, -0.5948486328125, -0.246826171875, 0.1011962890625, 0.44921875, 0.7972412109375, 1.145263671875, 1.4932861328125, 1.84130859375, 2.1893310546875, 2.537353515625, 2.8853759765625, 3.2333984375, 3.5814208984375, 3.929443359375, 4.2774658203125, 4.62548828125, 4.9735107421875, 5.321533203125, 5.6695556640625, 6.017578125, 6.3656005859375, 6.713623046875, 7.0616455078125, 7.40966796875, 7.7576904296875, 8.105712890625, 8.4537353515625, 8.8017578125, 9.1497802734375, 9.497802734375, 9.8458251953125, 10.19384765625, 10.5418701171875, 10.889892578125, 11.2379150390625, 11.5859375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 9.0, 10.0, 5.0, 18.0, 23.0, 11.0, 30.0, 33.0, 49.0, 72.0, 98.0, 147.0, 220.0, 312.0, 453.0, 544.0, 564.0, 417.0, 343.0, 228.0, 145.0, 94.0, 74.0, 43.0, 37.0, 24.0, 18.0, 12.0, 12.0, 4.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.6796875, -8.416259765625, -8.15283203125, -7.889404296875, -7.6259765625, -7.362548828125, -7.09912109375, -6.835693359375, -6.572265625, -6.308837890625, -6.04541015625, -5.781982421875, -5.5185546875, -5.255126953125, -4.99169921875, -4.728271484375, -4.46484375, -4.201416015625, -3.93798828125, -3.674560546875, -3.4111328125, -3.147705078125, -2.88427734375, -2.620849609375, -2.357421875, -2.093994140625, -1.83056640625, -1.567138671875, -1.3037109375, -1.040283203125, -0.77685546875, -0.513427734375, -0.25, 0.013427734375, 0.27685546875, 0.540283203125, 0.8037109375, 1.067138671875, 1.33056640625, 1.593994140625, 1.857421875, 2.120849609375, 2.38427734375, 2.647705078125, 2.9111328125, 3.174560546875, 3.43798828125, 3.701416015625, 3.96484375, 4.228271484375, 4.49169921875, 4.755126953125, 5.0185546875, 5.281982421875, 5.54541015625, 5.808837890625, 6.072265625, 6.335693359375, 6.59912109375, 6.862548828125, 7.1259765625, 7.389404296875, 7.65283203125, 7.916259765625, 8.1796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 12.0, 14.0, 20.0, 27.0, 45.0, 42.0, 97.0, 143.0, 252.0, 604.0, 2460.0, 26530.0, 3408415.0, 742719.0, 10380.0, 1415.0, 462.0, 204.0, 121.0, 79.0, 56.0, 36.0, 26.0, 18.0, 23.0, 17.0, 6.0, 6.0, 12.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.75, -36.564453125, -35.37890625, -34.193359375, -33.0078125, -31.822265625, -30.63671875, -29.451171875, -28.265625, -27.080078125, -25.89453125, -24.708984375, -23.5234375, -22.337890625, -21.15234375, -19.966796875, -18.78125, -17.595703125, -16.41015625, -15.224609375, -14.0390625, -12.853515625, -11.66796875, -10.482421875, -9.296875, -8.111328125, -6.92578125, -5.740234375, -4.5546875, -3.369140625, -2.18359375, -0.998046875, 0.1875, 1.373046875, 2.55859375, 3.744140625, 4.9296875, 6.115234375, 7.30078125, 8.486328125, 9.671875, 10.857421875, 12.04296875, 13.228515625, 14.4140625, 15.599609375, 16.78515625, 17.970703125, 19.15625, 20.341796875, 21.52734375, 22.712890625, 23.8984375, 25.083984375, 26.26953125, 27.455078125, 28.640625, 29.826171875, 31.01171875, 32.197265625, 33.3828125, 34.568359375, 35.75390625, 36.939453125, 38.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 2.0, 6.0, 16.0, 21.0, 23.0, 36.0, 58.0, 53.0, 68.0, 73.0, 78.0, 89.0, 99.0, 85.0, 77.0, 54.0, 39.0, 28.0, 30.0, 20.0, 12.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.624752044677734, -40.56349182128906, -39.502227783203125, -38.44096755981445, -37.37970733642578, -36.31844711303711, -35.25718307495117, -34.1959228515625, -33.13466262817383, -32.073402404785156, -31.01214027404785, -29.950878143310547, -28.889617919921875, -27.82835578918457, -26.767093658447266, -25.705833435058594, -24.64457130432129, -23.583309173583984, -22.522048950195312, -21.460786819458008, -20.399526596069336, -19.33826446533203, -18.27700424194336, -17.215742111206055, -16.15447998046875, -15.093218803405762, -14.031957626342773, -12.970695495605469, -11.909435272216797, -10.848173141479492, -9.786911964416504, -8.725650787353516, -7.664388656616211, -6.603127479553223, -5.541866302490234, -4.480604648590088, -3.4193434715270996, -2.3580822944641113, -1.2968206405639648, -0.23555946350097656, 0.8257017135620117, 1.8869630098342896, 2.9482243061065674, 4.009485721588135, 5.070746898651123, 6.132008075714111, 7.193269729614258, 8.254530906677246, 9.315792083740234, 10.377053260803223, 11.438314437866211, 12.499576568603516, 13.560836791992188, 14.622098922729492, 15.68336009979248, 16.74462127685547, 17.80588150024414, 18.867143630981445, 19.928403854370117, 20.989665985107422, 22.050926208496094, 23.1121883392334, 24.173450469970703, 25.234710693359375, 26.29597282409668]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 0.0, 6.0, 6.0, 8.0, 7.0, 12.0, 10.0, 9.0, 21.0, 20.0, 35.0, 17.0, 29.0, 27.0, 39.0, 40.0, 39.0, 47.0, 35.0, 38.0, 30.0, 39.0, 41.0, 41.0, 44.0, 40.0, 40.0, 34.0, 27.0, 28.0, 29.0, 28.0, 32.0, 23.0, 11.0, 17.0, 10.0, 7.0, 5.0, 12.0, 9.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.379417419433594, -28.551237106323242, -27.723058700561523, -26.894878387451172, -26.066699981689453, -25.2385196685791, -24.41033935546875, -23.58216094970703, -22.75398063659668, -21.925800323486328, -21.09762191772461, -20.269441604614258, -19.441261291503906, -18.613082885742188, -17.784902572631836, -16.956722259521484, -16.128543853759766, -15.30036449432373, -14.472185134887695, -13.644004821777344, -12.815825462341309, -11.987646102905273, -11.159465789794922, -10.331286430358887, -9.503107070922852, -8.674927711486816, -7.846747875213623, -7.01856803894043, -6.1903886795043945, -5.362209320068359, -4.534029483795166, -3.7058496475219727, -2.8776721954345703, -2.049492597579956, -1.2213129997253418, -0.39313340187072754, 0.4350461959838867, 1.2632255554199219, 2.0914053916931152, 2.9195852279663086, 3.7477645874023438, 4.575943946838379, 5.404123783111572, 6.232303619384766, 7.060482978820801, 7.888662338256836, 8.716842651367188, 9.545022010803223, 10.373201370239258, 11.201380729675293, 12.029560089111328, 12.85774040222168, 13.685919761657715, 14.51409912109375, 15.342279434204102, 16.170459747314453, 16.998638153076172, 17.826818466186523, 18.654996871948242, 19.483177185058594, 20.311355590820312, 21.139535903930664, 21.967716217041016, 22.795894622802734, 23.624074935913086]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 7.0, 9.0, 12.0, 12.0, 13.0, 19.0, 21.0, 23.0, 19.0, 25.0, 29.0, 29.0, 37.0, 33.0, 36.0, 42.0, 41.0, 53.0, 38.0, 49.0, 46.0, 43.0, 49.0, 32.0, 27.0, 25.0, 29.0, 28.0, 23.0, 22.0, 21.0, 13.0, 12.0, 14.0, 10.0, 14.0, 3.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.30078125, -3.192108154296875, -3.08343505859375, -2.974761962890625, -2.8660888671875, -2.757415771484375, -2.64874267578125, -2.540069580078125, -2.431396484375, -2.322723388671875, -2.21405029296875, -2.105377197265625, -1.9967041015625, -1.888031005859375, -1.77935791015625, -1.670684814453125, -1.56201171875, -1.453338623046875, -1.34466552734375, -1.235992431640625, -1.1273193359375, -1.018646240234375, -0.90997314453125, -0.801300048828125, -0.692626953125, -0.583953857421875, -0.47528076171875, -0.366607666015625, -0.2579345703125, -0.149261474609375, -0.04058837890625, 0.068084716796875, 0.1767578125, 0.285430908203125, 0.39410400390625, 0.502777099609375, 0.6114501953125, 0.720123291015625, 0.82879638671875, 0.937469482421875, 1.046142578125, 1.154815673828125, 1.26348876953125, 1.372161865234375, 1.4808349609375, 1.589508056640625, 1.69818115234375, 1.806854248046875, 1.91552734375, 2.024200439453125, 2.13287353515625, 2.241546630859375, 2.3502197265625, 2.458892822265625, 2.56756591796875, 2.676239013671875, 2.784912109375, 2.893585205078125, 3.00225830078125, 3.110931396484375, 3.2196044921875, 3.328277587890625, 3.43695068359375, 3.545623779296875, 3.654296875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 11.0, 15.0, 29.0, 33.0, 53.0, 83.0, 120.0, 162.0, 228.0, 338.0, 503.0, 715.0, 1068.0, 1619.0, 2398.0, 3720.0, 5652.0, 8930.0, 14046.0, 22945.0, 38002.0, 66224.0, 122581.0, 314410.0, 212692.0, 94900.0, 53442.0, 31328.0, 18958.0, 11664.0, 7432.0, 4784.0, 3113.0, 2068.0, 1376.0, 927.0, 584.0, 429.0, 323.0, 212.0, 135.0, 84.0, 76.0, 54.0, 30.0, 18.0, 14.0, 10.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1890869140625, -0.18294906616210938, -0.17681121826171875, -0.17067337036132812, -0.1645355224609375, -0.15839767456054688, -0.15225982666015625, -0.14612197875976562, -0.139984130859375, -0.13384628295898438, -0.12770843505859375, -0.12157058715820312, -0.1154327392578125, -0.10929489135742188, -0.10315704345703125, -0.09701919555664062, -0.09088134765625, -0.08474349975585938, -0.07860565185546875, -0.07246780395507812, -0.0663299560546875, -0.060192108154296875, -0.05405426025390625, -0.047916412353515625, -0.041778564453125, -0.035640716552734375, -0.02950286865234375, -0.023365020751953125, -0.0172271728515625, -0.011089324951171875, -0.00495147705078125, 0.001186370849609375, 0.00732421875, 0.013462066650390625, 0.01959991455078125, 0.025737762451171875, 0.0318756103515625, 0.038013458251953125, 0.04415130615234375, 0.050289154052734375, 0.056427001953125, 0.06256484985351562, 0.06870269775390625, 0.07484054565429688, 0.0809783935546875, 0.08711624145507812, 0.09325408935546875, 0.09939193725585938, 0.10552978515625, 0.11166763305664062, 0.11780548095703125, 0.12394332885742188, 0.1300811767578125, 0.13621902465820312, 0.14235687255859375, 0.14849472045898438, 0.154632568359375, 0.16077041625976562, 0.16690826416015625, 0.17304611206054688, 0.1791839599609375, 0.18532180786132812, 0.19145965576171875, 0.19759750366210938, 0.2037353515625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 6.0, 5.0, 10.0, 8.0, 9.0, 11.0, 19.0, 17.0, 15.0, 9.0, 19.0, 24.0, 28.0, 32.0, 32.0, 30.0, 41.0, 39.0, 33.0, 44.0, 31.0, 44.0, 1056.0, 33.0, 31.0, 40.0, 43.0, 31.0, 33.0, 30.0, 33.0, 27.0, 18.0, 26.0, 17.0, 15.0, 12.0, 12.0, 10.0, 8.0, 9.0, 8.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.90234375, -2.815399169921875, -2.72845458984375, -2.641510009765625, -2.5545654296875, -2.467620849609375, -2.38067626953125, -2.293731689453125, -2.206787109375, -2.119842529296875, -2.03289794921875, -1.945953369140625, -1.8590087890625, -1.772064208984375, -1.68511962890625, -1.598175048828125, -1.51123046875, -1.424285888671875, -1.33734130859375, -1.250396728515625, -1.1634521484375, -1.076507568359375, -0.98956298828125, -0.902618408203125, -0.815673828125, -0.728729248046875, -0.64178466796875, -0.554840087890625, -0.4678955078125, -0.380950927734375, -0.29400634765625, -0.207061767578125, -0.1201171875, -0.033172607421875, 0.05377197265625, 0.140716552734375, 0.2276611328125, 0.314605712890625, 0.40155029296875, 0.488494873046875, 0.575439453125, 0.662384033203125, 0.74932861328125, 0.836273193359375, 0.9232177734375, 1.010162353515625, 1.09710693359375, 1.184051513671875, 1.27099609375, 1.357940673828125, 1.44488525390625, 1.531829833984375, 1.6187744140625, 1.705718994140625, 1.79266357421875, 1.879608154296875, 1.966552734375, 2.053497314453125, 2.14044189453125, 2.227386474609375, 2.3143310546875, 2.401275634765625, 2.48822021484375, 2.575164794921875, 2.662109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 17.0, 20.0, 40.0, 44.0, 69.0, 97.0, 166.0, 212.0, 330.0, 484.0, 728.0, 1118.0, 1618.0, 2386.0, 3736.0, 5950.0, 9205.0, 14501.0, 23140.0, 38395.0, 63919.0, 120484.0, 1282399.0, 273595.0, 104591.0, 56894.0, 34110.0, 21072.0, 13216.0, 8484.0, 5481.0, 3542.0, 2297.0, 1486.0, 1039.0, 670.0, 495.0, 313.0, 224.0, 161.0, 110.0, 93.0, 51.0, 45.0, 28.0, 12.0, 13.0, 13.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0692138671875, -0.06697368621826172, -0.06473350524902344, -0.062493324279785156, -0.060253143310546875, -0.058012962341308594, -0.05577278137207031, -0.05353260040283203, -0.05129241943359375, -0.04905223846435547, -0.04681205749511719, -0.044571876525878906, -0.042331695556640625, -0.040091514587402344, -0.03785133361816406, -0.03561115264892578, -0.0333709716796875, -0.03113079071044922, -0.028890609741210938, -0.026650428771972656, -0.024410247802734375, -0.022170066833496094, -0.019929885864257812, -0.01768970489501953, -0.01544952392578125, -0.013209342956542969, -0.010969161987304688, -0.008728981018066406, -0.006488800048828125, -0.004248619079589844, -0.0020084381103515625, 0.00023174285888671875, 0.002471923828125, 0.004712104797363281, 0.0069522857666015625, 0.009192466735839844, 0.011432647705078125, 0.013672828674316406, 0.015913009643554688, 0.01815319061279297, 0.02039337158203125, 0.02263355255126953, 0.024873733520507812, 0.027113914489746094, 0.029354095458984375, 0.031594276428222656, 0.03383445739746094, 0.03607463836669922, 0.0383148193359375, 0.04055500030517578, 0.04279518127441406, 0.045035362243652344, 0.047275543212890625, 0.049515724182128906, 0.05175590515136719, 0.05399608612060547, 0.05623626708984375, 0.05847644805908203, 0.06071662902832031, 0.0629568099975586, 0.06519699096679688, 0.06743717193603516, 0.06967735290527344, 0.07191753387451172, 0.07415771484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 2.0, 7.0, 14.0, 13.0, 17.0, 17.0, 14.0, 17.0, 24.0, 27.0, 38.0, 27.0, 39.0, 42.0, 51.0, 44.0, 62.0, 48.0, 72.0, 55.0, 50.0, 37.0, 43.0, 33.0, 35.0, 25.0, 25.0, 25.0, 15.0, 11.0, 14.0, 9.0, 15.0, 7.0, 4.0, 2.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0008521080017089844, -0.0008273199200630188, -0.0008025318384170532, -0.0007777437567710876, -0.0007529556751251221, -0.0007281675934791565, -0.0007033795118331909, -0.0006785914301872253, -0.0006538033485412598, -0.0006290152668952942, -0.0006042271852493286, -0.000579439103603363, -0.0005546510219573975, -0.0005298629403114319, -0.0005050748586654663, -0.00048028677701950073, -0.00045549869537353516, -0.0004307106137275696, -0.000405922532081604, -0.00038113445043563843, -0.00035634636878967285, -0.0003315582871437073, -0.0003067702054977417, -0.0002819821238517761, -0.00025719404220581055, -0.00023240596055984497, -0.0002076178789138794, -0.00018282979726791382, -0.00015804171562194824, -0.00013325363397598267, -0.00010846555233001709, -8.367747068405151e-05, -5.888938903808594e-05, -3.410130739212036e-05, -9.313225746154785e-06, 1.547485589981079e-05, 4.026293754577637e-05, 6.505101919174194e-05, 8.983910083770752e-05, 0.0001146271824836731, 0.00013941526412963867, 0.00016420334577560425, 0.00018899142742156982, 0.0002137795090675354, 0.00023856759071350098, 0.00026335567235946655, 0.00028814375400543213, 0.0003129318356513977, 0.0003377199172973633, 0.00036250799894332886, 0.00038729608058929443, 0.00041208416223526, 0.0004368722438812256, 0.00046166032552719116, 0.00048644840717315674, 0.0005112364888191223, 0.0005360245704650879, 0.0005608126521110535, 0.000585600733757019, 0.0006103888154029846, 0.0006351768970489502, 0.0006599649786949158, 0.0006847530603408813, 0.0007095411419868469, 0.0007343292236328125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 5.0, 11.0, 10.0, 8.0, 8.0, 15.0, 21.0, 23.0, 27.0, 33.0, 39.0, 42.0, 92.0, 138.0, 386.0, 2134.0, 34680.0, 934023.0, 72376.0, 3417.0, 523.0, 165.0, 98.0, 52.0, 49.0, 28.0, 31.0, 14.0, 16.0, 15.0, 13.0, 18.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01458740234375, -0.01409459114074707, -0.01360177993774414, -0.013108968734741211, -0.012616157531738281, -0.012123346328735352, -0.011630535125732422, -0.011137723922729492, -0.010644912719726562, -0.010152101516723633, -0.009659290313720703, -0.009166479110717773, -0.008673667907714844, -0.008180856704711914, -0.007688045501708984, -0.007195234298706055, -0.006702423095703125, -0.006209611892700195, -0.005716800689697266, -0.005223989486694336, -0.004731178283691406, -0.0042383670806884766, -0.003745555877685547, -0.003252744674682617, -0.0027599334716796875, -0.002267122268676758, -0.0017743110656738281, -0.0012814998626708984, -0.0007886886596679688, -0.00029587745666503906, 0.00019693374633789062, 0.0006897449493408203, 0.00118255615234375, 0.0016753673553466797, 0.0021681785583496094, 0.002660989761352539, 0.0031538009643554688, 0.0036466121673583984, 0.004139423370361328, 0.004632234573364258, 0.0051250457763671875, 0.005617856979370117, 0.006110668182373047, 0.0066034793853759766, 0.007096290588378906, 0.007589101791381836, 0.008081912994384766, 0.008574724197387695, 0.009067535400390625, 0.009560346603393555, 0.010053157806396484, 0.010545969009399414, 0.011038780212402344, 0.011531591415405273, 0.012024402618408203, 0.012517213821411133, 0.013010025024414062, 0.013502836227416992, 0.013995647430419922, 0.014488458633422852, 0.014981269836425781, 0.015474081039428711, 0.01596689224243164, 0.01645970344543457, 0.0169525146484375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 861.0, 155.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002205475000664592, -0.001434606732800603, -0.0006637385813519359, 0.00010712957009673119, 0.0008779978379607201, 0.001648866105824709, 0.002419734140858054, 0.003190602408722043, 0.003961470909416676, 0.0047323391772806644, 0.005503207445144653, 0.006274075247347355, 0.007044943980872631, 0.007815811783075333, 0.008586680516600609, 0.00935754831880331, 0.010128416121006012, 0.010899283923208714, 0.01167015265673399, 0.012441020458936691, 0.013211889192461967, 0.013982756994664669, 0.01475362479686737, 0.015524493530392647, 0.016295362263917923, 0.0170662309974432, 0.017837097868323326, 0.018607966601848602, 0.01937883533537388, 0.020149704068899155, 0.02092057093977928, 0.021691439673304558, 0.022462306544184685, 0.02323317527770996, 0.024004042148590088, 0.024774910882115364, 0.02554577961564064, 0.026316648349165916, 0.027087515220046043, 0.02785838395357132, 0.028629252687096596, 0.029400121420621872, 0.030170988291502, 0.030941857025027275, 0.03171272575855255, 0.03248359262943268, 0.033254463225603104, 0.03402533009648323, 0.03479619696736336, 0.035567063838243484, 0.03633793443441391, 0.03710880130529404, 0.037879668176174164, 0.03865053877234459, 0.039421405643224716, 0.04019227623939514, 0.04096314311027527, 0.041734009981155396, 0.04250488057732582, 0.04327574744820595, 0.044046614319086075, 0.0448174849152565, 0.04558835178613663, 0.046359218657016754, 0.04713008925318718]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 19.0, 17.0, 36.0, 44.0, 71.0, 87.0, 99.0, 97.0, 75.0, 93.0, 77.0, 77.0, 50.0, 42.0, 49.0, 26.0, 14.0, 11.0, 7.0, 5.0, 1.0, 4.0, 0.0, 1.0], "bins": [-0.002314150333404541, -0.002266271971166134, -0.0022183936089277267, -0.0021705152466893196, -0.0021226368844509125, -0.0020747585222125053, -0.002026880159974098, -0.001979001797735691, -0.001931123435497284, -0.0018832450732588768, -0.0018353667110204697, -0.0017874883487820625, -0.0017396099865436554, -0.0016917316243052483, -0.0016438532620668411, -0.001595974899828434, -0.0015480965375900269, -0.0015002181753516197, -0.0014523398131132126, -0.0014044614508748055, -0.0013565830886363983, -0.0013087047263979912, -0.001260826364159584, -0.001212948001921177, -0.0011650696396827698, -0.0011171912774443626, -0.0010693129152059555, -0.0010214345529675484, -0.0009735561907291412, -0.0009256778284907341, -0.000877799466252327, -0.0008299211040139198, -0.0007820427417755127, -0.0007341643795371056, -0.0006862860172986984, -0.0006384076550602913, -0.0005905292928218842, -0.000542650930583477, -0.0004947725683450699, -0.00044689420610666275, -0.0003990158438682556, -0.0003511374816298485, -0.00030325911939144135, -0.0002553807571530342, -0.00020750239491462708, -0.00015962403267621994, -0.0001117456704378128, -6.386730819940567e-05, -1.5988945960998535e-05, 3.18894162774086e-05, 7.976777851581573e-05, 0.00012764614075422287, 0.00017552450299263, 0.00022340286523103714, 0.0002712812274694443, 0.0003191595897078514, 0.00036703795194625854, 0.0004149163141846657, 0.0004627946764230728, 0.00051067303866148, 0.0005585514008998871, 0.0006064297631382942, 0.0006543081253767014, 0.0007021864876151085, 0.0007500648498535156]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 6.0, 8.0, 6.0, 7.0, 9.0, 12.0, 12.0, 13.0, 19.0, 22.0, 22.0, 19.0, 25.0, 29.0, 29.0, 37.0, 33.0, 36.0, 42.0, 41.0, 53.0, 38.0, 49.0, 46.0, 43.0, 49.0, 32.0, 27.0, 25.0, 29.0, 28.0, 23.0, 22.0, 21.0, 13.0, 12.0, 14.0, 10.0, 14.0, 3.0, 4.0, 7.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.30078125, -3.192108154296875, -3.08343505859375, -2.974761962890625, -2.8660888671875, -2.757415771484375, -2.64874267578125, -2.540069580078125, -2.431396484375, -2.322723388671875, -2.21405029296875, -2.105377197265625, -1.9967041015625, -1.888031005859375, -1.77935791015625, -1.670684814453125, -1.56201171875, -1.453338623046875, -1.34466552734375, -1.235992431640625, -1.1273193359375, -1.018646240234375, -0.90997314453125, -0.801300048828125, -0.692626953125, -0.583953857421875, -0.47528076171875, -0.366607666015625, -0.2579345703125, -0.149261474609375, -0.04058837890625, 0.068084716796875, 0.1767578125, 0.285430908203125, 0.39410400390625, 0.502777099609375, 0.6114501953125, 0.720123291015625, 0.82879638671875, 0.937469482421875, 1.046142578125, 1.154815673828125, 1.26348876953125, 1.372161865234375, 1.4808349609375, 1.589508056640625, 1.69818115234375, 1.806854248046875, 1.91552734375, 2.024200439453125, 2.13287353515625, 2.241546630859375, 2.3502197265625, 2.458892822265625, 2.56756591796875, 2.676239013671875, 2.784912109375, 2.893585205078125, 3.00225830078125, 3.110931396484375, 3.2196044921875, 3.328277587890625, 3.43695068359375, 3.545623779296875, 3.654296875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 10.0, 13.0, 18.0, 22.0, 38.0, 55.0, 80.0, 117.0, 190.0, 296.0, 441.0, 690.0, 1100.0, 1864.0, 3358.0, 6333.0, 12422.0, 25297.0, 64792.0, 317007.0, 460345.0, 90875.0, 31388.0, 14630.0, 7494.0, 3979.0, 2188.0, 1258.0, 808.0, 491.0, 309.0, 216.0, 145.0, 81.0, 63.0, 36.0, 32.0, 16.0, 15.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.078125, -7.83428955078125, -7.5904541015625, -7.34661865234375, -7.102783203125, -6.85894775390625, -6.6151123046875, -6.37127685546875, -6.12744140625, -5.88360595703125, -5.6397705078125, -5.39593505859375, -5.152099609375, -4.90826416015625, -4.6644287109375, -4.42059326171875, -4.1767578125, -3.93292236328125, -3.6890869140625, -3.44525146484375, -3.201416015625, -2.95758056640625, -2.7137451171875, -2.46990966796875, -2.22607421875, -1.98223876953125, -1.7384033203125, -1.49456787109375, -1.250732421875, -1.00689697265625, -0.7630615234375, -0.51922607421875, -0.275390625, -0.03155517578125, 0.2122802734375, 0.45611572265625, 0.699951171875, 0.94378662109375, 1.1876220703125, 1.43145751953125, 1.67529296875, 1.91912841796875, 2.1629638671875, 2.40679931640625, 2.650634765625, 2.89447021484375, 3.1383056640625, 3.38214111328125, 3.6259765625, 3.86981201171875, 4.1136474609375, 4.35748291015625, 4.601318359375, 4.84515380859375, 5.0889892578125, 5.33282470703125, 5.57666015625, 5.82049560546875, 6.0643310546875, 6.30816650390625, 6.552001953125, 6.79583740234375, 7.0396728515625, 7.28350830078125, 7.52734375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 5.0, 8.0, 10.0, 9.0, 21.0, 17.0, 10.0, 14.0, 21.0, 21.0, 29.0, 38.0, 37.0, 62.0, 53.0, 84.0, 111.0, 237.0, 1437.0, 229.0, 131.0, 84.0, 60.0, 47.0, 49.0, 43.0, 33.0, 35.0, 28.0, 18.0, 18.0, 14.0, 4.0, 7.0, 6.0, 2.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.21875, -11.8046875, -11.390625, -10.9765625, -10.5625, -10.1484375, -9.734375, -9.3203125, -8.90625, -8.4921875, -8.078125, -7.6640625, -7.25, -6.8359375, -6.421875, -6.0078125, -5.59375, -5.1796875, -4.765625, -4.3515625, -3.9375, -3.5234375, -3.109375, -2.6953125, -2.28125, -1.8671875, -1.453125, -1.0390625, -0.625, -0.2109375, 0.203125, 0.6171875, 1.03125, 1.4453125, 1.859375, 2.2734375, 2.6875, 3.1015625, 3.515625, 3.9296875, 4.34375, 4.7578125, 5.171875, 5.5859375, 6.0, 6.4140625, 6.828125, 7.2421875, 7.65625, 8.0703125, 8.484375, 8.8984375, 9.3125, 9.7265625, 10.140625, 10.5546875, 10.96875, 11.3828125, 11.796875, 12.2109375, 12.625, 13.0390625, 13.453125, 13.8671875, 14.28125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 7.0, 7.0, 8.0, 12.0, 15.0, 23.0, 29.0, 50.0, 46.0, 65.0, 90.0, 158.0, 287.0, 767.0, 4076.0, 43965.0, 2597837.0, 479536.0, 15562.0, 1952.0, 507.0, 208.0, 130.0, 89.0, 64.0, 48.0, 40.0, 27.0, 19.0, 16.0, 16.0, 14.0, 9.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.25, -27.4384765625, -26.626953125, -25.8154296875, -25.00390625, -24.1923828125, -23.380859375, -22.5693359375, -21.7578125, -20.9462890625, -20.134765625, -19.3232421875, -18.51171875, -17.7001953125, -16.888671875, -16.0771484375, -15.265625, -14.4541015625, -13.642578125, -12.8310546875, -12.01953125, -11.2080078125, -10.396484375, -9.5849609375, -8.7734375, -7.9619140625, -7.150390625, -6.3388671875, -5.52734375, -4.7158203125, -3.904296875, -3.0927734375, -2.28125, -1.4697265625, -0.658203125, 0.1533203125, 0.96484375, 1.7763671875, 2.587890625, 3.3994140625, 4.2109375, 5.0224609375, 5.833984375, 6.6455078125, 7.45703125, 8.2685546875, 9.080078125, 9.8916015625, 10.703125, 11.5146484375, 12.326171875, 13.1376953125, 13.94921875, 14.7607421875, 15.572265625, 16.3837890625, 17.1953125, 18.0068359375, 18.818359375, 19.6298828125, 20.44140625, 21.2529296875, 22.064453125, 22.8759765625, 23.6875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 62.0, 412.0, 460.0, 79.0, 4.0, 1.0, 1.0], "bins": [-264.3245544433594, -259.8451232910156, -255.3656768798828, -250.88624572753906, -246.40679931640625, -241.9273681640625, -237.44793701171875, -232.96849060058594, -228.4890594482422, -224.00962829589844, -219.53018188476562, -215.05075073242188, -210.57130432128906, -206.0918731689453, -201.6124267578125, -197.13299560546875, -192.653564453125, -188.17413330078125, -183.69468688964844, -179.2152557373047, -174.73580932617188, -170.25637817382812, -165.77694702148438, -161.29750061035156, -156.81805419921875, -152.338623046875, -147.8591766357422, -143.37974548339844, -138.90029907226562, -134.42086791992188, -129.94143676757812, -125.46199035644531, -120.98255920410156, -116.50312042236328, -112.023681640625, -107.54425048828125, -103.06481170654297, -98.58537292480469, -94.1059341430664, -89.62649536132812, -85.14705657958984, -80.66761779785156, -76.18817901611328, -71.708740234375, -67.22930908203125, -62.74987030029297, -58.27043151855469, -53.790992736816406, -49.31155776977539, -44.83211898803711, -40.352684020996094, -35.87324523925781, -31.393808364868164, -26.914371490478516, -22.434932708740234, -17.955495834350586, -13.476058959960938, -8.996622085571289, -4.517184257507324, -0.037746429443359375, 4.441690444946289, 8.921127319335938, 13.400566101074219, 17.880002975463867, 22.359439849853516]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 7.0, 5.0, 10.0, 11.0, 8.0, 10.0, 18.0, 19.0, 17.0, 18.0, 33.0, 36.0, 39.0, 33.0, 32.0, 39.0, 44.0, 39.0, 36.0, 40.0, 46.0, 37.0, 40.0, 31.0, 29.0, 32.0, 28.0, 27.0, 30.0, 30.0, 18.0, 21.0, 15.0, 10.0, 13.0, 12.0, 13.0, 8.0, 12.0, 9.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-28.69312858581543, -27.771778106689453, -26.850425720214844, -25.929075241088867, -25.00772476196289, -24.08637237548828, -23.165021896362305, -22.243671417236328, -21.32231903076172, -20.400968551635742, -19.479616165161133, -18.558265686035156, -17.636913299560547, -16.71556282043457, -15.794212341308594, -14.8728609085083, -13.951509475708008, -13.030158042907715, -12.108806610107422, -11.187456130981445, -10.266104698181152, -9.34475326538086, -8.423402786254883, -7.50205135345459, -6.580699920654297, -5.659348487854004, -4.737997531890869, -3.8166463375091553, -2.8952951431274414, -1.9739437103271484, -1.0525927543640137, -0.1312417984008789, 0.7901096343994141, 1.711460828781128, 2.632812023162842, 3.5541632175445557, 4.4755144119262695, 5.3968658447265625, 6.318216800689697, 7.239567756652832, 8.160919189453125, 9.082270622253418, 10.003622055053711, 10.924972534179688, 11.84632396697998, 12.767675399780273, 13.68902587890625, 14.610377311706543, 15.531728744506836, 16.453079223632812, 17.374431610107422, 18.2957820892334, 19.217132568359375, 20.138484954833984, 21.05983543395996, 21.981185913085938, 22.902538299560547, 23.823888778686523, 24.745241165161133, 25.66659164428711, 26.58794403076172, 27.509294509887695, 28.430644989013672, 29.35199737548828, 30.273347854614258]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 6.0, 8.0, 5.0, 12.0, 17.0, 10.0, 13.0, 22.0, 21.0, 31.0, 26.0, 28.0, 26.0, 41.0, 36.0, 32.0, 50.0, 52.0, 51.0, 46.0, 56.0, 52.0, 44.0, 39.0, 27.0, 33.0, 29.0, 27.0, 14.0, 24.0, 27.0, 17.0, 14.0, 14.0, 7.0, 13.0, 4.0, 1.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.619140625, -3.498321533203125, -3.37750244140625, -3.256683349609375, -3.1358642578125, -3.015045166015625, -2.89422607421875, -2.773406982421875, -2.652587890625, -2.531768798828125, -2.41094970703125, -2.290130615234375, -2.1693115234375, -2.048492431640625, -1.92767333984375, -1.806854248046875, -1.68603515625, -1.565216064453125, -1.44439697265625, -1.323577880859375, -1.2027587890625, -1.081939697265625, -0.96112060546875, -0.840301513671875, -0.719482421875, -0.598663330078125, -0.47784423828125, -0.357025146484375, -0.2362060546875, -0.115386962890625, 0.00543212890625, 0.126251220703125, 0.2470703125, 0.367889404296875, 0.48870849609375, 0.609527587890625, 0.7303466796875, 0.851165771484375, 0.97198486328125, 1.092803955078125, 1.213623046875, 1.334442138671875, 1.45526123046875, 1.576080322265625, 1.6968994140625, 1.817718505859375, 1.93853759765625, 2.059356689453125, 2.18017578125, 2.300994873046875, 2.42181396484375, 2.542633056640625, 2.6634521484375, 2.784271240234375, 2.90509033203125, 3.025909423828125, 3.146728515625, 3.267547607421875, 3.38836669921875, 3.509185791015625, 3.6300048828125, 3.750823974609375, 3.87164306640625, 3.992462158203125, 4.11328125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 8.0, 11.0, 12.0, 21.0, 29.0, 37.0, 56.0, 108.0, 163.0, 334.0, 885.0, 2570.0, 12295.0, 195303.0, 3681141.0, 281830.0, 14652.0, 2955.0, 942.0, 403.0, 198.0, 112.0, 55.0, 39.0, 36.0, 15.0, 18.0, 14.0, 9.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.494873046875, -15.89599609375, -15.297119140625, -14.6982421875, -14.099365234375, -13.50048828125, -12.901611328125, -12.302734375, -11.703857421875, -11.10498046875, -10.506103515625, -9.9072265625, -9.308349609375, -8.70947265625, -8.110595703125, -7.51171875, -6.912841796875, -6.31396484375, -5.715087890625, -5.1162109375, -4.517333984375, -3.91845703125, -3.319580078125, -2.720703125, -2.121826171875, -1.52294921875, -0.924072265625, -0.3251953125, 0.273681640625, 0.87255859375, 1.471435546875, 2.0703125, 2.669189453125, 3.26806640625, 3.866943359375, 4.4658203125, 5.064697265625, 5.66357421875, 6.262451171875, 6.861328125, 7.460205078125, 8.05908203125, 8.657958984375, 9.2568359375, 9.855712890625, 10.45458984375, 11.053466796875, 11.65234375, 12.251220703125, 12.85009765625, 13.448974609375, 14.0478515625, 14.646728515625, 15.24560546875, 15.844482421875, 16.443359375, 17.042236328125, 17.64111328125, 18.239990234375, 18.8388671875, 19.437744140625, 20.03662109375, 20.635498046875, 21.234375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 12.0, 12.0, 15.0, 22.0, 27.0, 69.0, 101.0, 142.0, 222.0, 393.0, 543.0, 784.0, 669.0, 425.0, 234.0, 161.0, 95.0, 50.0, 33.0, 16.0, 12.0, 11.0, 12.0, 5.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.669677734375, -8.33154296875, -7.993408203125, -7.6552734375, -7.317138671875, -6.97900390625, -6.640869140625, -6.302734375, -5.964599609375, -5.62646484375, -5.288330078125, -4.9501953125, -4.612060546875, -4.27392578125, -3.935791015625, -3.59765625, -3.259521484375, -2.92138671875, -2.583251953125, -2.2451171875, -1.906982421875, -1.56884765625, -1.230712890625, -0.892578125, -0.554443359375, -0.21630859375, 0.121826171875, 0.4599609375, 0.798095703125, 1.13623046875, 1.474365234375, 1.8125, 2.150634765625, 2.48876953125, 2.826904296875, 3.1650390625, 3.503173828125, 3.84130859375, 4.179443359375, 4.517578125, 4.855712890625, 5.19384765625, 5.531982421875, 5.8701171875, 6.208251953125, 6.54638671875, 6.884521484375, 7.22265625, 7.560791015625, 7.89892578125, 8.237060546875, 8.5751953125, 8.913330078125, 9.25146484375, 9.589599609375, 9.927734375, 10.265869140625, 10.60400390625, 10.942138671875, 11.2802734375, 11.618408203125, 11.95654296875, 12.294677734375, 12.6328125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 12.0, 6.0, 19.0, 12.0, 28.0, 41.0, 80.0, 172.0, 308.0, 966.0, 12364.0, 3949046.0, 227451.0, 2637.0, 547.0, 258.0, 117.0, 89.0, 43.0, 26.0, 18.0, 10.0, 17.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.8125, -60.17529296875, -58.5380859375, -56.90087890625, -55.263671875, -53.62646484375, -51.9892578125, -50.35205078125, -48.71484375, -47.07763671875, -45.4404296875, -43.80322265625, -42.166015625, -40.52880859375, -38.8916015625, -37.25439453125, -35.6171875, -33.97998046875, -32.3427734375, -30.70556640625, -29.068359375, -27.43115234375, -25.7939453125, -24.15673828125, -22.51953125, -20.88232421875, -19.2451171875, -17.60791015625, -15.970703125, -14.33349609375, -12.6962890625, -11.05908203125, -9.421875, -7.78466796875, -6.1474609375, -4.51025390625, -2.873046875, -1.23583984375, 0.4013671875, 2.03857421875, 3.67578125, 5.31298828125, 6.9501953125, 8.58740234375, 10.224609375, 11.86181640625, 13.4990234375, 15.13623046875, 16.7734375, 18.41064453125, 20.0478515625, 21.68505859375, 23.322265625, 24.95947265625, 26.5966796875, 28.23388671875, 29.87109375, 31.50830078125, 33.1455078125, 34.78271484375, 36.419921875, 38.05712890625, 39.6943359375, 41.33154296875, 42.96875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 16.0, 20.0, 24.0, 39.0, 52.0, 78.0, 80.0, 106.0, 116.0, 98.0, 93.0, 75.0, 59.0, 39.0, 36.0, 30.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.172107696533203, -19.05388069152832, -17.935653686523438, -16.817428588867188, -15.699201583862305, -14.580974578857422, -13.462747573852539, -12.344520568847656, -11.22629451751709, -10.108067512512207, -8.98984146118164, -7.871614456176758, -6.753387928009033, -5.635161399841309, -4.516934394836426, -3.398707866668701, -2.2804813385009766, -1.1622546911239624, -0.04402804374694824, 1.0741987228393555, 2.19242525100708, 3.3106517791748047, 4.4288787841796875, 5.547105312347412, 6.665331840515137, 7.783558368682861, 8.901784896850586, 10.020011901855469, 11.138238906860352, 12.256464958190918, 13.3746919631958, 14.492918014526367, 15.61114501953125, 16.729372024536133, 17.847599029541016, 18.965824127197266, 20.08405113220215, 21.20227813720703, 22.320505142211914, 23.438732147216797, 24.556957244873047, 25.67518424987793, 26.793411254882812, 27.911636352539062, 29.029863357543945, 30.148090362548828, 31.26631736755371, 32.384544372558594, 33.502769470214844, 34.620994567871094, 35.73922348022461, 36.85744857788086, 37.975677490234375, 39.093902587890625, 40.212127685546875, 41.33035659790039, 42.448585510253906, 43.566810607910156, 44.68503952026367, 45.80326461791992, 46.92149353027344, 48.03971862792969, 49.15794372558594, 50.27617263793945, 51.3943977355957]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 7.0, 5.0, 13.0, 11.0, 11.0, 15.0, 21.0, 20.0, 23.0, 25.0, 25.0, 33.0, 38.0, 45.0, 30.0, 47.0, 45.0, 47.0, 53.0, 45.0, 44.0, 46.0, 50.0, 40.0, 39.0, 34.0, 25.0, 27.0, 24.0, 28.0, 14.0, 19.0, 15.0, 10.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-31.912277221679688, -31.053913116455078, -30.19554901123047, -29.337182998657227, -28.478818893432617, -27.620454788208008, -26.762088775634766, -25.903724670410156, -25.045360565185547, -24.186996459960938, -23.328632354736328, -22.470266342163086, -21.611902236938477, -20.753538131713867, -19.895172119140625, -19.036808013916016, -18.178443908691406, -17.320079803466797, -16.461715698242188, -15.603349685668945, -14.744985580444336, -13.886621475219727, -13.0282564163208, -12.169891357421875, -11.311527252197266, -10.453163146972656, -9.59479808807373, -8.736433029174805, -7.878068923950195, -7.019704341888428, -6.16133975982666, -5.302975177764893, -4.444612503051758, -3.5862479209899902, -2.7278833389282227, -1.869518756866455, -1.0111541748046875, -0.15278959274291992, 0.7055749893188477, 1.5639395713806152, 2.422304153442383, 3.2806687355041504, 4.139033317565918, 4.9973978996276855, 5.855762481689453, 6.714127063751221, 7.572491645812988, 8.430856704711914, 9.289220809936523, 10.147584915161133, 11.005949974060059, 11.864315032958984, 12.722679138183594, 13.581043243408203, 14.439408302307129, 15.297773361206055, 16.156137466430664, 17.014501571655273, 17.872867584228516, 18.731231689453125, 19.589595794677734, 20.447959899902344, 21.306324005126953, 22.164690017700195, 23.023054122924805]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 4.0, 9.0, 2.0, 10.0, 12.0, 10.0, 23.0, 14.0, 24.0, 18.0, 31.0, 24.0, 19.0, 34.0, 39.0, 34.0, 34.0, 43.0, 46.0, 50.0, 41.0, 54.0, 51.0, 44.0, 34.0, 33.0, 33.0, 24.0, 28.0, 16.0, 25.0, 28.0, 20.0, 21.0, 11.0, 13.0, 8.0, 11.0, 1.0, 9.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.405242919921875, -3.28900146484375, -3.172760009765625, -3.0565185546875, -2.940277099609375, -2.82403564453125, -2.707794189453125, -2.591552734375, -2.475311279296875, -2.35906982421875, -2.242828369140625, -2.1265869140625, -2.010345458984375, -1.89410400390625, -1.777862548828125, -1.66162109375, -1.545379638671875, -1.42913818359375, -1.312896728515625, -1.1966552734375, -1.080413818359375, -0.96417236328125, -0.847930908203125, -0.731689453125, -0.615447998046875, -0.49920654296875, -0.382965087890625, -0.2667236328125, -0.150482177734375, -0.03424072265625, 0.082000732421875, 0.1982421875, 0.314483642578125, 0.43072509765625, 0.546966552734375, 0.6632080078125, 0.779449462890625, 0.89569091796875, 1.011932373046875, 1.128173828125, 1.244415283203125, 1.36065673828125, 1.476898193359375, 1.5931396484375, 1.709381103515625, 1.82562255859375, 1.941864013671875, 2.05810546875, 2.174346923828125, 2.29058837890625, 2.406829833984375, 2.5230712890625, 2.639312744140625, 2.75555419921875, 2.871795654296875, 2.988037109375, 3.104278564453125, 3.22052001953125, 3.336761474609375, 3.4530029296875, 3.569244384765625, 3.68548583984375, 3.801727294921875, 3.91796875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 11.0, 5.0, 20.0, 18.0, 25.0, 22.0, 45.0, 59.0, 90.0, 112.0, 114.0, 212.0, 342.0, 492.0, 571.0, 933.0, 1289.0, 1713.0, 2590.0, 3689.0, 5434.0, 7995.0, 12017.0, 17903.0, 26344.0, 40451.0, 64383.0, 114507.0, 261002.0, 217331.0, 98990.0, 57762.0, 36982.0, 24292.0, 16013.0, 10706.0, 7558.0, 5167.0, 3380.0, 2418.0, 1659.0, 1108.0, 791.0, 615.0, 364.0, 286.0, 221.0, 153.0, 112.0, 69.0, 46.0, 51.0, 28.0, 30.0, 14.0, 10.0, 8.0, 8.0, 4.0, 5.0], "bins": [-0.1783447265625, -0.17292213439941406, -0.16749954223632812, -0.1620769500732422, -0.15665435791015625, -0.1512317657470703, -0.14580917358398438, -0.14038658142089844, -0.1349639892578125, -0.12954139709472656, -0.12411880493164062, -0.11869621276855469, -0.11327362060546875, -0.10785102844238281, -0.10242843627929688, -0.09700584411621094, -0.091583251953125, -0.08616065979003906, -0.08073806762695312, -0.07531547546386719, -0.06989288330078125, -0.06447029113769531, -0.059047698974609375, -0.05362510681152344, -0.0482025146484375, -0.04277992248535156, -0.037357330322265625, -0.03193473815917969, -0.02651214599609375, -0.021089553833007812, -0.015666961669921875, -0.010244369506835938, -0.00482177734375, 0.0006008148193359375, 0.006023406982421875, 0.011445999145507812, 0.01686859130859375, 0.022291183471679688, 0.027713775634765625, 0.03313636779785156, 0.0385589599609375, 0.04398155212402344, 0.049404144287109375, 0.05482673645019531, 0.06024932861328125, 0.06567192077636719, 0.07109451293945312, 0.07651710510253906, 0.081939697265625, 0.08736228942871094, 0.09278488159179688, 0.09820747375488281, 0.10363006591796875, 0.10905265808105469, 0.11447525024414062, 0.11989784240722656, 0.1253204345703125, 0.13074302673339844, 0.13616561889648438, 0.1415882110595703, 0.14701080322265625, 0.1524333953857422, 0.15785598754882812, 0.16327857971191406, 0.168701171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 6.0, 5.0, 12.0, 10.0, 14.0, 17.0, 14.0, 21.0, 23.0, 24.0, 25.0, 26.0, 43.0, 32.0, 40.0, 41.0, 33.0, 35.0, 53.0, 1070.0, 55.0, 56.0, 49.0, 32.0, 40.0, 39.0, 33.0, 34.0, 33.0, 23.0, 16.0, 21.0, 9.0, 9.0, 11.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.462890625, -3.35888671875, -3.2548828125, -3.15087890625, -3.046875, -2.94287109375, -2.8388671875, -2.73486328125, -2.630859375, -2.52685546875, -2.4228515625, -2.31884765625, -2.21484375, -2.11083984375, -2.0068359375, -1.90283203125, -1.798828125, -1.69482421875, -1.5908203125, -1.48681640625, -1.3828125, -1.27880859375, -1.1748046875, -1.07080078125, -0.966796875, -0.86279296875, -0.7587890625, -0.65478515625, -0.55078125, -0.44677734375, -0.3427734375, -0.23876953125, -0.134765625, -0.03076171875, 0.0732421875, 0.17724609375, 0.28125, 0.38525390625, 0.4892578125, 0.59326171875, 0.697265625, 0.80126953125, 0.9052734375, 1.00927734375, 1.11328125, 1.21728515625, 1.3212890625, 1.42529296875, 1.529296875, 1.63330078125, 1.7373046875, 1.84130859375, 1.9453125, 2.04931640625, 2.1533203125, 2.25732421875, 2.361328125, 2.46533203125, 2.5693359375, 2.67333984375, 2.77734375, 2.88134765625, 2.9853515625, 3.08935546875, 3.193359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 11.0, 8.0, 12.0, 16.0, 24.0, 45.0, 51.0, 86.0, 115.0, 175.0, 236.0, 365.0, 500.0, 711.0, 1105.0, 1582.0, 2295.0, 3457.0, 4911.0, 6964.0, 10494.0, 15649.0, 23735.0, 36908.0, 60520.0, 107590.0, 301436.0, 1208540.0, 122648.0, 67216.0, 40913.0, 26180.0, 16784.0, 11308.0, 7702.0, 5199.0, 3534.0, 2515.0, 1664.0, 1224.0, 830.0, 579.0, 399.0, 313.0, 183.0, 145.0, 75.0, 63.0, 37.0, 30.0, 20.0, 17.0, 4.0, 8.0, 5.0, 2.0, 5.0, 1.0], "bins": [-0.05926513671875, -0.057474613189697266, -0.05568408966064453, -0.0538935661315918, -0.05210304260253906, -0.05031251907348633, -0.048521995544433594, -0.04673147201538086, -0.044940948486328125, -0.04315042495727539, -0.041359901428222656, -0.03956937789916992, -0.03777885437011719, -0.03598833084106445, -0.03419780731201172, -0.032407283782958984, -0.03061676025390625, -0.028826236724853516, -0.02703571319580078, -0.025245189666748047, -0.023454666137695312, -0.021664142608642578, -0.019873619079589844, -0.01808309555053711, -0.016292572021484375, -0.01450204849243164, -0.012711524963378906, -0.010921001434326172, -0.009130477905273438, -0.007339954376220703, -0.005549430847167969, -0.0037589073181152344, -0.0019683837890625, -0.00017786026000976562, 0.0016126632690429688, 0.003403186798095703, 0.0051937103271484375, 0.006984233856201172, 0.008774757385253906, 0.01056528091430664, 0.012355804443359375, 0.01414632797241211, 0.015936851501464844, 0.017727375030517578, 0.019517898559570312, 0.021308422088623047, 0.02309894561767578, 0.024889469146728516, 0.02667999267578125, 0.028470516204833984, 0.03026103973388672, 0.03205156326293945, 0.03384208679199219, 0.03563261032104492, 0.037423133850097656, 0.03921365737915039, 0.041004180908203125, 0.04279470443725586, 0.044585227966308594, 0.04637575149536133, 0.04816627502441406, 0.0499567985534668, 0.05174732208251953, 0.053537845611572266, 0.055328369140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 4.0, 6.0, 11.0, 17.0, 17.0, 25.0, 32.0, 32.0, 41.0, 60.0, 74.0, 73.0, 80.0, 90.0, 73.0, 68.0, 49.0, 45.0, 36.0, 29.0, 21.0, 22.0, 18.0, 16.0, 11.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014886856079101562, -0.0014462918043136597, -0.001403898000717163, -0.0013615041971206665, -0.00131911039352417, -0.0012767165899276733, -0.0012343227863311768, -0.0011919289827346802, -0.0011495351791381836, -0.001107141375541687, -0.0010647475719451904, -0.0010223537683486938, -0.0009799599647521973, -0.0009375661611557007, -0.0008951723575592041, -0.0008527785539627075, -0.0008103847503662109, -0.0007679909467697144, -0.0007255971431732178, -0.0006832033395767212, -0.0006408095359802246, -0.000598415732383728, -0.0005560219287872314, -0.0005136281251907349, -0.0004712343215942383, -0.0004288405179977417, -0.0003864467144012451, -0.00034405291080474854, -0.00030165910720825195, -0.00025926530361175537, -0.0002168715000152588, -0.0001744776964187622, -0.00013208389282226562, -8.969008922576904e-05, -4.729628562927246e-05, -4.902482032775879e-06, 3.74913215637207e-05, 7.988512516021729e-05, 0.00012227892875671387, 0.00016467273235321045, 0.00020706653594970703, 0.0002494603395462036, 0.0002918541431427002, 0.0003342479467391968, 0.00037664175033569336, 0.00041903555393218994, 0.0004614293575286865, 0.0005038231611251831, 0.0005462169647216797, 0.0005886107683181763, 0.0006310045719146729, 0.0006733983755111694, 0.000715792179107666, 0.0007581859827041626, 0.0008005797863006592, 0.0008429735898971558, 0.0008853673934936523, 0.0009277611970901489, 0.0009701550006866455, 0.001012548804283142, 0.0010549426078796387, 0.0010973364114761353, 0.0011397302150726318, 0.0011821240186691284, 0.001224517822265625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 3.0, 7.0, 2.0, 9.0, 9.0, 20.0, 18.0, 23.0, 25.0, 29.0, 43.0, 68.0, 120.0, 342.0, 3412.0, 882491.0, 160013.0, 1301.0, 261.0, 112.0, 57.0, 38.0, 40.0, 26.0, 17.0, 16.0, 10.0, 7.0, 4.0, 11.0, 3.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026042938232421875, -0.02510833740234375, -0.024173736572265625, -0.0232391357421875, -0.022304534912109375, -0.02136993408203125, -0.020435333251953125, -0.019500732421875, -0.018566131591796875, -0.01763153076171875, -0.016696929931640625, -0.0157623291015625, -0.014827728271484375, -0.01389312744140625, -0.012958526611328125, -0.01202392578125, -0.011089324951171875, -0.01015472412109375, -0.009220123291015625, -0.0082855224609375, -0.007350921630859375, -0.00641632080078125, -0.005481719970703125, -0.004547119140625, -0.003612518310546875, -0.00267791748046875, -0.001743316650390625, -0.0008087158203125, 0.000125885009765625, 0.00106048583984375, 0.001995086669921875, 0.0029296875, 0.003864288330078125, 0.00479888916015625, 0.005733489990234375, 0.0066680908203125, 0.007602691650390625, 0.00853729248046875, 0.009471893310546875, 0.010406494140625, 0.011341094970703125, 0.01227569580078125, 0.013210296630859375, 0.0141448974609375, 0.015079498291015625, 0.01601409912109375, 0.016948699951171875, 0.01788330078125, 0.018817901611328125, 0.01975250244140625, 0.020687103271484375, 0.0216217041015625, 0.022556304931640625, 0.02349090576171875, 0.024425506591796875, 0.025360107421875, 0.026294708251953125, 0.02722930908203125, 0.028163909912109375, 0.0290985107421875, 0.030033111572265625, 0.03096771240234375, 0.031902313232421875, 0.0328369140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 61.0, 951.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002530066529288888, -0.001415963633917272, -0.0003018607385456562, 0.0008122420404106379, 0.0019263450521975756, 0.0030404480639845133, 0.004154550842940807, 0.005268653854727745, 0.006382756866514683, 0.0074968598783016205, 0.008610962890088558, 0.009725065901875496, 0.010839167982339859, 0.011953271925449371, 0.013067374005913734, 0.014181477017700672, 0.01529558002948761, 0.016409682109951973, 0.017523786053061485, 0.01863788813352585, 0.01975199207663536, 0.020866094157099724, 0.021980196237564087, 0.0230943001806736, 0.024208402261137962, 0.025322504341602325, 0.026436608284711838, 0.0275507103651762, 0.028664814308285713, 0.029778916388750076, 0.03089302033185959, 0.0320071205496788, 0.033121224492788315, 0.03423532843589783, 0.03534942865371704, 0.03646353259682655, 0.037577636539936066, 0.03869174048304558, 0.03980584070086479, 0.040919944643974304, 0.042034048587083817, 0.04314815253019333, 0.04426225274801254, 0.045376356691122055, 0.04649046063423157, 0.04760456457734108, 0.048718664795160294, 0.049832768738269806, 0.05094686895608902, 0.05206097289919853, 0.053175073117017746, 0.05428917706012726, 0.05540328100323677, 0.05651738494634628, 0.0576314851641655, 0.05874558910727501, 0.05985969305038452, 0.060973796993494034, 0.06208789721131325, 0.06320200115442276, 0.06431610137224197, 0.06543020904064178, 0.066544309258461, 0.06765840947628021, 0.06877251714468002]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 20.0, 21.0, 26.0, 54.0, 69.0, 76.0, 80.0, 93.0, 102.0, 97.0, 84.0, 80.0, 49.0, 41.0, 32.0, 27.0, 18.0, 12.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0030908584594726562, -0.00302241463214159, -0.002953970804810524, -0.002885526977479458, -0.0028170831501483917, -0.0027486393228173256, -0.0026801954954862595, -0.0026117516681551933, -0.002543307840824127, -0.002474864013493061, -0.002406420186161995, -0.002337976358830929, -0.0022695325314998627, -0.0022010887041687965, -0.0021326448768377304, -0.0020642010495066643, -0.001995757222175598, -0.001927313394844532, -0.0018588695675134659, -0.0017904257401823997, -0.0017219819128513336, -0.0016535380855202675, -0.0015850942581892014, -0.0015166504308581352, -0.001448206603527069, -0.001379762776196003, -0.0013113189488649368, -0.0012428751215338707, -0.0011744312942028046, -0.0011059874668717384, -0.0010375436395406723, -0.0009690998122096062, -0.00090065598487854, -0.0008322121575474739, -0.0007637683302164078, -0.0006953245028853416, -0.0006268806755542755, -0.0005584368482232094, -0.0004899930208921432, -0.0004215491935610771, -0.000353105366230011, -0.00028466153889894485, -0.00021621771156787872, -0.0001477738842368126, -7.933005690574646e-05, -1.0886229574680328e-05, 5.75575977563858e-05, 0.00012600142508745193, 0.00019444525241851807, 0.0002628890797495842, 0.00033133290708065033, 0.00039977673441171646, 0.0004682205617427826, 0.0005366643890738487, 0.0006051082164049149, 0.000673552043735981, 0.0007419958710670471, 0.0008104396983981133, 0.0008788835257291794, 0.0009473273530602455, 0.0010157711803913116, 0.0010842150077223778, 0.001152658835053444, 0.00122110266238451, 0.0012895464897155762]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 4.0, 9.0, 2.0, 10.0, 12.0, 10.0, 23.0, 14.0, 24.0, 18.0, 31.0, 24.0, 19.0, 34.0, 39.0, 34.0, 34.0, 43.0, 46.0, 50.0, 41.0, 54.0, 51.0, 44.0, 34.0, 33.0, 33.0, 24.0, 28.0, 16.0, 25.0, 28.0, 20.0, 21.0, 11.0, 13.0, 8.0, 11.0, 1.0, 9.0, 2.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.405242919921875, -3.28900146484375, -3.172760009765625, -3.0565185546875, -2.940277099609375, -2.82403564453125, -2.707794189453125, -2.591552734375, -2.475311279296875, -2.35906982421875, -2.242828369140625, -2.1265869140625, -2.010345458984375, -1.89410400390625, -1.777862548828125, -1.66162109375, -1.545379638671875, -1.42913818359375, -1.312896728515625, -1.1966552734375, -1.080413818359375, -0.96417236328125, -0.847930908203125, -0.731689453125, -0.615447998046875, -0.49920654296875, -0.382965087890625, -0.2667236328125, -0.150482177734375, -0.03424072265625, 0.082000732421875, 0.1982421875, 0.314483642578125, 0.43072509765625, 0.546966552734375, 0.6632080078125, 0.779449462890625, 0.89569091796875, 1.011932373046875, 1.128173828125, 1.244415283203125, 1.36065673828125, 1.476898193359375, 1.5931396484375, 1.709381103515625, 1.82562255859375, 1.941864013671875, 2.05810546875, 2.174346923828125, 2.29058837890625, 2.406829833984375, 2.5230712890625, 2.639312744140625, 2.75555419921875, 2.871795654296875, 2.988037109375, 3.104278564453125, 3.22052001953125, 3.336761474609375, 3.4530029296875, 3.569244384765625, 3.68548583984375, 3.801727294921875, 3.91796875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 3.0, 11.0, 9.0, 24.0, 24.0, 50.0, 63.0, 95.0, 182.0, 273.0, 403.0, 672.0, 1102.0, 1981.0, 3472.0, 6392.0, 12736.0, 25439.0, 58949.0, 178297.0, 448747.0, 192822.0, 61508.0, 26591.0, 12959.0, 6892.0, 3745.0, 2097.0, 1171.0, 721.0, 396.0, 241.0, 151.0, 112.0, 62.0, 45.0, 32.0, 31.0, 22.0, 9.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.2109375, -6.9892578125, -6.767578125, -6.5458984375, -6.32421875, -6.1025390625, -5.880859375, -5.6591796875, -5.4375, -5.2158203125, -4.994140625, -4.7724609375, -4.55078125, -4.3291015625, -4.107421875, -3.8857421875, -3.6640625, -3.4423828125, -3.220703125, -2.9990234375, -2.77734375, -2.5556640625, -2.333984375, -2.1123046875, -1.890625, -1.6689453125, -1.447265625, -1.2255859375, -1.00390625, -0.7822265625, -0.560546875, -0.3388671875, -0.1171875, 0.1044921875, 0.326171875, 0.5478515625, 0.76953125, 0.9912109375, 1.212890625, 1.4345703125, 1.65625, 1.8779296875, 2.099609375, 2.3212890625, 2.54296875, 2.7646484375, 2.986328125, 3.2080078125, 3.4296875, 3.6513671875, 3.873046875, 4.0947265625, 4.31640625, 4.5380859375, 4.759765625, 4.9814453125, 5.203125, 5.4248046875, 5.646484375, 5.8681640625, 6.08984375, 6.3115234375, 6.533203125, 6.7548828125, 6.9765625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 5.0, 8.0, 6.0, 5.0, 21.0, 15.0, 18.0, 18.0, 20.0, 20.0, 26.0, 27.0, 37.0, 43.0, 44.0, 59.0, 75.0, 126.0, 196.0, 1320.0, 261.0, 152.0, 112.0, 75.0, 64.0, 37.0, 30.0, 26.0, 28.0, 33.0, 23.0, 26.0, 15.0, 9.0, 12.0, 9.0, 11.0, 11.0, 11.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.540771484375, -9.19873046875, -8.856689453125, -8.5146484375, -8.172607421875, -7.83056640625, -7.488525390625, -7.146484375, -6.804443359375, -6.46240234375, -6.120361328125, -5.7783203125, -5.436279296875, -5.09423828125, -4.752197265625, -4.41015625, -4.068115234375, -3.72607421875, -3.384033203125, -3.0419921875, -2.699951171875, -2.35791015625, -2.015869140625, -1.673828125, -1.331787109375, -0.98974609375, -0.647705078125, -0.3056640625, 0.036376953125, 0.37841796875, 0.720458984375, 1.0625, 1.404541015625, 1.74658203125, 2.088623046875, 2.4306640625, 2.772705078125, 3.11474609375, 3.456787109375, 3.798828125, 4.140869140625, 4.48291015625, 4.824951171875, 5.1669921875, 5.509033203125, 5.85107421875, 6.193115234375, 6.53515625, 6.877197265625, 7.21923828125, 7.561279296875, 7.9033203125, 8.245361328125, 8.58740234375, 8.929443359375, 9.271484375, 9.613525390625, 9.95556640625, 10.297607421875, 10.6396484375, 10.981689453125, 11.32373046875, 11.665771484375, 12.0078125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 3.0, 9.0, 10.0, 26.0, 17.0, 24.0, 38.0, 57.0, 82.0, 125.0, 177.0, 378.0, 867.0, 2956.0, 17889.0, 363015.0, 2652274.0, 95966.0, 8586.0, 1828.0, 611.0, 293.0, 141.0, 87.0, 54.0, 52.0, 45.0, 22.0, 17.0, 13.0, 4.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.953125, -22.30322265625, -21.6533203125, -21.00341796875, -20.353515625, -19.70361328125, -19.0537109375, -18.40380859375, -17.75390625, -17.10400390625, -16.4541015625, -15.80419921875, -15.154296875, -14.50439453125, -13.8544921875, -13.20458984375, -12.5546875, -11.90478515625, -11.2548828125, -10.60498046875, -9.955078125, -9.30517578125, -8.6552734375, -8.00537109375, -7.35546875, -6.70556640625, -6.0556640625, -5.40576171875, -4.755859375, -4.10595703125, -3.4560546875, -2.80615234375, -2.15625, -1.50634765625, -0.8564453125, -0.20654296875, 0.443359375, 1.09326171875, 1.7431640625, 2.39306640625, 3.04296875, 3.69287109375, 4.3427734375, 4.99267578125, 5.642578125, 6.29248046875, 6.9423828125, 7.59228515625, 8.2421875, 8.89208984375, 9.5419921875, 10.19189453125, 10.841796875, 11.49169921875, 12.1416015625, 12.79150390625, 13.44140625, 14.09130859375, 14.7412109375, 15.39111328125, 16.041015625, 16.69091796875, 17.3408203125, 17.99072265625, 18.640625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 12.0, 22.0, 50.0, 85.0, 115.0, 139.0, 150.0, 147.0, 110.0, 72.0, 50.0, 31.0, 18.0, 7.0, 3.0], "bins": [-60.706565856933594, -59.61306381225586, -58.51956558227539, -57.426063537597656, -56.33256530761719, -55.23906326293945, -54.14556121826172, -53.05206298828125, -51.958560943603516, -50.86505889892578, -49.77156066894531, -48.67805862426758, -47.584556579589844, -46.491058349609375, -45.39755630493164, -44.30405807495117, -43.21055603027344, -42.1170539855957, -41.023555755615234, -39.9300537109375, -38.83655548095703, -37.7430534362793, -36.64955139160156, -35.556053161621094, -34.46255111694336, -33.369049072265625, -32.275550842285156, -31.182048797607422, -30.08854866027832, -28.99504852294922, -27.901546478271484, -26.808046340942383, -25.714550018310547, -24.621049880981445, -23.527549743652344, -22.43404769897461, -21.340547561645508, -20.247047424316406, -19.153545379638672, -18.06004524230957, -16.96654510498047, -15.873044967651367, -14.77954387664795, -13.686042785644531, -12.59254264831543, -11.499042510986328, -10.40554141998291, -9.312040328979492, -8.21854019165039, -7.125039577484131, -6.031538963317871, -4.938038349151611, -3.8445377349853516, -2.751037120819092, -1.657536506652832, -0.5640358924865723, 0.5294647216796875, 1.6229653358459473, 2.716465950012207, 3.809966564178467, 4.903467178344727, 5.996967792510986, 7.090468406677246, 8.183969497680664, 9.277469635009766]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 8.0, 9.0, 11.0, 13.0, 21.0, 16.0, 24.0, 31.0, 29.0, 31.0, 27.0, 28.0, 37.0, 41.0, 47.0, 46.0, 28.0, 50.0, 54.0, 47.0, 50.0, 33.0, 39.0, 33.0, 44.0, 22.0, 20.0, 21.0, 18.0, 19.0, 19.0, 7.0, 8.0, 21.0, 6.0, 11.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.46092987060547, -33.44132995605469, -32.421730041503906, -31.402130126953125, -30.382530212402344, -29.362930297851562, -28.34332847595215, -27.323728561401367, -26.304128646850586, -25.284528732299805, -24.264928817749023, -23.245328903198242, -22.225727081298828, -21.206127166748047, -20.186527252197266, -19.166927337646484, -18.147327423095703, -17.127727508544922, -16.10812759399414, -15.088526725769043, -14.068926811218262, -13.04932689666748, -12.029726028442383, -11.010126113891602, -9.99052619934082, -8.970926284790039, -7.9513258934021, -6.93172550201416, -5.912125587463379, -4.892525672912598, -3.872925281524658, -2.8533248901367188, -1.8337249755859375, -0.8141248226165771, 0.2054753303527832, 1.2250754833221436, 2.244675636291504, 3.264275550842285, 4.283875942230225, 5.303476333618164, 6.323076248168945, 7.342676162719727, 8.362276077270508, 9.381876945495605, 10.401476860046387, 11.421076774597168, 12.440677642822266, 13.460277557373047, 14.479877471923828, 15.49947738647461, 16.51907730102539, 17.538677215576172, 18.558277130126953, 19.577877044677734, 20.59747886657715, 21.61707878112793, 22.63667869567871, 23.656278610229492, 24.675878524780273, 25.695478439331055, 26.71508026123047, 27.73468017578125, 28.75428009033203, 29.773880004882812, 30.793479919433594]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 11.0, 18.0, 12.0, 8.0, 17.0, 17.0, 21.0, 29.0, 20.0, 25.0, 36.0, 34.0, 42.0, 40.0, 53.0, 37.0, 51.0, 58.0, 49.0, 48.0, 29.0, 34.0, 27.0, 33.0, 29.0, 28.0, 30.0, 18.0, 27.0, 17.0, 13.0, 10.0, 22.0, 9.0, 8.0, 6.0, 6.0, 4.0, 7.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.035614013671875, -3.91107177734375, -3.786529541015625, -3.6619873046875, -3.537445068359375, -3.41290283203125, -3.288360595703125, -3.163818359375, -3.039276123046875, -2.91473388671875, -2.790191650390625, -2.6656494140625, -2.541107177734375, -2.41656494140625, -2.292022705078125, -2.16748046875, -2.042938232421875, -1.91839599609375, -1.793853759765625, -1.6693115234375, -1.544769287109375, -1.42022705078125, -1.295684814453125, -1.171142578125, -1.046600341796875, -0.92205810546875, -0.797515869140625, -0.6729736328125, -0.548431396484375, -0.42388916015625, -0.299346923828125, -0.1748046875, -0.050262451171875, 0.07427978515625, 0.198822021484375, 0.3233642578125, 0.447906494140625, 0.57244873046875, 0.696990966796875, 0.821533203125, 0.946075439453125, 1.07061767578125, 1.195159912109375, 1.3197021484375, 1.444244384765625, 1.56878662109375, 1.693328857421875, 1.81787109375, 1.942413330078125, 2.06695556640625, 2.191497802734375, 2.3160400390625, 2.440582275390625, 2.56512451171875, 2.689666748046875, 2.814208984375, 2.938751220703125, 3.06329345703125, 3.187835693359375, 3.3123779296875, 3.436920166015625, 3.56146240234375, 3.686004638671875, 3.810546875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 17.0, 15.0, 9.0, 19.0, 22.0, 30.0, 45.0, 53.0, 75.0, 142.0, 212.0, 361.0, 748.0, 1482.0, 3365.0, 8978.0, 31787.0, 191536.0, 1580116.0, 2048505.0, 267471.0, 40742.0, 10886.0, 3931.0, 1745.0, 839.0, 408.0, 229.0, 146.0, 87.0, 83.0, 38.0, 33.0, 29.0, 24.0, 24.0, 13.0, 5.0, 10.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6875, -8.398681640625, -8.10986328125, -7.821044921875, -7.5322265625, -7.243408203125, -6.95458984375, -6.665771484375, -6.376953125, -6.088134765625, -5.79931640625, -5.510498046875, -5.2216796875, -4.932861328125, -4.64404296875, -4.355224609375, -4.06640625, -3.777587890625, -3.48876953125, -3.199951171875, -2.9111328125, -2.622314453125, -2.33349609375, -2.044677734375, -1.755859375, -1.467041015625, -1.17822265625, -0.889404296875, -0.6005859375, -0.311767578125, -0.02294921875, 0.265869140625, 0.5546875, 0.843505859375, 1.13232421875, 1.421142578125, 1.7099609375, 1.998779296875, 2.28759765625, 2.576416015625, 2.865234375, 3.154052734375, 3.44287109375, 3.731689453125, 4.0205078125, 4.309326171875, 4.59814453125, 4.886962890625, 5.17578125, 5.464599609375, 5.75341796875, 6.042236328125, 6.3310546875, 6.619873046875, 6.90869140625, 7.197509765625, 7.486328125, 7.775146484375, 8.06396484375, 8.352783203125, 8.6416015625, 8.930419921875, 9.21923828125, 9.508056640625, 9.796875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 5.0, 16.0, 12.0, 26.0, 27.0, 45.0, 55.0, 78.0, 93.0, 141.0, 215.0, 279.0, 397.0, 524.0, 573.0, 446.0, 319.0, 247.0, 148.0, 129.0, 72.0, 62.0, 40.0, 35.0, 15.0, 15.0, 14.0, 10.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.23828125, -7.006591796875, -6.77490234375, -6.543212890625, -6.3115234375, -6.079833984375, -5.84814453125, -5.616455078125, -5.384765625, -5.153076171875, -4.92138671875, -4.689697265625, -4.4580078125, -4.226318359375, -3.99462890625, -3.762939453125, -3.53125, -3.299560546875, -3.06787109375, -2.836181640625, -2.6044921875, -2.372802734375, -2.14111328125, -1.909423828125, -1.677734375, -1.446044921875, -1.21435546875, -0.982666015625, -0.7509765625, -0.519287109375, -0.28759765625, -0.055908203125, 0.17578125, 0.407470703125, 0.63916015625, 0.870849609375, 1.1025390625, 1.334228515625, 1.56591796875, 1.797607421875, 2.029296875, 2.260986328125, 2.49267578125, 2.724365234375, 2.9560546875, 3.187744140625, 3.41943359375, 3.651123046875, 3.8828125, 4.114501953125, 4.34619140625, 4.577880859375, 4.8095703125, 5.041259765625, 5.27294921875, 5.504638671875, 5.736328125, 5.968017578125, 6.19970703125, 6.431396484375, 6.6630859375, 6.894775390625, 7.12646484375, 7.358154296875, 7.58984375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 12.0, 14.0, 10.0, 12.0, 16.0, 25.0, 28.0, 48.0, 65.0, 87.0, 164.0, 218.0, 431.0, 1856.0, 53715.0, 4043571.0, 90323.0, 2389.0, 473.0, 288.0, 156.0, 101.0, 84.0, 60.0, 35.0, 28.0, 17.0, 19.0, 10.0, 9.0, 3.0, 5.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-45.125, -43.81884765625, -42.5126953125, -41.20654296875, -39.900390625, -38.59423828125, -37.2880859375, -35.98193359375, -34.67578125, -33.36962890625, -32.0634765625, -30.75732421875, -29.451171875, -28.14501953125, -26.8388671875, -25.53271484375, -24.2265625, -22.92041015625, -21.6142578125, -20.30810546875, -19.001953125, -17.69580078125, -16.3896484375, -15.08349609375, -13.77734375, -12.47119140625, -11.1650390625, -9.85888671875, -8.552734375, -7.24658203125, -5.9404296875, -4.63427734375, -3.328125, -2.02197265625, -0.7158203125, 0.59033203125, 1.896484375, 3.20263671875, 4.5087890625, 5.81494140625, 7.12109375, 8.42724609375, 9.7333984375, 11.03955078125, 12.345703125, 13.65185546875, 14.9580078125, 16.26416015625, 17.5703125, 18.87646484375, 20.1826171875, 21.48876953125, 22.794921875, 24.10107421875, 25.4072265625, 26.71337890625, 28.01953125, 29.32568359375, 30.6318359375, 31.93798828125, 33.244140625, 34.55029296875, 35.8564453125, 37.16259765625, 38.46875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 20.0, 53.0, 92.0, 138.0, 177.0, 168.0, 149.0, 105.0, 55.0, 24.0, 13.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.600791931152344, -17.844432830810547, -16.08807373046875, -14.33171558380127, -12.575357437133789, -10.818998336791992, -9.062639236450195, -7.306281089782715, -5.549921989440918, -3.7935633659362793, -2.0372045040130615, -0.28084564208984375, 1.475512981414795, 3.2318716049194336, 4.9882307052612305, 6.744588851928711, 8.500947952270508, 10.257307052612305, 12.013665199279785, 13.770024299621582, 15.526382446289062, 17.28274154663086, 19.039100646972656, 20.795459747314453, 22.55181884765625, 24.308177947998047, 26.064537048339844, 27.82089614868164, 29.577253341674805, 31.3336124420166, 33.08997344970703, 34.84632873535156, 36.60268783569336, 38.359046936035156, 40.11540603637695, 41.87176513671875, 43.62812423706055, 45.384483337402344, 47.140838623046875, 48.89719772338867, 50.65355682373047, 52.409915924072266, 54.16627502441406, 55.92263412475586, 57.678993225097656, 59.43534851074219, 61.19171142578125, 62.94806671142578, 64.70442962646484, 66.46078491210938, 68.21714782714844, 69.97350311279297, 71.72986602783203, 73.48622131347656, 75.24258422851562, 76.99893951416016, 78.75529479980469, 80.51165008544922, 82.26801300048828, 84.02436828613281, 85.78073120117188, 87.5370864868164, 89.29344940185547, 91.0498046875, 92.80616760253906]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 10.0, 4.0, 7.0, 9.0, 8.0, 13.0, 24.0, 15.0, 23.0, 30.0, 28.0, 27.0, 28.0, 42.0, 38.0, 27.0, 35.0, 32.0, 33.0, 31.0, 32.0, 37.0, 35.0, 39.0, 41.0, 39.0, 29.0, 42.0, 25.0, 37.0, 25.0, 21.0, 17.0, 14.0, 12.0, 13.0, 13.0, 10.0, 10.0, 6.0, 12.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 5.0, 1.0], "bins": [-22.695520401000977, -22.04084587097168, -21.386171340942383, -20.73149871826172, -20.076824188232422, -19.422149658203125, -18.767475128173828, -18.11280059814453, -17.458126068115234, -16.803451538085938, -16.14877700805664, -15.49410343170166, -14.83942985534668, -14.184755325317383, -13.530080795288086, -12.875406265258789, -12.220733642578125, -11.566059112548828, -10.911385536193848, -10.25671100616455, -9.60203742980957, -8.947362899780273, -8.292688369750977, -7.638014316558838, -6.983340263366699, -6.3286662101745605, -5.673992156982422, -5.019317626953125, -4.364643573760986, -3.7099695205688477, -3.05529522895813, -2.400620937347412, -1.7459487915039062, -1.091274619102478, -0.4366004467010498, 0.21807372570037842, 0.8727478981018066, 1.5274219512939453, 2.182096242904663, 2.836770534515381, 3.4914445877075195, 4.146118640899658, 4.800792694091797, 5.455467224121094, 6.110141277313232, 6.764815330505371, 7.419489860534668, 8.074163436889648, 8.728837966918945, 9.383512496948242, 10.038186073303223, 10.69286060333252, 11.3475341796875, 12.002208709716797, 12.656883239746094, 13.31155776977539, 13.966231346130371, 14.620905876159668, 15.275579452514648, 15.930253982543945, 16.584928512573242, 17.239601135253906, 17.894275665283203, 18.5489501953125, 19.203624725341797]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 8.0, 2.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 12.0, 11.0, 19.0, 26.0, 24.0, 19.0, 38.0, 23.0, 38.0, 44.0, 39.0, 53.0, 38.0, 38.0, 37.0, 42.0, 45.0, 33.0, 45.0, 29.0, 33.0, 28.0, 24.0, 23.0, 25.0, 25.0, 13.0, 17.0, 17.0, 22.0, 17.0, 15.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.939453125, -3.82269287109375, -3.7059326171875, -3.58917236328125, -3.472412109375, -3.35565185546875, -3.2388916015625, -3.12213134765625, -3.00537109375, -2.88861083984375, -2.7718505859375, -2.65509033203125, -2.538330078125, -2.42156982421875, -2.3048095703125, -2.18804931640625, -2.0712890625, -1.95452880859375, -1.8377685546875, -1.72100830078125, -1.604248046875, -1.48748779296875, -1.3707275390625, -1.25396728515625, -1.13720703125, -1.02044677734375, -0.9036865234375, -0.78692626953125, -0.670166015625, -0.55340576171875, -0.4366455078125, -0.31988525390625, -0.203125, -0.08636474609375, 0.0303955078125, 0.14715576171875, 0.263916015625, 0.38067626953125, 0.4974365234375, 0.61419677734375, 0.73095703125, 0.84771728515625, 0.9644775390625, 1.08123779296875, 1.197998046875, 1.31475830078125, 1.4315185546875, 1.54827880859375, 1.6650390625, 1.78179931640625, 1.8985595703125, 2.01531982421875, 2.132080078125, 2.24884033203125, 2.3656005859375, 2.48236083984375, 2.59912109375, 2.71588134765625, 2.8326416015625, 2.94940185546875, 3.066162109375, 3.18292236328125, 3.2996826171875, 3.41644287109375, 3.533203125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 8.0, 12.0, 12.0, 15.0, 32.0, 41.0, 70.0, 122.0, 168.0, 209.0, 354.0, 515.0, 822.0, 1201.0, 1686.0, 2515.0, 3845.0, 5872.0, 8390.0, 12648.0, 19356.0, 30151.0, 49108.0, 85605.0, 177136.0, 305986.0, 144983.0, 74906.0, 43469.0, 27036.0, 17387.0, 11355.0, 7623.0, 5209.0, 3494.0, 2367.0, 1602.0, 1083.0, 707.0, 486.0, 334.0, 209.0, 134.0, 95.0, 64.0, 57.0, 27.0, 21.0, 13.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.170654296875, -0.1650371551513672, -0.15942001342773438, -0.15380287170410156, -0.14818572998046875, -0.14256858825683594, -0.13695144653320312, -0.1313343048095703, -0.1257171630859375, -0.12010002136230469, -0.11448287963867188, -0.10886573791503906, -0.10324859619140625, -0.09763145446777344, -0.09201431274414062, -0.08639717102050781, -0.080780029296875, -0.07516288757324219, -0.06954574584960938, -0.06392860412597656, -0.05831146240234375, -0.05269432067871094, -0.047077178955078125, -0.04146003723144531, -0.0358428955078125, -0.030225753784179688, -0.024608612060546875, -0.018991470336914062, -0.01337432861328125, -0.0077571868896484375, -0.002140045166015625, 0.0034770965576171875, 0.00909423828125, 0.014711380004882812, 0.020328521728515625, 0.025945663452148438, 0.03156280517578125, 0.03717994689941406, 0.042797088623046875, 0.04841423034667969, 0.0540313720703125, 0.05964851379394531, 0.06526565551757812, 0.07088279724121094, 0.07649993896484375, 0.08211708068847656, 0.08773422241210938, 0.09335136413574219, 0.098968505859375, 0.10458564758300781, 0.11020278930664062, 0.11581993103027344, 0.12143707275390625, 0.12705421447753906, 0.13267135620117188, 0.1382884979248047, 0.1439056396484375, 0.1495227813720703, 0.15513992309570312, 0.16075706481933594, 0.16637420654296875, 0.17199134826660156, 0.17760848999023438, 0.1832256317138672, 0.1888427734375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 5.0, 9.0, 8.0, 10.0, 15.0, 15.0, 14.0, 19.0, 19.0, 26.0, 25.0, 23.0, 33.0, 37.0, 31.0, 33.0, 33.0, 36.0, 40.0, 40.0, 1061.0, 34.0, 30.0, 42.0, 56.0, 34.0, 30.0, 24.0, 26.0, 20.0, 21.0, 32.0, 18.0, 16.0, 13.0, 17.0, 10.0, 7.0, 6.0, 6.0, 10.0, 4.0, 5.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.822265625, -2.72857666015625, -2.6348876953125, -2.54119873046875, -2.447509765625, -2.35382080078125, -2.2601318359375, -2.16644287109375, -2.07275390625, -1.97906494140625, -1.8853759765625, -1.79168701171875, -1.697998046875, -1.60430908203125, -1.5106201171875, -1.41693115234375, -1.3232421875, -1.22955322265625, -1.1358642578125, -1.04217529296875, -0.948486328125, -0.85479736328125, -0.7611083984375, -0.66741943359375, -0.57373046875, -0.48004150390625, -0.3863525390625, -0.29266357421875, -0.198974609375, -0.10528564453125, -0.0115966796875, 0.08209228515625, 0.17578125, 0.26947021484375, 0.3631591796875, 0.45684814453125, 0.550537109375, 0.64422607421875, 0.7379150390625, 0.83160400390625, 0.92529296875, 1.01898193359375, 1.1126708984375, 1.20635986328125, 1.300048828125, 1.39373779296875, 1.4874267578125, 1.58111572265625, 1.6748046875, 1.76849365234375, 1.8621826171875, 1.95587158203125, 2.049560546875, 2.14324951171875, 2.2369384765625, 2.33062744140625, 2.42431640625, 2.51800537109375, 2.6116943359375, 2.70538330078125, 2.799072265625, 2.89276123046875, 2.9864501953125, 3.08013916015625, 3.173828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 6.0, 1.0, 1.0, 6.0, 7.0, 12.0, 22.0, 13.0, 36.0, 48.0, 67.0, 95.0, 156.0, 211.0, 342.0, 475.0, 698.0, 965.0, 1561.0, 2176.0, 3274.0, 4992.0, 7461.0, 11118.0, 17063.0, 26337.0, 41901.0, 68749.0, 123315.0, 1250471.0, 259724.0, 107324.0, 61036.0, 37490.0, 23842.0, 15728.0, 9995.0, 6704.0, 4494.0, 2921.0, 1995.0, 1435.0, 904.0, 624.0, 402.0, 300.0, 188.0, 137.0, 95.0, 73.0, 52.0, 29.0, 22.0, 26.0, 7.0, 9.0, 3.0, 8.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.060638427734375, -0.058675289154052734, -0.05671215057373047, -0.0547490119934082, -0.05278587341308594, -0.05082273483276367, -0.048859596252441406, -0.04689645767211914, -0.044933319091796875, -0.04297018051147461, -0.041007041931152344, -0.03904390335083008, -0.03708076477050781, -0.03511762619018555, -0.03315448760986328, -0.031191349029541016, -0.02922821044921875, -0.027265071868896484, -0.02530193328857422, -0.023338794708251953, -0.021375656127929688, -0.019412517547607422, -0.017449378967285156, -0.01548624038696289, -0.013523101806640625, -0.01155996322631836, -0.009596824645996094, -0.007633686065673828, -0.0056705474853515625, -0.003707408905029297, -0.0017442703247070312, 0.00021886825561523438, 0.0021820068359375, 0.004145145416259766, 0.006108283996582031, 0.008071422576904297, 0.010034561157226562, 0.011997699737548828, 0.013960838317871094, 0.01592397689819336, 0.017887115478515625, 0.01985025405883789, 0.021813392639160156, 0.023776531219482422, 0.025739669799804688, 0.027702808380126953, 0.02966594696044922, 0.031629085540771484, 0.03359222412109375, 0.035555362701416016, 0.03751850128173828, 0.03948163986206055, 0.04144477844238281, 0.04340791702270508, 0.045371055603027344, 0.04733419418334961, 0.049297332763671875, 0.05126047134399414, 0.053223609924316406, 0.05518674850463867, 0.05714988708496094, 0.0591130256652832, 0.06107616424560547, 0.06303930282592773, 0.06500244140625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 9.0, 6.0, 4.0, 5.0, 10.0, 9.0, 17.0, 18.0, 27.0, 21.0, 29.0, 29.0, 49.0, 47.0, 56.0, 57.0, 76.0, 92.0, 70.0, 62.0, 43.0, 44.0, 38.0, 26.0, 29.0, 24.0, 15.0, 16.0, 9.0, 10.0, 13.0, 8.0, 7.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0008101463317871094, -0.0007843151688575745, -0.0007584840059280396, -0.0007326528429985046, -0.0007068216800689697, -0.0006809905171394348, -0.0006551593542098999, -0.000629328191280365, -0.0006034970283508301, -0.0005776658654212952, -0.0005518347024917603, -0.0005260035395622253, -0.0005001723766326904, -0.0004743412137031555, -0.0004485100507736206, -0.0004226788878440857, -0.0003968477249145508, -0.00037101656198501587, -0.00034518539905548096, -0.00031935423612594604, -0.00029352307319641113, -0.0002676919102668762, -0.0002418607473373413, -0.0002160295844078064, -0.00019019842147827148, -0.00016436725854873657, -0.00013853609561920166, -0.00011270493268966675, -8.687376976013184e-05, -6.104260683059692e-05, -3.521144390106201e-05, -9.3802809715271e-06, 1.6450881958007812e-05, 4.2282044887542725e-05, 6.811320781707764e-05, 9.394437074661255e-05, 0.00011977553367614746, 0.00014560669660568237, 0.00017143785953521729, 0.0001972690224647522, 0.0002231001853942871, 0.000248931348323822, 0.00027476251125335693, 0.00030059367418289185, 0.00032642483711242676, 0.00035225600004196167, 0.0003780871629714966, 0.0004039183259010315, 0.0004297494888305664, 0.0004555806517601013, 0.00048141181468963623, 0.0005072429776191711, 0.0005330741405487061, 0.000558905303478241, 0.0005847364664077759, 0.0006105676293373108, 0.0006363987922668457, 0.0006622299551963806, 0.0006880611181259155, 0.0007138922810554504, 0.0007397234439849854, 0.0007655546069145203, 0.0007913857698440552, 0.0008172169327735901, 0.000843048095703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 3.0, 5.0, 6.0, 15.0, 8.0, 7.0, 20.0, 13.0, 24.0, 33.0, 29.0, 41.0, 70.0, 129.0, 275.0, 2429.0, 931986.0, 112052.0, 814.0, 181.0, 109.0, 74.0, 38.0, 32.0, 30.0, 26.0, 16.0, 21.0, 14.0, 6.0, 4.0, 4.0, 7.0, 8.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0198822021484375, -0.01927661895751953, -0.018671035766601562, -0.018065452575683594, -0.017459869384765625, -0.016854286193847656, -0.016248703002929688, -0.01564311981201172, -0.01503753662109375, -0.014431953430175781, -0.013826370239257812, -0.013220787048339844, -0.012615203857421875, -0.012009620666503906, -0.011404037475585938, -0.010798454284667969, -0.01019287109375, -0.009587287902832031, -0.008981704711914062, -0.008376121520996094, -0.007770538330078125, -0.007164955139160156, -0.0065593719482421875, -0.005953788757324219, -0.00534820556640625, -0.004742622375488281, -0.0041370391845703125, -0.0035314559936523438, -0.002925872802734375, -0.0023202896118164062, -0.0017147064208984375, -0.0011091232299804688, -0.0005035400390625, 0.00010204315185546875, 0.0007076263427734375, 0.0013132095336914062, 0.001918792724609375, 0.0025243759155273438, 0.0031299591064453125, 0.0037355422973632812, 0.00434112548828125, 0.004946708679199219, 0.0055522918701171875, 0.006157875061035156, 0.006763458251953125, 0.007369041442871094, 0.007974624633789062, 0.008580207824707031, 0.009185791015625, 0.009791374206542969, 0.010396957397460938, 0.011002540588378906, 0.011608123779296875, 0.012213706970214844, 0.012819290161132812, 0.013424873352050781, 0.01403045654296875, 0.014636039733886719, 0.015241622924804688, 0.015847206115722656, 0.016452789306640625, 0.017058372497558594, 0.017663955688476562, 0.01826953887939453, 0.0188751220703125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 940.0, 67.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034326589666306973, -0.003038111375644803, -0.002643563784658909, -0.002249015960842371, -0.0018544683698564768, -0.0014599207788705826, -0.0010653729550540447, -0.0006708253640681505, -0.0002762777730822563, 0.0001182698761112988, 0.0005128175253048539, 0.00090736523270607, 0.0013019128236919641, 0.0016964604146778584, 0.002091008238494396, 0.0024855558294802904, 0.0028801034204661846, 0.003274651011452079, 0.003669198602437973, 0.004063746426254511, 0.004458294250071049, 0.004852841608226299, 0.005247389432042837, 0.005641937255859375, 0.0060364846140146255, 0.006431032437831163, 0.006825579795986414, 0.007220127619802952, 0.007614674977958202, 0.008009223267436028, 0.008403770625591278, 0.008798317983746529, 0.00919286534190178, 0.00958741270005703, 0.009981960989534855, 0.010376508347690105, 0.010771055705845356, 0.011165603995323181, 0.011560151353478432, 0.011954698711633682, 0.012349246069788933, 0.012743793427944183, 0.013138341717422009, 0.013532889075577259, 0.01392743643373251, 0.014321984723210335, 0.014716532081365585, 0.015111079439520836, 0.015505627728998661, 0.015900176018476486, 0.016294723376631737, 0.016689270734786987, 0.017083818092942238, 0.01747836545109749, 0.017872914671897888, 0.01826746203005314, 0.01866200938820839, 0.01905655674636364, 0.01945110410451889, 0.01984565332531929, 0.02024020068347454, 0.02063474804162979, 0.021029295399785042, 0.021423842757940292, 0.021818390116095543]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 7.0, 5.0, 2.0, 8.0, 5.0, 2.0, 8.0, 13.0, 24.0, 21.0, 25.0, 26.0, 24.0, 27.0, 42.0, 40.0, 43.0, 44.0, 54.0, 49.0, 50.0, 42.0, 66.0, 68.0, 50.0, 42.0, 42.0, 30.0, 23.0, 32.0, 20.0, 19.0, 19.0, 12.0, 9.0, 3.0, 3.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009229183197021484, -0.0008987244218587875, -0.0008745305240154266, -0.0008503366261720657, -0.0008261427283287048, -0.0008019488304853439, -0.000777754932641983, -0.0007535610347986221, -0.0007293671369552612, -0.0007051732391119003, -0.0006809793412685394, -0.0006567854434251785, -0.0006325915455818176, -0.0006083976477384567, -0.0005842037498950958, -0.0005600098520517349, -0.000535815954208374, -0.0005116220563650131, -0.0004874281585216522, -0.0004632342606782913, -0.0004390403628349304, -0.0004148464649915695, -0.0003906525671482086, -0.0003664586693048477, -0.0003422647714614868, -0.0003180708736181259, -0.000293876975774765, -0.0002696830779314041, -0.0002454891800880432, -0.0002212952822446823, -0.0001971013844013214, -0.0001729074865579605, -0.0001487135887145996, -0.0001245196908712387, -0.00010032579302787781, -7.61318951845169e-05, -5.1937997341156006e-05, -2.7744099497795105e-05, -3.550201654434204e-06, 2.0643696188926697e-05, 4.48375940322876e-05, 6.90314918756485e-05, 9.32253897190094e-05, 0.0001174192875623703, 0.0001416131854057312, 0.0001658070832490921, 0.000190000981092453, 0.0002141948789358139, 0.0002383887767791748, 0.0002625826746225357, 0.0002867765724658966, 0.0003109704703092575, 0.0003351643681526184, 0.0003593582659959793, 0.0003835521638393402, 0.0004077460616827011, 0.000431939959526062, 0.0004561338573694229, 0.0004803277552127838, 0.0005045216530561447, 0.0005287155508995056, 0.0005529094487428665, 0.0005771033465862274, 0.0006012972444295883, 0.0006254911422729492]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 8.0, 2.0, 7.0, 3.0, 9.0, 8.0, 11.0, 11.0, 12.0, 11.0, 19.0, 26.0, 24.0, 19.0, 38.0, 23.0, 38.0, 44.0, 39.0, 53.0, 38.0, 38.0, 37.0, 42.0, 45.0, 33.0, 45.0, 29.0, 33.0, 28.0, 24.0, 23.0, 25.0, 25.0, 13.0, 17.0, 17.0, 22.0, 17.0, 15.0, 7.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.939453125, -3.82269287109375, -3.7059326171875, -3.58917236328125, -3.472412109375, -3.35565185546875, -3.2388916015625, -3.12213134765625, -3.00537109375, -2.88861083984375, -2.7718505859375, -2.65509033203125, -2.538330078125, -2.42156982421875, -2.3048095703125, -2.18804931640625, -2.0712890625, -1.95452880859375, -1.8377685546875, -1.72100830078125, -1.604248046875, -1.48748779296875, -1.3707275390625, -1.25396728515625, -1.13720703125, -1.02044677734375, -0.9036865234375, -0.78692626953125, -0.670166015625, -0.55340576171875, -0.4366455078125, -0.31988525390625, -0.203125, -0.08636474609375, 0.0303955078125, 0.14715576171875, 0.263916015625, 0.38067626953125, 0.4974365234375, 0.61419677734375, 0.73095703125, 0.84771728515625, 0.9644775390625, 1.08123779296875, 1.197998046875, 1.31475830078125, 1.4315185546875, 1.54827880859375, 1.6650390625, 1.78179931640625, 1.8985595703125, 2.01531982421875, 2.132080078125, 2.24884033203125, 2.3656005859375, 2.48236083984375, 2.59912109375, 2.71588134765625, 2.8326416015625, 2.94940185546875, 3.066162109375, 3.18292236328125, 3.2996826171875, 3.41644287109375, 3.533203125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 2.0, 5.0, 11.0, 12.0, 19.0, 32.0, 37.0, 62.0, 91.0, 128.0, 232.0, 442.0, 682.0, 1142.0, 1971.0, 3624.0, 7217.0, 15408.0, 35202.0, 93157.0, 350008.0, 372525.0, 97460.0, 36383.0, 16312.0, 7617.0, 3892.0, 2030.0, 1125.0, 645.0, 388.0, 228.0, 175.0, 103.0, 62.0, 50.0, 31.0, 20.0, 8.0, 9.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.61328125, -6.39300537109375, -6.1727294921875, -5.95245361328125, -5.732177734375, -5.51190185546875, -5.2916259765625, -5.07135009765625, -4.85107421875, -4.63079833984375, -4.4105224609375, -4.19024658203125, -3.969970703125, -3.74969482421875, -3.5294189453125, -3.30914306640625, -3.0888671875, -2.86859130859375, -2.6483154296875, -2.42803955078125, -2.207763671875, -1.98748779296875, -1.7672119140625, -1.54693603515625, -1.32666015625, -1.10638427734375, -0.8861083984375, -0.66583251953125, -0.445556640625, -0.22528076171875, -0.0050048828125, 0.21527099609375, 0.435546875, 0.65582275390625, 0.8760986328125, 1.09637451171875, 1.316650390625, 1.53692626953125, 1.7572021484375, 1.97747802734375, 2.19775390625, 2.41802978515625, 2.6383056640625, 2.85858154296875, 3.078857421875, 3.29913330078125, 3.5194091796875, 3.73968505859375, 3.9599609375, 4.18023681640625, 4.4005126953125, 4.62078857421875, 4.841064453125, 5.06134033203125, 5.2816162109375, 5.50189208984375, 5.72216796875, 5.94244384765625, 6.1627197265625, 6.38299560546875, 6.603271484375, 6.82354736328125, 7.0438232421875, 7.26409912109375, 7.484375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 12.0, 10.0, 9.0, 8.0, 16.0, 11.0, 22.0, 18.0, 34.0, 37.0, 30.0, 36.0, 42.0, 43.0, 58.0, 55.0, 113.0, 191.0, 1405.0, 262.0, 126.0, 78.0, 66.0, 54.0, 38.0, 27.0, 46.0, 24.0, 28.0, 29.0, 21.0, 17.0, 13.0, 17.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.5703125, -12.1861572265625, -11.802001953125, -11.4178466796875, -11.03369140625, -10.6495361328125, -10.265380859375, -9.8812255859375, -9.4970703125, -9.1129150390625, -8.728759765625, -8.3446044921875, -7.96044921875, -7.5762939453125, -7.192138671875, -6.8079833984375, -6.423828125, -6.0396728515625, -5.655517578125, -5.2713623046875, -4.88720703125, -4.5030517578125, -4.118896484375, -3.7347412109375, -3.3505859375, -2.9664306640625, -2.582275390625, -2.1981201171875, -1.81396484375, -1.4298095703125, -1.045654296875, -0.6614990234375, -0.27734375, 0.1068115234375, 0.490966796875, 0.8751220703125, 1.25927734375, 1.6434326171875, 2.027587890625, 2.4117431640625, 2.7958984375, 3.1800537109375, 3.564208984375, 3.9483642578125, 4.33251953125, 4.7166748046875, 5.100830078125, 5.4849853515625, 5.869140625, 6.2532958984375, 6.637451171875, 7.0216064453125, 7.40576171875, 7.7899169921875, 8.174072265625, 8.5582275390625, 8.9423828125, 9.3265380859375, 9.710693359375, 10.0948486328125, 10.47900390625, 10.8631591796875, 11.247314453125, 11.6314697265625, 12.015625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 10.0, 9.0, 25.0, 22.0, 27.0, 26.0, 45.0, 44.0, 70.0, 102.0, 159.0, 357.0, 775.0, 2267.0, 8140.0, 57964.0, 1946268.0, 1076769.0, 42504.0, 6701.0, 1889.0, 690.0, 278.0, 159.0, 94.0, 65.0, 50.0, 37.0, 33.0, 23.0, 18.0, 16.0, 10.0, 10.0, 8.0, 7.0, 3.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.921875, -19.27783203125, -18.6337890625, -17.98974609375, -17.345703125, -16.70166015625, -16.0576171875, -15.41357421875, -14.76953125, -14.12548828125, -13.4814453125, -12.83740234375, -12.193359375, -11.54931640625, -10.9052734375, -10.26123046875, -9.6171875, -8.97314453125, -8.3291015625, -7.68505859375, -7.041015625, -6.39697265625, -5.7529296875, -5.10888671875, -4.46484375, -3.82080078125, -3.1767578125, -2.53271484375, -1.888671875, -1.24462890625, -0.6005859375, 0.04345703125, 0.6875, 1.33154296875, 1.9755859375, 2.61962890625, 3.263671875, 3.90771484375, 4.5517578125, 5.19580078125, 5.83984375, 6.48388671875, 7.1279296875, 7.77197265625, 8.416015625, 9.06005859375, 9.7041015625, 10.34814453125, 10.9921875, 11.63623046875, 12.2802734375, 12.92431640625, 13.568359375, 14.21240234375, 14.8564453125, 15.50048828125, 16.14453125, 16.78857421875, 17.4326171875, 18.07666015625, 18.720703125, 19.36474609375, 20.0087890625, 20.65283203125, 21.296875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [4.0, 41.0, 190.0, 412.0, 294.0, 71.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.550666809082031, -8.441230773925781, -5.331793785095215, -2.2223567962646484, 0.8870792388916016, 3.9965152740478516, 7.105953216552734, 10.215389251708984, 13.324825286865234, 16.434261322021484, 19.543697357177734, 22.653135299682617, 25.762571334838867, 28.872007369995117, 31.9814453125, 35.09088134765625, 38.2003173828125, 41.30975341796875, 44.419189453125, 47.52862548828125, 50.6380615234375, 53.74749755859375, 56.856937408447266, 59.966373443603516, 63.075809478759766, 66.18524932861328, 69.29468536376953, 72.40412139892578, 75.51355743408203, 78.62299346923828, 81.73242950439453, 84.84186553955078, 87.9512939453125, 91.06072998046875, 94.170166015625, 97.27960205078125, 100.3890380859375, 103.49847412109375, 106.60791015625, 109.71734619140625, 112.8267822265625, 115.93621826171875, 119.045654296875, 122.15509033203125, 125.2645263671875, 128.37396240234375, 131.4833984375, 134.59283447265625, 137.7022705078125, 140.81170654296875, 143.921142578125, 147.03057861328125, 150.1400146484375, 153.24945068359375, 156.35888671875, 159.46832275390625, 162.57777404785156, 165.6872100830078, 168.79664611816406, 171.9060821533203, 175.01551818847656, 178.1249542236328, 181.23439025878906, 184.3438262939453, 187.45326232910156]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 8.0, 4.0, 4.0, 15.0, 12.0, 17.0, 12.0, 16.0, 16.0, 20.0, 27.0, 30.0, 31.0, 28.0, 25.0, 50.0, 46.0, 41.0, 40.0, 46.0, 48.0, 41.0, 38.0, 45.0, 33.0, 38.0, 35.0, 22.0, 23.0, 25.0, 30.0, 18.0, 22.0, 10.0, 19.0, 13.0, 15.0, 11.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.978919982910156, -37.775390625, -36.571861267089844, -35.36833572387695, -34.1648063659668, -32.96127700805664, -31.757749557495117, -30.554222106933594, -29.350692749023438, -28.14716339111328, -26.943635940551758, -25.740108489990234, -24.536579132080078, -23.333049774169922, -22.1295223236084, -20.925994873046875, -19.72246551513672, -18.518936157226562, -17.31540870666504, -16.111881256103516, -14.90835189819336, -13.70482349395752, -12.50129508972168, -11.29776668548584, -10.09423828125, -8.89070987701416, -7.68718147277832, -6.4836530685424805, -5.280124664306641, -4.076596260070801, -2.873067855834961, -1.669539451599121, -0.4660148620605469, 0.737513542175293, 1.9410419464111328, 3.1445703506469727, 4.3480987548828125, 5.551627159118652, 6.755155563354492, 7.958683967590332, 9.162212371826172, 10.365740776062012, 11.569269180297852, 12.772797584533691, 13.976325988769531, 15.179854393005371, 16.38338279724121, 17.586910247802734, 18.79043960571289, 19.993968963623047, 21.19749641418457, 22.401023864746094, 23.60455322265625, 24.808082580566406, 26.01161003112793, 27.215137481689453, 28.41866683959961, 29.622196197509766, 30.82572364807129, 32.02925109863281, 33.23278045654297, 34.436309814453125, 35.63983917236328, 36.84336471557617, 38.04689407348633]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 8.0, 7.0, 8.0, 9.0, 5.0, 10.0, 15.0, 25.0, 15.0, 15.0, 26.0, 32.0, 33.0, 33.0, 34.0, 30.0, 45.0, 45.0, 55.0, 41.0, 39.0, 50.0, 24.0, 48.0, 36.0, 22.0, 20.0, 32.0, 24.0, 30.0, 25.0, 18.0, 16.0, 22.0, 23.0, 16.0, 11.0, 8.0, 13.0, 5.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.3359375, -4.212860107421875, -4.08978271484375, -3.966705322265625, -3.8436279296875, -3.720550537109375, -3.59747314453125, -3.474395751953125, -3.351318359375, -3.228240966796875, -3.10516357421875, -2.982086181640625, -2.8590087890625, -2.735931396484375, -2.61285400390625, -2.489776611328125, -2.36669921875, -2.243621826171875, -2.12054443359375, -1.997467041015625, -1.8743896484375, -1.751312255859375, -1.62823486328125, -1.505157470703125, -1.382080078125, -1.259002685546875, -1.13592529296875, -1.012847900390625, -0.8897705078125, -0.766693115234375, -0.64361572265625, -0.520538330078125, -0.3974609375, -0.274383544921875, -0.15130615234375, -0.028228759765625, 0.0948486328125, 0.217926025390625, 0.34100341796875, 0.464080810546875, 0.587158203125, 0.710235595703125, 0.83331298828125, 0.956390380859375, 1.0794677734375, 1.202545166015625, 1.32562255859375, 1.448699951171875, 1.57177734375, 1.694854736328125, 1.81793212890625, 1.941009521484375, 2.0640869140625, 2.187164306640625, 2.31024169921875, 2.433319091796875, 2.556396484375, 2.679473876953125, 2.80255126953125, 2.925628662109375, 3.0487060546875, 3.171783447265625, 3.29486083984375, 3.417938232421875, 3.541015625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 11.0, 13.0, 11.0, 26.0, 29.0, 30.0, 61.0, 76.0, 139.0, 227.0, 503.0, 1390.0, 4773.0, 28063.0, 527902.0, 3220112.0, 381677.0, 22859.0, 4111.0, 1179.0, 440.0, 222.0, 129.0, 93.0, 46.0, 40.0, 31.0, 20.0, 19.0, 7.0, 12.0, 6.0, 3.0, 3.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.26416015625, -11.8173828125, -11.37060546875, -10.923828125, -10.47705078125, -10.0302734375, -9.58349609375, -9.13671875, -8.68994140625, -8.2431640625, -7.79638671875, -7.349609375, -6.90283203125, -6.4560546875, -6.00927734375, -5.5625, -5.11572265625, -4.6689453125, -4.22216796875, -3.775390625, -3.32861328125, -2.8818359375, -2.43505859375, -1.98828125, -1.54150390625, -1.0947265625, -0.64794921875, -0.201171875, 0.24560546875, 0.6923828125, 1.13916015625, 1.5859375, 2.03271484375, 2.4794921875, 2.92626953125, 3.373046875, 3.81982421875, 4.2666015625, 4.71337890625, 5.16015625, 5.60693359375, 6.0537109375, 6.50048828125, 6.947265625, 7.39404296875, 7.8408203125, 8.28759765625, 8.734375, 9.18115234375, 9.6279296875, 10.07470703125, 10.521484375, 10.96826171875, 11.4150390625, 11.86181640625, 12.30859375, 12.75537109375, 13.2021484375, 13.64892578125, 14.095703125, 14.54248046875, 14.9892578125, 15.43603515625, 15.8828125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 11.0, 12.0, 20.0, 32.0, 42.0, 30.0, 71.0, 113.0, 174.0, 243.0, 352.0, 535.0, 668.0, 515.0, 403.0, 248.0, 180.0, 130.0, 90.0, 62.0, 44.0, 25.0, 31.0, 12.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.515625, -10.2432861328125, -9.970947265625, -9.6986083984375, -9.42626953125, -9.1539306640625, -8.881591796875, -8.6092529296875, -8.3369140625, -8.0645751953125, -7.792236328125, -7.5198974609375, -7.24755859375, -6.9752197265625, -6.702880859375, -6.4305419921875, -6.158203125, -5.8858642578125, -5.613525390625, -5.3411865234375, -5.06884765625, -4.7965087890625, -4.524169921875, -4.2518310546875, -3.9794921875, -3.7071533203125, -3.434814453125, -3.1624755859375, -2.89013671875, -2.6177978515625, -2.345458984375, -2.0731201171875, -1.80078125, -1.5284423828125, -1.256103515625, -0.9837646484375, -0.71142578125, -0.4390869140625, -0.166748046875, 0.1055908203125, 0.3779296875, 0.6502685546875, 0.922607421875, 1.1949462890625, 1.46728515625, 1.7396240234375, 2.011962890625, 2.2843017578125, 2.556640625, 2.8289794921875, 3.101318359375, 3.3736572265625, 3.64599609375, 3.9183349609375, 4.190673828125, 4.4630126953125, 4.7353515625, 5.0076904296875, 5.280029296875, 5.5523681640625, 5.82470703125, 6.0970458984375, 6.369384765625, 6.6417236328125, 6.9140625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 2.0, 7.0, 16.0, 33.0, 34.0, 59.0, 97.0, 143.0, 260.0, 524.0, 1540.0, 15132.0, 3219881.0, 947011.0, 7383.0, 1176.0, 435.0, 211.0, 112.0, 64.0, 45.0, 43.0, 20.0, 15.0, 10.0, 5.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.734375, -28.585693359375, -27.43701171875, -26.288330078125, -25.1396484375, -23.990966796875, -22.84228515625, -21.693603515625, -20.544921875, -19.396240234375, -18.24755859375, -17.098876953125, -15.9501953125, -14.801513671875, -13.65283203125, -12.504150390625, -11.35546875, -10.206787109375, -9.05810546875, -7.909423828125, -6.7607421875, -5.612060546875, -4.46337890625, -3.314697265625, -2.166015625, -1.017333984375, 0.13134765625, 1.280029296875, 2.4287109375, 3.577392578125, 4.72607421875, 5.874755859375, 7.0234375, 8.172119140625, 9.32080078125, 10.469482421875, 11.6181640625, 12.766845703125, 13.91552734375, 15.064208984375, 16.212890625, 17.361572265625, 18.51025390625, 19.658935546875, 20.8076171875, 21.956298828125, 23.10498046875, 24.253662109375, 25.40234375, 26.551025390625, 27.69970703125, 28.848388671875, 29.9970703125, 31.145751953125, 32.29443359375, 33.443115234375, 34.591796875, 35.740478515625, 36.88916015625, 38.037841796875, 39.1865234375, 40.335205078125, 41.48388671875, 42.632568359375, 43.78125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 65.0, 224.0, 365.0, 250.0, 84.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.75772476196289, -38.14714431762695, -34.53656005859375, -30.925979614257812, -27.315399169921875, -23.704818725585938, -20.094236373901367, -16.483654022216797, -12.87307357788086, -9.262492179870605, -5.651910781860352, -2.0413293838500977, 1.5692520141601562, 5.179832458496094, 8.790414810180664, 12.400997161865234, 16.011577606201172, 19.62215805053711, 23.23274040222168, 26.84332275390625, 30.453903198242188, 34.064483642578125, 37.67506408691406, 41.285648345947266, 44.8962287902832, 48.50680923461914, 52.117393493652344, 55.72797393798828, 59.33855438232422, 62.949134826660156, 66.5597152709961, 70.17030334472656, 73.7808837890625, 77.39146423339844, 81.00204467773438, 84.61262512207031, 88.22320556640625, 91.83378601074219, 95.44437408447266, 99.0549545288086, 102.66553497314453, 106.27611541748047, 109.8866958618164, 113.49727630615234, 117.10786437988281, 120.71844482421875, 124.32902526855469, 127.93960571289062, 131.55018615722656, 135.1607666015625, 138.77134704589844, 142.38192749023438, 145.9925079345703, 149.60308837890625, 153.2136688232422, 156.82424926757812, 160.43484497070312, 164.04542541503906, 167.656005859375, 171.26658630371094, 174.87716674804688, 178.4877471923828, 182.09832763671875, 185.70892333984375, 189.31948852539062]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 7.0, 6.0, 8.0, 10.0, 14.0, 12.0, 18.0, 12.0, 16.0, 24.0, 34.0, 30.0, 21.0, 35.0, 37.0, 31.0, 42.0, 47.0, 46.0, 43.0, 35.0, 35.0, 36.0, 42.0, 34.0, 32.0, 35.0, 27.0, 38.0, 33.0, 23.0, 23.0, 8.0, 17.0, 23.0, 10.0, 10.0, 14.0, 9.0, 2.0, 5.0, 3.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.64120101928711, -23.8935489654541, -23.145896911621094, -22.39824676513672, -21.65059471130371, -20.902942657470703, -20.155290603637695, -19.407638549804688, -18.659988403320312, -17.912336349487305, -17.164684295654297, -16.417034149169922, -15.669382095336914, -14.921730041503906, -14.174077987670898, -13.426426887512207, -12.6787748336792, -11.931122779846191, -11.1834716796875, -10.435819625854492, -9.6881685256958, -8.940516471862793, -8.192865371704102, -7.445213317871094, -6.697561740875244, -5.9499101638793945, -5.202258586883545, -4.454607009887695, -3.7069551944732666, -2.959303617477417, -2.2116518020629883, -1.4640002250671387, -0.7163486480712891, 0.03130298852920532, 0.7789546251296997, 1.5266063213348389, 2.2742578983306885, 3.021909475326538, 3.769561290740967, 4.517212867736816, 5.264864444732666, 6.012516021728516, 6.760167598724365, 7.507819175720215, 8.255471229553223, 9.003122329711914, 9.750774383544922, 10.49842643737793, 11.246077537536621, 11.993729591369629, 12.74138069152832, 13.489032745361328, 14.23668384552002, 14.984335899353027, 15.731986999511719, 16.479639053344727, 17.227291107177734, 17.974943161010742, 18.72259521484375, 19.470245361328125, 20.217897415161133, 20.96554946899414, 21.71320152282715, 22.460853576660156, 23.20850372314453]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 8.0, 8.0, 2.0, 8.0, 15.0, 19.0, 19.0, 18.0, 28.0, 28.0, 28.0, 31.0, 39.0, 46.0, 48.0, 31.0, 45.0, 42.0, 46.0, 45.0, 38.0, 42.0, 33.0, 35.0, 32.0, 33.0, 36.0, 27.0, 22.0, 15.0, 23.0, 13.0, 20.0, 19.0, 6.0, 13.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44921875, -4.320526123046875, -4.19183349609375, -4.063140869140625, -3.9344482421875, -3.805755615234375, -3.67706298828125, -3.548370361328125, -3.419677734375, -3.290985107421875, -3.16229248046875, -3.033599853515625, -2.9049072265625, -2.776214599609375, -2.64752197265625, -2.518829345703125, -2.39013671875, -2.261444091796875, -2.13275146484375, -2.004058837890625, -1.8753662109375, -1.746673583984375, -1.61798095703125, -1.489288330078125, -1.360595703125, -1.231903076171875, -1.10321044921875, -0.974517822265625, -0.8458251953125, -0.717132568359375, -0.58843994140625, -0.459747314453125, -0.3310546875, -0.202362060546875, -0.07366943359375, 0.055023193359375, 0.1837158203125, 0.312408447265625, 0.44110107421875, 0.569793701171875, 0.698486328125, 0.827178955078125, 0.95587158203125, 1.084564208984375, 1.2132568359375, 1.341949462890625, 1.47064208984375, 1.599334716796875, 1.72802734375, 1.856719970703125, 1.98541259765625, 2.114105224609375, 2.2427978515625, 2.371490478515625, 2.50018310546875, 2.628875732421875, 2.757568359375, 2.886260986328125, 3.01495361328125, 3.143646240234375, 3.2723388671875, 3.401031494140625, 3.52972412109375, 3.658416748046875, 3.787109375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 14.0, 10.0, 16.0, 28.0, 45.0, 59.0, 110.0, 117.0, 210.0, 298.0, 475.0, 714.0, 1012.0, 1613.0, 2412.0, 3592.0, 5607.0, 8718.0, 13382.0, 20489.0, 33493.0, 56108.0, 101231.0, 208453.0, 277830.0, 131057.0, 70448.0, 40382.0, 25410.0, 15671.0, 10186.0, 6549.0, 4367.0, 2937.0, 1857.0, 1234.0, 783.0, 525.0, 362.0, 239.0, 170.0, 116.0, 71.0, 41.0, 40.0, 22.0, 18.0, 11.0, 6.0, 3.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.1827392578125, -0.17723464965820312, -0.17173004150390625, -0.16622543334960938, -0.1607208251953125, -0.15521621704101562, -0.14971160888671875, -0.14420700073242188, -0.138702392578125, -0.13319778442382812, -0.12769317626953125, -0.12218856811523438, -0.1166839599609375, -0.11117935180664062, -0.10567474365234375, -0.10017013549804688, -0.09466552734375, -0.08916091918945312, -0.08365631103515625, -0.07815170288085938, -0.0726470947265625, -0.06714248657226562, -0.06163787841796875, -0.056133270263671875, -0.050628662109375, -0.045124053955078125, -0.03961944580078125, -0.034114837646484375, -0.0286102294921875, -0.023105621337890625, -0.01760101318359375, -0.012096405029296875, -0.006591796875, -0.001087188720703125, 0.00441741943359375, 0.009922027587890625, 0.0154266357421875, 0.020931243896484375, 0.02643585205078125, 0.031940460205078125, 0.037445068359375, 0.042949676513671875, 0.04845428466796875, 0.053958892822265625, 0.0594635009765625, 0.06496810913085938, 0.07047271728515625, 0.07597732543945312, 0.08148193359375, 0.08698654174804688, 0.09249114990234375, 0.09799575805664062, 0.1035003662109375, 0.10900497436523438, 0.11450958251953125, 0.12001419067382812, 0.125518798828125, 0.13102340698242188, 0.13652801513671875, 0.14203262329101562, 0.1475372314453125, 0.15304183959960938, 0.15854644775390625, 0.16405105590820312, 0.1695556640625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 4.0, 8.0, 5.0, 8.0, 10.0, 8.0, 16.0, 18.0, 16.0, 12.0, 22.0, 22.0, 25.0, 29.0, 36.0, 45.0, 26.0, 39.0, 48.0, 43.0, 27.0, 30.0, 1062.0, 34.0, 42.0, 38.0, 34.0, 34.0, 42.0, 30.0, 33.0, 29.0, 20.0, 24.0, 23.0, 13.0, 13.0, 8.0, 13.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.4722900390625, -3.356689453125, -3.2410888671875, -3.12548828125, -3.0098876953125, -2.894287109375, -2.7786865234375, -2.6630859375, -2.5474853515625, -2.431884765625, -2.3162841796875, -2.20068359375, -2.0850830078125, -1.969482421875, -1.8538818359375, -1.73828125, -1.6226806640625, -1.507080078125, -1.3914794921875, -1.27587890625, -1.1602783203125, -1.044677734375, -0.9290771484375, -0.8134765625, -0.6978759765625, -0.582275390625, -0.4666748046875, -0.35107421875, -0.2354736328125, -0.119873046875, -0.0042724609375, 0.111328125, 0.2269287109375, 0.342529296875, 0.4581298828125, 0.57373046875, 0.6893310546875, 0.804931640625, 0.9205322265625, 1.0361328125, 1.1517333984375, 1.267333984375, 1.3829345703125, 1.49853515625, 1.6141357421875, 1.729736328125, 1.8453369140625, 1.9609375, 2.0765380859375, 2.192138671875, 2.3077392578125, 2.42333984375, 2.5389404296875, 2.654541015625, 2.7701416015625, 2.8857421875, 3.0013427734375, 3.116943359375, 3.2325439453125, 3.34814453125, 3.4637451171875, 3.579345703125, 3.6949462890625, 3.810546875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 9.0, 10.0, 11.0, 10.0, 18.0, 31.0, 63.0, 79.0, 100.0, 141.0, 217.0, 283.0, 394.0, 632.0, 851.0, 1354.0, 1786.0, 2623.0, 3815.0, 5628.0, 8140.0, 11710.0, 17467.0, 26299.0, 40533.0, 64305.0, 111075.0, 248333.0, 1223109.0, 123900.0, 71448.0, 44280.0, 28608.0, 18970.0, 12884.0, 8700.0, 5894.0, 4047.0, 2885.0, 1987.0, 1372.0, 969.0, 659.0, 465.0, 321.0, 221.0, 162.0, 94.0, 78.0, 56.0, 33.0, 26.0, 20.0, 9.0, 5.0, 7.0, 6.0, 5.0, 4.0], "bins": [-0.06500244140625, -0.06303834915161133, -0.061074256896972656, -0.059110164642333984, -0.05714607238769531, -0.05518198013305664, -0.05321788787841797, -0.0512537956237793, -0.049289703369140625, -0.04732561111450195, -0.04536151885986328, -0.04339742660522461, -0.04143333435058594, -0.039469242095947266, -0.037505149841308594, -0.03554105758666992, -0.03357696533203125, -0.03161287307739258, -0.029648780822753906, -0.027684688568115234, -0.025720596313476562, -0.02375650405883789, -0.02179241180419922, -0.019828319549560547, -0.017864227294921875, -0.015900135040283203, -0.013936042785644531, -0.01197195053100586, -0.010007858276367188, -0.008043766021728516, -0.006079673767089844, -0.004115581512451172, -0.0021514892578125, -0.00018739700317382812, 0.0017766952514648438, 0.0037407875061035156, 0.0057048797607421875, 0.007668972015380859, 0.009633064270019531, 0.011597156524658203, 0.013561248779296875, 0.015525341033935547, 0.01748943328857422, 0.01945352554321289, 0.021417617797851562, 0.023381710052490234, 0.025345802307128906, 0.027309894561767578, 0.02927398681640625, 0.031238079071044922, 0.033202171325683594, 0.035166263580322266, 0.03713035583496094, 0.03909444808959961, 0.04105854034423828, 0.04302263259887695, 0.044986724853515625, 0.0469508171081543, 0.04891490936279297, 0.05087900161743164, 0.05284309387207031, 0.054807186126708984, 0.056771278381347656, 0.05873537063598633, 0.060699462890625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 7.0, 4.0, 4.0, 4.0, 5.0, 6.0, 15.0, 9.0, 8.0, 17.0, 17.0, 21.0, 38.0, 52.0, 66.0, 88.0, 127.0, 124.0, 85.0, 70.0, 44.0, 40.0, 25.0, 19.0, 15.0, 16.0, 12.0, 13.0, 10.0, 6.0, 5.0, 7.0, 7.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.00091552734375, -0.0008915364742279053, -0.0008675456047058105, -0.0008435547351837158, -0.0008195638656616211, -0.0007955729961395264, -0.0007715821266174316, -0.0007475912570953369, -0.0007236003875732422, -0.0006996095180511475, -0.0006756186485290527, -0.000651627779006958, -0.0006276369094848633, -0.0006036460399627686, -0.0005796551704406738, -0.0005556643009185791, -0.0005316734313964844, -0.0005076825618743896, -0.0004836916923522949, -0.0004597008228302002, -0.00043570995330810547, -0.00041171908378601074, -0.000387728214263916, -0.0003637373447418213, -0.00033974647521972656, -0.00031575560569763184, -0.0002917647361755371, -0.0002677738666534424, -0.00024378299713134766, -0.00021979212760925293, -0.0001958012580871582, -0.00017181038856506348, -0.00014781951904296875, -0.00012382864952087402, -9.98377799987793e-05, -7.584691047668457e-05, -5.1856040954589844e-05, -2.7865171432495117e-05, -3.874301910400391e-06, 2.0116567611694336e-05, 4.410743713378906e-05, 6.809830665588379e-05, 9.208917617797852e-05, 0.00011608004570007324, 0.00014007091522216797, 0.0001640617847442627, 0.00018805265426635742, 0.00021204352378845215, 0.00023603439331054688, 0.0002600252628326416, 0.00028401613235473633, 0.00030800700187683105, 0.0003319978713989258, 0.0003559887409210205, 0.00037997961044311523, 0.00040397047996520996, 0.0004279613494873047, 0.0004519522190093994, 0.00047594308853149414, 0.0004999339580535889, 0.0005239248275756836, 0.0005479156970977783, 0.000571906566619873, 0.0005958974361419678, 0.0006198883056640625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 8.0, 5.0, 6.0, 5.0, 12.0, 12.0, 14.0, 16.0, 15.0, 22.0, 36.0, 61.0, 69.0, 197.0, 943.0, 931711.0, 114467.0, 512.0, 157.0, 85.0, 49.0, 37.0, 20.0, 15.0, 7.0, 12.0, 11.0, 8.0, 7.0, 3.0, 4.0, 5.0, 8.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015228271484375, -0.014639616012573242, -0.014050960540771484, -0.013462305068969727, -0.012873649597167969, -0.012284994125366211, -0.011696338653564453, -0.011107683181762695, -0.010519027709960938, -0.00993037223815918, -0.009341716766357422, -0.008753061294555664, -0.008164405822753906, -0.0075757503509521484, -0.006987094879150391, -0.006398439407348633, -0.005809783935546875, -0.005221128463745117, -0.004632472991943359, -0.0040438175201416016, -0.0034551620483398438, -0.002866506576538086, -0.002277851104736328, -0.0016891956329345703, -0.0011005401611328125, -0.0005118846893310547, 7.677078247070312e-05, 0.0006654262542724609, 0.0012540817260742188, 0.0018427371978759766, 0.0024313926696777344, 0.003020048141479492, 0.00360870361328125, 0.004197359085083008, 0.004786014556884766, 0.0053746700286865234, 0.005963325500488281, 0.006551980972290039, 0.007140636444091797, 0.007729291915893555, 0.008317947387695312, 0.00890660285949707, 0.009495258331298828, 0.010083913803100586, 0.010672569274902344, 0.011261224746704102, 0.01184988021850586, 0.012438535690307617, 0.013027191162109375, 0.013615846633911133, 0.01420450210571289, 0.014793157577514648, 0.015381813049316406, 0.015970468521118164, 0.016559123992919922, 0.01714777946472168, 0.017736434936523438, 0.018325090408325195, 0.018913745880126953, 0.01950240135192871, 0.02009105682373047, 0.020679712295532227, 0.021268367767333984, 0.021857023239135742, 0.0224456787109375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 72.0, 884.0, 61.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002409297041594982, -0.0022169805597513914, -0.002024663845077157, -0.0018323473632335663, -0.001640030648559332, -0.0014477141667157412, -0.0012553975684568286, -0.001063080970197916, -0.0008707643719390035, -0.0006784477736800909, -0.0004861312045250088, -0.0002938146353699267, -0.00010149803711101413, 9.081856114789844e-05, 0.0002831351011991501, 0.00047545169945806265, 0.0006677682977169752, 0.0008600848959758878, 0.0010524014942348003, 0.001244717976078391, 0.0014370346907526255, 0.0016293511725962162, 0.0018216677708551288, 0.0020139843691140413, 0.002206300850957632, 0.002398617332801223, 0.002590934047475457, 0.002783250529319048, 0.0029755672439932823, 0.003167883725836873, 0.003360200207680464, 0.003552516922354698, 0.0037448336370289326, 0.003937150351703167, 0.004129466600716114, 0.0043217833153903484, 0.004514100030064583, 0.004706416744738817, 0.004898732993751764, 0.005091049708425999, 0.005283366423100233, 0.0054756831377744675, 0.0056679993867874146, 0.005860316101461649, 0.006052632816135883, 0.006244949530810118, 0.006437265779823065, 0.006629582494497299, 0.006821898743510246, 0.007014215458184481, 0.007206531707197428, 0.007398848421871662, 0.0075911651365458965, 0.007783481851220131, 0.007975798100233078, 0.008168114349246025, 0.008360431529581547, 0.008552747778594494, 0.008745064958930016, 0.008937381207942963, 0.00912969745695591, 0.009322014637291431, 0.009514330886304379, 0.0097066480666399, 0.009898964315652847]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 3.0, 8.0, 10.0, 10.0, 19.0, 15.0, 16.0, 23.0, 25.0, 25.0, 24.0, 32.0, 39.0, 39.0, 38.0, 38.0, 42.0, 45.0, 51.0, 46.0, 40.0, 39.0, 43.0, 37.0, 36.0, 35.0, 27.0, 35.0, 21.0, 23.0, 12.0, 10.0, 19.0, 15.0, 14.0, 10.0, 5.0, 9.0, 2.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004904270172119141, -0.0004765978083014488, -0.0004627685993909836, -0.00044893939048051834, -0.0004351101815700531, -0.00042128097265958786, -0.0004074517637491226, -0.0003936225548386574, -0.00037979334592819214, -0.0003659641370177269, -0.00035213492810726166, -0.0003383057191967964, -0.0003244765102863312, -0.00031064730137586594, -0.0002968180924654007, -0.00028298888355493546, -0.0002691596746444702, -0.000255330465734005, -0.00024150125682353973, -0.0002276720479130745, -0.00021384283900260925, -0.000200013630092144, -0.00018618442118167877, -0.00017235521227121353, -0.0001585260033607483, -0.00014469679445028305, -0.0001308675855398178, -0.00011703837662935257, -0.00010320916771888733, -8.937995880842209e-05, -7.555074989795685e-05, -6.172154098749161e-05, -4.789233207702637e-05, -3.406312316656113e-05, -2.0233914256095886e-05, -6.404705345630646e-06, 7.424503564834595e-06, 2.1253712475299835e-05, 3.5082921385765076e-05, 4.8912130296230316e-05, 6.274133920669556e-05, 7.65705481171608e-05, 9.039975702762604e-05, 0.00010422896593809128, 0.00011805817484855652, 0.00013188738375902176, 0.000145716592669487, 0.00015954580157995224, 0.00017337501049041748, 0.00018720421940088272, 0.00020103342831134796, 0.0002148626372218132, 0.00022869184613227844, 0.00024252105504274368, 0.0002563502639532089, 0.00027017947286367416, 0.0002840086817741394, 0.00029783789068460464, 0.0003116670995950699, 0.0003254963085055351, 0.00033932551741600037, 0.0003531547263264656, 0.00036698393523693085, 0.0003808131441473961, 0.00039464235305786133]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 8.0, 8.0, 2.0, 8.0, 15.0, 19.0, 19.0, 18.0, 28.0, 28.0, 28.0, 31.0, 39.0, 46.0, 48.0, 31.0, 45.0, 42.0, 46.0, 45.0, 38.0, 42.0, 33.0, 35.0, 32.0, 33.0, 36.0, 27.0, 22.0, 15.0, 23.0, 13.0, 20.0, 19.0, 6.0, 13.0, 7.0, 4.0, 5.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.44921875, -4.320526123046875, -4.19183349609375, -4.063140869140625, -3.9344482421875, -3.805755615234375, -3.67706298828125, -3.548370361328125, -3.419677734375, -3.290985107421875, -3.16229248046875, -3.033599853515625, -2.9049072265625, -2.776214599609375, -2.64752197265625, -2.518829345703125, -2.39013671875, -2.261444091796875, -2.13275146484375, -2.004058837890625, -1.8753662109375, -1.746673583984375, -1.61798095703125, -1.489288330078125, -1.360595703125, -1.231903076171875, -1.10321044921875, -0.974517822265625, -0.8458251953125, -0.717132568359375, -0.58843994140625, -0.459747314453125, -0.3310546875, -0.202362060546875, -0.07366943359375, 0.055023193359375, 0.1837158203125, 0.312408447265625, 0.44110107421875, 0.569793701171875, 0.698486328125, 0.827178955078125, 0.95587158203125, 1.084564208984375, 1.2132568359375, 1.341949462890625, 1.47064208984375, 1.599334716796875, 1.72802734375, 1.856719970703125, 1.98541259765625, 2.114105224609375, 2.2427978515625, 2.371490478515625, 2.50018310546875, 2.628875732421875, 2.757568359375, 2.886260986328125, 3.01495361328125, 3.143646240234375, 3.2723388671875, 3.401031494140625, 3.52972412109375, 3.658416748046875, 3.787109375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 10.0, 14.0, 27.0, 44.0, 57.0, 81.0, 140.0, 195.0, 290.0, 467.0, 694.0, 1078.0, 1615.0, 2686.0, 4119.0, 6863.0, 10796.0, 17771.0, 28542.0, 48818.0, 93650.0, 210939.0, 300369.0, 148193.0, 70398.0, 38848.0, 23248.0, 14204.0, 9056.0, 5638.0, 3548.0, 2202.0, 1398.0, 881.0, 536.0, 383.0, 255.0, 178.0, 114.0, 71.0, 46.0, 32.0, 21.0, 14.0, 7.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0], "bins": [-4.828125, -4.68310546875, -4.5380859375, -4.39306640625, -4.248046875, -4.10302734375, -3.9580078125, -3.81298828125, -3.66796875, -3.52294921875, -3.3779296875, -3.23291015625, -3.087890625, -2.94287109375, -2.7978515625, -2.65283203125, -2.5078125, -2.36279296875, -2.2177734375, -2.07275390625, -1.927734375, -1.78271484375, -1.6376953125, -1.49267578125, -1.34765625, -1.20263671875, -1.0576171875, -0.91259765625, -0.767578125, -0.62255859375, -0.4775390625, -0.33251953125, -0.1875, -0.04248046875, 0.1025390625, 0.24755859375, 0.392578125, 0.53759765625, 0.6826171875, 0.82763671875, 0.97265625, 1.11767578125, 1.2626953125, 1.40771484375, 1.552734375, 1.69775390625, 1.8427734375, 1.98779296875, 2.1328125, 2.27783203125, 2.4228515625, 2.56787109375, 2.712890625, 2.85791015625, 3.0029296875, 3.14794921875, 3.29296875, 3.43798828125, 3.5830078125, 3.72802734375, 3.873046875, 4.01806640625, 4.1630859375, 4.30810546875, 4.453125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 1.0, 7.0, 4.0, 5.0, 6.0, 9.0, 5.0, 16.0, 13.0, 12.0, 9.0, 11.0, 26.0, 23.0, 32.0, 37.0, 29.0, 44.0, 38.0, 54.0, 67.0, 81.0, 147.0, 211.0, 1346.0, 197.0, 127.0, 63.0, 75.0, 56.0, 43.0, 41.0, 37.0, 29.0, 16.0, 18.0, 25.0, 11.0, 10.0, 14.0, 14.0, 13.0, 4.0, 5.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.5078125, -10.1380615234375, -9.768310546875, -9.3985595703125, -9.02880859375, -8.6590576171875, -8.289306640625, -7.9195556640625, -7.5498046875, -7.1800537109375, -6.810302734375, -6.4405517578125, -6.07080078125, -5.7010498046875, -5.331298828125, -4.9615478515625, -4.591796875, -4.2220458984375, -3.852294921875, -3.4825439453125, -3.11279296875, -2.7430419921875, -2.373291015625, -2.0035400390625, -1.6337890625, -1.2640380859375, -0.894287109375, -0.5245361328125, -0.15478515625, 0.2149658203125, 0.584716796875, 0.9544677734375, 1.32421875, 1.6939697265625, 2.063720703125, 2.4334716796875, 2.80322265625, 3.1729736328125, 3.542724609375, 3.9124755859375, 4.2822265625, 4.6519775390625, 5.021728515625, 5.3914794921875, 5.76123046875, 6.1309814453125, 6.500732421875, 6.8704833984375, 7.240234375, 7.6099853515625, 7.979736328125, 8.3494873046875, 8.71923828125, 9.0889892578125, 9.458740234375, 9.8284912109375, 10.1982421875, 10.5679931640625, 10.937744140625, 11.3074951171875, 11.67724609375, 12.0469970703125, 12.416748046875, 12.7864990234375, 13.15625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 5.0, 3.0, 4.0, 11.0, 5.0, 12.0, 7.0, 18.0, 15.0, 20.0, 33.0, 42.0, 51.0, 57.0, 93.0, 110.0, 186.0, 330.0, 644.0, 1719.0, 6042.0, 26518.0, 153274.0, 1776731.0, 1049072.0, 103653.0, 19510.0, 4646.0, 1391.0, 536.0, 274.0, 165.0, 143.0, 98.0, 67.0, 51.0, 29.0, 28.0, 23.0, 18.0, 13.0, 11.0, 11.0, 15.0, 6.0, 8.0, 5.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.546875, -13.15869140625, -12.7705078125, -12.38232421875, -11.994140625, -11.60595703125, -11.2177734375, -10.82958984375, -10.44140625, -10.05322265625, -9.6650390625, -9.27685546875, -8.888671875, -8.50048828125, -8.1123046875, -7.72412109375, -7.3359375, -6.94775390625, -6.5595703125, -6.17138671875, -5.783203125, -5.39501953125, -5.0068359375, -4.61865234375, -4.23046875, -3.84228515625, -3.4541015625, -3.06591796875, -2.677734375, -2.28955078125, -1.9013671875, -1.51318359375, -1.125, -0.73681640625, -0.3486328125, 0.03955078125, 0.427734375, 0.81591796875, 1.2041015625, 1.59228515625, 1.98046875, 2.36865234375, 2.7568359375, 3.14501953125, 3.533203125, 3.92138671875, 4.3095703125, 4.69775390625, 5.0859375, 5.47412109375, 5.8623046875, 6.25048828125, 6.638671875, 7.02685546875, 7.4150390625, 7.80322265625, 8.19140625, 8.57958984375, 8.9677734375, 9.35595703125, 9.744140625, 10.13232421875, 10.5205078125, 10.90869140625, 11.296875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 10.0, 14.0, 34.0, 35.0, 58.0, 86.0, 103.0, 124.0, 113.0, 120.0, 93.0, 77.0, 58.0, 30.0, 23.0, 9.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.431642532348633, -19.52145767211914, -18.61127471923828, -17.70108985900879, -16.79090690612793, -15.880722045898438, -14.970538139343262, -14.060354232788086, -13.15017032623291, -12.239986419677734, -11.329802513122559, -10.419618606567383, -9.50943374633789, -8.599250793457031, -7.689065933227539, -6.778882026672363, -5.8686981201171875, -4.958514213562012, -4.048330307006836, -3.138145923614502, -2.227962017059326, -1.3177781105041504, -0.4075937271118164, 0.5025901794433594, 1.4127740859985352, 2.322957992553711, 3.233142137527466, 4.143326282501221, 5.0535101890563965, 5.963694095611572, 6.873878479003906, 7.784062385559082, 8.694244384765625, 9.6044282913208, 10.514612197875977, 11.424797058105469, 12.334980010986328, 13.24516487121582, 14.155348777770996, 15.065532684326172, 15.975716590881348, 16.885900497436523, 17.796085357666016, 18.706268310546875, 19.616453170776367, 20.526636123657227, 21.43682098388672, 22.347003936767578, 23.25718879699707, 24.167373657226562, 25.077556610107422, 25.987741470336914, 26.897924423217773, 27.808109283447266, 28.718292236328125, 29.628477096557617, 30.53866195678711, 31.4488468170166, 32.359031677246094, 33.26921463012695, 34.17939758300781, 35.08958053588867, 35.9997673034668, 36.909950256347656, 37.820133209228516]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 9.0, 9.0, 11.0, 11.0, 15.0, 17.0, 23.0, 23.0, 26.0, 23.0, 31.0, 31.0, 46.0, 45.0, 34.0, 37.0, 51.0, 51.0, 52.0, 44.0, 33.0, 43.0, 34.0, 43.0, 44.0, 25.0, 19.0, 30.0, 15.0, 27.0, 13.0, 16.0, 12.0, 14.0, 9.0, 2.0, 11.0, 6.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.04414367675781, -32.93817901611328, -31.832218170166016, -30.726255416870117, -29.62029266357422, -28.51432991027832, -27.408367156982422, -26.302404403686523, -25.196441650390625, -24.090478897094727, -22.984516143798828, -21.87855339050293, -20.77259063720703, -19.666627883911133, -18.560665130615234, -17.454702377319336, -16.348739624023438, -15.242776870727539, -14.13681411743164, -13.030851364135742, -11.924888610839844, -10.818925857543945, -9.712963104248047, -8.607000350952148, -7.50103759765625, -6.395074844360352, -5.289112091064453, -4.183149337768555, -3.0771865844726562, -1.9712238311767578, -0.8652610778808594, 0.24070167541503906, 1.3466682434082031, 2.4526309967041016, 3.55859375, 4.664556503295898, 5.770519256591797, 6.876482009887695, 7.982444763183594, 9.088407516479492, 10.19437026977539, 11.300333023071289, 12.406295776367188, 13.512258529663086, 14.618221282958984, 15.724184036254883, 16.83014678955078, 17.93610954284668, 19.042072296142578, 20.148035049438477, 21.253997802734375, 22.359960556030273, 23.465923309326172, 24.57188606262207, 25.67784881591797, 26.783811569213867, 27.889774322509766, 28.995737075805664, 30.101699829101562, 31.20766258239746, 32.31362533569336, 33.419586181640625, 34.525550842285156, 35.63151550292969, 36.73747634887695]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 5.0, 7.0, 16.0, 15.0, 13.0, 19.0, 19.0, 20.0, 18.0, 36.0, 46.0, 33.0, 38.0, 42.0, 42.0, 42.0, 40.0, 42.0, 38.0, 46.0, 35.0, 39.0, 35.0, 37.0, 28.0, 30.0, 22.0, 30.0, 24.0, 26.0, 13.0, 15.0, 14.0, 19.0, 7.0, 6.0, 4.0, 6.0, 5.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-4.6953125, -4.564361572265625, -4.43341064453125, -4.302459716796875, -4.1715087890625, -4.040557861328125, -3.90960693359375, -3.778656005859375, -3.647705078125, -3.516754150390625, -3.38580322265625, -3.254852294921875, -3.1239013671875, -2.992950439453125, -2.86199951171875, -2.731048583984375, -2.60009765625, -2.469146728515625, -2.33819580078125, -2.207244873046875, -2.0762939453125, -1.945343017578125, -1.81439208984375, -1.683441162109375, -1.552490234375, -1.421539306640625, -1.29058837890625, -1.159637451171875, -1.0286865234375, -0.897735595703125, -0.76678466796875, -0.635833740234375, -0.5048828125, -0.373931884765625, -0.24298095703125, -0.112030029296875, 0.0189208984375, 0.149871826171875, 0.28082275390625, 0.411773681640625, 0.542724609375, 0.673675537109375, 0.80462646484375, 0.935577392578125, 1.0665283203125, 1.197479248046875, 1.32843017578125, 1.459381103515625, 1.59033203125, 1.721282958984375, 1.85223388671875, 1.983184814453125, 2.1141357421875, 2.245086669921875, 2.37603759765625, 2.506988525390625, 2.637939453125, 2.768890380859375, 2.89984130859375, 3.030792236328125, 3.1617431640625, 3.292694091796875, 3.42364501953125, 3.554595947265625, 3.685546875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 11.0, 12.0, 14.0, 22.0, 33.0, 42.0, 65.0, 59.0, 127.0, 184.0, 289.0, 493.0, 964.0, 2076.0, 5440.0, 20010.0, 116945.0, 1016475.0, 2528107.0, 429394.0, 54856.0, 11300.0, 3715.0, 1589.0, 824.0, 445.0, 225.0, 145.0, 115.0, 78.0, 54.0, 43.0, 25.0, 14.0, 18.0, 17.0, 3.0, 7.0, 11.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-10.6875, -10.384765625, -10.08203125, -9.779296875, -9.4765625, -9.173828125, -8.87109375, -8.568359375, -8.265625, -7.962890625, -7.66015625, -7.357421875, -7.0546875, -6.751953125, -6.44921875, -6.146484375, -5.84375, -5.541015625, -5.23828125, -4.935546875, -4.6328125, -4.330078125, -4.02734375, -3.724609375, -3.421875, -3.119140625, -2.81640625, -2.513671875, -2.2109375, -1.908203125, -1.60546875, -1.302734375, -1.0, -0.697265625, -0.39453125, -0.091796875, 0.2109375, 0.513671875, 0.81640625, 1.119140625, 1.421875, 1.724609375, 2.02734375, 2.330078125, 2.6328125, 2.935546875, 3.23828125, 3.541015625, 3.84375, 4.146484375, 4.44921875, 4.751953125, 5.0546875, 5.357421875, 5.66015625, 5.962890625, 6.265625, 6.568359375, 6.87109375, 7.173828125, 7.4765625, 7.779296875, 8.08203125, 8.384765625, 8.6875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 7.0, 14.0, 24.0, 18.0, 31.0, 45.0, 72.0, 117.0, 167.0, 253.0, 381.0, 519.0, 613.0, 545.0, 395.0, 292.0, 162.0, 127.0, 76.0, 62.0, 41.0, 28.0, 25.0, 19.0, 14.0, 7.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.953125, -8.6866455078125, -8.420166015625, -8.1536865234375, -7.88720703125, -7.6207275390625, -7.354248046875, -7.0877685546875, -6.8212890625, -6.5548095703125, -6.288330078125, -6.0218505859375, -5.75537109375, -5.4888916015625, -5.222412109375, -4.9559326171875, -4.689453125, -4.4229736328125, -4.156494140625, -3.8900146484375, -3.62353515625, -3.3570556640625, -3.090576171875, -2.8240966796875, -2.5576171875, -2.2911376953125, -2.024658203125, -1.7581787109375, -1.49169921875, -1.2252197265625, -0.958740234375, -0.6922607421875, -0.42578125, -0.1593017578125, 0.107177734375, 0.3736572265625, 0.64013671875, 0.9066162109375, 1.173095703125, 1.4395751953125, 1.7060546875, 1.9725341796875, 2.239013671875, 2.5054931640625, 2.77197265625, 3.0384521484375, 3.304931640625, 3.5714111328125, 3.837890625, 4.1043701171875, 4.370849609375, 4.6373291015625, 4.90380859375, 5.1702880859375, 5.436767578125, 5.7032470703125, 5.9697265625, 6.2362060546875, 6.502685546875, 6.7691650390625, 7.03564453125, 7.3021240234375, 7.568603515625, 7.8350830078125, 8.1015625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 18.0, 13.0, 23.0, 41.0, 49.0, 74.0, 103.0, 228.0, 386.0, 1093.0, 7105.0, 302912.0, 3806578.0, 70754.0, 3380.0, 740.0, 345.0, 163.0, 105.0, 46.0, 30.0, 30.0, 16.0, 15.0, 9.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.265625, -28.268310546875, -27.27099609375, -26.273681640625, -25.2763671875, -24.279052734375, -23.28173828125, -22.284423828125, -21.287109375, -20.289794921875, -19.29248046875, -18.295166015625, -17.2978515625, -16.300537109375, -15.30322265625, -14.305908203125, -13.30859375, -12.311279296875, -11.31396484375, -10.316650390625, -9.3193359375, -8.322021484375, -7.32470703125, -6.327392578125, -5.330078125, -4.332763671875, -3.33544921875, -2.338134765625, -1.3408203125, -0.343505859375, 0.65380859375, 1.651123046875, 2.6484375, 3.645751953125, 4.64306640625, 5.640380859375, 6.6376953125, 7.635009765625, 8.63232421875, 9.629638671875, 10.626953125, 11.624267578125, 12.62158203125, 13.618896484375, 14.6162109375, 15.613525390625, 16.61083984375, 17.608154296875, 18.60546875, 19.602783203125, 20.60009765625, 21.597412109375, 22.5947265625, 23.592041015625, 24.58935546875, 25.586669921875, 26.583984375, 27.581298828125, 28.57861328125, 29.575927734375, 30.5732421875, 31.570556640625, 32.56787109375, 33.565185546875, 34.5625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 18.0, 63.0, 159.0, 265.0, 251.0, 158.0, 68.0, 19.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.928932189941406, -38.51460266113281, -36.10027313232422, -33.685943603515625, -31.27161407470703, -28.857284545898438, -26.44295310974121, -24.028623580932617, -21.614294052124023, -19.19996452331543, -16.785634994506836, -14.371304512023926, -11.956974983215332, -9.542645454406738, -7.128314971923828, -4.713985443115234, -2.2996559143066406, 0.11467385292053223, 2.529003620147705, 4.943333625793457, 7.357663154602051, 9.771992683410645, 12.186323165893555, 14.600652694702148, 17.014982223510742, 19.429311752319336, 21.84364128112793, 24.257972717285156, 26.67230224609375, 29.086631774902344, 31.500961303710938, 33.91529083251953, 36.329620361328125, 38.74394989013672, 41.15827941894531, 43.572608947753906, 45.9869384765625, 48.401268005371094, 50.81559753417969, 53.22992706298828, 55.644256591796875, 58.05858612060547, 60.47291564941406, 62.887245178222656, 65.30157470703125, 67.71590423583984, 70.13023376464844, 72.54456329345703, 74.95889282226562, 77.37322235107422, 79.78755187988281, 82.2018814086914, 84.6162109375, 87.0305404663086, 89.44486999511719, 91.85919952392578, 94.2735366821289, 96.6878662109375, 99.1021957397461, 101.51652526855469, 103.93085479736328, 106.34518432617188, 108.75951385498047, 111.17384338378906, 113.58817291259766]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 7.0, 10.0, 12.0, 11.0, 15.0, 11.0, 15.0, 23.0, 25.0, 25.0, 29.0, 32.0, 30.0, 34.0, 39.0, 34.0, 28.0, 37.0, 54.0, 45.0, 41.0, 42.0, 38.0, 29.0, 40.0, 39.0, 34.0, 32.0, 36.0, 18.0, 16.0, 22.0, 18.0, 12.0, 13.0, 11.0, 12.0, 6.0, 4.0, 8.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.781631469726562, -21.092193603515625, -20.402755737304688, -19.71331787109375, -19.023880004882812, -18.334442138671875, -17.645004272460938, -16.95556640625, -16.266128540039062, -15.576690673828125, -14.887252807617188, -14.19781494140625, -13.508377075195312, -12.818939208984375, -12.129501342773438, -11.4400634765625, -10.750624656677246, -10.061186790466309, -9.371748924255371, -8.682311058044434, -7.992873191833496, -7.303435325622559, -6.613996982574463, -5.924559116363525, -5.235121250152588, -4.54568338394165, -3.856245517730713, -3.1668074131011963, -2.477369546890259, -1.7879316806793213, -1.0984935760498047, -0.4090557098388672, 0.2803821563720703, 0.9698200821876526, 1.6592580080032349, 2.348695993423462, 3.0381338596343994, 3.727571725845337, 4.4170098304748535, 5.106447696685791, 5.7958855628967285, 6.485323429107666, 7.1747612953186035, 7.864199638366699, 8.553637504577637, 9.243075370788574, 9.932513236999512, 10.62195110321045, 11.311388969421387, 12.000826835632324, 12.690264701843262, 13.3797025680542, 14.069140434265137, 14.758578300476074, 15.448017120361328, 16.137454986572266, 16.826892852783203, 17.51633071899414, 18.205768585205078, 18.895206451416016, 19.584644317626953, 20.27408218383789, 20.963520050048828, 21.652957916259766, 22.342395782470703]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 6.0, 7.0, 18.0, 16.0, 14.0, 12.0, 19.0, 24.0, 28.0, 22.0, 23.0, 34.0, 32.0, 44.0, 39.0, 33.0, 32.0, 33.0, 43.0, 45.0, 51.0, 30.0, 35.0, 42.0, 36.0, 30.0, 31.0, 28.0, 21.0, 24.0, 16.0, 19.0, 15.0, 12.0, 12.0, 14.0, 10.0, 11.0, 2.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.625, -4.498931884765625, -4.37286376953125, -4.246795654296875, -4.1207275390625, -3.994659423828125, -3.86859130859375, -3.742523193359375, -3.616455078125, -3.490386962890625, -3.36431884765625, -3.238250732421875, -3.1121826171875, -2.986114501953125, -2.86004638671875, -2.733978271484375, -2.60791015625, -2.481842041015625, -2.35577392578125, -2.229705810546875, -2.1036376953125, -1.977569580078125, -1.85150146484375, -1.725433349609375, -1.599365234375, -1.473297119140625, -1.34722900390625, -1.221160888671875, -1.0950927734375, -0.969024658203125, -0.84295654296875, -0.716888427734375, -0.5908203125, -0.464752197265625, -0.33868408203125, -0.212615966796875, -0.0865478515625, 0.039520263671875, 0.16558837890625, 0.291656494140625, 0.417724609375, 0.543792724609375, 0.66986083984375, 0.795928955078125, 0.9219970703125, 1.048065185546875, 1.17413330078125, 1.300201416015625, 1.42626953125, 1.552337646484375, 1.67840576171875, 1.804473876953125, 1.9305419921875, 2.056610107421875, 2.18267822265625, 2.308746337890625, 2.434814453125, 2.560882568359375, 2.68695068359375, 2.813018798828125, 2.9390869140625, 3.065155029296875, 3.19122314453125, 3.317291259765625, 3.443359375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 11.0, 17.0, 17.0, 24.0, 38.0, 59.0, 74.0, 130.0, 193.0, 255.0, 325.0, 540.0, 682.0, 1004.0, 1456.0, 2148.0, 3097.0, 4459.0, 6469.0, 9369.0, 13539.0, 19965.0, 29504.0, 43999.0, 71187.0, 129268.0, 256506.0, 189680.0, 94398.0, 56455.0, 36180.0, 24258.0, 16640.0, 11363.0, 7739.0, 5308.0, 3713.0, 2534.0, 1792.0, 1295.0, 866.0, 611.0, 415.0, 304.0, 199.0, 134.0, 104.0, 73.0, 61.0, 46.0, 25.0, 11.0, 6.0, 8.0, 3.0, 0.0, 0.0, 6.0], "bins": [-0.1502685546875, -0.14568138122558594, -0.14109420776367188, -0.1365070343017578, -0.13191986083984375, -0.1273326873779297, -0.12274551391601562, -0.11815834045410156, -0.1135711669921875, -0.10898399353027344, -0.10439682006835938, -0.09980964660644531, -0.09522247314453125, -0.09063529968261719, -0.08604812622070312, -0.08146095275878906, -0.076873779296875, -0.07228660583496094, -0.06769943237304688, -0.06311225891113281, -0.05852508544921875, -0.05393791198730469, -0.049350738525390625, -0.04476356506347656, -0.0401763916015625, -0.03558921813964844, -0.031002044677734375, -0.026414871215820312, -0.02182769775390625, -0.017240524291992188, -0.012653350830078125, -0.008066177368164062, -0.00347900390625, 0.0011081695556640625, 0.005695343017578125, 0.010282516479492188, 0.01486968994140625, 0.019456863403320312, 0.024044036865234375, 0.028631210327148438, 0.0332183837890625, 0.03780555725097656, 0.042392730712890625, 0.04697990417480469, 0.05156707763671875, 0.05615425109863281, 0.060741424560546875, 0.06532859802246094, 0.069915771484375, 0.07450294494628906, 0.07909011840820312, 0.08367729187011719, 0.08826446533203125, 0.09285163879394531, 0.09743881225585938, 0.10202598571777344, 0.1066131591796875, 0.11120033264160156, 0.11578750610351562, 0.12037467956542969, 0.12496185302734375, 0.1295490264892578, 0.13413619995117188, 0.13872337341308594, 0.143310546875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 5.0, 8.0, 9.0, 11.0, 15.0, 13.0, 15.0, 22.0, 24.0, 24.0, 26.0, 29.0, 21.0, 27.0, 37.0, 36.0, 46.0, 33.0, 1067.0, 52.0, 36.0, 42.0, 49.0, 45.0, 37.0, 30.0, 44.0, 30.0, 29.0, 25.0, 13.0, 16.0, 25.0, 14.0, 10.0, 7.0, 8.0, 7.0, 6.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.787109375, -3.668365478515625, -3.54962158203125, -3.430877685546875, -3.3121337890625, -3.193389892578125, -3.07464599609375, -2.955902099609375, -2.837158203125, -2.718414306640625, -2.59967041015625, -2.480926513671875, -2.3621826171875, -2.243438720703125, -2.12469482421875, -2.005950927734375, -1.88720703125, -1.768463134765625, -1.64971923828125, -1.530975341796875, -1.4122314453125, -1.293487548828125, -1.17474365234375, -1.055999755859375, -0.937255859375, -0.818511962890625, -0.69976806640625, -0.581024169921875, -0.4622802734375, -0.343536376953125, -0.22479248046875, -0.106048583984375, 0.0126953125, 0.131439208984375, 0.25018310546875, 0.368927001953125, 0.4876708984375, 0.606414794921875, 0.72515869140625, 0.843902587890625, 0.962646484375, 1.081390380859375, 1.20013427734375, 1.318878173828125, 1.4376220703125, 1.556365966796875, 1.67510986328125, 1.793853759765625, 1.91259765625, 2.031341552734375, 2.15008544921875, 2.268829345703125, 2.3875732421875, 2.506317138671875, 2.62506103515625, 2.743804931640625, 2.862548828125, 2.981292724609375, 3.10003662109375, 3.218780517578125, 3.3375244140625, 3.456268310546875, 3.57501220703125, 3.693756103515625, 3.8125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 6.0, 5.0, 15.0, 14.0, 30.0, 35.0, 51.0, 82.0, 109.0, 147.0, 219.0, 321.0, 461.0, 659.0, 1046.0, 1497.0, 2162.0, 3214.0, 4618.0, 6749.0, 10223.0, 15669.0, 24027.0, 36993.0, 60929.0, 107170.0, 214845.0, 1285791.0, 127578.0, 71110.0, 42447.0, 26862.0, 17252.0, 11402.0, 7629.0, 5060.0, 3420.0, 2257.0, 1517.0, 1102.0, 737.0, 515.0, 371.0, 252.0, 167.0, 116.0, 81.0, 50.0, 45.0, 33.0, 18.0, 13.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.06304931640625, -0.06102466583251953, -0.05900001525878906, -0.056975364685058594, -0.054950714111328125, -0.052926063537597656, -0.05090141296386719, -0.04887676239013672, -0.04685211181640625, -0.04482746124267578, -0.04280281066894531, -0.040778160095214844, -0.038753509521484375, -0.036728858947753906, -0.03470420837402344, -0.03267955780029297, -0.0306549072265625, -0.02863025665283203, -0.026605606079101562, -0.024580955505371094, -0.022556304931640625, -0.020531654357910156, -0.018507003784179688, -0.01648235321044922, -0.01445770263671875, -0.012433052062988281, -0.010408401489257812, -0.008383750915527344, -0.006359100341796875, -0.004334449768066406, -0.0023097991943359375, -0.00028514862060546875, 0.001739501953125, 0.0037641525268554688, 0.0057888031005859375, 0.007813453674316406, 0.009838104248046875, 0.011862754821777344, 0.013887405395507812, 0.01591205596923828, 0.01793670654296875, 0.01996135711669922, 0.021986007690429688, 0.024010658264160156, 0.026035308837890625, 0.028059959411621094, 0.030084609985351562, 0.03210926055908203, 0.0341339111328125, 0.03615856170654297, 0.03818321228027344, 0.040207862854003906, 0.042232513427734375, 0.044257164001464844, 0.04628181457519531, 0.04830646514892578, 0.05033111572265625, 0.05235576629638672, 0.05438041687011719, 0.056405067443847656, 0.058429718017578125, 0.060454368591308594, 0.06247901916503906, 0.06450366973876953, 0.0665283203125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 6.0, 11.0, 6.0, 7.0, 9.0, 8.0, 13.0, 13.0, 25.0, 18.0, 43.0, 28.0, 56.0, 67.0, 71.0, 86.0, 86.0, 82.0, 65.0, 51.0, 40.0, 30.0, 25.0, 26.0, 17.0, 20.0, 11.0, 18.0, 8.0, 11.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0002872943878173828, -0.00027855485677719116, -0.0002698153257369995, -0.00026107579469680786, -0.0002523362636566162, -0.00024359673261642456, -0.0002348572015762329, -0.00022611767053604126, -0.0002173781394958496, -0.00020863860845565796, -0.0001998990774154663, -0.00019115954637527466, -0.000182420015335083, -0.00017368048429489136, -0.0001649409532546997, -0.00015620142221450806, -0.0001474618911743164, -0.00013872236013412476, -0.0001299828290939331, -0.00012124329805374146, -0.0001125037670135498, -0.00010376423597335815, -9.50247049331665e-05, -8.628517389297485e-05, -7.75456428527832e-05, -6.880611181259155e-05, -6.00665807723999e-05, -5.132704973220825e-05, -4.25875186920166e-05, -3.384798765182495e-05, -2.51084566116333e-05, -1.636892557144165e-05, -7.62939453125e-06, 1.1101365089416504e-06, 9.8496675491333e-06, 1.858919858932495e-05, 2.73287296295166e-05, 3.606826066970825e-05, 4.48077917098999e-05, 5.354732275009155e-05, 6.22868537902832e-05, 7.102638483047485e-05, 7.97659158706665e-05, 8.850544691085815e-05, 9.72449779510498e-05, 0.00010598450899124146, 0.0001147240400314331, 0.00012346357107162476, 0.0001322031021118164, 0.00014094263315200806, 0.0001496821641921997, 0.00015842169523239136, 0.000167161226272583, 0.00017590075731277466, 0.0001846402883529663, 0.00019337981939315796, 0.0002021193504333496, 0.00021085888147354126, 0.0002195984125137329, 0.00022833794355392456, 0.0002370774745941162, 0.00024581700563430786, 0.0002545565366744995, 0.00026329606771469116, 0.0002720355987548828]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 7.0, 10.0, 12.0, 21.0, 19.0, 24.0, 26.0, 38.0, 40.0, 92.0, 165.0, 648.0, 7752.0, 257446.0, 764361.0, 16240.0, 1117.0, 195.0, 104.0, 51.0, 29.0, 27.0, 19.0, 17.0, 7.0, 14.0, 7.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0066375732421875, -0.006417214870452881, -0.006196856498718262, -0.005976498126983643, -0.0057561397552490234, -0.005535781383514404, -0.005315423011779785, -0.005095064640045166, -0.004874706268310547, -0.004654347896575928, -0.004433989524841309, -0.0042136311531066895, -0.00399327278137207, -0.003772914409637451, -0.003552556037902832, -0.003332197666168213, -0.0031118392944335938, -0.0028914809226989746, -0.0026711225509643555, -0.0024507641792297363, -0.002230405807495117, -0.002010047435760498, -0.001789689064025879, -0.0015693306922912598, -0.0013489723205566406, -0.0011286139488220215, -0.0009082555770874023, -0.0006878972053527832, -0.00046753883361816406, -0.0002471804618835449, -2.682209014892578e-05, 0.00019353628158569336, 0.0004138946533203125, 0.0006342530250549316, 0.0008546113967895508, 0.00107496976852417, 0.001295328140258789, 0.0015156865119934082, 0.0017360448837280273, 0.0019564032554626465, 0.0021767616271972656, 0.0023971199989318848, 0.002617478370666504, 0.002837836742401123, 0.003058195114135742, 0.0032785534858703613, 0.0034989118576049805, 0.0037192702293395996, 0.003939628601074219, 0.004159986972808838, 0.004380345344543457, 0.004600703716278076, 0.004821062088012695, 0.0050414204597473145, 0.005261778831481934, 0.005482137203216553, 0.005702495574951172, 0.005922853946685791, 0.00614321231842041, 0.006363570690155029, 0.0065839290618896484, 0.006804287433624268, 0.007024645805358887, 0.007245004177093506, 0.007465362548828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 4.0, 16.0, 13.0, 37.0, 46.0, 105.0, 189.0, 248.0, 148.0, 83.0, 40.0, 25.0, 17.0, 11.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0], "bins": [-0.00111119425855577, -0.001089525525458157, -0.001067856908775866, -0.0010461881756782532, -0.0010245195589959621, -0.0010028508258983493, -0.0009811822092160583, -0.0009595134761184454, -0.0009378448012284935, -0.0009161761263385415, -0.0008945074514485896, -0.0008728387765586376, -0.0008511700434610248, -0.0008295013685710728, -0.0008078326936811209, -0.0007861640187911689, -0.000764495343901217, -0.000742826669011265, -0.0007211579941213131, -0.0006994893192313612, -0.0006778206443414092, -0.0006561519112437963, -0.0006344832363538444, -0.0006128145614638925, -0.0005911458865739405, -0.0005694772116839886, -0.0005478085367940366, -0.0005261398619040847, -0.0005044711288064718, -0.00048280248302035034, -0.00046113377902656794, -0.000439465104136616, -0.0004177964583504945, -0.00039612778346054256, -0.00037445907946676016, -0.0003527904045768082, -0.00033112172968685627, -0.0003094530547969043, -0.0002877843799069524, -0.00026611567591317, -0.00024444700102321804, -0.0002227783261332661, -0.00020110963669139892, -0.00017944094724953175, -0.0001577722723595798, -0.00013610359746962786, -0.00011443490802776068, -9.276621858589351e-05, -7.109754369594157e-05, -4.942886153003201e-05, -2.776017936412245e-05, -6.091497198212892e-06, 1.5577184967696667e-05, 3.7245867133606225e-05, 5.8914549299515784e-05, 8.058323874138296e-05, 0.0001022519136313349, 0.00012392058852128685, 0.00014558927796315402, 0.0001672579674050212, 0.00018892664229497313, 0.00021059531718492508, 0.00023226400662679225, 0.0002539326960686594, 0.00027560137095861137]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 12.0, 9.0, 6.0, 17.0, 21.0, 15.0, 27.0, 28.0, 33.0, 40.0, 48.0, 42.0, 40.0, 46.0, 58.0, 49.0, 54.0, 51.0, 46.0, 50.0, 37.0, 39.0, 43.0, 25.0, 32.0, 24.0, 28.0, 14.0, 13.0, 12.0, 9.0, 4.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0001927018165588379, -0.00018705707043409348, -0.00018141232430934906, -0.00017576757818460464, -0.00017012283205986023, -0.00016447808593511581, -0.0001588333398103714, -0.00015318859368562698, -0.00014754384756088257, -0.00014189910143613815, -0.00013625435531139374, -0.00013060960918664932, -0.0001249648630619049, -0.00011932011693716049, -0.00011367537081241608, -0.00010803062468767166, -0.00010238587856292725, -9.674113243818283e-05, -9.109638631343842e-05, -8.5451640188694e-05, -7.980689406394958e-05, -7.416214793920517e-05, -6.851740181446075e-05, -6.287265568971634e-05, -5.7227909564971924e-05, -5.158316344022751e-05, -4.593841731548309e-05, -4.029367119073868e-05, -3.464892506599426e-05, -2.9004178941249847e-05, -2.3359432816505432e-05, -1.7714686691761017e-05, -1.2069940567016602e-05, -6.425194442272186e-06, -7.80448317527771e-07, 4.864297807216644e-06, 1.050904393196106e-05, 1.6153790056705475e-05, 2.179853618144989e-05, 2.7443282306194305e-05, 3.308802843093872e-05, 3.8732774555683136e-05, 4.437752068042755e-05, 5.0022266805171967e-05, 5.566701292991638e-05, 6.13117590546608e-05, 6.695650517940521e-05, 7.260125130414963e-05, 7.824599742889404e-05, 8.389074355363846e-05, 8.953548967838287e-05, 9.518023580312729e-05, 0.0001008249819278717, 0.00010646972805261612, 0.00011211447417736053, 0.00011775922030210495, 0.00012340396642684937, 0.00012904871255159378, 0.0001346934586763382, 0.0001403382048010826, 0.00014598295092582703, 0.00015162769705057144, 0.00015727244317531586, 0.00016291718930006027, 0.0001685619354248047]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 9.0, 5.0, 4.0, 6.0, 7.0, 18.0, 16.0, 14.0, 12.0, 19.0, 24.0, 28.0, 22.0, 23.0, 34.0, 32.0, 44.0, 39.0, 33.0, 32.0, 33.0, 43.0, 45.0, 51.0, 30.0, 35.0, 42.0, 36.0, 30.0, 31.0, 28.0, 21.0, 24.0, 16.0, 19.0, 15.0, 12.0, 12.0, 14.0, 10.0, 11.0, 2.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.625, -4.498931884765625, -4.37286376953125, -4.246795654296875, -4.1207275390625, -3.994659423828125, -3.86859130859375, -3.742523193359375, -3.616455078125, -3.490386962890625, -3.36431884765625, -3.238250732421875, -3.1121826171875, -2.986114501953125, -2.86004638671875, -2.733978271484375, -2.60791015625, -2.481842041015625, -2.35577392578125, -2.229705810546875, -2.1036376953125, -1.977569580078125, -1.85150146484375, -1.725433349609375, -1.599365234375, -1.473297119140625, -1.34722900390625, -1.221160888671875, -1.0950927734375, -0.969024658203125, -0.84295654296875, -0.716888427734375, -0.5908203125, -0.464752197265625, -0.33868408203125, -0.212615966796875, -0.0865478515625, 0.039520263671875, 0.16558837890625, 0.291656494140625, 0.417724609375, 0.543792724609375, 0.66986083984375, 0.795928955078125, 0.9219970703125, 1.048065185546875, 1.17413330078125, 1.300201416015625, 1.42626953125, 1.552337646484375, 1.67840576171875, 1.804473876953125, 1.9305419921875, 2.056610107421875, 2.18267822265625, 2.308746337890625, 2.434814453125, 2.560882568359375, 2.68695068359375, 2.813018798828125, 2.9390869140625, 3.065155029296875, 3.19122314453125, 3.317291259765625, 3.443359375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 6.0, 12.0, 11.0, 27.0, 33.0, 49.0, 59.0, 82.0, 138.0, 216.0, 316.0, 512.0, 784.0, 1154.0, 1976.0, 3350.0, 5653.0, 10131.0, 19394.0, 43950.0, 116288.0, 303441.0, 321516.0, 125963.0, 47450.0, 20506.0, 10701.0, 5858.0, 3400.0, 2015.0, 1236.0, 813.0, 484.0, 318.0, 254.0, 141.0, 105.0, 72.0, 45.0, 34.0, 21.0, 11.0, 10.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75494384765625, -5.5567626953125, -5.35858154296875, -5.160400390625, -4.96221923828125, -4.7640380859375, -4.56585693359375, -4.36767578125, -4.16949462890625, -3.9713134765625, -3.77313232421875, -3.574951171875, -3.37677001953125, -3.1785888671875, -2.98040771484375, -2.7822265625, -2.58404541015625, -2.3858642578125, -2.18768310546875, -1.989501953125, -1.79132080078125, -1.5931396484375, -1.39495849609375, -1.19677734375, -0.99859619140625, -0.8004150390625, -0.60223388671875, -0.404052734375, -0.20587158203125, -0.0076904296875, 0.19049072265625, 0.388671875, 0.58685302734375, 0.7850341796875, 0.98321533203125, 1.181396484375, 1.37957763671875, 1.5777587890625, 1.77593994140625, 1.97412109375, 2.17230224609375, 2.3704833984375, 2.56866455078125, 2.766845703125, 2.96502685546875, 3.1632080078125, 3.36138916015625, 3.5595703125, 3.75775146484375, 3.9559326171875, 4.15411376953125, 4.352294921875, 4.55047607421875, 4.7486572265625, 4.94683837890625, 5.14501953125, 5.34320068359375, 5.5413818359375, 5.73956298828125, 5.937744140625, 6.13592529296875, 6.3341064453125, 6.53228759765625, 6.73046875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 9.0, 5.0, 10.0, 14.0, 15.0, 15.0, 20.0, 27.0, 23.0, 20.0, 31.0, 38.0, 40.0, 50.0, 63.0, 75.0, 139.0, 252.0, 1406.0, 248.0, 129.0, 62.0, 59.0, 40.0, 51.0, 33.0, 27.0, 22.0, 30.0, 15.0, 16.0, 13.0, 10.0, 8.0, 8.0, 6.0, 7.0, 1.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3671875, -12.9285888671875, -12.489990234375, -12.0513916015625, -11.61279296875, -11.1741943359375, -10.735595703125, -10.2969970703125, -9.8583984375, -9.4197998046875, -8.981201171875, -8.5426025390625, -8.10400390625, -7.6654052734375, -7.226806640625, -6.7882080078125, -6.349609375, -5.9110107421875, -5.472412109375, -5.0338134765625, -4.59521484375, -4.1566162109375, -3.718017578125, -3.2794189453125, -2.8408203125, -2.4022216796875, -1.963623046875, -1.5250244140625, -1.08642578125, -0.6478271484375, -0.209228515625, 0.2293701171875, 0.66796875, 1.1065673828125, 1.545166015625, 1.9837646484375, 2.42236328125, 2.8609619140625, 3.299560546875, 3.7381591796875, 4.1767578125, 4.6153564453125, 5.053955078125, 5.4925537109375, 5.93115234375, 6.3697509765625, 6.808349609375, 7.2469482421875, 7.685546875, 8.1241455078125, 8.562744140625, 9.0013427734375, 9.43994140625, 9.8785400390625, 10.317138671875, 10.7557373046875, 11.1943359375, 11.6329345703125, 12.071533203125, 12.5101318359375, 12.94873046875, 13.3873291015625, 13.825927734375, 14.2645263671875, 14.703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 13.0, 11.0, 17.0, 26.0, 31.0, 54.0, 81.0, 88.0, 162.0, 286.0, 514.0, 1076.0, 3235.0, 15708.0, 135203.0, 2454310.0, 491251.0, 34495.0, 5874.0, 1649.0, 633.0, 346.0, 200.0, 138.0, 78.0, 59.0, 37.0, 35.0, 25.0, 17.0, 11.0, 13.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.947509765625, -15.41064453125, -14.873779296875, -14.3369140625, -13.800048828125, -13.26318359375, -12.726318359375, -12.189453125, -11.652587890625, -11.11572265625, -10.578857421875, -10.0419921875, -9.505126953125, -8.96826171875, -8.431396484375, -7.89453125, -7.357666015625, -6.82080078125, -6.283935546875, -5.7470703125, -5.210205078125, -4.67333984375, -4.136474609375, -3.599609375, -3.062744140625, -2.52587890625, -1.989013671875, -1.4521484375, -0.915283203125, -0.37841796875, 0.158447265625, 0.6953125, 1.232177734375, 1.76904296875, 2.305908203125, 2.8427734375, 3.379638671875, 3.91650390625, 4.453369140625, 4.990234375, 5.527099609375, 6.06396484375, 6.600830078125, 7.1376953125, 7.674560546875, 8.21142578125, 8.748291015625, 9.28515625, 9.822021484375, 10.35888671875, 10.895751953125, 11.4326171875, 11.969482421875, 12.50634765625, 13.043212890625, 13.580078125, 14.116943359375, 14.65380859375, 15.190673828125, 15.7275390625, 16.264404296875, 16.80126953125, 17.338134765625, 17.875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 45.0, 275.0, 450.0, 212.0, 32.0, 1.0], "bins": [-228.4581756591797, -224.67642211914062, -220.89466857910156, -217.1129150390625, -213.33116149902344, -209.54940795898438, -205.76763916015625, -201.98590087890625, -198.20413208007812, -194.42237854003906, -190.640625, -186.85887145996094, -183.07711791992188, -179.2953643798828, -175.51361083984375, -171.73184204101562, -167.95010375976562, -164.16835021972656, -160.3865966796875, -156.60484313964844, -152.82308959960938, -149.0413360595703, -145.25958251953125, -141.47781372070312, -137.69606018066406, -133.914306640625, -130.13255310058594, -126.35079956054688, -122.56903839111328, -118.78728485107422, -115.00553131103516, -111.2237777709961, -107.44202423095703, -103.66027069091797, -99.8785171508789, -96.09675598144531, -92.31500244140625, -88.53324890136719, -84.75149536132812, -80.96974182128906, -77.18798828125, -73.40623474121094, -69.62448120117188, -65.84272766113281, -62.060970306396484, -58.279212951660156, -54.497459411621094, -50.71570587158203, -46.93395233154297, -43.152198791503906, -39.37044143676758, -35.588687896728516, -31.806934356689453, -28.025178909301758, -24.243423461914062, -20.461669921875, -16.679912567138672, -12.898158073425293, -9.116403579711914, -5.334648132324219, -1.5528936386108398, 2.228860855102539, 6.010616302490234, 9.792369842529297, 13.574124336242676]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 2.0, 11.0, 5.0, 12.0, 15.0, 11.0, 8.0, 16.0, 12.0, 28.0, 21.0, 20.0, 44.0, 36.0, 39.0, 35.0, 50.0, 43.0, 37.0, 50.0, 45.0, 46.0, 41.0, 37.0, 32.0, 41.0, 39.0, 32.0, 18.0, 28.0, 30.0, 15.0, 17.0, 8.0, 13.0, 6.0, 9.0, 15.0, 11.0, 9.0, 2.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.09288787841797, -35.01768493652344, -33.942481994628906, -32.867279052734375, -31.79207420349121, -30.71687126159668, -29.641666412353516, -28.566463470458984, -27.491260528564453, -26.416057586669922, -25.34085464477539, -24.265649795532227, -23.190446853637695, -22.115243911743164, -21.0400390625, -19.96483612060547, -18.889633178710938, -17.814430236816406, -16.739227294921875, -15.664022445678711, -14.58881950378418, -13.513616561889648, -12.4384126663208, -11.363208770751953, -10.288005828857422, -9.21280288696289, -8.137598991394043, -7.0623955726623535, -5.987192153930664, -4.911988735198975, -3.836785316467285, -2.7615818977355957, -1.6863784790039062, -0.6111750602722168, 0.46402835845947266, 1.539231777191162, 2.6144351959228516, 3.689638614654541, 4.7648420333862305, 5.84004545211792, 6.915248870849609, 7.990452289581299, 9.065655708312988, 10.140859603881836, 11.216062545776367, 12.291265487670898, 13.366469383239746, 14.441673278808594, 15.516876220703125, 16.592079162597656, 17.667282104492188, 18.74248695373535, 19.817689895629883, 20.892892837524414, 21.968097686767578, 23.04330062866211, 24.11850357055664, 25.193706512451172, 26.268909454345703, 27.344114303588867, 28.4193172454834, 29.49452018737793, 30.569725036621094, 31.644927978515625, 32.720130920410156]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 1.0, 8.0, 5.0, 7.0, 5.0, 6.0, 13.0, 18.0, 14.0, 17.0, 18.0, 15.0, 21.0, 24.0, 25.0, 25.0, 39.0, 31.0, 37.0, 20.0, 50.0, 30.0, 50.0, 39.0, 46.0, 29.0, 39.0, 38.0, 34.0, 35.0, 37.0, 17.0, 21.0, 20.0, 30.0, 16.0, 21.0, 18.0, 15.0, 12.0, 9.0, 16.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 2.0], "bins": [-4.7265625, -4.599578857421875, -4.47259521484375, -4.345611572265625, -4.2186279296875, -4.091644287109375, -3.96466064453125, -3.837677001953125, -3.710693359375, -3.583709716796875, -3.45672607421875, -3.329742431640625, -3.2027587890625, -3.075775146484375, -2.94879150390625, -2.821807861328125, -2.69482421875, -2.567840576171875, -2.44085693359375, -2.313873291015625, -2.1868896484375, -2.059906005859375, -1.93292236328125, -1.805938720703125, -1.678955078125, -1.551971435546875, -1.42498779296875, -1.298004150390625, -1.1710205078125, -1.044036865234375, -0.91705322265625, -0.790069580078125, -0.6630859375, -0.536102294921875, -0.40911865234375, -0.282135009765625, -0.1551513671875, -0.028167724609375, 0.09881591796875, 0.225799560546875, 0.352783203125, 0.479766845703125, 0.60675048828125, 0.733734130859375, 0.8607177734375, 0.987701416015625, 1.11468505859375, 1.241668701171875, 1.36865234375, 1.495635986328125, 1.62261962890625, 1.749603271484375, 1.8765869140625, 2.003570556640625, 2.13055419921875, 2.257537841796875, 2.384521484375, 2.511505126953125, 2.63848876953125, 2.765472412109375, 2.8924560546875, 3.019439697265625, 3.14642333984375, 3.273406982421875, 3.400390625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 6.0, 8.0, 7.0, 5.0, 7.0, 14.0, 19.0, 29.0, 34.0, 47.0, 67.0, 135.0, 216.0, 452.0, 805.0, 1526.0, 3234.0, 7592.0, 21529.0, 79508.0, 361455.0, 1517815.0, 1652139.0, 415171.0, 91828.0, 24597.0, 8537.0, 3641.0, 1660.0, 919.0, 498.0, 307.0, 165.0, 115.0, 58.0, 43.0, 32.0, 15.0, 20.0, 8.0, 8.0, 4.0, 2.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.6640625, -7.44537353515625, -7.2266845703125, -7.00799560546875, -6.789306640625, -6.57061767578125, -6.3519287109375, -6.13323974609375, -5.91455078125, -5.69586181640625, -5.4771728515625, -5.25848388671875, -5.039794921875, -4.82110595703125, -4.6024169921875, -4.38372802734375, -4.1650390625, -3.94635009765625, -3.7276611328125, -3.50897216796875, -3.290283203125, -3.07159423828125, -2.8529052734375, -2.63421630859375, -2.41552734375, -2.19683837890625, -1.9781494140625, -1.75946044921875, -1.540771484375, -1.32208251953125, -1.1033935546875, -0.88470458984375, -0.666015625, -0.44732666015625, -0.2286376953125, -0.00994873046875, 0.208740234375, 0.42742919921875, 0.6461181640625, 0.86480712890625, 1.08349609375, 1.30218505859375, 1.5208740234375, 1.73956298828125, 1.958251953125, 2.17694091796875, 2.3956298828125, 2.61431884765625, 2.8330078125, 3.05169677734375, 3.2703857421875, 3.48907470703125, 3.707763671875, 3.92645263671875, 4.1451416015625, 4.36383056640625, 4.58251953125, 4.80120849609375, 5.0198974609375, 5.23858642578125, 5.457275390625, 5.67596435546875, 5.8946533203125, 6.11334228515625, 6.33203125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 8.0, 6.0, 16.0, 15.0, 19.0, 34.0, 40.0, 83.0, 108.0, 158.0, 212.0, 313.0, 410.0, 593.0, 568.0, 422.0, 348.0, 211.0, 153.0, 109.0, 79.0, 44.0, 26.0, 25.0, 15.0, 11.0, 7.0, 11.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51171875, -7.25286865234375, -6.9940185546875, -6.73516845703125, -6.476318359375, -6.21746826171875, -5.9586181640625, -5.69976806640625, -5.44091796875, -5.18206787109375, -4.9232177734375, -4.66436767578125, -4.405517578125, -4.14666748046875, -3.8878173828125, -3.62896728515625, -3.3701171875, -3.11126708984375, -2.8524169921875, -2.59356689453125, -2.334716796875, -2.07586669921875, -1.8170166015625, -1.55816650390625, -1.29931640625, -1.04046630859375, -0.7816162109375, -0.52276611328125, -0.263916015625, -0.00506591796875, 0.2537841796875, 0.51263427734375, 0.771484375, 1.03033447265625, 1.2891845703125, 1.54803466796875, 1.806884765625, 2.06573486328125, 2.3245849609375, 2.58343505859375, 2.84228515625, 3.10113525390625, 3.3599853515625, 3.61883544921875, 3.877685546875, 4.13653564453125, 4.3953857421875, 4.65423583984375, 4.9130859375, 5.17193603515625, 5.4307861328125, 5.68963623046875, 5.948486328125, 6.20733642578125, 6.4661865234375, 6.72503662109375, 6.98388671875, 7.24273681640625, 7.5015869140625, 7.76043701171875, 8.019287109375, 8.27813720703125, 8.5369873046875, 8.79583740234375, 9.0546875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 11.0, 17.0, 9.0, 22.0, 24.0, 46.0, 65.0, 113.0, 174.0, 350.0, 772.0, 2563.0, 13255.0, 212913.0, 3605022.0, 336952.0, 17146.0, 2937.0, 938.0, 402.0, 208.0, 107.0, 76.0, 62.0, 20.0, 18.0, 15.0, 15.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.8740234375, -24.154296875, -23.4345703125, -22.71484375, -21.9951171875, -21.275390625, -20.5556640625, -19.8359375, -19.1162109375, -18.396484375, -17.6767578125, -16.95703125, -16.2373046875, -15.517578125, -14.7978515625, -14.078125, -13.3583984375, -12.638671875, -11.9189453125, -11.19921875, -10.4794921875, -9.759765625, -9.0400390625, -8.3203125, -7.6005859375, -6.880859375, -6.1611328125, -5.44140625, -4.7216796875, -4.001953125, -3.2822265625, -2.5625, -1.8427734375, -1.123046875, -0.4033203125, 0.31640625, 1.0361328125, 1.755859375, 2.4755859375, 3.1953125, 3.9150390625, 4.634765625, 5.3544921875, 6.07421875, 6.7939453125, 7.513671875, 8.2333984375, 8.953125, 9.6728515625, 10.392578125, 11.1123046875, 11.83203125, 12.5517578125, 13.271484375, 13.9912109375, 14.7109375, 15.4306640625, 16.150390625, 16.8701171875, 17.58984375, 18.3095703125, 19.029296875, 19.7490234375, 20.46875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 44.0, 239.0, 458.0, 223.0, 40.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.15943145751953, -55.67448425292969, -51.18954086303711, -46.70459747314453, -42.21965026855469, -37.734703063964844, -33.249759674072266, -28.764814376831055, -24.279869079589844, -19.794923782348633, -15.309978485107422, -10.825033187866211, -6.340087890625, -1.855142593383789, 2.629802703857422, 7.114748001098633, 11.599693298339844, 16.084638595581055, 20.569583892822266, 25.054529190063477, 29.539474487304688, 34.02442169189453, 38.50936508178711, 42.99430847167969, 47.47925567626953, 51.964202880859375, 56.44914627075195, 60.93408966064453, 65.41903686523438, 69.90398406982422, 74.38893127441406, 78.87387084960938, 83.35881042480469, 87.84375762939453, 92.32870483398438, 96.81364440917969, 101.29859161376953, 105.78353881835938, 110.26847839355469, 114.75342559814453, 119.23837280273438, 123.72332000732422, 128.20826721191406, 132.69320678710938, 137.17816162109375, 141.66310119628906, 146.14804077148438, 150.63299560546875, 155.11793518066406, 159.60287475585938, 164.08782958984375, 168.57276916503906, 173.05770874023438, 177.54266357421875, 182.02760314941406, 186.51255798339844, 190.99749755859375, 195.48243713378906, 199.96739196777344, 204.45233154296875, 208.93728637695312, 213.42222595214844, 217.90716552734375, 222.39212036132812, 226.87705993652344]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 7.0, 8.0, 7.0, 19.0, 16.0, 14.0, 13.0, 22.0, 20.0, 25.0, 28.0, 28.0, 35.0, 32.0, 39.0, 38.0, 30.0, 33.0, 37.0, 35.0, 42.0, 32.0, 41.0, 42.0, 32.0, 38.0, 38.0, 21.0, 30.0, 25.0, 20.0, 20.0, 22.0, 20.0, 8.0, 15.0, 13.0, 9.0, 8.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-24.05582618713379, -23.329723358154297, -22.603622436523438, -21.877519607543945, -21.151416778564453, -20.425315856933594, -19.6992130279541, -18.97311019897461, -18.24700927734375, -17.520906448364258, -16.7948055267334, -16.068702697753906, -15.342599868774414, -14.616497993469238, -13.890396118164062, -13.16429328918457, -12.438190460205078, -11.712088584899902, -10.98598575592041, -10.259883880615234, -9.533781051635742, -8.807679176330566, -8.08157730102539, -7.355474948883057, -6.629372596740723, -5.903270244598389, -5.177167892456055, -4.451066017150879, -3.724963665008545, -2.998861312866211, -2.272759437561035, -1.5466570854187012, -0.8205528259277344, -0.09445059299468994, 0.6316516399383545, 1.3577537536621094, 2.0838561058044434, 2.8099584579467773, 3.536060333251953, 4.262162685394287, 4.988265037536621, 5.714367389678955, 6.440469741821289, 7.166571617126465, 7.892673969268799, 8.618776321411133, 9.344878196716309, 10.070980072021484, 10.797082901000977, 11.523184776306152, 12.249287605285645, 12.97538948059082, 13.701492309570312, 14.427594184875488, 15.153696060180664, 15.879798889160156, 16.605899810791016, 17.332002639770508, 18.058103561401367, 18.78420639038086, 19.51030921936035, 20.236412048339844, 20.962512969970703, 21.688615798950195, 22.414718627929688]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 8.0, 12.0, 9.0, 13.0, 9.0, 12.0, 16.0, 13.0, 19.0, 31.0, 19.0, 12.0, 31.0, 34.0, 33.0, 36.0, 33.0, 30.0, 39.0, 40.0, 47.0, 31.0, 31.0, 45.0, 32.0, 36.0, 35.0, 35.0, 29.0, 25.0, 19.0, 23.0, 26.0, 25.0, 21.0, 13.0, 12.0, 13.0, 10.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.640625, -4.510589599609375, -4.38055419921875, -4.250518798828125, -4.1204833984375, -3.990447998046875, -3.86041259765625, -3.730377197265625, -3.600341796875, -3.470306396484375, -3.34027099609375, -3.210235595703125, -3.0802001953125, -2.950164794921875, -2.82012939453125, -2.690093994140625, -2.56005859375, -2.430023193359375, -2.29998779296875, -2.169952392578125, -2.0399169921875, -1.909881591796875, -1.77984619140625, -1.649810791015625, -1.519775390625, -1.389739990234375, -1.25970458984375, -1.129669189453125, -0.9996337890625, -0.869598388671875, -0.73956298828125, -0.609527587890625, -0.4794921875, -0.349456787109375, -0.21942138671875, -0.089385986328125, 0.0406494140625, 0.170684814453125, 0.30072021484375, 0.430755615234375, 0.560791015625, 0.690826416015625, 0.82086181640625, 0.950897216796875, 1.0809326171875, 1.210968017578125, 1.34100341796875, 1.471038818359375, 1.60107421875, 1.731109619140625, 1.86114501953125, 1.991180419921875, 2.1212158203125, 2.251251220703125, 2.38128662109375, 2.511322021484375, 2.641357421875, 2.771392822265625, 2.90142822265625, 3.031463623046875, 3.1614990234375, 3.291534423828125, 3.42156982421875, 3.551605224609375, 3.681640625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 8.0, 10.0, 16.0, 22.0, 39.0, 62.0, 65.0, 129.0, 163.0, 233.0, 401.0, 642.0, 912.0, 1355.0, 1977.0, 3016.0, 4568.0, 7157.0, 10657.0, 16430.0, 26320.0, 43260.0, 75871.0, 144626.0, 282185.0, 190852.0, 95884.0, 53646.0, 31573.0, 19703.0, 12554.0, 8239.0, 5368.0, 3477.0, 2425.0, 1610.0, 1073.0, 663.0, 435.0, 283.0, 231.0, 148.0, 94.0, 54.0, 42.0, 25.0, 17.0, 9.0, 13.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.156005859375, -0.1509227752685547, -0.14583969116210938, -0.14075660705566406, -0.13567352294921875, -0.13059043884277344, -0.12550735473632812, -0.12042427062988281, -0.1153411865234375, -0.11025810241699219, -0.10517501831054688, -0.10009193420410156, -0.09500885009765625, -0.08992576599121094, -0.08484268188476562, -0.07975959777832031, -0.074676513671875, -0.06959342956542969, -0.06451034545898438, -0.05942726135253906, -0.05434417724609375, -0.04926109313964844, -0.044178009033203125, -0.03909492492675781, -0.0340118408203125, -0.028928756713867188, -0.023845672607421875, -0.018762588500976562, -0.01367950439453125, -0.008596420288085938, -0.003513336181640625, 0.0015697479248046875, 0.00665283203125, 0.011735916137695312, 0.016819000244140625, 0.021902084350585938, 0.02698516845703125, 0.03206825256347656, 0.037151336669921875, 0.04223442077636719, 0.0473175048828125, 0.05240058898925781, 0.057483673095703125, 0.06256675720214844, 0.06764984130859375, 0.07273292541503906, 0.07781600952148438, 0.08289909362792969, 0.087982177734375, 0.09306526184082031, 0.09814834594726562, 0.10323143005371094, 0.10831451416015625, 0.11339759826660156, 0.11848068237304688, 0.12356376647949219, 0.1286468505859375, 0.1337299346923828, 0.13881301879882812, 0.14389610290527344, 0.14897918701171875, 0.15406227111816406, 0.15914535522460938, 0.1642284393310547, 0.1693115234375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 2.0, 4.0, 3.0, 8.0, 9.0, 12.0, 11.0, 8.0, 14.0, 21.0, 14.0, 22.0, 27.0, 19.0, 32.0, 28.0, 39.0, 34.0, 36.0, 41.0, 45.0, 38.0, 1072.0, 48.0, 42.0, 32.0, 30.0, 41.0, 24.0, 39.0, 33.0, 30.0, 25.0, 17.0, 23.0, 16.0, 21.0, 11.0, 14.0, 5.0, 10.0, 6.0, 10.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.662109375, -3.537933349609375, -3.41375732421875, -3.289581298828125, -3.1654052734375, -3.041229248046875, -2.91705322265625, -2.792877197265625, -2.668701171875, -2.544525146484375, -2.42034912109375, -2.296173095703125, -2.1719970703125, -2.047821044921875, -1.92364501953125, -1.799468994140625, -1.67529296875, -1.551116943359375, -1.42694091796875, -1.302764892578125, -1.1785888671875, -1.054412841796875, -0.93023681640625, -0.806060791015625, -0.681884765625, -0.557708740234375, -0.43353271484375, -0.309356689453125, -0.1851806640625, -0.061004638671875, 0.06317138671875, 0.187347412109375, 0.3115234375, 0.435699462890625, 0.55987548828125, 0.684051513671875, 0.8082275390625, 0.932403564453125, 1.05657958984375, 1.180755615234375, 1.304931640625, 1.429107666015625, 1.55328369140625, 1.677459716796875, 1.8016357421875, 1.925811767578125, 2.04998779296875, 2.174163818359375, 2.29833984375, 2.422515869140625, 2.54669189453125, 2.670867919921875, 2.7950439453125, 2.919219970703125, 3.04339599609375, 3.167572021484375, 3.291748046875, 3.415924072265625, 3.54010009765625, 3.664276123046875, 3.7884521484375, 3.912628173828125, 4.03680419921875, 4.160980224609375, 4.28515625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 10.0, 25.0, 34.0, 52.0, 67.0, 84.0, 130.0, 172.0, 246.0, 342.0, 459.0, 613.0, 886.0, 1247.0, 1631.0, 2326.0, 3319.0, 4559.0, 6274.0, 8840.0, 12787.0, 18205.0, 26840.0, 40401.0, 65178.0, 111778.0, 232978.0, 1225629.0, 122952.0, 70677.0, 43718.0, 28533.0, 19228.0, 13491.0, 9531.0, 6624.0, 4763.0, 3394.0, 2514.0, 1920.0, 1366.0, 958.0, 721.0, 455.0, 362.0, 222.0, 173.0, 115.0, 94.0, 61.0, 45.0, 33.0, 20.0, 17.0, 15.0, 5.0, 7.0, 4.0], "bins": [-0.062469482421875, -0.060581207275390625, -0.05869293212890625, -0.056804656982421875, -0.0549163818359375, -0.053028106689453125, -0.05113983154296875, -0.049251556396484375, -0.04736328125, -0.045475006103515625, -0.04358673095703125, -0.041698455810546875, -0.0398101806640625, -0.037921905517578125, -0.03603363037109375, -0.034145355224609375, -0.032257080078125, -0.030368804931640625, -0.02848052978515625, -0.026592254638671875, -0.0247039794921875, -0.022815704345703125, -0.02092742919921875, -0.019039154052734375, -0.01715087890625, -0.015262603759765625, -0.01337432861328125, -0.011486053466796875, -0.0095977783203125, -0.007709503173828125, -0.00582122802734375, -0.003932952880859375, -0.002044677734375, -0.000156402587890625, 0.00173187255859375, 0.003620147705078125, 0.0055084228515625, 0.007396697998046875, 0.00928497314453125, 0.011173248291015625, 0.0130615234375, 0.014949798583984375, 0.01683807373046875, 0.018726348876953125, 0.0206146240234375, 0.022502899169921875, 0.02439117431640625, 0.026279449462890625, 0.028167724609375, 0.030055999755859375, 0.03194427490234375, 0.033832550048828125, 0.0357208251953125, 0.037609100341796875, 0.03949737548828125, 0.041385650634765625, 0.04327392578125, 0.045162200927734375, 0.04705047607421875, 0.048938751220703125, 0.0508270263671875, 0.052715301513671875, 0.05460357666015625, 0.056491851806640625, 0.058380126953125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 9.0, 7.0, 13.0, 25.0, 31.0, 34.0, 45.0, 62.0, 80.0, 122.0, 141.0, 104.0, 73.0, 51.0, 39.0, 26.0, 29.0, 13.0, 11.0, 9.0, 12.0, 8.0, 10.0, 3.0, 5.0, 3.0, 1.0, 1.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005860328674316406, -0.000567898154258728, -0.0005497634410858154, -0.0005316287279129028, -0.0005134940147399902, -0.0004953593015670776, -0.00047722458839416504, -0.00045908987522125244, -0.00044095516204833984, -0.00042282044887542725, -0.00040468573570251465, -0.00038655102252960205, -0.00036841630935668945, -0.00035028159618377686, -0.00033214688301086426, -0.00031401216983795166, -0.00029587745666503906, -0.00027774274349212646, -0.00025960803031921387, -0.00024147331714630127, -0.00022333860397338867, -0.00020520389080047607, -0.00018706917762756348, -0.00016893446445465088, -0.00015079975128173828, -0.00013266503810882568, -0.00011453032493591309, -9.639561176300049e-05, -7.826089859008789e-05, -6.012618541717529e-05, -4.1991472244262695e-05, -2.3856759071350098e-05, -5.7220458984375e-06, 1.2412667274475098e-05, 3.0547380447387695e-05, 4.868209362030029e-05, 6.681680679321289e-05, 8.495151996612549e-05, 0.00010308623313903809, 0.00012122094631195068, 0.00013935565948486328, 0.00015749037265777588, 0.00017562508583068848, 0.00019375979900360107, 0.00021189451217651367, 0.00023002922534942627, 0.00024816393852233887, 0.00026629865169525146, 0.00028443336486816406, 0.00030256807804107666, 0.00032070279121398926, 0.00033883750438690186, 0.00035697221755981445, 0.00037510693073272705, 0.00039324164390563965, 0.00041137635707855225, 0.00042951107025146484, 0.00044764578342437744, 0.00046578049659729004, 0.00048391520977020264, 0.0005020499229431152, 0.0005201846361160278, 0.0005383193492889404, 0.000556454062461853, 0.0005745887756347656]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 8.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 10.0, 7.0, 13.0, 12.0, 18.0, 21.0, 34.0, 49.0, 86.0, 197.0, 2066.0, 1012311.0, 33020.0, 331.0, 106.0, 82.0, 38.0, 39.0, 26.0, 12.0, 4.0, 11.0, 13.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01427459716796875, -0.01382458209991455, -0.013374567031860352, -0.012924551963806152, -0.012474536895751953, -0.012024521827697754, -0.011574506759643555, -0.011124491691589355, -0.010674476623535156, -0.010224461555480957, -0.009774446487426758, -0.009324431419372559, -0.00887441635131836, -0.00842440128326416, -0.007974386215209961, -0.007524371147155762, -0.0070743560791015625, -0.006624341011047363, -0.006174325942993164, -0.005724310874938965, -0.005274295806884766, -0.004824280738830566, -0.004374265670776367, -0.003924250602722168, -0.0034742355346679688, -0.0030242204666137695, -0.0025742053985595703, -0.002124190330505371, -0.0016741752624511719, -0.0012241601943969727, -0.0007741451263427734, -0.0003241300582885742, 0.000125885009765625, 0.0005759000778198242, 0.0010259151458740234, 0.0014759302139282227, 0.0019259452819824219, 0.002375960350036621, 0.0028259754180908203, 0.0032759904861450195, 0.0037260055541992188, 0.004176020622253418, 0.004626035690307617, 0.005076050758361816, 0.005526065826416016, 0.005976080894470215, 0.006426095962524414, 0.006876111030578613, 0.0073261260986328125, 0.007776141166687012, 0.008226156234741211, 0.00867617130279541, 0.00912618637084961, 0.009576201438903809, 0.010026216506958008, 0.010476231575012207, 0.010926246643066406, 0.011376261711120605, 0.011826276779174805, 0.012276291847229004, 0.012726306915283203, 0.013176321983337402, 0.013626337051391602, 0.0140763521194458, 0.0145263671875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 11.0, 101.0, 676.0, 209.0, 21.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033415743382647634, -0.00026288485969416797, -0.0001916122855618596, -0.00012033971142955124, -4.906713729724288e-05, 2.2205436835065484e-05, 9.347801096737385e-05, 0.00016475055599585176, 0.00023602315923199058, 0.00030729573336429894, 0.0003785683074966073, 0.00044984088162891567, 0.000521113455761224, 0.0005923860007897019, 0.0006636586040258408, 0.0007349311490543187, 0.0008062037522904575, 0.0008774762973189354, 0.0009487489005550742, 0.001020021503791213, 0.00109129399061203, 0.0011625665938481688, 0.0012338391970843077, 0.0013051116839051247, 0.0013763844035565853, 0.0014476570067927241, 0.001518929610028863, 0.00159020209684968, 0.0016614747000858188, 0.0017327473033219576, 0.0018040197901427746, 0.0018752923933789134, 0.0019465647637844086, 0.0020178372506052256, 0.002089109970256686, 0.002160382457077503, 0.002231655176728964, 0.002302927663549781, 0.002374200150370598, 0.0024454728700220585, 0.0025167453568428755, 0.0025880178436636925, 0.002659290563315153, 0.00273056305013597, 0.002801835536956787, 0.0028731082566082478, 0.0029443807434290648, 0.0030156532302498817, 0.0030869259499013424, 0.0031581984367221594, 0.00322947115637362, 0.003300743643194437, 0.0033720163628458977, 0.0034432888496667147, 0.0035145613364875317, 0.0035858340561389923, 0.0036571065429598093, 0.0037283790297806263, 0.003799651749432087, 0.003870924236252904, 0.003942196723073721, 0.004013469442725182, 0.004084742162376642, 0.004156014416366816, 0.004227287136018276]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 7.0, 9.0, 10.0, 11.0, 18.0, 15.0, 21.0, 25.0, 35.0, 27.0, 18.0, 31.0, 42.0, 34.0, 36.0, 55.0, 41.0, 48.0, 48.0, 43.0, 53.0, 33.0, 43.0, 38.0, 49.0, 26.0, 28.0, 29.0, 25.0, 10.0, 25.0, 12.0, 4.0, 9.0, 8.0, 6.0, 4.0, 3.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002391338348388672, -0.0002312762662768364, -0.0002234186977148056, -0.0002155611291527748, -0.00020770356059074402, -0.00019984599202871323, -0.00019198842346668243, -0.00018413085490465164, -0.00017627328634262085, -0.00016841571778059006, -0.00016055814921855927, -0.00015270058065652847, -0.00014484301209449768, -0.0001369854435324669, -0.0001291278749704361, -0.0001212703064084053, -0.00011341273784637451, -0.00010555516928434372, -9.769760072231293e-05, -8.984003216028214e-05, -8.198246359825134e-05, -7.412489503622055e-05, -6.626732647418976e-05, -5.8409757912158966e-05, -5.0552189350128174e-05, -4.269462078809738e-05, -3.483705222606659e-05, -2.6979483664035797e-05, -1.9121915102005005e-05, -1.1264346539974213e-05, -3.4067779779434204e-06, 4.450790584087372e-06, 1.2308359146118164e-05, 2.0165927708148956e-05, 2.802349627017975e-05, 3.588106483221054e-05, 4.373863339424133e-05, 5.1596201956272125e-05, 5.945377051830292e-05, 6.731133908033371e-05, 7.51689076423645e-05, 8.30264762043953e-05, 9.088404476642609e-05, 9.874161332845688e-05, 0.00010659918189048767, 0.00011445675045251846, 0.00012231431901454926, 0.00013017188757658005, 0.00013802945613861084, 0.00014588702470064163, 0.00015374459326267242, 0.00016160216182470322, 0.000169459730386734, 0.0001773172989487648, 0.0001851748675107956, 0.00019303243607282639, 0.00020089000463485718, 0.00020874757319688797, 0.00021660514175891876, 0.00022446271032094955, 0.00023232027888298035, 0.00024017784744501114, 0.00024803541600704193, 0.0002558929845690727, 0.0002637505531311035]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 8.0, 12.0, 9.0, 13.0, 9.0, 12.0, 16.0, 13.0, 19.0, 31.0, 19.0, 12.0, 31.0, 34.0, 33.0, 36.0, 33.0, 30.0, 39.0, 40.0, 47.0, 31.0, 31.0, 45.0, 32.0, 36.0, 35.0, 35.0, 29.0, 25.0, 19.0, 23.0, 26.0, 25.0, 21.0, 13.0, 12.0, 13.0, 10.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.640625, -4.510589599609375, -4.38055419921875, -4.250518798828125, -4.1204833984375, -3.990447998046875, -3.86041259765625, -3.730377197265625, -3.600341796875, -3.470306396484375, -3.34027099609375, -3.210235595703125, -3.0802001953125, -2.950164794921875, -2.82012939453125, -2.690093994140625, -2.56005859375, -2.430023193359375, -2.29998779296875, -2.169952392578125, -2.0399169921875, -1.909881591796875, -1.77984619140625, -1.649810791015625, -1.519775390625, -1.389739990234375, -1.25970458984375, -1.129669189453125, -0.9996337890625, -0.869598388671875, -0.73956298828125, -0.609527587890625, -0.4794921875, -0.349456787109375, -0.21942138671875, -0.089385986328125, 0.0406494140625, 0.170684814453125, 0.30072021484375, 0.430755615234375, 0.560791015625, 0.690826416015625, 0.82086181640625, 0.950897216796875, 1.0809326171875, 1.210968017578125, 1.34100341796875, 1.471038818359375, 1.60107421875, 1.731109619140625, 1.86114501953125, 1.991180419921875, 2.1212158203125, 2.251251220703125, 2.38128662109375, 2.511322021484375, 2.641357421875, 2.771392822265625, 2.90142822265625, 3.031463623046875, 3.1614990234375, 3.291534423828125, 3.42156982421875, 3.551605224609375, 3.681640625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 4.0, 12.0, 14.0, 14.0, 20.0, 21.0, 45.0, 46.0, 79.0, 125.0, 170.0, 228.0, 395.0, 701.0, 1140.0, 1935.0, 3716.0, 6685.0, 12810.0, 26560.0, 60354.0, 182171.0, 480187.0, 163080.0, 56389.0, 24782.0, 12206.0, 6268.0, 3503.0, 1921.0, 1142.0, 652.0, 388.0, 252.0, 168.0, 108.0, 71.0, 54.0, 34.0, 36.0, 20.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.68359375, -6.45672607421875, -6.2298583984375, -6.00299072265625, -5.776123046875, -5.54925537109375, -5.3223876953125, -5.09552001953125, -4.86865234375, -4.64178466796875, -4.4149169921875, -4.18804931640625, -3.961181640625, -3.73431396484375, -3.5074462890625, -3.28057861328125, -3.0537109375, -2.82684326171875, -2.5999755859375, -2.37310791015625, -2.146240234375, -1.91937255859375, -1.6925048828125, -1.46563720703125, -1.23876953125, -1.01190185546875, -0.7850341796875, -0.55816650390625, -0.331298828125, -0.10443115234375, 0.1224365234375, 0.34930419921875, 0.576171875, 0.80303955078125, 1.0299072265625, 1.25677490234375, 1.483642578125, 1.71051025390625, 1.9373779296875, 2.16424560546875, 2.39111328125, 2.61798095703125, 2.8448486328125, 3.07171630859375, 3.298583984375, 3.52545166015625, 3.7523193359375, 3.97918701171875, 4.2060546875, 4.43292236328125, 4.6597900390625, 4.88665771484375, 5.113525390625, 5.34039306640625, 5.5672607421875, 5.79412841796875, 6.02099609375, 6.24786376953125, 6.4747314453125, 6.70159912109375, 6.928466796875, 7.15533447265625, 7.3822021484375, 7.60906982421875, 7.8359375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 11.0, 10.0, 10.0, 30.0, 22.0, 24.0, 40.0, 33.0, 36.0, 29.0, 54.0, 69.0, 69.0, 112.0, 201.0, 1392.0, 252.0, 121.0, 91.0, 76.0, 42.0, 39.0, 31.0, 42.0, 39.0, 25.0, 27.0, 14.0, 19.0, 18.0, 8.0, 14.0, 8.0, 6.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.7734375, -12.3699951171875, -11.966552734375, -11.5631103515625, -11.15966796875, -10.7562255859375, -10.352783203125, -9.9493408203125, -9.5458984375, -9.1424560546875, -8.739013671875, -8.3355712890625, -7.93212890625, -7.5286865234375, -7.125244140625, -6.7218017578125, -6.318359375, -5.9149169921875, -5.511474609375, -5.1080322265625, -4.70458984375, -4.3011474609375, -3.897705078125, -3.4942626953125, -3.0908203125, -2.6873779296875, -2.283935546875, -1.8804931640625, -1.47705078125, -1.0736083984375, -0.670166015625, -0.2667236328125, 0.13671875, 0.5401611328125, 0.943603515625, 1.3470458984375, 1.75048828125, 2.1539306640625, 2.557373046875, 2.9608154296875, 3.3642578125, 3.7677001953125, 4.171142578125, 4.5745849609375, 4.97802734375, 5.3814697265625, 5.784912109375, 6.1883544921875, 6.591796875, 6.9952392578125, 7.398681640625, 7.8021240234375, 8.20556640625, 8.6090087890625, 9.012451171875, 9.4158935546875, 9.8193359375, 10.2227783203125, 10.626220703125, 11.0296630859375, 11.43310546875, 11.8365478515625, 12.239990234375, 12.6434326171875, 13.046875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 8.0, 10.0, 14.0, 10.0, 12.0, 27.0, 34.0, 53.0, 76.0, 126.0, 182.0, 264.0, 461.0, 827.0, 2060.0, 7056.0, 37158.0, 412344.0, 2486086.0, 170518.0, 20528.0, 4531.0, 1477.0, 692.0, 416.0, 239.0, 139.0, 97.0, 64.0, 58.0, 28.0, 24.0, 18.0, 12.0, 17.0, 10.0, 6.0, 1.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 4.0], "bins": [-18.9375, -18.4163818359375, -17.895263671875, -17.3741455078125, -16.85302734375, -16.3319091796875, -15.810791015625, -15.2896728515625, -14.7685546875, -14.2474365234375, -13.726318359375, -13.2052001953125, -12.68408203125, -12.1629638671875, -11.641845703125, -11.1207275390625, -10.599609375, -10.0784912109375, -9.557373046875, -9.0362548828125, -8.51513671875, -7.9940185546875, -7.472900390625, -6.9517822265625, -6.4306640625, -5.9095458984375, -5.388427734375, -4.8673095703125, -4.34619140625, -3.8250732421875, -3.303955078125, -2.7828369140625, -2.26171875, -1.7406005859375, -1.219482421875, -0.6983642578125, -0.17724609375, 0.3438720703125, 0.864990234375, 1.3861083984375, 1.9072265625, 2.4283447265625, 2.949462890625, 3.4705810546875, 3.99169921875, 4.5128173828125, 5.033935546875, 5.5550537109375, 6.076171875, 6.5972900390625, 7.118408203125, 7.6395263671875, 8.16064453125, 8.6817626953125, 9.202880859375, 9.7239990234375, 10.2451171875, 10.7662353515625, 11.287353515625, 11.8084716796875, 12.32958984375, 12.8507080078125, 13.371826171875, 13.8929443359375, 14.4140625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 87.0, 509.0, 368.0, 45.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-250.22364807128906, -245.8242950439453, -241.4249267578125, -237.02557373046875, -232.62620544433594, -228.2268524169922, -223.82748413085938, -219.42813110351562, -215.02877807617188, -210.62942504882812, -206.2300567626953, -201.83070373535156, -197.43133544921875, -193.031982421875, -188.6326141357422, -184.23326110839844, -179.83389282226562, -175.43453979492188, -171.03517150878906, -166.6358184814453, -162.2364501953125, -157.83709716796875, -153.43772888183594, -149.0383758544922, -144.63900756835938, -140.23965454101562, -135.8402862548828, -131.44093322753906, -127.04156494140625, -122.6422119140625, -118.24285125732422, -113.84349060058594, -109.44413757324219, -105.0447769165039, -100.64541625976562, -96.24605560302734, -91.84669494628906, -87.44734191894531, -83.04798126220703, -78.64862060546875, -74.24925994873047, -69.84989929199219, -65.4505386352539, -61.05118179321289, -56.65182113647461, -52.25246047973633, -47.85310363769531, -43.45374298095703, -39.05438232421875, -34.65502166748047, -30.25566291809082, -25.856304168701172, -21.45694351196289, -17.05758285522461, -12.658224105834961, -8.258865356445312, -3.8595046997070312, 0.5398550033569336, 4.939214706420898, 9.338574409484863, 13.737934112548828, 18.13729476928711, 22.536653518676758, 26.936012268066406, 31.335372924804688]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 5.0, 6.0, 5.0, 6.0, 12.0, 10.0, 17.0, 30.0, 16.0, 20.0, 17.0, 21.0, 33.0, 29.0, 31.0, 17.0, 42.0, 28.0, 35.0, 44.0, 35.0, 37.0, 32.0, 33.0, 41.0, 38.0, 25.0, 46.0, 29.0, 31.0, 31.0, 26.0, 17.0, 17.0, 14.0, 21.0, 17.0, 5.0, 17.0, 12.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0], "bins": [-30.363006591796875, -29.4329833984375, -28.502960205078125, -27.57293701171875, -26.642915725708008, -25.712892532348633, -24.782869338989258, -23.852846145629883, -22.922822952270508, -21.992799758911133, -21.062776565551758, -20.132755279541016, -19.20273208618164, -18.272708892822266, -17.34268569946289, -16.412662506103516, -15.482640266418457, -14.552617073059082, -13.622594833374023, -12.692571640014648, -11.762548446655273, -10.832525253295898, -9.90250301361084, -8.972479820251465, -8.042457580566406, -7.1124348640441895, -6.1824116706848145, -5.252388954162598, -4.322365760803223, -3.392343044281006, -2.462320327758789, -1.532297134399414, -0.6022739410400391, 0.32774895429611206, 1.2577718496322632, 2.1877946853637695, 3.1178176403045654, 4.047840595245361, 4.977863311767578, 5.907886505126953, 6.83790922164917, 7.767931938171387, 8.697955131530762, 9.62797737121582, 10.558000564575195, 11.48802375793457, 12.418046951293945, 13.34807014465332, 14.278092384338379, 15.208115577697754, 16.138137817382812, 17.068161010742188, 17.998184204101562, 18.928207397460938, 19.858230590820312, 20.788253784179688, 21.71827507019043, 22.648298263549805, 23.57832145690918, 24.508342742919922, 25.438365936279297, 26.368389129638672, 27.298412322998047, 28.228435516357422, 29.158458709716797]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 11.0, 7.0, 6.0, 17.0, 15.0, 13.0, 13.0, 17.0, 19.0, 26.0, 20.0, 20.0, 36.0, 31.0, 24.0, 41.0, 31.0, 27.0, 37.0, 37.0, 36.0, 35.0, 38.0, 39.0, 39.0, 38.0, 32.0, 33.0, 21.0, 26.0, 19.0, 22.0, 27.0, 19.0, 17.0, 14.0, 13.0, 14.0, 11.0, 5.0, 9.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.11468505859375, -3.9871826171875, -3.85968017578125, -3.732177734375, -3.60467529296875, -3.4771728515625, -3.34967041015625, -3.22216796875, -3.09466552734375, -2.9671630859375, -2.83966064453125, -2.712158203125, -2.58465576171875, -2.4571533203125, -2.32965087890625, -2.2021484375, -2.07464599609375, -1.9471435546875, -1.81964111328125, -1.692138671875, -1.56463623046875, -1.4371337890625, -1.30963134765625, -1.18212890625, -1.05462646484375, -0.9271240234375, -0.79962158203125, -0.672119140625, -0.54461669921875, -0.4171142578125, -0.28961181640625, -0.162109375, -0.03460693359375, 0.0928955078125, 0.22039794921875, 0.347900390625, 0.47540283203125, 0.6029052734375, 0.73040771484375, 0.85791015625, 0.98541259765625, 1.1129150390625, 1.24041748046875, 1.367919921875, 1.49542236328125, 1.6229248046875, 1.75042724609375, 1.8779296875, 2.00543212890625, 2.1329345703125, 2.26043701171875, 2.387939453125, 2.51544189453125, 2.6429443359375, 2.77044677734375, 2.89794921875, 3.02545166015625, 3.1529541015625, 3.28045654296875, 3.407958984375, 3.53546142578125, 3.6629638671875, 3.79046630859375, 3.91796875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 4.0, 7.0, 6.0, 9.0, 10.0, 12.0, 24.0, 33.0, 44.0, 63.0, 83.0, 122.0, 187.0, 301.0, 487.0, 887.0, 1822.0, 4047.0, 10502.0, 36558.0, 208679.0, 1468096.0, 2044994.0, 340484.0, 53285.0, 13435.0, 5010.0, 2236.0, 1098.0, 638.0, 388.0, 236.0, 139.0, 93.0, 65.0, 47.0, 41.0, 23.0, 21.0, 12.0, 15.0, 10.0, 4.0, 4.0, 2.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.078125, -8.7767333984375, -8.475341796875, -8.1739501953125, -7.87255859375, -7.5711669921875, -7.269775390625, -6.9683837890625, -6.6669921875, -6.3656005859375, -6.064208984375, -5.7628173828125, -5.46142578125, -5.1600341796875, -4.858642578125, -4.5572509765625, -4.255859375, -3.9544677734375, -3.653076171875, -3.3516845703125, -3.05029296875, -2.7489013671875, -2.447509765625, -2.1461181640625, -1.8447265625, -1.5433349609375, -1.241943359375, -0.9405517578125, -0.63916015625, -0.3377685546875, -0.036376953125, 0.2650146484375, 0.56640625, 0.8677978515625, 1.169189453125, 1.4705810546875, 1.77197265625, 2.0733642578125, 2.374755859375, 2.6761474609375, 2.9775390625, 3.2789306640625, 3.580322265625, 3.8817138671875, 4.18310546875, 4.4844970703125, 4.785888671875, 5.0872802734375, 5.388671875, 5.6900634765625, 5.991455078125, 6.2928466796875, 6.59423828125, 6.8956298828125, 7.197021484375, 7.4984130859375, 7.7998046875, 8.1011962890625, 8.402587890625, 8.7039794921875, 9.00537109375, 9.3067626953125, 9.608154296875, 9.9095458984375, 10.2109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 12.0, 10.0, 13.0, 18.0, 23.0, 28.0, 26.0, 35.0, 47.0, 50.0, 97.0, 131.0, 180.0, 192.0, 281.0, 373.0, 422.0, 429.0, 422.0, 312.0, 246.0, 150.0, 129.0, 97.0, 67.0, 62.0, 50.0, 38.0, 26.0, 20.0, 16.0, 12.0, 17.0, 6.0, 5.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.80078125, -5.6025390625, -5.404296875, -5.2060546875, -5.0078125, -4.8095703125, -4.611328125, -4.4130859375, -4.21484375, -4.0166015625, -3.818359375, -3.6201171875, -3.421875, -3.2236328125, -3.025390625, -2.8271484375, -2.62890625, -2.4306640625, -2.232421875, -2.0341796875, -1.8359375, -1.6376953125, -1.439453125, -1.2412109375, -1.04296875, -0.8447265625, -0.646484375, -0.4482421875, -0.25, -0.0517578125, 0.146484375, 0.3447265625, 0.54296875, 0.7412109375, 0.939453125, 1.1376953125, 1.3359375, 1.5341796875, 1.732421875, 1.9306640625, 2.12890625, 2.3271484375, 2.525390625, 2.7236328125, 2.921875, 3.1201171875, 3.318359375, 3.5166015625, 3.71484375, 3.9130859375, 4.111328125, 4.3095703125, 4.5078125, 4.7060546875, 4.904296875, 5.1025390625, 5.30078125, 5.4990234375, 5.697265625, 5.8955078125, 6.09375, 6.2919921875, 6.490234375, 6.6884765625, 6.88671875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 4.0, 5.0, 9.0, 10.0, 12.0, 27.0, 16.0, 26.0, 30.0, 51.0, 80.0, 100.0, 168.0, 248.0, 411.0, 802.0, 1760.0, 5027.0, 21086.0, 139569.0, 1843245.0, 1999434.0, 150385.0, 22486.0, 5377.0, 1823.0, 860.0, 439.0, 250.0, 148.0, 104.0, 74.0, 54.0, 39.0, 36.0, 23.0, 14.0, 15.0, 8.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-17.40625, -16.9229736328125, -16.439697265625, -15.9564208984375, -15.47314453125, -14.9898681640625, -14.506591796875, -14.0233154296875, -13.5400390625, -13.0567626953125, -12.573486328125, -12.0902099609375, -11.60693359375, -11.1236572265625, -10.640380859375, -10.1571044921875, -9.673828125, -9.1905517578125, -8.707275390625, -8.2239990234375, -7.74072265625, -7.2574462890625, -6.774169921875, -6.2908935546875, -5.8076171875, -5.3243408203125, -4.841064453125, -4.3577880859375, -3.87451171875, -3.3912353515625, -2.907958984375, -2.4246826171875, -1.94140625, -1.4581298828125, -0.974853515625, -0.4915771484375, -0.00830078125, 0.4749755859375, 0.958251953125, 1.4415283203125, 1.9248046875, 2.4080810546875, 2.891357421875, 3.3746337890625, 3.85791015625, 4.3411865234375, 4.824462890625, 5.3077392578125, 5.791015625, 6.2742919921875, 6.757568359375, 7.2408447265625, 7.72412109375, 8.2073974609375, 8.690673828125, 9.1739501953125, 9.6572265625, 10.1405029296875, 10.623779296875, 11.1070556640625, 11.59033203125, 12.0736083984375, 12.556884765625, 13.0401611328125, 13.5234375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 13.0, 63.0, 191.0, 350.0, 259.0, 102.0, 29.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.66197204589844, -52.304664611816406, -48.947357177734375, -45.59005355834961, -42.23274612426758, -38.87543869018555, -35.51813507080078, -32.16082763671875, -28.80352020263672, -25.446212768554688, -22.08890724182129, -18.73160171508789, -15.37429428100586, -12.016986846923828, -8.65968132019043, -5.302375793457031, -1.945068359375, 1.4122381210327148, 4.76954460144043, 8.126851081848145, 11.48415756225586, 14.84146499633789, 18.19877052307129, 21.556076049804688, 24.91338348388672, 28.27069091796875, 31.62799644470215, 34.98530197143555, 38.34260940551758, 41.69991683959961, 45.057220458984375, 48.414527893066406, 51.77183532714844, 55.12914276123047, 58.4864501953125, 61.843753814697266, 65.20106506347656, 68.55836486816406, 71.9156723022461, 75.27297973632812, 78.63028717041016, 81.98759460449219, 85.34490203857422, 88.70220947265625, 92.05950927734375, 95.41682434082031, 98.77412414550781, 102.13143157958984, 105.48873901367188, 108.8460464477539, 112.20335388183594, 115.56066131591797, 118.91796875, 122.2752685546875, 125.63257598876953, 128.98988342285156, 132.34719848632812, 135.70449829101562, 139.0618133544922, 142.4191131591797, 145.77642822265625, 149.13372802734375, 152.4910430908203, 155.8483428955078, 159.2056427001953]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 7.0, 5.0, 4.0, 9.0, 7.0, 15.0, 14.0, 21.0, 20.0, 19.0, 27.0, 26.0, 34.0, 27.0, 37.0, 34.0, 37.0, 38.0, 35.0, 48.0, 43.0, 38.0, 42.0, 35.0, 38.0, 52.0, 35.0, 31.0, 30.0, 27.0, 21.0, 24.0, 26.0, 12.0, 17.0, 9.0, 14.0, 9.0, 11.0, 5.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.901531219482422, -24.117189407348633, -23.33284568786621, -22.548503875732422, -21.76416015625, -20.97981834411621, -20.195476531982422, -19.4111328125, -18.626789093017578, -17.84244728088379, -17.058103561401367, -16.273761749267578, -15.489418029785156, -14.705076217651367, -13.920733451843262, -13.136390686035156, -12.352048873901367, -11.567706108093262, -10.783363342285156, -9.999021530151367, -9.214677810668945, -8.430335998535156, -7.645993232727051, -6.861650466918945, -6.07730770111084, -5.292964935302734, -4.508622169494629, -3.7242798805236816, -2.939937114715576, -2.1555943489074707, -1.3712520599365234, -0.586909294128418, 0.1974334716796875, 0.9817761182785034, 1.7661187648773193, 2.5504612922668457, 3.334804058074951, 4.119146823883057, 4.903489112854004, 5.687831878662109, 6.472174644470215, 7.25651741027832, 8.040860176086426, 8.825202941894531, 9.60954475402832, 10.393888473510742, 11.178230285644531, 11.962573051452637, 12.746915817260742, 13.531258583068848, 14.315601348876953, 15.099943161010742, 15.884286880493164, 16.668628692626953, 17.452972412109375, 18.237314224243164, 19.021656036376953, 19.805997848510742, 20.590341567993164, 21.374683380126953, 22.159027099609375, 22.943368911743164, 23.727710723876953, 24.512054443359375, 25.296398162841797]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 13.0, 10.0, 5.0, 11.0, 9.0, 13.0, 18.0, 9.0, 21.0, 19.0, 17.0, 21.0, 32.0, 25.0, 32.0, 23.0, 44.0, 28.0, 31.0, 41.0, 40.0, 36.0, 42.0, 38.0, 36.0, 36.0, 40.0, 41.0, 19.0, 34.0, 28.0, 24.0, 22.0, 17.0, 15.0, 18.0, 16.0, 8.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.56640625, -4.43212890625, -4.2978515625, -4.16357421875, -4.029296875, -3.89501953125, -3.7607421875, -3.62646484375, -3.4921875, -3.35791015625, -3.2236328125, -3.08935546875, -2.955078125, -2.82080078125, -2.6865234375, -2.55224609375, -2.41796875, -2.28369140625, -2.1494140625, -2.01513671875, -1.880859375, -1.74658203125, -1.6123046875, -1.47802734375, -1.34375, -1.20947265625, -1.0751953125, -0.94091796875, -0.806640625, -0.67236328125, -0.5380859375, -0.40380859375, -0.26953125, -0.13525390625, -0.0009765625, 0.13330078125, 0.267578125, 0.40185546875, 0.5361328125, 0.67041015625, 0.8046875, 0.93896484375, 1.0732421875, 1.20751953125, 1.341796875, 1.47607421875, 1.6103515625, 1.74462890625, 1.87890625, 2.01318359375, 2.1474609375, 2.28173828125, 2.416015625, 2.55029296875, 2.6845703125, 2.81884765625, 2.953125, 3.08740234375, 3.2216796875, 3.35595703125, 3.490234375, 3.62451171875, 3.7587890625, 3.89306640625, 4.02734375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 17.0, 19.0, 21.0, 36.0, 50.0, 70.0, 95.0, 134.0, 217.0, 349.0, 500.0, 642.0, 992.0, 1479.0, 2147.0, 3254.0, 4769.0, 7232.0, 10630.0, 16475.0, 24964.0, 39789.0, 66783.0, 120375.0, 252705.0, 221679.0, 107766.0, 60248.0, 36537.0, 23065.0, 15085.0, 9913.0, 6745.0, 4512.0, 2954.0, 1979.0, 1412.0, 908.0, 590.0, 466.0, 306.0, 191.0, 137.0, 103.0, 75.0, 37.0, 33.0, 22.0, 22.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.156982421875, -0.15221214294433594, -0.14744186401367188, -0.1426715850830078, -0.13790130615234375, -0.1331310272216797, -0.12836074829101562, -0.12359046936035156, -0.1188201904296875, -0.11404991149902344, -0.10927963256835938, -0.10450935363769531, -0.09973907470703125, -0.09496879577636719, -0.09019851684570312, -0.08542823791503906, -0.080657958984375, -0.07588768005371094, -0.07111740112304688, -0.06634712219238281, -0.06157684326171875, -0.05680656433105469, -0.052036285400390625, -0.04726600646972656, -0.0424957275390625, -0.03772544860839844, -0.032955169677734375, -0.028184890747070312, -0.02341461181640625, -0.018644332885742188, -0.013874053955078125, -0.009103775024414062, -0.00433349609375, 0.0004367828369140625, 0.005207061767578125, 0.009977340698242188, 0.01474761962890625, 0.019517898559570312, 0.024288177490234375, 0.029058456420898438, 0.0338287353515625, 0.03859901428222656, 0.043369293212890625, 0.04813957214355469, 0.05290985107421875, 0.05768013000488281, 0.062450408935546875, 0.06722068786621094, 0.071990966796875, 0.07676124572753906, 0.08153152465820312, 0.08630180358886719, 0.09107208251953125, 0.09584236145019531, 0.10061264038085938, 0.10538291931152344, 0.1101531982421875, 0.11492347717285156, 0.11969375610351562, 0.12446403503417969, 0.12923431396484375, 0.1340045928955078, 0.13877487182617188, 0.14354515075683594, 0.1483154296875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 9.0, 14.0, 9.0, 10.0, 15.0, 19.0, 24.0, 15.0, 24.0, 24.0, 34.0, 39.0, 32.0, 32.0, 38.0, 34.0, 41.0, 29.0, 38.0, 1056.0, 38.0, 41.0, 47.0, 38.0, 41.0, 34.0, 28.0, 24.0, 17.0, 20.0, 21.0, 14.0, 15.0, 13.0, 16.0, 12.0, 13.0, 6.0, 9.0, 5.0, 12.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.383758544921875, -3.27532958984375, -3.166900634765625, -3.0584716796875, -2.950042724609375, -2.84161376953125, -2.733184814453125, -2.624755859375, -2.516326904296875, -2.40789794921875, -2.299468994140625, -2.1910400390625, -2.082611083984375, -1.97418212890625, -1.865753173828125, -1.75732421875, -1.648895263671875, -1.54046630859375, -1.432037353515625, -1.3236083984375, -1.215179443359375, -1.10675048828125, -0.998321533203125, -0.889892578125, -0.781463623046875, -0.67303466796875, -0.564605712890625, -0.4561767578125, -0.347747802734375, -0.23931884765625, -0.130889892578125, -0.0224609375, 0.085968017578125, 0.19439697265625, 0.302825927734375, 0.4112548828125, 0.519683837890625, 0.62811279296875, 0.736541748046875, 0.844970703125, 0.953399658203125, 1.06182861328125, 1.170257568359375, 1.2786865234375, 1.387115478515625, 1.49554443359375, 1.603973388671875, 1.71240234375, 1.820831298828125, 1.92926025390625, 2.037689208984375, 2.1461181640625, 2.254547119140625, 2.36297607421875, 2.471405029296875, 2.579833984375, 2.688262939453125, 2.79669189453125, 2.905120849609375, 3.0135498046875, 3.121978759765625, 3.23040771484375, 3.338836669921875, 3.447265625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 8.0, 4.0, 11.0, 21.0, 30.0, 46.0, 66.0, 87.0, 131.0, 201.0, 312.0, 411.0, 594.0, 903.0, 1406.0, 2067.0, 2996.0, 4286.0, 6288.0, 9321.0, 14073.0, 21696.0, 34385.0, 55239.0, 94115.0, 175796.0, 1300306.0, 150478.0, 83028.0, 49185.0, 30456.0, 19474.0, 13070.0, 8712.0, 6034.0, 3901.0, 2505.0, 1703.0, 1175.0, 827.0, 577.0, 408.0, 251.0, 174.0, 128.0, 74.0, 54.0, 42.0, 27.0, 15.0, 15.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.0672607421875, -0.06518363952636719, -0.06310653686523438, -0.06102943420410156, -0.05895233154296875, -0.05687522888183594, -0.054798126220703125, -0.05272102355957031, -0.0506439208984375, -0.04856681823730469, -0.046489715576171875, -0.04441261291503906, -0.04233551025390625, -0.04025840759277344, -0.038181304931640625, -0.03610420227050781, -0.034027099609375, -0.03194999694824219, -0.029872894287109375, -0.027795791625976562, -0.02571868896484375, -0.023641586303710938, -0.021564483642578125, -0.019487380981445312, -0.0174102783203125, -0.015333175659179688, -0.013256072998046875, -0.011178970336914062, -0.00910186767578125, -0.0070247650146484375, -0.004947662353515625, -0.0028705596923828125, -0.00079345703125, 0.0012836456298828125, 0.003360748291015625, 0.0054378509521484375, 0.00751495361328125, 0.009592056274414062, 0.011669158935546875, 0.013746261596679688, 0.0158233642578125, 0.017900466918945312, 0.019977569580078125, 0.022054672241210938, 0.02413177490234375, 0.026208877563476562, 0.028285980224609375, 0.030363082885742188, 0.032440185546875, 0.03451728820800781, 0.036594390869140625, 0.03867149353027344, 0.04074859619140625, 0.04282569885253906, 0.044902801513671875, 0.04697990417480469, 0.0490570068359375, 0.05113410949707031, 0.053211212158203125, 0.05528831481933594, 0.05736541748046875, 0.05944252014160156, 0.061519622802734375, 0.06359672546386719, 0.065673828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 11.0, 5.0, 6.0, 7.0, 9.0, 13.0, 17.0, 16.0, 19.0, 17.0, 10.0, 33.0, 37.0, 56.0, 76.0, 108.0, 125.0, 127.0, 61.0, 52.0, 43.0, 27.0, 15.0, 16.0, 14.0, 12.0, 3.0, 9.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0003745555877685547, -0.00036362186074256897, -0.00035268813371658325, -0.00034175440669059753, -0.0003308206796646118, -0.0003198869526386261, -0.0003089532256126404, -0.00029801949858665466, -0.00028708577156066895, -0.00027615204453468323, -0.0002652183175086975, -0.0002542845904827118, -0.00024335086345672607, -0.00023241713643074036, -0.00022148340940475464, -0.00021054968237876892, -0.0001996159553527832, -0.00018868222832679749, -0.00017774850130081177, -0.00016681477427482605, -0.00015588104724884033, -0.00014494732022285461, -0.0001340135931968689, -0.00012307986617088318, -0.00011214613914489746, -0.00010121241211891174, -9.027868509292603e-05, -7.934495806694031e-05, -6.841123104095459e-05, -5.747750401496887e-05, -4.6543776988983154e-05, -3.5610049962997437e-05, -2.467632293701172e-05, -1.3742595911026001e-05, -2.808868885040283e-06, 8.124858140945435e-06, 1.9058585166931152e-05, 2.999231219291687e-05, 4.092603921890259e-05, 5.1859766244888306e-05, 6.279349327087402e-05, 7.372722029685974e-05, 8.466094732284546e-05, 9.559467434883118e-05, 0.0001065284013748169, 0.00011746212840080261, 0.00012839585542678833, 0.00013932958245277405, 0.00015026330947875977, 0.00016119703650474548, 0.0001721307635307312, 0.00018306449055671692, 0.00019399821758270264, 0.00020493194460868835, 0.00021586567163467407, 0.0002267993986606598, 0.0002377331256866455, 0.0002486668527126312, 0.00025960057973861694, 0.00027053430676460266, 0.0002814680337905884, 0.0002924017608165741, 0.0003033354878425598, 0.00031426921486854553, 0.00032520294189453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 5.0, 9.0, 7.0, 6.0, 18.0, 17.0, 22.0, 37.0, 67.0, 120.0, 244.0, 2139.0, 776753.0, 267178.0, 1378.0, 200.0, 104.0, 54.0, 26.0, 23.0, 18.0, 18.0, 17.0, 12.0, 9.0, 6.0, 5.0, 8.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00846099853515625, -0.008178353309631348, -0.007895708084106445, -0.007613062858581543, -0.007330417633056641, -0.007047772407531738, -0.006765127182006836, -0.006482481956481934, -0.006199836730957031, -0.005917191505432129, -0.0056345462799072266, -0.005351901054382324, -0.005069255828857422, -0.0047866106033325195, -0.004503965377807617, -0.004221320152282715, -0.0039386749267578125, -0.00365602970123291, -0.003373384475708008, -0.0030907392501831055, -0.002808094024658203, -0.0025254487991333008, -0.0022428035736083984, -0.001960158348083496, -0.0016775131225585938, -0.0013948678970336914, -0.001112222671508789, -0.0008295774459838867, -0.0005469322204589844, -0.00026428699493408203, 1.8358230590820312e-05, 0.00030100345611572266, 0.000583648681640625, 0.0008662939071655273, 0.0011489391326904297, 0.001431584358215332, 0.0017142295837402344, 0.0019968748092651367, 0.002279520034790039, 0.0025621652603149414, 0.0028448104858398438, 0.003127455711364746, 0.0034101009368896484, 0.0036927461624145508, 0.003975391387939453, 0.0042580366134643555, 0.004540681838989258, 0.00482332706451416, 0.0051059722900390625, 0.005388617515563965, 0.005671262741088867, 0.0059539079666137695, 0.006236553192138672, 0.006519198417663574, 0.0068018436431884766, 0.007084488868713379, 0.007367134094238281, 0.007649779319763184, 0.007932424545288086, 0.008215069770812988, 0.00849771499633789, 0.008780360221862793, 0.009063005447387695, 0.009345650672912598, 0.0096282958984375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 13.0, 32.0, 122.0, 371.0, 344.0, 97.0, 22.0, 10.0, 5.0, 0.0, 1.0], "bins": [-0.0019118670606985688, -0.001878263894468546, -0.001844660728238523, -0.0018110575620085, -0.0017774543957784772, -0.0017438512295484543, -0.0017102480633184314, -0.0016766448970884085, -0.0016430417308583856, -0.0016094385646283627, -0.0015758353983983397, -0.0015422322321683168, -0.001508629065938294, -0.001475025899708271, -0.0014414227334782481, -0.0014078195672482252, -0.0013742165174335241, -0.0013406133512035012, -0.0013070101849734783, -0.0012734070187434554, -0.0012398038525134325, -0.0012062006862834096, -0.0011725975200533867, -0.0011389943538233638, -0.0011053911875933409, -0.001071788021363318, -0.001038184855133295, -0.0010045816889032722, -0.0009709785226732492, -0.0009373753564432263, -0.0009037721902132034, -0.0008701690239831805, -0.0008365659159608185, -0.0008029627497307956, -0.0007693595835007727, -0.0007357564172707498, -0.0007021532510407269, -0.000668550084810704, -0.000634946976788342, -0.0006013438105583191, -0.0005677405861206353, -0.0005341374198906124, -0.0005005342536605895, -0.00046693108743056655, -0.00043332792120054364, -0.00039972475497052073, -0.0003661216178443283, -0.0003325184516143054, -0.0002989153144881129, -0.00026531214825809, -0.0002317089820280671, -0.00019810583034995943, -0.00016450266411993653, -0.00013089949788991362, -9.729634621180594e-05, -6.369317998178303e-05, -3.0089999199844897e-05, 3.5131633921992034e-06, 3.7116325984243304e-05, 7.07194849383086e-05, 0.0001043226511683315, 0.0001379258173983544, 0.0001715289690764621, 0.000205132135306485, 0.0002387353015365079]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 8.0, 10.0, 11.0, 11.0, 18.0, 18.0, 18.0, 19.0, 26.0, 25.0, 32.0, 37.0, 36.0, 45.0, 36.0, 36.0, 34.0, 56.0, 44.0, 41.0, 38.0, 30.0, 45.0, 30.0, 29.0, 25.0, 29.0, 21.0, 23.0, 32.0, 23.0, 21.0, 12.0, 13.0, 10.0, 6.0, 8.0, 4.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.00018358230590820312, -0.00017814245074987411, -0.0001727025955915451, -0.0001672627404332161, -0.00016182288527488708, -0.00015638303011655807, -0.00015094317495822906, -0.00014550331979990005, -0.00014006346464157104, -0.00013462360948324203, -0.00012918375432491302, -0.00012374389916658401, -0.000118304044008255, -0.000112864188849926, -0.00010742433369159698, -0.00010198447853326797, -9.654462337493896e-05, -9.110476821660995e-05, -8.566491305828094e-05, -8.022505789995193e-05, -7.478520274162292e-05, -6.934534758329391e-05, -6.39054924249649e-05, -5.8465637266635895e-05, -5.3025782108306885e-05, -4.7585926949977875e-05, -4.2146071791648865e-05, -3.6706216633319855e-05, -3.1266361474990845e-05, -2.5826506316661835e-05, -2.0386651158332825e-05, -1.4946796000003815e-05, -9.506940841674805e-06, -4.067085683345795e-06, 1.3727694749832153e-06, 6.812624633312225e-06, 1.2252479791641235e-05, 1.7692334949970245e-05, 2.3132190108299255e-05, 2.8572045266628265e-05, 3.4011900424957275e-05, 3.9451755583286285e-05, 4.4891610741615295e-05, 5.0331465899944305e-05, 5.5771321058273315e-05, 6.121117621660233e-05, 6.665103137493134e-05, 7.209088653326035e-05, 7.753074169158936e-05, 8.297059684991837e-05, 8.841045200824738e-05, 9.385030716657639e-05, 9.92901623249054e-05, 0.0001047300174832344, 0.00011016987264156342, 0.00011560972779989243, 0.00012104958295822144, 0.00012648943811655045, 0.00013192929327487946, 0.00013736914843320847, 0.00014280900359153748, 0.00014824885874986649, 0.0001536887139081955, 0.0001591285690665245, 0.00016456842422485352]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 13.0, 10.0, 5.0, 11.0, 9.0, 13.0, 18.0, 9.0, 21.0, 19.0, 17.0, 21.0, 32.0, 25.0, 32.0, 23.0, 44.0, 28.0, 31.0, 41.0, 40.0, 36.0, 42.0, 38.0, 36.0, 36.0, 40.0, 41.0, 19.0, 34.0, 28.0, 24.0, 22.0, 17.0, 16.0, 17.0, 16.0, 8.0, 13.0, 11.0, 9.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.56640625, -4.43212890625, -4.2978515625, -4.16357421875, -4.029296875, -3.89501953125, -3.7607421875, -3.62646484375, -3.4921875, -3.35791015625, -3.2236328125, -3.08935546875, -2.955078125, -2.82080078125, -2.6865234375, -2.55224609375, -2.41796875, -2.28369140625, -2.1494140625, -2.01513671875, -1.880859375, -1.74658203125, -1.6123046875, -1.47802734375, -1.34375, -1.20947265625, -1.0751953125, -0.94091796875, -0.806640625, -0.67236328125, -0.5380859375, -0.40380859375, -0.26953125, -0.13525390625, -0.0009765625, 0.13330078125, 0.267578125, 0.40185546875, 0.5361328125, 0.67041015625, 0.8046875, 0.93896484375, 1.0732421875, 1.20751953125, 1.341796875, 1.47607421875, 1.6103515625, 1.74462890625, 1.87890625, 2.01318359375, 2.1474609375, 2.28173828125, 2.416015625, 2.55029296875, 2.6845703125, 2.81884765625, 2.953125, 3.08740234375, 3.2216796875, 3.35595703125, 3.490234375, 3.62451171875, 3.7587890625, 3.89306640625, 4.02734375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 21.0, 15.0, 32.0, 39.0, 51.0, 79.0, 145.0, 204.0, 270.0, 426.0, 576.0, 851.0, 1321.0, 1877.0, 2814.0, 4212.0, 6554.0, 10138.0, 15775.0, 25844.0, 41298.0, 69659.0, 119766.0, 189829.0, 205443.0, 139415.0, 81699.0, 48792.0, 29395.0, 18343.0, 11556.0, 7391.0, 4910.0, 3151.0, 2118.0, 1523.0, 971.0, 652.0, 437.0, 318.0, 222.0, 130.0, 104.0, 60.0, 39.0, 21.0, 19.0, 15.0, 12.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-5.125, -4.97039794921875, -4.8157958984375, -4.66119384765625, -4.506591796875, -4.35198974609375, -4.1973876953125, -4.04278564453125, -3.88818359375, -3.73358154296875, -3.5789794921875, -3.42437744140625, -3.269775390625, -3.11517333984375, -2.9605712890625, -2.80596923828125, -2.6513671875, -2.49676513671875, -2.3421630859375, -2.18756103515625, -2.032958984375, -1.87835693359375, -1.7237548828125, -1.56915283203125, -1.41455078125, -1.25994873046875, -1.1053466796875, -0.95074462890625, -0.796142578125, -0.64154052734375, -0.4869384765625, -0.33233642578125, -0.177734375, -0.02313232421875, 0.1314697265625, 0.28607177734375, 0.440673828125, 0.59527587890625, 0.7498779296875, 0.90447998046875, 1.05908203125, 1.21368408203125, 1.3682861328125, 1.52288818359375, 1.677490234375, 1.83209228515625, 1.9866943359375, 2.14129638671875, 2.2958984375, 2.45050048828125, 2.6051025390625, 2.75970458984375, 2.914306640625, 3.06890869140625, 3.2235107421875, 3.37811279296875, 3.53271484375, 3.68731689453125, 3.8419189453125, 3.99652099609375, 4.151123046875, 4.30572509765625, 4.4603271484375, 4.61492919921875, 4.76953125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 12.0, 1.0, 4.0, 9.0, 10.0, 7.0, 12.0, 7.0, 10.0, 15.0, 14.0, 24.0, 32.0, 31.0, 27.0, 34.0, 49.0, 48.0, 57.0, 70.0, 102.0, 139.0, 199.0, 1263.0, 193.0, 153.0, 104.0, 63.0, 54.0, 52.0, 41.0, 31.0, 28.0, 23.0, 19.0, 20.0, 11.0, 18.0, 10.0, 15.0, 8.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-12.296875, -11.9183349609375, -11.539794921875, -11.1612548828125, -10.78271484375, -10.4041748046875, -10.025634765625, -9.6470947265625, -9.2685546875, -8.8900146484375, -8.511474609375, -8.1329345703125, -7.75439453125, -7.3758544921875, -6.997314453125, -6.6187744140625, -6.240234375, -5.8616943359375, -5.483154296875, -5.1046142578125, -4.72607421875, -4.3475341796875, -3.968994140625, -3.5904541015625, -3.2119140625, -2.8333740234375, -2.454833984375, -2.0762939453125, -1.69775390625, -1.3192138671875, -0.940673828125, -0.5621337890625, -0.18359375, 0.1949462890625, 0.573486328125, 0.9520263671875, 1.33056640625, 1.7091064453125, 2.087646484375, 2.4661865234375, 2.8447265625, 3.2232666015625, 3.601806640625, 3.9803466796875, 4.35888671875, 4.7374267578125, 5.115966796875, 5.4945068359375, 5.873046875, 6.2515869140625, 6.630126953125, 7.0086669921875, 7.38720703125, 7.7657470703125, 8.144287109375, 8.5228271484375, 8.9013671875, 9.2799072265625, 9.658447265625, 10.0369873046875, 10.41552734375, 10.7940673828125, 11.172607421875, 11.5511474609375, 11.9296875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 12.0, 17.0, 19.0, 28.0, 33.0, 54.0, 78.0, 82.0, 126.0, 150.0, 228.0, 311.0, 450.0, 722.0, 1243.0, 2136.0, 4468.0, 10167.0, 27395.0, 94993.0, 506575.0, 1917699.0, 446380.0, 86990.0, 25913.0, 9643.0, 4216.0, 2175.0, 1150.0, 709.0, 440.0, 286.0, 215.0, 152.0, 110.0, 67.0, 61.0, 42.0, 36.0, 30.0, 15.0, 21.0, 16.0, 9.0, 5.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.65625, -11.2972412109375, -10.938232421875, -10.5792236328125, -10.22021484375, -9.8612060546875, -9.502197265625, -9.1431884765625, -8.7841796875, -8.4251708984375, -8.066162109375, -7.7071533203125, -7.34814453125, -6.9891357421875, -6.630126953125, -6.2711181640625, -5.912109375, -5.5531005859375, -5.194091796875, -4.8350830078125, -4.47607421875, -4.1170654296875, -3.758056640625, -3.3990478515625, -3.0400390625, -2.6810302734375, -2.322021484375, -1.9630126953125, -1.60400390625, -1.2449951171875, -0.885986328125, -0.5269775390625, -0.16796875, 0.1910400390625, 0.550048828125, 0.9090576171875, 1.26806640625, 1.6270751953125, 1.986083984375, 2.3450927734375, 2.7041015625, 3.0631103515625, 3.422119140625, 3.7811279296875, 4.14013671875, 4.4991455078125, 4.858154296875, 5.2171630859375, 5.576171875, 5.9351806640625, 6.294189453125, 6.6531982421875, 7.01220703125, 7.3712158203125, 7.730224609375, 8.0892333984375, 8.4482421875, 8.8072509765625, 9.166259765625, 9.5252685546875, 9.88427734375, 10.2432861328125, 10.602294921875, 10.9613037109375, 11.3203125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 13.0, 107.0, 491.0, 338.0, 49.0, 13.0, 3.0, 0.0, 0.0, 1.0], "bins": [-445.2985534667969, -437.456787109375, -429.6150207519531, -421.7732238769531, -413.93145751953125, -406.0896911621094, -398.2479248046875, -390.4061279296875, -382.5643615722656, -374.72259521484375, -366.8808288574219, -359.0390319824219, -351.197265625, -343.3554992675781, -335.51373291015625, -327.67193603515625, -319.8301696777344, -311.9884033203125, -304.1466369628906, -296.3048400878906, -288.46307373046875, -280.6213073730469, -272.779541015625, -264.937744140625, -257.0959777832031, -249.25421142578125, -241.4124298095703, -233.57066345214844, -225.7288818359375, -217.88711547851562, -210.0453338623047, -202.2035675048828, -194.36180114746094, -186.52003479003906, -178.67825317382812, -170.83648681640625, -162.9947052001953, -155.15293884277344, -147.3111572265625, -139.46939086914062, -131.6276092529297, -123.78583526611328, -115.94406127929688, -108.10228729248047, -100.26051330566406, -92.41874694824219, -84.57696533203125, -76.73519897460938, -68.89341735839844, -61.05164337158203, -53.209869384765625, -45.36809539794922, -37.52632141113281, -29.684551239013672, -21.842777252197266, -14.00100326538086, -6.159233093261719, 1.6825404167175293, 9.524313926696777, 17.366086959838867, 25.207860946655273, 33.04963302612305, 40.89140701293945, 48.73318099975586, 56.574954986572266]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 5.0, 13.0, 4.0, 6.0, 16.0, 11.0, 16.0, 12.0, 21.0, 24.0, 24.0, 27.0, 29.0, 18.0, 44.0, 31.0, 37.0, 29.0, 40.0, 34.0, 37.0, 37.0, 61.0, 38.0, 39.0, 47.0, 31.0, 38.0, 28.0, 30.0, 23.0, 23.0, 22.0, 21.0, 14.0, 9.0, 9.0, 13.0, 6.0, 7.0, 2.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.93986129760742, -31.80710792541504, -30.674354553222656, -29.54159927368164, -28.408845901489258, -27.276092529296875, -26.14333724975586, -25.010583877563477, -23.877830505371094, -22.74507713317871, -21.612323760986328, -20.479568481445312, -19.34681510925293, -18.214061737060547, -17.08130645751953, -15.948553085327148, -14.815799713134766, -13.683046340942383, -12.550292015075684, -11.417537689208984, -10.284784317016602, -9.152030944824219, -8.01927661895752, -6.8865227699279785, -5.7537689208984375, -4.6210150718688965, -3.4882612228393555, -2.3555073738098145, -1.2227535247802734, -0.08999967575073242, 1.0427541732788086, 2.1755080223083496, 3.308258056640625, 4.441011905670166, 5.573765754699707, 6.706519603729248, 7.839273452758789, 8.972026824951172, 10.104781150817871, 11.23753547668457, 12.370288848876953, 13.503042221069336, 14.635796546936035, 15.768550872802734, 16.901304244995117, 18.0340576171875, 19.166812896728516, 20.2995662689209, 21.43231964111328, 22.565073013305664, 23.697826385498047, 24.830581665039062, 25.963335037231445, 27.096088409423828, 28.228843688964844, 29.361597061157227, 30.49435043334961, 31.627103805541992, 32.759857177734375, 33.89261245727539, 35.025367736816406, 36.158119201660156, 37.29087448120117, 38.42362594604492, 39.55638122558594]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 4.0, 6.0, 8.0, 10.0, 12.0, 8.0, 8.0, 9.0, 20.0, 18.0, 18.0, 21.0, 19.0, 28.0, 23.0, 21.0, 33.0, 36.0, 34.0, 37.0, 30.0, 43.0, 43.0, 31.0, 26.0, 33.0, 47.0, 30.0, 35.0, 22.0, 37.0, 21.0, 26.0, 26.0, 19.0, 27.0, 19.0, 17.0, 15.0, 8.0, 7.0, 6.0, 14.0, 7.0, 7.0, 6.0, 3.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.6640625, -4.52679443359375, -4.3895263671875, -4.25225830078125, -4.114990234375, -3.97772216796875, -3.8404541015625, -3.70318603515625, -3.56591796875, -3.42864990234375, -3.2913818359375, -3.15411376953125, -3.016845703125, -2.87957763671875, -2.7423095703125, -2.60504150390625, -2.4677734375, -2.33050537109375, -2.1932373046875, -2.05596923828125, -1.918701171875, -1.78143310546875, -1.6441650390625, -1.50689697265625, -1.36962890625, -1.23236083984375, -1.0950927734375, -0.95782470703125, -0.820556640625, -0.68328857421875, -0.5460205078125, -0.40875244140625, -0.271484375, -0.13421630859375, 0.0030517578125, 0.14031982421875, 0.277587890625, 0.41485595703125, 0.5521240234375, 0.68939208984375, 0.82666015625, 0.96392822265625, 1.1011962890625, 1.23846435546875, 1.375732421875, 1.51300048828125, 1.6502685546875, 1.78753662109375, 1.9248046875, 2.06207275390625, 2.1993408203125, 2.33660888671875, 2.473876953125, 2.61114501953125, 2.7484130859375, 2.88568115234375, 3.02294921875, 3.16021728515625, 3.2974853515625, 3.43475341796875, 3.572021484375, 3.70928955078125, 3.8465576171875, 3.98382568359375, 4.12109375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 10.0, 11.0, 8.0, 14.0, 19.0, 28.0, 44.0, 54.0, 72.0, 119.0, 147.0, 203.0, 270.0, 423.0, 576.0, 818.0, 1190.0, 1882.0, 2849.0, 4956.0, 8802.0, 18863.0, 50128.0, 185571.0, 855820.0, 2080893.0, 734155.0, 162894.0, 44920.0, 17290.0, 8303.0, 4652.0, 2832.0, 1705.0, 1173.0, 787.0, 521.0, 376.0, 255.0, 185.0, 148.0, 100.0, 60.0, 52.0, 27.0, 24.0, 9.0, 18.0, 9.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.703125, -7.45819091796875, -7.2132568359375, -6.96832275390625, -6.723388671875, -6.47845458984375, -6.2335205078125, -5.98858642578125, -5.74365234375, -5.49871826171875, -5.2537841796875, -5.00885009765625, -4.763916015625, -4.51898193359375, -4.2740478515625, -4.02911376953125, -3.7841796875, -3.53924560546875, -3.2943115234375, -3.04937744140625, -2.804443359375, -2.55950927734375, -2.3145751953125, -2.06964111328125, -1.82470703125, -1.57977294921875, -1.3348388671875, -1.08990478515625, -0.844970703125, -0.60003662109375, -0.3551025390625, -0.11016845703125, 0.134765625, 0.37969970703125, 0.6246337890625, 0.86956787109375, 1.114501953125, 1.35943603515625, 1.6043701171875, 1.84930419921875, 2.09423828125, 2.33917236328125, 2.5841064453125, 2.82904052734375, 3.073974609375, 3.31890869140625, 3.5638427734375, 3.80877685546875, 4.0537109375, 4.29864501953125, 4.5435791015625, 4.78851318359375, 5.033447265625, 5.27838134765625, 5.5233154296875, 5.76824951171875, 6.01318359375, 6.25811767578125, 6.5030517578125, 6.74798583984375, 6.992919921875, 7.23785400390625, 7.4827880859375, 7.72772216796875, 7.97265625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 14.0, 7.0, 11.0, 15.0, 18.0, 32.0, 54.0, 59.0, 74.0, 107.0, 179.0, 252.0, 393.0, 505.0, 682.0, 554.0, 379.0, 251.0, 127.0, 102.0, 65.0, 52.0, 31.0, 28.0, 16.0, 17.0, 10.0, 8.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8125, -9.5098876953125, -9.207275390625, -8.9046630859375, -8.60205078125, -8.2994384765625, -7.996826171875, -7.6942138671875, -7.3916015625, -7.0889892578125, -6.786376953125, -6.4837646484375, -6.18115234375, -5.8785400390625, -5.575927734375, -5.2733154296875, -4.970703125, -4.6680908203125, -4.365478515625, -4.0628662109375, -3.76025390625, -3.4576416015625, -3.155029296875, -2.8524169921875, -2.5498046875, -2.2471923828125, -1.944580078125, -1.6419677734375, -1.33935546875, -1.0367431640625, -0.734130859375, -0.4315185546875, -0.12890625, 0.1737060546875, 0.476318359375, 0.7789306640625, 1.08154296875, 1.3841552734375, 1.686767578125, 1.9893798828125, 2.2919921875, 2.5946044921875, 2.897216796875, 3.1998291015625, 3.50244140625, 3.8050537109375, 4.107666015625, 4.4102783203125, 4.712890625, 5.0155029296875, 5.318115234375, 5.6207275390625, 5.92333984375, 6.2259521484375, 6.528564453125, 6.8311767578125, 7.1337890625, 7.4364013671875, 7.739013671875, 8.0416259765625, 8.34423828125, 8.6468505859375, 8.949462890625, 9.2520751953125, 9.5546875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 16.0, 30.0, 47.0, 75.0, 117.0, 188.0, 327.0, 628.0, 1079.0, 2504.0, 6608.0, 23828.0, 167610.0, 2979044.0, 928226.0, 62954.0, 13081.0, 4184.0, 1781.0, 861.0, 442.0, 267.0, 135.0, 91.0, 48.0, 37.0, 26.0, 10.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.96875, -20.3291015625, -19.689453125, -19.0498046875, -18.41015625, -17.7705078125, -17.130859375, -16.4912109375, -15.8515625, -15.2119140625, -14.572265625, -13.9326171875, -13.29296875, -12.6533203125, -12.013671875, -11.3740234375, -10.734375, -10.0947265625, -9.455078125, -8.8154296875, -8.17578125, -7.5361328125, -6.896484375, -6.2568359375, -5.6171875, -4.9775390625, -4.337890625, -3.6982421875, -3.05859375, -2.4189453125, -1.779296875, -1.1396484375, -0.5, 0.1396484375, 0.779296875, 1.4189453125, 2.05859375, 2.6982421875, 3.337890625, 3.9775390625, 4.6171875, 5.2568359375, 5.896484375, 6.5361328125, 7.17578125, 7.8154296875, 8.455078125, 9.0947265625, 9.734375, 10.3740234375, 11.013671875, 11.6533203125, 12.29296875, 12.9326171875, 13.572265625, 14.2119140625, 14.8515625, 15.4912109375, 16.130859375, 16.7705078125, 17.41015625, 18.0498046875, 18.689453125, 19.3291015625, 19.96875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [3.0, 16.0, 60.0, 348.0, 424.0, 137.0, 23.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.02175521850586, -17.56312370300293, -12.104493141174316, -6.645862579345703, -1.1872310638427734, 4.271400451660156, 9.730030059814453, 15.188663482666016, 20.647293090820312, 26.105924606323242, 31.564556121826172, 37.02318572998047, 42.48181915283203, 47.94044876098633, 53.399078369140625, 58.85771179199219, 64.31634521484375, 69.77497863769531, 75.23360443115234, 80.6922378540039, 86.15087127685547, 91.6094970703125, 97.06813049316406, 102.52676391601562, 107.98538970947266, 113.44402313232422, 118.90264892578125, 124.36128234863281, 129.81991577148438, 135.27854919433594, 140.7371826171875, 146.19580078125, 151.65443420410156, 157.11306762695312, 162.5717010498047, 168.03033447265625, 173.48895263671875, 178.9475860595703, 184.40621948242188, 189.86485290527344, 195.323486328125, 200.78211975097656, 206.24075317382812, 211.69937133789062, 217.1580047607422, 222.61663818359375, 228.0752716064453, 233.53390502929688, 238.99252319335938, 244.45115661621094, 249.9097900390625, 255.368408203125, 260.8270568847656, 266.2856750488281, 271.74432373046875, 277.20294189453125, 282.6615905761719, 288.1202087402344, 293.578857421875, 299.0374755859375, 304.4961242675781, 309.9547424316406, 315.41339111328125, 320.87200927734375, 326.33062744140625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 3.0, 7.0, 6.0, 7.0, 8.0, 9.0, 11.0, 20.0, 21.0, 20.0, 24.0, 28.0, 22.0, 27.0, 28.0, 38.0, 35.0, 43.0, 37.0, 49.0, 54.0, 38.0, 46.0, 44.0, 40.0, 35.0, 30.0, 36.0, 33.0, 25.0, 28.0, 28.0, 16.0, 11.0, 16.0, 10.0, 13.0, 8.0, 9.0, 7.0, 7.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.29015350341797, -26.372365951538086, -25.454578399658203, -24.536788940429688, -23.619001388549805, -22.701213836669922, -21.78342628479004, -20.865638732910156, -19.94784927368164, -19.030061721801758, -18.112274169921875, -17.19448471069336, -16.276697158813477, -15.358909606933594, -14.441122055053711, -13.523334503173828, -12.605546951293945, -11.687759399414062, -10.769970893859863, -9.85218334197998, -8.934394836425781, -8.016607284545898, -7.098819732666016, -6.181031703948975, -5.263243675231934, -4.345455646514893, -3.4276678562164307, -2.5098800659179688, -1.5920920372009277, -0.6743040084838867, 0.2434835433959961, 1.161271572113037, 2.079059600830078, 2.996847629547119, 3.914635419845581, 4.832423210144043, 5.750211238861084, 6.667999267578125, 7.585786819458008, 8.50357437133789, 9.42136287689209, 10.339150428771973, 11.256938934326172, 12.174726486206055, 13.092514038085938, 14.010302543640137, 14.92809009552002, 15.845878601074219, 16.7636661529541, 17.681453704833984, 18.599241256713867, 19.51702880859375, 20.434818267822266, 21.35260581970215, 22.27039337158203, 23.188180923461914, 24.105968475341797, 25.02375602722168, 25.941543579101562, 26.859333038330078, 27.77712059020996, 28.694908142089844, 29.612695693969727, 30.53048324584961, 31.448272705078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 6.0, 9.0, 12.0, 21.0, 17.0, 23.0, 20.0, 35.0, 23.0, 30.0, 35.0, 35.0, 29.0, 41.0, 33.0, 41.0, 33.0, 51.0, 39.0, 37.0, 33.0, 38.0, 37.0, 36.0, 30.0, 26.0, 27.0, 32.0, 32.0, 21.0, 18.0, 16.0, 10.0, 10.0, 6.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.400146484375, -5.23779296875, -5.075439453125, -4.9130859375, -4.750732421875, -4.58837890625, -4.426025390625, -4.263671875, -4.101318359375, -3.93896484375, -3.776611328125, -3.6142578125, -3.451904296875, -3.28955078125, -3.127197265625, -2.96484375, -2.802490234375, -2.64013671875, -2.477783203125, -2.3154296875, -2.153076171875, -1.99072265625, -1.828369140625, -1.666015625, -1.503662109375, -1.34130859375, -1.178955078125, -1.0166015625, -0.854248046875, -0.69189453125, -0.529541015625, -0.3671875, -0.204833984375, -0.04248046875, 0.119873046875, 0.2822265625, 0.444580078125, 0.60693359375, 0.769287109375, 0.931640625, 1.093994140625, 1.25634765625, 1.418701171875, 1.5810546875, 1.743408203125, 1.90576171875, 2.068115234375, 2.23046875, 2.392822265625, 2.55517578125, 2.717529296875, 2.8798828125, 3.042236328125, 3.20458984375, 3.366943359375, 3.529296875, 3.691650390625, 3.85400390625, 4.016357421875, 4.1787109375, 4.341064453125, 4.50341796875, 4.665771484375, 4.828125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 5.0, 5.0, 10.0, 20.0, 23.0, 47.0, 47.0, 66.0, 110.0, 146.0, 198.0, 281.0, 455.0, 673.0, 932.0, 1283.0, 1884.0, 2638.0, 3964.0, 5737.0, 8309.0, 11807.0, 17408.0, 25686.0, 38718.0, 59696.0, 94983.0, 161028.0, 221048.0, 142178.0, 85234.0, 53966.0, 35153.0, 23267.0, 15762.0, 11014.0, 7736.0, 5168.0, 3605.0, 2540.0, 1689.0, 1268.0, 871.0, 612.0, 404.0, 260.0, 184.0, 144.0, 99.0, 62.0, 49.0, 34.0, 17.0, 16.0, 14.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.140380859375, -0.1359081268310547, -0.13143539428710938, -0.12696266174316406, -0.12248992919921875, -0.11801719665527344, -0.11354446411132812, -0.10907173156738281, -0.1045989990234375, -0.10012626647949219, -0.09565353393554688, -0.09118080139160156, -0.08670806884765625, -0.08223533630371094, -0.07776260375976562, -0.07328987121582031, -0.068817138671875, -0.06434440612792969, -0.059871673583984375, -0.05539894104003906, -0.05092620849609375, -0.04645347595214844, -0.041980743408203125, -0.03750801086425781, -0.0330352783203125, -0.028562545776367188, -0.024089813232421875, -0.019617080688476562, -0.01514434814453125, -0.010671615600585938, -0.006198883056640625, -0.0017261505126953125, 0.00274658203125, 0.0072193145751953125, 0.011692047119140625, 0.016164779663085938, 0.02063751220703125, 0.025110244750976562, 0.029582977294921875, 0.03405570983886719, 0.0385284423828125, 0.04300117492675781, 0.047473907470703125, 0.05194664001464844, 0.05641937255859375, 0.06089210510253906, 0.06536483764648438, 0.06983757019042969, 0.074310302734375, 0.07878303527832031, 0.08325576782226562, 0.08772850036621094, 0.09220123291015625, 0.09667396545410156, 0.10114669799804688, 0.10561943054199219, 0.1100921630859375, 0.11456489562988281, 0.11903762817382812, 0.12351036071777344, 0.12798309326171875, 0.13245582580566406, 0.13692855834960938, 0.1414012908935547, 0.1458740234375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 9.0, 9.0, 8.0, 23.0, 7.0, 27.0, 21.0, 18.0, 19.0, 24.0, 36.0, 29.0, 22.0, 49.0, 25.0, 40.0, 35.0, 34.0, 1070.0, 56.0, 37.0, 42.0, 49.0, 36.0, 23.0, 35.0, 38.0, 33.0, 17.0, 25.0, 12.0, 17.0, 9.0, 13.0, 13.0, 6.0, 8.0, 11.0, 3.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0], "bins": [-4.46875, -4.33966064453125, -4.2105712890625, -4.08148193359375, -3.952392578125, -3.82330322265625, -3.6942138671875, -3.56512451171875, -3.43603515625, -3.30694580078125, -3.1778564453125, -3.04876708984375, -2.919677734375, -2.79058837890625, -2.6614990234375, -2.53240966796875, -2.4033203125, -2.27423095703125, -2.1451416015625, -2.01605224609375, -1.886962890625, -1.75787353515625, -1.6287841796875, -1.49969482421875, -1.37060546875, -1.24151611328125, -1.1124267578125, -0.98333740234375, -0.854248046875, -0.72515869140625, -0.5960693359375, -0.46697998046875, -0.337890625, -0.20880126953125, -0.0797119140625, 0.04937744140625, 0.178466796875, 0.30755615234375, 0.4366455078125, 0.56573486328125, 0.69482421875, 0.82391357421875, 0.9530029296875, 1.08209228515625, 1.211181640625, 1.34027099609375, 1.4693603515625, 1.59844970703125, 1.7275390625, 1.85662841796875, 1.9857177734375, 2.11480712890625, 2.243896484375, 2.37298583984375, 2.5020751953125, 2.63116455078125, 2.76025390625, 2.88934326171875, 3.0184326171875, 3.14752197265625, 3.276611328125, 3.40570068359375, 3.5347900390625, 3.66387939453125, 3.79296875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 10.0, 11.0, 22.0, 31.0, 23.0, 55.0, 77.0, 101.0, 153.0, 176.0, 282.0, 394.0, 523.0, 805.0, 1070.0, 1625.0, 2154.0, 3116.0, 4411.0, 6118.0, 8910.0, 12948.0, 19168.0, 28479.0, 44137.0, 71601.0, 123191.0, 1200283.0, 256551.0, 115251.0, 67271.0, 41893.0, 27159.0, 17954.0, 12331.0, 8596.0, 5958.0, 4213.0, 2830.0, 2080.0, 1478.0, 1073.0, 709.0, 572.0, 399.0, 287.0, 199.0, 141.0, 104.0, 64.0, 44.0, 36.0, 27.0, 19.0, 11.0, 6.0, 5.0, 2.0, 5.0], "bins": [-0.07073974609375, -0.06859207153320312, -0.06644439697265625, -0.06429672241210938, -0.0621490478515625, -0.060001373291015625, -0.05785369873046875, -0.055706024169921875, -0.053558349609375, -0.051410675048828125, -0.04926300048828125, -0.047115325927734375, -0.0449676513671875, -0.042819976806640625, -0.04067230224609375, -0.038524627685546875, -0.036376953125, -0.034229278564453125, -0.03208160400390625, -0.029933929443359375, -0.0277862548828125, -0.025638580322265625, -0.02349090576171875, -0.021343231201171875, -0.019195556640625, -0.017047882080078125, -0.01490020751953125, -0.012752532958984375, -0.0106048583984375, -0.008457183837890625, -0.00630950927734375, -0.004161834716796875, -0.00201416015625, 0.000133514404296875, 0.00228118896484375, 0.004428863525390625, 0.0065765380859375, 0.008724212646484375, 0.01087188720703125, 0.013019561767578125, 0.015167236328125, 0.017314910888671875, 0.01946258544921875, 0.021610260009765625, 0.0237579345703125, 0.025905609130859375, 0.02805328369140625, 0.030200958251953125, 0.0323486328125, 0.034496307373046875, 0.03664398193359375, 0.038791656494140625, 0.0409393310546875, 0.043087005615234375, 0.04523468017578125, 0.047382354736328125, 0.049530029296875, 0.051677703857421875, 0.05382537841796875, 0.055973052978515625, 0.0581207275390625, 0.060268402099609375, 0.06241607666015625, 0.06456375122070312, 0.06671142578125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 8.0, 6.0, 7.0, 12.0, 9.0, 18.0, 21.0, 46.0, 67.0, 92.0, 149.0, 169.0, 109.0, 84.0, 47.0, 32.0, 22.0, 10.0, 15.0, 12.0, 5.0, 5.0, 6.0, 5.0, 10.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007557868957519531, -0.0007337108254432678, -0.0007116347551345825, -0.0006895586848258972, -0.0006674826145172119, -0.0006454065442085266, -0.0006233304738998413, -0.000601254403591156, -0.0005791783332824707, -0.0005571022629737854, -0.0005350261926651001, -0.0005129501223564148, -0.0004908740520477295, -0.0004687979817390442, -0.0004467219114303589, -0.0004246458411216736, -0.0004025697708129883, -0.000380493700504303, -0.0003584176301956177, -0.0003363415598869324, -0.00031426548957824707, -0.00029218941926956177, -0.00027011334896087646, -0.00024803727865219116, -0.00022596120834350586, -0.00020388513803482056, -0.00018180906772613525, -0.00015973299741744995, -0.00013765692710876465, -0.00011558085680007935, -9.350478649139404e-05, -7.142871618270874e-05, -4.935264587402344e-05, -2.7276575565338135e-05, -5.200505256652832e-06, 1.687556505203247e-05, 3.8951635360717773e-05, 6.1027705669403076e-05, 8.310377597808838e-05, 0.00010517984628677368, 0.00012725591659545898, 0.0001493319869041443, 0.0001714080572128296, 0.0001934841275215149, 0.0002155601978302002, 0.0002376362681388855, 0.0002597123384475708, 0.0002817884087562561, 0.0003038644790649414, 0.0003259405493736267, 0.000348016619682312, 0.0003700926899909973, 0.0003921687602996826, 0.0004142448306083679, 0.0004363209009170532, 0.0004583969712257385, 0.00048047304153442383, 0.0005025491118431091, 0.0005246251821517944, 0.0005467012524604797, 0.000568777322769165, 0.0005908533930778503, 0.0006129294633865356, 0.000635005533695221, 0.0006570816040039062]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 5.0, 2.0, 10.0, 2.0, 7.0, 7.0, 6.0, 11.0, 19.0, 17.0, 37.0, 75.0, 113.0, 304.0, 1730.0, 985389.0, 59750.0, 592.0, 209.0, 111.0, 47.0, 27.0, 16.0, 16.0, 7.0, 4.0, 9.0, 6.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01580810546875, -0.015277624130249023, -0.014747142791748047, -0.01421666145324707, -0.013686180114746094, -0.013155698776245117, -0.01262521743774414, -0.012094736099243164, -0.011564254760742188, -0.011033773422241211, -0.010503292083740234, -0.009972810745239258, -0.009442329406738281, -0.008911848068237305, -0.008381366729736328, -0.007850885391235352, -0.007320404052734375, -0.0067899227142333984, -0.006259441375732422, -0.005728960037231445, -0.005198478698730469, -0.004667997360229492, -0.004137516021728516, -0.003607034683227539, -0.0030765533447265625, -0.002546072006225586, -0.0020155906677246094, -0.0014851093292236328, -0.0009546279907226562, -0.0004241466522216797, 0.00010633468627929688, 0.0006368160247802734, 0.00116729736328125, 0.0016977787017822266, 0.002228260040283203, 0.0027587413787841797, 0.0032892227172851562, 0.003819704055786133, 0.004350185394287109, 0.004880666732788086, 0.0054111480712890625, 0.005941629409790039, 0.006472110748291016, 0.007002592086791992, 0.007533073425292969, 0.008063554763793945, 0.008594036102294922, 0.009124517440795898, 0.009654998779296875, 0.010185480117797852, 0.010715961456298828, 0.011246442794799805, 0.011776924133300781, 0.012307405471801758, 0.012837886810302734, 0.013368368148803711, 0.013898849487304688, 0.014429330825805664, 0.01495981216430664, 0.015490293502807617, 0.016020774841308594, 0.01655125617980957, 0.017081737518310547, 0.017612218856811523, 0.0181427001953125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 42.0, 599.0, 341.0, 28.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016375152627006173, -0.0015273196622729301, -0.001417124061845243, -0.0013069284614175558, -0.0011967328609898686, -0.0010865372605621815, -0.0009763416019268334, -0.0008661460014991462, -0.0007559504010714591, -0.0006457548006437719, -0.0005355592002160847, -0.0004253635706845671, -0.0003151679702568799, -0.0002049723407253623, -9.477674029767513e-05, 1.5418860130012035e-05, 0.0001256144605576992, 0.00023581006098538637, 0.00034600566141307354, 0.00045620129094459116, 0.0005663968622684479, 0.000676592520903796, 0.0007867881213314831, 0.0008969837217591703, 0.0010071792639791965, 0.0011173748644068837, 0.0012275704648345709, 0.001337766065262258, 0.0014479616656899452, 0.0015581573825329542, 0.0016683528665453196, 0.0017785485833883286, 0.0018887443002313375, 0.0019989400170743465, 0.002109135501086712, 0.002219331217929721, 0.0023295267019420862, 0.002439722418785095, 0.0025499179027974606, 0.0026601136196404696, 0.002770309103652835, 0.002880504820495844, 0.0029907003045082092, 0.0031008960213512182, 0.0032110915053635836, 0.0033212872222065926, 0.003431482706218958, 0.003541678423061967, 0.003651874139904976, 0.003762069856747985, 0.0038722653407603502, 0.003982461057603359, 0.0040926565416157246, 0.00420285202562809, 0.0043130479753017426, 0.004423243459314108, 0.004533438943326473, 0.004643634427338839, 0.004753830377012491, 0.004864025861024857, 0.004974221345037222, 0.005084416829049587, 0.00519461277872324, 0.005304808262735605, 0.005415003746747971]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 8.0, 10.0, 11.0, 15.0, 10.0, 17.0, 27.0, 32.0, 30.0, 49.0, 36.0, 47.0, 41.0, 45.0, 56.0, 51.0, 53.0, 55.0, 47.0, 41.0, 45.0, 41.0, 46.0, 42.0, 32.0, 20.0, 21.0, 20.0, 14.0, 8.0, 10.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002808570861816406, -0.0002685869112610817, -0.00025631673634052277, -0.00024404656141996384, -0.0002317763864994049, -0.00021950621157884598, -0.00020723603665828705, -0.00019496586173772812, -0.0001826956868171692, -0.00017042551189661026, -0.00015815533697605133, -0.0001458851620554924, -0.00013361498713493347, -0.00012134481221437454, -0.00010907463729381561, -9.680446237325668e-05, -8.453428745269775e-05, -7.226411253213882e-05, -5.9993937611579895e-05, -4.7723762691020966e-05, -3.5453587770462036e-05, -2.3183412849903107e-05, -1.0913237929344177e-05, 1.3569369912147522e-06, 1.3627111911773682e-05, 2.589728683233261e-05, 3.816746175289154e-05, 5.043763667345047e-05, 6.27078115940094e-05, 7.497798651456833e-05, 8.724816143512726e-05, 9.951833635568619e-05, 0.00011178851127624512, 0.00012405868619680405, 0.00013632886111736298, 0.0001485990360379219, 0.00016086921095848083, 0.00017313938587903976, 0.0001854095607995987, 0.00019767973572015762, 0.00020994991064071655, 0.00022222008556127548, 0.0002344902604818344, 0.00024676043540239334, 0.00025903061032295227, 0.0002713007852435112, 0.00028357096016407013, 0.00029584113508462906, 0.000308111310005188, 0.0003203814849257469, 0.00033265165984630585, 0.0003449218347668648, 0.0003571920096874237, 0.00036946218460798264, 0.00038173235952854156, 0.0003940025344491005, 0.0004062727093696594, 0.00041854288429021835, 0.0004308130592107773, 0.0004430832341313362, 0.00045535340905189514, 0.00046762358397245407, 0.000479893758893013, 0.0004921639338135719, 0.0005044341087341309]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 6.0, 9.0, 12.0, 21.0, 17.0, 23.0, 20.0, 35.0, 23.0, 30.0, 35.0, 35.0, 29.0, 41.0, 33.0, 41.0, 33.0, 51.0, 39.0, 37.0, 33.0, 38.0, 37.0, 36.0, 30.0, 26.0, 27.0, 32.0, 32.0, 21.0, 18.0, 16.0, 10.0, 10.0, 6.0, 12.0, 3.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5625, -5.400146484375, -5.23779296875, -5.075439453125, -4.9130859375, -4.750732421875, -4.58837890625, -4.426025390625, -4.263671875, -4.101318359375, -3.93896484375, -3.776611328125, -3.6142578125, -3.451904296875, -3.28955078125, -3.127197265625, -2.96484375, -2.802490234375, -2.64013671875, -2.477783203125, -2.3154296875, -2.153076171875, -1.99072265625, -1.828369140625, -1.666015625, -1.503662109375, -1.34130859375, -1.178955078125, -1.0166015625, -0.854248046875, -0.69189453125, -0.529541015625, -0.3671875, -0.204833984375, -0.04248046875, 0.119873046875, 0.2822265625, 0.444580078125, 0.60693359375, 0.769287109375, 0.931640625, 1.093994140625, 1.25634765625, 1.418701171875, 1.5810546875, 1.743408203125, 1.90576171875, 2.068115234375, 2.23046875, 2.392822265625, 2.55517578125, 2.717529296875, 2.8798828125, 3.042236328125, 3.20458984375, 3.366943359375, 3.529296875, 3.691650390625, 3.85400390625, 4.016357421875, 4.1787109375, 4.341064453125, 4.50341796875, 4.665771484375, 4.828125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 26.0, 23.0, 36.0, 69.0, 78.0, 132.0, 223.0, 320.0, 450.0, 709.0, 997.0, 1588.0, 2590.0, 3951.0, 6320.0, 10119.0, 15997.0, 24858.0, 40777.0, 71067.0, 142353.0, 288369.0, 204338.0, 96239.0, 52505.0, 31271.0, 19390.0, 12306.0, 7859.0, 4909.0, 3117.0, 1961.0, 1223.0, 844.0, 515.0, 335.0, 189.0, 145.0, 110.0, 67.0, 56.0, 34.0, 24.0, 12.0, 15.0, 9.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75286865234375, -5.5526123046875, -5.35235595703125, -5.152099609375, -4.95184326171875, -4.7515869140625, -4.55133056640625, -4.35107421875, -4.15081787109375, -3.9505615234375, -3.75030517578125, -3.550048828125, -3.34979248046875, -3.1495361328125, -2.94927978515625, -2.7490234375, -2.54876708984375, -2.3485107421875, -2.14825439453125, -1.947998046875, -1.74774169921875, -1.5474853515625, -1.34722900390625, -1.14697265625, -0.94671630859375, -0.7464599609375, -0.54620361328125, -0.345947265625, -0.14569091796875, 0.0545654296875, 0.25482177734375, 0.455078125, 0.65533447265625, 0.8555908203125, 1.05584716796875, 1.256103515625, 1.45635986328125, 1.6566162109375, 1.85687255859375, 2.05712890625, 2.25738525390625, 2.4576416015625, 2.65789794921875, 2.858154296875, 3.05841064453125, 3.2586669921875, 3.45892333984375, 3.6591796875, 3.85943603515625, 4.0596923828125, 4.25994873046875, 4.460205078125, 4.66046142578125, 4.8607177734375, 5.06097412109375, 5.26123046875, 5.46148681640625, 5.6617431640625, 5.86199951171875, 6.062255859375, 6.26251220703125, 6.4627685546875, 6.66302490234375, 6.86328125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 15.0, 10.0, 20.0, 11.0, 27.0, 35.0, 37.0, 30.0, 39.0, 45.0, 34.0, 60.0, 78.0, 112.0, 168.0, 231.0, 1293.0, 186.0, 121.0, 76.0, 68.0, 48.0, 47.0, 45.0, 28.0, 38.0, 28.0, 22.0, 19.0, 16.0, 17.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.546875, -17.073974609375, -16.60107421875, -16.128173828125, -15.6552734375, -15.182373046875, -14.70947265625, -14.236572265625, -13.763671875, -13.290771484375, -12.81787109375, -12.344970703125, -11.8720703125, -11.399169921875, -10.92626953125, -10.453369140625, -9.98046875, -9.507568359375, -9.03466796875, -8.561767578125, -8.0888671875, -7.615966796875, -7.14306640625, -6.670166015625, -6.197265625, -5.724365234375, -5.25146484375, -4.778564453125, -4.3056640625, -3.832763671875, -3.35986328125, -2.886962890625, -2.4140625, -1.941162109375, -1.46826171875, -0.995361328125, -0.5224609375, -0.049560546875, 0.42333984375, 0.896240234375, 1.369140625, 1.842041015625, 2.31494140625, 2.787841796875, 3.2607421875, 3.733642578125, 4.20654296875, 4.679443359375, 5.15234375, 5.625244140625, 6.09814453125, 6.571044921875, 7.0439453125, 7.516845703125, 7.98974609375, 8.462646484375, 8.935546875, 9.408447265625, 9.88134765625, 10.354248046875, 10.8271484375, 11.300048828125, 11.77294921875, 12.245849609375, 12.71875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 7.0, 6.0, 3.0, 10.0, 10.0, 18.0, 22.0, 31.0, 54.0, 66.0, 110.0, 163.0, 223.0, 329.0, 462.0, 663.0, 1015.0, 1803.0, 3364.0, 7640.0, 22644.0, 92216.0, 897734.0, 1914844.0, 150484.0, 31920.0, 9869.0, 4151.0, 2104.0, 1292.0, 759.0, 518.0, 341.0, 244.0, 168.0, 126.0, 76.0, 70.0, 39.0, 28.0, 25.0, 16.0, 17.0, 9.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.136474609375, -15.60107421875, -15.065673828125, -14.5302734375, -13.994873046875, -13.45947265625, -12.924072265625, -12.388671875, -11.853271484375, -11.31787109375, -10.782470703125, -10.2470703125, -9.711669921875, -9.17626953125, -8.640869140625, -8.10546875, -7.570068359375, -7.03466796875, -6.499267578125, -5.9638671875, -5.428466796875, -4.89306640625, -4.357666015625, -3.822265625, -3.286865234375, -2.75146484375, -2.216064453125, -1.6806640625, -1.145263671875, -0.60986328125, -0.074462890625, 0.4609375, 0.996337890625, 1.53173828125, 2.067138671875, 2.6025390625, 3.137939453125, 3.67333984375, 4.208740234375, 4.744140625, 5.279541015625, 5.81494140625, 6.350341796875, 6.8857421875, 7.421142578125, 7.95654296875, 8.491943359375, 9.02734375, 9.562744140625, 10.09814453125, 10.633544921875, 11.1689453125, 11.704345703125, 12.23974609375, 12.775146484375, 13.310546875, 13.845947265625, 14.38134765625, 14.916748046875, 15.4521484375, 15.987548828125, 16.52294921875, 17.058349609375, 17.59375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 29.0, 46.0, 177.0, 383.0, 245.0, 86.0, 20.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.758544921875, -214.1777801513672, -207.59701538085938, -201.01625061035156, -194.43548583984375, -187.854736328125, -181.2739715576172, -174.69320678710938, -168.11244201660156, -161.53167724609375, -154.95091247558594, -148.37014770507812, -141.78939819335938, -135.2086181640625, -128.62786865234375, -122.04710388183594, -115.46633911132812, -108.88557434082031, -102.3048095703125, -95.72405242919922, -89.1432876586914, -82.5625228881836, -75.98176574707031, -69.4010009765625, -62.82023620605469, -56.239471435546875, -49.65871047973633, -43.07794952392578, -36.49718475341797, -29.916419982910156, -23.33565902709961, -16.754898071289062, -10.174118041992188, -3.593355178833008, 2.987407684326172, 9.568170547485352, 16.14893341064453, 22.729698181152344, 29.31045913696289, 35.89122009277344, 42.47198486328125, 49.05274963378906, 55.63351058959961, 62.214271545410156, 68.79503631591797, 75.37580108642578, 81.95655822753906, 88.53732299804688, 95.11808776855469, 101.6988525390625, 108.27961730957031, 114.8603744506836, 121.4411392211914, 128.02191162109375, 134.6026611328125, 141.1834259033203, 147.76419067382812, 154.34495544433594, 160.92572021484375, 167.50648498535156, 174.08724975585938, 180.66799926757812, 187.24876403808594, 193.82952880859375, 200.41029357910156]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 8.0, 6.0, 4.0, 12.0, 20.0, 10.0, 14.0, 25.0, 24.0, 15.0, 29.0, 29.0, 20.0, 36.0, 38.0, 26.0, 50.0, 48.0, 43.0, 37.0, 23.0, 35.0, 38.0, 39.0, 34.0, 30.0, 29.0, 45.0, 32.0, 18.0, 37.0, 29.0, 25.0, 14.0, 18.0, 15.0, 8.0, 9.0, 5.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.59511947631836, -36.26951599121094, -34.943912506103516, -33.618309020996094, -32.29270935058594, -30.967103958129883, -29.641502380371094, -28.315898895263672, -26.99029541015625, -25.664691925048828, -24.339088439941406, -23.013486862182617, -21.687883377075195, -20.362279891967773, -19.036678314208984, -17.711074829101562, -16.38547134399414, -15.059867858886719, -13.734265327453613, -12.408662796020508, -11.083059310913086, -9.757455825805664, -8.431853294372559, -7.106250762939453, -5.780647277832031, -4.455044269561768, -3.129441261291504, -1.8038382530212402, -0.47823524475097656, 0.8473677635192871, 2.172970771789551, 3.4985733032226562, 4.8241729736328125, 6.149775981903076, 7.47537899017334, 8.800981521606445, 10.126585006713867, 11.452188491821289, 12.777791023254395, 14.1033935546875, 15.428997039794922, 16.754600524902344, 18.080204010009766, 19.405805587768555, 20.731409072875977, 22.0570125579834, 23.382614135742188, 24.70821762084961, 26.03382110595703, 27.359424591064453, 28.685028076171875, 30.010629653930664, 31.336233139038086, 32.661834716796875, 33.9874382019043, 35.31304168701172, 36.63864517211914, 37.96424865722656, 39.289852142333984, 40.615455627441406, 41.94105529785156, 43.266658782958984, 44.592262268066406, 45.91786575317383, 47.24346923828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 3.0, 10.0, 7.0, 16.0, 6.0, 16.0, 16.0, 10.0, 23.0, 23.0, 25.0, 18.0, 36.0, 34.0, 32.0, 34.0, 31.0, 32.0, 34.0, 41.0, 42.0, 31.0, 32.0, 47.0, 39.0, 31.0, 31.0, 39.0, 39.0, 38.0, 18.0, 30.0, 24.0, 10.0, 16.0, 23.0, 15.0, 11.0, 6.0, 8.0, 1.0, 10.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.890625, -5.71673583984375, -5.5428466796875, -5.36895751953125, -5.195068359375, -5.02117919921875, -4.8472900390625, -4.67340087890625, -4.49951171875, -4.32562255859375, -4.1517333984375, -3.97784423828125, -3.803955078125, -3.63006591796875, -3.4561767578125, -3.28228759765625, -3.1083984375, -2.93450927734375, -2.7606201171875, -2.58673095703125, -2.412841796875, -2.23895263671875, -2.0650634765625, -1.89117431640625, -1.71728515625, -1.54339599609375, -1.3695068359375, -1.19561767578125, -1.021728515625, -0.84783935546875, -0.6739501953125, -0.50006103515625, -0.326171875, -0.15228271484375, 0.0216064453125, 0.19549560546875, 0.369384765625, 0.54327392578125, 0.7171630859375, 0.89105224609375, 1.06494140625, 1.23883056640625, 1.4127197265625, 1.58660888671875, 1.760498046875, 1.93438720703125, 2.1082763671875, 2.28216552734375, 2.4560546875, 2.62994384765625, 2.8038330078125, 2.97772216796875, 3.151611328125, 3.32550048828125, 3.4993896484375, 3.67327880859375, 3.84716796875, 4.02105712890625, 4.1949462890625, 4.36883544921875, 4.542724609375, 4.71661376953125, 4.8905029296875, 5.06439208984375, 5.23828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 5.0, 13.0, 15.0, 23.0, 23.0, 36.0, 45.0, 58.0, 86.0, 127.0, 189.0, 338.0, 647.0, 1914.0, 8705.0, 169969.0, 3963731.0, 40889.0, 4867.0, 1270.0, 501.0, 272.0, 179.0, 80.0, 76.0, 58.0, 46.0, 29.0, 17.0, 18.0, 13.0, 13.0, 9.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.81298828125, -44.2509765625, -42.68896484375, -41.126953125, -39.56494140625, -38.0029296875, -36.44091796875, -34.87890625, -33.31689453125, -31.7548828125, -30.19287109375, -28.630859375, -27.06884765625, -25.5068359375, -23.94482421875, -22.3828125, -20.82080078125, -19.2587890625, -17.69677734375, -16.134765625, -14.57275390625, -13.0107421875, -11.44873046875, -9.88671875, -8.32470703125, -6.7626953125, -5.20068359375, -3.638671875, -2.07666015625, -0.5146484375, 1.04736328125, 2.609375, 4.17138671875, 5.7333984375, 7.29541015625, 8.857421875, 10.41943359375, 11.9814453125, 13.54345703125, 15.10546875, 16.66748046875, 18.2294921875, 19.79150390625, 21.353515625, 22.91552734375, 24.4775390625, 26.03955078125, 27.6015625, 29.16357421875, 30.7255859375, 32.28759765625, 33.849609375, 35.41162109375, 36.9736328125, 38.53564453125, 40.09765625, 41.65966796875, 43.2216796875, 44.78369140625, 46.345703125, 47.90771484375, 49.4697265625, 51.03173828125, 52.59375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 21.0, 17.0, 58.0, 79.0, 164.0, 334.0, 715.0, 1436.0, 720.0, 249.0, 112.0, 75.0, 33.0, 21.0, 7.0, 8.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.328125, -13.593017578125, -12.85791015625, -12.122802734375, -11.3876953125, -10.652587890625, -9.91748046875, -9.182373046875, -8.447265625, -7.712158203125, -6.97705078125, -6.241943359375, -5.5068359375, -4.771728515625, -4.03662109375, -3.301513671875, -2.56640625, -1.831298828125, -1.09619140625, -0.361083984375, 0.3740234375, 1.109130859375, 1.84423828125, 2.579345703125, 3.314453125, 4.049560546875, 4.78466796875, 5.519775390625, 6.2548828125, 6.989990234375, 7.72509765625, 8.460205078125, 9.1953125, 9.930419921875, 10.66552734375, 11.400634765625, 12.1357421875, 12.870849609375, 13.60595703125, 14.341064453125, 15.076171875, 15.811279296875, 16.54638671875, 17.281494140625, 18.0166015625, 18.751708984375, 19.48681640625, 20.221923828125, 20.95703125, 21.692138671875, 22.42724609375, 23.162353515625, 23.8974609375, 24.632568359375, 25.36767578125, 26.102783203125, 26.837890625, 27.572998046875, 28.30810546875, 29.043212890625, 29.7783203125, 30.513427734375, 31.24853515625, 31.983642578125, 32.71875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 6.0, 10.0, 12.0, 22.0, 27.0, 68.0, 163.0, 394.0, 938.0, 3039.0, 15951.0, 1631968.0, 2519084.0, 17629.0, 3273.0, 1018.0, 362.0, 150.0, 71.0, 44.0, 19.0, 18.0, 8.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.71875, -41.81982421875, -39.9208984375, -38.02197265625, -36.123046875, -34.22412109375, -32.3251953125, -30.42626953125, -28.52734375, -26.62841796875, -24.7294921875, -22.83056640625, -20.931640625, -19.03271484375, -17.1337890625, -15.23486328125, -13.3359375, -11.43701171875, -9.5380859375, -7.63916015625, -5.740234375, -3.84130859375, -1.9423828125, -0.04345703125, 1.85546875, 3.75439453125, 5.6533203125, 7.55224609375, 9.451171875, 11.35009765625, 13.2490234375, 15.14794921875, 17.046875, 18.94580078125, 20.8447265625, 22.74365234375, 24.642578125, 26.54150390625, 28.4404296875, 30.33935546875, 32.23828125, 34.13720703125, 36.0361328125, 37.93505859375, 39.833984375, 41.73291015625, 43.6318359375, 45.53076171875, 47.4296875, 49.32861328125, 51.2275390625, 53.12646484375, 55.025390625, 56.92431640625, 58.8232421875, 60.72216796875, 62.62109375, 64.52001953125, 66.4189453125, 68.31787109375, 70.216796875, 72.11572265625, 74.0146484375, 75.91357421875, 77.8125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [2.0, 105.0, 740.0, 170.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.89746856689453, -22.230972290039062, -8.564477920532227, 5.102016448974609, 18.768512725830078, 32.43500518798828, 46.10150146484375, 59.76799774169922, 73.43449401855469, 87.10099029541016, 100.76748657226562, 114.43397521972656, 128.10047912597656, 141.7669677734375, 155.4334716796875, 169.09996032714844, 182.76644897460938, 196.4329376220703, 210.0994415283203, 223.76593017578125, 237.43243408203125, 251.0989227294922, 264.7654113769531, 278.4319152832031, 292.0984191894531, 305.7649230957031, 319.431396484375, 333.097900390625, 346.764404296875, 360.430908203125, 374.0973815917969, 387.7638854980469, 401.4303894042969, 415.0968933105469, 428.76336669921875, 442.42987060546875, 456.09637451171875, 469.76287841796875, 483.4293518066406, 497.0958557128906, 510.7623596191406, 524.4288330078125, 538.0953369140625, 551.7618408203125, 565.4283447265625, 579.0948486328125, 592.7613525390625, 606.4278564453125, 620.0942993164062, 633.7608032226562, 647.4273071289062, 661.0938110351562, 674.76025390625, 688.4267578125, 702.09326171875, 715.759765625, 729.42626953125, 743.0927734375, 756.75927734375, 770.42578125, 784.0922241210938, 797.7587280273438, 811.4252319335938, 825.0917358398438, 838.7582397460938]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 8.0, 7.0, 12.0, 10.0, 11.0, 10.0, 20.0, 26.0, 22.0, 30.0, 30.0, 42.0, 44.0, 38.0, 54.0, 51.0, 53.0, 44.0, 31.0, 36.0, 38.0, 34.0, 44.0, 45.0, 33.0, 38.0, 23.0, 29.0, 21.0, 31.0, 15.0, 16.0, 13.0, 6.0, 5.0, 11.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.707557678222656, -38.42266845703125, -37.13777542114258, -35.852882385253906, -34.5679931640625, -33.283103942871094, -31.998210906982422, -30.713319778442383, -29.428428649902344, -28.143537521362305, -26.858646392822266, -25.573755264282227, -24.288864135742188, -23.00397300720215, -21.71908187866211, -20.43419075012207, -19.14929962158203, -17.864408493041992, -16.579517364501953, -15.294626235961914, -14.009735107421875, -12.724843978881836, -11.439952850341797, -10.155061721801758, -8.870170593261719, -7.58527946472168, -6.300388336181641, -5.015497207641602, -3.7306060791015625, -2.4457149505615234, -1.1608238220214844, 0.12406730651855469, 1.4089622497558594, 2.6938533782958984, 3.9787445068359375, 5.263635635375977, 6.548526763916016, 7.833417892456055, 9.118309020996094, 10.403200149536133, 11.688091278076172, 12.972982406616211, 14.25787353515625, 15.542764663696289, 16.827655792236328, 18.112546920776367, 19.397438049316406, 20.682329177856445, 21.967220306396484, 23.252111434936523, 24.537002563476562, 25.8218936920166, 27.10678482055664, 28.39167594909668, 29.67656707763672, 30.961458206176758, 32.2463493347168, 33.53124237060547, 34.816131591796875, 36.10102081298828, 37.38591384887695, 38.670806884765625, 39.95569610595703, 41.24058532714844, 42.52547836303711]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 6.0, 8.0, 17.0, 13.0, 19.0, 16.0, 28.0, 26.0, 30.0, 46.0, 30.0, 35.0, 34.0, 34.0, 35.0, 43.0, 41.0, 52.0, 50.0, 46.0, 44.0, 48.0, 31.0, 32.0, 20.0, 31.0, 32.0, 27.0, 20.0, 16.0, 13.0, 13.0, 16.0, 10.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.7242431640625, -5.526611328125, -5.3289794921875, -5.13134765625, -4.9337158203125, -4.736083984375, -4.5384521484375, -4.3408203125, -4.1431884765625, -3.945556640625, -3.7479248046875, -3.55029296875, -3.3526611328125, -3.155029296875, -2.9573974609375, -2.759765625, -2.5621337890625, -2.364501953125, -2.1668701171875, -1.96923828125, -1.7716064453125, -1.573974609375, -1.3763427734375, -1.1787109375, -0.9810791015625, -0.783447265625, -0.5858154296875, -0.38818359375, -0.1905517578125, 0.007080078125, 0.2047119140625, 0.40234375, 0.5999755859375, 0.797607421875, 0.9952392578125, 1.19287109375, 1.3905029296875, 1.588134765625, 1.7857666015625, 1.9833984375, 2.1810302734375, 2.378662109375, 2.5762939453125, 2.77392578125, 2.9715576171875, 3.169189453125, 3.3668212890625, 3.564453125, 3.7620849609375, 3.959716796875, 4.1573486328125, 4.35498046875, 4.5526123046875, 4.750244140625, 4.9478759765625, 5.1455078125, 5.3431396484375, 5.540771484375, 5.7384033203125, 5.93603515625, 6.1336669921875, 6.331298828125, 6.5289306640625, 6.7265625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 10.0, 23.0, 28.0, 31.0, 73.0, 105.0, 149.0, 222.0, 352.0, 550.0, 871.0, 1376.0, 2100.0, 3465.0, 5733.0, 9373.0, 15598.0, 26042.0, 45571.0, 81833.0, 154295.0, 263621.0, 196452.0, 103565.0, 56464.0, 31967.0, 19120.0, 11473.0, 6814.0, 4158.0, 2655.0, 1645.0, 1020.0, 612.0, 378.0, 259.0, 188.0, 122.0, 82.0, 52.0, 31.0, 19.0, 13.0, 10.0, 12.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2080078125, -0.20183372497558594, -0.19565963745117188, -0.1894855499267578, -0.18331146240234375, -0.1771373748779297, -0.17096328735351562, -0.16478919982910156, -0.1586151123046875, -0.15244102478027344, -0.14626693725585938, -0.1400928497314453, -0.13391876220703125, -0.1277446746826172, -0.12157058715820312, -0.11539649963378906, -0.109222412109375, -0.10304832458496094, -0.09687423706054688, -0.09070014953613281, -0.08452606201171875, -0.07835197448730469, -0.07217788696289062, -0.06600379943847656, -0.0598297119140625, -0.05365562438964844, -0.047481536865234375, -0.04130744934082031, -0.03513336181640625, -0.028959274291992188, -0.022785186767578125, -0.016611099243164062, -0.01043701171875, -0.0042629241943359375, 0.001911163330078125, 0.008085250854492188, 0.01425933837890625, 0.020433425903320312, 0.026607513427734375, 0.03278160095214844, 0.0389556884765625, 0.04512977600097656, 0.051303863525390625, 0.05747795104980469, 0.06365203857421875, 0.06982612609863281, 0.07600021362304688, 0.08217430114746094, 0.088348388671875, 0.09452247619628906, 0.10069656372070312, 0.10687065124511719, 0.11304473876953125, 0.11921882629394531, 0.12539291381835938, 0.13156700134277344, 0.1377410888671875, 0.14391517639160156, 0.15008926391601562, 0.1562633514404297, 0.16243743896484375, 0.1686115264892578, 0.17478561401367188, 0.18095970153808594, 0.1871337890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 12.0, 11.0, 9.0, 11.0, 17.0, 21.0, 14.0, 24.0, 25.0, 25.0, 27.0, 30.0, 34.0, 33.0, 46.0, 48.0, 55.0, 45.0, 1079.0, 49.0, 43.0, 41.0, 28.0, 52.0, 31.0, 28.0, 19.0, 17.0, 26.0, 22.0, 20.0, 18.0, 10.0, 13.0, 12.0, 5.0, 8.0, 5.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-6.19921875, -6.02752685546875, -5.8558349609375, -5.68414306640625, -5.512451171875, -5.34075927734375, -5.1690673828125, -4.99737548828125, -4.82568359375, -4.65399169921875, -4.4822998046875, -4.31060791015625, -4.138916015625, -3.96722412109375, -3.7955322265625, -3.62384033203125, -3.4521484375, -3.28045654296875, -3.1087646484375, -2.93707275390625, -2.765380859375, -2.59368896484375, -2.4219970703125, -2.25030517578125, -2.07861328125, -1.90692138671875, -1.7352294921875, -1.56353759765625, -1.391845703125, -1.22015380859375, -1.0484619140625, -0.87677001953125, -0.705078125, -0.53338623046875, -0.3616943359375, -0.19000244140625, -0.018310546875, 0.15338134765625, 0.3250732421875, 0.49676513671875, 0.66845703125, 0.84014892578125, 1.0118408203125, 1.18353271484375, 1.355224609375, 1.52691650390625, 1.6986083984375, 1.87030029296875, 2.0419921875, 2.21368408203125, 2.3853759765625, 2.55706787109375, 2.728759765625, 2.90045166015625, 3.0721435546875, 3.24383544921875, 3.41552734375, 3.58721923828125, 3.7589111328125, 3.93060302734375, 4.102294921875, 4.27398681640625, 4.4456787109375, 4.61737060546875, 4.7890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 7.0, 10.0, 11.0, 12.0, 21.0, 37.0, 52.0, 57.0, 96.0, 109.0, 178.0, 234.0, 373.0, 559.0, 850.0, 1253.0, 1891.0, 2841.0, 4538.0, 7006.0, 10963.0, 17213.0, 28047.0, 46035.0, 80060.0, 143195.0, 1290677.0, 195928.0, 107408.0, 60800.0, 35771.0, 21785.0, 13867.0, 8854.0, 5571.0, 3760.0, 2385.0, 1614.0, 999.0, 664.0, 486.0, 312.0, 193.0, 128.0, 86.0, 67.0, 43.0, 21.0, 14.0, 14.0, 12.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 4.0], "bins": [-0.0875244140625, -0.08485221862792969, -0.08218002319335938, -0.07950782775878906, -0.07683563232421875, -0.07416343688964844, -0.07149124145507812, -0.06881904602050781, -0.0661468505859375, -0.06347465515136719, -0.060802459716796875, -0.05813026428222656, -0.05545806884765625, -0.05278587341308594, -0.050113677978515625, -0.04744148254394531, -0.044769287109375, -0.04209709167480469, -0.039424896240234375, -0.03675270080566406, -0.03408050537109375, -0.03140830993652344, -0.028736114501953125, -0.026063919067382812, -0.0233917236328125, -0.020719528198242188, -0.018047332763671875, -0.015375137329101562, -0.01270294189453125, -0.010030746459960938, -0.007358551025390625, -0.0046863555908203125, -0.00201416015625, 0.0006580352783203125, 0.003330230712890625, 0.0060024261474609375, 0.00867462158203125, 0.011346817016601562, 0.014019012451171875, 0.016691207885742188, 0.0193634033203125, 0.022035598754882812, 0.024707794189453125, 0.027379989624023438, 0.03005218505859375, 0.03272438049316406, 0.035396575927734375, 0.03806877136230469, 0.040740966796875, 0.04341316223144531, 0.046085357666015625, 0.04875755310058594, 0.05142974853515625, 0.05410194396972656, 0.056774139404296875, 0.05944633483886719, 0.0621185302734375, 0.06479072570800781, 0.06746292114257812, 0.07013511657714844, 0.07280731201171875, 0.07547950744628906, 0.07815170288085938, 0.08082389831542969, 0.08349609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 8.0, 5.0, 11.0, 14.0, 7.0, 11.0, 20.0, 12.0, 19.0, 24.0, 27.0, 39.0, 34.0, 72.0, 76.0, 107.0, 87.0, 78.0, 55.0, 43.0, 39.0, 48.0, 19.0, 16.0, 15.0, 16.0, 11.0, 16.0, 12.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0005183219909667969, -0.0005003586411476135, -0.0004823952913284302, -0.0004644319415092468, -0.0004464685916900635, -0.0004285052418708801, -0.0004105418920516968, -0.00039257854223251343, -0.0003746151924133301, -0.00035665184259414673, -0.0003386884927749634, -0.00032072514295578003, -0.0003027617931365967, -0.00028479844331741333, -0.00026683509349823, -0.00024887174367904663, -0.00023090839385986328, -0.00021294504404067993, -0.00019498169422149658, -0.00017701834440231323, -0.00015905499458312988, -0.00014109164476394653, -0.00012312829494476318, -0.00010516494512557983, -8.720159530639648e-05, -6.923824548721313e-05, -5.1274895668029785e-05, -3.3311545848846436e-05, -1.5348196029663086e-05, 2.6151537895202637e-06, 2.0578503608703613e-05, 3.854185342788696e-05, 5.650520324707031e-05, 7.446855306625366e-05, 9.243190288543701e-05, 0.00011039525270462036, 0.0001283586025238037, 0.00014632195234298706, 0.0001642853021621704, 0.00018224865198135376, 0.0002002120018005371, 0.00021817535161972046, 0.0002361387014389038, 0.00025410205125808716, 0.0002720654010772705, 0.00029002875089645386, 0.0003079921007156372, 0.00032595545053482056, 0.0003439188003540039, 0.00036188215017318726, 0.0003798454999923706, 0.00039780884981155396, 0.0004157721996307373, 0.00043373554944992065, 0.000451698899269104, 0.00046966224908828735, 0.0004876255989074707, 0.000505588948726654, 0.0005235522985458374, 0.0005415156483650208, 0.0005594789981842041, 0.0005774423480033875, 0.0005954056978225708, 0.0006133690476417542, 0.0006313323974609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 10.0, 17.0, 17.0, 20.0, 20.0, 28.0, 39.0, 74.0, 92.0, 194.0, 359.0, 1980.0, 264832.0, 776533.0, 3268.0, 489.0, 189.0, 110.0, 58.0, 34.0, 25.0, 18.0, 24.0, 11.0, 9.0, 16.0, 11.0, 8.0, 9.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.01486968994140625, -0.014445781707763672, -0.014021873474121094, -0.013597965240478516, -0.013174057006835938, -0.01275014877319336, -0.012326240539550781, -0.011902332305908203, -0.011478424072265625, -0.011054515838623047, -0.010630607604980469, -0.01020669937133789, -0.009782791137695312, -0.009358882904052734, -0.008934974670410156, -0.008511066436767578, -0.008087158203125, -0.007663249969482422, -0.007239341735839844, -0.006815433502197266, -0.0063915252685546875, -0.005967617034912109, -0.005543708801269531, -0.005119800567626953, -0.004695892333984375, -0.004271984100341797, -0.0038480758666992188, -0.0034241676330566406, -0.0030002593994140625, -0.0025763511657714844, -0.0021524429321289062, -0.0017285346984863281, -0.00130462646484375, -0.0008807182312011719, -0.00045680999755859375, -3.2901763916015625e-05, 0.0003910064697265625, 0.0008149147033691406, 0.0012388229370117188, 0.0016627311706542969, 0.002086639404296875, 0.002510547637939453, 0.0029344558715820312, 0.0033583641052246094, 0.0037822723388671875, 0.004206180572509766, 0.004630088806152344, 0.005053997039794922, 0.0054779052734375, 0.005901813507080078, 0.006325721740722656, 0.006749629974365234, 0.0071735382080078125, 0.007597446441650391, 0.008021354675292969, 0.008445262908935547, 0.008869171142578125, 0.009293079376220703, 0.009716987609863281, 0.01014089584350586, 0.010564804077148438, 0.010988712310791016, 0.011412620544433594, 0.011836528778076172, 0.01226043701171875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 33.0, 247.0, 601.0, 111.0, 15.0, 4.0], "bins": [-0.0061801765114068985, -0.006077658850699663, -0.0059751407243311405, -0.005872623063623905, -0.00577010540291667, -0.005667587276548147, -0.005565069615840912, -0.005462551489472389, -0.005360033828765154, -0.0052575161680579185, -0.005154998041689396, -0.005052480380982161, -0.004949962720274925, -0.004847444593906403, -0.004744926933199167, -0.004642409272491932, -0.004539891146123409, -0.004437373485416174, -0.004334855359047651, -0.004232337698340416, -0.004129820037633181, -0.004027301911264658, -0.003924784250557423, -0.0038222663570195436, -0.0037197486963123083, -0.0036172308027744293, -0.003514713142067194, -0.003412195248529315, -0.003309677354991436, -0.0032071596942842007, -0.0031046418007463217, -0.0030021239072084427, -0.0028996060136705637, -0.0027970881201326847, -0.0026945704594254494, -0.0025920525658875704, -0.0024895346723496914, -0.002387017011642456, -0.002284499118104577, -0.002181981224566698, -0.0020794635638594627, -0.0019769456703215837, -0.0018744278931990266, -0.0017719101160764694, -0.0016693922225385904, -0.0015668744454160333, -0.001464356668293476, -0.0013618387747555971, -0.0012593208812177181, -0.001156803104095161, -0.001054285210557282, -0.0009517674334347248, -0.0008492495398968458, -0.0007467317627742887, -0.0006442139274440706, -0.0005416960921138525, -0.00043917822767980397, -0.0003366603923495859, -0.00023414257157128304, -0.0001316247507929802, -2.9106915462762117e-05, 7.34108907636255e-05, 0.00017592872609384358, 0.00027844656142406166, 0.00038096439675427973]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 5.0, 16.0, 14.0, 11.0, 15.0, 22.0, 18.0, 30.0, 24.0, 28.0, 28.0, 36.0, 43.0, 41.0, 40.0, 37.0, 35.0, 57.0, 55.0, 46.0, 40.0, 41.0, 37.0, 43.0, 23.0, 20.0, 16.0, 28.0, 21.0, 19.0, 9.0, 14.0, 10.0, 10.0, 9.0, 8.0, 9.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00036454200744628906, -0.0003531603142619133, -0.00034177862107753754, -0.0003303969278931618, -0.000319015234708786, -0.00030763354152441025, -0.0002962518483400345, -0.0002848701551556587, -0.00027348846197128296, -0.0002621067687869072, -0.00025072507560253143, -0.00023934338241815567, -0.0002279616892337799, -0.00021657999604940414, -0.00020519830286502838, -0.00019381660968065262, -0.00018243491649627686, -0.0001710532233119011, -0.00015967153012752533, -0.00014828983694314957, -0.0001369081437587738, -0.00012552645057439804, -0.00011414475739002228, -0.00010276306420564651, -9.138137102127075e-05, -7.999967783689499e-05, -6.861798465251923e-05, -5.723629146814346e-05, -4.58545982837677e-05, -3.447290509939194e-05, -2.3091211915016174e-05, -1.1709518730640411e-05, -3.2782554626464844e-07, 1.1053867638111115e-05, 2.2435560822486877e-05, 3.381725400686264e-05, 4.51989471912384e-05, 5.6580640375614166e-05, 6.796233355998993e-05, 7.934402674436569e-05, 9.072571992874146e-05, 0.00010210741311311722, 0.00011348910629749298, 0.00012487079948186874, 0.0001362524926662445, 0.00014763418585062027, 0.00015901587903499603, 0.0001703975722193718, 0.00018177926540374756, 0.00019316095858812332, 0.00020454265177249908, 0.00021592434495687485, 0.0002273060381412506, 0.00023868773132562637, 0.00025006942451000214, 0.0002614511176943779, 0.00027283281087875366, 0.0002842145040631294, 0.0002955961972475052, 0.00030697789043188095, 0.0003183595836162567, 0.0003297412768006325, 0.00034112296998500824, 0.000352504663169384, 0.00036388635635375977]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 5.0, 6.0, 6.0, 8.0, 17.0, 13.0, 19.0, 16.0, 28.0, 26.0, 30.0, 46.0, 30.0, 35.0, 34.0, 34.0, 35.0, 43.0, 41.0, 52.0, 50.0, 46.0, 44.0, 48.0, 31.0, 32.0, 20.0, 31.0, 32.0, 27.0, 20.0, 16.0, 13.0, 13.0, 16.0, 10.0, 5.0, 5.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.7242431640625, -5.526611328125, -5.3289794921875, -5.13134765625, -4.9337158203125, -4.736083984375, -4.5384521484375, -4.3408203125, -4.1431884765625, -3.945556640625, -3.7479248046875, -3.55029296875, -3.3526611328125, -3.155029296875, -2.9573974609375, -2.759765625, -2.5621337890625, -2.364501953125, -2.1668701171875, -1.96923828125, -1.7716064453125, -1.573974609375, -1.3763427734375, -1.1787109375, -0.9810791015625, -0.783447265625, -0.5858154296875, -0.38818359375, -0.1905517578125, 0.007080078125, 0.2047119140625, 0.40234375, 0.5999755859375, 0.797607421875, 0.9952392578125, 1.19287109375, 1.3905029296875, 1.588134765625, 1.7857666015625, 1.9833984375, 2.1810302734375, 2.378662109375, 2.5762939453125, 2.77392578125, 2.9715576171875, 3.169189453125, 3.3668212890625, 3.564453125, 3.7620849609375, 3.959716796875, 4.1573486328125, 4.35498046875, 4.5526123046875, 4.750244140625, 4.9478759765625, 5.1455078125, 5.3431396484375, 5.540771484375, 5.7384033203125, 5.93603515625, 6.1336669921875, 6.331298828125, 6.5289306640625, 6.7265625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 11.0, 8.0, 13.0, 14.0, 32.0, 63.0, 129.0, 258.0, 539.0, 1497.0, 4147.0, 16373.0, 83455.0, 490559.0, 372037.0, 61172.0, 12546.0, 3565.0, 1139.0, 506.0, 219.0, 107.0, 52.0, 35.0, 15.0, 12.0, 13.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-23.390625, -22.679931640625, -21.96923828125, -21.258544921875, -20.5478515625, -19.837158203125, -19.12646484375, -18.415771484375, -17.705078125, -16.994384765625, -16.28369140625, -15.572998046875, -14.8623046875, -14.151611328125, -13.44091796875, -12.730224609375, -12.01953125, -11.308837890625, -10.59814453125, -9.887451171875, -9.1767578125, -8.466064453125, -7.75537109375, -7.044677734375, -6.333984375, -5.623291015625, -4.91259765625, -4.201904296875, -3.4912109375, -2.780517578125, -2.06982421875, -1.359130859375, -0.6484375, 0.062255859375, 0.77294921875, 1.483642578125, 2.1943359375, 2.905029296875, 3.61572265625, 4.326416015625, 5.037109375, 5.747802734375, 6.45849609375, 7.169189453125, 7.8798828125, 8.590576171875, 9.30126953125, 10.011962890625, 10.72265625, 11.433349609375, 12.14404296875, 12.854736328125, 13.5654296875, 14.276123046875, 14.98681640625, 15.697509765625, 16.408203125, 17.118896484375, 17.82958984375, 18.540283203125, 19.2509765625, 19.961669921875, 20.67236328125, 21.383056640625, 22.09375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 17.0, 16.0, 24.0, 23.0, 37.0, 30.0, 64.0, 63.0, 79.0, 109.0, 187.0, 293.0, 1342.0, 187.0, 131.0, 100.0, 71.0, 49.0, 54.0, 32.0, 28.0, 23.0, 20.0, 11.0, 8.0, 12.0, 5.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.9375, -17.32177734375, -16.7060546875, -16.09033203125, -15.474609375, -14.85888671875, -14.2431640625, -13.62744140625, -13.01171875, -12.39599609375, -11.7802734375, -11.16455078125, -10.548828125, -9.93310546875, -9.3173828125, -8.70166015625, -8.0859375, -7.47021484375, -6.8544921875, -6.23876953125, -5.623046875, -5.00732421875, -4.3916015625, -3.77587890625, -3.16015625, -2.54443359375, -1.9287109375, -1.31298828125, -0.697265625, -0.08154296875, 0.5341796875, 1.14990234375, 1.765625, 2.38134765625, 2.9970703125, 3.61279296875, 4.228515625, 4.84423828125, 5.4599609375, 6.07568359375, 6.69140625, 7.30712890625, 7.9228515625, 8.53857421875, 9.154296875, 9.77001953125, 10.3857421875, 11.00146484375, 11.6171875, 12.23291015625, 12.8486328125, 13.46435546875, 14.080078125, 14.69580078125, 15.3115234375, 15.92724609375, 16.54296875, 17.15869140625, 17.7744140625, 18.39013671875, 19.005859375, 19.62158203125, 20.2373046875, 20.85302734375, 21.46875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 12.0, 12.0, 15.0, 35.0, 37.0, 53.0, 79.0, 114.0, 155.0, 213.0, 333.0, 571.0, 1068.0, 3763.0, 50418.0, 2942086.0, 137825.0, 5739.0, 1326.0, 668.0, 385.0, 263.0, 174.0, 113.0, 84.0, 53.0, 35.0, 33.0, 27.0, 5.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.4189453125, -38.087890625, -36.7568359375, -35.42578125, -34.0947265625, -32.763671875, -31.4326171875, -30.1015625, -28.7705078125, -27.439453125, -26.1083984375, -24.77734375, -23.4462890625, -22.115234375, -20.7841796875, -19.453125, -18.1220703125, -16.791015625, -15.4599609375, -14.12890625, -12.7978515625, -11.466796875, -10.1357421875, -8.8046875, -7.4736328125, -6.142578125, -4.8115234375, -3.48046875, -2.1494140625, -0.818359375, 0.5126953125, 1.84375, 3.1748046875, 4.505859375, 5.8369140625, 7.16796875, 8.4990234375, 9.830078125, 11.1611328125, 12.4921875, 13.8232421875, 15.154296875, 16.4853515625, 17.81640625, 19.1474609375, 20.478515625, 21.8095703125, 23.140625, 24.4716796875, 25.802734375, 27.1337890625, 28.46484375, 29.7958984375, 31.126953125, 32.4580078125, 33.7890625, 35.1201171875, 36.451171875, 37.7822265625, 39.11328125, 40.4443359375, 41.775390625, 43.1064453125, 44.4375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 21.0, 47.0, 122.0, 239.0, 286.0, 176.0, 77.0, 27.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.66944885253906, -95.56439971923828, -91.4593505859375, -87.35430145263672, -83.24925231933594, -79.14420318603516, -75.03915405273438, -70.9341049194336, -66.82905578613281, -62.72400665283203, -58.61895751953125, -54.51390838623047, -50.40885925292969, -46.303810119628906, -42.198760986328125, -38.093711853027344, -33.98866271972656, -29.88361358642578, -25.778564453125, -21.67351531982422, -17.568466186523438, -13.463417053222656, -9.358367919921875, -5.253318786621094, -1.1482696533203125, 2.9567794799804688, 7.06182861328125, 11.166877746582031, 15.271926879882812, 19.376976013183594, 23.482025146484375, 27.587074279785156, 31.692108154296875, 35.797157287597656, 39.90220642089844, 44.00725555419922, 48.1123046875, 52.21735382080078, 56.32240295410156, 60.427452087402344, 64.53250122070312, 68.6375503540039, 72.74259948730469, 76.84764862060547, 80.95269775390625, 85.05774688720703, 89.16279602050781, 93.2678451538086, 97.37289428710938, 101.47794342041016, 105.58299255371094, 109.68804168701172, 113.7930908203125, 117.89813995361328, 122.00318908691406, 126.10823822021484, 130.21328735351562, 134.31832885742188, 138.4233856201172, 142.5284423828125, 146.63348388671875, 150.738525390625, 154.8435821533203, 158.94863891601562, 163.05368041992188]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 10.0, 5.0, 7.0, 11.0, 12.0, 14.0, 18.0, 17.0, 31.0, 21.0, 28.0, 23.0, 27.0, 39.0, 39.0, 32.0, 27.0, 38.0, 40.0, 43.0, 50.0, 45.0, 38.0, 44.0, 32.0, 37.0, 35.0, 36.0, 25.0, 24.0, 23.0, 23.0, 13.0, 16.0, 11.0, 11.0, 11.0, 6.0, 5.0, 7.0, 7.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.98893356323242, -49.46489715576172, -47.94085693359375, -46.41682052612305, -44.892784118652344, -43.368743896484375, -41.84470748901367, -40.32067108154297, -38.796630859375, -37.2725944519043, -35.74855422973633, -34.224517822265625, -32.700477600097656, -31.176441192626953, -29.65240478515625, -28.128366470336914, -26.604328155517578, -25.080289840698242, -23.556251525878906, -22.032215118408203, -20.508176803588867, -18.98413848876953, -17.460102081298828, -15.936063766479492, -14.412025451660156, -12.88798713684082, -11.3639497756958, -9.839912414550781, -8.315874099731445, -6.791836261749268, -5.26779842376709, -3.7437610626220703, -2.2197265625, -0.6956887245178223, 0.8283491134643555, 2.352386951446533, 3.876424789428711, 5.400462627410889, 6.924500465393066, 8.448537826538086, 9.972576141357422, 11.496614456176758, 13.020651817321777, 14.544689178466797, 16.068727493286133, 17.59276580810547, 19.116802215576172, 20.640840530395508, 22.164878845214844, 23.68891716003418, 25.212955474853516, 26.73699188232422, 28.261030197143555, 29.78506851196289, 31.309104919433594, 32.83314514160156, 34.357181549072266, 35.88121795654297, 37.40525817871094, 38.92929458618164, 40.453330993652344, 41.97737121582031, 43.501407623291016, 45.02544403076172, 46.54948425292969]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 6.0, 9.0, 13.0, 12.0, 13.0, 17.0, 25.0, 22.0, 28.0, 36.0, 29.0, 31.0, 33.0, 40.0, 40.0, 47.0, 43.0, 42.0, 45.0, 44.0, 49.0, 46.0, 39.0, 33.0, 28.0, 24.0, 32.0, 24.0, 24.0, 19.0, 10.0, 15.0, 18.0, 6.0, 9.0, 14.0, 3.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.71484375, -6.52154541015625, -6.3282470703125, -6.13494873046875, -5.941650390625, -5.74835205078125, -5.5550537109375, -5.36175537109375, -5.16845703125, -4.97515869140625, -4.7818603515625, -4.58856201171875, -4.395263671875, -4.20196533203125, -4.0086669921875, -3.81536865234375, -3.6220703125, -3.42877197265625, -3.2354736328125, -3.04217529296875, -2.848876953125, -2.65557861328125, -2.4622802734375, -2.26898193359375, -2.07568359375, -1.88238525390625, -1.6890869140625, -1.49578857421875, -1.302490234375, -1.10919189453125, -0.9158935546875, -0.72259521484375, -0.529296875, -0.33599853515625, -0.1427001953125, 0.05059814453125, 0.243896484375, 0.43719482421875, 0.6304931640625, 0.82379150390625, 1.01708984375, 1.21038818359375, 1.4036865234375, 1.59698486328125, 1.790283203125, 1.98358154296875, 2.1768798828125, 2.37017822265625, 2.5634765625, 2.75677490234375, 2.9500732421875, 3.14337158203125, 3.336669921875, 3.52996826171875, 3.7232666015625, 3.91656494140625, 4.10986328125, 4.30316162109375, 4.4964599609375, 4.68975830078125, 4.883056640625, 5.07635498046875, 5.2696533203125, 5.46295166015625, 5.65625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 8.0, 4.0, 11.0, 22.0, 38.0, 78.0, 112.0, 221.0, 382.0, 653.0, 1177.0, 2302.0, 5997.0, 23638.0, 404287.0, 3264174.0, 454559.0, 25200.0, 6208.0, 2456.0, 1172.0, 633.0, 407.0, 247.0, 119.0, 72.0, 45.0, 19.0, 14.0, 5.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.171875, -17.576416015625, -16.98095703125, -16.385498046875, -15.7900390625, -15.194580078125, -14.59912109375, -14.003662109375, -13.408203125, -12.812744140625, -12.21728515625, -11.621826171875, -11.0263671875, -10.430908203125, -9.83544921875, -9.239990234375, -8.64453125, -8.049072265625, -7.45361328125, -6.858154296875, -6.2626953125, -5.667236328125, -5.07177734375, -4.476318359375, -3.880859375, -3.285400390625, -2.68994140625, -2.094482421875, -1.4990234375, -0.903564453125, -0.30810546875, 0.287353515625, 0.8828125, 1.478271484375, 2.07373046875, 2.669189453125, 3.2646484375, 3.860107421875, 4.45556640625, 5.051025390625, 5.646484375, 6.241943359375, 6.83740234375, 7.432861328125, 8.0283203125, 8.623779296875, 9.21923828125, 9.814697265625, 10.41015625, 11.005615234375, 11.60107421875, 12.196533203125, 12.7919921875, 13.387451171875, 13.98291015625, 14.578369140625, 15.173828125, 15.769287109375, 16.36474609375, 16.960205078125, 17.5556640625, 18.151123046875, 18.74658203125, 19.342041015625, 19.9375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 12.0, 9.0, 19.0, 22.0, 37.0, 44.0, 66.0, 136.0, 189.0, 300.0, 457.0, 740.0, 678.0, 447.0, 310.0, 180.0, 133.0, 85.0, 55.0, 35.0, 27.0, 20.0, 16.0, 10.0, 3.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.688232421875, -10.30615234375, -9.924072265625, -9.5419921875, -9.159912109375, -8.77783203125, -8.395751953125, -8.013671875, -7.631591796875, -7.24951171875, -6.867431640625, -6.4853515625, -6.103271484375, -5.72119140625, -5.339111328125, -4.95703125, -4.574951171875, -4.19287109375, -3.810791015625, -3.4287109375, -3.046630859375, -2.66455078125, -2.282470703125, -1.900390625, -1.518310546875, -1.13623046875, -0.754150390625, -0.3720703125, 0.010009765625, 0.39208984375, 0.774169921875, 1.15625, 1.538330078125, 1.92041015625, 2.302490234375, 2.6845703125, 3.066650390625, 3.44873046875, 3.830810546875, 4.212890625, 4.594970703125, 4.97705078125, 5.359130859375, 5.7412109375, 6.123291015625, 6.50537109375, 6.887451171875, 7.26953125, 7.651611328125, 8.03369140625, 8.415771484375, 8.7978515625, 9.179931640625, 9.56201171875, 9.944091796875, 10.326171875, 10.708251953125, 11.09033203125, 11.472412109375, 11.8544921875, 12.236572265625, 12.61865234375, 13.000732421875, 13.3828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 9.0, 5.0, 17.0, 33.0, 46.0, 63.0, 125.0, 192.0, 378.0, 792.0, 1869.0, 5212.0, 21332.0, 221749.0, 3631149.0, 278130.0, 23819.0, 5669.0, 1900.0, 833.0, 417.0, 233.0, 134.0, 56.0, 40.0, 29.0, 12.0, 13.0, 8.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.1865234375, -22.451171875, -21.7158203125, -20.98046875, -20.2451171875, -19.509765625, -18.7744140625, -18.0390625, -17.3037109375, -16.568359375, -15.8330078125, -15.09765625, -14.3623046875, -13.626953125, -12.8916015625, -12.15625, -11.4208984375, -10.685546875, -9.9501953125, -9.21484375, -8.4794921875, -7.744140625, -7.0087890625, -6.2734375, -5.5380859375, -4.802734375, -4.0673828125, -3.33203125, -2.5966796875, -1.861328125, -1.1259765625, -0.390625, 0.3447265625, 1.080078125, 1.8154296875, 2.55078125, 3.2861328125, 4.021484375, 4.7568359375, 5.4921875, 6.2275390625, 6.962890625, 7.6982421875, 8.43359375, 9.1689453125, 9.904296875, 10.6396484375, 11.375, 12.1103515625, 12.845703125, 13.5810546875, 14.31640625, 15.0517578125, 15.787109375, 16.5224609375, 17.2578125, 17.9931640625, 18.728515625, 19.4638671875, 20.19921875, 20.9345703125, 21.669921875, 22.4052734375, 23.140625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 14.0, 97.0, 381.0, 369.0, 131.0, 17.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.70587158203125, -128.3730926513672, -123.04029846191406, -117.70751190185547, -112.37472534179688, -107.04193878173828, -101.70915222167969, -96.37637329101562, -91.0435791015625, -85.7107925415039, -80.37800598144531, -75.04521942138672, -69.71243286132812, -64.37964630126953, -59.0468635559082, -53.71407699584961, -48.38129425048828, -43.04850769042969, -37.715721130371094, -32.3829345703125, -27.05014991760254, -21.717363357543945, -16.384578704833984, -11.05179214477539, -5.719005584716797, -0.38621950149536133, 4.946566581726074, 10.279352188110352, 15.612138748168945, 20.94492530822754, 26.2777099609375, 31.610496520996094, 36.94328308105469, 42.27606964111328, 47.608856201171875, 52.94164276123047, 58.27442932128906, 63.607215881347656, 68.94000244140625, 74.27278137207031, 79.60557556152344, 84.93836212158203, 90.27114868164062, 95.60393524169922, 100.93672180175781, 106.2695083618164, 111.602294921875, 116.93507385253906, 122.26786041259766, 127.60064697265625, 132.9334259033203, 138.26622009277344, 143.5989990234375, 148.93179321289062, 154.2645721435547, 159.5973663330078, 164.93014526367188, 170.26292419433594, 175.59571838378906, 180.92849731445312, 186.26129150390625, 191.5940704345703, 196.92686462402344, 202.2596435546875, 207.59243774414062]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 8.0, 11.0, 15.0, 23.0, 16.0, 26.0, 43.0, 55.0, 40.0, 57.0, 52.0, 63.0, 80.0, 85.0, 60.0, 60.0, 76.0, 60.0, 53.0, 44.0, 28.0, 26.0, 3.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.37450408935547, -67.34610748291016, -65.31771850585938, -63.28932189941406, -61.26092529296875, -59.23252868652344, -57.20413589477539, -55.175743103027344, -53.14734649658203, -51.11894989013672, -49.09055709838867, -47.062164306640625, -45.03376770019531, -43.00537109375, -40.97697830200195, -38.948585510253906, -36.920188903808594, -34.89179229736328, -32.863399505615234, -30.835004806518555, -28.806610107421875, -26.778215408325195, -24.749820709228516, -22.721426010131836, -20.693031311035156, -18.664636611938477, -16.636241912841797, -14.607847213745117, -12.579452514648438, -10.551057815551758, -8.522663116455078, -6.494268417358398, -4.465869903564453, -2.4374752044677734, -0.40908050537109375, 1.619314193725586, 3.6477088928222656, 5.676103591918945, 7.704498291015625, 9.732892990112305, 11.761287689208984, 13.789682388305664, 15.818077087402344, 17.846471786499023, 19.874866485595703, 21.903261184692383, 23.931655883789062, 25.960050582885742, 27.988445281982422, 30.0168399810791, 32.04523468017578, 34.073631286621094, 36.10202407836914, 38.13041687011719, 40.1588134765625, 42.18721008300781, 44.21560287475586, 46.243995666503906, 48.27239227294922, 50.30078887939453, 52.32918167114258, 54.357574462890625, 56.38597106933594, 58.41436767578125, 60.4427604675293]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 13.0, 7.0, 16.0, 11.0, 18.0, 25.0, 21.0, 28.0, 25.0, 39.0, 30.0, 38.0, 29.0, 35.0, 33.0, 36.0, 40.0, 36.0, 50.0, 34.0, 37.0, 28.0, 42.0, 28.0, 31.0, 35.0, 29.0, 28.0, 21.0, 21.0, 18.0, 19.0, 11.0, 11.0, 14.0, 8.0, 4.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.97686767578125, -4.8092041015625, -4.64154052734375, -4.473876953125, -4.30621337890625, -4.1385498046875, -3.97088623046875, -3.80322265625, -3.63555908203125, -3.4678955078125, -3.30023193359375, -3.132568359375, -2.96490478515625, -2.7972412109375, -2.62957763671875, -2.4619140625, -2.29425048828125, -2.1265869140625, -1.95892333984375, -1.791259765625, -1.62359619140625, -1.4559326171875, -1.28826904296875, -1.12060546875, -0.95294189453125, -0.7852783203125, -0.61761474609375, -0.449951171875, -0.28228759765625, -0.1146240234375, 0.05303955078125, 0.220703125, 0.38836669921875, 0.5560302734375, 0.72369384765625, 0.891357421875, 1.05902099609375, 1.2266845703125, 1.39434814453125, 1.56201171875, 1.72967529296875, 1.8973388671875, 2.06500244140625, 2.232666015625, 2.40032958984375, 2.5679931640625, 2.73565673828125, 2.9033203125, 3.07098388671875, 3.2386474609375, 3.40631103515625, 3.573974609375, 3.74163818359375, 3.9093017578125, 4.07696533203125, 4.24462890625, 4.41229248046875, 4.5799560546875, 4.74761962890625, 4.915283203125, 5.08294677734375, 5.2506103515625, 5.41827392578125, 5.5859375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 4.0, 9.0, 15.0, 22.0, 28.0, 50.0, 77.0, 97.0, 128.0, 226.0, 301.0, 488.0, 703.0, 1033.0, 1550.0, 2314.0, 3562.0, 5375.0, 8054.0, 12101.0, 18168.0, 27374.0, 43215.0, 71542.0, 125205.0, 228969.0, 207752.0, 111111.0, 64414.0, 39626.0, 25123.0, 16421.0, 11088.0, 7229.0, 4943.0, 3390.0, 2208.0, 1511.0, 985.0, 707.0, 475.0, 309.0, 205.0, 135.0, 106.0, 75.0, 45.0, 27.0, 26.0, 12.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.164794921875, -0.15978622436523438, -0.15477752685546875, -0.14976882934570312, -0.1447601318359375, -0.13975143432617188, -0.13474273681640625, -0.12973403930664062, -0.124725341796875, -0.11971664428710938, -0.11470794677734375, -0.10969924926757812, -0.1046905517578125, -0.09968185424804688, -0.09467315673828125, -0.08966445922851562, -0.08465576171875, -0.07964706420898438, -0.07463836669921875, -0.06962966918945312, -0.0646209716796875, -0.059612274169921875, -0.05460357666015625, -0.049594879150390625, -0.044586181640625, -0.039577484130859375, -0.03456878662109375, -0.029560089111328125, -0.0245513916015625, -0.019542694091796875, -0.01453399658203125, -0.009525299072265625, -0.0045166015625, 0.000492095947265625, 0.00550079345703125, 0.010509490966796875, 0.0155181884765625, 0.020526885986328125, 0.02553558349609375, 0.030544281005859375, 0.035552978515625, 0.040561676025390625, 0.04557037353515625, 0.050579071044921875, 0.0555877685546875, 0.060596466064453125, 0.06560516357421875, 0.07061386108398438, 0.07562255859375, 0.08063125610351562, 0.08563995361328125, 0.09064865112304688, 0.0956573486328125, 0.10066604614257812, 0.10567474365234375, 0.11068344116210938, 0.115692138671875, 0.12070083618164062, 0.12570953369140625, 0.13071823120117188, 0.1357269287109375, 0.14073562622070312, 0.14574432373046875, 0.15075302124023438, 0.15576171875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 9.0, 10.0, 14.0, 14.0, 21.0, 18.0, 29.0, 27.0, 25.0, 33.0, 30.0, 49.0, 41.0, 26.0, 41.0, 28.0, 45.0, 49.0, 1072.0, 40.0, 22.0, 28.0, 42.0, 28.0, 36.0, 20.0, 33.0, 21.0, 20.0, 15.0, 29.0, 7.0, 16.0, 18.0, 11.0, 10.0, 6.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4453125, -4.28656005859375, -4.1278076171875, -3.96905517578125, -3.810302734375, -3.65155029296875, -3.4927978515625, -3.33404541015625, -3.17529296875, -3.01654052734375, -2.8577880859375, -2.69903564453125, -2.540283203125, -2.38153076171875, -2.2227783203125, -2.06402587890625, -1.9052734375, -1.74652099609375, -1.5877685546875, -1.42901611328125, -1.270263671875, -1.11151123046875, -0.9527587890625, -0.79400634765625, -0.63525390625, -0.47650146484375, -0.3177490234375, -0.15899658203125, -0.000244140625, 0.15850830078125, 0.3172607421875, 0.47601318359375, 0.634765625, 0.79351806640625, 0.9522705078125, 1.11102294921875, 1.269775390625, 1.42852783203125, 1.5872802734375, 1.74603271484375, 1.90478515625, 2.06353759765625, 2.2222900390625, 2.38104248046875, 2.539794921875, 2.69854736328125, 2.8572998046875, 3.01605224609375, 3.1748046875, 3.33355712890625, 3.4923095703125, 3.65106201171875, 3.809814453125, 3.96856689453125, 4.1273193359375, 4.28607177734375, 4.44482421875, 4.60357666015625, 4.7623291015625, 4.92108154296875, 5.079833984375, 5.23858642578125, 5.3973388671875, 5.55609130859375, 5.71484375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 4.0, 7.0, 5.0, 14.0, 23.0, 32.0, 55.0, 89.0, 157.0, 225.0, 375.0, 669.0, 987.0, 1761.0, 2870.0, 4626.0, 7647.0, 12831.0, 22120.0, 39295.0, 73723.0, 149206.0, 1347233.0, 211501.0, 100252.0, 51773.0, 28340.0, 16374.0, 9950.0, 5949.0, 3504.0, 2101.0, 1293.0, 784.0, 496.0, 308.0, 190.0, 127.0, 79.0, 47.0, 33.0, 28.0, 11.0, 16.0, 4.0, 4.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11102294921875, -0.10740947723388672, -0.10379600524902344, -0.10018253326416016, -0.09656906127929688, -0.0929555892944336, -0.08934211730957031, -0.08572864532470703, -0.08211517333984375, -0.07850170135498047, -0.07488822937011719, -0.0712747573852539, -0.06766128540039062, -0.06404781341552734, -0.06043434143066406, -0.05682086944580078, -0.0532073974609375, -0.04959392547607422, -0.04598045349121094, -0.042366981506347656, -0.038753509521484375, -0.035140037536621094, -0.03152656555175781, -0.02791309356689453, -0.02429962158203125, -0.02068614959716797, -0.017072677612304688, -0.013459205627441406, -0.009845733642578125, -0.006232261657714844, -0.0026187896728515625, 0.0009946823120117188, 0.004608154296875, 0.008221626281738281, 0.011835098266601562, 0.015448570251464844, 0.019062042236328125, 0.022675514221191406, 0.026288986206054688, 0.02990245819091797, 0.03351593017578125, 0.03712940216064453, 0.04074287414550781, 0.044356346130371094, 0.047969818115234375, 0.051583290100097656, 0.05519676208496094, 0.05881023406982422, 0.0624237060546875, 0.06603717803955078, 0.06965065002441406, 0.07326412200927734, 0.07687759399414062, 0.0804910659790039, 0.08410453796386719, 0.08771800994873047, 0.09133148193359375, 0.09494495391845703, 0.09855842590332031, 0.1021718978881836, 0.10578536987304688, 0.10939884185791016, 0.11301231384277344, 0.11662578582763672, 0.1202392578125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 9.0, 17.0, 35.0, 40.0, 56.0, 80.0, 96.0, 197.0, 164.0, 94.0, 57.0, 42.0, 27.0, 25.0, 14.0, 7.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006814002990722656, -0.0006584897637367249, -0.0006355792284011841, -0.0006126686930656433, -0.0005897581577301025, -0.0005668476223945618, -0.000543937087059021, -0.0005210265517234802, -0.0004981160163879395, -0.0004752054810523987, -0.0004522949457168579, -0.00042938441038131714, -0.00040647387504577637, -0.0003835633397102356, -0.0003606528043746948, -0.00033774226903915405, -0.0003148317337036133, -0.0002919211983680725, -0.00026901066303253174, -0.00024610012769699097, -0.0002231895923614502, -0.00020027905702590942, -0.00017736852169036865, -0.00015445798635482788, -0.0001315474510192871, -0.00010863691568374634, -8.572638034820557e-05, -6.28158450126648e-05, -3.9905309677124023e-05, -1.6994774341583252e-05, 5.9157609939575195e-06, 2.882629632949829e-05, 5.173683166503906e-05, 7.464736700057983e-05, 9.75579023361206e-05, 0.00012046843767166138, 0.00014337897300720215, 0.00016628950834274292, 0.0001892000436782837, 0.00021211057901382446, 0.00023502111434936523, 0.000257931649684906, 0.0002808421850204468, 0.00030375272035598755, 0.0003266632556915283, 0.0003495737910270691, 0.00037248432636260986, 0.00039539486169815063, 0.0004183053970336914, 0.0004412159323692322, 0.00046412646770477295, 0.0004870370030403137, 0.0005099475383758545, 0.0005328580737113953, 0.000555768609046936, 0.0005786791443824768, 0.0006015896797180176, 0.0006245002150535583, 0.0006474107503890991, 0.0006703212857246399, 0.0006932318210601807, 0.0007161423563957214, 0.0007390528917312622, 0.000761963427066803, 0.0007848739624023438]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 9.0, 7.0, 11.0, 17.0, 25.0, 40.0, 53.0, 130.0, 396.0, 22311.0, 1023468.0, 1599.0, 214.0, 101.0, 60.0, 46.0, 20.0, 14.0, 9.0, 9.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.01800537109375, -0.017480134963989258, -0.016954898834228516, -0.016429662704467773, -0.01590442657470703, -0.015379190444946289, -0.014853954315185547, -0.014328718185424805, -0.013803482055664062, -0.01327824592590332, -0.012753009796142578, -0.012227773666381836, -0.011702537536621094, -0.011177301406860352, -0.01065206527709961, -0.010126829147338867, -0.009601593017578125, -0.009076356887817383, -0.00855112075805664, -0.008025884628295898, -0.007500648498535156, -0.006975412368774414, -0.006450176239013672, -0.00592494010925293, -0.0053997039794921875, -0.004874467849731445, -0.004349231719970703, -0.003823995590209961, -0.0032987594604492188, -0.0027735233306884766, -0.0022482872009277344, -0.0017230510711669922, -0.00119781494140625, -0.0006725788116455078, -0.00014734268188476562, 0.00037789344787597656, 0.0009031295776367188, 0.001428365707397461, 0.001953601837158203, 0.0024788379669189453, 0.0030040740966796875, 0.0035293102264404297, 0.004054546356201172, 0.004579782485961914, 0.005105018615722656, 0.0056302547454833984, 0.006155490875244141, 0.006680727005004883, 0.007205963134765625, 0.007731199264526367, 0.00825643539428711, 0.008781671524047852, 0.009306907653808594, 0.009832143783569336, 0.010357379913330078, 0.01088261604309082, 0.011407852172851562, 0.011933088302612305, 0.012458324432373047, 0.012983560562133789, 0.013508796691894531, 0.014034032821655273, 0.014559268951416016, 0.015084505081176758, 0.0156097412109375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 16.0, 156.0, 658.0, 160.0, 19.0, 3.0], "bins": [-0.004613654688000679, -0.004537419881671667, -0.004461185075342655, -0.004384950269013643, -0.004308715462684631, -0.004232480656355619, -0.0041562458500266075, -0.004080011043697596, -0.004003776237368584, -0.003927541431039572, -0.00385130662471056, -0.003775071818381548, -0.003698837012052536, -0.003622602205723524, -0.003546367399394512, -0.0034701325930655003, -0.0033938977867364883, -0.0033176629804074764, -0.0032414281740784645, -0.0031651933677494526, -0.0030889585614204407, -0.0030127237550914288, -0.002936488948762417, -0.002860254142433405, -0.002784019336104393, -0.002707784529775381, -0.002631549723446369, -0.0025553149171173573, -0.0024790801107883453, -0.0024028453044593334, -0.0023266104981303215, -0.0022503756918013096, -0.0021741408854722977, -0.0020979060791432858, -0.002021671272814274, -0.001945436466485262, -0.00186920166015625, -0.001792966853827238, -0.0017167320474982262, -0.0016404972411692142, -0.0015642623184248805, -0.0014880275120958686, -0.0014117927057668567, -0.0013355578994378448, -0.0012593230931088328, -0.001183088286779821, -0.001106853480450809, -0.001030618674121797, -0.0009543838677927852, -0.0008781490614637733, -0.0008019142551347613, -0.0007256794488057494, -0.0006494446424767375, -0.0005732098361477256, -0.0004969750298187137, -0.00042074022348970175, -0.00034450541716068983, -0.0002682706108316779, -0.000192035804502666, -0.00011580099817365408, -3.956619184464216e-05, 3.6668614484369755e-05, 0.00011290342081338167, 0.0001891382271423936, 0.0002653730334714055]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 9.0, 8.0, 17.0, 15.0, 17.0, 16.0, 12.0, 21.0, 20.0, 17.0, 25.0, 31.0, 37.0, 39.0, 36.0, 40.0, 38.0, 41.0, 44.0, 38.0, 28.0, 46.0, 37.0, 43.0, 44.0, 32.0, 36.0, 26.0, 20.0, 25.0, 22.0, 16.0, 10.0, 13.0, 19.0, 14.0, 7.0, 7.0, 6.0, 7.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00025153160095214844, -0.0002434970811009407, -0.00023546256124973297, -0.00022742804139852524, -0.0002193935215473175, -0.00021135900169610977, -0.00020332448184490204, -0.0001952899619936943, -0.00018725544214248657, -0.00017922092229127884, -0.0001711864024400711, -0.00016315188258886337, -0.00015511736273765564, -0.0001470828428864479, -0.00013904832303524017, -0.00013101380318403244, -0.0001229792833328247, -0.00011494476348161697, -0.00010691024363040924, -9.887572377920151e-05, -9.084120392799377e-05, -8.280668407678604e-05, -7.477216422557831e-05, -6.673764437437057e-05, -5.870312452316284e-05, -5.066860467195511e-05, -4.2634084820747375e-05, -3.459956496953964e-05, -2.656504511833191e-05, -1.8530525267124176e-05, -1.0496005415916443e-05, -2.4614855647087097e-06, 5.5730342864990234e-06, 1.3607554137706757e-05, 2.164207398891449e-05, 2.9676593840122223e-05, 3.7711113691329956e-05, 4.574563354253769e-05, 5.378015339374542e-05, 6.181467324495316e-05, 6.984919309616089e-05, 7.788371294736862e-05, 8.591823279857635e-05, 9.395275264978409e-05, 0.00010198727250099182, 0.00011002179235219955, 0.00011805631220340729, 0.00012609083205461502, 0.00013412535190582275, 0.0001421598717570305, 0.00015019439160823822, 0.00015822891145944595, 0.0001662634313106537, 0.00017429795116186142, 0.00018233247101306915, 0.00019036699086427689, 0.00019840151071548462, 0.00020643603056669235, 0.00021447055041790009, 0.00022250507026910782, 0.00023053959012031555, 0.00023857410997152328, 0.000246608629822731, 0.00025464314967393875, 0.0002626776695251465]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 13.0, 6.0, 17.0, 11.0, 18.0, 25.0, 21.0, 28.0, 25.0, 39.0, 30.0, 38.0, 29.0, 35.0, 33.0, 36.0, 40.0, 36.0, 50.0, 34.0, 37.0, 28.0, 42.0, 28.0, 31.0, 35.0, 29.0, 28.0, 21.0, 21.0, 18.0, 19.0, 11.0, 11.0, 14.0, 8.0, 4.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.97686767578125, -4.8092041015625, -4.64154052734375, -4.473876953125, -4.30621337890625, -4.1385498046875, -3.97088623046875, -3.80322265625, -3.63555908203125, -3.4678955078125, -3.30023193359375, -3.132568359375, -2.96490478515625, -2.7972412109375, -2.62957763671875, -2.4619140625, -2.29425048828125, -2.1265869140625, -1.95892333984375, -1.791259765625, -1.62359619140625, -1.4559326171875, -1.28826904296875, -1.12060546875, -0.95294189453125, -0.7852783203125, -0.61761474609375, -0.449951171875, -0.28228759765625, -0.1146240234375, 0.05303955078125, 0.220703125, 0.38836669921875, 0.5560302734375, 0.72369384765625, 0.891357421875, 1.05902099609375, 1.2266845703125, 1.39434814453125, 1.56201171875, 1.72967529296875, 1.8973388671875, 2.06500244140625, 2.232666015625, 2.40032958984375, 2.5679931640625, 2.73565673828125, 2.9033203125, 3.07098388671875, 3.2386474609375, 3.40631103515625, 3.573974609375, 3.74163818359375, 3.9093017578125, 4.07696533203125, 4.24462890625, 4.41229248046875, 4.5799560546875, 4.74761962890625, 4.915283203125, 5.08294677734375, 5.2506103515625, 5.41827392578125, 5.5859375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 2.0, 3.0, 9.0, 5.0, 11.0, 21.0, 30.0, 50.0, 85.0, 107.0, 219.0, 420.0, 855.0, 1874.0, 4212.0, 10889.0, 31505.0, 112851.0, 496300.0, 288961.0, 66624.0, 20438.0, 7220.0, 3031.0, 1347.0, 662.0, 357.0, 172.0, 115.0, 55.0, 39.0, 20.0, 20.0, 10.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.7059326171875, -11.325927734375, -10.9459228515625, -10.56591796875, -10.1859130859375, -9.805908203125, -9.4259033203125, -9.0458984375, -8.6658935546875, -8.285888671875, -7.9058837890625, -7.52587890625, -7.1458740234375, -6.765869140625, -6.3858642578125, -6.005859375, -5.6258544921875, -5.245849609375, -4.8658447265625, -4.48583984375, -4.1058349609375, -3.725830078125, -3.3458251953125, -2.9658203125, -2.5858154296875, -2.205810546875, -1.8258056640625, -1.44580078125, -1.0657958984375, -0.685791015625, -0.3057861328125, 0.07421875, 0.4542236328125, 0.834228515625, 1.2142333984375, 1.59423828125, 1.9742431640625, 2.354248046875, 2.7342529296875, 3.1142578125, 3.4942626953125, 3.874267578125, 4.2542724609375, 4.63427734375, 5.0142822265625, 5.394287109375, 5.7742919921875, 6.154296875, 6.5343017578125, 6.914306640625, 7.2943115234375, 7.67431640625, 8.0543212890625, 8.434326171875, 8.8143310546875, 9.1943359375, 9.5743408203125, 9.954345703125, 10.3343505859375, 10.71435546875, 11.0943603515625, 11.474365234375, 11.8543701171875, 12.234375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 6.0, 12.0, 2.0, 10.0, 11.0, 11.0, 12.0, 15.0, 24.0, 33.0, 43.0, 40.0, 57.0, 81.0, 102.0, 188.0, 363.0, 1406.0, 175.0, 105.0, 78.0, 49.0, 49.0, 38.0, 31.0, 23.0, 21.0, 18.0, 17.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.9375, -18.398193359375, -17.85888671875, -17.319580078125, -16.7802734375, -16.240966796875, -15.70166015625, -15.162353515625, -14.623046875, -14.083740234375, -13.54443359375, -13.005126953125, -12.4658203125, -11.926513671875, -11.38720703125, -10.847900390625, -10.30859375, -9.769287109375, -9.22998046875, -8.690673828125, -8.1513671875, -7.612060546875, -7.07275390625, -6.533447265625, -5.994140625, -5.454833984375, -4.91552734375, -4.376220703125, -3.8369140625, -3.297607421875, -2.75830078125, -2.218994140625, -1.6796875, -1.140380859375, -0.60107421875, -0.061767578125, 0.4775390625, 1.016845703125, 1.55615234375, 2.095458984375, 2.634765625, 3.174072265625, 3.71337890625, 4.252685546875, 4.7919921875, 5.331298828125, 5.87060546875, 6.409912109375, 6.94921875, 7.488525390625, 8.02783203125, 8.567138671875, 9.1064453125, 9.645751953125, 10.18505859375, 10.724365234375, 11.263671875, 11.802978515625, 12.34228515625, 12.881591796875, 13.4208984375, 13.960205078125, 14.49951171875, 15.038818359375, 15.578125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 6.0, 7.0, 11.0, 14.0, 21.0, 30.0, 38.0, 72.0, 110.0, 159.0, 227.0, 388.0, 694.0, 1621.0, 5860.0, 1483335.0, 1643553.0, 6190.0, 1577.0, 687.0, 400.0, 239.0, 180.0, 91.0, 69.0, 42.0, 30.0, 21.0, 11.0, 11.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.53125, -32.28955078125, -31.0478515625, -29.80615234375, -28.564453125, -27.32275390625, -26.0810546875, -24.83935546875, -23.59765625, -22.35595703125, -21.1142578125, -19.87255859375, -18.630859375, -17.38916015625, -16.1474609375, -14.90576171875, -13.6640625, -12.42236328125, -11.1806640625, -9.93896484375, -8.697265625, -7.45556640625, -6.2138671875, -4.97216796875, -3.73046875, -2.48876953125, -1.2470703125, -0.00537109375, 1.236328125, 2.47802734375, 3.7197265625, 4.96142578125, 6.203125, 7.44482421875, 8.6865234375, 9.92822265625, 11.169921875, 12.41162109375, 13.6533203125, 14.89501953125, 16.13671875, 17.37841796875, 18.6201171875, 19.86181640625, 21.103515625, 22.34521484375, 23.5869140625, 24.82861328125, 26.0703125, 27.31201171875, 28.5537109375, 29.79541015625, 31.037109375, 32.27880859375, 33.5205078125, 34.76220703125, 36.00390625, 37.24560546875, 38.4873046875, 39.72900390625, 40.970703125, 42.21240234375, 43.4541015625, 44.69580078125, 45.9375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 22.0, 171.0, 518.0, 266.0, 31.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.76693725585938, -214.76980590820312, -207.77267456054688, -200.7755584716797, -193.77842712402344, -186.7812957763672, -179.78416442871094, -172.78704833984375, -165.7899169921875, -158.79278564453125, -151.795654296875, -144.7985382080078, -137.80140686035156, -130.8042755126953, -123.80714416503906, -116.81002044677734, -109.8128890991211, -102.81575775146484, -95.81863403320312, -88.82150268554688, -81.82437896728516, -74.8272476196289, -67.83012390136719, -60.83299255371094, -53.83586502075195, -46.83873748779297, -39.841609954833984, -32.844482421875, -25.847352981567383, -18.850223541259766, -11.853096008300781, -4.855968475341797, 2.1411590576171875, 9.138286590576172, 16.135414123535156, 23.132543563842773, 30.129671096801758, 37.126800537109375, 44.12392807006836, 51.121055603027344, 58.11818313598633, 65.11531066894531, 72.11244201660156, 79.10956573486328, 86.10669708251953, 93.10382080078125, 100.1009521484375, 107.09808349609375, 114.09520721435547, 121.09233856201172, 128.08946228027344, 135.0865936279297, 142.08372497558594, 149.08084106445312, 156.07797241210938, 163.07510375976562, 170.07223510742188, 177.06936645507812, 184.06649780273438, 191.06361389160156, 198.0607452392578, 205.05787658691406, 212.0550079345703, 219.0521240234375, 226.04925537109375]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 4.0, 12.0, 18.0, 6.0, 17.0, 20.0, 15.0, 18.0, 23.0, 21.0, 26.0, 37.0, 30.0, 34.0, 30.0, 41.0, 40.0, 42.0, 29.0, 49.0, 42.0, 49.0, 40.0, 37.0, 44.0, 34.0, 25.0, 31.0, 29.0, 20.0, 23.0, 18.0, 20.0, 12.0, 11.0, 8.0, 5.0, 9.0, 5.0, 5.0, 1.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.837921142578125, -37.444236755371094, -36.05055236816406, -34.65686798095703, -33.263179779052734, -31.869495391845703, -30.475811004638672, -29.08212661743164, -27.688440322875977, -26.294755935668945, -24.90106964111328, -23.50738525390625, -22.11370086669922, -20.720014572143555, -19.326330184936523, -17.93264389038086, -16.538959503173828, -15.14527416229248, -13.751588821411133, -12.357904434204102, -10.964219093322754, -9.570533752441406, -8.176849365234375, -6.783164024353027, -5.38947868347168, -3.995793581008911, -2.6021084785461426, -1.2084236145019531, 0.18526172637939453, 1.5789470672607422, 2.9726314544677734, 4.366316795349121, 5.760002136230469, 7.153687477111816, 8.547372817993164, 9.941057205200195, 11.334742546081543, 12.72842788696289, 14.122112274169922, 15.51579761505127, 16.909482955932617, 18.30316734313965, 19.696853637695312, 21.090538024902344, 22.484222412109375, 23.87790870666504, 25.27159309387207, 26.665279388427734, 28.058963775634766, 29.452648162841797, 30.84633445739746, 32.240020751953125, 33.633705139160156, 35.02738952636719, 36.42107391357422, 37.81475830078125, 39.20844268798828, 40.60212707519531, 41.995811462402344, 43.389495849609375, 44.78318405151367, 46.1768684387207, 47.570552825927734, 48.964237213134766, 50.35792541503906]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 7.0, 7.0, 12.0, 16.0, 17.0, 14.0, 20.0, 22.0, 20.0, 28.0, 33.0, 32.0, 36.0, 32.0, 32.0, 32.0, 39.0, 41.0, 32.0, 40.0, 38.0, 34.0, 38.0, 43.0, 33.0, 35.0, 32.0, 31.0, 25.0, 20.0, 22.0, 11.0, 19.0, 15.0, 13.0, 15.0, 8.0, 10.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.484375, -5.31842041015625, -5.1524658203125, -4.98651123046875, -4.820556640625, -4.65460205078125, -4.4886474609375, -4.32269287109375, -4.15673828125, -3.99078369140625, -3.8248291015625, -3.65887451171875, -3.492919921875, -3.32696533203125, -3.1610107421875, -2.99505615234375, -2.8291015625, -2.66314697265625, -2.4971923828125, -2.33123779296875, -2.165283203125, -1.99932861328125, -1.8333740234375, -1.66741943359375, -1.50146484375, -1.33551025390625, -1.1695556640625, -1.00360107421875, -0.837646484375, -0.67169189453125, -0.5057373046875, -0.33978271484375, -0.173828125, -0.00787353515625, 0.1580810546875, 0.32403564453125, 0.489990234375, 0.65594482421875, 0.8218994140625, 0.98785400390625, 1.15380859375, 1.31976318359375, 1.4857177734375, 1.65167236328125, 1.817626953125, 1.98358154296875, 2.1495361328125, 2.31549072265625, 2.4814453125, 2.64739990234375, 2.8133544921875, 2.97930908203125, 3.145263671875, 3.31121826171875, 3.4771728515625, 3.64312744140625, 3.80908203125, 3.97503662109375, 4.1409912109375, 4.30694580078125, 4.472900390625, 4.63885498046875, 4.8048095703125, 4.97076416015625, 5.13671875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 9.0, 11.0, 14.0, 11.0, 33.0, 30.0, 40.0, 37.0, 68.0, 110.0, 131.0, 166.0, 223.0, 320.0, 453.0, 660.0, 1038.0, 1605.0, 2715.0, 4971.0, 9889.0, 26003.0, 141450.0, 1081529.0, 2331394.0, 495122.0, 61913.0, 16687.0, 7325.0, 3798.0, 2206.0, 1312.0, 894.0, 604.0, 383.0, 302.0, 205.0, 174.0, 103.0, 83.0, 63.0, 57.0, 39.0, 25.0, 26.0, 16.0, 9.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.7879638671875, -10.419677734375, -10.0513916015625, -9.68310546875, -9.3148193359375, -8.946533203125, -8.5782470703125, -8.2099609375, -7.8416748046875, -7.473388671875, -7.1051025390625, -6.73681640625, -6.3685302734375, -6.000244140625, -5.6319580078125, -5.263671875, -4.8953857421875, -4.527099609375, -4.1588134765625, -3.79052734375, -3.4222412109375, -3.053955078125, -2.6856689453125, -2.3173828125, -1.9490966796875, -1.580810546875, -1.2125244140625, -0.84423828125, -0.4759521484375, -0.107666015625, 0.2606201171875, 0.62890625, 0.9971923828125, 1.365478515625, 1.7337646484375, 2.10205078125, 2.4703369140625, 2.838623046875, 3.2069091796875, 3.5751953125, 3.9434814453125, 4.311767578125, 4.6800537109375, 5.04833984375, 5.4166259765625, 5.784912109375, 6.1531982421875, 6.521484375, 6.8897705078125, 7.258056640625, 7.6263427734375, 7.99462890625, 8.3629150390625, 8.731201171875, 9.0994873046875, 9.4677734375, 9.8360595703125, 10.204345703125, 10.5726318359375, 10.94091796875, 11.3092041015625, 11.677490234375, 12.0457763671875, 12.4140625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 9.0, 21.0, 38.0, 49.0, 90.0, 127.0, 217.0, 340.0, 562.0, 852.0, 658.0, 433.0, 252.0, 156.0, 88.0, 63.0, 31.0, 22.0, 21.0, 13.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.4765625, -9.0594482421875, -8.642333984375, -8.2252197265625, -7.80810546875, -7.3909912109375, -6.973876953125, -6.5567626953125, -6.1396484375, -5.7225341796875, -5.305419921875, -4.8883056640625, -4.47119140625, -4.0540771484375, -3.636962890625, -3.2198486328125, -2.802734375, -2.3856201171875, -1.968505859375, -1.5513916015625, -1.13427734375, -0.7171630859375, -0.300048828125, 0.1170654296875, 0.5341796875, 0.9512939453125, 1.368408203125, 1.7855224609375, 2.20263671875, 2.6197509765625, 3.036865234375, 3.4539794921875, 3.87109375, 4.2882080078125, 4.705322265625, 5.1224365234375, 5.53955078125, 5.9566650390625, 6.373779296875, 6.7908935546875, 7.2080078125, 7.6251220703125, 8.042236328125, 8.4593505859375, 8.87646484375, 9.2935791015625, 9.710693359375, 10.1278076171875, 10.544921875, 10.9620361328125, 11.379150390625, 11.7962646484375, 12.21337890625, 12.6304931640625, 13.047607421875, 13.4647216796875, 13.8818359375, 14.2989501953125, 14.716064453125, 15.1331787109375, 15.55029296875, 15.9674072265625, 16.384521484375, 16.8016357421875, 17.21875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 12.0, 9.0, 28.0, 31.0, 50.0, 57.0, 114.0, 162.0, 289.0, 526.0, 1436.0, 4722.0, 28356.0, 707687.0, 3349882.0, 87461.0, 9578.0, 2232.0, 753.0, 355.0, 199.0, 125.0, 75.0, 39.0, 29.0, 19.0, 15.0, 10.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -19.9091796875, -19.177734375, -18.4462890625, -17.71484375, -16.9833984375, -16.251953125, -15.5205078125, -14.7890625, -14.0576171875, -13.326171875, -12.5947265625, -11.86328125, -11.1318359375, -10.400390625, -9.6689453125, -8.9375, -8.2060546875, -7.474609375, -6.7431640625, -6.01171875, -5.2802734375, -4.548828125, -3.8173828125, -3.0859375, -2.3544921875, -1.623046875, -0.8916015625, -0.16015625, 0.5712890625, 1.302734375, 2.0341796875, 2.765625, 3.4970703125, 4.228515625, 4.9599609375, 5.69140625, 6.4228515625, 7.154296875, 7.8857421875, 8.6171875, 9.3486328125, 10.080078125, 10.8115234375, 11.54296875, 12.2744140625, 13.005859375, 13.7373046875, 14.46875, 15.2001953125, 15.931640625, 16.6630859375, 17.39453125, 18.1259765625, 18.857421875, 19.5888671875, 20.3203125, 21.0517578125, 21.783203125, 22.5146484375, 23.24609375, 23.9775390625, 24.708984375, 25.4404296875, 26.171875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 70.0, 677.0, 261.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-499.9446105957031, -488.7540588378906, -477.5635070800781, -466.3729553222656, -455.1824035644531, -443.9918518066406, -432.8013000488281, -421.6107482910156, -410.4201965332031, -399.2296447753906, -388.0390930175781, -376.8485412597656, -365.6579895019531, -354.4674377441406, -343.2768859863281, -332.0863342285156, -320.895751953125, -309.7052001953125, -298.5146484375, -287.3240966796875, -276.133544921875, -264.9429931640625, -253.75244140625, -242.5618896484375, -231.371337890625, -220.1807861328125, -208.990234375, -197.7996826171875, -186.609130859375, -175.4185791015625, -164.22802734375, -153.0374755859375, -141.84693908691406, -130.65638732910156, -119.46583557128906, -108.27528381347656, -97.08473205566406, -85.89418029785156, -74.70362091064453, -63.51306915283203, -52.32251739501953, -41.13196563720703, -29.9414119720459, -18.750858306884766, -7.560306549072266, 3.6302452087402344, 14.82080078125, 26.0113525390625, 37.201904296875, 48.3924560546875, 59.5830078125, 70.7735595703125, 81.964111328125, 93.1546630859375, 104.34522247314453, 115.53577423095703, 126.72632598876953, 137.91688537597656, 149.10743713378906, 160.29798889160156, 171.48854064941406, 182.67909240722656, 193.86964416503906, 205.06019592285156, 216.25074768066406]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 15.0, 13.0, 12.0, 14.0, 23.0, 24.0, 22.0, 31.0, 33.0, 42.0, 33.0, 42.0, 45.0, 49.0, 52.0, 53.0, 61.0, 41.0, 41.0, 39.0, 36.0, 49.0, 38.0, 35.0, 16.0, 18.0, 17.0, 19.0, 16.0, 14.0, 9.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-48.039894104003906, -46.751075744628906, -45.462257385253906, -44.173439025878906, -42.884620666503906, -41.595802307128906, -40.306983947753906, -39.018165588378906, -37.729347229003906, -36.440528869628906, -35.151710510253906, -33.862892150878906, -32.574073791503906, -31.285255432128906, -29.996435165405273, -28.707616806030273, -27.41879653930664, -26.12997817993164, -24.84115982055664, -23.55234146118164, -22.26352310180664, -20.97470474243164, -19.685884475708008, -18.397066116333008, -17.108247756958008, -15.819429397583008, -14.530611038208008, -13.241791725158691, -11.952973365783691, -10.664155006408691, -9.375335693359375, -8.086517333984375, -6.797698974609375, -5.508880615234375, -4.220061779022217, -2.9312431812286377, -1.6424245834350586, -0.3536062240600586, 0.9352126121520996, 2.224031448364258, 3.512849807739258, 4.801668167114258, 6.090487003326416, 7.379305839538574, 8.668124198913574, 9.956942558288574, 11.24576187133789, 12.53458023071289, 13.82339859008789, 15.11221694946289, 16.40103530883789, 17.68985366821289, 18.97867202758789, 20.26749038696289, 21.556310653686523, 22.845129013061523, 24.133947372436523, 25.422765731811523, 26.711584091186523, 28.000402450561523, 29.289222717285156, 30.578041076660156, 31.866859436035156, 33.155677795410156, 34.444496154785156]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 4.0, 8.0, 10.0, 6.0, 8.0, 14.0, 20.0, 12.0, 23.0, 21.0, 30.0, 24.0, 34.0, 35.0, 24.0, 37.0, 39.0, 32.0, 38.0, 50.0, 38.0, 36.0, 37.0, 41.0, 38.0, 33.0, 25.0, 40.0, 27.0, 28.0, 29.0, 16.0, 10.0, 20.0, 11.0, 10.0, 15.0, 11.0, 13.0, 10.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.34375, -5.1767578125, -5.009765625, -4.8427734375, -4.67578125, -4.5087890625, -4.341796875, -4.1748046875, -4.0078125, -3.8408203125, -3.673828125, -3.5068359375, -3.33984375, -3.1728515625, -3.005859375, -2.8388671875, -2.671875, -2.5048828125, -2.337890625, -2.1708984375, -2.00390625, -1.8369140625, -1.669921875, -1.5029296875, -1.3359375, -1.1689453125, -1.001953125, -0.8349609375, -0.66796875, -0.5009765625, -0.333984375, -0.1669921875, 0.0, 0.1669921875, 0.333984375, 0.5009765625, 0.66796875, 0.8349609375, 1.001953125, 1.1689453125, 1.3359375, 1.5029296875, 1.669921875, 1.8369140625, 2.00390625, 2.1708984375, 2.337890625, 2.5048828125, 2.671875, 2.8388671875, 3.005859375, 3.1728515625, 3.33984375, 3.5068359375, 3.673828125, 3.8408203125, 4.0078125, 4.1748046875, 4.341796875, 4.5087890625, 4.67578125, 4.8427734375, 5.009765625, 5.1767578125, 5.34375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 11.0, 9.0, 14.0, 25.0, 28.0, 64.0, 67.0, 120.0, 152.0, 276.0, 414.0, 551.0, 780.0, 1175.0, 1751.0, 2468.0, 3739.0, 5378.0, 7953.0, 11753.0, 17426.0, 26033.0, 41394.0, 68597.0, 126762.0, 241114.0, 211937.0, 108364.0, 60361.0, 37100.0, 23621.0, 15783.0, 10468.0, 7232.0, 4957.0, 3405.0, 2302.0, 1638.0, 1070.0, 687.0, 517.0, 323.0, 224.0, 151.0, 127.0, 89.0, 52.0, 27.0, 30.0, 16.0, 15.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1663818359375, -0.16132164001464844, -0.15626144409179688, -0.1512012481689453, -0.14614105224609375, -0.1410808563232422, -0.13602066040039062, -0.13096046447753906, -0.1259002685546875, -0.12084007263183594, -0.11577987670898438, -0.11071968078613281, -0.10565948486328125, -0.10059928894042969, -0.09553909301757812, -0.09047889709472656, -0.085418701171875, -0.08035850524902344, -0.07529830932617188, -0.07023811340332031, -0.06517791748046875, -0.06011772155761719, -0.055057525634765625, -0.04999732971191406, -0.0449371337890625, -0.03987693786621094, -0.034816741943359375, -0.029756546020507812, -0.02469635009765625, -0.019636154174804688, -0.014575958251953125, -0.009515762329101562, -0.00445556640625, 0.0006046295166015625, 0.005664825439453125, 0.010725021362304688, 0.01578521728515625, 0.020845413208007812, 0.025905609130859375, 0.030965805053710938, 0.0360260009765625, 0.04108619689941406, 0.046146392822265625, 0.05120658874511719, 0.05626678466796875, 0.06132698059082031, 0.06638717651367188, 0.07144737243652344, 0.076507568359375, 0.08156776428222656, 0.08662796020507812, 0.09168815612792969, 0.09674835205078125, 0.10180854797363281, 0.10686874389648438, 0.11192893981933594, 0.1169891357421875, 0.12204933166503906, 0.12710952758789062, 0.1321697235107422, 0.13722991943359375, 0.1422901153564453, 0.14735031127929688, 0.15241050720214844, 0.157470703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 0.0, 5.0, 6.0, 8.0, 5.0, 13.0, 10.0, 19.0, 19.0, 19.0, 20.0, 20.0, 19.0, 29.0, 32.0, 37.0, 36.0, 36.0, 35.0, 39.0, 38.0, 29.0, 1062.0, 37.0, 26.0, 56.0, 44.0, 48.0, 35.0, 32.0, 35.0, 13.0, 31.0, 24.0, 13.0, 14.0, 12.0, 17.0, 14.0, 4.0, 12.0, 5.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.87109375, -4.71942138671875, -4.5677490234375, -4.41607666015625, -4.264404296875, -4.11273193359375, -3.9610595703125, -3.80938720703125, -3.65771484375, -3.50604248046875, -3.3543701171875, -3.20269775390625, -3.051025390625, -2.89935302734375, -2.7476806640625, -2.59600830078125, -2.4443359375, -2.29266357421875, -2.1409912109375, -1.98931884765625, -1.837646484375, -1.68597412109375, -1.5343017578125, -1.38262939453125, -1.23095703125, -1.07928466796875, -0.9276123046875, -0.77593994140625, -0.624267578125, -0.47259521484375, -0.3209228515625, -0.16925048828125, -0.017578125, 0.13409423828125, 0.2857666015625, 0.43743896484375, 0.589111328125, 0.74078369140625, 0.8924560546875, 1.04412841796875, 1.19580078125, 1.34747314453125, 1.4991455078125, 1.65081787109375, 1.802490234375, 1.95416259765625, 2.1058349609375, 2.25750732421875, 2.4091796875, 2.56085205078125, 2.7125244140625, 2.86419677734375, 3.015869140625, 3.16754150390625, 3.3192138671875, 3.47088623046875, 3.62255859375, 3.77423095703125, 3.9259033203125, 4.07757568359375, 4.229248046875, 4.38092041015625, 4.5325927734375, 4.68426513671875, 4.8359375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 2.0, 12.0, 17.0, 9.0, 28.0, 28.0, 57.0, 79.0, 106.0, 177.0, 251.0, 370.0, 546.0, 841.0, 1126.0, 1674.0, 2428.0, 3455.0, 5184.0, 7621.0, 11771.0, 18063.0, 28643.0, 47428.0, 82636.0, 152420.0, 1301055.0, 183555.0, 98100.0, 55093.0, 33206.0, 20706.0, 13384.0, 8779.0, 5956.0, 3773.0, 2741.0, 1883.0, 1202.0, 804.0, 588.0, 405.0, 289.0, 209.0, 125.0, 106.0, 70.0, 48.0, 27.0, 25.0, 13.0, 10.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.085693359375, -0.08289718627929688, -0.08010101318359375, -0.07730484008789062, -0.0745086669921875, -0.07171249389648438, -0.06891632080078125, -0.06612014770507812, -0.063323974609375, -0.060527801513671875, -0.05773162841796875, -0.054935455322265625, -0.0521392822265625, -0.049343109130859375, -0.04654693603515625, -0.043750762939453125, -0.04095458984375, -0.038158416748046875, -0.03536224365234375, -0.032566070556640625, -0.0297698974609375, -0.026973724365234375, -0.02417755126953125, -0.021381378173828125, -0.018585205078125, -0.015789031982421875, -0.01299285888671875, -0.010196685791015625, -0.0074005126953125, -0.004604339599609375, -0.00180816650390625, 0.000988006591796875, 0.0037841796875, 0.006580352783203125, 0.00937652587890625, 0.012172698974609375, 0.0149688720703125, 0.017765045166015625, 0.02056121826171875, 0.023357391357421875, 0.026153564453125, 0.028949737548828125, 0.03174591064453125, 0.034542083740234375, 0.0373382568359375, 0.040134429931640625, 0.04293060302734375, 0.045726776123046875, 0.04852294921875, 0.051319122314453125, 0.05411529541015625, 0.056911468505859375, 0.0597076416015625, 0.06250381469726562, 0.06529998779296875, 0.06809616088867188, 0.070892333984375, 0.07368850708007812, 0.07648468017578125, 0.07928085327148438, 0.0820770263671875, 0.08487319946289062, 0.08766937255859375, 0.09046554565429688, 0.09326171875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 5.0, 2.0, 7.0, 11.0, 15.0, 20.0, 22.0, 34.0, 57.0, 89.0, 118.0, 166.0, 144.0, 81.0, 57.0, 41.0, 30.0, 28.0, 15.0, 13.0, 7.0, 2.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011606216430664062, -0.001123964786529541, -0.0010873079299926758, -0.0010506510734558105, -0.0010139942169189453, -0.00097733736038208, -0.0009406805038452148, -0.0009040236473083496, -0.0008673667907714844, -0.0008307099342346191, -0.0007940530776977539, -0.0007573962211608887, -0.0007207393646240234, -0.0006840825080871582, -0.000647425651550293, -0.0006107687950134277, -0.0005741119384765625, -0.0005374550819396973, -0.000500798225402832, -0.0004641413688659668, -0.00042748451232910156, -0.00039082765579223633, -0.0003541707992553711, -0.00031751394271850586, -0.0002808570861816406, -0.0002442002296447754, -0.00020754337310791016, -0.00017088651657104492, -0.0001342296600341797, -9.757280349731445e-05, -6.091594696044922e-05, -2.4259090423583984e-05, 1.239776611328125e-05, 4.9054622650146484e-05, 8.571147918701172e-05, 0.00012236833572387695, 0.0001590251922607422, 0.00019568204879760742, 0.00023233890533447266, 0.0002689957618713379, 0.0003056526184082031, 0.00034230947494506836, 0.0003789663314819336, 0.00041562318801879883, 0.00045228004455566406, 0.0004889369010925293, 0.0005255937576293945, 0.0005622506141662598, 0.000598907470703125, 0.0006355643272399902, 0.0006722211837768555, 0.0007088780403137207, 0.0007455348968505859, 0.0007821917533874512, 0.0008188486099243164, 0.0008555054664611816, 0.0008921623229980469, 0.0009288191795349121, 0.0009654760360717773, 0.0010021328926086426, 0.0010387897491455078, 0.001075446605682373, 0.0011121034622192383, 0.0011487603187561035, 0.0011854171752929688]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 2.0, 7.0, 6.0, 19.0, 21.0, 35.0, 44.0, 47.0, 115.0, 186.0, 479.0, 10880.0, 1033895.0, 1994.0, 368.0, 181.0, 75.0, 53.0, 38.0, 27.0, 16.0, 13.0, 10.0, 3.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023681640625, -0.022949695587158203, -0.022217750549316406, -0.02148580551147461, -0.020753860473632812, -0.020021915435791016, -0.01928997039794922, -0.018558025360107422, -0.017826080322265625, -0.017094135284423828, -0.01636219024658203, -0.015630245208740234, -0.014898300170898438, -0.01416635513305664, -0.013434410095214844, -0.012702465057373047, -0.01197052001953125, -0.011238574981689453, -0.010506629943847656, -0.00977468490600586, -0.009042739868164062, -0.008310794830322266, -0.007578849792480469, -0.006846904754638672, -0.006114959716796875, -0.005383014678955078, -0.004651069641113281, -0.003919124603271484, -0.0031871795654296875, -0.0024552345275878906, -0.0017232894897460938, -0.0009913444519042969, -0.0002593994140625, 0.0004725456237792969, 0.0012044906616210938, 0.0019364356994628906, 0.0026683807373046875, 0.0034003257751464844, 0.004132270812988281, 0.004864215850830078, 0.005596160888671875, 0.006328105926513672, 0.007060050964355469, 0.007791996002197266, 0.008523941040039062, 0.00925588607788086, 0.009987831115722656, 0.010719776153564453, 0.01145172119140625, 0.012183666229248047, 0.012915611267089844, 0.01364755630493164, 0.014379501342773438, 0.015111446380615234, 0.01584339141845703, 0.016575336456298828, 0.017307281494140625, 0.018039226531982422, 0.01877117156982422, 0.019503116607666016, 0.020235061645507812, 0.02096700668334961, 0.021698951721191406, 0.022430896759033203, 0.023162841796875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 67.0, 396.0, 436.0, 77.0, 19.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002718091243878007, -0.0026244448963552713, -0.0025307987816631794, -0.002437152434140444, -0.002343506319448352, -0.0022498599719256163, -0.0021562138572335243, -0.0020625675097107887, -0.001968921162188053, -0.0018752749310806394, -0.0017816286999732256, -0.00168798235245049, -0.001594336237758398, -0.0015006898902356625, -0.0014070436591282487, -0.001313397428020835, -0.001219751313328743, -0.0011261050822213292, -0.0010324588511139154, -0.0009388125617988408, -0.000845166330691427, -0.0007515200995840132, -0.0006578738102689385, -0.0005642275791615248, -0.000470581348054111, -0.00037693511694669724, -0.000283288856735453, -0.00018964259652420878, -9.599636541679502e-05, -2.3501343093812466e-06, 9.129615500569344e-05, 0.0001849423861131072, 0.000278588617220521, 0.00037223484832793474, 0.00046588110853917897, 0.0005595273687504232, 0.000653173599857837, 0.0007468198309652507, 0.0008404661202803254, 0.0009341123513877392, 0.001027758582495153, 0.0011214048136025667, 0.0012150510447099805, 0.0013086972758173943, 0.0014023436233401299, 0.0014959897380322218, 0.0015896360855549574, 0.0016832823166623712, 0.001776928547769785, 0.0018705747788771987, 0.0019642210099846125, 0.002057867357507348, 0.00215151347219944, 0.0022451598197221756, 0.002338806167244911, 0.002432452281937003, 0.002526098396629095, 0.0026197447441518307, 0.0027133908588439226, 0.002807037206366658, 0.00290068332105875, 0.0029943296685814857, 0.0030879760161042213, 0.0031816221307963133, 0.003275268478319049]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 13.0, 13.0, 11.0, 19.0, 10.0, 23.0, 12.0, 18.0, 18.0, 29.0, 36.0, 40.0, 32.0, 34.0, 36.0, 36.0, 39.0, 42.0, 33.0, 34.0, 40.0, 37.0, 43.0, 37.0, 29.0, 34.0, 34.0, 32.0, 25.0, 24.0, 21.0, 24.0, 11.0, 16.0, 14.0, 7.0, 9.0, 7.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005884170532226562, -0.0005696052685379982, -0.0005507934838533401, -0.0005319816991686821, -0.000513169914484024, -0.000494358129799366, -0.00047554634511470795, -0.0004567345604300499, -0.00043792277574539185, -0.0004191109910607338, -0.00040029920637607574, -0.0003814874216914177, -0.00036267563700675964, -0.0003438638523221016, -0.00032505206763744354, -0.0003062402829527855, -0.00028742849826812744, -0.0002686167135834694, -0.00024980492889881134, -0.0002309931442141533, -0.00021218135952949524, -0.0001933695748448372, -0.00017455779016017914, -0.0001557460054755211, -0.00013693422079086304, -0.00011812243610620499, -9.931065142154694e-05, -8.049886673688889e-05, -6.168708205223083e-05, -4.2875297367572784e-05, -2.4063512682914734e-05, -5.251727998256683e-06, 1.3560056686401367e-05, 3.237184137105942e-05, 5.118362605571747e-05, 6.999541074037552e-05, 8.880719542503357e-05, 0.00010761898010969162, 0.00012643076479434967, 0.00014524254947900772, 0.00016405433416366577, 0.00018286611884832382, 0.00020167790353298187, 0.00022048968821763992, 0.00023930147290229797, 0.000258113257586956, 0.0002769250422716141, 0.0002957368269562721, 0.0003145486116409302, 0.0003333603963255882, 0.0003521721810102463, 0.00037098396569490433, 0.0003897957503795624, 0.00040860753506422043, 0.0004274193197488785, 0.00044623110443353653, 0.0004650428891181946, 0.00048385467380285263, 0.0005026664584875107, 0.0005214782431721687, 0.0005402900278568268, 0.0005591018125414848, 0.0005779135972261429, 0.0005967253819108009, 0.000615537166595459]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 4.0, 8.0, 10.0, 6.0, 8.0, 14.0, 20.0, 12.0, 23.0, 21.0, 30.0, 24.0, 34.0, 35.0, 24.0, 37.0, 39.0, 32.0, 38.0, 50.0, 38.0, 36.0, 37.0, 41.0, 38.0, 33.0, 25.0, 40.0, 27.0, 28.0, 29.0, 15.0, 11.0, 20.0, 11.0, 10.0, 15.0, 11.0, 13.0, 10.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.34375, -5.1767578125, -5.009765625, -4.8427734375, -4.67578125, -4.5087890625, -4.341796875, -4.1748046875, -4.0078125, -3.8408203125, -3.673828125, -3.5068359375, -3.33984375, -3.1728515625, -3.005859375, -2.8388671875, -2.671875, -2.5048828125, -2.337890625, -2.1708984375, -2.00390625, -1.8369140625, -1.669921875, -1.5029296875, -1.3359375, -1.1689453125, -1.001953125, -0.8349609375, -0.66796875, -0.5009765625, -0.333984375, -0.1669921875, 0.0, 0.1669921875, 0.333984375, 0.5009765625, 0.66796875, 0.8349609375, 1.001953125, 1.1689453125, 1.3359375, 1.5029296875, 1.669921875, 1.8369140625, 2.00390625, 2.1708984375, 2.337890625, 2.5048828125, 2.671875, 2.8388671875, 3.005859375, 3.1728515625, 3.33984375, 3.5068359375, 3.673828125, 3.8408203125, 4.0078125, 4.1748046875, 4.341796875, 4.5087890625, 4.67578125, 4.8427734375, 5.009765625, 5.1767578125, 5.34375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 10.0, 13.0, 20.0, 25.0, 22.0, 35.0, 72.0, 71.0, 101.0, 153.0, 202.0, 293.0, 401.0, 566.0, 906.0, 1496.0, 2390.0, 4314.0, 7759.0, 14504.0, 27194.0, 53712.0, 106715.0, 209371.0, 276948.0, 166821.0, 83728.0, 41892.0, 21580.0, 11539.0, 6337.0, 3513.0, 2009.0, 1283.0, 826.0, 485.0, 370.0, 259.0, 186.0, 133.0, 84.0, 64.0, 41.0, 28.0, 23.0, 16.0, 15.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.2734375, -5.11029052734375, -4.9471435546875, -4.78399658203125, -4.620849609375, -4.45770263671875, -4.2945556640625, -4.13140869140625, -3.96826171875, -3.80511474609375, -3.6419677734375, -3.47882080078125, -3.315673828125, -3.15252685546875, -2.9893798828125, -2.82623291015625, -2.6630859375, -2.49993896484375, -2.3367919921875, -2.17364501953125, -2.010498046875, -1.84735107421875, -1.6842041015625, -1.52105712890625, -1.35791015625, -1.19476318359375, -1.0316162109375, -0.86846923828125, -0.705322265625, -0.54217529296875, -0.3790283203125, -0.21588134765625, -0.052734375, 0.11041259765625, 0.2735595703125, 0.43670654296875, 0.599853515625, 0.76300048828125, 0.9261474609375, 1.08929443359375, 1.25244140625, 1.41558837890625, 1.5787353515625, 1.74188232421875, 1.905029296875, 2.06817626953125, 2.2313232421875, 2.39447021484375, 2.5576171875, 2.72076416015625, 2.8839111328125, 3.04705810546875, 3.210205078125, 3.37335205078125, 3.5364990234375, 3.69964599609375, 3.86279296875, 4.02593994140625, 4.1890869140625, 4.35223388671875, 4.515380859375, 4.67852783203125, 4.8416748046875, 5.00482177734375, 5.16796875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 7.0, 4.0, 9.0, 11.0, 7.0, 12.0, 25.0, 19.0, 30.0, 33.0, 51.0, 58.0, 78.0, 79.0, 149.0, 299.0, 1400.0, 267.0, 140.0, 77.0, 56.0, 50.0, 41.0, 25.0, 26.0, 24.0, 15.0, 13.0, 9.0, 16.0, 7.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.3868408203125, -12.812744140625, -12.2386474609375, -11.66455078125, -11.0904541015625, -10.516357421875, -9.9422607421875, -9.3681640625, -8.7940673828125, -8.219970703125, -7.6458740234375, -7.07177734375, -6.4976806640625, -5.923583984375, -5.3494873046875, -4.775390625, -4.2012939453125, -3.627197265625, -3.0531005859375, -2.47900390625, -1.9049072265625, -1.330810546875, -0.7567138671875, -0.1826171875, 0.3914794921875, 0.965576171875, 1.5396728515625, 2.11376953125, 2.6878662109375, 3.261962890625, 3.8360595703125, 4.41015625, 4.9842529296875, 5.558349609375, 6.1324462890625, 6.70654296875, 7.2806396484375, 7.854736328125, 8.4288330078125, 9.0029296875, 9.5770263671875, 10.151123046875, 10.7252197265625, 11.29931640625, 11.8734130859375, 12.447509765625, 13.0216064453125, 13.595703125, 14.1697998046875, 14.743896484375, 15.3179931640625, 15.89208984375, 16.4661865234375, 17.040283203125, 17.6143798828125, 18.1884765625, 18.7625732421875, 19.336669921875, 19.9107666015625, 20.48486328125, 21.0589599609375, 21.633056640625, 22.2071533203125, 22.78125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 11.0, 12.0, 8.0, 12.0, 16.0, 14.0, 32.0, 46.0, 31.0, 48.0, 71.0, 102.0, 178.0, 312.0, 662.0, 3235.0, 86730.0, 2972088.0, 77559.0, 3015.0, 641.0, 308.0, 166.0, 114.0, 73.0, 64.0, 40.0, 25.0, 28.0, 16.0, 15.0, 11.0, 4.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-30.859375, -30.077880859375, -29.29638671875, -28.514892578125, -27.7333984375, -26.951904296875, -26.17041015625, -25.388916015625, -24.607421875, -23.825927734375, -23.04443359375, -22.262939453125, -21.4814453125, -20.699951171875, -19.91845703125, -19.136962890625, -18.35546875, -17.573974609375, -16.79248046875, -16.010986328125, -15.2294921875, -14.447998046875, -13.66650390625, -12.885009765625, -12.103515625, -11.322021484375, -10.54052734375, -9.759033203125, -8.9775390625, -8.196044921875, -7.41455078125, -6.633056640625, -5.8515625, -5.070068359375, -4.28857421875, -3.507080078125, -2.7255859375, -1.944091796875, -1.16259765625, -0.381103515625, 0.400390625, 1.181884765625, 1.96337890625, 2.744873046875, 3.5263671875, 4.307861328125, 5.08935546875, 5.870849609375, 6.65234375, 7.433837890625, 8.21533203125, 8.996826171875, 9.7783203125, 10.559814453125, 11.34130859375, 12.122802734375, 12.904296875, 13.685791015625, 14.46728515625, 15.248779296875, 16.0302734375, 16.811767578125, 17.59326171875, 18.374755859375, 19.15625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 12.0, 50.0, 118.0, 212.0, 241.0, 193.0, 111.0, 46.0, 15.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.87434768676758, -34.32606506347656, -31.777782440185547, -29.22949981689453, -26.681217193603516, -24.1329345703125, -21.584651947021484, -19.03636932373047, -16.488086700439453, -13.939804077148438, -11.391521453857422, -8.843238830566406, -6.294956207275391, -3.746673583984375, -1.1983909606933594, 1.3498916625976562, 3.898174285888672, 6.4464569091796875, 8.994739532470703, 11.543022155761719, 14.091304779052734, 16.63958740234375, 19.187870025634766, 21.73615264892578, 24.284435272216797, 26.832717895507812, 29.381000518798828, 31.929283142089844, 34.47756576538086, 37.025848388671875, 39.57413101196289, 42.122413635253906, 44.670692443847656, 47.21897506713867, 49.76725769042969, 52.3155403137207, 54.86382293701172, 57.412105560302734, 59.96038818359375, 62.508670806884766, 65.05695343017578, 67.60523986816406, 70.15351867675781, 72.70179748535156, 75.25008392333984, 77.79837036132812, 80.34664916992188, 82.89492797851562, 85.4432144165039, 87.99150085449219, 90.53977966308594, 93.08805847167969, 95.63634490966797, 98.18463134765625, 100.73291015625, 103.28118896484375, 105.82947540283203, 108.37776184082031, 110.92604064941406, 113.47431945800781, 116.0226058959961, 118.57089233398438, 121.11917114257812, 123.66744995117188, 126.21573638916016]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 13.0, 22.0, 14.0, 14.0, 16.0, 25.0, 23.0, 26.0, 32.0, 34.0, 44.0, 45.0, 36.0, 48.0, 46.0, 38.0, 55.0, 34.0, 39.0, 43.0, 40.0, 41.0, 38.0, 28.0, 22.0, 24.0, 19.0, 19.0, 18.0, 15.0, 13.0, 11.0, 10.0, 11.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0], "bins": [-43.98972702026367, -42.67571258544922, -41.3616943359375, -40.04767990112305, -38.73366165161133, -37.419647216796875, -36.105628967285156, -34.7916145324707, -33.47760009765625, -32.1635856628418, -30.849567413330078, -29.535551071166992, -28.221534729003906, -26.907520294189453, -25.593503952026367, -24.27948760986328, -22.965469360351562, -21.651453018188477, -20.33743667602539, -19.023420333862305, -17.70940399169922, -16.395389556884766, -15.08137321472168, -13.767356872558594, -12.453340530395508, -11.139324188232422, -9.825307846069336, -8.511292457580566, -7.1972761154174805, -5.8832597732543945, -4.569243907928467, -3.255228042602539, -1.9412155151367188, -0.6271994113922119, 0.6868166923522949, 2.0008327960968018, 3.3148488998413086, 4.6288652420043945, 5.942881107330322, 7.25689697265625, 8.570913314819336, 9.884929656982422, 11.198945999145508, 12.512961387634277, 13.826977729797363, 15.14099407196045, 16.45500946044922, 17.769025802612305, 19.08304214477539, 20.397058486938477, 21.711074829101562, 23.02509117126465, 24.339107513427734, 25.653121948242188, 26.967138290405273, 28.28115463256836, 29.595170974731445, 30.90918731689453, 32.223201751708984, 33.5372200012207, 34.851234436035156, 36.165252685546875, 37.47926712036133, 38.79328155517578, 40.1072998046875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 4.0, 9.0, 11.0, 6.0, 7.0, 8.0, 12.0, 12.0, 18.0, 11.0, 16.0, 14.0, 22.0, 15.0, 29.0, 18.0, 31.0, 39.0, 40.0, 33.0, 42.0, 38.0, 27.0, 40.0, 42.0, 36.0, 34.0, 37.0, 37.0, 27.0, 33.0, 32.0, 25.0, 20.0, 17.0, 15.0, 13.0, 21.0, 22.0, 12.0, 14.0, 13.0, 8.0, 7.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.2578125, -5.0858154296875, -4.913818359375, -4.7418212890625, -4.56982421875, -4.3978271484375, -4.225830078125, -4.0538330078125, -3.8818359375, -3.7098388671875, -3.537841796875, -3.3658447265625, -3.19384765625, -3.0218505859375, -2.849853515625, -2.6778564453125, -2.505859375, -2.3338623046875, -2.161865234375, -1.9898681640625, -1.81787109375, -1.6458740234375, -1.473876953125, -1.3018798828125, -1.1298828125, -0.9578857421875, -0.785888671875, -0.6138916015625, -0.44189453125, -0.2698974609375, -0.097900390625, 0.0740966796875, 0.24609375, 0.4180908203125, 0.590087890625, 0.7620849609375, 0.93408203125, 1.1060791015625, 1.278076171875, 1.4500732421875, 1.6220703125, 1.7940673828125, 1.966064453125, 2.1380615234375, 2.31005859375, 2.4820556640625, 2.654052734375, 2.8260498046875, 2.998046875, 3.1700439453125, 3.342041015625, 3.5140380859375, 3.68603515625, 3.8580322265625, 4.030029296875, 4.2020263671875, 4.3740234375, 4.5460205078125, 4.718017578125, 4.8900146484375, 5.06201171875, 5.2340087890625, 5.406005859375, 5.5780029296875, 5.75]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 6.0, 6.0, 17.0, 12.0, 7.0, 11.0, 13.0, 27.0, 32.0, 42.0, 59.0, 81.0, 150.0, 201.0, 359.0, 680.0, 1403.0, 3079.0, 8223.0, 28132.0, 167334.0, 2439550.0, 1411730.0, 100443.0, 20768.0, 6644.0, 2591.0, 1155.0, 610.0, 335.0, 177.0, 100.0, 67.0, 45.0, 37.0, 23.0, 27.0, 17.0, 16.0, 8.0, 15.0, 8.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.3125, -31.26611328125, -30.2197265625, -29.17333984375, -28.126953125, -27.08056640625, -26.0341796875, -24.98779296875, -23.94140625, -22.89501953125, -21.8486328125, -20.80224609375, -19.755859375, -18.70947265625, -17.6630859375, -16.61669921875, -15.5703125, -14.52392578125, -13.4775390625, -12.43115234375, -11.384765625, -10.33837890625, -9.2919921875, -8.24560546875, -7.19921875, -6.15283203125, -5.1064453125, -4.06005859375, -3.013671875, -1.96728515625, -0.9208984375, 0.12548828125, 1.171875, 2.21826171875, 3.2646484375, 4.31103515625, 5.357421875, 6.40380859375, 7.4501953125, 8.49658203125, 9.54296875, 10.58935546875, 11.6357421875, 12.68212890625, 13.728515625, 14.77490234375, 15.8212890625, 16.86767578125, 17.9140625, 18.96044921875, 20.0068359375, 21.05322265625, 22.099609375, 23.14599609375, 24.1923828125, 25.23876953125, 26.28515625, 27.33154296875, 28.3779296875, 29.42431640625, 30.470703125, 31.51708984375, 32.5634765625, 33.60986328125, 34.65625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 14.0, 15.0, 27.0, 46.0, 56.0, 101.0, 233.0, 417.0, 779.0, 930.0, 612.0, 379.0, 212.0, 114.0, 58.0, 37.0, 24.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.78125, -28.767578125, -27.75390625, -26.740234375, -25.7265625, -24.712890625, -23.69921875, -22.685546875, -21.671875, -20.658203125, -19.64453125, -18.630859375, -17.6171875, -16.603515625, -15.58984375, -14.576171875, -13.5625, -12.548828125, -11.53515625, -10.521484375, -9.5078125, -8.494140625, -7.48046875, -6.466796875, -5.453125, -4.439453125, -3.42578125, -2.412109375, -1.3984375, -0.384765625, 0.62890625, 1.642578125, 2.65625, 3.669921875, 4.68359375, 5.697265625, 6.7109375, 7.724609375, 8.73828125, 9.751953125, 10.765625, 11.779296875, 12.79296875, 13.806640625, 14.8203125, 15.833984375, 16.84765625, 17.861328125, 18.875, 19.888671875, 20.90234375, 21.916015625, 22.9296875, 23.943359375, 24.95703125, 25.970703125, 26.984375, 27.998046875, 29.01171875, 30.025390625, 31.0390625, 32.052734375, 33.06640625, 34.080078125, 35.09375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 13.0, 14.0, 17.0, 24.0, 36.0, 46.0, 66.0, 66.0, 106.0, 182.0, 330.0, 718.0, 2214.0, 8853.0, 46328.0, 521715.0, 3272750.0, 298418.0, 32413.0, 6643.0, 1829.0, 609.0, 279.0, 184.0, 107.0, 77.0, 48.0, 39.0, 34.0, 32.0, 17.0, 19.0, 16.0, 6.0, 10.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.375, -35.2861328125, -34.197265625, -33.1083984375, -32.01953125, -30.9306640625, -29.841796875, -28.7529296875, -27.6640625, -26.5751953125, -25.486328125, -24.3974609375, -23.30859375, -22.2197265625, -21.130859375, -20.0419921875, -18.953125, -17.8642578125, -16.775390625, -15.6865234375, -14.59765625, -13.5087890625, -12.419921875, -11.3310546875, -10.2421875, -9.1533203125, -8.064453125, -6.9755859375, -5.88671875, -4.7978515625, -3.708984375, -2.6201171875, -1.53125, -0.4423828125, 0.646484375, 1.7353515625, 2.82421875, 3.9130859375, 5.001953125, 6.0908203125, 7.1796875, 8.2685546875, 9.357421875, 10.4462890625, 11.53515625, 12.6240234375, 13.712890625, 14.8017578125, 15.890625, 16.9794921875, 18.068359375, 19.1572265625, 20.24609375, 21.3349609375, 22.423828125, 23.5126953125, 24.6015625, 25.6904296875, 26.779296875, 27.8681640625, 28.95703125, 30.0458984375, 31.134765625, 32.2236328125, 33.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 13.0, 27.0, 22.0, 16.0, 32.0, 45.0, 61.0, 69.0, 77.0, 77.0, 101.0, 80.0, 67.0, 77.0, 54.0, 40.0, 26.0, 30.0, 17.0, 15.0, 11.0, 2.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-119.81044006347656, -115.21060180664062, -110.61077117919922, -106.01094055175781, -101.41110229492188, -96.81126403808594, -92.21143341064453, -87.61160278320312, -83.01176452636719, -78.41192626953125, -73.81209564208984, -69.21226501464844, -64.6124267578125, -60.01259231567383, -55.412757873535156, -50.812923431396484, -46.21308898925781, -41.61325454711914, -37.01342010498047, -32.4135856628418, -27.813751220703125, -23.213916778564453, -18.61408233642578, -14.01424789428711, -9.414413452148438, -4.814579010009766, -0.21474456787109375, 4.385089874267578, 8.98492431640625, 13.584758758544922, 18.184593200683594, 22.784427642822266, 27.384246826171875, 31.984081268310547, 36.58391571044922, 41.18375015258789, 45.78358459472656, 50.383419036865234, 54.983253479003906, 59.58308792114258, 64.18292236328125, 68.78276062011719, 73.3825912475586, 77.982421875, 82.58226013183594, 87.18209838867188, 91.78192901611328, 96.38175964355469, 100.98159790039062, 105.58143615722656, 110.18126678466797, 114.78109741210938, 119.38093566894531, 123.98077392578125, 128.58059692382812, 133.18043518066406, 137.7802734375, 142.38011169433594, 146.97994995117188, 151.57977294921875, 156.1796112060547, 160.77944946289062, 165.3792724609375, 169.97911071777344, 174.57894897460938]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 7.0, 9.0, 8.0, 13.0, 12.0, 9.0, 13.0, 22.0, 15.0, 18.0, 21.0, 26.0, 24.0, 35.0, 29.0, 28.0, 36.0, 43.0, 39.0, 44.0, 54.0, 37.0, 51.0, 29.0, 36.0, 41.0, 33.0, 31.0, 32.0, 39.0, 34.0, 23.0, 25.0, 18.0, 17.0, 13.0, 6.0, 8.0, 8.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-103.0640869140625, -100.19120025634766, -97.31831359863281, -94.44542694091797, -91.57254028320312, -88.69965362548828, -85.82676696777344, -82.95388793945312, -80.08099365234375, -77.2081069946289, -74.33522033691406, -71.46233367919922, -68.58944702148438, -65.71656036376953, -62.84367752075195, -59.97079086303711, -57.09790802001953, -54.22502136230469, -51.352134704589844, -48.479248046875, -45.606361389160156, -42.73347473144531, -39.860591888427734, -36.98770523071289, -34.11481857299805, -31.241931915283203, -28.36904525756836, -25.49616050720215, -22.623273849487305, -19.75038719177246, -16.87750244140625, -14.004615783691406, -11.131729125976562, -8.258842468261719, -5.385956764221191, -2.513071060180664, 0.3598155975341797, 3.2327022552490234, 6.105587005615234, 8.978473663330078, 11.851360321044922, 14.724246978759766, 17.59713363647461, 20.47001838684082, 23.342905044555664, 26.215791702270508, 29.08867645263672, 31.961563110351562, 34.834449768066406, 37.70733642578125, 40.580223083496094, 43.45310974121094, 46.32599639892578, 49.198883056640625, 52.0717658996582, 54.94465255737305, 57.81753921508789, 60.690425872802734, 63.56331253051758, 66.43619537353516, 69.30908203125, 72.18196868896484, 75.05485534667969, 77.92774200439453, 80.80062866210938]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 6.0, 16.0, 15.0, 15.0, 19.0, 18.0, 21.0, 26.0, 21.0, 31.0, 23.0, 35.0, 42.0, 43.0, 50.0, 44.0, 50.0, 43.0, 41.0, 47.0, 52.0, 37.0, 32.0, 38.0, 34.0, 39.0, 28.0, 31.0, 19.0, 17.0, 9.0, 10.0, 11.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-250.625, -243.646484375, -236.66796875, -229.689453125, -222.7109375, -215.732421875, -208.75390625, -201.775390625, -194.796875, -187.818359375, -180.83984375, -173.861328125, -166.8828125, -159.904296875, -152.92578125, -145.947265625, -138.96875, -131.990234375, -125.01171875, -118.033203125, -111.0546875, -104.076171875, -97.09765625, -90.119140625, -83.140625, -76.162109375, -69.18359375, -62.205078125, -55.2265625, -48.248046875, -41.26953125, -34.291015625, -27.3125, -20.333984375, -13.35546875, -6.376953125, 0.6015625, 7.580078125, 14.55859375, 21.537109375, 28.515625, 35.494140625, 42.47265625, 49.451171875, 56.4296875, 63.408203125, 70.38671875, 77.365234375, 84.34375, 91.322265625, 98.30078125, 105.279296875, 112.2578125, 119.236328125, 126.21484375, 133.193359375, 140.171875, 147.150390625, 154.12890625, 161.107421875, 168.0859375, 175.064453125, 182.04296875, 189.021484375, 196.0]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 10.0, 18.0, 17.0, 21.0, 51.0, 87.0, 119.0, 142.0, 245.0, 428.0, 628.0, 964.0, 1668.0, 2590.0, 4469.0, 7540.0, 13304.0, 23379.0, 42008.0, 79523.0, 173573.0, 360450.0, 165376.0, 77008.0, 40903.0, 22577.0, 12837.0, 7327.0, 4410.0, 2580.0, 1628.0, 956.0, 579.0, 407.0, 239.0, 173.0, 129.0, 56.0, 41.0, 28.0, 23.0, 14.0, 16.0, 2.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5390625, -7.3138427734375, -7.088623046875, -6.8634033203125, -6.63818359375, -6.4129638671875, -6.187744140625, -5.9625244140625, -5.7373046875, -5.5120849609375, -5.286865234375, -5.0616455078125, -4.83642578125, -4.6112060546875, -4.385986328125, -4.1607666015625, -3.935546875, -3.7103271484375, -3.485107421875, -3.2598876953125, -3.03466796875, -2.8094482421875, -2.584228515625, -2.3590087890625, -2.1337890625, -1.9085693359375, -1.683349609375, -1.4581298828125, -1.23291015625, -1.0076904296875, -0.782470703125, -0.5572509765625, -0.33203125, -0.1068115234375, 0.118408203125, 0.3436279296875, 0.56884765625, 0.7940673828125, 1.019287109375, 1.2445068359375, 1.4697265625, 1.6949462890625, 1.920166015625, 2.1453857421875, 2.37060546875, 2.5958251953125, 2.821044921875, 3.0462646484375, 3.271484375, 3.4967041015625, 3.721923828125, 3.9471435546875, 4.17236328125, 4.3975830078125, 4.622802734375, 4.8480224609375, 5.0732421875, 5.2984619140625, 5.523681640625, 5.7489013671875, 5.97412109375, 6.1993408203125, 6.424560546875, 6.6497802734375, 6.875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 5.0, 7.0, 13.0, 9.0, 15.0, 16.0, 17.0, 16.0, 25.0, 18.0, 27.0, 25.0, 38.0, 41.0, 30.0, 30.0, 34.0, 42.0, 44.0, 37.0, 1071.0, 29.0, 33.0, 42.0, 39.0, 30.0, 32.0, 32.0, 24.0, 28.0, 31.0, 12.0, 19.0, 12.0, 22.0, 14.0, 14.0, 14.0, 5.0, 6.0, 5.0, 3.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.5, -133.83984375, -129.1796875, -124.51953125, -119.859375, -115.19921875, -110.5390625, -105.87890625, -101.21875, -96.55859375, -91.8984375, -87.23828125, -82.578125, -77.91796875, -73.2578125, -68.59765625, -63.9375, -59.27734375, -54.6171875, -49.95703125, -45.296875, -40.63671875, -35.9765625, -31.31640625, -26.65625, -21.99609375, -17.3359375, -12.67578125, -8.015625, -3.35546875, 1.3046875, 5.96484375, 10.625, 15.28515625, 19.9453125, 24.60546875, 29.265625, 33.92578125, 38.5859375, 43.24609375, 47.90625, 52.56640625, 57.2265625, 61.88671875, 66.546875, 71.20703125, 75.8671875, 80.52734375, 85.1875, 89.84765625, 94.5078125, 99.16796875, 103.828125, 108.48828125, 113.1484375, 117.80859375, 122.46875, 127.12890625, 131.7890625, 136.44921875, 141.109375, 145.76953125, 150.4296875, 155.08984375, 159.75]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 12.0, 16.0, 13.0, 39.0, 44.0, 77.0, 101.0, 172.0, 254.0, 352.0, 550.0, 821.0, 1265.0, 1849.0, 2820.0, 4292.0, 6624.0, 10201.0, 15684.0, 25178.0, 40450.0, 67584.0, 124013.0, 1322280.0, 217783.0, 100715.0, 57103.0, 35064.0, 21866.0, 14004.0, 8888.0, 5835.0, 3855.0, 2526.0, 1654.0, 1054.0, 705.0, 462.0, 294.0, 215.0, 135.0, 95.0, 70.0, 39.0, 22.0, 16.0, 14.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.95703125, -3.8365478515625, -3.716064453125, -3.5955810546875, -3.47509765625, -3.3546142578125, -3.234130859375, -3.1136474609375, -2.9931640625, -2.8726806640625, -2.752197265625, -2.6317138671875, -2.51123046875, -2.3907470703125, -2.270263671875, -2.1497802734375, -2.029296875, -1.9088134765625, -1.788330078125, -1.6678466796875, -1.54736328125, -1.4268798828125, -1.306396484375, -1.1859130859375, -1.0654296875, -0.9449462890625, -0.824462890625, -0.7039794921875, -0.58349609375, -0.4630126953125, -0.342529296875, -0.2220458984375, -0.1015625, 0.0189208984375, 0.139404296875, 0.2598876953125, 0.38037109375, 0.5008544921875, 0.621337890625, 0.7418212890625, 0.8623046875, 0.9827880859375, 1.103271484375, 1.2237548828125, 1.34423828125, 1.4647216796875, 1.585205078125, 1.7056884765625, 1.826171875, 1.9466552734375, 2.067138671875, 2.1876220703125, 2.30810546875, 2.4285888671875, 2.549072265625, 2.6695556640625, 2.7900390625, 2.9105224609375, 3.031005859375, 3.1514892578125, 3.27197265625, 3.3924560546875, 3.512939453125, 3.6334228515625, 3.75390625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 10.0, 6.0, 11.0, 15.0, 8.0, 16.0, 15.0, 24.0, 26.0, 39.0, 49.0, 58.0, 55.0, 79.0, 82.0, 84.0, 62.0, 55.0, 60.0, 54.0, 32.0, 28.0, 23.0, 24.0, 17.0, 12.0, 10.0, 8.0, 3.0, 5.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015625, -0.015136480331420898, -0.014647960662841797, -0.014159440994262695, -0.013670921325683594, -0.013182401657104492, -0.01269388198852539, -0.012205362319946289, -0.011716842651367188, -0.011228322982788086, -0.010739803314208984, -0.010251283645629883, -0.009762763977050781, -0.00927424430847168, -0.008785724639892578, -0.008297204971313477, -0.007808685302734375, -0.0073201656341552734, -0.006831645965576172, -0.00634312629699707, -0.005854606628417969, -0.005366086959838867, -0.004877567291259766, -0.004389047622680664, -0.0039005279541015625, -0.003412008285522461, -0.0029234886169433594, -0.002434968948364258, -0.0019464492797851562, -0.0014579296112060547, -0.0009694099426269531, -0.00048089027404785156, 7.62939453125e-06, 0.0004961490631103516, 0.0009846687316894531, 0.0014731884002685547, 0.0019617080688476562, 0.002450227737426758, 0.0029387474060058594, 0.003427267074584961, 0.0039157867431640625, 0.004404306411743164, 0.004892826080322266, 0.005381345748901367, 0.005869865417480469, 0.00635838508605957, 0.006846904754638672, 0.0073354244232177734, 0.007823944091796875, 0.008312463760375977, 0.008800983428955078, 0.00928950309753418, 0.009778022766113281, 0.010266542434692383, 0.010755062103271484, 0.011243581771850586, 0.011732101440429688, 0.012220621109008789, 0.01270914077758789, 0.013197660446166992, 0.013686180114746094, 0.014174699783325195, 0.014663219451904297, 0.015151739120483398, 0.0156402587890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 5.0, 4.0, 15.0, 19.0, 28.0, 49.0, 92.0, 112.0, 188.0, 374.0, 595.0, 1023.0, 1945.0, 3838.0, 8340.0, 18819.0, 48435.0, 152236.0, 500630.0, 208434.0, 60946.0, 23005.0, 9705.0, 4585.0, 2295.0, 1214.0, 656.0, 367.0, 232.0, 123.0, 75.0, 64.0, 41.0, 26.0, 9.0, 10.0, 8.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09222412109375, -0.08955955505371094, -0.08689498901367188, -0.08423042297363281, -0.08156585693359375, -0.07890129089355469, -0.07623672485351562, -0.07357215881347656, -0.0709075927734375, -0.06824302673339844, -0.06557846069335938, -0.06291389465332031, -0.06024932861328125, -0.05758476257324219, -0.054920196533203125, -0.05225563049316406, -0.049591064453125, -0.04692649841308594, -0.044261932373046875, -0.04159736633300781, -0.03893280029296875, -0.03626823425292969, -0.033603668212890625, -0.030939102172851562, -0.0282745361328125, -0.025609970092773438, -0.022945404052734375, -0.020280838012695312, -0.01761627197265625, -0.014951705932617188, -0.012287139892578125, -0.009622573852539062, -0.0069580078125, -0.0042934417724609375, -0.001628875732421875, 0.0010356903076171875, 0.00370025634765625, 0.0063648223876953125, 0.009029388427734375, 0.011693954467773438, 0.0143585205078125, 0.017023086547851562, 0.019687652587890625, 0.022352218627929688, 0.02501678466796875, 0.027681350708007812, 0.030345916748046875, 0.03301048278808594, 0.035675048828125, 0.03833961486816406, 0.041004180908203125, 0.04366874694824219, 0.04633331298828125, 0.04899787902832031, 0.051662445068359375, 0.05432701110839844, 0.0569915771484375, 0.05965614318847656, 0.062320709228515625, 0.06498527526855469, 0.06764984130859375, 0.07031440734863281, 0.07297897338867188, 0.07564353942871094, 0.07830810546875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 3.0, 11.0, 7.0, 7.0, 9.0, 18.0, 20.0, 22.0, 29.0, 38.0, 55.0, 61.0, 67.0, 73.0, 74.0, 84.0, 72.0, 72.0, 47.0, 44.0, 44.0, 33.0, 25.0, 19.0, 15.0, 13.0, 3.0, 7.0, 3.0, 9.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0177143607288599, -0.017120180651545525, -0.016525998711586, -0.01593181863427162, -0.01533763762563467, -0.014743456616997719, -0.014149276539683342, -0.01355509553104639, -0.012960914522409439, -0.012366733513772488, -0.011772552505135536, -0.01117837242782116, -0.010584191419184208, -0.009990010410547256, -0.00939583033323288, -0.008801649324595928, -0.008207468315958977, -0.007613287307322025, -0.007019106764346361, -0.006424926221370697, -0.005830745212733746, -0.005236564204096794, -0.00464238366112113, -0.004048203118145466, -0.0034540221095085144, -0.0028598413337022066, -0.002265660557895899, -0.001671479782089591, -0.0010772990062832832, -0.00048311823047697544, 0.00011106254532933235, 0.0007052430883049965, 0.0012994222342967987, 0.0018936030101031065, 0.0024877837859094143, 0.003081964561715722, 0.00367614533752203, 0.004270326346158981, 0.0048645068891346455, 0.00545868743211031, 0.006052868440747261, 0.0066470494493842125, 0.007241229992359877, 0.00783541053533554, 0.008429591543972492, 0.009023772552609444, 0.00961795262992382, 0.010212133638560772, 0.010806314647197723, 0.011400495655834675, 0.011994676664471626, 0.012588856741786003, 0.013183037750422955, 0.013777218759059906, 0.014371398836374283, 0.014965579845011234, 0.015559760853648186, 0.016153940930962563, 0.01674812287092209, 0.017342302948236465, 0.017936483025550842, 0.01853066496551037, 0.019124845042824745, 0.01971902698278427, 0.020313207060098648]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 14.0, 14.0, 13.0, 17.0, 10.0, 31.0, 21.0, 24.0, 35.0, 27.0, 34.0, 31.0, 36.0, 42.0, 46.0, 54.0, 37.0, 31.0, 39.0, 45.0, 46.0, 42.0, 33.0, 32.0, 23.0, 34.0, 22.0, 25.0, 24.0, 20.0, 15.0, 19.0, 8.0, 5.0, 6.0, 11.0, 5.0, 3.0, 0.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.011652886867523193, -0.011288831941783428, -0.010924777016043663, -0.010560722090303898, -0.010196667164564133, -0.009832612238824368, -0.009468557313084602, -0.009104502387344837, -0.008740447461605072, -0.008376392535865307, -0.008012337610125542, -0.0076482826843857765, -0.007284227758646011, -0.006920172832906246, -0.006556117907166481, -0.006192062981426716, -0.005828008055686951, -0.0054639531299471855, -0.00509989820420742, -0.004735843278467655, -0.00437178835272789, -0.004007733426988125, -0.0036436785012483597, -0.0032796235755085945, -0.0029155686497688293, -0.002551513724029064, -0.002187458798289299, -0.0018234038725495338, -0.0014593489468097687, -0.0010952940210700035, -0.0007312390953302383, -0.0003671841695904732, -3.129243850708008e-06, 0.00036092568188905716, 0.0007249806076288223, 0.0010890355333685875, 0.0014530904591083527, 0.0018171453848481178, 0.002181200310587883, 0.002545255236327648, 0.0029093101620674133, 0.0032733650878071785, 0.0036374200135469437, 0.004001474939286709, 0.004365529865026474, 0.004729584790766239, 0.005093639716506004, 0.0054576946422457695, 0.005821749567985535, 0.0061858044937253, 0.006549859419465065, 0.00691391434520483, 0.007277969270944595, 0.0076420241966843605, 0.008006079122424126, 0.00837013404816389, 0.008734188973903656, 0.009098243899643421, 0.009462298825383186, 0.009826353751122952, 0.010190408676862717, 0.010554463602602482, 0.010918518528342247, 0.011282573454082012, 0.011646628379821777]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 7.0, 6.0, 16.0, 15.0, 15.0, 19.0, 18.0, 21.0, 26.0, 21.0, 31.0, 23.0, 34.0, 43.0, 43.0, 50.0, 44.0, 49.0, 44.0, 41.0, 46.0, 53.0, 37.0, 31.0, 39.0, 33.0, 40.0, 28.0, 29.0, 21.0, 17.0, 9.0, 10.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-250.625, -243.6484375, -236.671875, -229.6953125, -222.71875, -215.7421875, -208.765625, -201.7890625, -194.8125, -187.8359375, -180.859375, -173.8828125, -166.90625, -159.9296875, -152.953125, -145.9765625, -139.0, -132.0234375, -125.046875, -118.0703125, -111.09375, -104.1171875, -97.140625, -90.1640625, -83.1875, -76.2109375, -69.234375, -62.2578125, -55.28125, -48.3046875, -41.328125, -34.3515625, -27.375, -20.3984375, -13.421875, -6.4453125, 0.53125, 7.5078125, 14.484375, 21.4609375, 28.4375, 35.4140625, 42.390625, 49.3671875, 56.34375, 63.3203125, 70.296875, 77.2734375, 84.25, 91.2265625, 98.203125, 105.1796875, 112.15625, 119.1328125, 126.109375, 133.0859375, 140.0625, 147.0390625, 154.015625, 160.9921875, 167.96875, 174.9453125, 181.921875, 188.8984375, 195.875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 4.0, 13.0, 6.0, 8.0, 19.0, 13.0, 22.0, 22.0, 22.0, 27.0, 41.0, 62.0, 87.0, 172.0, 270.0, 567.0, 1804.0, 14631.0, 440088.0, 567335.0, 19808.0, 1988.0, 651.0, 302.0, 184.0, 115.0, 62.0, 57.0, 42.0, 30.0, 28.0, 20.0, 7.0, 12.0, 10.0, 5.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-49.65625, -48.27880859375, -46.9013671875, -45.52392578125, -44.146484375, -42.76904296875, -41.3916015625, -40.01416015625, -38.63671875, -37.25927734375, -35.8818359375, -34.50439453125, -33.126953125, -31.74951171875, -30.3720703125, -28.99462890625, -27.6171875, -26.23974609375, -24.8623046875, -23.48486328125, -22.107421875, -20.72998046875, -19.3525390625, -17.97509765625, -16.59765625, -15.22021484375, -13.8427734375, -12.46533203125, -11.087890625, -9.71044921875, -8.3330078125, -6.95556640625, -5.578125, -4.20068359375, -2.8232421875, -1.44580078125, -0.068359375, 1.30908203125, 2.6865234375, 4.06396484375, 5.44140625, 6.81884765625, 8.1962890625, 9.57373046875, 10.951171875, 12.32861328125, 13.7060546875, 15.08349609375, 16.4609375, 17.83837890625, 19.2158203125, 20.59326171875, 21.970703125, 23.34814453125, 24.7255859375, 26.10302734375, 27.48046875, 28.85791015625, 30.2353515625, 31.61279296875, 32.990234375, 34.36767578125, 35.7451171875, 37.12255859375, 38.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 18.0, 19.0, 24.0, 20.0, 36.0, 33.0, 43.0, 65.0, 62.0, 79.0, 80.0, 2105.0, 75.0, 48.0, 63.0, 50.0, 46.0, 47.0, 25.0, 24.0, 14.0, 11.0, 10.0, 10.0, 10.0, 5.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-443.0, -429.23046875, -415.4609375, -401.69140625, -387.921875, -374.15234375, -360.3828125, -346.61328125, -332.84375, -319.07421875, -305.3046875, -291.53515625, -277.765625, -263.99609375, -250.2265625, -236.45703125, -222.6875, -208.91796875, -195.1484375, -181.37890625, -167.609375, -153.83984375, -140.0703125, -126.30078125, -112.53125, -98.76171875, -84.9921875, -71.22265625, -57.453125, -43.68359375, -29.9140625, -16.14453125, -2.375, 11.39453125, 25.1640625, 38.93359375, 52.703125, 66.47265625, 80.2421875, 94.01171875, 107.78125, 121.55078125, 135.3203125, 149.08984375, 162.859375, 176.62890625, 190.3984375, 204.16796875, 217.9375, 231.70703125, 245.4765625, 259.24609375, 273.015625, 286.78515625, 300.5546875, 314.32421875, 328.09375, 341.86328125, 355.6328125, 369.40234375, 383.171875, 396.94140625, 410.7109375, 424.48046875, 438.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 12.0, 12.0, 19.0, 34.0, 75.0, 147.0, 333.0, 1014.0, 5484.0, 92770.0, 2982915.0, 57071.0, 4294.0, 929.0, 303.0, 135.0, 56.0, 31.0, 19.0, 5.0, 10.0, 9.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.84375, -38.71923828125, -37.5947265625, -36.47021484375, -35.345703125, -34.22119140625, -33.0966796875, -31.97216796875, -30.84765625, -29.72314453125, -28.5986328125, -27.47412109375, -26.349609375, -25.22509765625, -24.1005859375, -22.97607421875, -21.8515625, -20.72705078125, -19.6025390625, -18.47802734375, -17.353515625, -16.22900390625, -15.1044921875, -13.97998046875, -12.85546875, -11.73095703125, -10.6064453125, -9.48193359375, -8.357421875, -7.23291015625, -6.1083984375, -4.98388671875, -3.859375, -2.73486328125, -1.6103515625, -0.48583984375, 0.638671875, 1.76318359375, 2.8876953125, 4.01220703125, 5.13671875, 6.26123046875, 7.3857421875, 8.51025390625, 9.634765625, 10.75927734375, 11.8837890625, 13.00830078125, 14.1328125, 15.25732421875, 16.3818359375, 17.50634765625, 18.630859375, 19.75537109375, 20.8798828125, 22.00439453125, 23.12890625, 24.25341796875, 25.3779296875, 26.50244140625, 27.626953125, 28.75146484375, 29.8759765625, 31.00048828125, 32.125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 5.0, 8.0, 14.0, 15.0, 22.0, 43.0, 51.0, 91.0, 196.0, 204.0, 153.0, 68.0, 29.0, 35.0, 15.0, 10.0, 7.0, 2.0, 6.0, 5.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-559.679443359375, -539.1724853515625, -518.66552734375, -498.1585998535156, -477.6516418457031, -457.1446838378906, -436.63775634765625, -416.13079833984375, -395.62384033203125, -375.11688232421875, -354.60992431640625, -334.1029968261719, -313.5960388183594, -293.0890808105469, -272.5821533203125, -252.0751953125, -231.5682373046875, -211.061279296875, -190.55433654785156, -170.04739379882812, -149.54043579101562, -129.03347778320312, -108.52653503417969, -88.01959228515625, -67.51263427734375, -47.00568389892578, -26.498733520507812, -5.991783142089844, 14.515167236328125, 35.022117614746094, 55.52906799316406, 76.0360107421875, 96.54296875, 117.04991912841797, 137.55686950683594, 158.06381225585938, 178.57077026367188, 199.07772827148438, 219.5846710205078, 240.09161376953125, 260.59857177734375, 281.10552978515625, 301.61248779296875, 322.1194152832031, 342.6263732910156, 363.1333312988281, 383.6402587890625, 404.147216796875, 424.6541748046875, 445.1611328125, 465.6680908203125, 486.1750183105469, 506.6819763183594, 527.1889038085938, 547.6958618164062, 568.2028198242188, 588.7097778320312, 609.2167358398438, 629.7236938476562, 650.2306518554688, 670.737548828125, 691.2445068359375, 711.75146484375, 732.2584228515625, 752.765380859375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 5.0, 7.0, 11.0, 17.0, 23.0, 16.0, 23.0, 18.0, 13.0, 26.0, 24.0, 27.0, 31.0, 55.0, 44.0, 43.0, 48.0, 49.0, 50.0, 40.0, 33.0, 34.0, 44.0, 29.0, 34.0, 27.0, 48.0, 29.0, 26.0, 18.0, 18.0, 12.0, 15.0, 7.0, 8.0, 9.0, 2.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-704.7015380859375, -684.605224609375, -664.5088500976562, -644.4125366210938, -624.316162109375, -604.2198486328125, -584.1234741210938, -564.0271606445312, -543.9307861328125, -523.83447265625, -503.73809814453125, -483.6417541503906, -463.54541015625, -443.4490661621094, -423.35272216796875, -403.25640869140625, -383.1600646972656, -363.063720703125, -342.9673767089844, -322.87103271484375, -302.7746887207031, -282.6783447265625, -262.58203125, -242.4856719970703, -222.3893280029297, -202.29298400878906, -182.19664001464844, -162.10031127929688, -142.00396728515625, -121.9076156616211, -101.811279296875, -81.71493530273438, -61.61859130859375, -41.522247314453125, -21.425907135009766, -1.3295669555664062, 18.76677703857422, 38.863121032714844, 58.95945739746094, 79.05580139160156, 99.15214538574219, 119.24848937988281, 139.34483337402344, 159.441162109375, 179.53750610351562, 199.63385009765625, 219.73019409179688, 239.8265380859375, 259.9228820800781, 280.01922607421875, 300.1155700683594, 320.2119140625, 340.3082580566406, 360.40460205078125, 380.50091552734375, 400.5972900390625, 420.693603515625, 440.7899475097656, 460.88629150390625, 480.9826354980469, 501.0789794921875, 521.17529296875, 541.2716674804688, 561.3679809570312, 581.46435546875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 10.0, 9.0, 9.0, 12.0, 22.0, 24.0, 29.0, 37.0, 27.0, 51.0, 54.0, 109.0, 177.0, 263.0, 552.0, 1553.0, 5682.0, 1025233.0, 10269.0, 2567.0, 775.0, 362.0, 226.0, 138.0, 71.0, 51.0, 41.0, 27.0, 30.0, 12.0, 14.0, 17.0, 11.0, 18.0, 11.0, 7.0, 6.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-148.81954956054688, -144.12600708007812, -139.43246459960938, -134.73892211914062, -130.0453643798828, -125.35182189941406, -120.65827941894531, -115.96473693847656, -111.27119445800781, -106.57765197753906, -101.88410186767578, -97.19055938720703, -92.49701690673828, -87.803466796875, -83.10992431640625, -78.4163818359375, -73.72283172607422, -69.02928924560547, -64.33573913574219, -59.64219665527344, -54.94865417480469, -50.25510787963867, -45.561561584472656, -40.868019104003906, -36.17447280883789, -31.480928421020508, -26.787384033203125, -22.09383773803711, -17.400293350219727, -12.706748962402344, -8.013202667236328, -3.319660186767578, 1.3738861083984375, 6.0674309730529785, 10.76097583770752, 15.454521179199219, 20.1480655670166, 24.841609954833984, 29.53515625, 34.22869873046875, 38.922245025634766, 43.61579132080078, 48.30933380126953, 53.00288009643555, 57.69642639160156, 62.38996887207031, 67.08351135253906, 71.77705383300781, 76.4706039428711, 81.16414642333984, 85.85769653320312, 90.55123901367188, 95.24478149414062, 99.93832397460938, 104.63187408447266, 109.3254165649414, 114.01896667480469, 118.71250915527344, 123.40605926513672, 128.099609375, 132.79315185546875, 137.4866943359375, 142.18023681640625, 146.873779296875, 151.56732177734375]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 2.0, 5.0, 12.0, 12.0, 24.0, 30.0, 65.0, 85.0, 155.0, 286.0, 550.0, 2039.0, 49823.0, 51402116.0, 6298.0, 911.0, 310.0, 159.0, 93.0, 56.0, 30.0, 10.0, 15.0, 17.0, 15.0, 6.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-407.26434326171875, -394.21893310546875, -381.1735534667969, -368.1281433105469, -355.082763671875, -342.037353515625, -328.991943359375, -315.9465637207031, -302.90118408203125, -289.85577392578125, -276.8103942871094, -263.7649841308594, -250.7196044921875, -237.6741943359375, -224.62879943847656, -211.58340454101562, -198.53799438476562, -185.4925994873047, -172.44720458984375, -159.40179443359375, -146.35641479492188, -133.31100463867188, -120.26560974121094, -107.22021484375, -94.17481994628906, -81.12942504882812, -68.08403015136719, -55.03862762451172, -41.99323272705078, -28.947837829589844, -15.902435302734375, -2.8570404052734375, 10.188385009765625, 23.233781814575195, 36.279178619384766, 49.32457733154297, 62.369972229003906, 75.41536712646484, 88.46076965332031, 101.50616455078125, 114.55155944824219, 127.59695434570312, 140.64234924316406, 153.687744140625, 166.733154296875, 179.77853393554688, 192.82394409179688, 205.8693389892578, 218.91473388671875, 231.9601287841797, 245.00552368164062, 258.0509338378906, 271.0963134765625, 284.1417236328125, 297.1871337890625, 310.2325134277344, 323.27789306640625, 336.32330322265625, 349.3686828613281, 362.4140930175781, 375.45947265625, 388.5048828125, 401.55029296875, 414.5956726074219, 427.6410827636719]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 2.0, 8.0, 21.0, 19.0, 33.0, 61.0, 75.0, 119.0, 196.0, 338.0, 471.0, 742.0, 1195.0, 1776.0, 2593.0, 3998.0, 6034.0, 9242.0, 14371.0, 23046.0, 36345.0, 58880.0, 99671.0, 175856.0, 340920.0, 783054.0, 3871106.0, 385483.0, 195006.0, 109252.0, 64453.0, 38800.0, 24846.0, 15508.0, 9789.0, 6259.0, 4011.0, 2649.0, 1727.0, 1129.0, 739.0, 530.0, 325.0, 246.0, 170.0, 116.0, 85.0, 42.0, 35.0, 29.0, 14.0, 5.0, 0.0, 2.0, 2.0, 1.0, 5.0], "bins": [-1.134765625, -1.1004638671875, -1.066162109375, -1.0318603515625, -0.99755859375, -0.9632568359375, -0.928955078125, -0.8946533203125, -0.8603515625, -0.8260498046875, -0.791748046875, -0.7574462890625, -0.72314453125, -0.6888427734375, -0.654541015625, -0.6202392578125, -0.5859375, -0.5516357421875, -0.517333984375, -0.4830322265625, -0.44873046875, -0.4144287109375, -0.380126953125, -0.3458251953125, -0.3115234375, -0.2772216796875, -0.242919921875, -0.2086181640625, -0.17431640625, -0.1400146484375, -0.105712890625, -0.0714111328125, -0.037109375, -0.0028076171875, 0.031494140625, 0.0657958984375, 0.10009765625, 0.1343994140625, 0.168701171875, 0.2030029296875, 0.2373046875, 0.2716064453125, 0.305908203125, 0.3402099609375, 0.37451171875, 0.4088134765625, 0.443115234375, 0.4774169921875, 0.51171875, 0.5460205078125, 0.580322265625, 0.6146240234375, 0.64892578125, 0.6832275390625, 0.717529296875, 0.7518310546875, 0.7861328125, 0.8204345703125, 0.854736328125, 0.8890380859375, 0.92333984375, 0.9576416015625, 0.991943359375, 1.0262451171875, 1.060546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 11.0, 5.0, 7.0, 15.0, 12.0, 13.0, 24.0, 13.0, 36.0, 24.0, 32.0, 37.0, 35.0, 37.0, 41.0, 35.0, 39.0, 53.0, 1064.0, 41.0, 54.0, 44.0, 35.0, 35.0, 33.0, 32.0, 26.0, 27.0, 28.0, 12.0, 22.0, 17.0, 12.0, 9.0, 10.0, 11.0, 7.0, 6.0, 8.0, 6.0, 1.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-68.0, -65.90234375, -63.8046875, -61.70703125, -59.609375, -57.51171875, -55.4140625, -53.31640625, -51.21875, -49.12109375, -47.0234375, -44.92578125, -42.828125, -40.73046875, -38.6328125, -36.53515625, -34.4375, -32.33984375, -30.2421875, -28.14453125, -26.046875, -23.94921875, -21.8515625, -19.75390625, -17.65625, -15.55859375, -13.4609375, -11.36328125, -9.265625, -7.16796875, -5.0703125, -2.97265625, -0.875, 1.22265625, 3.3203125, 5.41796875, 7.515625, 9.61328125, 11.7109375, 13.80859375, 15.90625, 18.00390625, 20.1015625, 22.19921875, 24.296875, 26.39453125, 28.4921875, 30.58984375, 32.6875, 34.78515625, 36.8828125, 38.98046875, 41.078125, 43.17578125, 45.2734375, 47.37109375, 49.46875, 51.56640625, 53.6640625, 55.76171875, 57.859375, 59.95703125, 62.0546875, 64.15234375, 66.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 4.0, 5.0, 1.0, 6.0, 9.0, 9.0, 9.0, 30.0, 38.0, 45.0, 68.0, 120.0, 158.0, 226.0, 349.0, 481.0, 754.0, 1175.0, 1732.0, 2617.0, 4137.0, 6467.0, 10102.0, 15675.0, 25011.0, 39961.0, 66043.0, 114546.0, 215911.0, 440240.0, 3932259.0, 674187.0, 332650.0, 168221.0, 92687.0, 54211.0, 33213.0, 20643.0, 13314.0, 8331.0, 5452.0, 3527.0, 2330.0, 1530.0, 971.0, 661.0, 425.0, 270.0, 190.0, 126.0, 78.0, 61.0, 54.0, 41.0, 29.0, 14.0, 15.0, 9.0, 10.0, 5.0, 4.0], "bins": [-0.94775390625, -0.9197235107421875, -0.891693115234375, -0.8636627197265625, -0.83563232421875, -0.8076019287109375, -0.779571533203125, -0.7515411376953125, -0.7235107421875, -0.6954803466796875, -0.667449951171875, -0.6394195556640625, -0.61138916015625, -0.5833587646484375, -0.555328369140625, -0.5272979736328125, -0.499267578125, -0.4712371826171875, -0.443206787109375, -0.4151763916015625, -0.38714599609375, -0.3591156005859375, -0.331085205078125, -0.3030548095703125, -0.2750244140625, -0.2469940185546875, -0.218963623046875, -0.1909332275390625, -0.16290283203125, -0.1348724365234375, -0.106842041015625, -0.0788116455078125, -0.05078125, -0.0227508544921875, 0.005279541015625, 0.0333099365234375, 0.06134033203125, 0.0893707275390625, 0.117401123046875, 0.1454315185546875, 0.1734619140625, 0.2014923095703125, 0.229522705078125, 0.2575531005859375, 0.28558349609375, 0.3136138916015625, 0.341644287109375, 0.3696746826171875, 0.397705078125, 0.4257354736328125, 0.453765869140625, 0.4817962646484375, 0.50982666015625, 0.5378570556640625, 0.565887451171875, 0.5939178466796875, 0.6219482421875, 0.6499786376953125, 0.678009033203125, 0.7060394287109375, 0.73406982421875, 0.7621002197265625, 0.790130615234375, 0.8181610107421875, 0.84619140625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 3.0, 11.0, 10.0, 10.0, 12.0, 11.0, 10.0, 13.0, 14.0, 23.0, 19.0, 20.0, 19.0, 29.0, 31.0, 38.0, 31.0, 30.0, 42.0, 30.0, 34.0, 1061.0, 33.0, 51.0, 36.0, 40.0, 37.0, 40.0, 31.0, 33.0, 23.0, 14.0, 25.0, 15.0, 21.0, 19.0, 11.0, 14.0, 14.0, 8.0, 8.0, 8.0, 6.0, 6.0, 5.0, 4.0, 1.0, 8.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-47.78125, -46.2177734375, -44.654296875, -43.0908203125, -41.52734375, -39.9638671875, -38.400390625, -36.8369140625, -35.2734375, -33.7099609375, -32.146484375, -30.5830078125, -29.01953125, -27.4560546875, -25.892578125, -24.3291015625, -22.765625, -21.2021484375, -19.638671875, -18.0751953125, -16.51171875, -14.9482421875, -13.384765625, -11.8212890625, -10.2578125, -8.6943359375, -7.130859375, -5.5673828125, -4.00390625, -2.4404296875, -0.876953125, 0.6865234375, 2.25, 3.8134765625, 5.376953125, 6.9404296875, 8.50390625, 10.0673828125, 11.630859375, 13.1943359375, 14.7578125, 16.3212890625, 17.884765625, 19.4482421875, 21.01171875, 22.5751953125, 24.138671875, 25.7021484375, 27.265625, 28.8291015625, 30.392578125, 31.9560546875, 33.51953125, 35.0830078125, 36.646484375, 38.2099609375, 39.7734375, 41.3369140625, 42.900390625, 44.4638671875, 46.02734375, 47.5908203125, 49.154296875, 50.7177734375, 52.28125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 11.0, 18.0, 12.0, 23.0, 31.0, 34.0, 50.0, 58.0, 69.0, 116.0, 127.0, 134.0, 199.0, 260.0, 333.0, 466.0, 702.0, 981.0, 1525.0, 2588.0, 5597.0, 14041.0, 42023.0, 198596.0, 5906098.0, 77368.0, 21565.0, 8411.0, 3772.0, 1990.0, 1154.0, 790.0, 535.0, 407.0, 308.0, 241.0, 218.0, 152.0, 101.0, 82.0, 52.0, 55.0, 40.0, 32.0, 19.0, 13.0, 13.0, 11.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.30078125, -4.16302490234375, -4.0252685546875, -3.88751220703125, -3.749755859375, -3.61199951171875, -3.4742431640625, -3.33648681640625, -3.19873046875, -3.06097412109375, -2.9232177734375, -2.78546142578125, -2.647705078125, -2.50994873046875, -2.3721923828125, -2.23443603515625, -2.0966796875, -1.95892333984375, -1.8211669921875, -1.68341064453125, -1.545654296875, -1.40789794921875, -1.2701416015625, -1.13238525390625, -0.99462890625, -0.85687255859375, -0.7191162109375, -0.58135986328125, -0.443603515625, -0.30584716796875, -0.1680908203125, -0.03033447265625, 0.107421875, 0.24517822265625, 0.3829345703125, 0.52069091796875, 0.658447265625, 0.79620361328125, 0.9339599609375, 1.07171630859375, 1.20947265625, 1.34722900390625, 1.4849853515625, 1.62274169921875, 1.760498046875, 1.89825439453125, 2.0360107421875, 2.17376708984375, 2.3115234375, 2.44927978515625, 2.5870361328125, 2.72479248046875, 2.862548828125, 3.00030517578125, 3.1380615234375, 3.27581787109375, 3.41357421875, 3.55133056640625, 3.6890869140625, 3.82684326171875, 3.964599609375, 4.10235595703125, 4.2401123046875, 4.37786865234375, 4.515625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 8.0, 9.0, 11.0, 10.0, 9.0, 21.0, 18.0, 15.0, 23.0, 19.0, 27.0, 23.0, 33.0, 35.0, 36.0, 27.0, 29.0, 33.0, 31.0, 41.0, 1073.0, 32.0, 47.0, 32.0, 37.0, 27.0, 32.0, 34.0, 36.0, 31.0, 18.0, 31.0, 14.0, 15.0, 14.0, 19.0, 16.0, 16.0, 10.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-52.0625, -50.552734375, -49.04296875, -47.533203125, -46.0234375, -44.513671875, -43.00390625, -41.494140625, -39.984375, -38.474609375, -36.96484375, -35.455078125, -33.9453125, -32.435546875, -30.92578125, -29.416015625, -27.90625, -26.396484375, -24.88671875, -23.376953125, -21.8671875, -20.357421875, -18.84765625, -17.337890625, -15.828125, -14.318359375, -12.80859375, -11.298828125, -9.7890625, -8.279296875, -6.76953125, -5.259765625, -3.75, -2.240234375, -0.73046875, 0.779296875, 2.2890625, 3.798828125, 5.30859375, 6.818359375, 8.328125, 9.837890625, 11.34765625, 12.857421875, 14.3671875, 15.876953125, 17.38671875, 18.896484375, 20.40625, 21.916015625, 23.42578125, 24.935546875, 26.4453125, 27.955078125, 29.46484375, 30.974609375, 32.484375, 33.994140625, 35.50390625, 37.013671875, 38.5234375, 40.033203125, 41.54296875, 43.052734375, 44.5625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 13.0, 128.0, 808.0, 31.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-701.2349853515625, -687.2791748046875, -673.3233032226562, -659.3674926757812, -645.4116821289062, -631.4558715820312, -617.5, -603.544189453125, -589.58837890625, -575.632568359375, -561.6766967773438, -547.7208862304688, -533.7650756835938, -519.8092651367188, -505.8533935546875, -491.8975830078125, -477.9417419433594, -463.98590087890625, -450.03009033203125, -436.0742492675781, -422.1184387207031, -408.16259765625, -394.206787109375, -380.2509460449219, -366.29510498046875, -352.3392639160156, -338.3834533691406, -324.4276123046875, -310.4718017578125, -296.5159606933594, -282.56011962890625, -268.60430908203125, -254.64846801757812, -240.69264221191406, -226.73681640625, -212.78097534179688, -198.82516479492188, -184.86932373046875, -170.9134979248047, -156.95767211914062, -143.00184631347656, -129.0460205078125, -115.09019470214844, -101.13436126708984, -87.17853546142578, -73.22270965576172, -59.266876220703125, -45.31105041503906, -31.355224609375, -17.399396896362305, -3.4435691833496094, 10.512260437011719, 24.46808624267578, 38.423912048339844, 52.37974548339844, 66.3355712890625, 80.29139709472656, 94.24722290039062, 108.20304870605469, 122.15888214111328, 136.11471557617188, 150.07052612304688, 164.0263671875, 177.98219299316406, 191.93801879882812]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 1.0, 4.0, 10.0, 10.0, 16.0, 15.0, 18.0, 22.0, 26.0, 33.0, 22.0, 37.0, 31.0, 44.0, 41.0, 40.0, 46.0, 42.0, 46.0, 48.0, 44.0, 45.0, 41.0, 39.0, 40.0, 35.0, 27.0, 24.0, 23.0, 20.0, 15.0, 15.0, 12.0, 12.0, 9.0, 9.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.25540161132812, -123.369873046875, -119.48434448242188, -115.59882354736328, -111.71329498291016, -107.82776641845703, -103.94224548339844, -100.05671691894531, -96.17118835449219, -92.28565979003906, -88.40013122558594, -84.51461029052734, -80.62908172607422, -76.7435531616211, -72.8580322265625, -68.97250366210938, -65.08697509765625, -61.201446533203125, -57.315921783447266, -53.430397033691406, -49.54486846923828, -45.659339904785156, -41.7738151550293, -37.88829040527344, -34.00276184082031, -30.11723518371582, -26.231708526611328, -22.346181869506836, -18.460655212402344, -14.575128555297852, -10.68960189819336, -6.804075241088867, -2.918548583984375, 0.9669780731201172, 4.852504730224609, 8.738031387329102, 12.623558044433594, 16.509084701538086, 20.394611358642578, 24.28013801574707, 28.165664672851562, 32.05119323730469, 35.93671798706055, 39.822242736816406, 43.70777130126953, 47.593299865722656, 51.478824615478516, 55.364349365234375, 59.2498779296875, 63.135406494140625, 67.02093505859375, 70.90645599365234, 74.79198455810547, 78.6775131225586, 82.56303405761719, 86.44856262207031, 90.33409118652344, 94.21961975097656, 98.10514831542969, 101.99066925048828, 105.8761978149414, 109.76172637939453, 113.64724731445312, 117.53277587890625, 121.41830444335938]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 0.0, 6.0, 2.0, 6.0, 2.0, 1.0, 6.0, 0.0, 4.0, 3.0, 7.0, 18.0, 6.0, 3.0, 1.0, 16.0, 5.0, 14.0, 15.0, 11.0, 15.0, 14.0, 24.0, 26.0, 39.0, 76.0, 103.0, 360.0, 2873.0, 56601.0, 4117218.0, 14809.0, 1520.0, 213.0, 46.0, 30.0, 35.0, 33.0, 19.0, 15.0, 10.0, 18.0, 4.0, 12.0, 8.0, 8.0, 2.0, 6.0, 5.0, 8.0, 0.0, 4.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0], "bins": [-0.1676025390625, -0.1627063751220703, -0.15781021118164062, -0.15291404724121094, -0.14801788330078125, -0.14312171936035156, -0.13822555541992188, -0.1333293914794922, -0.1284332275390625, -0.12353706359863281, -0.11864089965820312, -0.11374473571777344, -0.10884857177734375, -0.10395240783691406, -0.09905624389648438, -0.09416007995605469, -0.089263916015625, -0.08436775207519531, -0.07947158813476562, -0.07457542419433594, -0.06967926025390625, -0.06478309631347656, -0.059886932373046875, -0.05499076843261719, -0.0500946044921875, -0.04519844055175781, -0.040302276611328125, -0.03540611267089844, -0.03050994873046875, -0.025613784790039062, -0.020717620849609375, -0.015821456909179688, -0.01092529296875, -0.0060291290283203125, -0.001132965087890625, 0.0037631988525390625, 0.00865936279296875, 0.013555526733398438, 0.018451690673828125, 0.023347854614257812, 0.0282440185546875, 0.03314018249511719, 0.038036346435546875, 0.04293251037597656, 0.04782867431640625, 0.05272483825683594, 0.057621002197265625, 0.06251716613769531, 0.067413330078125, 0.07230949401855469, 0.07720565795898438, 0.08210182189941406, 0.08699798583984375, 0.09189414978027344, 0.09679031372070312, 0.10168647766113281, 0.1065826416015625, 0.11147880554199219, 0.11637496948242188, 0.12127113342285156, 0.12616729736328125, 0.13106346130371094, 0.13595962524414062, 0.1408557891845703, 0.145751953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 5.0, 4.0, 10.0, 6.0, 7.0, 13.0, 13.0, 17.0, 715.0, 94.0, 20.0, 15.0, 6.0, 4.0, 10.0, 11.0, 2.0, 4.0, 4.0, 4.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1058349609375, -0.10268402099609375, -0.0995330810546875, -0.09638214111328125, -0.093231201171875, -0.09008026123046875, -0.0869293212890625, -0.08377838134765625, -0.08062744140625, -0.07747650146484375, -0.0743255615234375, -0.07117462158203125, -0.068023681640625, -0.06487274169921875, -0.0617218017578125, -0.05857086181640625, -0.055419921875, -0.05226898193359375, -0.0491180419921875, -0.04596710205078125, -0.042816162109375, -0.03966522216796875, -0.0365142822265625, -0.03336334228515625, -0.03021240234375, -0.02706146240234375, -0.0239105224609375, -0.02075958251953125, -0.017608642578125, -0.01445770263671875, -0.0113067626953125, -0.00815582275390625, -0.0050048828125, -0.00185394287109375, 0.0012969970703125, 0.00444793701171875, 0.007598876953125, 0.01074981689453125, 0.0139007568359375, 0.01705169677734375, 0.02020263671875, 0.02335357666015625, 0.0265045166015625, 0.02965545654296875, 0.032806396484375, 0.03595733642578125, 0.0391082763671875, 0.04225921630859375, 0.04541015625, 0.04856109619140625, 0.0517120361328125, 0.05486297607421875, 0.058013916015625, 0.06116485595703125, 0.0643157958984375, 0.06746673583984375, 0.07061767578125, 0.07376861572265625, 0.0769195556640625, 0.08007049560546875, 0.083221435546875, 0.08637237548828125, 0.0895233154296875, 0.09267425537109375, 0.0958251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 2.0, 5.0, 14.0, 2.0, 12.0, 19.0, 21.0, 37.0, 71.0, 108.0, 138.0, 313.0, 537.0, 1440.0, 5015.0, 204959.0, 3970652.0, 8460.0, 1577.0, 458.0, 177.0, 83.0, 58.0, 39.0, 18.0, 19.0, 7.0, 7.0, 5.0, 5.0, 4.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177490234375, -0.17196083068847656, -0.16643142700195312, -0.1609020233154297, -0.15537261962890625, -0.1498432159423828, -0.14431381225585938, -0.13878440856933594, -0.1332550048828125, -0.12772560119628906, -0.12219619750976562, -0.11666679382324219, -0.11113739013671875, -0.10560798645019531, -0.10007858276367188, -0.09454917907714844, -0.089019775390625, -0.08349037170410156, -0.07796096801757812, -0.07243156433105469, -0.06690216064453125, -0.06137275695800781, -0.055843353271484375, -0.05031394958496094, -0.0447845458984375, -0.03925514221191406, -0.033725738525390625, -0.028196334838867188, -0.02266693115234375, -0.017137527465820312, -0.011608123779296875, -0.0060787200927734375, -0.00054931640625, 0.0049800872802734375, 0.010509490966796875, 0.016038894653320312, 0.02156829833984375, 0.027097702026367188, 0.032627105712890625, 0.03815650939941406, 0.0436859130859375, 0.04921531677246094, 0.054744720458984375, 0.06027412414550781, 0.06580352783203125, 0.07133293151855469, 0.07686233520507812, 0.08239173889160156, 0.087921142578125, 0.09345054626464844, 0.09897994995117188, 0.10450935363769531, 0.11003875732421875, 0.11556816101074219, 0.12109756469726562, 0.12662696838378906, 0.1321563720703125, 0.13768577575683594, 0.14321517944335938, 0.1487445831298828, 0.15427398681640625, 0.1598033905029297, 0.16533279418945312, 0.17086219787597656, 0.1763916015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 9.0, 7.0, 4.0, 24.0, 67.0, 290.0, 2684.0, 719.0, 151.0, 48.0, 22.0, 14.0, 3.0, 7.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1121826171875, -0.10921096801757812, -0.10623931884765625, -0.10326766967773438, -0.1002960205078125, -0.09732437133789062, -0.09435272216796875, -0.09138107299804688, -0.088409423828125, -0.08543777465820312, -0.08246612548828125, -0.07949447631835938, -0.0765228271484375, -0.07355117797851562, -0.07057952880859375, -0.06760787963867188, -0.06463623046875, -0.061664581298828125, -0.05869293212890625, -0.055721282958984375, -0.0527496337890625, -0.049777984619140625, -0.04680633544921875, -0.043834686279296875, -0.040863037109375, -0.037891387939453125, -0.03491973876953125, -0.031948089599609375, -0.0289764404296875, -0.026004791259765625, -0.02303314208984375, -0.020061492919921875, -0.01708984375, -0.014118194580078125, -0.01114654541015625, -0.008174896240234375, -0.0052032470703125, -0.002231597900390625, 0.00074005126953125, 0.003711700439453125, 0.006683349609375, 0.009654998779296875, 0.01262664794921875, 0.015598297119140625, 0.0185699462890625, 0.021541595458984375, 0.02451324462890625, 0.027484893798828125, 0.03045654296875, 0.033428192138671875, 0.03639984130859375, 0.039371490478515625, 0.0423431396484375, 0.045314788818359375, 0.04828643798828125, 0.051258087158203125, 0.054229736328125, 0.057201385498046875, 0.06017303466796875, 0.06314468383789062, 0.0661163330078125, 0.06908798217773438, 0.07205963134765625, 0.07503128051757812, 0.0780029296875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 7.0, 10.0, 27.0, 606.0, 305.0, 27.0, 9.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.5389622449874878, -0.5269617438316345, -0.5149612426757812, -0.502960741519928, -0.4909602701663971, -0.4789597690105438, -0.46695929765701294, -0.45495879650115967, -0.4429582953453064, -0.4309577941894531, -0.41895729303359985, -0.40695682168006897, -0.3949563205242157, -0.3829558193683624, -0.37095534801483154, -0.35895484685897827, -0.346954345703125, -0.33495384454727173, -0.32295334339141846, -0.3109528720378876, -0.2989523708820343, -0.28695186972618103, -0.27495139837265015, -0.2629508972167969, -0.2509503960609436, -0.23894989490509033, -0.22694940865039825, -0.21494892239570618, -0.2029484212398529, -0.19094792008399963, -0.17894743382930756, -0.16694694757461548, -0.1549464464187622, -0.14294594526290894, -0.13094545900821686, -0.11894496530294418, -0.10694447159767151, -0.09494397789239883, -0.08294348418712616, -0.07094299048185349, -0.05894249677658081, -0.046942003071308136, -0.03494150936603546, -0.022941015660762787, -0.010940521955490112, 0.0010599717497825623, 0.013060465455055237, 0.02506095916032791, 0.037061452865600586, 0.04906194657087326, 0.061062440276145935, 0.07306293398141861, 0.08506342768669128, 0.09706392139196396, 0.10906441509723663, 0.12106490880250931, 0.13306540250778198, 0.14506590366363525, 0.15706638991832733, 0.1690668761730194, 0.18106737732887268, 0.19306787848472595, 0.20506836473941803, 0.2170688509941101, 0.22906935214996338]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 10.0, 7.0, 5.0, 9.0, 5.0, 13.0, 26.0, 44.0, 55.0, 101.0, 128.0, 132.0, 131.0, 96.0, 75.0, 42.0, 22.0, 16.0, 11.0, 7.0, 5.0, 10.0, 5.0, 5.0, 0.0, 7.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.39849191904067993, -0.3884199559688568, -0.3783479928970337, -0.3682760000228882, -0.35820403695106506, -0.34813207387924194, -0.33806008100509644, -0.3279881179332733, -0.3179161548614502, -0.3078441917896271, -0.29777222871780396, -0.28770023584365845, -0.2776282727718353, -0.2675563097000122, -0.2574843168258667, -0.24741235375404358, -0.23734039068222046, -0.22726842761039734, -0.21719644963741302, -0.2071244716644287, -0.1970525085926056, -0.18698054552078247, -0.17690856754779816, -0.16683658957481384, -0.15676462650299072, -0.1466926634311676, -0.1366206854581833, -0.12654870748519897, -0.11647674441337585, -0.10640477389097214, -0.09633280336856842, -0.0862608328461647, -0.07618886232376099, -0.06611689180135727, -0.05604492127895355, -0.045972950756549835, -0.03590098023414612, -0.0258290097117424, -0.015757039189338684, -0.005685068666934967, 0.00438690185546875, 0.014458872377872467, 0.024530842900276184, 0.0346028134226799, 0.04467478394508362, 0.054746754467487335, 0.06481872498989105, 0.07489069551229477, 0.08496266603469849, 0.0950346365571022, 0.10510660707950592, 0.11517857760190964, 0.12525054812431335, 0.13532251119613647, 0.1453944891691208, 0.1554664671421051, 0.16553843021392822, 0.17561039328575134, 0.18568237125873566, 0.19575434923171997, 0.2058263123035431, 0.2158982753753662, 0.22597025334835052, 0.23604223132133484, 0.24611419439315796]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 9.0, 18.0, 17.0, 36.0, 59.0, 73.0, 108.0, 184.0, 206.0, 343.0, 451.0, 765.0, 1075.0, 1660.0, 2695.0, 4454.0, 8430.0, 18642.0, 175983.0, 790616.0, 20833.0, 9017.0, 4853.0, 2737.0, 1818.0, 1130.0, 721.0, 504.0, 333.0, 204.0, 181.0, 122.0, 75.0, 58.0, 39.0, 20.0, 28.0, 21.0, 7.0, 6.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.444580078125, -0.4297904968261719, -0.41500091552734375, -0.4002113342285156, -0.3854217529296875, -0.3706321716308594, -0.35584259033203125, -0.3410530090332031, -0.326263427734375, -0.3114738464355469, -0.29668426513671875, -0.2818946838378906, -0.2671051025390625, -0.2523155212402344, -0.23752593994140625, -0.22273635864257812, -0.20794677734375, -0.19315719604492188, -0.17836761474609375, -0.16357803344726562, -0.1487884521484375, -0.13399887084960938, -0.11920928955078125, -0.10441970825195312, -0.089630126953125, -0.07484054565429688, -0.06005096435546875, -0.045261383056640625, -0.0304718017578125, -0.015682220458984375, -0.00089263916015625, 0.013896942138671875, 0.0286865234375, 0.043476104736328125, 0.05826568603515625, 0.07305526733398438, 0.0878448486328125, 0.10263442993164062, 0.11742401123046875, 0.13221359252929688, 0.147003173828125, 0.16179275512695312, 0.17658233642578125, 0.19137191772460938, 0.2061614990234375, 0.22095108032226562, 0.23574066162109375, 0.2505302429199219, 0.26531982421875, 0.2801094055175781, 0.29489898681640625, 0.3096885681152344, 0.3244781494140625, 0.3392677307128906, 0.35405731201171875, 0.3688468933105469, 0.383636474609375, 0.3984260559082031, 0.41321563720703125, 0.4280052185058594, 0.4427947998046875, 0.4575843811035156, 0.47237396240234375, 0.4871635437011719, 0.501953125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 11.0, 13.0, 10.0, 69.0, 739.0, 27.0, 14.0, 12.0, 3.0, 7.0, 10.0, 7.0, 3.0, 4.0, 6.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10589599609375, -0.10278129577636719, -0.09966659545898438, -0.09655189514160156, -0.09343719482421875, -0.09032249450683594, -0.08720779418945312, -0.08409309387207031, -0.0809783935546875, -0.07786369323730469, -0.07474899291992188, -0.07163429260253906, -0.06851959228515625, -0.06540489196777344, -0.062290191650390625, -0.05917549133300781, -0.056060791015625, -0.05294609069824219, -0.049831390380859375, -0.04671669006347656, -0.04360198974609375, -0.04048728942871094, -0.037372589111328125, -0.03425788879394531, -0.0311431884765625, -0.028028488159179688, -0.024913787841796875, -0.021799087524414062, -0.01868438720703125, -0.015569686889648438, -0.012454986572265625, -0.009340286254882812, -0.0062255859375, -0.0031108856201171875, 3.814697265625e-06, 0.0031185150146484375, 0.00623321533203125, 0.009347915649414062, 0.012462615966796875, 0.015577316284179688, 0.0186920166015625, 0.021806716918945312, 0.024921417236328125, 0.028036117553710938, 0.03115081787109375, 0.03426551818847656, 0.037380218505859375, 0.04049491882324219, 0.043609619140625, 0.04672431945800781, 0.049839019775390625, 0.05295372009277344, 0.05606842041015625, 0.05918312072753906, 0.062297821044921875, 0.06541252136230469, 0.0685272216796875, 0.07164192199707031, 0.07475662231445312, 0.07787132263183594, 0.08098602294921875, 0.08410072326660156, 0.08721542358398438, 0.09033012390136719, 0.09344482421875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 8.0, 13.0, 20.0, 30.0, 32.0, 59.0, 49.0, 68.0, 86.0, 93.0, 135.0, 199.0, 353.0, 678.0, 1159.0, 2412.0, 5854.0, 16505.0, 63494.0, 549617.0, 339015.0, 46358.0, 12779.0, 4772.0, 2133.0, 1013.0, 577.0, 287.0, 173.0, 144.0, 82.0, 84.0, 67.0, 64.0, 36.0, 34.0, 15.0, 16.0, 10.0, 6.0, 11.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.251708984375, -0.24449729919433594, -0.23728561401367188, -0.2300739288330078, -0.22286224365234375, -0.2156505584716797, -0.20843887329101562, -0.20122718811035156, -0.1940155029296875, -0.18680381774902344, -0.17959213256835938, -0.1723804473876953, -0.16516876220703125, -0.1579570770263672, -0.15074539184570312, -0.14353370666503906, -0.136322021484375, -0.12911033630371094, -0.12189865112304688, -0.11468696594238281, -0.10747528076171875, -0.10026359558105469, -0.09305191040039062, -0.08584022521972656, -0.0786285400390625, -0.07141685485839844, -0.06420516967773438, -0.05699348449707031, -0.04978179931640625, -0.04257011413574219, -0.035358428955078125, -0.028146743774414062, -0.02093505859375, -0.013723373413085938, -0.006511688232421875, 0.0006999969482421875, 0.00791168212890625, 0.015123367309570312, 0.022335052490234375, 0.029546737670898438, 0.0367584228515625, 0.04397010803222656, 0.051181793212890625, 0.05839347839355469, 0.06560516357421875, 0.07281684875488281, 0.08002853393554688, 0.08724021911621094, 0.094451904296875, 0.10166358947753906, 0.10887527465820312, 0.11608695983886719, 0.12329864501953125, 0.1305103302001953, 0.13772201538085938, 0.14493370056152344, 0.1521453857421875, 0.15935707092285156, 0.16656875610351562, 0.1737804412841797, 0.18099212646484375, 0.1882038116455078, 0.19541549682617188, 0.20262718200683594, 0.2098388671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 8.0, 7.0, 13.0, 18.0, 13.0, 21.0, 18.0, 18.0, 20.0, 21.0, 27.0, 26.0, 26.0, 36.0, 33.0, 36.0, 44.0, 29.0, 47.0, 36.0, 33.0, 43.0, 49.0, 38.0, 37.0, 33.0, 31.0, 35.0, 35.0, 23.0, 13.0, 23.0, 13.0, 15.0, 17.0, 9.0, 22.0, 4.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.37841796875, -0.3673553466796875, -0.356292724609375, -0.3452301025390625, -0.33416748046875, -0.3231048583984375, -0.312042236328125, -0.3009796142578125, -0.2899169921875, -0.2788543701171875, -0.267791748046875, -0.2567291259765625, -0.24566650390625, -0.2346038818359375, -0.223541259765625, -0.2124786376953125, -0.201416015625, -0.1903533935546875, -0.179290771484375, -0.1682281494140625, -0.15716552734375, -0.1461029052734375, -0.135040283203125, -0.1239776611328125, -0.1129150390625, -0.1018524169921875, -0.090789794921875, -0.0797271728515625, -0.06866455078125, -0.0576019287109375, -0.046539306640625, -0.0354766845703125, -0.0244140625, -0.0133514404296875, -0.002288818359375, 0.0087738037109375, 0.01983642578125, 0.0308990478515625, 0.041961669921875, 0.0530242919921875, 0.0640869140625, 0.0751495361328125, 0.086212158203125, 0.0972747802734375, 0.10833740234375, 0.1194000244140625, 0.130462646484375, 0.1415252685546875, 0.152587890625, 0.1636505126953125, 0.174713134765625, 0.1857757568359375, 0.19683837890625, 0.2079010009765625, 0.218963623046875, 0.2300262451171875, 0.2410888671875, 0.2521514892578125, 0.263214111328125, 0.2742767333984375, 0.28533935546875, 0.2964019775390625, 0.307464599609375, 0.3185272216796875, 0.32958984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 7.0, 8.0, 9.0, 17.0, 16.0, 36.0, 59.0, 108.0, 230.0, 476.0, 1163.0, 4851.0, 174406.0, 857683.0, 7082.0, 1422.0, 490.0, 205.0, 107.0, 61.0, 31.0, 24.0, 14.0, 8.0, 12.0, 8.0, 7.0, 2.0, 0.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.114013671875, -0.11109733581542969, -0.10818099975585938, -0.10526466369628906, -0.10234832763671875, -0.09943199157714844, -0.09651565551757812, -0.09359931945800781, -0.0906829833984375, -0.08776664733886719, -0.08485031127929688, -0.08193397521972656, -0.07901763916015625, -0.07610130310058594, -0.07318496704101562, -0.07026863098144531, -0.067352294921875, -0.06443595886230469, -0.061519622802734375, -0.05860328674316406, -0.05568695068359375, -0.05277061462402344, -0.049854278564453125, -0.04693794250488281, -0.0440216064453125, -0.04110527038574219, -0.038188934326171875, -0.03527259826660156, -0.03235626220703125, -0.029439926147460938, -0.026523590087890625, -0.023607254028320312, -0.02069091796875, -0.017774581909179688, -0.014858245849609375, -0.011941909790039062, -0.00902557373046875, -0.0061092376708984375, -0.003192901611328125, -0.0002765655517578125, 0.0026397705078125, 0.0055561065673828125, 0.008472442626953125, 0.011388778686523438, 0.01430511474609375, 0.017221450805664062, 0.020137786865234375, 0.023054122924804688, 0.025970458984375, 0.028886795043945312, 0.031803131103515625, 0.03471946716308594, 0.03763580322265625, 0.04055213928222656, 0.043468475341796875, 0.04638481140136719, 0.0493011474609375, 0.05221748352050781, 0.055133819580078125, 0.05805015563964844, 0.06096649169921875, 0.06388282775878906, 0.06679916381835938, 0.06971549987792969, 0.0726318359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 13.0, 10.0, 13.0, 22.0, 22.0, 54.0, 57.0, 78.0, 82.0, 102.0, 111.0, 92.0, 81.0, 76.0, 54.0, 43.0, 20.0, 18.0, 10.0, 7.0, 11.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.329183578491211e-05, -1.2675300240516663e-05, -1.2058764696121216e-05, -1.1442229151725769e-05, -1.0825693607330322e-05, -1.0209158062934875e-05, -9.592622518539429e-06, -8.976086974143982e-06, -8.359551429748535e-06, -7.743015885353088e-06, -7.126480340957642e-06, -6.509944796562195e-06, -5.893409252166748e-06, -5.276873707771301e-06, -4.6603381633758545e-06, -4.043802618980408e-06, -3.427267074584961e-06, -2.810731530189514e-06, -2.1941959857940674e-06, -1.5776604413986206e-06, -9.611248970031738e-07, -3.4458935260772705e-07, 2.7194619178771973e-07, 8.884817361831665e-07, 1.5050172805786133e-06, 2.12155282497406e-06, 2.738088369369507e-06, 3.3546239137649536e-06, 3.9711594581604e-06, 4.587695002555847e-06, 5.204230546951294e-06, 5.820766091346741e-06, 6.4373016357421875e-06, 7.053837180137634e-06, 7.670372724533081e-06, 8.286908268928528e-06, 8.903443813323975e-06, 9.519979357719421e-06, 1.0136514902114868e-05, 1.0753050446510315e-05, 1.1369585990905762e-05, 1.1986121535301208e-05, 1.2602657079696655e-05, 1.3219192624092102e-05, 1.3835728168487549e-05, 1.4452263712882996e-05, 1.5068799257278442e-05, 1.568533480167389e-05, 1.6301870346069336e-05, 1.6918405890464783e-05, 1.753494143486023e-05, 1.8151476979255676e-05, 1.8768012523651123e-05, 1.938454806804657e-05, 2.0001083612442017e-05, 2.0617619156837463e-05, 2.123415470123291e-05, 2.1850690245628357e-05, 2.2467225790023804e-05, 2.308376133441925e-05, 2.3700296878814697e-05, 2.4316832423210144e-05, 2.493336796760559e-05, 2.5549903512001038e-05, 2.6166439056396484e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 8.0, 13.0, 14.0, 19.0, 29.0, 36.0, 55.0, 92.0, 127.0, 257.0, 494.0, 1062.0, 2937.0, 10760.0, 98576.0, 884489.0, 39317.0, 6505.0, 1997.0, 789.0, 426.0, 203.0, 102.0, 80.0, 48.0, 36.0, 22.0, 12.0, 13.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06585693359375, -0.06388139724731445, -0.061905860900878906, -0.05993032455444336, -0.05795478820800781, -0.055979251861572266, -0.05400371551513672, -0.05202817916870117, -0.050052642822265625, -0.04807710647583008, -0.04610157012939453, -0.044126033782958984, -0.04215049743652344, -0.04017496109008789, -0.038199424743652344, -0.0362238883972168, -0.03424835205078125, -0.0322728157043457, -0.030297279357910156, -0.02832174301147461, -0.026346206665039062, -0.024370670318603516, -0.02239513397216797, -0.020419597625732422, -0.018444061279296875, -0.016468524932861328, -0.014492988586425781, -0.012517452239990234, -0.010541915893554688, -0.00856637954711914, -0.006590843200683594, -0.004615306854248047, -0.0026397705078125, -0.0006642341613769531, 0.0013113021850585938, 0.0032868385314941406, 0.0052623748779296875, 0.007237911224365234, 0.009213447570800781, 0.011188983917236328, 0.013164520263671875, 0.015140056610107422, 0.01711559295654297, 0.019091129302978516, 0.021066665649414062, 0.02304220199584961, 0.025017738342285156, 0.026993274688720703, 0.02896881103515625, 0.030944347381591797, 0.032919883728027344, 0.03489542007446289, 0.03687095642089844, 0.038846492767333984, 0.04082202911376953, 0.04279756546020508, 0.044773101806640625, 0.04674863815307617, 0.04872417449951172, 0.050699710845947266, 0.05267524719238281, 0.05465078353881836, 0.056626319885253906, 0.05860185623168945, 0.060577392578125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 2.0, 9.0, 9.0, 8.0, 26.0, 14.0, 27.0, 36.0, 45.0, 78.0, 76.0, 110.0, 107.0, 108.0, 73.0, 63.0, 51.0, 31.0, 41.0, 24.0, 11.0, 14.0, 7.0, 5.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1173095703125, -0.11426067352294922, -0.11121177673339844, -0.10816287994384766, -0.10511398315429688, -0.1020650863647461, -0.09901618957519531, -0.09596729278564453, -0.09291839599609375, -0.08986949920654297, -0.08682060241699219, -0.0837717056274414, -0.08072280883789062, -0.07767391204833984, -0.07462501525878906, -0.07157611846923828, -0.0685272216796875, -0.06547832489013672, -0.06242942810058594, -0.059380531311035156, -0.056331634521484375, -0.053282737731933594, -0.05023384094238281, -0.04718494415283203, -0.04413604736328125, -0.04108715057373047, -0.03803825378417969, -0.034989356994628906, -0.031940460205078125, -0.028891563415527344, -0.025842666625976562, -0.02279376983642578, -0.019744873046875, -0.01669597625732422, -0.013647079467773438, -0.010598182678222656, -0.007549285888671875, -0.004500389099121094, -0.0014514923095703125, 0.0015974044799804688, 0.00464630126953125, 0.007695198059082031, 0.010744094848632812, 0.013792991638183594, 0.016841888427734375, 0.019890785217285156, 0.022939682006835938, 0.02598857879638672, 0.0290374755859375, 0.03208637237548828, 0.03513526916503906, 0.038184165954589844, 0.041233062744140625, 0.044281959533691406, 0.04733085632324219, 0.05037975311279297, 0.05342864990234375, 0.05647754669189453, 0.05952644348144531, 0.0625753402709961, 0.06562423706054688, 0.06867313385009766, 0.07172203063964844, 0.07477092742919922, 0.07781982421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 37.0, 670.0, 261.0, 23.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.026463508605957, -12.754094123840332, -12.48172378540039, -12.209354400634766, -11.936984062194824, -11.6646146774292, -11.392244338989258, -11.119874954223633, -10.847505569458008, -10.575136184692383, -10.302765846252441, -10.030396461486816, -9.758026123046875, -9.48565673828125, -9.213286399841309, -8.940917015075684, -8.668546676635742, -8.396177291870117, -8.123806953430176, -7.851437091827393, -7.579067230224609, -7.306697845458984, -7.034327983856201, -6.761958122253418, -6.489588260650635, -6.217218399047852, -5.944848537445068, -5.672478675842285, -5.40010929107666, -5.127738952636719, -4.855369567871094, -4.5829997062683105, -4.310628890991211, -4.038259029388428, -3.7658891677856445, -3.4935195446014404, -3.2211496829986572, -2.948779821395874, -2.67641019821167, -2.4040403366088867, -2.1316704750061035, -1.8593006134033203, -1.5869308710098267, -1.314561128616333, -1.0421912670135498, -0.7698214054107666, -0.49745166301727295, -0.2250819206237793, 0.047287940979003906, 0.31965774297714233, 0.5920275449752808, 0.8643973469734192, 1.1367671489715576, 1.4091370105743408, 1.6815067529678345, 1.9538764953613281, 2.2262463569641113, 2.4986162185668945, 2.7709860801696777, 3.043355703353882, 3.315725564956665, 3.5880954265594482, 3.8604650497436523, 4.1328349113464355, 4.405204772949219]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 7.0, 9.0, 12.0, 20.0, 26.0, 54.0, 93.0, 110.0, 153.0, 158.0, 104.0, 71.0, 58.0, 26.0, 25.0, 8.0, 15.0, 5.0, 8.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.521082878112793, -7.284963607788086, -7.048844337463379, -6.812725067138672, -6.576605796813965, -6.340486526489258, -6.104366779327393, -5.8682475090026855, -5.6321282386779785, -5.3960089683532715, -5.1598896980285645, -4.923770427703857, -4.687650680541992, -4.451531410217285, -4.215412139892578, -3.979292869567871, -3.743173599243164, -3.507054328918457, -3.27093505859375, -3.034815549850464, -2.798696279525757, -2.56257700920105, -2.3264575004577637, -2.0903382301330566, -1.8542189598083496, -1.6180996894836426, -1.381980299949646, -1.1458609104156494, -0.9097416400909424, -0.6736223697662354, -0.43750298023223877, -0.2013835906982422, 0.034735679626464844, 0.27085500955581665, 0.5069743394851685, 0.7430936694145203, 0.9792129993438721, 1.215332269668579, 1.4514516592025757, 1.6875710487365723, 1.9236903190612793, 2.1598095893859863, 2.3959288597106934, 2.6320483684539795, 2.8681676387786865, 3.1042869091033936, 3.3404064178466797, 3.5765256881713867, 3.8126449584960938, 4.048764228820801, 4.284883499145508, 4.521002769470215, 4.757122039794922, 4.993241310119629, 5.229361057281494, 5.465480327606201, 5.701599597930908, 5.937718868255615, 6.173838138580322, 6.409957408905029, 6.6460771560668945, 6.882196426391602, 7.118315696716309, 7.354434967041016, 7.590554237365723]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 13.0, 24.0, 22.0, 31.0, 56.0, 91.0, 163.0, 257.0, 476.0, 858.0, 1551.0, 3380.0, 7397.0, 22416.0, 4055415.0, 83882.0, 11475.0, 3939.0, 1548.0, 659.0, 298.0, 117.0, 71.0, 45.0, 29.0, 14.0, 14.0, 14.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0791015625, -1.0461883544921875, -1.013275146484375, -0.9803619384765625, -0.94744873046875, -0.9145355224609375, -0.881622314453125, -0.8487091064453125, -0.8157958984375, -0.7828826904296875, -0.749969482421875, -0.7170562744140625, -0.68414306640625, -0.6512298583984375, -0.618316650390625, -0.5854034423828125, -0.552490234375, -0.5195770263671875, -0.486663818359375, -0.4537506103515625, -0.42083740234375, -0.3879241943359375, -0.355010986328125, -0.3220977783203125, -0.2891845703125, -0.2562713623046875, -0.223358154296875, -0.1904449462890625, -0.15753173828125, -0.1246185302734375, -0.091705322265625, -0.0587921142578125, -0.02587890625, 0.0070343017578125, 0.039947509765625, 0.0728607177734375, 0.10577392578125, 0.1386871337890625, 0.171600341796875, 0.2045135498046875, 0.2374267578125, 0.2703399658203125, 0.303253173828125, 0.3361663818359375, 0.36907958984375, 0.4019927978515625, 0.434906005859375, 0.4678192138671875, 0.500732421875, 0.5336456298828125, 0.566558837890625, 0.5994720458984375, 0.63238525390625, 0.6652984619140625, 0.698211669921875, 0.7311248779296875, 0.7640380859375, 0.7969512939453125, 0.829864501953125, 0.8627777099609375, 0.89569091796875, 0.9286041259765625, 0.961517333984375, 0.9944305419921875, 1.02734375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 10.0, 3.0, 7.0, 7.0, 11.0, 9.0, 21.0, 18.0, 442.0, 355.0, 27.0, 7.0, 15.0, 10.0, 7.0, 11.0, 8.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.0982208251953125, -0.095306396484375, -0.0923919677734375, -0.0894775390625, -0.0865631103515625, -0.083648681640625, -0.0807342529296875, -0.07781982421875, -0.0749053955078125, -0.071990966796875, -0.0690765380859375, -0.066162109375, -0.0632476806640625, -0.060333251953125, -0.0574188232421875, -0.05450439453125, -0.0515899658203125, -0.048675537109375, -0.0457611083984375, -0.0428466796875, -0.0399322509765625, -0.037017822265625, -0.0341033935546875, -0.03118896484375, -0.0282745361328125, -0.025360107421875, -0.0224456787109375, -0.01953125, -0.0166168212890625, -0.013702392578125, -0.0107879638671875, -0.00787353515625, -0.0049591064453125, -0.002044677734375, 0.0008697509765625, 0.0037841796875, 0.0066986083984375, 0.009613037109375, 0.0125274658203125, 0.01544189453125, 0.0183563232421875, 0.021270751953125, 0.0241851806640625, 0.027099609375, 0.0300140380859375, 0.032928466796875, 0.0358428955078125, 0.03875732421875, 0.0416717529296875, 0.044586181640625, 0.0475006103515625, 0.0504150390625, 0.0533294677734375, 0.056243896484375, 0.0591583251953125, 0.06207275390625, 0.0649871826171875, 0.067901611328125, 0.0708160400390625, 0.07373046875, 0.0766448974609375, 0.079559326171875, 0.0824737548828125, 0.08538818359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 12.0, 15.0, 16.0, 16.0, 33.0, 62.0, 74.0, 119.0, 279.0, 594.0, 1315.0, 4059.0, 18178.0, 224298.0, 3864296.0, 62010.0, 12017.0, 3791.0, 1532.0, 697.0, 357.0, 168.0, 111.0, 59.0, 38.0, 30.0, 18.0, 14.0, 13.0, 9.0, 10.0, 7.0, 8.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.457275390625, -0.44309234619140625, -0.4289093017578125, -0.41472625732421875, -0.400543212890625, -0.38636016845703125, -0.3721771240234375, -0.35799407958984375, -0.34381103515625, -0.32962799072265625, -0.3154449462890625, -0.30126190185546875, -0.287078857421875, -0.27289581298828125, -0.2587127685546875, -0.24452972412109375, -0.2303466796875, -0.21616363525390625, -0.2019805908203125, -0.18779754638671875, -0.173614501953125, -0.15943145751953125, -0.1452484130859375, -0.13106536865234375, -0.11688232421875, -0.10269927978515625, -0.0885162353515625, -0.07433319091796875, -0.060150146484375, -0.04596710205078125, -0.0317840576171875, -0.01760101318359375, -0.00341796875, 0.01076507568359375, 0.0249481201171875, 0.03913116455078125, 0.053314208984375, 0.06749725341796875, 0.0816802978515625, 0.09586334228515625, 0.11004638671875, 0.12422943115234375, 0.1384124755859375, 0.15259552001953125, 0.166778564453125, 0.18096160888671875, 0.1951446533203125, 0.20932769775390625, 0.2235107421875, 0.23769378662109375, 0.2518768310546875, 0.26605987548828125, 0.280242919921875, 0.29442596435546875, 0.3086090087890625, 0.32279205322265625, 0.33697509765625, 0.35115814208984375, 0.3653411865234375, 0.37952423095703125, 0.393707275390625, 0.40789031982421875, 0.4220733642578125, 0.43625640869140625, 0.450439453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 3.0, 7.0, 11.0, 9.0, 8.0, 8.0, 18.0, 32.0, 47.0, 59.0, 131.0, 724.0, 2162.0, 268.0, 122.0, 78.0, 58.0, 49.0, 43.0, 31.0, 26.0, 21.0, 17.0, 18.0, 16.0, 11.0, 11.0, 11.0, 7.0, 5.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.0792236328125, -0.07650566101074219, -0.07378768920898438, -0.07106971740722656, -0.06835174560546875, -0.06563377380371094, -0.06291580200195312, -0.06019783020019531, -0.0574798583984375, -0.05476188659667969, -0.052043914794921875, -0.04932594299316406, -0.04660797119140625, -0.04388999938964844, -0.041172027587890625, -0.03845405578613281, -0.035736083984375, -0.03301811218261719, -0.030300140380859375, -0.027582168579101562, -0.02486419677734375, -0.022146224975585938, -0.019428253173828125, -0.016710281372070312, -0.0139923095703125, -0.011274337768554688, -0.008556365966796875, -0.0058383941650390625, -0.00312042236328125, -0.0004024505615234375, 0.002315521240234375, 0.0050334930419921875, 0.00775146484375, 0.010469436645507812, 0.013187408447265625, 0.015905380249023438, 0.01862335205078125, 0.021341323852539062, 0.024059295654296875, 0.026777267456054688, 0.0294952392578125, 0.03221321105957031, 0.034931182861328125, 0.03764915466308594, 0.04036712646484375, 0.04308509826660156, 0.045803070068359375, 0.04852104187011719, 0.051239013671875, 0.05395698547363281, 0.056674957275390625, 0.05939292907714844, 0.06211090087890625, 0.06482887268066406, 0.06754684448242188, 0.07026481628417969, 0.0729827880859375, 0.07570075988769531, 0.07841873168945312, 0.08113670349121094, 0.08385467529296875, 0.08657264709472656, 0.08929061889648438, 0.09200859069824219, 0.0947265625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 746.0, 246.0, 10.0, 4.0, 4.0, 1.0, 1.0], "bins": [-14.510116577148438, -14.259368896484375, -14.008621215820312, -13.75787353515625, -13.507124900817871, -13.256377220153809, -13.005629539489746, -12.754881858825684, -12.504134178161621, -12.253386497497559, -12.002638816833496, -11.751890182495117, -11.501142501831055, -11.250394821166992, -10.99964714050293, -10.748899459838867, -10.498151779174805, -10.247404098510742, -9.99665641784668, -9.745908737182617, -9.495160102844238, -9.244412422180176, -8.993664741516113, -8.74291706085205, -8.492168426513672, -8.24142074584961, -7.990672588348389, -7.739924907684326, -7.489177227020264, -7.238429069519043, -6.9876813888549805, -6.736933708190918, -6.486185073852539, -6.235437393188477, -5.984689235687256, -5.733941555023193, -5.483193874359131, -5.23244571685791, -4.981698036193848, -4.730950355529785, -4.480202674865723, -4.22945499420166, -3.9787070751190186, -3.727959156036377, -3.4772114753723145, -3.226463556289673, -2.9757156372070312, -2.7249679565429688, -2.474220037460327, -2.2234721183776855, -1.972724437713623, -1.7219765186309814, -1.4712287187576294, -1.2204809188842773, -0.9697329998016357, -0.7189851999282837, -0.46823740005493164, -0.2174895703792572, 0.033258259296417236, 0.28400611877441406, 0.5347539186477661, 0.7855017185211182, 1.0362496376037598, 1.2869974374771118, 1.5377452373504639]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 10.0, 12.0, 20.0, 27.0, 57.0, 72.0, 109.0, 100.0, 124.0, 104.0, 90.0, 95.0, 57.0, 45.0, 32.0, 18.0, 6.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5981602668762207, -1.5600923299789429, -1.5220245122909546, -1.4839565753936768, -1.4458887577056885, -1.4078208208084106, -1.3697530031204224, -1.3316850662231445, -1.2936172485351562, -1.2555493116378784, -1.2174814939498901, -1.1794135570526123, -1.141345739364624, -1.1032778024673462, -1.065209984779358, -1.02714204788208, -0.9890741109848022, -0.9510062336921692, -0.9129383563995361, -0.8748704791069031, -0.83680260181427, -0.7987346649169922, -0.7606667876243591, -0.7225989103317261, -0.684531033039093, -0.64646315574646, -0.6083952784538269, -0.5703274011611938, -0.532259464263916, -0.49419161677360535, -0.4561237096786499, -0.41805583238601685, -0.37998783588409424, -0.3419199585914612, -0.3038520812988281, -0.2657841742038727, -0.22771629691123962, -0.18964841961860657, -0.15158052742481232, -0.11351263523101807, -0.07544475793838501, -0.037376873195171356, 0.0006910115480422974, 0.03875889629125595, 0.0768267810344696, 0.11489465832710266, 0.1529625505208969, 0.19103044271469116, 0.22909832000732422, 0.2671661972999573, 0.30523407459259033, 0.3433019816875458, 0.38136985898017883, 0.4194377362728119, 0.45750564336776733, 0.4955735206604004, 0.5336413979530334, 0.5717092752456665, 0.6097771525382996, 0.6478450298309326, 0.6859129667282104, 0.7239807844161987, 0.7620487213134766, 0.8001165986061096, 0.8381844758987427]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 12.0, 17.0, 25.0, 34.0, 46.0, 83.0, 133.0, 178.0, 298.0, 510.0, 960.0, 1922.0, 4525.0, 11776.0, 43058.0, 915777.0, 47523.0, 12429.0, 4803.0, 2041.0, 949.0, 525.0, 339.0, 175.0, 119.0, 83.0, 55.0, 48.0, 27.0, 14.0, 7.0, 9.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.49951171875, -0.48314666748046875, -0.4667816162109375, -0.45041656494140625, -0.434051513671875, -0.41768646240234375, -0.4013214111328125, -0.38495635986328125, -0.36859130859375, -0.35222625732421875, -0.3358612060546875, -0.31949615478515625, -0.303131103515625, -0.28676605224609375, -0.2704010009765625, -0.25403594970703125, -0.2376708984375, -0.22130584716796875, -0.2049407958984375, -0.18857574462890625, -0.172210693359375, -0.15584564208984375, -0.1394805908203125, -0.12311553955078125, -0.10675048828125, -0.09038543701171875, -0.0740203857421875, -0.05765533447265625, -0.041290283203125, -0.02492523193359375, -0.0085601806640625, 0.00780487060546875, 0.024169921875, 0.04053497314453125, 0.0569000244140625, 0.07326507568359375, 0.089630126953125, 0.10599517822265625, 0.1223602294921875, 0.13872528076171875, 0.15509033203125, 0.17145538330078125, 0.1878204345703125, 0.20418548583984375, 0.220550537109375, 0.23691558837890625, 0.2532806396484375, 0.26964569091796875, 0.2860107421875, 0.30237579345703125, 0.3187408447265625, 0.33510589599609375, 0.351470947265625, 0.36783599853515625, 0.3842010498046875, 0.40056610107421875, 0.41693115234375, 0.43329620361328125, 0.4496612548828125, 0.46602630615234375, 0.482391357421875, 0.49875640869140625, 0.5151214599609375, 0.5314865112304688, 0.5478515625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 5.0, 9.0, 8.0, 12.0, 18.0, 13.0, 81.0, 429.0, 294.0, 46.0, 12.0, 12.0, 8.0, 10.0, 10.0, 6.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10565185546875, -0.10260200500488281, -0.09955215454101562, -0.09650230407714844, -0.09345245361328125, -0.09040260314941406, -0.08735275268554688, -0.08430290222167969, -0.0812530517578125, -0.07820320129394531, -0.07515335083007812, -0.07210350036621094, -0.06905364990234375, -0.06600379943847656, -0.06295394897460938, -0.05990409851074219, -0.056854248046875, -0.05380439758300781, -0.050754547119140625, -0.04770469665527344, -0.04465484619140625, -0.04160499572753906, -0.038555145263671875, -0.03550529479980469, -0.0324554443359375, -0.029405593872070312, -0.026355743408203125, -0.023305892944335938, -0.02025604248046875, -0.017206192016601562, -0.014156341552734375, -0.011106491088867188, -0.008056640625, -0.0050067901611328125, -0.001956939697265625, 0.0010929107666015625, 0.00414276123046875, 0.0071926116943359375, 0.010242462158203125, 0.013292312622070312, 0.0163421630859375, 0.019392013549804688, 0.022441864013671875, 0.025491714477539062, 0.02854156494140625, 0.03159141540527344, 0.034641265869140625, 0.03769111633300781, 0.040740966796875, 0.04379081726074219, 0.046840667724609375, 0.04989051818847656, 0.05294036865234375, 0.05599021911621094, 0.059040069580078125, 0.06208992004394531, 0.0651397705078125, 0.06818962097167969, 0.07123947143554688, 0.07428932189941406, 0.07733917236328125, 0.08038902282714844, 0.08343887329101562, 0.08648872375488281, 0.08953857421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 4.0, 3.0, 10.0, 9.0, 7.0, 11.0, 4.0, 12.0, 9.0, 21.0, 27.0, 32.0, 26.0, 39.0, 64.0, 98.0, 151.0, 256.0, 467.0, 900.0, 2171.0, 7366.0, 44771.0, 594949.0, 357426.0, 30581.0, 5546.0, 1735.0, 749.0, 392.0, 246.0, 115.0, 82.0, 50.0, 43.0, 25.0, 19.0, 26.0, 21.0, 14.0, 11.0, 12.0, 16.0, 10.0, 7.0, 9.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.3134765625, -0.304229736328125, -0.29498291015625, -0.285736083984375, -0.2764892578125, -0.267242431640625, -0.25799560546875, -0.248748779296875, -0.239501953125, -0.230255126953125, -0.22100830078125, -0.211761474609375, -0.2025146484375, -0.193267822265625, -0.18402099609375, -0.174774169921875, -0.16552734375, -0.156280517578125, -0.14703369140625, -0.137786865234375, -0.1285400390625, -0.119293212890625, -0.11004638671875, -0.100799560546875, -0.091552734375, -0.082305908203125, -0.07305908203125, -0.063812255859375, -0.0545654296875, -0.045318603515625, -0.03607177734375, -0.026824951171875, -0.017578125, -0.008331298828125, 0.00091552734375, 0.010162353515625, 0.0194091796875, 0.028656005859375, 0.03790283203125, 0.047149658203125, 0.056396484375, 0.065643310546875, 0.07489013671875, 0.084136962890625, 0.0933837890625, 0.102630615234375, 0.11187744140625, 0.121124267578125, 0.13037109375, 0.139617919921875, 0.14886474609375, 0.158111572265625, 0.1673583984375, 0.176605224609375, 0.18585205078125, 0.195098876953125, 0.204345703125, 0.213592529296875, 0.22283935546875, 0.232086181640625, 0.2413330078125, 0.250579833984375, 0.25982666015625, 0.269073486328125, 0.2783203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 7.0, 5.0, 11.0, 10.0, 9.0, 8.0, 9.0, 19.0, 24.0, 18.0, 25.0, 18.0, 30.0, 33.0, 34.0, 40.0, 29.0, 45.0, 44.0, 44.0, 36.0, 33.0, 39.0, 28.0, 51.0, 35.0, 38.0, 37.0, 25.0, 23.0, 24.0, 11.0, 23.0, 21.0, 17.0, 16.0, 11.0, 11.0, 17.0, 9.0, 13.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.220458984375, -0.21431541442871094, -0.20817184448242188, -0.2020282745361328, -0.19588470458984375, -0.1897411346435547, -0.18359756469726562, -0.17745399475097656, -0.1713104248046875, -0.16516685485839844, -0.15902328491210938, -0.1528797149658203, -0.14673614501953125, -0.1405925750732422, -0.13444900512695312, -0.12830543518066406, -0.122161865234375, -0.11601829528808594, -0.10987472534179688, -0.10373115539550781, -0.09758758544921875, -0.09144401550292969, -0.08530044555664062, -0.07915687561035156, -0.0730133056640625, -0.06686973571777344, -0.060726165771484375, -0.05458259582519531, -0.04843902587890625, -0.04229545593261719, -0.036151885986328125, -0.030008316040039062, -0.02386474609375, -0.017721176147460938, -0.011577606201171875, -0.0054340362548828125, 0.00070953369140625, 0.0068531036376953125, 0.012996673583984375, 0.019140243530273438, 0.0252838134765625, 0.03142738342285156, 0.037570953369140625, 0.04371452331542969, 0.04985809326171875, 0.05600166320800781, 0.062145233154296875, 0.06828880310058594, 0.074432373046875, 0.08057594299316406, 0.08671951293945312, 0.09286308288574219, 0.09900665283203125, 0.10515022277832031, 0.11129379272460938, 0.11743736267089844, 0.1235809326171875, 0.12972450256347656, 0.13586807250976562, 0.1420116424560547, 0.14815521240234375, 0.1542987823486328, 0.16044235229492188, 0.16658592224121094, 0.1727294921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 8.0, 13.0, 13.0, 8.0, 21.0, 28.0, 59.0, 76.0, 181.0, 386.0, 873.0, 2975.0, 17053.0, 977829.0, 42477.0, 4320.0, 1249.0, 451.0, 233.0, 108.0, 40.0, 32.0, 27.0, 24.0, 10.0, 15.0, 3.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1954345703125, -0.18995094299316406, -0.18446731567382812, -0.1789836883544922, -0.17350006103515625, -0.1680164337158203, -0.16253280639648438, -0.15704917907714844, -0.1515655517578125, -0.14608192443847656, -0.14059829711914062, -0.1351146697998047, -0.12963104248046875, -0.12414741516113281, -0.11866378784179688, -0.11318016052246094, -0.107696533203125, -0.10221290588378906, -0.09672927856445312, -0.09124565124511719, -0.08576202392578125, -0.08027839660644531, -0.07479476928710938, -0.06931114196777344, -0.0638275146484375, -0.05834388732910156, -0.052860260009765625, -0.04737663269042969, -0.04189300537109375, -0.03640937805175781, -0.030925750732421875, -0.025442123413085938, -0.01995849609375, -0.014474868774414062, -0.008991241455078125, -0.0035076141357421875, 0.00197601318359375, 0.0074596405029296875, 0.012943267822265625, 0.018426895141601562, 0.0239105224609375, 0.029394149780273438, 0.034877777099609375, 0.04036140441894531, 0.04584503173828125, 0.05132865905761719, 0.056812286376953125, 0.06229591369628906, 0.067779541015625, 0.07326316833496094, 0.07874679565429688, 0.08423042297363281, 0.08971405029296875, 0.09519767761230469, 0.10068130493164062, 0.10616493225097656, 0.1116485595703125, 0.11713218688964844, 0.12261581420898438, 0.1280994415283203, 0.13358306884765625, 0.1390666961669922, 0.14455032348632812, 0.15003395080566406, 0.155517578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 6.0, 4.0, 2.0, 8.0, 2.0, 12.0, 24.0, 445.0, 399.0, 37.0, 14.0, 8.0, 5.0, 6.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002301931381225586, -0.00022413022816181183, -0.00021806731820106506, -0.0002120044082403183, -0.00020594149827957153, -0.00019987858831882477, -0.000193815678358078, -0.00018775276839733124, -0.00018168985843658447, -0.0001756269484758377, -0.00016956403851509094, -0.00016350112855434418, -0.0001574382185935974, -0.00015137530863285065, -0.00014531239867210388, -0.00013924948871135712, -0.00013318657875061035, -0.00012712366878986359, -0.00012106075882911682, -0.00011499784886837006, -0.00010893493890762329, -0.00010287202894687653, -9.680911898612976e-05, -9.0746209025383e-05, -8.468329906463623e-05, -7.862038910388947e-05, -7.25574791431427e-05, -6.649456918239594e-05, -6.043165922164917e-05, -5.4368749260902405e-05, -4.830583930015564e-05, -4.2242929339408875e-05, -3.618001937866211e-05, -3.0117109417915344e-05, -2.405419945716858e-05, -1.7991289496421814e-05, -1.1928379535675049e-05, -5.865469574928284e-06, 1.9744038581848145e-07, 6.260350346565247e-06, 1.2323260307312012e-05, 1.8386170268058777e-05, 2.4449080228805542e-05, 3.0511990189552307e-05, 3.657490015029907e-05, 4.263781011104584e-05, 4.87007200717926e-05, 5.476363003253937e-05, 6.082653999328613e-05, 6.68894499540329e-05, 7.295235991477966e-05, 7.901526987552643e-05, 8.50781798362732e-05, 9.114108979701996e-05, 9.720399975776672e-05, 0.00010326690971851349, 0.00010932981967926025, 0.00011539272964000702, 0.00012145563960075378, 0.00012751854956150055, 0.00013358145952224731, 0.00013964436948299408, 0.00014570727944374084, 0.0001517701894044876, 0.00015783309936523438]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 13.0, 30.0, 39.0, 42.0, 95.0, 198.0, 345.0, 894.0, 3145.0, 23462.0, 915796.0, 95150.0, 6617.0, 1541.0, 543.0, 275.0, 133.0, 91.0, 50.0, 32.0, 19.0, 6.0, 9.0, 3.0, 8.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1541748046875, -0.1491546630859375, -0.144134521484375, -0.1391143798828125, -0.13409423828125, -0.1290740966796875, -0.124053955078125, -0.1190338134765625, -0.114013671875, -0.1089935302734375, -0.103973388671875, -0.0989532470703125, -0.09393310546875, -0.0889129638671875, -0.083892822265625, -0.0788726806640625, -0.0738525390625, -0.0688323974609375, -0.063812255859375, -0.0587921142578125, -0.05377197265625, -0.0487518310546875, -0.043731689453125, -0.0387115478515625, -0.03369140625, -0.0286712646484375, -0.023651123046875, -0.0186309814453125, -0.01361083984375, -0.0085906982421875, -0.003570556640625, 0.0014495849609375, 0.0064697265625, 0.0114898681640625, 0.016510009765625, 0.0215301513671875, 0.02655029296875, 0.0315704345703125, 0.036590576171875, 0.0416107177734375, 0.046630859375, 0.0516510009765625, 0.056671142578125, 0.0616912841796875, 0.06671142578125, 0.0717315673828125, 0.076751708984375, 0.0817718505859375, 0.0867919921875, 0.0918121337890625, 0.096832275390625, 0.1018524169921875, 0.10687255859375, 0.1118927001953125, 0.116912841796875, 0.1219329833984375, 0.126953125, 0.1319732666015625, 0.136993408203125, 0.1420135498046875, 0.14703369140625, 0.1520538330078125, 0.157073974609375, 0.1620941162109375, 0.1671142578125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 8.0, 17.0, 12.0, 16.0, 44.0, 39.0, 62.0, 86.0, 92.0, 133.0, 124.0, 109.0, 74.0, 45.0, 49.0, 20.0, 19.0, 14.0, 10.0, 2.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08362388610839844, -0.08008956909179688, -0.07655525207519531, -0.07302093505859375, -0.06948661804199219, -0.06595230102539062, -0.06241798400878906, -0.0588836669921875, -0.05534934997558594, -0.051815032958984375, -0.04828071594238281, -0.04474639892578125, -0.04121208190917969, -0.037677764892578125, -0.03414344787597656, -0.030609130859375, -0.027074813842773438, -0.023540496826171875, -0.020006179809570312, -0.01647186279296875, -0.012937545776367188, -0.009403228759765625, -0.0058689117431640625, -0.0023345947265625, 0.0011997222900390625, 0.004734039306640625, 0.008268356323242188, 0.01180267333984375, 0.015336990356445312, 0.018871307373046875, 0.022405624389648438, 0.02593994140625, 0.029474258422851562, 0.033008575439453125, 0.03654289245605469, 0.04007720947265625, 0.04361152648925781, 0.047145843505859375, 0.05068016052246094, 0.0542144775390625, 0.05774879455566406, 0.061283111572265625, 0.06481742858886719, 0.06835174560546875, 0.07188606262207031, 0.07542037963867188, 0.07895469665527344, 0.082489013671875, 0.08602333068847656, 0.08955764770507812, 0.09309196472167969, 0.09662628173828125, 0.10016059875488281, 0.10369491577148438, 0.10722923278808594, 0.1107635498046875, 0.11429786682128906, 0.11783218383789062, 0.12136650085449219, 0.12490081787109375, 0.1284351348876953, 0.13196945190429688, 0.13550376892089844, 0.1390380859375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 22.0, 134.0, 503.0, 240.0, 54.0, 17.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.889031171798706, -2.817814588546753, -2.746598243713379, -2.675381660461426, -2.6041650772094727, -2.5329487323760986, -2.4617321491241455, -2.3905158042907715, -2.3192992210388184, -2.2480826377868652, -2.176866292953491, -2.105649709701538, -2.034433364868164, -1.963216781616211, -1.8920001983642578, -1.8207837343215942, -1.7495672702789307, -1.678350806236267, -1.6071343421936035, -1.5359177589416504, -1.4647012948989868, -1.3934848308563232, -1.3222682476043701, -1.2510517835617065, -1.179835319519043, -1.1086188554763794, -1.0374023914337158, -0.9661858081817627, -0.8949693441390991, -0.8237528800964355, -0.7525363564491272, -0.6813198328018188, -0.6101036071777344, -0.5388871431350708, -0.46767061948776245, -0.3964541256427765, -0.3252376317977905, -0.25402113795280457, -0.1828046441078186, -0.11158815026283264, -0.04037165641784668, 0.030844837427139282, 0.10206133127212524, 0.1732778251171112, 0.24449431896209717, 0.31571081280708313, 0.3869273066520691, 0.45814380049705505, 0.529360294342041, 0.6005767583847046, 0.6717932820320129, 0.7430098056793213, 0.8142262697219849, 0.8854427337646484, 0.9566592574119568, 1.0278757810592651, 1.0990922451019287, 1.1703087091445923, 1.2415251731872559, 1.312741756439209, 1.3839582204818726, 1.4551746845245361, 1.5263912677764893, 1.5976077318191528, 1.6688241958618164]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 10.0, 7.0, 9.0, 7.0, 11.0, 16.0, 24.0, 30.0, 42.0, 43.0, 54.0, 61.0, 69.0, 82.0, 73.0, 69.0, 56.0, 65.0, 57.0, 38.0, 38.0, 22.0, 21.0, 17.0, 20.0, 12.0, 7.0, 8.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.9664127826690674, -1.9060291051864624, -1.8456453084945679, -1.785261631011963, -1.7248778343200684, -1.6644941568374634, -1.6041104793548584, -1.5437266826629639, -1.4833428859710693, -1.4229592084884644, -1.3625754117965698, -1.3021917343139648, -1.2418079376220703, -1.1814242601394653, -1.1210405826568604, -1.0606567859649658, -1.0002731084823608, -0.9398893713951111, -0.8795056343078613, -0.8191219568252563, -0.7587381601333618, -0.6983544826507568, -0.6379707455635071, -0.5775870084762573, -0.5172032713890076, -0.4568195343017578, -0.39643579721450806, -0.3360520899295807, -0.27566835284233093, -0.21528461575508118, -0.1549009084701538, -0.09451717138290405, -0.0341334342956543, 0.026250295341014862, 0.08663402497768402, 0.14701774716377258, 0.20740148425102234, 0.2677852213382721, 0.32816892862319946, 0.3885526657104492, 0.448936402797699, 0.5093201398849487, 0.5697038769721985, 0.6300876140594482, 0.6904712915420532, 0.7508550882339478, 0.8112387657165527, 0.8716225028038025, 0.9320062398910522, 0.992389976978302, 1.0527737140655518, 1.1131573915481567, 1.1735411882400513, 1.2339248657226562, 1.2943086624145508, 1.3546923398971558, 1.4150760173797607, 1.4754596948623657, 1.5358434915542603, 1.5962271690368652, 1.6566109657287598, 1.7169946432113647, 1.7773783206939697, 1.8377621173858643, 1.8981459140777588]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 10.0, 12.0, 12.0, 18.0, 18.0, 28.0, 67.0, 59.0, 82.0, 120.0, 259.0, 521.0, 1201.0, 2664.0, 8070.0, 97311.0, 4065752.0, 13045.0, 2894.0, 1117.0, 505.0, 234.0, 93.0, 53.0, 35.0, 25.0, 15.0, 14.0, 8.0, 6.0, 11.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1512908935546875, -1.113128662109375, -1.0749664306640625, -1.03680419921875, -0.9986419677734375, -0.960479736328125, -0.9223175048828125, -0.8841552734375, -0.8459930419921875, -0.807830810546875, -0.7696685791015625, -0.73150634765625, -0.6933441162109375, -0.655181884765625, -0.6170196533203125, -0.578857421875, -0.5406951904296875, -0.502532958984375, -0.4643707275390625, -0.42620849609375, -0.3880462646484375, -0.349884033203125, -0.3117218017578125, -0.2735595703125, -0.2353973388671875, -0.197235107421875, -0.1590728759765625, -0.12091064453125, -0.0827484130859375, -0.044586181640625, -0.0064239501953125, 0.03173828125, 0.0699005126953125, 0.108062744140625, 0.1462249755859375, 0.18438720703125, 0.2225494384765625, 0.260711669921875, 0.2988739013671875, 0.3370361328125, 0.3751983642578125, 0.413360595703125, 0.4515228271484375, 0.48968505859375, 0.5278472900390625, 0.566009521484375, 0.6041717529296875, 0.642333984375, 0.6804962158203125, 0.718658447265625, 0.7568206787109375, 0.79498291015625, 0.8331451416015625, 0.871307373046875, 0.9094696044921875, 0.9476318359375, 0.9857940673828125, 1.023956298828125, 1.0621185302734375, 1.10028076171875, 1.1384429931640625, 1.176605224609375, 1.2147674560546875, 1.2529296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 7.0, 9.0, 5.0, 12.0, 8.0, 19.0, 13.0, 28.0, 159.0, 418.0, 214.0, 47.0, 15.0, 12.0, 13.0, 9.0, 7.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10174560546875, -0.09870433807373047, -0.09566307067871094, -0.0926218032836914, -0.08958053588867188, -0.08653926849365234, -0.08349800109863281, -0.08045673370361328, -0.07741546630859375, -0.07437419891357422, -0.07133293151855469, -0.06829166412353516, -0.06525039672851562, -0.062209129333496094, -0.05916786193847656, -0.05612659454345703, -0.0530853271484375, -0.05004405975341797, -0.04700279235839844, -0.043961524963378906, -0.040920257568359375, -0.037878990173339844, -0.03483772277832031, -0.03179645538330078, -0.02875518798828125, -0.02571392059326172, -0.022672653198242188, -0.019631385803222656, -0.016590118408203125, -0.013548851013183594, -0.010507583618164062, -0.007466316223144531, -0.004425048828125, -0.0013837814331054688, 0.0016574859619140625, 0.004698753356933594, 0.007740020751953125, 0.010781288146972656, 0.013822555541992188, 0.01686382293701172, 0.01990509033203125, 0.02294635772705078, 0.025987625122070312, 0.029028892517089844, 0.032070159912109375, 0.035111427307128906, 0.03815269470214844, 0.04119396209716797, 0.0442352294921875, 0.04727649688720703, 0.05031776428222656, 0.053359031677246094, 0.056400299072265625, 0.059441566467285156, 0.06248283386230469, 0.06552410125732422, 0.06856536865234375, 0.07160663604736328, 0.07464790344238281, 0.07768917083740234, 0.08073043823242188, 0.0837717056274414, 0.08681297302246094, 0.08985424041748047, 0.0928955078125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 6.0, 12.0, 6.0, 9.0, 12.0, 12.0, 26.0, 32.0, 42.0, 67.0, 114.0, 242.0, 868.0, 6484.0, 3175249.0, 1003323.0, 6356.0, 854.0, 264.0, 110.0, 67.0, 34.0, 28.0, 13.0, 9.0, 14.0, 3.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8319625854492188, -0.8011322021484375, -0.7703018188476562, -0.739471435546875, -0.7086410522460938, -0.6778106689453125, -0.6469802856445312, -0.61614990234375, -0.5853195190429688, -0.5544891357421875, -0.5236587524414062, -0.492828369140625, -0.46199798583984375, -0.4311676025390625, -0.40033721923828125, -0.3695068359375, -0.33867645263671875, -0.3078460693359375, -0.27701568603515625, -0.246185302734375, -0.21535491943359375, -0.1845245361328125, -0.15369415283203125, -0.12286376953125, -0.09203338623046875, -0.0612030029296875, -0.03037261962890625, 0.000457763671875, 0.03128814697265625, 0.0621185302734375, 0.09294891357421875, 0.123779296875, 0.15460968017578125, 0.1854400634765625, 0.21627044677734375, 0.247100830078125, 0.27793121337890625, 0.3087615966796875, 0.33959197998046875, 0.37042236328125, 0.40125274658203125, 0.4320831298828125, 0.46291351318359375, 0.493743896484375, 0.5245742797851562, 0.5554046630859375, 0.5862350463867188, 0.6170654296875, 0.6478958129882812, 0.6787261962890625, 0.7095565795898438, 0.740386962890625, 0.7712173461914062, 0.8020477294921875, 0.8328781127929688, 0.86370849609375, 0.8945388793945312, 0.9253692626953125, 0.9561996459960938, 0.987030029296875, 1.0178604125976562, 1.0486907958984375, 1.0795211791992188, 1.1103515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 4.0, 6.0, 11.0, 8.0, 13.0, 17.0, 20.0, 42.0, 55.0, 106.0, 406.0, 2709.0, 279.0, 134.0, 61.0, 50.0, 23.0, 23.0, 28.0, 15.0, 11.0, 7.0, 6.0, 8.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.141357421875, -0.1375732421875, -0.1337890625, -0.1300048828125, -0.126220703125, -0.1224365234375, -0.11865234375, -0.1148681640625, -0.111083984375, -0.1072998046875, -0.103515625, -0.0997314453125, -0.095947265625, -0.0921630859375, -0.08837890625, -0.0845947265625, -0.080810546875, -0.0770263671875, -0.0732421875, -0.0694580078125, -0.065673828125, -0.0618896484375, -0.05810546875, -0.0543212890625, -0.050537109375, -0.0467529296875, -0.04296875, -0.0391845703125, -0.035400390625, -0.0316162109375, -0.02783203125, -0.0240478515625, -0.020263671875, -0.0164794921875, -0.0126953125, -0.0089111328125, -0.005126953125, -0.0013427734375, 0.00244140625, 0.0062255859375, 0.010009765625, 0.0137939453125, 0.017578125, 0.0213623046875, 0.025146484375, 0.0289306640625, 0.03271484375, 0.0364990234375, 0.040283203125, 0.0440673828125, 0.0478515625, 0.0516357421875, 0.055419921875, 0.0592041015625, 0.06298828125, 0.0667724609375, 0.070556640625, 0.0743408203125, 0.078125, 0.0819091796875, 0.085693359375, 0.0894775390625, 0.09326171875, 0.0970458984375, 0.100830078125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 665.0, 330.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.783815383911133, -6.660317420959473, -6.5368194580078125, -6.413321018218994, -6.289823055267334, -6.166325092315674, -6.042827129364014, -5.919328689575195, -5.795830726623535, -5.672332763671875, -5.548834800720215, -5.4253363609313965, -5.301838397979736, -5.178340435028076, -5.054842472076416, -4.931344032287598, -4.8078460693359375, -4.684348106384277, -4.560850143432617, -4.437351703643799, -4.313853740692139, -4.1903557777404785, -4.066857814788818, -3.943359613418579, -3.819861650466919, -3.696363687515259, -3.5728654861450195, -3.4493675231933594, -3.32586932182312, -3.20237135887146, -3.0788731575012207, -2.9553751945495605, -2.831876754760742, -2.708378791809082, -2.5848805904388428, -2.4613826274871826, -2.3378844261169434, -2.214386463165283, -2.090888261795044, -1.9673902988433838, -1.8438923358917236, -1.720394253730774, -1.5968961715698242, -1.4733980894088745, -1.3499000072479248, -1.2264020442962646, -1.1029038429260254, -0.9794058203697205, -0.855907678604126, -0.7324095964431763, -0.6089115142822266, -0.48541346192359924, -0.36191537976264954, -0.23841732740402222, -0.11491924524307251, 0.008578836917877197, 0.1320769190788269, 0.2555750012397766, 0.3790730834007263, 0.5025711059570312, 0.626069188117981, 0.7495672702789307, 0.8730653524398804, 0.9965634346008301, 1.1200615167617798]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 5.0, 8.0, 7.0, 13.0, 31.0, 38.0, 59.0, 60.0, 76.0, 102.0, 86.0, 106.0, 85.0, 72.0, 70.0, 53.0, 35.0, 25.0, 21.0, 13.0, 7.0, 5.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5499835014343262, -0.5298078060150146, -0.5096321702003479, -0.4894564747810364, -0.46928080916404724, -0.4491051435470581, -0.42892947793006897, -0.40875381231307983, -0.3885781168937683, -0.3684024512767792, -0.34822678565979004, -0.3280510902404785, -0.3078754246234894, -0.28769975900650024, -0.2675240933895111, -0.24734841287136078, -0.22717276215553284, -0.2069970965385437, -0.18682141602039337, -0.16664575040340424, -0.1464700698852539, -0.12629440426826477, -0.10611873865127563, -0.0859430581331253, -0.06576739251613617, -0.04559171944856644, -0.025416050106287003, -0.005240380764007568, 0.014935292303562164, 0.0351109653711319, 0.05528663098812103, 0.07546231150627136, 0.0956379771232605, 0.11581365019083023, 0.13598932325839996, 0.1561649888753891, 0.17634066939353943, 0.19651633501052856, 0.2166920006275177, 0.23686768114566803, 0.25704336166381836, 0.2772190272808075, 0.29739469289779663, 0.31757038831710815, 0.3377460539340973, 0.3579217195510864, 0.37809738516807556, 0.3982730507850647, 0.41844871640205383, 0.43862438201904297, 0.4588000476360321, 0.47897571325302124, 0.49915140867233276, 0.5193270444869995, 0.539502739906311, 0.5596784353256226, 0.5798540711402893, 0.6000297665596008, 0.6202054023742676, 0.6403810977935791, 0.6605567336082458, 0.6807324290275574, 0.7009080648422241, 0.7210837602615356, 0.7412594556808472]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 17.0, 9.0, 19.0, 27.0, 17.0, 24.0, 31.0, 43.0, 60.0, 87.0, 145.0, 194.0, 274.0, 491.0, 930.0, 1892.0, 4380.0, 14350.0, 139988.0, 841478.0, 31321.0, 6917.0, 2784.0, 1217.0, 636.0, 400.0, 233.0, 137.0, 115.0, 89.0, 49.0, 27.0, 38.0, 30.0, 19.0, 18.0, 12.0, 17.0, 8.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.45361328125, -0.4390869140625, -0.424560546875, -0.4100341796875, -0.3955078125, -0.3809814453125, -0.366455078125, -0.3519287109375, -0.33740234375, -0.3228759765625, -0.308349609375, -0.2938232421875, -0.279296875, -0.2647705078125, -0.250244140625, -0.2357177734375, -0.22119140625, -0.2066650390625, -0.192138671875, -0.1776123046875, -0.1630859375, -0.1485595703125, -0.134033203125, -0.1195068359375, -0.10498046875, -0.0904541015625, -0.075927734375, -0.0614013671875, -0.046875, -0.0323486328125, -0.017822265625, -0.0032958984375, 0.01123046875, 0.0257568359375, 0.040283203125, 0.0548095703125, 0.0693359375, 0.0838623046875, 0.098388671875, 0.1129150390625, 0.12744140625, 0.1419677734375, 0.156494140625, 0.1710205078125, 0.185546875, 0.2000732421875, 0.214599609375, 0.2291259765625, 0.24365234375, 0.2581787109375, 0.272705078125, 0.2872314453125, 0.3017578125, 0.3162841796875, 0.330810546875, 0.3453369140625, 0.35986328125, 0.3743896484375, 0.388916015625, 0.4034423828125, 0.41796875, 0.4324951171875, 0.447021484375, 0.4615478515625, 0.47607421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 12.0, 10.0, 14.0, 16.0, 17.0, 116.0, 325.0, 304.0, 104.0, 27.0, 18.0, 9.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.0956888198852539, -0.09268379211425781, -0.08967876434326172, -0.08667373657226562, -0.08366870880126953, -0.08066368103027344, -0.07765865325927734, -0.07465362548828125, -0.07164859771728516, -0.06864356994628906, -0.06563854217529297, -0.06263351440429688, -0.05962848663330078, -0.05662345886230469, -0.053618431091308594, -0.0506134033203125, -0.047608375549316406, -0.04460334777832031, -0.04159832000732422, -0.038593292236328125, -0.03558826446533203, -0.03258323669433594, -0.029578208923339844, -0.02657318115234375, -0.023568153381347656, -0.020563125610351562, -0.01755809783935547, -0.014553070068359375, -0.011548042297363281, -0.008543014526367188, -0.005537986755371094, -0.002532958984375, 0.00047206878662109375, 0.0034770965576171875, 0.006482124328613281, 0.009487152099609375, 0.012492179870605469, 0.015497207641601562, 0.018502235412597656, 0.02150726318359375, 0.024512290954589844, 0.027517318725585938, 0.03052234649658203, 0.033527374267578125, 0.03653240203857422, 0.03953742980957031, 0.042542457580566406, 0.0455474853515625, 0.048552513122558594, 0.05155754089355469, 0.05456256866455078, 0.057567596435546875, 0.06057262420654297, 0.06357765197753906, 0.06658267974853516, 0.06958770751953125, 0.07259273529052734, 0.07559776306152344, 0.07860279083251953, 0.08160781860351562, 0.08461284637451172, 0.08761787414550781, 0.0906229019165039, 0.0936279296875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 6.0, 13.0, 8.0, 10.0, 7.0, 19.0, 20.0, 19.0, 32.0, 51.0, 59.0, 67.0, 105.0, 130.0, 223.0, 326.0, 582.0, 1009.0, 2020.0, 6162.0, 40531.0, 798150.0, 179255.0, 13120.0, 3282.0, 1399.0, 664.0, 403.0, 275.0, 173.0, 103.0, 90.0, 50.0, 42.0, 33.0, 26.0, 10.0, 18.0, 15.0, 11.0, 9.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.420166015625, -0.4073333740234375, -0.394500732421875, -0.3816680908203125, -0.36883544921875, -0.3560028076171875, -0.343170166015625, -0.3303375244140625, -0.3175048828125, -0.3046722412109375, -0.291839599609375, -0.2790069580078125, -0.26617431640625, -0.2533416748046875, -0.240509033203125, -0.2276763916015625, -0.21484375, -0.2020111083984375, -0.189178466796875, -0.1763458251953125, -0.16351318359375, -0.1506805419921875, -0.137847900390625, -0.1250152587890625, -0.1121826171875, -0.0993499755859375, -0.086517333984375, -0.0736846923828125, -0.06085205078125, -0.0480194091796875, -0.035186767578125, -0.0223541259765625, -0.009521484375, 0.0033111572265625, 0.016143798828125, 0.0289764404296875, 0.04180908203125, 0.0546417236328125, 0.067474365234375, 0.0803070068359375, 0.0931396484375, 0.1059722900390625, 0.118804931640625, 0.1316375732421875, 0.14447021484375, 0.1573028564453125, 0.170135498046875, 0.1829681396484375, 0.19580078125, 0.2086334228515625, 0.221466064453125, 0.2342987060546875, 0.24713134765625, 0.2599639892578125, 0.272796630859375, 0.2856292724609375, 0.2984619140625, 0.3112945556640625, 0.324127197265625, 0.3369598388671875, 0.34979248046875, 0.3626251220703125, 0.375457763671875, 0.3882904052734375, 0.401123046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 9.0, 10.0, 11.0, 13.0, 15.0, 26.0, 19.0, 26.0, 31.0, 26.0, 41.0, 36.0, 39.0, 43.0, 51.0, 48.0, 41.0, 46.0, 38.0, 44.0, 45.0, 31.0, 39.0, 35.0, 30.0, 31.0, 22.0, 23.0, 14.0, 13.0, 13.0, 17.0, 15.0, 7.0, 6.0, 7.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1868896484375, -0.18124008178710938, -0.17559051513671875, -0.16994094848632812, -0.1642913818359375, -0.15864181518554688, -0.15299224853515625, -0.14734268188476562, -0.141693115234375, -0.13604354858398438, -0.13039398193359375, -0.12474441528320312, -0.1190948486328125, -0.11344528198242188, -0.10779571533203125, -0.10214614868164062, -0.09649658203125, -0.09084701538085938, -0.08519744873046875, -0.07954788208007812, -0.0738983154296875, -0.06824874877929688, -0.06259918212890625, -0.056949615478515625, -0.051300048828125, -0.045650482177734375, -0.04000091552734375, -0.034351348876953125, -0.0287017822265625, -0.023052215576171875, -0.01740264892578125, -0.011753082275390625, -0.006103515625, -0.000453948974609375, 0.00519561767578125, 0.010845184326171875, 0.0164947509765625, 0.022144317626953125, 0.02779388427734375, 0.033443450927734375, 0.039093017578125, 0.044742584228515625, 0.05039215087890625, 0.056041717529296875, 0.0616912841796875, 0.06734085083007812, 0.07299041748046875, 0.07863998413085938, 0.08428955078125, 0.08993911743164062, 0.09558868408203125, 0.10123825073242188, 0.1068878173828125, 0.11253738403320312, 0.11818695068359375, 0.12383651733398438, 0.129486083984375, 0.13513565063476562, 0.14078521728515625, 0.14643478393554688, 0.1520843505859375, 0.15773391723632812, 0.16338348388671875, 0.16903305053710938, 0.1746826171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 9.0, 12.0, 9.0, 24.0, 35.0, 54.0, 96.0, 137.0, 280.0, 577.0, 1474.0, 6130.0, 65073.0, 918035.0, 48975.0, 5258.0, 1279.0, 477.0, 224.0, 130.0, 63.0, 49.0, 41.0, 32.0, 17.0, 14.0, 9.0, 7.0, 2.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.25537109375, -0.24795913696289062, -0.24054718017578125, -0.23313522338867188, -0.2257232666015625, -0.21831130981445312, -0.21089935302734375, -0.20348739624023438, -0.196075439453125, -0.18866348266601562, -0.18125152587890625, -0.17383956909179688, -0.1664276123046875, -0.15901565551757812, -0.15160369873046875, -0.14419174194335938, -0.13677978515625, -0.12936782836914062, -0.12195587158203125, -0.11454391479492188, -0.1071319580078125, -0.09972000122070312, -0.09230804443359375, -0.08489608764648438, -0.077484130859375, -0.07007217407226562, -0.06266021728515625, -0.055248260498046875, -0.0478363037109375, -0.040424346923828125, -0.03301239013671875, -0.025600433349609375, -0.0181884765625, -0.010776519775390625, -0.00336456298828125, 0.004047393798828125, 0.0114593505859375, 0.018871307373046875, 0.02628326416015625, 0.033695220947265625, 0.041107177734375, 0.048519134521484375, 0.05593109130859375, 0.06334304809570312, 0.0707550048828125, 0.07816696166992188, 0.08557891845703125, 0.09299087524414062, 0.10040283203125, 0.10781478881835938, 0.11522674560546875, 0.12263870239257812, 0.1300506591796875, 0.13746261596679688, 0.14487457275390625, 0.15228652954101562, 0.159698486328125, 0.16711044311523438, 0.17452239990234375, 0.18193435668945312, 0.1893463134765625, 0.19675827026367188, 0.20417022705078125, 0.21158218383789062, 0.218994140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 10.0, 3.0, 3.0, 13.0, 4.0, 11.0, 13.0, 20.0, 27.0, 39.0, 56.0, 57.0, 108.0, 249.0, 112.0, 66.0, 58.0, 34.0, 31.0, 20.0, 15.0, 16.0, 9.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00022661685943603516, -0.00022023916244506836, -0.00021386146545410156, -0.00020748376846313477, -0.00020110607147216797, -0.00019472837448120117, -0.00018835067749023438, -0.00018197298049926758, -0.00017559528350830078, -0.00016921758651733398, -0.0001628398895263672, -0.0001564621925354004, -0.0001500844955444336, -0.0001437067985534668, -0.0001373291015625, -0.0001309514045715332, -0.0001245737075805664, -0.00011819601058959961, -0.00011181831359863281, -0.00010544061660766602, -9.906291961669922e-05, -9.268522262573242e-05, -8.630752563476562e-05, -7.992982864379883e-05, -7.355213165283203e-05, -6.717443466186523e-05, -6.079673767089844e-05, -5.441904067993164e-05, -4.8041343688964844e-05, -4.166364669799805e-05, -3.528594970703125e-05, -2.8908252716064453e-05, -2.2530555725097656e-05, -1.615285873413086e-05, -9.775161743164062e-06, -3.3974647521972656e-06, 2.9802322387695312e-06, 9.357929229736328e-06, 1.5735626220703125e-05, 2.2113323211669922e-05, 2.849102020263672e-05, 3.4868717193603516e-05, 4.124641418457031e-05, 4.762411117553711e-05, 5.4001808166503906e-05, 6.03795051574707e-05, 6.67572021484375e-05, 7.31348991394043e-05, 7.95125961303711e-05, 8.589029312133789e-05, 9.226799011230469e-05, 9.864568710327148e-05, 0.00010502338409423828, 0.00011140108108520508, 0.00011777877807617188, 0.00012415647506713867, 0.00013053417205810547, 0.00013691186904907227, 0.00014328956604003906, 0.00014966726303100586, 0.00015604496002197266, 0.00016242265701293945, 0.00016880035400390625, 0.00017517805099487305, 0.00018155574798583984]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 14.0, 8.0, 11.0, 26.0, 39.0, 55.0, 72.0, 176.0, 385.0, 971.0, 5173.0, 321141.0, 712628.0, 5960.0, 1100.0, 386.0, 167.0, 78.0, 55.0, 29.0, 26.0, 17.0, 7.0, 7.0, 9.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.496826171875, -0.48223114013671875, -0.4676361083984375, -0.45304107666015625, -0.438446044921875, -0.42385101318359375, -0.4092559814453125, -0.39466094970703125, -0.38006591796875, -0.36547088623046875, -0.3508758544921875, -0.33628082275390625, -0.321685791015625, -0.30709075927734375, -0.2924957275390625, -0.27790069580078125, -0.2633056640625, -0.24871063232421875, -0.2341156005859375, -0.21952056884765625, -0.204925537109375, -0.19033050537109375, -0.1757354736328125, -0.16114044189453125, -0.14654541015625, -0.13195037841796875, -0.1173553466796875, -0.10276031494140625, -0.088165283203125, -0.07357025146484375, -0.0589752197265625, -0.04438018798828125, -0.02978515625, -0.01519012451171875, -0.0005950927734375, 0.01399993896484375, 0.028594970703125, 0.04319000244140625, 0.0577850341796875, 0.07238006591796875, 0.08697509765625, 0.10157012939453125, 0.1161651611328125, 0.13076019287109375, 0.145355224609375, 0.15995025634765625, 0.1745452880859375, 0.18914031982421875, 0.2037353515625, 0.21833038330078125, 0.2329254150390625, 0.24752044677734375, 0.262115478515625, 0.27671051025390625, 0.2913055419921875, 0.30590057373046875, 0.32049560546875, 0.33509063720703125, 0.3496856689453125, 0.36428070068359375, 0.378875732421875, 0.39347076416015625, 0.4080657958984375, 0.42266082763671875, 0.437255859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 4.0, 7.0, 5.0, 10.0, 9.0, 15.0, 16.0, 37.0, 49.0, 91.0, 142.0, 184.0, 144.0, 96.0, 51.0, 31.0, 24.0, 17.0, 11.0, 15.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2091064453125, -0.2036876678466797, -0.19826889038085938, -0.19285011291503906, -0.18743133544921875, -0.18201255798339844, -0.17659378051757812, -0.1711750030517578, -0.1657562255859375, -0.1603374481201172, -0.15491867065429688, -0.14949989318847656, -0.14408111572265625, -0.13866233825683594, -0.13324356079101562, -0.1278247833251953, -0.122406005859375, -0.11698722839355469, -0.11156845092773438, -0.10614967346191406, -0.10073089599609375, -0.09531211853027344, -0.08989334106445312, -0.08447456359863281, -0.0790557861328125, -0.07363700866699219, -0.06821823120117188, -0.06279945373535156, -0.05738067626953125, -0.05196189880371094, -0.046543121337890625, -0.04112434387207031, -0.03570556640625, -0.030286788940429688, -0.024868011474609375, -0.019449234008789062, -0.01403045654296875, -0.008611679077148438, -0.003192901611328125, 0.0022258758544921875, 0.0076446533203125, 0.013063430786132812, 0.018482208251953125, 0.023900985717773438, 0.02931976318359375, 0.03473854064941406, 0.040157318115234375, 0.04557609558105469, 0.050994873046875, 0.05641365051269531, 0.061832427978515625, 0.06725120544433594, 0.07266998291015625, 0.07808876037597656, 0.08350753784179688, 0.08892631530761719, 0.0943450927734375, 0.09976387023925781, 0.10518264770507812, 0.11060142517089844, 0.11602020263671875, 0.12143898010253906, 0.12685775756835938, 0.1322765350341797, 0.1376953125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 12.0, 24.0, 90.0, 377.0, 401.0, 69.0, 13.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6290292739868164, -3.5252389907836914, -3.4214487075805664, -3.3176584243774414, -3.2138681411743164, -3.1100778579711914, -3.0062878131866455, -2.9024975299835205, -2.7987072467803955, -2.6949169635772705, -2.5911266803741455, -2.4873363971710205, -2.3835463523864746, -2.2797560691833496, -2.1759657859802246, -2.0721755027770996, -1.9683852195739746, -1.8645949363708496, -1.7608046531677246, -1.6570144891738892, -1.5532242059707642, -1.4494339227676392, -1.3456437587738037, -1.2418534755706787, -1.1380631923675537, -1.0342729091644287, -0.9304826855659485, -0.8266924619674683, -0.7229021787643433, -0.6191118955612183, -0.515321671962738, -0.4115314483642578, -0.3077414035797119, -0.2039511501789093, -0.10016089677810669, 0.003629356622695923, 0.10741961002349854, 0.21120989322662354, 0.31500011682510376, 0.418790340423584, 0.522580623626709, 0.626370906829834, 0.7301611304283142, 0.8339513540267944, 0.9377416372299194, 1.0415319204330444, 1.1453220844268799, 1.2491123676300049, 1.3529026508331299, 1.4566929340362549, 1.5604832172393799, 1.6642733812332153, 1.7680636644363403, 1.8718539476394653, 1.9756441116333008, 2.079434394836426, 2.183224678039551, 2.287014961242676, 2.390805244445801, 2.494595527648926, 2.598385810852051, 2.702176094055176, 2.8059661388397217, 2.9097564220428467, 3.0135467052459717]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 9.0, 5.0, 12.0, 21.0, 20.0, 28.0, 50.0, 40.0, 44.0, 60.0, 54.0, 55.0, 82.0, 66.0, 70.0, 58.0, 70.0, 59.0, 38.0, 38.0, 34.0, 20.0, 23.0, 9.0, 12.0, 4.0, 10.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.2630128860473633, -2.1985321044921875, -2.134051561355591, -2.069571018218994, -2.0050902366638184, -1.9406095743179321, -1.876128911972046, -1.8116482496261597, -1.7471675872802734, -1.6826869249343872, -1.618206262588501, -1.5537256002426147, -1.4892449378967285, -1.4247642755508423, -1.360283613204956, -1.2958029508590698, -1.2313222885131836, -1.1668416261672974, -1.1023609638214111, -1.037880301475525, -0.9733996391296387, -0.9089189767837524, -0.8444383144378662, -0.77995765209198, -0.7154769897460938, -0.6509963274002075, -0.5865156650543213, -0.5220350027084351, -0.45755434036254883, -0.3930736780166626, -0.32859301567077637, -0.26411235332489014, -0.1996316909790039, -0.13515102863311768, -0.07067036628723145, -0.006189703941345215, 0.058290958404541016, 0.12277162075042725, 0.18725228309631348, 0.2517329454421997, 0.31621360778808594, 0.38069427013397217, 0.4451749324798584, 0.5096555948257446, 0.5741362571716309, 0.6386169195175171, 0.7030975818634033, 0.7675782442092896, 0.8320589065551758, 0.896539568901062, 0.9610202312469482, 1.0255008935928345, 1.0899815559387207, 1.154462218284607, 1.2189428806304932, 1.2834235429763794, 1.3479042053222656, 1.4123848676681519, 1.476865530014038, 1.5413461923599243, 1.6058268547058105, 1.6703075170516968, 1.734788179397583, 1.7992688417434692, 1.8637495040893555]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 17.0, 24.0, 55.0, 124.0, 442.0, 5764.0, 4184984.0, 2458.0, 285.0, 65.0, 21.0, 17.0, 18.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.7738037109375, -2.672607421875, -2.5714111328125, -2.47021484375, -2.3690185546875, -2.267822265625, -2.1666259765625, -2.0654296875, -1.9642333984375, -1.863037109375, -1.7618408203125, -1.66064453125, -1.5594482421875, -1.458251953125, -1.3570556640625, -1.255859375, -1.1546630859375, -1.053466796875, -0.9522705078125, -0.85107421875, -0.7498779296875, -0.648681640625, -0.5474853515625, -0.4462890625, -0.3450927734375, -0.243896484375, -0.1427001953125, -0.04150390625, 0.0596923828125, 0.160888671875, 0.2620849609375, 0.36328125, 0.4644775390625, 0.565673828125, 0.6668701171875, 0.76806640625, 0.8692626953125, 0.970458984375, 1.0716552734375, 1.1728515625, 1.2740478515625, 1.375244140625, 1.4764404296875, 1.57763671875, 1.6788330078125, 1.780029296875, 1.8812255859375, 1.982421875, 2.0836181640625, 2.184814453125, 2.2860107421875, 2.38720703125, 2.4884033203125, 2.589599609375, 2.6907958984375, 2.7919921875, 2.8931884765625, 2.994384765625, 3.0955810546875, 3.19677734375, 3.2979736328125, 3.399169921875, 3.5003662109375, 3.6015625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 15.0, 9.0, 15.0, 18.0, 42.0, 165.0, 289.0, 275.0, 99.0, 30.0, 16.0, 8.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.09336280822753906, -0.09010696411132812, -0.08685111999511719, -0.08359527587890625, -0.08033943176269531, -0.07708358764648438, -0.07382774353027344, -0.0705718994140625, -0.06731605529785156, -0.06406021118164062, -0.06080436706542969, -0.05754852294921875, -0.05429267883300781, -0.051036834716796875, -0.04778099060058594, -0.044525146484375, -0.04126930236816406, -0.038013458251953125, -0.03475761413574219, -0.03150177001953125, -0.028245925903320312, -0.024990081787109375, -0.021734237670898438, -0.0184783935546875, -0.015222549438476562, -0.011966705322265625, -0.008710861206054688, -0.00545501708984375, -0.0021991729736328125, 0.001056671142578125, 0.0043125152587890625, 0.007568359375, 0.010824203491210938, 0.014080047607421875, 0.017335891723632812, 0.02059173583984375, 0.023847579956054688, 0.027103424072265625, 0.030359268188476562, 0.0336151123046875, 0.03687095642089844, 0.040126800537109375, 0.04338264465332031, 0.04663848876953125, 0.04989433288574219, 0.053150177001953125, 0.05640602111816406, 0.059661865234375, 0.06291770935058594, 0.06617355346679688, 0.06942939758300781, 0.07268524169921875, 0.07594108581542969, 0.07919692993164062, 0.08245277404785156, 0.0857086181640625, 0.08896446228027344, 0.09222030639648438, 0.09547615051269531, 0.09873199462890625, 0.10198783874511719, 0.10524368286132812, 0.10849952697753906, 0.11175537109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 7.0, 11.0, 13.0, 18.0, 36.0, 56.0, 68.0, 99.0, 208.0, 424.0, 849.0, 2526.0, 13032.0, 3572018.0, 589218.0, 11049.0, 2514.0, 981.0, 418.0, 240.0, 179.0, 105.0, 61.0, 46.0, 32.0, 23.0, 9.0, 8.0, 4.0, 6.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5830078125, -0.5621414184570312, -0.5412750244140625, -0.5204086303710938, -0.499542236328125, -0.47867584228515625, -0.4578094482421875, -0.43694305419921875, -0.41607666015625, -0.39521026611328125, -0.3743438720703125, -0.35347747802734375, -0.332611083984375, -0.31174468994140625, -0.2908782958984375, -0.27001190185546875, -0.2491455078125, -0.22827911376953125, -0.2074127197265625, -0.18654632568359375, -0.165679931640625, -0.14481353759765625, -0.1239471435546875, -0.10308074951171875, -0.08221435546875, -0.06134796142578125, -0.0404815673828125, -0.01961517333984375, 0.001251220703125, 0.02211761474609375, 0.0429840087890625, 0.06385040283203125, 0.084716796875, 0.10558319091796875, 0.1264495849609375, 0.14731597900390625, 0.168182373046875, 0.18904876708984375, 0.2099151611328125, 0.23078155517578125, 0.25164794921875, 0.27251434326171875, 0.2933807373046875, 0.31424713134765625, 0.335113525390625, 0.35597991943359375, 0.3768463134765625, 0.39771270751953125, 0.4185791015625, 0.43944549560546875, 0.4603118896484375, 0.48117828369140625, 0.502044677734375, 0.5229110717773438, 0.5437774658203125, 0.5646438598632812, 0.58551025390625, 0.6063766479492188, 0.6272430419921875, 0.6481094360351562, 0.668975830078125, 0.6898422241210938, 0.7107086181640625, 0.7315750122070312, 0.75244140625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 8.0, 6.0, 19.0, 23.0, 35.0, 74.0, 202.0, 2515.0, 844.0, 150.0, 59.0, 37.0, 24.0, 18.0, 13.0, 5.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.080810546875, -0.07672882080078125, -0.0726470947265625, -0.06856536865234375, -0.064483642578125, -0.06040191650390625, -0.0563201904296875, -0.05223846435546875, -0.04815673828125, -0.04407501220703125, -0.0399932861328125, -0.03591156005859375, -0.031829833984375, -0.02774810791015625, -0.0236663818359375, -0.01958465576171875, -0.0155029296875, -0.01142120361328125, -0.0073394775390625, -0.00325775146484375, 0.000823974609375, 0.00490570068359375, 0.0089874267578125, 0.01306915283203125, 0.01715087890625, 0.02123260498046875, 0.0253143310546875, 0.02939605712890625, 0.033477783203125, 0.03755950927734375, 0.0416412353515625, 0.04572296142578125, 0.0498046875, 0.05388641357421875, 0.0579681396484375, 0.06204986572265625, 0.066131591796875, 0.07021331787109375, 0.0742950439453125, 0.07837677001953125, 0.08245849609375, 0.08654022216796875, 0.0906219482421875, 0.09470367431640625, 0.098785400390625, 0.10286712646484375, 0.1069488525390625, 0.11103057861328125, 0.1151123046875, 0.11919403076171875, 0.1232757568359375, 0.12735748291015625, 0.131439208984375, 0.13552093505859375, 0.1396026611328125, 0.14368438720703125, 0.14776611328125, 0.15184783935546875, 0.1559295654296875, 0.16001129150390625, 0.164093017578125, 0.16817474365234375, 0.1722564697265625, 0.17633819580078125, 0.180419921875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 13.0, 162.0, 755.0, 63.0, 13.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944117307662964, -2.871133327484131, -2.7981491088867188, -2.7251651287078857, -2.6521811485290527, -2.5791969299316406, -2.5062129497528076, -2.4332289695739746, -2.3602447509765625, -2.2872607707977295, -2.2142765522003174, -2.1412925720214844, -2.0683085918426514, -1.9953244924545288, -1.9223403930664062, -1.8493564128875732, -1.7763724327087402, -1.7033883333206177, -1.6304043531417847, -1.557420253753662, -1.484436273574829, -1.4114521741867065, -1.338468074798584, -1.265484094619751, -1.1924999952316284, -1.1195158958435059, -1.0465319156646729, -0.9735478162765503, -0.9005637764930725, -0.8275797367095947, -0.7545956373214722, -0.6816115975379944, -0.6086273193359375, -0.5356432795524597, -0.46265920996665955, -0.3896751403808594, -0.3166911005973816, -0.2437070608139038, -0.17072299122810364, -0.09773892164230347, -0.024754881858825684, 0.04822917282581329, 0.12121322751045227, 0.19419728219509125, 0.2671813368797302, 0.340165376663208, 0.4131494462490082, 0.48613351583480835, 0.5591175556182861, 0.6321015954017639, 0.7050856351852417, 0.7780697345733643, 0.851053774356842, 0.9240378141403198, 0.9970219135284424, 1.0700058937072754, 1.142989993095398, 1.2159740924835205, 1.2889580726623535, 1.361942172050476, 1.4349262714385986, 1.5079102516174316, 1.5808943510055542, 1.6538784503936768, 1.7268624305725098]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 6.0, 9.0, 14.0, 16.0, 15.0, 32.0, 20.0, 40.0, 54.0, 48.0, 42.0, 58.0, 57.0, 59.0, 48.0, 49.0, 66.0, 64.0, 50.0, 45.0, 34.0, 28.0, 42.0, 25.0, 21.0, 9.0, 8.0, 10.0, 5.0, 2.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4465025067329407, -0.4348994791507721, -0.42329642176628113, -0.41169339418411255, -0.4000903367996216, -0.388487309217453, -0.3768842816352844, -0.36528122425079346, -0.3536781668663025, -0.3420751392841339, -0.33047208189964294, -0.31886905431747437, -0.3072659969329834, -0.2956629693508148, -0.28405994176864624, -0.2724568843841553, -0.2608538568019867, -0.24925081431865692, -0.23764777183532715, -0.22604474425315857, -0.2144416868686676, -0.20283865928649902, -0.19123561680316925, -0.17963257431983948, -0.1680295318365097, -0.15642648935317993, -0.14482344686985016, -0.13322040438652039, -0.12161736935377121, -0.11001432687044144, -0.09841129183769226, -0.08680824935436249, -0.07520520687103271, -0.06360216438770294, -0.05199912562966347, -0.04039608687162399, -0.02879304438829422, -0.017190001904964447, -0.005586966872215271, 0.006016075611114502, 0.017619118094444275, 0.0292221587151289, 0.04082519933581352, 0.052428238093853, 0.06403128057718277, 0.07563432306051254, 0.08723735809326172, 0.09884040057659149, 0.11044344305992126, 0.12204648554325104, 0.1336495280265808, 0.1452525556087494, 0.15685561299324036, 0.16845864057540894, 0.1800616830587387, 0.19166472554206848, 0.20326776802539825, 0.21487081050872803, 0.2264738529920578, 0.23807689547538757, 0.24967992305755615, 0.2612829804420471, 0.2728860080242157, 0.2844890356063843, 0.29609209299087524]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 8.0, 5.0, 8.0, 8.0, 10.0, 14.0, 13.0, 16.0, 10.0, 23.0, 36.0, 54.0, 65.0, 113.0, 112.0, 166.0, 219.0, 339.0, 420.0, 774.0, 1280.0, 2803.0, 9042.0, 56144.0, 800351.0, 152910.0, 15154.0, 4135.0, 1621.0, 895.0, 534.0, 348.0, 228.0, 178.0, 136.0, 107.0, 68.0, 50.0, 44.0, 29.0, 22.0, 17.0, 11.0, 11.0, 7.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291015625, -0.2821083068847656, -0.27320098876953125, -0.2642936706542969, -0.2553863525390625, -0.24647903442382812, -0.23757171630859375, -0.22866439819335938, -0.219757080078125, -0.21084976196289062, -0.20194244384765625, -0.19303512573242188, -0.1841278076171875, -0.17522048950195312, -0.16631317138671875, -0.15740585327148438, -0.14849853515625, -0.13959121704101562, -0.13068389892578125, -0.12177658081054688, -0.1128692626953125, -0.10396194458007812, -0.09505462646484375, -0.08614730834960938, -0.077239990234375, -0.06833267211914062, -0.05942535400390625, -0.050518035888671875, -0.0416107177734375, -0.032703399658203125, -0.02379608154296875, -0.014888763427734375, -0.0059814453125, 0.002925872802734375, 0.01183319091796875, 0.020740509033203125, 0.0296478271484375, 0.038555145263671875, 0.04746246337890625, 0.056369781494140625, 0.065277099609375, 0.07418441772460938, 0.08309173583984375, 0.09199905395507812, 0.1009063720703125, 0.10981369018554688, 0.11872100830078125, 0.12762832641601562, 0.13653564453125, 0.14544296264648438, 0.15435028076171875, 0.16325759887695312, 0.1721649169921875, 0.18107223510742188, 0.18997955322265625, 0.19888687133789062, 0.207794189453125, 0.21670150756835938, 0.22560882568359375, 0.23451614379882812, 0.2434234619140625, 0.2523307800292969, 0.26123809814453125, 0.2701454162597656, 0.279052734375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 11.0, 17.0, 16.0, 22.0, 70.0, 166.0, 290.0, 250.0, 91.0, 35.0, 9.0, 10.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1014404296875, -0.09822463989257812, -0.09500885009765625, -0.09179306030273438, -0.0885772705078125, -0.08536148071289062, -0.08214569091796875, -0.07892990112304688, -0.075714111328125, -0.07249832153320312, -0.06928253173828125, -0.06606674194335938, -0.0628509521484375, -0.059635162353515625, -0.05641937255859375, -0.053203582763671875, -0.04998779296875, -0.046772003173828125, -0.04355621337890625, -0.040340423583984375, -0.0371246337890625, -0.033908843994140625, -0.03069305419921875, -0.027477264404296875, -0.024261474609375, -0.021045684814453125, -0.01782989501953125, -0.014614105224609375, -0.0113983154296875, -0.008182525634765625, -0.00496673583984375, -0.001750946044921875, 0.00146484375, 0.004680633544921875, 0.00789642333984375, 0.011112213134765625, 0.0143280029296875, 0.017543792724609375, 0.02075958251953125, 0.023975372314453125, 0.027191162109375, 0.030406951904296875, 0.03362274169921875, 0.036838531494140625, 0.0400543212890625, 0.043270111083984375, 0.04648590087890625, 0.049701690673828125, 0.05291748046875, 0.056133270263671875, 0.05934906005859375, 0.06256484985351562, 0.0657806396484375, 0.06899642944335938, 0.07221221923828125, 0.07542800903320312, 0.078643798828125, 0.08185958862304688, 0.08507537841796875, 0.08829116821289062, 0.0915069580078125, 0.09472274780273438, 0.09793853759765625, 0.10115432739257812, 0.1043701171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 5.0, 12.0, 20.0, 20.0, 35.0, 34.0, 45.0, 84.0, 120.0, 168.0, 250.0, 378.0, 652.0, 1274.0, 2564.0, 7550.0, 50289.0, 684883.0, 270945.0, 20606.0, 4433.0, 1782.0, 913.0, 498.0, 308.0, 214.0, 155.0, 95.0, 51.0, 40.0, 36.0, 26.0, 13.0, 17.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.33251953125, -0.3232307434082031, -0.31394195556640625, -0.3046531677246094, -0.2953643798828125, -0.2860755920410156, -0.27678680419921875, -0.2674980163574219, -0.258209228515625, -0.24892044067382812, -0.23963165283203125, -0.23034286499023438, -0.2210540771484375, -0.21176528930664062, -0.20247650146484375, -0.19318771362304688, -0.18389892578125, -0.17461013793945312, -0.16532135009765625, -0.15603256225585938, -0.1467437744140625, -0.13745498657226562, -0.12816619873046875, -0.11887741088867188, -0.109588623046875, -0.10029983520507812, -0.09101104736328125, -0.08172225952148438, -0.0724334716796875, -0.06314468383789062, -0.05385589599609375, -0.044567108154296875, -0.0352783203125, -0.025989532470703125, -0.01670074462890625, -0.007411956787109375, 0.0018768310546875, 0.011165618896484375, 0.02045440673828125, 0.029743194580078125, 0.039031982421875, 0.048320770263671875, 0.05760955810546875, 0.06689834594726562, 0.0761871337890625, 0.08547592163085938, 0.09476470947265625, 0.10405349731445312, 0.11334228515625, 0.12263107299804688, 0.13191986083984375, 0.14120864868164062, 0.1504974365234375, 0.15978622436523438, 0.16907501220703125, 0.17836380004882812, 0.187652587890625, 0.19694137573242188, 0.20623016357421875, 0.21551895141601562, 0.2248077392578125, 0.23409652709960938, 0.24338531494140625, 0.2526741027832031, 0.261962890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 9.0, 9.0, 9.0, 10.0, 16.0, 12.0, 27.0, 24.0, 35.0, 37.0, 26.0, 41.0, 61.0, 54.0, 46.0, 49.0, 57.0, 43.0, 41.0, 50.0, 44.0, 48.0, 52.0, 33.0, 26.0, 27.0, 24.0, 16.0, 17.0, 14.0, 10.0, 11.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.270263671875, -0.2636280059814453, -0.2569923400878906, -0.25035667419433594, -0.24372100830078125, -0.23708534240722656, -0.23044967651367188, -0.2238140106201172, -0.2171783447265625, -0.2105426788330078, -0.20390701293945312, -0.19727134704589844, -0.19063568115234375, -0.18400001525878906, -0.17736434936523438, -0.1707286834716797, -0.164093017578125, -0.1574573516845703, -0.15082168579101562, -0.14418601989746094, -0.13755035400390625, -0.13091468811035156, -0.12427902221679688, -0.11764335632324219, -0.1110076904296875, -0.10437202453613281, -0.09773635864257812, -0.09110069274902344, -0.08446502685546875, -0.07782936096191406, -0.07119369506835938, -0.06455802917480469, -0.05792236328125, -0.05128669738769531, -0.044651031494140625, -0.03801536560058594, -0.03137969970703125, -0.024744033813476562, -0.018108367919921875, -0.011472702026367188, -0.0048370361328125, 0.0017986297607421875, 0.008434295654296875, 0.015069961547851562, 0.02170562744140625, 0.028341293334960938, 0.034976959228515625, 0.04161262512207031, 0.048248291015625, 0.05488395690917969, 0.061519622802734375, 0.06815528869628906, 0.07479095458984375, 0.08142662048339844, 0.08806228637695312, 0.09469795227050781, 0.1013336181640625, 0.10796928405761719, 0.11460494995117188, 0.12124061584472656, 0.12787628173828125, 0.13451194763183594, 0.14114761352539062, 0.1477832794189453, 0.1544189453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 2.0, 9.0, 15.0, 22.0, 23.0, 33.0, 65.0, 111.0, 219.0, 420.0, 978.0, 2565.0, 10290.0, 153450.0, 830715.0, 40999.0, 5514.0, 1711.0, 667.0, 308.0, 176.0, 86.0, 49.0, 35.0, 20.0, 20.0, 15.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.174072265625, -0.1686840057373047, -0.16329574584960938, -0.15790748596191406, -0.15251922607421875, -0.14713096618652344, -0.14174270629882812, -0.1363544464111328, -0.1309661865234375, -0.1255779266357422, -0.12018966674804688, -0.11480140686035156, -0.10941314697265625, -0.10402488708496094, -0.09863662719726562, -0.09324836730957031, -0.087860107421875, -0.08247184753417969, -0.07708358764648438, -0.07169532775878906, -0.06630706787109375, -0.06091880798339844, -0.055530548095703125, -0.05014228820800781, -0.0447540283203125, -0.03936576843261719, -0.033977508544921875, -0.028589248657226562, -0.02320098876953125, -0.017812728881835938, -0.012424468994140625, -0.0070362091064453125, -0.00164794921875, 0.0037403106689453125, 0.009128570556640625, 0.014516830444335938, 0.01990509033203125, 0.025293350219726562, 0.030681610107421875, 0.03606986999511719, 0.0414581298828125, 0.04684638977050781, 0.052234649658203125, 0.05762290954589844, 0.06301116943359375, 0.06839942932128906, 0.07378768920898438, 0.07917594909667969, 0.084564208984375, 0.08995246887207031, 0.09534072875976562, 0.10072898864746094, 0.10611724853515625, 0.11150550842285156, 0.11689376831054688, 0.12228202819824219, 0.1276702880859375, 0.1330585479736328, 0.13844680786132812, 0.14383506774902344, 0.14922332763671875, 0.15461158752441406, 0.15999984741210938, 0.1653881072998047, 0.1707763671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 2.0, 5.0, 9.0, 8.0, 8.0, 9.0, 14.0, 19.0, 31.0, 45.0, 99.0, 212.0, 233.0, 105.0, 57.0, 34.0, 32.0, 19.0, 15.0, 10.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001747608184814453, -0.00016832351684570312, -0.00016188621520996094, -0.00015544891357421875, -0.00014901161193847656, -0.00014257431030273438, -0.0001361370086669922, -0.00012969970703125, -0.0001232624053955078, -0.00011682510375976562, -0.00011038780212402344, -0.00010395050048828125, -9.751319885253906e-05, -9.107589721679688e-05, -8.463859558105469e-05, -7.82012939453125e-05, -7.176399230957031e-05, -6.532669067382812e-05, -5.888938903808594e-05, -5.245208740234375e-05, -4.601478576660156e-05, -3.9577484130859375e-05, -3.314018249511719e-05, -2.6702880859375e-05, -2.0265579223632812e-05, -1.3828277587890625e-05, -7.3909759521484375e-06, -9.5367431640625e-07, 5.4836273193359375e-06, 1.1920928955078125e-05, 1.8358230590820312e-05, 2.47955322265625e-05, 3.123283386230469e-05, 3.7670135498046875e-05, 4.410743713378906e-05, 5.054473876953125e-05, 5.698204040527344e-05, 6.341934204101562e-05, 6.985664367675781e-05, 7.62939453125e-05, 8.273124694824219e-05, 8.916854858398438e-05, 9.560585021972656e-05, 0.00010204315185546875, 0.00010848045349121094, 0.00011491775512695312, 0.00012135505676269531, 0.0001277923583984375, 0.0001342296600341797, 0.00014066696166992188, 0.00014710426330566406, 0.00015354156494140625, 0.00015997886657714844, 0.00016641616821289062, 0.0001728534698486328, 0.000179290771484375, 0.0001857280731201172, 0.00019216537475585938, 0.00019860267639160156, 0.00020503997802734375, 0.00021147727966308594, 0.00021791458129882812, 0.0002243518829345703, 0.0002307891845703125, 0.0002372264862060547]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 13.0, 13.0, 24.0, 37.0, 57.0, 72.0, 129.0, 193.0, 391.0, 728.0, 1630.0, 4203.0, 15172.0, 144186.0, 783347.0, 80667.0, 11271.0, 3484.0, 1373.0, 644.0, 363.0, 180.0, 113.0, 61.0, 60.0, 35.0, 20.0, 17.0, 13.0, 17.0, 8.0, 11.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.173828125, -0.1690521240234375, -0.164276123046875, -0.1595001220703125, -0.15472412109375, -0.1499481201171875, -0.145172119140625, -0.1403961181640625, -0.1356201171875, -0.1308441162109375, -0.126068115234375, -0.1212921142578125, -0.11651611328125, -0.1117401123046875, -0.106964111328125, -0.1021881103515625, -0.097412109375, -0.0926361083984375, -0.087860107421875, -0.0830841064453125, -0.07830810546875, -0.0735321044921875, -0.068756103515625, -0.0639801025390625, -0.0592041015625, -0.0544281005859375, -0.049652099609375, -0.0448760986328125, -0.04010009765625, -0.0353240966796875, -0.030548095703125, -0.0257720947265625, -0.02099609375, -0.0162200927734375, -0.011444091796875, -0.0066680908203125, -0.00189208984375, 0.0028839111328125, 0.007659912109375, 0.0124359130859375, 0.0172119140625, 0.0219879150390625, 0.026763916015625, 0.0315399169921875, 0.03631591796875, 0.0410919189453125, 0.045867919921875, 0.0506439208984375, 0.055419921875, 0.0601959228515625, 0.064971923828125, 0.0697479248046875, 0.07452392578125, 0.0792999267578125, 0.084075927734375, 0.0888519287109375, 0.0936279296875, 0.0984039306640625, 0.103179931640625, 0.1079559326171875, 0.11273193359375, 0.1175079345703125, 0.122283935546875, 0.1270599365234375, 0.1318359375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 7.0, 17.0, 17.0, 28.0, 51.0, 52.0, 85.0, 91.0, 120.0, 127.0, 86.0, 88.0, 57.0, 36.0, 33.0, 27.0, 13.0, 16.0, 13.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.13589859008789062, -0.13190460205078125, -0.12791061401367188, -0.1239166259765625, -0.11992263793945312, -0.11592864990234375, -0.11193466186523438, -0.107940673828125, -0.10394668579101562, -0.09995269775390625, -0.09595870971679688, -0.0919647216796875, -0.08797073364257812, -0.08397674560546875, -0.07998275756835938, -0.07598876953125, -0.07199478149414062, -0.06800079345703125, -0.06400680541992188, -0.0600128173828125, -0.056018829345703125, -0.05202484130859375, -0.048030853271484375, -0.044036865234375, -0.040042877197265625, -0.03604888916015625, -0.032054901123046875, -0.0280609130859375, -0.024066925048828125, -0.02007293701171875, -0.016078948974609375, -0.0120849609375, -0.008090972900390625, -0.00409698486328125, -0.000102996826171875, 0.0038909912109375, 0.007884979248046875, 0.01187896728515625, 0.015872955322265625, 0.019866943359375, 0.023860931396484375, 0.02785491943359375, 0.031848907470703125, 0.0358428955078125, 0.039836883544921875, 0.04383087158203125, 0.047824859619140625, 0.05181884765625, 0.055812835693359375, 0.05980682373046875, 0.06380081176757812, 0.0677947998046875, 0.07178878784179688, 0.07578277587890625, 0.07977676391601562, 0.083770751953125, 0.08776473999023438, 0.09175872802734375, 0.09575271606445312, 0.0997467041015625, 0.10374069213867188, 0.10773468017578125, 0.11172866821289062, 0.11572265625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 25.0, 379.0, 580.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.153179168701172, -11.932692527770996, -11.712206840515137, -11.491720199584961, -11.271233558654785, -11.05074691772461, -10.83026123046875, -10.609774589538574, -10.389287948608398, -10.168801307678223, -9.948315620422363, -9.727828979492188, -9.507342338562012, -9.286855697631836, -9.066370010375977, -8.8458833694458, -8.625396728515625, -8.40491008758545, -8.18442440032959, -7.963937759399414, -7.743451118469238, -7.522964954376221, -7.302478313446045, -7.081992149353027, -6.86150598526001, -6.641019821166992, -6.420533180236816, -6.200047016143799, -5.979560375213623, -5.7590742111206055, -5.53858757019043, -5.318101406097412, -5.097614765167236, -4.877128601074219, -4.656641960144043, -4.436155796051025, -4.21566915512085, -3.995182991027832, -3.7746963500976562, -3.5542101860046387, -3.333723545074463, -3.113237142562866, -2.8927507400512695, -2.672264337539673, -2.451777935028076, -2.2312917709350586, -2.010805130004883, -1.7903188467025757, -1.5698325634002686, -1.3493461608886719, -1.1288597583770752, -0.9083734154701233, -0.6878870129585266, -0.4674006700515747, -0.24691426753997803, -0.026427865028381348, 0.19405853748321533, 0.414544939994812, 0.6350313425064087, 0.8555176854133606, 1.0760040283203125, 1.2964904308319092, 1.5169768333435059, 1.7374632358551025, 1.9579496383666992]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 12.0, 12.0, 5.0, 10.0, 21.0, 22.0, 32.0, 44.0, 47.0, 49.0, 55.0, 69.0, 73.0, 63.0, 57.0, 58.0, 55.0, 44.0, 47.0, 41.0, 36.0, 35.0, 21.0, 27.0, 17.0, 17.0, 9.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.251816749572754, -1.1966667175292969, -1.1415166854858398, -1.0863665342330933, -1.0312165021896362, -0.9760664701461792, -0.9209163784980774, -0.8657662868499756, -0.8106162548065186, -0.7554662227630615, -0.7003161311149597, -0.6451660394668579, -0.5900160074234009, -0.5348659753799438, -0.47971588373184204, -0.4245658218860626, -0.3694157600402832, -0.3142656981945038, -0.25911563634872437, -0.20396557450294495, -0.14881551265716553, -0.09366545081138611, -0.03851538896560669, 0.01663467288017273, 0.07178473472595215, 0.12693479657173157, 0.182084858417511, 0.2372349202632904, 0.2923849821090698, 0.34753504395484924, 0.40268510580062866, 0.4578351676464081, 0.5129852294921875, 0.5681352615356445, 0.6232853531837463, 0.6784354448318481, 0.7335854768753052, 0.7887355089187622, 0.843885600566864, 0.8990356922149658, 0.9541857242584229, 1.0093357563018799, 1.064485788345337, 1.1196359395980835, 1.1747859716415405, 1.2299360036849976, 1.2850861549377441, 1.3402361869812012, 1.3953862190246582, 1.4505362510681152, 1.5056862831115723, 1.5608364343643188, 1.6159864664077759, 1.671136498451233, 1.7262866497039795, 1.7814366817474365, 1.8365867137908936, 1.8917367458343506, 1.9468867778778076, 2.0020368099212646, 2.057187080383301, 2.112337112426758, 2.167487144470215, 2.222637176513672, 2.277787208557129]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 8.0, 7.0, 16.0, 16.0, 23.0, 35.0, 71.0, 114.0, 220.0, 527.0, 1580.0, 8503.0, 4056540.0, 121050.0, 3924.0, 929.0, 320.0, 161.0, 75.0, 51.0, 38.0, 19.0, 15.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5664443969726562, -0.5445098876953125, -0.5225753784179688, -0.500640869140625, -0.47870635986328125, -0.4567718505859375, -0.43483734130859375, -0.41290283203125, -0.39096832275390625, -0.3690338134765625, -0.34709930419921875, -0.325164794921875, -0.30323028564453125, -0.2812957763671875, -0.25936126708984375, -0.2374267578125, -0.21549224853515625, -0.1935577392578125, -0.17162322998046875, -0.149688720703125, -0.12775421142578125, -0.1058197021484375, -0.08388519287109375, -0.06195068359375, -0.04001617431640625, -0.0180816650390625, 0.00385284423828125, 0.025787353515625, 0.04772186279296875, 0.0696563720703125, 0.09159088134765625, 0.113525390625, 0.13545989990234375, 0.1573944091796875, 0.17932891845703125, 0.201263427734375, 0.22319793701171875, 0.2451324462890625, 0.26706695556640625, 0.28900146484375, 0.31093597412109375, 0.3328704833984375, 0.35480499267578125, 0.376739501953125, 0.39867401123046875, 0.4206085205078125, 0.44254302978515625, 0.4644775390625, 0.48641204833984375, 0.5083465576171875, 0.5302810668945312, 0.552215576171875, 0.5741500854492188, 0.5960845947265625, 0.6180191040039062, 0.63995361328125, 0.6618881225585938, 0.6838226318359375, 0.7057571411132812, 0.727691650390625, 0.7496261596679688, 0.7715606689453125, 0.7934951782226562, 0.8154296875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 15.0, 18.0, 17.0, 53.0, 126.0, 219.0, 245.0, 163.0, 81.0, 27.0, 13.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093017578125, -0.08992671966552734, -0.08683586120605469, -0.08374500274658203, -0.08065414428710938, -0.07756328582763672, -0.07447242736816406, -0.0713815689086914, -0.06829071044921875, -0.0651998519897461, -0.06210899353027344, -0.05901813507080078, -0.055927276611328125, -0.05283641815185547, -0.04974555969238281, -0.046654701232910156, -0.0435638427734375, -0.040472984313964844, -0.03738212585449219, -0.03429126739501953, -0.031200408935546875, -0.02810955047607422, -0.025018692016601562, -0.021927833557128906, -0.01883697509765625, -0.015746116638183594, -0.012655258178710938, -0.009564399719238281, -0.006473541259765625, -0.0033826828002929688, -0.0002918243408203125, 0.0027990341186523438, 0.005889892578125, 0.008980751037597656, 0.012071609497070312, 0.015162467956542969, 0.018253326416015625, 0.02134418487548828, 0.024435043334960938, 0.027525901794433594, 0.03061676025390625, 0.033707618713378906, 0.03679847717285156, 0.03988933563232422, 0.042980194091796875, 0.04607105255126953, 0.04916191101074219, 0.052252769470214844, 0.0553436279296875, 0.058434486389160156, 0.06152534484863281, 0.06461620330810547, 0.06770706176757812, 0.07079792022705078, 0.07388877868652344, 0.0769796371459961, 0.08007049560546875, 0.0831613540649414, 0.08625221252441406, 0.08934307098388672, 0.09243392944335938, 0.09552478790283203, 0.09861564636230469, 0.10170650482177734, 0.10479736328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 3.0, 4.0, 9.0, 16.0, 17.0, 22.0, 34.0, 56.0, 115.0, 222.0, 433.0, 929.0, 2340.0, 9778.0, 192169.0, 3960707.0, 21379.0, 3742.0, 1240.0, 532.0, 222.0, 136.0, 64.0, 33.0, 41.0, 7.0, 8.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48046875, -0.46506500244140625, -0.4496612548828125, -0.43425750732421875, -0.418853759765625, -0.40345001220703125, -0.3880462646484375, -0.37264251708984375, -0.35723876953125, -0.34183502197265625, -0.3264312744140625, -0.31102752685546875, -0.295623779296875, -0.28022003173828125, -0.2648162841796875, -0.24941253662109375, -0.2340087890625, -0.21860504150390625, -0.2032012939453125, -0.18779754638671875, -0.172393798828125, -0.15699005126953125, -0.1415863037109375, -0.12618255615234375, -0.11077880859375, -0.09537506103515625, -0.0799713134765625, -0.06456756591796875, -0.049163818359375, -0.03376007080078125, -0.0183563232421875, -0.00295257568359375, 0.012451171875, 0.02785491943359375, 0.0432586669921875, 0.05866241455078125, 0.074066162109375, 0.08946990966796875, 0.1048736572265625, 0.12027740478515625, 0.13568115234375, 0.15108489990234375, 0.1664886474609375, 0.18189239501953125, 0.197296142578125, 0.21269989013671875, 0.2281036376953125, 0.24350738525390625, 0.2589111328125, 0.27431488037109375, 0.2897186279296875, 0.30512237548828125, 0.320526123046875, 0.33592987060546875, 0.3513336181640625, 0.36673736572265625, 0.38214111328125, 0.39754486083984375, 0.4129486083984375, 0.42835235595703125, 0.443756103515625, 0.45915985107421875, 0.4745635986328125, 0.48996734619140625, 0.50537109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 11.0, 13.0, 25.0, 51.0, 123.0, 719.0, 2718.0, 239.0, 72.0, 30.0, 19.0, 14.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1259765625, -0.12194061279296875, -0.1179046630859375, -0.11386871337890625, -0.109832763671875, -0.10579681396484375, -0.1017608642578125, -0.09772491455078125, -0.09368896484375, -0.08965301513671875, -0.0856170654296875, -0.08158111572265625, -0.077545166015625, -0.07350921630859375, -0.0694732666015625, -0.06543731689453125, -0.0614013671875, -0.05736541748046875, -0.0533294677734375, -0.04929351806640625, -0.045257568359375, -0.04122161865234375, -0.0371856689453125, -0.03314971923828125, -0.02911376953125, -0.02507781982421875, -0.0210418701171875, -0.01700592041015625, -0.012969970703125, -0.00893402099609375, -0.0048980712890625, -0.00086212158203125, 0.003173828125, 0.00720977783203125, 0.0112457275390625, 0.01528167724609375, 0.019317626953125, 0.02335357666015625, 0.0273895263671875, 0.03142547607421875, 0.03546142578125, 0.03949737548828125, 0.0435333251953125, 0.04756927490234375, 0.051605224609375, 0.05564117431640625, 0.0596771240234375, 0.06371307373046875, 0.0677490234375, 0.07178497314453125, 0.0758209228515625, 0.07985687255859375, 0.083892822265625, 0.08792877197265625, 0.0919647216796875, 0.09600067138671875, 0.10003662109375, 0.10407257080078125, 0.1081085205078125, 0.11214447021484375, 0.116180419921875, 0.12021636962890625, 0.1242523193359375, 0.12828826904296875, 0.13232421875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 19.0, 194.0, 723.0, 54.0, 13.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944915771484375, -2.886420726776123, -2.82792592048645, -2.7694308757781982, -2.7109360694885254, -2.6524410247802734, -2.5939462184906006, -2.5354511737823486, -2.476956367492676, -2.418461322784424, -2.359966516494751, -2.301471471786499, -2.242976665496826, -2.184481620788574, -2.1259868144989014, -2.0674917697906494, -2.0089969635009766, -1.9505020380020142, -1.8920071125030518, -1.8335121870040894, -1.775017261505127, -1.7165223360061646, -1.6580274105072021, -1.5995323657989502, -1.5410373210906982, -1.4825423955917358, -1.4240474700927734, -1.365552544593811, -1.3070576190948486, -1.2485626935958862, -1.1900677680969238, -1.1315727233886719, -1.073077917098999, -1.0145829916000366, -0.9560880661010742, -0.8975931406021118, -0.8390982151031494, -0.780603289604187, -0.7221083045005798, -0.6636133790016174, -0.605118453502655, -0.5466235280036926, -0.4881286025047302, -0.42963364720344543, -0.37113872170448303, -0.31264379620552063, -0.25414884090423584, -0.19565391540527344, -0.13715898990631104, -0.07866405695676804, -0.020169124007225037, 0.03832581639289856, 0.09682074189186096, 0.15531566739082336, 0.21381062269210815, 0.27230554819107056, 0.33080047369003296, 0.38929539918899536, 0.44779032468795776, 0.5062853097915649, 0.5647802352905273, 0.6232751607894897, 0.6817700862884521, 0.7402650117874146, 0.798759937286377]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 6.0, 2.0, 10.0, 15.0, 12.0, 12.0, 19.0, 23.0, 26.0, 21.0, 36.0, 42.0, 41.0, 41.0, 38.0, 51.0, 54.0, 54.0, 48.0, 59.0, 58.0, 49.0, 31.0, 31.0, 45.0, 43.0, 15.0, 18.0, 19.0, 15.0, 16.0, 7.0, 12.0, 13.0, 8.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2920803427696228, -0.2838532328605652, -0.27562612295150757, -0.26739904284477234, -0.2591719329357147, -0.2509448230266571, -0.24271772801876068, -0.23449063301086426, -0.22626352310180664, -0.21803641319274902, -0.2098093181848526, -0.20158222317695618, -0.19335511326789856, -0.18512800335884094, -0.17690090835094452, -0.1686738133430481, -0.16044670343399048, -0.15221959352493286, -0.14399249851703644, -0.13576540350914001, -0.1275382936000824, -0.11931119114160538, -0.11108408868312836, -0.10285698622465134, -0.09462988376617432, -0.0864027813076973, -0.07817567884922028, -0.06994857639074326, -0.061721473932266235, -0.053494371473789215, -0.045267269015312195, -0.037040166556835175, -0.028813064098358154, -0.020585961639881134, -0.012358859181404114, -0.0041317567229270935, 0.004095345735549927, 0.012322448194026947, 0.020549550652503967, 0.028776653110980988, 0.03700375556945801, 0.04523085802793503, 0.05345796048641205, 0.06168506294488907, 0.06991216540336609, 0.07813926786184311, 0.08636637032032013, 0.09459347277879715, 0.10282057523727417, 0.11104767769575119, 0.11927478015422821, 0.12750187516212463, 0.13572898507118225, 0.14395609498023987, 0.1521831899881363, 0.16041028499603271, 0.16863739490509033, 0.17686450481414795, 0.18509159982204437, 0.1933186948299408, 0.2015458047389984, 0.20977291464805603, 0.21800000965595245, 0.22622710466384888, 0.2344542145729065]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 19.0, 14.0, 27.0, 38.0, 44.0, 56.0, 90.0, 118.0, 157.0, 241.0, 380.0, 603.0, 990.0, 2230.0, 7859.0, 68327.0, 825119.0, 125418.0, 11039.0, 2683.0, 1185.0, 619.0, 378.0, 275.0, 176.0, 121.0, 92.0, 68.0, 49.0, 34.0, 24.0, 17.0, 14.0, 6.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.25162506103515625, -0.2425079345703125, -0.23339080810546875, -0.224273681640625, -0.21515655517578125, -0.2060394287109375, -0.19692230224609375, -0.18780517578125, -0.17868804931640625, -0.1695709228515625, -0.16045379638671875, -0.151336669921875, -0.14221954345703125, -0.1331024169921875, -0.12398529052734375, -0.1148681640625, -0.10575103759765625, -0.0966339111328125, -0.08751678466796875, -0.078399658203125, -0.06928253173828125, -0.0601654052734375, -0.05104827880859375, -0.04193115234375, -0.03281402587890625, -0.0236968994140625, -0.01457977294921875, -0.005462646484375, 0.00365447998046875, 0.0127716064453125, 0.02188873291015625, 0.031005859375, 0.04012298583984375, 0.0492401123046875, 0.05835723876953125, 0.067474365234375, 0.07659149169921875, 0.0857086181640625, 0.09482574462890625, 0.10394287109375, 0.11305999755859375, 0.1221771240234375, 0.13129425048828125, 0.140411376953125, 0.14952850341796875, 0.1586456298828125, 0.16776275634765625, 0.1768798828125, 0.18599700927734375, 0.1951141357421875, 0.20423126220703125, 0.213348388671875, 0.22246551513671875, 0.2315826416015625, 0.24069976806640625, 0.24981689453125, 0.25893402099609375, 0.2680511474609375, 0.27716827392578125, 0.286285400390625, 0.29540252685546875, 0.3045196533203125, 0.31363677978515625, 0.32275390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 6.0, 20.0, 9.0, 26.0, 68.0, 127.0, 222.0, 234.0, 144.0, 82.0, 36.0, 9.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09480094909667969, -0.09164047241210938, -0.08847999572753906, -0.08531951904296875, -0.08215904235839844, -0.07899856567382812, -0.07583808898925781, -0.0726776123046875, -0.06951713562011719, -0.06635665893554688, -0.06319618225097656, -0.06003570556640625, -0.05687522888183594, -0.053714752197265625, -0.05055427551269531, -0.047393798828125, -0.04423332214355469, -0.041072845458984375, -0.03791236877441406, -0.03475189208984375, -0.03159141540527344, -0.028430938720703125, -0.025270462036132812, -0.0221099853515625, -0.018949508666992188, -0.015789031982421875, -0.012628555297851562, -0.00946807861328125, -0.0063076019287109375, -0.003147125244140625, 1.33514404296875e-05, 0.003173828125, 0.0063343048095703125, 0.009494781494140625, 0.012655258178710938, 0.01581573486328125, 0.018976211547851562, 0.022136688232421875, 0.025297164916992188, 0.0284576416015625, 0.03161811828613281, 0.034778594970703125, 0.03793907165527344, 0.04109954833984375, 0.04426002502441406, 0.047420501708984375, 0.05058097839355469, 0.053741455078125, 0.05690193176269531, 0.060062408447265625, 0.06322288513183594, 0.06638336181640625, 0.06954383850097656, 0.07270431518554688, 0.07586479187011719, 0.0790252685546875, 0.08218574523925781, 0.08534622192382812, 0.08850669860839844, 0.09166717529296875, 0.09482765197753906, 0.09798812866210938, 0.10114860534667969, 0.10430908203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 11.0, 12.0, 16.0, 27.0, 27.0, 39.0, 86.0, 124.0, 264.0, 489.0, 965.0, 2391.0, 7433.0, 43299.0, 760428.0, 209280.0, 16509.0, 4095.0, 1512.0, 694.0, 349.0, 191.0, 95.0, 81.0, 35.0, 32.0, 13.0, 11.0, 15.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.34722137451171875, -0.3355560302734375, -0.32389068603515625, -0.312225341796875, -0.30055999755859375, -0.2888946533203125, -0.27722930908203125, -0.26556396484375, -0.25389862060546875, -0.2422332763671875, -0.23056793212890625, -0.218902587890625, -0.20723724365234375, -0.1955718994140625, -0.18390655517578125, -0.1722412109375, -0.16057586669921875, -0.1489105224609375, -0.13724517822265625, -0.125579833984375, -0.11391448974609375, -0.1022491455078125, -0.09058380126953125, -0.07891845703125, -0.06725311279296875, -0.0555877685546875, -0.04392242431640625, -0.032257080078125, -0.02059173583984375, -0.0089263916015625, 0.00273895263671875, 0.014404296875, 0.02606964111328125, 0.0377349853515625, 0.04940032958984375, 0.061065673828125, 0.07273101806640625, 0.0843963623046875, 0.09606170654296875, 0.10772705078125, 0.11939239501953125, 0.1310577392578125, 0.14272308349609375, 0.154388427734375, 0.16605377197265625, 0.1777191162109375, 0.18938446044921875, 0.2010498046875, 0.21271514892578125, 0.2243804931640625, 0.23604583740234375, 0.247711181640625, 0.25937652587890625, 0.2710418701171875, 0.28270721435546875, 0.29437255859375, 0.30603790283203125, 0.3177032470703125, 0.32936859130859375, 0.341033935546875, 0.35269927978515625, 0.3643646240234375, 0.37602996826171875, 0.3876953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 12.0, 19.0, 18.0, 29.0, 32.0, 33.0, 52.0, 48.0, 54.0, 64.0, 62.0, 72.0, 65.0, 72.0, 52.0, 45.0, 42.0, 37.0, 32.0, 20.0, 27.0, 19.0, 21.0, 12.0, 8.0, 5.0, 12.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.29052734375, -0.28219032287597656, -0.2738533020019531, -0.2655162811279297, -0.25717926025390625, -0.2488422393798828, -0.24050521850585938, -0.23216819763183594, -0.2238311767578125, -0.21549415588378906, -0.20715713500976562, -0.1988201141357422, -0.19048309326171875, -0.1821460723876953, -0.17380905151367188, -0.16547203063964844, -0.157135009765625, -0.14879798889160156, -0.14046096801757812, -0.1321239471435547, -0.12378692626953125, -0.11544990539550781, -0.10711288452148438, -0.09877586364746094, -0.0904388427734375, -0.08210182189941406, -0.07376480102539062, -0.06542778015136719, -0.05709075927734375, -0.04875373840332031, -0.040416717529296875, -0.03207969665527344, -0.02374267578125, -0.015405654907226562, -0.007068634033203125, 0.0012683868408203125, 0.00960540771484375, 0.017942428588867188, 0.026279449462890625, 0.03461647033691406, 0.0429534912109375, 0.05129051208496094, 0.059627532958984375, 0.06796455383300781, 0.07630157470703125, 0.08463859558105469, 0.09297561645507812, 0.10131263732910156, 0.109649658203125, 0.11798667907714844, 0.12632369995117188, 0.1346607208251953, 0.14299774169921875, 0.1513347625732422, 0.15967178344726562, 0.16800880432128906, 0.1763458251953125, 0.18468284606933594, 0.19301986694335938, 0.2013568878173828, 0.20969390869140625, 0.2180309295654297, 0.22636795043945312, 0.23470497131347656, 0.2430419921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 12.0, 12.0, 22.0, 26.0, 44.0, 61.0, 79.0, 112.0, 182.0, 236.0, 378.0, 696.0, 1607.0, 4612.0, 52068.0, 974863.0, 8616.0, 2466.0, 1010.0, 499.0, 272.0, 187.0, 126.0, 98.0, 66.0, 55.0, 40.0, 34.0, 15.0, 13.0, 8.0, 7.0, 4.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.394775390625, -0.38126373291015625, -0.3677520751953125, -0.35424041748046875, -0.340728759765625, -0.32721710205078125, -0.3137054443359375, -0.30019378662109375, -0.28668212890625, -0.27317047119140625, -0.2596588134765625, -0.24614715576171875, -0.232635498046875, -0.21912384033203125, -0.2056121826171875, -0.19210052490234375, -0.1785888671875, -0.16507720947265625, -0.1515655517578125, -0.13805389404296875, -0.124542236328125, -0.11103057861328125, -0.0975189208984375, -0.08400726318359375, -0.07049560546875, -0.05698394775390625, -0.0434722900390625, -0.02996063232421875, -0.016448974609375, -0.00293731689453125, 0.0105743408203125, 0.02408599853515625, 0.03759765625, 0.05110931396484375, 0.0646209716796875, 0.07813262939453125, 0.091644287109375, 0.10515594482421875, 0.1186676025390625, 0.13217926025390625, 0.14569091796875, 0.15920257568359375, 0.1727142333984375, 0.18622589111328125, 0.199737548828125, 0.21324920654296875, 0.2267608642578125, 0.24027252197265625, 0.2537841796875, 0.26729583740234375, 0.2808074951171875, 0.29431915283203125, 0.307830810546875, 0.32134246826171875, 0.3348541259765625, 0.34836578369140625, 0.36187744140625, 0.37538909912109375, 0.3889007568359375, 0.40241241455078125, 0.415924072265625, 0.42943572998046875, 0.4429473876953125, 0.45645904541015625, 0.469970703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 6.0, 9.0, 9.0, 6.0, 10.0, 15.0, 9.0, 20.0, 32.0, 33.0, 37.0, 37.0, 43.0, 69.0, 100.0, 92.0, 82.0, 54.0, 62.0, 57.0, 37.0, 32.0, 26.0, 24.0, 18.0, 18.0, 15.0, 8.0, 3.0, 9.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.125471115112305e-05, -8.846446871757507e-05, -8.56742262840271e-05, -8.288398385047913e-05, -8.009374141693115e-05, -7.730349898338318e-05, -7.45132565498352e-05, -7.172301411628723e-05, -6.893277168273926e-05, -6.614252924919128e-05, -6.335228681564331e-05, -6.056204438209534e-05, -5.777180194854736e-05, -5.498155951499939e-05, -5.2191317081451416e-05, -4.940107464790344e-05, -4.661083221435547e-05, -4.3820589780807495e-05, -4.103034734725952e-05, -3.824010491371155e-05, -3.5449862480163574e-05, -3.26596200466156e-05, -2.9869377613067627e-05, -2.7079135179519653e-05, -2.428889274597168e-05, -2.1498650312423706e-05, -1.8708407878875732e-05, -1.591816544532776e-05, -1.3127923011779785e-05, -1.0337680578231812e-05, -7.547438144683838e-06, -4.757195711135864e-06, -1.9669532775878906e-06, 8.23289155960083e-07, 3.6135315895080566e-06, 6.40377402305603e-06, 9.194016456604004e-06, 1.1984258890151978e-05, 1.4774501323699951e-05, 1.7564743757247925e-05, 2.03549861907959e-05, 2.3145228624343872e-05, 2.5935471057891846e-05, 2.872571349143982e-05, 3.151595592498779e-05, 3.4306198358535767e-05, 3.709644079208374e-05, 3.9886683225631714e-05, 4.267692565917969e-05, 4.546716809272766e-05, 4.8257410526275635e-05, 5.104765295982361e-05, 5.383789539337158e-05, 5.6628137826919556e-05, 5.941838026046753e-05, 6.22086226940155e-05, 6.499886512756348e-05, 6.778910756111145e-05, 7.057934999465942e-05, 7.33695924282074e-05, 7.615983486175537e-05, 7.895007729530334e-05, 8.174031972885132e-05, 8.453056216239929e-05, 8.732080459594727e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 6.0, 11.0, 10.0, 13.0, 5.0, 23.0, 21.0, 23.0, 30.0, 48.0, 63.0, 111.0, 194.0, 322.0, 695.0, 1476.0, 3702.0, 12068.0, 178932.0, 817142.0, 24037.0, 5429.0, 2139.0, 890.0, 439.0, 247.0, 151.0, 79.0, 66.0, 42.0, 40.0, 27.0, 17.0, 9.0, 12.0, 5.0, 4.0, 8.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1595458984375, -0.15367889404296875, -0.1478118896484375, -0.14194488525390625, -0.136077880859375, -0.13021087646484375, -0.1243438720703125, -0.11847686767578125, -0.11260986328125, -0.10674285888671875, -0.1008758544921875, -0.09500885009765625, -0.089141845703125, -0.08327484130859375, -0.0774078369140625, -0.07154083251953125, -0.065673828125, -0.05980682373046875, -0.0539398193359375, -0.04807281494140625, -0.042205810546875, -0.03633880615234375, -0.0304718017578125, -0.02460479736328125, -0.01873779296875, -0.01287078857421875, -0.0070037841796875, -0.00113677978515625, 0.004730224609375, 0.01059722900390625, 0.0164642333984375, 0.02233123779296875, 0.0281982421875, 0.03406524658203125, 0.0399322509765625, 0.04579925537109375, 0.051666259765625, 0.05753326416015625, 0.0634002685546875, 0.06926727294921875, 0.07513427734375, 0.08100128173828125, 0.0868682861328125, 0.09273529052734375, 0.098602294921875, 0.10446929931640625, 0.1103363037109375, 0.11620330810546875, 0.1220703125, 0.12793731689453125, 0.1338043212890625, 0.13967132568359375, 0.145538330078125, 0.15140533447265625, 0.1572723388671875, 0.16313934326171875, 0.16900634765625, 0.17487335205078125, 0.1807403564453125, 0.18660736083984375, 0.192474365234375, 0.19834136962890625, 0.2042083740234375, 0.21007537841796875, 0.2159423828125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 11.0, 27.0, 52.0, 161.0, 264.0, 230.0, 123.0, 55.0, 24.0, 10.0, 5.0, 2.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3033027648925781, -0.29508209228515625, -0.2868614196777344, -0.2786407470703125, -0.2704200744628906, -0.26219940185546875, -0.2539787292480469, -0.245758056640625, -0.23753738403320312, -0.22931671142578125, -0.22109603881835938, -0.2128753662109375, -0.20465469360351562, -0.19643402099609375, -0.18821334838867188, -0.17999267578125, -0.17177200317382812, -0.16355133056640625, -0.15533065795898438, -0.1471099853515625, -0.13888931274414062, -0.13066864013671875, -0.12244796752929688, -0.114227294921875, -0.10600662231445312, -0.09778594970703125, -0.08956527709960938, -0.0813446044921875, -0.07312393188476562, -0.06490325927734375, -0.056682586669921875, -0.0484619140625, -0.040241241455078125, -0.03202056884765625, -0.023799896240234375, -0.0155792236328125, -0.007358551025390625, 0.00086212158203125, 0.009082794189453125, 0.017303466796875, 0.025524139404296875, 0.03374481201171875, 0.041965484619140625, 0.0501861572265625, 0.058406829833984375, 0.06662750244140625, 0.07484817504882812, 0.08306884765625, 0.09128952026367188, 0.09951019287109375, 0.10773086547851562, 0.1159515380859375, 0.12417221069335938, 0.13239288330078125, 0.14061355590820312, 0.148834228515625, 0.15705490112304688, 0.16527557373046875, 0.17349624633789062, 0.1817169189453125, 0.18993759155273438, 0.19815826416015625, 0.20637893676757812, 0.214599609375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 8.0, 15.0, 40.0, 111.0, 333.0, 337.0, 108.0, 31.0, 7.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.772488594055176, -4.659119606018066, -4.545750617980957, -4.432381629943848, -4.319012641906738, -4.205643653869629, -4.0922746658325195, -3.97890567779541, -3.865536689758301, -3.7521677017211914, -3.638798713684082, -3.5254297256469727, -3.4120607376098633, -3.298691749572754, -3.1853227615356445, -3.071953773498535, -2.958585023880005, -2.8452160358428955, -2.731847047805786, -2.6184780597686768, -2.5051090717315674, -2.391740083694458, -2.2783713340759277, -2.1650023460388184, -2.051633358001709, -1.9382643699645996, -1.8248953819274902, -1.7115263938903809, -1.5981574058532715, -1.484788417816162, -1.3714195489883423, -1.258050560951233, -1.144681692123413, -1.0313127040863037, -0.9179437160491943, -0.8045747876167297, -0.6912057995796204, -0.577836811542511, -0.4644678831100464, -0.351098895072937, -0.23772990703582764, -0.12436093389987946, -0.010991960763931274, 0.10237699747085571, 0.2157459855079651, 0.32911497354507446, 0.44248390197753906, 0.5558528900146484, 0.6692218780517578, 0.7825908660888672, 0.8959598541259766, 1.009328842163086, 1.1226978302001953, 1.2360668182373047, 1.3494356870651245, 1.4628046751022339, 1.5761736631393433, 1.6895426511764526, 1.802911639213562, 1.9162805080413818, 2.029649496078491, 2.1430184841156006, 2.25638747215271, 2.3697564601898193, 2.4831254482269287]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 6.0, 15.0, 18.0, 17.0, 19.0, 28.0, 25.0, 38.0, 36.0, 47.0, 47.0, 57.0, 70.0, 55.0, 52.0, 49.0, 51.0, 39.0, 53.0, 50.0, 47.0, 39.0, 22.0, 20.0, 15.0, 17.0, 11.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5680876970291138, -1.5160160064697266, -1.4639441967010498, -1.411872386932373, -1.3598006963729858, -1.3077290058135986, -1.2556571960449219, -1.2035853862762451, -1.151513695716858, -1.0994420051574707, -1.047370195388794, -0.995298445224762, -0.94322669506073, -0.891154944896698, -0.839083194732666, -0.787011444568634, -0.734939694404602, -0.6828679442405701, -0.6307961940765381, -0.5787244439125061, -0.5266526937484741, -0.47458094358444214, -0.42250919342041016, -0.3704374432563782, -0.3183656930923462, -0.2662939429283142, -0.21422219276428223, -0.16215044260025024, -0.11007869243621826, -0.05800694227218628, -0.005935192108154297, 0.046136558055877686, 0.09820842742919922, 0.1502801775932312, 0.20235192775726318, 0.25442367792129517, 0.30649542808532715, 0.35856717824935913, 0.4106389284133911, 0.4627106785774231, 0.5147824287414551, 0.5668541789054871, 0.618925929069519, 0.670997679233551, 0.723069429397583, 0.775141179561615, 0.827212929725647, 0.879284679889679, 0.9313564300537109, 0.9834281802177429, 1.035499930381775, 1.087571620941162, 1.1396434307098389, 1.1917152404785156, 1.2437869310379028, 1.29585862159729, 1.3479304313659668, 1.4000022411346436, 1.4520739316940308, 1.504145622253418, 1.5562174320220947, 1.6082892417907715, 1.6603609323501587, 1.712432622909546, 1.7645044326782227]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 21.0, 23.0, 54.0, 102.0, 258.0, 848.0, 6127.0, 4109695.0, 74126.0, 2219.0, 479.0, 154.0, 60.0, 49.0, 28.0, 7.0, 19.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7734375, -0.7498550415039062, -0.7262725830078125, -0.7026901245117188, -0.679107666015625, -0.6555252075195312, -0.6319427490234375, -0.6083602905273438, -0.58477783203125, -0.5611953735351562, -0.5376129150390625, -0.5140304565429688, -0.490447998046875, -0.46686553955078125, -0.4432830810546875, -0.41970062255859375, -0.3961181640625, -0.37253570556640625, -0.3489532470703125, -0.32537078857421875, -0.301788330078125, -0.27820587158203125, -0.2546234130859375, -0.23104095458984375, -0.20745849609375, -0.18387603759765625, -0.1602935791015625, -0.13671112060546875, -0.113128662109375, -0.08954620361328125, -0.0659637451171875, -0.04238128662109375, -0.018798828125, 0.00478363037109375, 0.0283660888671875, 0.05194854736328125, 0.075531005859375, 0.09911346435546875, 0.1226959228515625, 0.14627838134765625, 0.16986083984375, 0.19344329833984375, 0.2170257568359375, 0.24060821533203125, 0.264190673828125, 0.28777313232421875, 0.3113555908203125, 0.33493804931640625, 0.3585205078125, 0.38210296630859375, 0.4056854248046875, 0.42926788330078125, 0.452850341796875, 0.47643280029296875, 0.5000152587890625, 0.5235977172851562, 0.54718017578125, 0.5707626342773438, 0.5943450927734375, 0.6179275512695312, 0.641510009765625, 0.6650924682617188, 0.6886749267578125, 0.7122573852539062, 0.73583984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 9.0, 26.0, 43.0, 79.0, 129.0, 216.0, 181.0, 150.0, 73.0, 38.0, 21.0, 8.0, 9.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09442138671875, -0.09136486053466797, -0.08830833435058594, -0.0852518081665039, -0.08219528198242188, -0.07913875579833984, -0.07608222961425781, -0.07302570343017578, -0.06996917724609375, -0.06691265106201172, -0.06385612487792969, -0.060799598693847656, -0.057743072509765625, -0.054686546325683594, -0.05163002014160156, -0.04857349395751953, -0.0455169677734375, -0.04246044158935547, -0.03940391540527344, -0.036347389221191406, -0.033290863037109375, -0.030234336853027344, -0.027177810668945312, -0.02412128448486328, -0.02106475830078125, -0.01800823211669922, -0.014951705932617188, -0.011895179748535156, -0.008838653564453125, -0.005782127380371094, -0.0027256011962890625, 0.00033092498779296875, 0.003387451171875, 0.006443977355957031, 0.009500503540039062, 0.012557029724121094, 0.015613555908203125, 0.018670082092285156, 0.021726608276367188, 0.02478313446044922, 0.02783966064453125, 0.03089618682861328, 0.03395271301269531, 0.037009239196777344, 0.040065765380859375, 0.043122291564941406, 0.04617881774902344, 0.04923534393310547, 0.0522918701171875, 0.05534839630126953, 0.05840492248535156, 0.061461448669433594, 0.06451797485351562, 0.06757450103759766, 0.07063102722167969, 0.07368755340576172, 0.07674407958984375, 0.07980060577392578, 0.08285713195800781, 0.08591365814208984, 0.08897018432617188, 0.0920267105102539, 0.09508323669433594, 0.09813976287841797, 0.1011962890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 11.0, 13.0, 23.0, 29.0, 60.0, 89.0, 177.0, 414.0, 1100.0, 4916.0, 153116.0, 4023207.0, 8529.0, 1680.0, 486.0, 221.0, 81.0, 57.0, 37.0, 14.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.970703125, -0.9465179443359375, -0.922332763671875, -0.8981475830078125, -0.87396240234375, -0.8497772216796875, -0.825592041015625, -0.8014068603515625, -0.7772216796875, -0.7530364990234375, -0.728851318359375, -0.7046661376953125, -0.68048095703125, -0.6562957763671875, -0.632110595703125, -0.6079254150390625, -0.583740234375, -0.5595550537109375, -0.535369873046875, -0.5111846923828125, -0.48699951171875, -0.4628143310546875, -0.438629150390625, -0.4144439697265625, -0.3902587890625, -0.3660736083984375, -0.341888427734375, -0.3177032470703125, -0.29351806640625, -0.2693328857421875, -0.245147705078125, -0.2209625244140625, -0.19677734375, -0.1725921630859375, -0.148406982421875, -0.1242218017578125, -0.10003662109375, -0.0758514404296875, -0.051666259765625, -0.0274810791015625, -0.0032958984375, 0.0208892822265625, 0.045074462890625, 0.0692596435546875, 0.09344482421875, 0.1176300048828125, 0.141815185546875, 0.1660003662109375, 0.190185546875, 0.2143707275390625, 0.238555908203125, 0.2627410888671875, 0.28692626953125, 0.3111114501953125, 0.335296630859375, 0.3594818115234375, 0.3836669921875, 0.4078521728515625, 0.432037353515625, 0.4562225341796875, 0.48040771484375, 0.5045928955078125, 0.528778076171875, 0.5529632568359375, 0.5771484375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 16.0, 29.0, 69.0, 288.0, 3327.0, 245.0, 46.0, 17.0, 12.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2158203125, -0.21020889282226562, -0.20459747314453125, -0.19898605346679688, -0.1933746337890625, -0.18776321411132812, -0.18215179443359375, -0.17654037475585938, -0.170928955078125, -0.16531753540039062, -0.15970611572265625, -0.15409469604492188, -0.1484832763671875, -0.14287185668945312, -0.13726043701171875, -0.13164901733398438, -0.12603759765625, -0.12042617797851562, -0.11481475830078125, -0.10920333862304688, -0.1035919189453125, -0.09798049926757812, -0.09236907958984375, -0.08675765991210938, -0.081146240234375, -0.07553482055664062, -0.06992340087890625, -0.06431198120117188, -0.0587005615234375, -0.053089141845703125, -0.04747772216796875, -0.041866302490234375, -0.0362548828125, -0.030643463134765625, -0.02503204345703125, -0.019420623779296875, -0.0138092041015625, -0.008197784423828125, -0.00258636474609375, 0.003025054931640625, 0.008636474609375, 0.014247894287109375, 0.01985931396484375, 0.025470733642578125, 0.0310821533203125, 0.036693572998046875, 0.04230499267578125, 0.047916412353515625, 0.05352783203125, 0.059139251708984375, 0.06475067138671875, 0.07036209106445312, 0.0759735107421875, 0.08158493041992188, 0.08719635009765625, 0.09280776977539062, 0.098419189453125, 0.10403060913085938, 0.10964202880859375, 0.11525344848632812, 0.1208648681640625, 0.12647628784179688, 0.13208770751953125, 0.13769912719726562, 0.143310546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 10.0, 59.0, 351.0, 524.0, 56.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796971321105957, -1.7426871061325073, -1.6884030103683472, -1.6341187953948975, -1.5798345804214478, -1.5255504846572876, -1.471266269683838, -1.4169821739196777, -1.362697958946228, -1.3084137439727783, -1.2541296482086182, -1.1998454332351685, -1.1455612182617188, -1.0912771224975586, -1.0369929075241089, -0.982708752155304, -0.9284245371818542, -0.8741403818130493, -0.8198561668395996, -0.7655720114707947, -0.7112878561019897, -0.65700364112854, -0.6027194857597351, -0.5484353303909302, -0.49415114521980286, -0.43986696004867554, -0.3855828046798706, -0.3312986195087433, -0.27701443433761597, -0.22273027896881104, -0.16844609379768372, -0.11416193842887878, -0.059877753257751465, -0.005593579262495041, 0.04869059473276138, 0.1029747724533081, 0.15725894272327423, 0.21154311299324036, 0.2658272981643677, 0.3201114535331726, 0.3743956387042999, 0.42867982387542725, 0.4829639792442322, 0.5372481346130371, 0.5915323495864868, 0.6458165049552917, 0.7001006603240967, 0.7543848752975464, 0.8086690306663513, 0.8629531860351562, 0.917237401008606, 0.9715215563774109, 1.0258057117462158, 1.0800899267196655, 1.1343741416931152, 1.1886582374572754, 1.242942452430725, 1.2972266674041748, 1.351510763168335, 1.4057949781417847, 1.4600791931152344, 1.5143632888793945, 1.5686475038528442, 1.622931718826294, 1.677215814590454]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 9.0, 10.0, 11.0, 14.0, 18.0, 31.0, 30.0, 32.0, 39.0, 36.0, 50.0, 52.0, 65.0, 61.0, 60.0, 59.0, 63.0, 53.0, 56.0, 31.0, 41.0, 34.0, 38.0, 16.0, 17.0, 17.0, 7.0, 5.0, 5.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3317965865135193, -0.32152053713798523, -0.31124448776245117, -0.3009684383869171, -0.29069238901138306, -0.2804163098335266, -0.27014029026031494, -0.2598642110824585, -0.24958816170692444, -0.23931211233139038, -0.22903606295585632, -0.21876001358032227, -0.20848394930362701, -0.19820789992809296, -0.1879318505525589, -0.17765578627586365, -0.16737975180149078, -0.15710370242595673, -0.14682765305042267, -0.13655158877372742, -0.12627553939819336, -0.1159994900226593, -0.10572344064712524, -0.09544738382101059, -0.08517133444547653, -0.07489528506994247, -0.06461922824382782, -0.05434317886829376, -0.044067125767469406, -0.03379107266664505, -0.023515023291110992, -0.013238966464996338, -0.0029629170894622803, 0.007313135080039501, 0.017589187249541283, 0.02786523848772049, 0.038141291588544846, 0.0484173446893692, 0.05869339406490326, 0.06896945089101791, 0.07924550026655197, 0.08952154964208603, 0.09979760646820068, 0.11007365584373474, 0.1203497052192688, 0.13062575459480286, 0.14090180397033691, 0.15117786824703217, 0.16145391762256622, 0.17172996699810028, 0.18200601637363434, 0.1922820806503296, 0.20255813002586365, 0.2128341794013977, 0.22311022877693176, 0.23338627815246582, 0.24366232752799988, 0.25393837690353394, 0.264214426279068, 0.27449047565460205, 0.2847665250301361, 0.29504257440567017, 0.3053186535835266, 0.31559470295906067, 0.3258707523345947]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 5.0, 8.0, 9.0, 10.0, 16.0, 17.0, 31.0, 50.0, 73.0, 123.0, 187.0, 303.0, 569.0, 1118.0, 2759.0, 10632.0, 96672.0, 835743.0, 85329.0, 9657.0, 2754.0, 1090.0, 538.0, 325.0, 154.0, 118.0, 75.0, 55.0, 33.0, 27.0, 20.0, 17.0, 8.0, 3.0, 6.0, 1.0, 6.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.255126953125, -0.24511337280273438, -0.23509979248046875, -0.22508621215820312, -0.2150726318359375, -0.20505905151367188, -0.19504547119140625, -0.18503189086914062, -0.175018310546875, -0.16500473022460938, -0.15499114990234375, -0.14497756958007812, -0.1349639892578125, -0.12495040893554688, -0.11493682861328125, -0.10492324829101562, -0.09490966796875, -0.08489608764648438, -0.07488250732421875, -0.06486892700195312, -0.0548553466796875, -0.044841766357421875, -0.03482818603515625, -0.024814605712890625, -0.014801025390625, -0.004787445068359375, 0.00522613525390625, 0.015239715576171875, 0.0252532958984375, 0.035266876220703125, 0.04528045654296875, 0.055294036865234375, 0.0653076171875, 0.07532119750976562, 0.08533477783203125, 0.09534835815429688, 0.1053619384765625, 0.11537551879882812, 0.12538909912109375, 0.13540267944335938, 0.145416259765625, 0.15542984008789062, 0.16544342041015625, 0.17545700073242188, 0.1854705810546875, 0.19548416137695312, 0.20549774169921875, 0.21551132202148438, 0.22552490234375, 0.23553848266601562, 0.24555206298828125, 0.2555656433105469, 0.2655792236328125, 0.2755928039550781, 0.28560638427734375, 0.2956199645996094, 0.305633544921875, 0.3156471252441406, 0.32566070556640625, 0.3356742858886719, 0.3456878662109375, 0.3557014465332031, 0.36571502685546875, 0.3757286071777344, 0.3857421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 6.0, 9.0, 22.0, 30.0, 54.0, 90.0, 171.0, 192.0, 160.0, 131.0, 49.0, 40.0, 18.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0921630859375, -0.08923912048339844, -0.08631515502929688, -0.08339118957519531, -0.08046722412109375, -0.07754325866699219, -0.07461929321289062, -0.07169532775878906, -0.0687713623046875, -0.06584739685058594, -0.06292343139648438, -0.05999946594238281, -0.05707550048828125, -0.05415153503417969, -0.051227569580078125, -0.04830360412597656, -0.045379638671875, -0.04245567321777344, -0.039531707763671875, -0.03660774230957031, -0.03368377685546875, -0.030759811401367188, -0.027835845947265625, -0.024911880493164062, -0.0219879150390625, -0.019063949584960938, -0.016139984130859375, -0.013216018676757812, -0.01029205322265625, -0.0073680877685546875, -0.004444122314453125, -0.0015201568603515625, 0.00140380859375, 0.0043277740478515625, 0.007251739501953125, 0.010175704956054688, 0.01309967041015625, 0.016023635864257812, 0.018947601318359375, 0.021871566772460938, 0.0247955322265625, 0.027719497680664062, 0.030643463134765625, 0.03356742858886719, 0.03649139404296875, 0.03941535949707031, 0.042339324951171875, 0.04526329040527344, 0.048187255859375, 0.05111122131347656, 0.054035186767578125, 0.05695915222167969, 0.05988311767578125, 0.06280708312988281, 0.06573104858398438, 0.06865501403808594, 0.0715789794921875, 0.07450294494628906, 0.07742691040039062, 0.08035087585449219, 0.08327484130859375, 0.08619880676269531, 0.08912277221679688, 0.09204673767089844, 0.094970703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 7.0, 8.0, 16.0, 10.0, 28.0, 19.0, 35.0, 44.0, 61.0, 92.0, 130.0, 199.0, 271.0, 424.0, 753.0, 1477.0, 3296.0, 8694.0, 30525.0, 176676.0, 656045.0, 131086.0, 24951.0, 7484.0, 2881.0, 1344.0, 698.0, 396.0, 286.0, 200.0, 120.0, 84.0, 50.0, 38.0, 26.0, 22.0, 12.0, 11.0, 10.0, 10.0, 7.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.204345703125, -0.1978435516357422, -0.19134140014648438, -0.18483924865722656, -0.17833709716796875, -0.17183494567871094, -0.16533279418945312, -0.1588306427001953, -0.1523284912109375, -0.1458263397216797, -0.13932418823242188, -0.13282203674316406, -0.12631988525390625, -0.11981773376464844, -0.11331558227539062, -0.10681343078613281, -0.100311279296875, -0.09380912780761719, -0.08730697631835938, -0.08080482482910156, -0.07430267333984375, -0.06780052185058594, -0.061298370361328125, -0.05479621887207031, -0.0482940673828125, -0.04179191589355469, -0.035289764404296875, -0.028787612915039062, -0.02228546142578125, -0.015783309936523438, -0.009281158447265625, -0.0027790069580078125, 0.00372314453125, 0.010225296020507812, 0.016727447509765625, 0.023229598999023438, 0.02973175048828125, 0.03623390197753906, 0.042736053466796875, 0.04923820495605469, 0.0557403564453125, 0.06224250793457031, 0.06874465942382812, 0.07524681091308594, 0.08174896240234375, 0.08825111389160156, 0.09475326538085938, 0.10125541687011719, 0.107757568359375, 0.11425971984863281, 0.12076187133789062, 0.12726402282714844, 0.13376617431640625, 0.14026832580566406, 0.14677047729492188, 0.1532726287841797, 0.1597747802734375, 0.1662769317626953, 0.17277908325195312, 0.17928123474121094, 0.18578338623046875, 0.19228553771972656, 0.19878768920898438, 0.2052898406982422, 0.2117919921875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 6.0, 5.0, 7.0, 16.0, 11.0, 16.0, 17.0, 14.0, 17.0, 22.0, 38.0, 24.0, 18.0, 41.0, 24.0, 38.0, 39.0, 39.0, 39.0, 31.0, 42.0, 44.0, 42.0, 42.0, 43.0, 30.0, 34.0, 41.0, 22.0, 31.0, 22.0, 24.0, 20.0, 11.0, 22.0, 14.0, 9.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.177490234375, -0.17191123962402344, -0.16633224487304688, -0.1607532501220703, -0.15517425537109375, -0.1495952606201172, -0.14401626586914062, -0.13843727111816406, -0.1328582763671875, -0.12727928161621094, -0.12170028686523438, -0.11612129211425781, -0.11054229736328125, -0.10496330261230469, -0.09938430786132812, -0.09380531311035156, -0.088226318359375, -0.08264732360839844, -0.07706832885742188, -0.07148933410644531, -0.06591033935546875, -0.06033134460449219, -0.054752349853515625, -0.04917335510253906, -0.0435943603515625, -0.03801536560058594, -0.032436370849609375, -0.026857376098632812, -0.02127838134765625, -0.015699386596679688, -0.010120391845703125, -0.0045413970947265625, 0.00103759765625, 0.0066165924072265625, 0.012195587158203125, 0.017774581909179688, 0.02335357666015625, 0.028932571411132812, 0.034511566162109375, 0.04009056091308594, 0.0456695556640625, 0.05124855041503906, 0.056827545166015625, 0.06240653991699219, 0.06798553466796875, 0.07356452941894531, 0.07914352416992188, 0.08472251892089844, 0.090301513671875, 0.09588050842285156, 0.10145950317382812, 0.10703849792480469, 0.11261749267578125, 0.11819648742675781, 0.12377548217773438, 0.12935447692871094, 0.1349334716796875, 0.14051246643066406, 0.14609146118164062, 0.1516704559326172, 0.15724945068359375, 0.1628284454345703, 0.16840744018554688, 0.17398643493652344, 0.1795654296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 10.0, 11.0, 10.0, 10.0, 31.0, 37.0, 58.0, 86.0, 139.0, 261.0, 537.0, 1189.0, 3098.0, 11869.0, 108733.0, 830764.0, 77292.0, 9568.0, 2643.0, 1074.0, 445.0, 256.0, 140.0, 96.0, 62.0, 41.0, 26.0, 17.0, 9.0, 11.0, 4.0, 11.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11126708984375, -0.10748767852783203, -0.10370826721191406, -0.0999288558959961, -0.09614944458007812, -0.09237003326416016, -0.08859062194824219, -0.08481121063232422, -0.08103179931640625, -0.07725238800048828, -0.07347297668457031, -0.06969356536865234, -0.06591415405273438, -0.062134742736816406, -0.05835533142089844, -0.05457592010498047, -0.0507965087890625, -0.04701709747314453, -0.04323768615722656, -0.039458274841308594, -0.035678863525390625, -0.031899452209472656, -0.028120040893554688, -0.02434062957763672, -0.02056121826171875, -0.01678180694580078, -0.013002395629882812, -0.009222984313964844, -0.005443572998046875, -0.0016641616821289062, 0.0021152496337890625, 0.005894660949707031, 0.009674072265625, 0.013453483581542969, 0.017232894897460938, 0.021012306213378906, 0.024791717529296875, 0.028571128845214844, 0.03235054016113281, 0.03612995147705078, 0.03990936279296875, 0.04368877410888672, 0.04746818542480469, 0.051247596740722656, 0.055027008056640625, 0.058806419372558594, 0.06258583068847656, 0.06636524200439453, 0.0701446533203125, 0.07392406463623047, 0.07770347595214844, 0.0814828872680664, 0.08526229858398438, 0.08904170989990234, 0.09282112121582031, 0.09660053253173828, 0.10037994384765625, 0.10415935516357422, 0.10793876647949219, 0.11171817779541016, 0.11549758911132812, 0.1192770004272461, 0.12305641174316406, 0.12683582305908203, 0.130615234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 13.0, 10.0, 8.0, 15.0, 18.0, 19.0, 32.0, 34.0, 52.0, 53.0, 69.0, 97.0, 124.0, 95.0, 78.0, 46.0, 33.0, 29.0, 28.0, 25.0, 20.0, 18.0, 5.0, 11.0, 7.0, 5.0, 10.0, 4.0, 8.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.82012939453125e-05, -7.562246173620224e-05, -7.304362952709198e-05, -7.046479731798172e-05, -6.788596510887146e-05, -6.53071328997612e-05, -6.272830069065094e-05, -6.014946848154068e-05, -5.757063627243042e-05, -5.499180406332016e-05, -5.24129718542099e-05, -4.983413964509964e-05, -4.725530743598938e-05, -4.467647522687912e-05, -4.209764301776886e-05, -3.95188108086586e-05, -3.693997859954834e-05, -3.436114639043808e-05, -3.178231418132782e-05, -2.920348197221756e-05, -2.66246497631073e-05, -2.404581755399704e-05, -2.146698534488678e-05, -1.888815313577652e-05, -1.630932092666626e-05, -1.3730488717556e-05, -1.115165650844574e-05, -8.57282429933548e-06, -5.99399209022522e-06, -3.4151598811149597e-06, -8.363276720046997e-07, 1.7425045371055603e-06, 4.32133674621582e-06, 6.90016895532608e-06, 9.47900116443634e-06, 1.20578333735466e-05, 1.463666558265686e-05, 1.721549779176712e-05, 1.979433000087738e-05, 2.237316220998764e-05, 2.49519944190979e-05, 2.753082662820816e-05, 3.010965883731842e-05, 3.268849104642868e-05, 3.526732325553894e-05, 3.78461554646492e-05, 4.042498767375946e-05, 4.300381988286972e-05, 4.558265209197998e-05, 4.816148430109024e-05, 5.07403165102005e-05, 5.331914871931076e-05, 5.589798092842102e-05, 5.847681313753128e-05, 6.105564534664154e-05, 6.36344775557518e-05, 6.621330976486206e-05, 6.879214197397232e-05, 7.137097418308258e-05, 7.394980639219284e-05, 7.65286386013031e-05, 7.910747081041336e-05, 8.168630301952362e-05, 8.426513522863388e-05, 8.684396743774414e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 7.0, 7.0, 11.0, 17.0, 9.0, 19.0, 22.0, 37.0, 40.0, 75.0, 114.0, 133.0, 220.0, 356.0, 590.0, 1177.0, 2397.0, 5347.0, 16255.0, 84129.0, 701185.0, 195141.0, 26965.0, 7887.0, 3018.0, 1385.0, 766.0, 414.0, 236.0, 170.0, 114.0, 79.0, 61.0, 44.0, 30.0, 23.0, 20.0, 16.0, 4.0, 7.0, 9.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.091552734375, -0.08856868743896484, -0.08558464050292969, -0.08260059356689453, -0.07961654663085938, -0.07663249969482422, -0.07364845275878906, -0.0706644058227539, -0.06768035888671875, -0.0646963119506836, -0.06171226501464844, -0.05872821807861328, -0.055744171142578125, -0.05276012420654297, -0.04977607727050781, -0.046792030334472656, -0.0438079833984375, -0.040823936462402344, -0.03783988952636719, -0.03485584259033203, -0.031871795654296875, -0.02888774871826172, -0.025903701782226562, -0.022919654846191406, -0.01993560791015625, -0.016951560974121094, -0.013967514038085938, -0.010983467102050781, -0.007999420166015625, -0.005015373229980469, -0.0020313262939453125, 0.0009527206420898438, 0.003936767578125, 0.006920814514160156, 0.009904861450195312, 0.012888908386230469, 0.015872955322265625, 0.01885700225830078, 0.021841049194335938, 0.024825096130371094, 0.02780914306640625, 0.030793190002441406, 0.03377723693847656, 0.03676128387451172, 0.039745330810546875, 0.04272937774658203, 0.04571342468261719, 0.048697471618652344, 0.0516815185546875, 0.054665565490722656, 0.05764961242675781, 0.06063365936279297, 0.06361770629882812, 0.06660175323486328, 0.06958580017089844, 0.0725698471069336, 0.07555389404296875, 0.0785379409790039, 0.08152198791503906, 0.08450603485107422, 0.08749008178710938, 0.09047412872314453, 0.09345817565917969, 0.09644222259521484, 0.09942626953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 11.0, 13.0, 20.0, 24.0, 49.0, 75.0, 115.0, 158.0, 174.0, 107.0, 71.0, 52.0, 27.0, 19.0, 10.0, 12.0, 5.0, 6.0, 8.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.172607421875, -0.16793251037597656, -0.16325759887695312, -0.1585826873779297, -0.15390777587890625, -0.1492328643798828, -0.14455795288085938, -0.13988304138183594, -0.1352081298828125, -0.13053321838378906, -0.12585830688476562, -0.12118339538574219, -0.11650848388671875, -0.11183357238769531, -0.10715866088867188, -0.10248374938964844, -0.097808837890625, -0.09313392639160156, -0.08845901489257812, -0.08378410339355469, -0.07910919189453125, -0.07443428039550781, -0.06975936889648438, -0.06508445739746094, -0.0604095458984375, -0.05573463439941406, -0.051059722900390625, -0.04638481140136719, -0.04170989990234375, -0.03703498840332031, -0.032360076904296875, -0.027685165405273438, -0.02301025390625, -0.018335342407226562, -0.013660430908203125, -0.008985519409179688, -0.00431060791015625, 0.0003643035888671875, 0.005039215087890625, 0.009714126586914062, 0.0143890380859375, 0.019063949584960938, 0.023738861083984375, 0.028413772583007812, 0.03308868408203125, 0.03776359558105469, 0.042438507080078125, 0.04711341857910156, 0.051788330078125, 0.05646324157714844, 0.061138153076171875, 0.06581306457519531, 0.07048797607421875, 0.07516288757324219, 0.07983779907226562, 0.08451271057128906, 0.0891876220703125, 0.09386253356933594, 0.09853744506835938, 0.10321235656738281, 0.10788726806640625, 0.11256217956542969, 0.11723709106445312, 0.12191200256347656, 0.1265869140625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 22.0, 73.0, 365.0, 428.0, 86.0, 18.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.296441078186035, -4.186485767364502, -4.076530456542969, -3.9665749073028564, -3.8566195964813232, -3.74666428565979, -3.6367087364196777, -3.5267534255981445, -3.4167981147766113, -3.306842803955078, -3.196887493133545, -3.0869319438934326, -2.9769766330718994, -2.867021322250366, -2.757065773010254, -2.6471104621887207, -2.5371551513671875, -2.4271998405456543, -2.317244529724121, -2.207288980484009, -2.0973336696624756, -1.9873783588409424, -1.8774229288101196, -1.7674674987792969, -1.6575121879577637, -1.5475568771362305, -1.4376014471054077, -1.327646017074585, -1.2176907062530518, -1.1077353954315186, -0.9977799654006958, -0.8878245949745178, -0.7778692245483398, -0.6679138541221619, -0.5579584836959839, -0.4480031132698059, -0.33804774284362793, -0.22809237241744995, -0.11813700199127197, -0.008181631565093994, 0.10177373886108398, 0.21172910928726196, 0.32168447971343994, 0.4316398501396179, 0.5415952205657959, 0.6515505909919739, 0.7615059614181519, 0.8714613318443298, 0.9814167022705078, 1.091372013092041, 1.2013274431228638, 1.3112828731536865, 1.4212381839752197, 1.531193494796753, 1.6411489248275757, 1.7511043548583984, 1.8610596656799316, 1.9710149765014648, 2.080970287322998, 2.1909258365631104, 2.3008811473846436, 2.4108364582061768, 2.520792007446289, 2.6307473182678223, 2.7407026290893555]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 10.0, 19.0, 7.0, 24.0, 27.0, 34.0, 36.0, 23.0, 65.0, 51.0, 39.0, 60.0, 55.0, 65.0, 70.0, 50.0, 48.0, 50.0, 38.0, 39.0, 35.0, 37.0, 19.0, 14.0, 17.0, 17.0, 10.0, 12.0, 10.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.976169228553772, -0.932508111000061, -0.8888469934463501, -0.8451858758926392, -0.8015247583389282, -0.7578636407852173, -0.7142025828361511, -0.6705414652824402, -0.6268803477287292, -0.5832192301750183, -0.5395581126213074, -0.4958970248699188, -0.4522359073162079, -0.40857478976249695, -0.3649137020111084, -0.32125258445739746, -0.2775914669036865, -0.23393034934997559, -0.19026924669742584, -0.1466081440448761, -0.10294702649116516, -0.059285908937454224, -0.015624821186065674, 0.028036296367645264, 0.0716974139213562, 0.11535852402448654, 0.15901963412761688, 0.20268073678016663, 0.24634185433387756, 0.2900029718875885, 0.33366405963897705, 0.377325177192688, 0.4209862947463989, 0.46464741230010986, 0.5083085298538208, 0.5519696474075317, 0.5956307649612427, 0.6392918825149536, 0.6829529404640198, 0.7266140580177307, 0.7702751755714417, 0.8139362931251526, 0.8575974106788635, 0.9012584686279297, 0.9449195861816406, 0.9885807037353516, 1.0322418212890625, 1.0759029388427734, 1.1195640563964844, 1.1632251739501953, 1.2068862915039062, 1.2505474090576172, 1.2942085266113281, 1.337869644165039, 1.38153076171875, 1.425191879272461, 1.4688529968261719, 1.5125141143798828, 1.5561752319335938, 1.5998363494873047, 1.6434974670410156, 1.6871585845947266, 1.7308197021484375, 1.7744808197021484, 1.8181418180465698]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 5.0, 4.0, 3.0, 12.0, 13.0, 12.0, 23.0, 34.0, 59.0, 87.0, 134.0, 282.0, 526.0, 1290.0, 4424.0, 26498.0, 3661290.0, 477847.0, 16311.0, 3333.0, 1082.0, 446.0, 209.0, 122.0, 83.0, 48.0, 27.0, 26.0, 13.0, 11.0, 11.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.3885231018066406, -0.37738800048828125, -0.3662528991699219, -0.3551177978515625, -0.3439826965332031, -0.33284759521484375, -0.3217124938964844, -0.310577392578125, -0.2994422912597656, -0.28830718994140625, -0.2771720886230469, -0.2660369873046875, -0.2549018859863281, -0.24376678466796875, -0.23263168334960938, -0.22149658203125, -0.21036148071289062, -0.19922637939453125, -0.18809127807617188, -0.1769561767578125, -0.16582107543945312, -0.15468597412109375, -0.14355087280273438, -0.132415771484375, -0.12128067016601562, -0.11014556884765625, -0.09901046752929688, -0.0878753662109375, -0.07674026489257812, -0.06560516357421875, -0.054470062255859375, -0.0433349609375, -0.032199859619140625, -0.02106475830078125, -0.009929656982421875, 0.0012054443359375, 0.012340545654296875, 0.02347564697265625, 0.034610748291015625, 0.045745849609375, 0.056880950927734375, 0.06801605224609375, 0.07915115356445312, 0.0902862548828125, 0.10142135620117188, 0.11255645751953125, 0.12369155883789062, 0.13482666015625, 0.14596176147460938, 0.15709686279296875, 0.16823196411132812, 0.1793670654296875, 0.19050216674804688, 0.20163726806640625, 0.21277236938476562, 0.223907470703125, 0.23504257202148438, 0.24617767333984375, 0.2573127746582031, 0.2684478759765625, 0.2795829772949219, 0.29071807861328125, 0.3018531799316406, 0.31298828125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 10.0, 13.0, 19.0, 31.0, 68.0, 122.0, 167.0, 200.0, 146.0, 101.0, 52.0, 31.0, 14.0, 13.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0926513671875, -0.08968544006347656, -0.08671951293945312, -0.08375358581542969, -0.08078765869140625, -0.07782173156738281, -0.07485580444335938, -0.07188987731933594, -0.0689239501953125, -0.06595802307128906, -0.06299209594726562, -0.06002616882324219, -0.05706024169921875, -0.05409431457519531, -0.051128387451171875, -0.04816246032714844, -0.045196533203125, -0.04223060607910156, -0.039264678955078125, -0.03629875183105469, -0.03333282470703125, -0.030366897583007812, -0.027400970458984375, -0.024435043334960938, -0.0214691162109375, -0.018503189086914062, -0.015537261962890625, -0.012571334838867188, -0.00960540771484375, -0.0066394805908203125, -0.003673553466796875, -0.0007076263427734375, 0.00225830078125, 0.0052242279052734375, 0.008190155029296875, 0.011156082153320312, 0.01412200927734375, 0.017087936401367188, 0.020053863525390625, 0.023019790649414062, 0.0259857177734375, 0.028951644897460938, 0.031917572021484375, 0.03488349914550781, 0.03784942626953125, 0.04081535339355469, 0.043781280517578125, 0.04674720764160156, 0.049713134765625, 0.05267906188964844, 0.055644989013671875, 0.05861091613769531, 0.06157684326171875, 0.06454277038574219, 0.06750869750976562, 0.07047462463378906, 0.0734405517578125, 0.07640647888183594, 0.07937240600585938, 0.08233833312988281, 0.08530426025390625, 0.08827018737792969, 0.09123611450195312, 0.09420204162597656, 0.09716796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 9.0, 14.0, 18.0, 17.0, 31.0, 42.0, 91.0, 148.0, 243.0, 499.0, 1150.0, 3314.0, 15548.0, 226204.0, 3887875.0, 48825.0, 7042.0, 1813.0, 704.0, 307.0, 146.0, 89.0, 50.0, 34.0, 27.0, 14.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.405517578125, -0.3946342468261719, -0.38375091552734375, -0.3728675842285156, -0.3619842529296875, -0.3511009216308594, -0.34021759033203125, -0.3293342590332031, -0.318450927734375, -0.3075675964355469, -0.29668426513671875, -0.2858009338378906, -0.2749176025390625, -0.2640342712402344, -0.25315093994140625, -0.24226760864257812, -0.23138427734375, -0.22050094604492188, -0.20961761474609375, -0.19873428344726562, -0.1878509521484375, -0.17696762084960938, -0.16608428955078125, -0.15520095825195312, -0.144317626953125, -0.13343429565429688, -0.12255096435546875, -0.11166763305664062, -0.1007843017578125, -0.08990097045898438, -0.07901763916015625, -0.06813430786132812, -0.0572509765625, -0.046367645263671875, -0.03548431396484375, -0.024600982666015625, -0.0137176513671875, -0.002834320068359375, 0.00804901123046875, 0.018932342529296875, 0.029815673828125, 0.040699005126953125, 0.05158233642578125, 0.062465667724609375, 0.0733489990234375, 0.08423233032226562, 0.09511566162109375, 0.10599899291992188, 0.11688232421875, 0.12776565551757812, 0.13864898681640625, 0.14953231811523438, 0.1604156494140625, 0.17129898071289062, 0.18218231201171875, 0.19306564331054688, 0.203948974609375, 0.21483230590820312, 0.22571563720703125, 0.23659896850585938, 0.2474822998046875, 0.2583656311035156, 0.26924896240234375, 0.2801322937011719, 0.291015625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 16.0, 27.0, 52.0, 79.0, 197.0, 816.0, 2258.0, 366.0, 111.0, 57.0, 27.0, 20.0, 11.0, 10.0, 5.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1929931640625, -0.18842697143554688, -0.18386077880859375, -0.17929458618164062, -0.1747283935546875, -0.17016220092773438, -0.16559600830078125, -0.16102981567382812, -0.156463623046875, -0.15189743041992188, -0.14733123779296875, -0.14276504516601562, -0.1381988525390625, -0.13363265991210938, -0.12906646728515625, -0.12450027465820312, -0.11993408203125, -0.11536788940429688, -0.11080169677734375, -0.10623550415039062, -0.1016693115234375, -0.09710311889648438, -0.09253692626953125, -0.08797073364257812, -0.083404541015625, -0.07883834838867188, -0.07427215576171875, -0.06970596313476562, -0.0651397705078125, -0.060573577880859375, -0.05600738525390625, -0.051441192626953125, -0.046875, -0.042308807373046875, -0.03774261474609375, -0.033176422119140625, -0.0286102294921875, -0.024044036865234375, -0.01947784423828125, -0.014911651611328125, -0.010345458984375, -0.005779266357421875, -0.00121307373046875, 0.003353118896484375, 0.0079193115234375, 0.012485504150390625, 0.01705169677734375, 0.021617889404296875, 0.02618408203125, 0.030750274658203125, 0.03531646728515625, 0.039882659912109375, 0.0444488525390625, 0.049015045166015625, 0.05358123779296875, 0.058147430419921875, 0.062713623046875, 0.06727981567382812, 0.07184600830078125, 0.07641220092773438, 0.0809783935546875, 0.08554458618164062, 0.09011077880859375, 0.09467697143554688, 0.0992431640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 12.0, 28.0, 91.0, 184.0, 347.0, 247.0, 61.0, 23.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.449288010597229, -0.418795108795166, -0.38830217719078064, -0.35780927538871765, -0.3273163437843323, -0.2968234419822693, -0.2663305401802063, -0.23583760857582092, -0.20534469187259674, -0.17485177516937256, -0.14435885846614838, -0.11386594921350479, -0.08337303251028061, -0.052880123257637024, -0.022387206554412842, 0.00810571014881134, 0.03859862685203552, 0.0690915435552597, 0.09958446025848389, 0.13007736206054688, 0.16057029366493225, 0.19106319546699524, 0.22155611217021942, 0.2520490288734436, 0.2825419306755066, 0.3130348324775696, 0.34352776408195496, 0.37402066588401794, 0.4045135974884033, 0.4350064992904663, 0.4654994010925293, 0.4959923326969147, 0.5264852643013, 0.556978166103363, 0.587471067905426, 0.6179640293121338, 0.6484569311141968, 0.6789498329162598, 0.7094427347183228, 0.7399356365203857, 0.7704285979270935, 0.8009214997291565, 0.8314144015312195, 0.8619073629379272, 0.8924002647399902, 0.9228931665420532, 0.9533860683441162, 0.9838789701461792, 1.0143718719482422, 1.0448647737503052, 1.0753576755523682, 1.1058505773544312, 1.1363434791564941, 1.1668365001678467, 1.1973294019699097, 1.2278223037719727, 1.2583152055740356, 1.2888081073760986, 1.3193010091781616, 1.3497939109802246, 1.3802868127822876, 1.4107797145843506, 1.4412727355957031, 1.4717656373977661, 1.502258539199829]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 2.0, 4.0, 11.0, 12.0, 28.0, 30.0, 38.0, 47.0, 44.0, 73.0, 59.0, 81.0, 75.0, 60.0, 61.0, 61.0, 58.0, 51.0, 45.0, 44.0, 28.0, 36.0, 23.0, 11.0, 9.0, 11.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5464600324630737, -0.5318363308906555, -0.5172126293182373, -0.5025889277458191, -0.4879651963710785, -0.4733414947986603, -0.4587177634239197, -0.44409406185150146, -0.42947036027908325, -0.41484665870666504, -0.4002229571342468, -0.3855992257595062, -0.370975524187088, -0.3563518226146698, -0.3417280912399292, -0.327104389667511, -0.3124806880950928, -0.29785698652267456, -0.28323328495025635, -0.26860955357551575, -0.25398585200309753, -0.23936215043067932, -0.22473843395709991, -0.2101147174835205, -0.1954910159111023, -0.18086731433868408, -0.16624359786510468, -0.15161988139152527, -0.13699617981910706, -0.12237247079610825, -0.10774876177310944, -0.09312505275011063, -0.07850134372711182, -0.063877634704113, -0.0492539256811142, -0.03463021665811539, -0.020006507635116577, -0.005382798612117767, 0.009240910410881042, 0.023864619433879852, 0.03848832845687866, 0.05311203747987747, 0.06773574650287628, 0.08235945552587509, 0.0969831645488739, 0.11160687357187271, 0.12623058259487152, 0.14085429906845093, 0.15547800064086914, 0.17010170221328735, 0.18472541868686676, 0.19934913516044617, 0.21397283673286438, 0.2285965383052826, 0.243220254778862, 0.2578439712524414, 0.2724676728248596, 0.28709137439727783, 0.30171507596969604, 0.31633880734443665, 0.33096250891685486, 0.34558621048927307, 0.36020994186401367, 0.3748336434364319, 0.3894573450088501]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 3.0, 8.0, 8.0, 17.0, 26.0, 36.0, 40.0, 51.0, 79.0, 120.0, 208.0, 337.0, 547.0, 1137.0, 2931.0, 10573.0, 81968.0, 832629.0, 100043.0, 12005.0, 3159.0, 1174.0, 564.0, 310.0, 176.0, 118.0, 83.0, 56.0, 46.0, 21.0, 29.0, 16.0, 7.0, 4.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.369384765625, -0.3589897155761719, -0.34859466552734375, -0.3381996154785156, -0.3278045654296875, -0.3174095153808594, -0.30701446533203125, -0.2966194152832031, -0.286224365234375, -0.2758293151855469, -0.26543426513671875, -0.2550392150878906, -0.2446441650390625, -0.23424911499023438, -0.22385406494140625, -0.21345901489257812, -0.20306396484375, -0.19266891479492188, -0.18227386474609375, -0.17187881469726562, -0.1614837646484375, -0.15108871459960938, -0.14069366455078125, -0.13029861450195312, -0.119903564453125, -0.10950851440429688, -0.09911346435546875, -0.08871841430664062, -0.0783233642578125, -0.06792831420898438, -0.05753326416015625, -0.047138214111328125, -0.0367431640625, -0.026348114013671875, -0.01595306396484375, -0.005558013916015625, 0.0048370361328125, 0.015232086181640625, 0.02562713623046875, 0.036022186279296875, 0.046417236328125, 0.056812286376953125, 0.06720733642578125, 0.07760238647460938, 0.0879974365234375, 0.09839248657226562, 0.10878753662109375, 0.11918258666992188, 0.12957763671875, 0.13997268676757812, 0.15036773681640625, 0.16076278686523438, 0.1711578369140625, 0.18155288696289062, 0.19194793701171875, 0.20234298706054688, 0.212738037109375, 0.22313308715820312, 0.23352813720703125, 0.24392318725585938, 0.2543182373046875, 0.2647132873535156, 0.27510833740234375, 0.2855033874511719, 0.2958984375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 12.0, 8.0, 13.0, 16.0, 34.0, 68.0, 110.0, 169.0, 201.0, 148.0, 88.0, 61.0, 40.0, 13.0, 9.0, 7.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09661865234375, -0.0936279296875, -0.09063720703125, -0.087646484375, -0.08465576171875, -0.0816650390625, -0.07867431640625, -0.07568359375, -0.07269287109375, -0.0697021484375, -0.06671142578125, -0.063720703125, -0.06072998046875, -0.0577392578125, -0.05474853515625, -0.0517578125, -0.04876708984375, -0.0457763671875, -0.04278564453125, -0.039794921875, -0.03680419921875, -0.0338134765625, -0.03082275390625, -0.02783203125, -0.02484130859375, -0.0218505859375, -0.01885986328125, -0.015869140625, -0.01287841796875, -0.0098876953125, -0.00689697265625, -0.00390625, -0.00091552734375, 0.0020751953125, 0.00506591796875, 0.008056640625, 0.01104736328125, 0.0140380859375, 0.01702880859375, 0.02001953125, 0.02301025390625, 0.0260009765625, 0.02899169921875, 0.031982421875, 0.03497314453125, 0.0379638671875, 0.04095458984375, 0.0439453125, 0.04693603515625, 0.0499267578125, 0.05291748046875, 0.055908203125, 0.05889892578125, 0.0618896484375, 0.06488037109375, 0.06787109375, 0.07086181640625, 0.0738525390625, 0.07684326171875, 0.079833984375, 0.08282470703125, 0.0858154296875, 0.08880615234375, 0.091796875, 0.09478759765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 16.0, 12.0, 15.0, 15.0, 27.0, 34.0, 60.0, 67.0, 111.0, 170.0, 217.0, 399.0, 631.0, 1133.0, 2114.0, 4385.0, 11041.0, 33562.0, 159299.0, 641184.0, 142587.0, 31508.0, 10584.0, 4347.0, 2164.0, 1084.0, 652.0, 370.0, 225.0, 153.0, 120.0, 75.0, 58.0, 36.0, 31.0, 16.0, 13.0, 14.0, 4.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.211181640625, -0.20554542541503906, -0.19990921020507812, -0.1942729949951172, -0.18863677978515625, -0.1830005645751953, -0.17736434936523438, -0.17172813415527344, -0.1660919189453125, -0.16045570373535156, -0.15481948852539062, -0.1491832733154297, -0.14354705810546875, -0.1379108428955078, -0.13227462768554688, -0.12663841247558594, -0.121002197265625, -0.11536598205566406, -0.10972976684570312, -0.10409355163574219, -0.09845733642578125, -0.09282112121582031, -0.08718490600585938, -0.08154869079589844, -0.0759124755859375, -0.07027626037597656, -0.06464004516601562, -0.05900382995605469, -0.05336761474609375, -0.04773139953613281, -0.042095184326171875, -0.03645896911621094, -0.03082275390625, -0.025186538696289062, -0.019550323486328125, -0.013914108276367188, -0.00827789306640625, -0.0026416778564453125, 0.002994537353515625, 0.008630752563476562, 0.0142669677734375, 0.019903182983398438, 0.025539398193359375, 0.031175613403320312, 0.03681182861328125, 0.04244804382324219, 0.048084259033203125, 0.05372047424316406, 0.059356689453125, 0.06499290466308594, 0.07062911987304688, 0.07626533508300781, 0.08190155029296875, 0.08753776550292969, 0.09317398071289062, 0.09881019592285156, 0.1044464111328125, 0.11008262634277344, 0.11571884155273438, 0.12135505676269531, 0.12699127197265625, 0.1326274871826172, 0.13826370239257812, 0.14389991760253906, 0.1495361328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 9.0, 11.0, 9.0, 15.0, 23.0, 25.0, 35.0, 28.0, 41.0, 37.0, 59.0, 50.0, 51.0, 61.0, 63.0, 74.0, 54.0, 53.0, 52.0, 40.0, 34.0, 31.0, 30.0, 25.0, 26.0, 9.0, 11.0, 3.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.274658203125, -0.2673473358154297, -0.2600364685058594, -0.25272560119628906, -0.24541473388671875, -0.23810386657714844, -0.23079299926757812, -0.2234821319580078, -0.2161712646484375, -0.2088603973388672, -0.20154953002929688, -0.19423866271972656, -0.18692779541015625, -0.17961692810058594, -0.17230606079101562, -0.1649951934814453, -0.157684326171875, -0.1503734588623047, -0.14306259155273438, -0.13575172424316406, -0.12844085693359375, -0.12112998962402344, -0.11381912231445312, -0.10650825500488281, -0.0991973876953125, -0.09188652038574219, -0.08457565307617188, -0.07726478576660156, -0.06995391845703125, -0.06264305114746094, -0.055332183837890625, -0.04802131652832031, -0.04071044921875, -0.03339958190917969, -0.026088714599609375, -0.018777847290039062, -0.01146697998046875, -0.0041561126708984375, 0.003154754638671875, 0.010465621948242188, 0.0177764892578125, 0.025087356567382812, 0.032398223876953125, 0.03970909118652344, 0.04701995849609375, 0.05433082580566406, 0.061641693115234375, 0.06895256042480469, 0.076263427734375, 0.08357429504394531, 0.09088516235351562, 0.09819602966308594, 0.10550689697265625, 0.11281776428222656, 0.12012863159179688, 0.1274394989013672, 0.1347503662109375, 0.1420612335205078, 0.14937210083007812, 0.15668296813964844, 0.16399383544921875, 0.17130470275878906, 0.17861557006835938, 0.1859264373779297, 0.1932373046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 7.0, 7.0, 13.0, 15.0, 28.0, 37.0, 47.0, 89.0, 143.0, 303.0, 741.0, 2285.0, 8319.0, 45936.0, 873661.0, 99405.0, 12416.0, 3132.0, 1052.0, 406.0, 180.0, 107.0, 60.0, 52.0, 24.0, 18.0, 13.0, 17.0, 4.0, 2.0, 2.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16552734375, -0.15974807739257812, -0.15396881103515625, -0.14818954467773438, -0.1424102783203125, -0.13663101196289062, -0.13085174560546875, -0.12507247924804688, -0.119293212890625, -0.11351394653320312, -0.10773468017578125, -0.10195541381835938, -0.0961761474609375, -0.09039688110351562, -0.08461761474609375, -0.07883834838867188, -0.07305908203125, -0.06727981567382812, -0.06150054931640625, -0.055721282958984375, -0.0499420166015625, -0.044162750244140625, -0.03838348388671875, -0.032604217529296875, -0.026824951171875, -0.021045684814453125, -0.01526641845703125, -0.009487152099609375, -0.0037078857421875, 0.002071380615234375, 0.00785064697265625, 0.013629913330078125, 0.0194091796875, 0.025188446044921875, 0.03096771240234375, 0.036746978759765625, 0.0425262451171875, 0.048305511474609375, 0.05408477783203125, 0.059864044189453125, 0.065643310546875, 0.07142257690429688, 0.07720184326171875, 0.08298110961914062, 0.0887603759765625, 0.09453964233398438, 0.10031890869140625, 0.10609817504882812, 0.11187744140625, 0.11765670776367188, 0.12343597412109375, 0.12921524047851562, 0.1349945068359375, 0.14077377319335938, 0.14655303955078125, 0.15233230590820312, 0.158111572265625, 0.16389083862304688, 0.16967010498046875, 0.17544937133789062, 0.1812286376953125, 0.18700790405273438, 0.19278717041015625, 0.19856643676757812, 0.204345703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 7.0, 8.0, 5.0, 3.0, 7.0, 8.0, 14.0, 20.0, 20.0, 16.0, 25.0, 32.0, 42.0, 67.0, 72.0, 107.0, 97.0, 104.0, 81.0, 53.0, 32.0, 25.0, 21.0, 20.0, 18.0, 16.0, 14.0, 6.0, 10.0, 8.0, 7.0, 10.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.153915405273438e-05, -7.901154458522797e-05, -7.648393511772156e-05, -7.395632565021515e-05, -7.142871618270874e-05, -6.890110671520233e-05, -6.637349724769592e-05, -6.384588778018951e-05, -6.13182783126831e-05, -5.87906688451767e-05, -5.626305937767029e-05, -5.373544991016388e-05, -5.120784044265747e-05, -4.868023097515106e-05, -4.615262150764465e-05, -4.3625012040138245e-05, -4.1097402572631836e-05, -3.856979310512543e-05, -3.604218363761902e-05, -3.351457417011261e-05, -3.09869647026062e-05, -2.8459355235099792e-05, -2.5931745767593384e-05, -2.3404136300086975e-05, -2.0876526832580566e-05, -1.8348917365074158e-05, -1.582130789756775e-05, -1.329369843006134e-05, -1.0766088962554932e-05, -8.238479495048523e-06, -5.710870027542114e-06, -3.1832605600357056e-06, -6.556510925292969e-07, 1.8719583749771118e-06, 4.3995678424835205e-06, 6.927177309989929e-06, 9.454786777496338e-06, 1.1982396245002747e-05, 1.4510005712509155e-05, 1.7037615180015564e-05, 1.9565224647521973e-05, 2.209283411502838e-05, 2.462044358253479e-05, 2.71480530500412e-05, 2.9675662517547607e-05, 3.2203271985054016e-05, 3.4730881452560425e-05, 3.7258490920066833e-05, 3.978610038757324e-05, 4.231370985507965e-05, 4.484131932258606e-05, 4.736892879009247e-05, 4.989653825759888e-05, 5.2424147725105286e-05, 5.4951757192611694e-05, 5.74793666601181e-05, 6.000697612762451e-05, 6.253458559513092e-05, 6.506219506263733e-05, 6.758980453014374e-05, 7.011741399765015e-05, 7.264502346515656e-05, 7.517263293266296e-05, 7.770024240016937e-05, 8.022785186767578e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 16.0, 28.0, 31.0, 50.0, 73.0, 88.0, 184.0, 205.0, 397.0, 664.0, 1299.0, 2639.0, 5931.0, 15977.0, 75319.0, 795829.0, 116039.0, 19827.0, 7246.0, 3161.0, 1538.0, 793.0, 444.0, 278.0, 158.0, 91.0, 59.0, 48.0, 26.0, 21.0, 13.0, 10.0, 12.0, 9.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10601806640625, -0.10203075408935547, -0.09804344177246094, -0.0940561294555664, -0.09006881713867188, -0.08608150482177734, -0.08209419250488281, -0.07810688018798828, -0.07411956787109375, -0.07013225555419922, -0.06614494323730469, -0.062157630920410156, -0.058170318603515625, -0.054183006286621094, -0.05019569396972656, -0.04620838165283203, -0.0422210693359375, -0.03823375701904297, -0.03424644470214844, -0.030259132385253906, -0.026271820068359375, -0.022284507751464844, -0.018297195434570312, -0.014309883117675781, -0.01032257080078125, -0.006335258483886719, -0.0023479461669921875, 0.0016393661499023438, 0.005626678466796875, 0.009613990783691406, 0.013601303100585938, 0.01758861541748047, 0.021575927734375, 0.02556324005126953, 0.029550552368164062, 0.033537864685058594, 0.037525177001953125, 0.041512489318847656, 0.04549980163574219, 0.04948711395263672, 0.05347442626953125, 0.05746173858642578, 0.06144905090332031, 0.06543636322021484, 0.06942367553710938, 0.0734109878540039, 0.07739830017089844, 0.08138561248779297, 0.0853729248046875, 0.08936023712158203, 0.09334754943847656, 0.0973348617553711, 0.10132217407226562, 0.10530948638916016, 0.10929679870605469, 0.11328411102294922, 0.11727142333984375, 0.12125873565673828, 0.1252460479736328, 0.12923336029052734, 0.13322067260742188, 0.1372079849243164, 0.14119529724121094, 0.14518260955810547, 0.149169921875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 8.0, 13.0, 14.0, 20.0, 50.0, 74.0, 194.0, 330.0, 109.0, 49.0, 30.0, 17.0, 21.0, 8.0, 7.0, 3.0, 8.0, 4.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2073974609375, -0.1998004913330078, -0.19220352172851562, -0.18460655212402344, -0.17700958251953125, -0.16941261291503906, -0.16181564331054688, -0.1542186737060547, -0.1466217041015625, -0.1390247344970703, -0.13142776489257812, -0.12383079528808594, -0.11623382568359375, -0.10863685607910156, -0.10103988647460938, -0.09344291687011719, -0.085845947265625, -0.07824897766113281, -0.07065200805664062, -0.06305503845214844, -0.05545806884765625, -0.04786109924316406, -0.040264129638671875, -0.03266716003417969, -0.0250701904296875, -0.017473220825195312, -0.009876251220703125, -0.0022792816162109375, 0.00531768798828125, 0.012914657592773438, 0.020511627197265625, 0.028108596801757812, 0.03570556640625, 0.04330253601074219, 0.050899505615234375, 0.05849647521972656, 0.06609344482421875, 0.07369041442871094, 0.08128738403320312, 0.08888435363769531, 0.0964813232421875, 0.10407829284667969, 0.11167526245117188, 0.11927223205566406, 0.12686920166015625, 0.13446617126464844, 0.14206314086914062, 0.1496601104736328, 0.157257080078125, 0.1648540496826172, 0.17245101928710938, 0.18004798889160156, 0.18764495849609375, 0.19524192810058594, 0.20283889770507812, 0.2104358673095703, 0.2180328369140625, 0.2256298065185547, 0.23322677612304688, 0.24082374572753906, 0.24842071533203125, 0.25601768493652344, 0.2636146545410156, 0.2712116241455078, 0.27880859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 21.0, 11.0, 19.0, 68.0, 176.0, 328.0, 269.0, 73.0, 25.0, 2.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7482235431671143, -3.662583827972412, -3.576944351196289, -3.491304636001587, -3.4056649208068848, -3.3200254440307617, -3.2343857288360596, -3.1487460136413574, -3.0631065368652344, -2.9774668216705322, -2.891827344894409, -2.806187629699707, -2.720547914505005, -2.6349081993103027, -2.5492687225341797, -2.4636290073394775, -2.3779892921447754, -2.2923495769500732, -2.20671010017395, -2.121070384979248, -2.035430669784546, -1.9497910737991333, -1.8641514778137207, -1.7785117626190186, -1.692872166633606, -1.6072325706481934, -1.5215928554534912, -1.4359532594680786, -1.350313663482666, -1.2646739482879639, -1.1790343523025513, -1.0933947563171387, -1.0077552795410156, -0.9221156239509583, -0.8364759683609009, -0.7508363723754883, -0.6651967167854309, -0.5795570611953735, -0.49391746520996094, -0.40827780961990356, -0.3226381540298462, -0.23699851334095, -0.15135887265205383, -0.06571924686431885, 0.019920408725738525, 0.1055600643157959, 0.1911996603012085, 0.27683931589126587, 0.36247897148132324, 0.4481186270713806, 0.533758282661438, 0.6193978786468506, 0.705037534236908, 0.7906771898269653, 0.8763167858123779, 0.9619564414024353, 1.0475960969924927, 1.1332356929779053, 1.2188754081726074, 1.30451500415802, 1.3901546001434326, 1.4757943153381348, 1.5614339113235474, 1.64707350730896, 1.732713222503662]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 7.0, 2.0, 11.0, 11.0, 8.0, 13.0, 12.0, 14.0, 28.0, 22.0, 32.0, 35.0, 36.0, 29.0, 42.0, 44.0, 42.0, 44.0, 51.0, 53.0, 56.0, 42.0, 36.0, 27.0, 35.0, 33.0, 40.0, 30.0, 23.0, 22.0, 16.0, 17.0, 21.0, 20.0, 8.0, 8.0, 4.0, 4.0, 5.0, 6.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0845484733581543, -1.0480408668518066, -1.0115331411361694, -0.9750255346298218, -0.9385178685188293, -0.9020102024078369, -0.8655025959014893, -0.8289949297904968, -0.7924872636795044, -0.755979597568512, -0.7194719910621643, -0.6829643249511719, -0.6464566588401794, -0.609948992729187, -0.5734413862228394, -0.5369337201118469, -0.5004261136054993, -0.4639184772968292, -0.4274108111858368, -0.39090317487716675, -0.3543955087661743, -0.3178878724575043, -0.28138023614883423, -0.2448725700378418, -0.20836493372917175, -0.17185728251934052, -0.13534963130950928, -0.09884199500083923, -0.062334343791007996, -0.025826692581176758, 0.010680943727493286, 0.04718860983848572, 0.08369624614715576, 0.120203897356987, 0.15671154856681824, 0.19321918487548828, 0.22972683608531952, 0.26623448729515076, 0.3027421236038208, 0.33924978971481323, 0.3757574260234833, 0.4122650623321533, 0.44877272844314575, 0.4852803647518158, 0.5217880010604858, 0.5582956671714783, 0.5948033332824707, 0.6313109397888184, 0.6678186058998108, 0.7043262720108032, 0.7408338785171509, 0.7773415446281433, 0.8138492107391357, 0.8503568172454834, 0.8868644833564758, 0.9233721494674683, 0.9598797559738159, 0.9963874220848083, 1.0328950881958008, 1.0694026947021484, 1.105910301208496, 1.1424180269241333, 1.178925633430481, 1.2154333591461182, 1.2519409656524658]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 13.0, 15.0, 19.0, 42.0, 69.0, 136.0, 283.0, 609.0, 1920.0, 12701.0, 3996934.0, 173006.0, 6254.0, 1314.0, 471.0, 215.0, 111.0, 58.0, 42.0, 18.0, 15.0, 10.0, 0.0, 6.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467529296875, -0.4518623352050781, -0.43619537353515625, -0.4205284118652344, -0.4048614501953125, -0.3891944885253906, -0.37352752685546875, -0.3578605651855469, -0.342193603515625, -0.3265266418457031, -0.31085968017578125, -0.2951927185058594, -0.2795257568359375, -0.2638587951660156, -0.24819183349609375, -0.23252487182617188, -0.21685791015625, -0.20119094848632812, -0.18552398681640625, -0.16985702514648438, -0.1541900634765625, -0.13852310180664062, -0.12285614013671875, -0.10718917846679688, -0.091522216796875, -0.07585525512695312, -0.06018829345703125, -0.044521331787109375, -0.0288543701171875, -0.013187408447265625, 0.00247955322265625, 0.018146514892578125, 0.0338134765625, 0.049480438232421875, 0.06514739990234375, 0.08081436157226562, 0.0964813232421875, 0.11214828491210938, 0.12781524658203125, 0.14348220825195312, 0.159149169921875, 0.17481613159179688, 0.19048309326171875, 0.20615005493164062, 0.2218170166015625, 0.23748397827148438, 0.25315093994140625, 0.2688179016113281, 0.28448486328125, 0.3001518249511719, 0.31581878662109375, 0.3314857482910156, 0.3471527099609375, 0.3628196716308594, 0.37848663330078125, 0.3941535949707031, 0.409820556640625, 0.4254875183105469, 0.44115447998046875, 0.4568214416503906, 0.4724884033203125, 0.4881553649902344, 0.5038223266601562, 0.5194892883300781, 0.53515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 9.0, 12.0, 22.0, 32.0, 65.0, 115.0, 155.0, 180.0, 127.0, 113.0, 67.0, 42.0, 25.0, 12.0, 10.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0966796875, -0.09369945526123047, -0.09071922302246094, -0.0877389907836914, -0.08475875854492188, -0.08177852630615234, -0.07879829406738281, -0.07581806182861328, -0.07283782958984375, -0.06985759735107422, -0.06687736511230469, -0.06389713287353516, -0.060916900634765625, -0.057936668395996094, -0.05495643615722656, -0.05197620391845703, -0.0489959716796875, -0.04601573944091797, -0.04303550720214844, -0.040055274963378906, -0.037075042724609375, -0.034094810485839844, -0.031114578247070312, -0.02813434600830078, -0.02515411376953125, -0.02217388153076172, -0.019193649291992188, -0.016213417053222656, -0.013233184814453125, -0.010252952575683594, -0.0072727203369140625, -0.004292488098144531, -0.001312255859375, 0.0016679763793945312, 0.0046482086181640625, 0.007628440856933594, 0.010608673095703125, 0.013588905334472656, 0.016569137573242188, 0.01954936981201172, 0.02252960205078125, 0.02550983428955078, 0.028490066528320312, 0.031470298767089844, 0.034450531005859375, 0.037430763244628906, 0.04041099548339844, 0.04339122772216797, 0.0463714599609375, 0.04935169219970703, 0.05233192443847656, 0.055312156677246094, 0.058292388916015625, 0.061272621154785156, 0.06425285339355469, 0.06723308563232422, 0.07021331787109375, 0.07319355010986328, 0.07617378234863281, 0.07915401458740234, 0.08213424682617188, 0.0851144790649414, 0.08809471130371094, 0.09107494354248047, 0.09405517578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 12.0, 22.0, 27.0, 46.0, 54.0, 56.0, 99.0, 134.0, 175.0, 247.0, 321.0, 473.0, 667.0, 1106.0, 2260.0, 7380.0, 48461.0, 3934971.0, 176400.0, 13965.0, 3456.0, 1401.0, 781.0, 543.0, 346.0, 265.0, 168.0, 135.0, 103.0, 45.0, 45.0, 27.0, 26.0, 20.0, 13.0, 6.0, 1.0, 7.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.368408203125, -0.3591289520263672, -0.3498497009277344, -0.34057044982910156, -0.33129119873046875, -0.32201194763183594, -0.3127326965332031, -0.3034534454345703, -0.2941741943359375, -0.2848949432373047, -0.2756156921386719, -0.26633644104003906, -0.25705718994140625, -0.24777793884277344, -0.23849868774414062, -0.2292194366455078, -0.219940185546875, -0.2106609344482422, -0.20138168334960938, -0.19210243225097656, -0.18282318115234375, -0.17354393005371094, -0.16426467895507812, -0.1549854278564453, -0.1457061767578125, -0.1364269256591797, -0.12714767456054688, -0.11786842346191406, -0.10858917236328125, -0.09930992126464844, -0.09003067016601562, -0.08075141906738281, -0.07147216796875, -0.06219291687011719, -0.052913665771484375, -0.04363441467285156, -0.03435516357421875, -0.025075912475585938, -0.015796661376953125, -0.0065174102783203125, 0.0027618408203125, 0.012041091918945312, 0.021320343017578125, 0.030599594116210938, 0.03987884521484375, 0.04915809631347656, 0.058437347412109375, 0.06771659851074219, 0.076995849609375, 0.08627510070800781, 0.09555435180664062, 0.10483360290527344, 0.11411285400390625, 0.12339210510253906, 0.13267135620117188, 0.1419506072998047, 0.1512298583984375, 0.1605091094970703, 0.16978836059570312, 0.17906761169433594, 0.18834686279296875, 0.19762611389160156, 0.20690536499023438, 0.2161846160888672, 0.2254638671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 1.0, 10.0, 19.0, 40.0, 94.0, 415.0, 3033.0, 334.0, 64.0, 28.0, 14.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2269287109375, -0.2214508056640625, -0.215972900390625, -0.2104949951171875, -0.20501708984375, -0.1995391845703125, -0.194061279296875, -0.1885833740234375, -0.18310546875, -0.1776275634765625, -0.172149658203125, -0.1666717529296875, -0.16119384765625, -0.1557159423828125, -0.150238037109375, -0.1447601318359375, -0.1392822265625, -0.1338043212890625, -0.128326416015625, -0.1228485107421875, -0.11737060546875, -0.1118927001953125, -0.106414794921875, -0.1009368896484375, -0.095458984375, -0.0899810791015625, -0.084503173828125, -0.0790252685546875, -0.07354736328125, -0.0680694580078125, -0.062591552734375, -0.0571136474609375, -0.0516357421875, -0.0461578369140625, -0.040679931640625, -0.0352020263671875, -0.02972412109375, -0.0242462158203125, -0.018768310546875, -0.0132904052734375, -0.0078125, -0.0023345947265625, 0.003143310546875, 0.0086212158203125, 0.01409912109375, 0.0195770263671875, 0.025054931640625, 0.0305328369140625, 0.0360107421875, 0.0414886474609375, 0.046966552734375, 0.0524444580078125, 0.05792236328125, 0.0634002685546875, 0.068878173828125, 0.0743560791015625, 0.079833984375, 0.0853118896484375, 0.090789794921875, 0.0962677001953125, 0.10174560546875, 0.1072235107421875, 0.112701416015625, 0.1181793212890625, 0.1236572265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 9.0, 13.0, 46.0, 109.0, 384.0, 340.0, 88.0, 14.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1068203449249268, -2.0655229091644287, -2.0242257118225098, -1.9829282760620117, -1.9416308403015137, -1.9003335237503052, -1.8590360879898071, -1.8177387714385986, -1.7764413356781006, -1.735144019126892, -1.693846583366394, -1.6525492668151855, -1.6112518310546875, -1.569954514503479, -1.528657078742981, -1.4873597621917725, -1.4460623264312744, -1.404765009880066, -1.3634675741195679, -1.3221702575683594, -1.2808728218078613, -1.2395755052566528, -1.1982780694961548, -1.1569807529449463, -1.1156834363937378, -1.0743861198425293, -1.0330886840820312, -0.991791307926178, -0.9504939317703247, -0.9091965556144714, -0.8678991794586182, -0.8266018629074097, -0.7853043675422668, -0.7440069913864136, -0.7027096152305603, -0.661412239074707, -0.6201148629188538, -0.5788174867630005, -0.537520170211792, -0.49622276425361633, -0.45492538809776306, -0.4136280119419098, -0.3723306357860565, -0.33103328943252563, -0.28973591327667236, -0.2484385222196579, -0.20714116096496582, -0.16584378480911255, -0.12454640865325928, -0.083249032497406, -0.04195166379213333, -0.0006542950868606567, 0.040643081068992615, 0.08194045722484589, 0.12323781847953796, 0.16453519463539124, 0.2058325707912445, 0.24712994694709778, 0.28842732310295105, 0.32972466945648193, 0.3710220456123352, 0.4123194217681885, 0.45361679792404175, 0.494914174079895, 0.5362115502357483]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 2.0, 11.0, 7.0, 14.0, 14.0, 15.0, 14.0, 20.0, 36.0, 26.0, 45.0, 35.0, 47.0, 46.0, 52.0, 48.0, 43.0, 55.0, 54.0, 43.0, 48.0, 47.0, 43.0, 41.0, 29.0, 30.0, 23.0, 23.0, 18.0, 18.0, 19.0, 12.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2975556254386902, -0.2845814824104309, -0.27160730957984924, -0.25863316655158997, -0.2456590086221695, -0.23268485069274902, -0.21971070766448975, -0.20673654973506927, -0.1937623918056488, -0.18078823387622833, -0.16781407594680786, -0.15483993291854858, -0.1418657749891281, -0.12889161705970764, -0.11591746658086777, -0.1029433161020279, -0.08996915817260742, -0.07699500024318695, -0.06402084976434708, -0.051046695560216904, -0.03807254135608673, -0.02509838342666626, -0.012124232947826385, 0.0008499175310134888, 0.01382407546043396, 0.026798229664564133, 0.039772383868694305, 0.05274653807282448, 0.06572069227695465, 0.07869485020637512, 0.091669000685215, 0.10464315116405487, 0.11761730909347534, 0.1305914670228958, 0.14356562495231628, 0.15653976798057556, 0.16951392590999603, 0.1824880838394165, 0.19546222686767578, 0.20843638479709625, 0.22141054272651672, 0.2343847006559372, 0.24735885858535767, 0.26033300161361694, 0.2733071446418762, 0.2862813174724579, 0.29925546050071716, 0.31222963333129883, 0.3252037763595581, 0.3381779193878174, 0.35115209221839905, 0.3641262352466583, 0.37710040807724, 0.39007455110549927, 0.40304869413375854, 0.4160228371620178, 0.4289970099925995, 0.44197115302085876, 0.45494532585144043, 0.4679194688796997, 0.480893611907959, 0.49386778473854065, 0.5068419575691223, 0.5198161005973816, 0.5327902436256409]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 1.0, 4.0, 4.0, 11.0, 11.0, 16.0, 31.0, 28.0, 47.0, 83.0, 95.0, 150.0, 227.0, 344.0, 605.0, 1210.0, 2542.0, 7392.0, 30398.0, 226056.0, 673792.0, 82208.0, 14841.0, 4352.0, 1856.0, 872.0, 475.0, 289.0, 199.0, 131.0, 75.0, 62.0, 32.0, 25.0, 24.0, 11.0, 14.0, 7.0, 7.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.262451171875, -0.2543182373046875, -0.246185302734375, -0.2380523681640625, -0.22991943359375, -0.2217864990234375, -0.213653564453125, -0.2055206298828125, -0.1973876953125, -0.1892547607421875, -0.181121826171875, -0.1729888916015625, -0.16485595703125, -0.1567230224609375, -0.148590087890625, -0.1404571533203125, -0.13232421875, -0.1241912841796875, -0.116058349609375, -0.1079254150390625, -0.09979248046875, -0.0916595458984375, -0.083526611328125, -0.0753936767578125, -0.0672607421875, -0.0591278076171875, -0.050994873046875, -0.0428619384765625, -0.03472900390625, -0.0265960693359375, -0.018463134765625, -0.0103302001953125, -0.002197265625, 0.0059356689453125, 0.014068603515625, 0.0222015380859375, 0.03033447265625, 0.0384674072265625, 0.046600341796875, 0.0547332763671875, 0.0628662109375, 0.0709991455078125, 0.079132080078125, 0.0872650146484375, 0.09539794921875, 0.1035308837890625, 0.111663818359375, 0.1197967529296875, 0.1279296875, 0.1360626220703125, 0.144195556640625, 0.1523284912109375, 0.16046142578125, 0.1685943603515625, 0.176727294921875, 0.1848602294921875, 0.1929931640625, 0.2011260986328125, 0.209259033203125, 0.2173919677734375, 0.22552490234375, 0.2336578369140625, 0.241790771484375, 0.2499237060546875, 0.258056640625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 13.0, 11.0, 31.0, 44.0, 73.0, 110.0, 156.0, 156.0, 121.0, 98.0, 66.0, 43.0, 29.0, 15.0, 13.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.097412109375, -0.09440135955810547, -0.09139060974121094, -0.0883798599243164, -0.08536911010742188, -0.08235836029052734, -0.07934761047363281, -0.07633686065673828, -0.07332611083984375, -0.07031536102294922, -0.06730461120605469, -0.06429386138916016, -0.061283111572265625, -0.058272361755371094, -0.05526161193847656, -0.05225086212158203, -0.0492401123046875, -0.04622936248779297, -0.04321861267089844, -0.040207862854003906, -0.037197113037109375, -0.034186363220214844, -0.031175613403320312, -0.02816486358642578, -0.02515411376953125, -0.02214336395263672, -0.019132614135742188, -0.016121864318847656, -0.013111114501953125, -0.010100364685058594, -0.0070896148681640625, -0.004078865051269531, -0.001068115234375, 0.0019426345825195312, 0.0049533843994140625, 0.007964134216308594, 0.010974884033203125, 0.013985633850097656, 0.016996383666992188, 0.02000713348388672, 0.02301788330078125, 0.02602863311767578, 0.029039382934570312, 0.032050132751464844, 0.035060882568359375, 0.038071632385253906, 0.04108238220214844, 0.04409313201904297, 0.0471038818359375, 0.05011463165283203, 0.05312538146972656, 0.056136131286621094, 0.059146881103515625, 0.062157630920410156, 0.06516838073730469, 0.06817913055419922, 0.07118988037109375, 0.07420063018798828, 0.07721138000488281, 0.08022212982177734, 0.08323287963867188, 0.0862436294555664, 0.08925437927246094, 0.09226512908935547, 0.09527587890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 7.0, 14.0, 16.0, 16.0, 38.0, 55.0, 113.0, 121.0, 247.0, 455.0, 1027.0, 2399.0, 7356.0, 33275.0, 365486.0, 578564.0, 44925.0, 9191.0, 2880.0, 1091.0, 553.0, 281.0, 145.0, 98.0, 54.0, 39.0, 22.0, 18.0, 16.0, 15.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2844085693359375, -0.274627685546875, -0.2648468017578125, -0.25506591796875, -0.2452850341796875, -0.235504150390625, -0.2257232666015625, -0.2159423828125, -0.2061614990234375, -0.196380615234375, -0.1865997314453125, -0.17681884765625, -0.1670379638671875, -0.157257080078125, -0.1474761962890625, -0.1376953125, -0.1279144287109375, -0.118133544921875, -0.1083526611328125, -0.09857177734375, -0.0887908935546875, -0.079010009765625, -0.0692291259765625, -0.0594482421875, -0.0496673583984375, -0.039886474609375, -0.0301055908203125, -0.02032470703125, -0.0105438232421875, -0.000762939453125, 0.0090179443359375, 0.018798828125, 0.0285797119140625, 0.038360595703125, 0.0481414794921875, 0.05792236328125, 0.0677032470703125, 0.077484130859375, 0.0872650146484375, 0.0970458984375, 0.1068267822265625, 0.116607666015625, 0.1263885498046875, 0.13616943359375, 0.1459503173828125, 0.155731201171875, 0.1655120849609375, 0.17529296875, 0.1850738525390625, 0.194854736328125, 0.2046356201171875, 0.21441650390625, 0.2241973876953125, 0.233978271484375, 0.2437591552734375, 0.2535400390625, 0.2633209228515625, 0.273101806640625, 0.2828826904296875, 0.29266357421875, 0.3024444580078125, 0.312225341796875, 0.3220062255859375, 0.331787109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 11.0, 14.0, 8.0, 13.0, 16.0, 17.0, 16.0, 24.0, 30.0, 35.0, 34.0, 42.0, 44.0, 33.0, 51.0, 54.0, 44.0, 60.0, 42.0, 46.0, 37.0, 49.0, 39.0, 40.0, 35.0, 25.0, 21.0, 15.0, 17.0, 15.0, 7.0, 7.0, 12.0, 2.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.2412109375, -0.2338104248046875, -0.226409912109375, -0.2190093994140625, -0.21160888671875, -0.2042083740234375, -0.196807861328125, -0.1894073486328125, -0.1820068359375, -0.1746063232421875, -0.167205810546875, -0.1598052978515625, -0.15240478515625, -0.1450042724609375, -0.137603759765625, -0.1302032470703125, -0.122802734375, -0.1154022216796875, -0.108001708984375, -0.1006011962890625, -0.09320068359375, -0.0858001708984375, -0.078399658203125, -0.0709991455078125, -0.0635986328125, -0.0561981201171875, -0.048797607421875, -0.0413970947265625, -0.03399658203125, -0.0265960693359375, -0.019195556640625, -0.0117950439453125, -0.00439453125, 0.0030059814453125, 0.010406494140625, 0.0178070068359375, 0.02520751953125, 0.0326080322265625, 0.040008544921875, 0.0474090576171875, 0.0548095703125, 0.0622100830078125, 0.069610595703125, 0.0770111083984375, 0.08441162109375, 0.0918121337890625, 0.099212646484375, 0.1066131591796875, 0.114013671875, 0.1214141845703125, 0.128814697265625, 0.1362152099609375, 0.14361572265625, 0.1510162353515625, 0.158416748046875, 0.1658172607421875, 0.1732177734375, 0.1806182861328125, 0.188018798828125, 0.1954193115234375, 0.20281982421875, 0.2102203369140625, 0.217620849609375, 0.2250213623046875, 0.232421875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 5.0, 13.0, 16.0, 24.0, 25.0, 66.0, 147.0, 318.0, 698.0, 2742.0, 85185.0, 951640.0, 5862.0, 1042.0, 369.0, 191.0, 75.0, 47.0, 25.0, 24.0, 9.0, 6.0, 11.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60107421875, -0.583984375, -0.56689453125, -0.5498046875, -0.53271484375, -0.515625, -0.49853515625, -0.4814453125, -0.46435546875, -0.447265625, -0.43017578125, -0.4130859375, -0.39599609375, -0.37890625, -0.36181640625, -0.3447265625, -0.32763671875, -0.310546875, -0.29345703125, -0.2763671875, -0.25927734375, -0.2421875, -0.22509765625, -0.2080078125, -0.19091796875, -0.173828125, -0.15673828125, -0.1396484375, -0.12255859375, -0.10546875, -0.08837890625, -0.0712890625, -0.05419921875, -0.037109375, -0.02001953125, -0.0029296875, 0.01416015625, 0.03125, 0.04833984375, 0.0654296875, 0.08251953125, 0.099609375, 0.11669921875, 0.1337890625, 0.15087890625, 0.16796875, 0.18505859375, 0.2021484375, 0.21923828125, 0.236328125, 0.25341796875, 0.2705078125, 0.28759765625, 0.3046875, 0.32177734375, 0.3388671875, 0.35595703125, 0.373046875, 0.39013671875, 0.4072265625, 0.42431640625, 0.44140625, 0.45849609375, 0.4755859375, 0.49267578125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 13.0, 12.0, 18.0, 14.0, 20.0, 27.0, 22.0, 33.0, 45.0, 60.0, 90.0, 113.0, 99.0, 91.0, 63.0, 47.0, 39.0, 27.0, 26.0, 26.0, 21.0, 11.0, 14.0, 9.0, 9.0, 12.0, 3.0, 9.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.655952453613281e-05, -9.356345981359482e-05, -9.056739509105682e-05, -8.757133036851883e-05, -8.457526564598083e-05, -8.157920092344284e-05, -7.858313620090485e-05, -7.558707147836685e-05, -7.259100675582886e-05, -6.959494203329086e-05, -6.659887731075287e-05, -6.360281258821487e-05, -6.060674786567688e-05, -5.7610683143138885e-05, -5.461461842060089e-05, -5.16185536980629e-05, -4.86224889755249e-05, -4.562642425298691e-05, -4.2630359530448914e-05, -3.963429480791092e-05, -3.6638230085372925e-05, -3.364216536283493e-05, -3.0646100640296936e-05, -2.765003591775894e-05, -2.4653971195220947e-05, -2.1657906472682953e-05, -1.866184175014496e-05, -1.5665777027606964e-05, -1.266971230506897e-05, -9.673647582530975e-06, -6.677582859992981e-06, -3.6815181374549866e-06, -6.854534149169922e-07, 2.310611307621002e-06, 5.306676030158997e-06, 8.302740752696991e-06, 1.1298805475234985e-05, 1.429487019777298e-05, 1.7290934920310974e-05, 2.028699964284897e-05, 2.3283064365386963e-05, 2.6279129087924957e-05, 2.927519381046295e-05, 3.2271258533000946e-05, 3.526732325553894e-05, 3.8263387978076935e-05, 4.125945270061493e-05, 4.4255517423152924e-05, 4.725158214569092e-05, 5.024764686822891e-05, 5.324371159076691e-05, 5.62397763133049e-05, 5.9235841035842896e-05, 6.223190575838089e-05, 6.522797048091888e-05, 6.822403520345688e-05, 7.122009992599487e-05, 7.421616464853287e-05, 7.721222937107086e-05, 8.020829409360886e-05, 8.320435881614685e-05, 8.620042353868484e-05, 8.919648826122284e-05, 9.219255298376083e-05, 9.518861770629883e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 5.0, 8.0, 6.0, 12.0, 16.0, 22.0, 24.0, 29.0, 56.0, 90.0, 192.0, 319.0, 761.0, 1987.0, 6923.0, 47078.0, 895140.0, 81873.0, 9492.0, 2610.0, 965.0, 409.0, 203.0, 111.0, 75.0, 56.0, 30.0, 16.0, 6.0, 7.0, 0.0, 14.0, 9.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.248046875, -0.2406635284423828, -0.23328018188476562, -0.22589683532714844, -0.21851348876953125, -0.21113014221191406, -0.20374679565429688, -0.1963634490966797, -0.1889801025390625, -0.1815967559814453, -0.17421340942382812, -0.16683006286621094, -0.15944671630859375, -0.15206336975097656, -0.14468002319335938, -0.1372966766357422, -0.129913330078125, -0.12252998352050781, -0.11514663696289062, -0.10776329040527344, -0.10037994384765625, -0.09299659729003906, -0.08561325073242188, -0.07822990417480469, -0.0708465576171875, -0.06346321105957031, -0.056079864501953125, -0.04869651794433594, -0.04131317138671875, -0.03392982482910156, -0.026546478271484375, -0.019163131713867188, -0.01177978515625, -0.0043964385986328125, 0.002986907958984375, 0.010370254516601562, 0.01775360107421875, 0.025136947631835938, 0.032520294189453125, 0.03990364074707031, 0.0472869873046875, 0.05467033386230469, 0.062053680419921875, 0.06943702697753906, 0.07682037353515625, 0.08420372009277344, 0.09158706665039062, 0.09897041320800781, 0.106353759765625, 0.11373710632324219, 0.12112045288085938, 0.12850379943847656, 0.13588714599609375, 0.14327049255371094, 0.15065383911132812, 0.1580371856689453, 0.1654205322265625, 0.1728038787841797, 0.18018722534179688, 0.18757057189941406, 0.19495391845703125, 0.20233726501464844, 0.20972061157226562, 0.2171039581298828, 0.2244873046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 5.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 7.0, 8.0, 13.0, 14.0, 24.0, 50.0, 67.0, 119.0, 275.0, 159.0, 102.0, 44.0, 30.0, 16.0, 11.0, 10.0, 7.0, 9.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.3042259216308594, -0.29570770263671875, -0.2871894836425781, -0.2786712646484375, -0.2701530456542969, -0.26163482666015625, -0.2531166076660156, -0.244598388671875, -0.23608016967773438, -0.22756195068359375, -0.21904373168945312, -0.2105255126953125, -0.20200729370117188, -0.19348907470703125, -0.18497085571289062, -0.17645263671875, -0.16793441772460938, -0.15941619873046875, -0.15089797973632812, -0.1423797607421875, -0.13386154174804688, -0.12534332275390625, -0.11682510375976562, -0.108306884765625, -0.09978866577148438, -0.09127044677734375, -0.08275222778320312, -0.0742340087890625, -0.06571578979492188, -0.05719757080078125, -0.048679351806640625, -0.0401611328125, -0.031642913818359375, -0.02312469482421875, -0.014606475830078125, -0.0060882568359375, 0.002429962158203125, 0.01094818115234375, 0.019466400146484375, 0.027984619140625, 0.036502838134765625, 0.04502105712890625, 0.053539276123046875, 0.0620574951171875, 0.07057571411132812, 0.07909393310546875, 0.08761215209960938, 0.09613037109375, 0.10464859008789062, 0.11316680908203125, 0.12168502807617188, 0.1302032470703125, 0.13872146606445312, 0.14723968505859375, 0.15575790405273438, 0.164276123046875, 0.17279434204101562, 0.18131256103515625, 0.18983078002929688, 0.1983489990234375, 0.20686721801757812, 0.21538543701171875, 0.22390365600585938, 0.232421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 41.0, 322.0, 580.0, 40.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.710500717163086, -11.44558334350586, -11.180665016174316, -10.91574764251709, -10.650829315185547, -10.38591194152832, -10.120994567871094, -9.85607624053955, -9.591158866882324, -9.326241493225098, -9.061323165893555, -8.796405792236328, -8.531487464904785, -8.266570091247559, -8.001651763916016, -7.736734390258789, -7.471816539764404, -7.2068986892700195, -6.941980838775635, -6.67706298828125, -6.412145614624023, -6.147227764129639, -5.882309913635254, -5.617392063140869, -5.352474212646484, -5.0875563621521, -4.822638511657715, -4.557721138000488, -4.2928032875061035, -4.027885437011719, -3.762967586517334, -3.498049736022949, -3.233132839202881, -2.968214988708496, -2.7032973766326904, -2.4383795261383057, -2.1734619140625, -1.9085440635681152, -1.6436262130737305, -1.3787084817886353, -1.11379075050354, -0.8488730192184448, -0.5839552283287048, -0.31903743743896484, -0.05411970615386963, 0.21079802513122559, 0.47571587562561035, 0.7406336069107056, 1.0055513381958008, 1.270469069480896, 1.5353868007659912, 1.800304651260376, 2.0652222633361816, 2.3301401138305664, 2.595057964324951, 2.859975814819336, 3.1248934268951416, 3.3898112773895264, 3.654728889465332, 3.919646739959717, 4.184564590454102, 4.449481964111328, 4.714400291442871, 4.979317665100098, 5.244235515594482]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 10.0, 8.0, 15.0, 22.0, 27.0, 20.0, 30.0, 33.0, 62.0, 35.0, 55.0, 42.0, 56.0, 61.0, 67.0, 46.0, 54.0, 55.0, 37.0, 33.0, 47.0, 37.0, 23.0, 26.0, 19.0, 13.0, 11.0, 11.0, 14.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4613746404647827, -1.4001802206039429, -1.3389859199523926, -1.2777915000915527, -1.216597080230713, -1.155402660369873, -1.0942083597183228, -1.033013939857483, -0.9718195796012878, -0.9106252193450928, -0.8494307994842529, -0.7882364392280579, -0.7270420789718628, -0.665847659111023, -0.6046532988548279, -0.5434589385986328, -0.48226451873779297, -0.4210701286792755, -0.35987573862075806, -0.298681378364563, -0.23748698830604553, -0.17629259824752808, -0.11509823799133301, -0.05390384793281555, 0.007290542125701904, 0.06848492473363876, 0.12967930734157562, 0.19087368249893188, 0.25206807255744934, 0.3132624626159668, 0.37445682287216187, 0.4356512129306793, 0.4968454837799072, 0.5580398440361023, 0.6192342638969421, 0.6804286241531372, 0.741623044013977, 0.8028174042701721, 0.8640117645263672, 0.925206184387207, 0.9864005446434021, 1.0475949048995972, 1.108789324760437, 1.1699836254119873, 1.2311780452728271, 1.292372465133667, 1.3535668849945068, 1.4147611856460571, 1.475955605506897, 1.5371500253677368, 1.598344326019287, 1.659538745880127, 1.7207331657409668, 1.7819275856018066, 1.843121886253357, 1.9043163061141968, 1.965510606765747, 2.026705026626587, 2.0878994464874268, 2.1490936279296875, 2.2102880477905273, 2.271482467651367, 2.332676887512207, 2.393871307373047, 2.4550657272338867]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 8.0, 10.0, 13.0, 17.0, 41.0, 57.0, 80.0, 150.0, 280.0, 521.0, 1160.0, 2835.0, 9257.0, 48158.0, 3859858.0, 242071.0, 20550.0, 5454.0, 1947.0, 844.0, 418.0, 201.0, 127.0, 82.0, 41.0, 27.0, 22.0, 12.0, 8.0, 7.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.268310546875, -0.26012420654296875, -0.2519378662109375, -0.24375152587890625, -0.235565185546875, -0.22737884521484375, -0.2191925048828125, -0.21100616455078125, -0.20281982421875, -0.19463348388671875, -0.1864471435546875, -0.17826080322265625, -0.170074462890625, -0.16188812255859375, -0.1537017822265625, -0.14551544189453125, -0.1373291015625, -0.12914276123046875, -0.1209564208984375, -0.11277008056640625, -0.104583740234375, -0.09639739990234375, -0.0882110595703125, -0.08002471923828125, -0.07183837890625, -0.06365203857421875, -0.0554656982421875, -0.04727935791015625, -0.039093017578125, -0.03090667724609375, -0.0227203369140625, -0.01453399658203125, -0.00634765625, 0.00183868408203125, 0.0100250244140625, 0.01821136474609375, 0.026397705078125, 0.03458404541015625, 0.0427703857421875, 0.05095672607421875, 0.05914306640625, 0.06732940673828125, 0.0755157470703125, 0.08370208740234375, 0.091888427734375, 0.10007476806640625, 0.1082611083984375, 0.11644744873046875, 0.1246337890625, 0.13282012939453125, 0.1410064697265625, 0.14919281005859375, 0.157379150390625, 0.16556549072265625, 0.1737518310546875, 0.18193817138671875, 0.19012451171875, 0.19831085205078125, 0.2064971923828125, 0.21468353271484375, 0.222869873046875, 0.23105621337890625, 0.2392425537109375, 0.24742889404296875, 0.255615234375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 8.0, 12.0, 20.0, 34.0, 47.0, 71.0, 98.0, 109.0, 138.0, 120.0, 109.0, 70.0, 46.0, 41.0, 23.0, 17.0, 10.0, 11.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09686279296875, -0.09388446807861328, -0.09090614318847656, -0.08792781829833984, -0.08494949340820312, -0.0819711685180664, -0.07899284362792969, -0.07601451873779297, -0.07303619384765625, -0.07005786895751953, -0.06707954406738281, -0.0641012191772461, -0.061122894287109375, -0.058144569396972656, -0.05516624450683594, -0.05218791961669922, -0.0492095947265625, -0.04623126983642578, -0.04325294494628906, -0.040274620056152344, -0.037296295166015625, -0.034317970275878906, -0.03133964538574219, -0.02836132049560547, -0.02538299560546875, -0.02240467071533203, -0.019426345825195312, -0.016448020935058594, -0.013469696044921875, -0.010491371154785156, -0.0075130462646484375, -0.004534721374511719, -0.001556396484375, 0.0014219284057617188, 0.0044002532958984375, 0.007378578186035156, 0.010356903076171875, 0.013335227966308594, 0.016313552856445312, 0.01929187774658203, 0.02227020263671875, 0.02524852752685547, 0.028226852416992188, 0.031205177307128906, 0.034183502197265625, 0.037161827087402344, 0.04014015197753906, 0.04311847686767578, 0.0460968017578125, 0.04907512664794922, 0.05205345153808594, 0.055031776428222656, 0.058010101318359375, 0.060988426208496094, 0.06396675109863281, 0.06694507598876953, 0.06992340087890625, 0.07290172576904297, 0.07588005065917969, 0.0788583755493164, 0.08183670043945312, 0.08481502532958984, 0.08779335021972656, 0.09077167510986328, 0.09375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 23.0, 29.0, 36.0, 65.0, 92.0, 113.0, 233.0, 440.0, 744.0, 1259.0, 2808.0, 8921.0, 74956.0, 4025171.0, 64996.0, 8380.0, 2918.0, 1324.0, 718.0, 388.0, 223.0, 139.0, 120.0, 64.0, 44.0, 18.0, 19.0, 7.0, 8.0, 5.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.40478515625, -0.3933753967285156, -0.38196563720703125, -0.3705558776855469, -0.3591461181640625, -0.3477363586425781, -0.33632659912109375, -0.3249168395996094, -0.313507080078125, -0.3020973205566406, -0.29068756103515625, -0.2792778015136719, -0.2678680419921875, -0.2564582824707031, -0.24504852294921875, -0.23363876342773438, -0.22222900390625, -0.21081924438476562, -0.19940948486328125, -0.18799972534179688, -0.1765899658203125, -0.16518020629882812, -0.15377044677734375, -0.14236068725585938, -0.130950927734375, -0.11954116821289062, -0.10813140869140625, -0.09672164916992188, -0.0853118896484375, -0.07390213012695312, -0.06249237060546875, -0.051082611083984375, -0.0396728515625, -0.028263092041015625, -0.01685333251953125, -0.005443572998046875, 0.0059661865234375, 0.017375946044921875, 0.02878570556640625, 0.040195465087890625, 0.051605224609375, 0.06301498413085938, 0.07442474365234375, 0.08583450317382812, 0.0972442626953125, 0.10865402221679688, 0.12006378173828125, 0.13147354125976562, 0.14288330078125, 0.15429306030273438, 0.16570281982421875, 0.17711257934570312, 0.1885223388671875, 0.19993209838867188, 0.21134185791015625, 0.22275161743164062, 0.234161376953125, 0.24557113647460938, 0.25698089599609375, 0.2683906555175781, 0.2798004150390625, 0.2912101745605469, 0.30261993408203125, 0.3140296936035156, 0.325439453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 14.0, 34.0, 89.0, 501.0, 3077.0, 221.0, 55.0, 29.0, 18.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.27099609375, -0.2633190155029297, -0.2556419372558594, -0.24796485900878906, -0.24028778076171875, -0.23261070251464844, -0.22493362426757812, -0.2172565460205078, -0.2095794677734375, -0.2019023895263672, -0.19422531127929688, -0.18654823303222656, -0.17887115478515625, -0.17119407653808594, -0.16351699829101562, -0.1558399200439453, -0.148162841796875, -0.1404857635498047, -0.13280868530273438, -0.12513160705566406, -0.11745452880859375, -0.10977745056152344, -0.10210037231445312, -0.09442329406738281, -0.0867462158203125, -0.07906913757324219, -0.07139205932617188, -0.06371498107910156, -0.05603790283203125, -0.04836082458496094, -0.040683746337890625, -0.03300666809082031, -0.02532958984375, -0.017652511596679688, -0.009975433349609375, -0.0022983551025390625, 0.00537872314453125, 0.013055801391601562, 0.020732879638671875, 0.028409957885742188, 0.0360870361328125, 0.04376411437988281, 0.051441192626953125, 0.05911827087402344, 0.06679534912109375, 0.07447242736816406, 0.08214950561523438, 0.08982658386230469, 0.097503662109375, 0.10518074035644531, 0.11285781860351562, 0.12053489685058594, 0.12821197509765625, 0.13588905334472656, 0.14356613159179688, 0.1512432098388672, 0.1589202880859375, 0.1665973663330078, 0.17427444458007812, 0.18195152282714844, 0.18962860107421875, 0.19730567932128906, 0.20498275756835938, 0.2126598358154297, 0.2203369140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 15.0, 41.0, 72.0, 199.0, 283.0, 214.0, 85.0, 50.0, 20.0, 5.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7644767761230469, -0.7356289625167847, -0.7067811489105225, -0.6779333353042603, -0.649085521697998, -0.6202377080917358, -0.5913898944854736, -0.5625420808792114, -0.5336942672729492, -0.504846453666687, -0.4759986400604248, -0.4471508264541626, -0.4183030128479004, -0.3894551992416382, -0.360607385635376, -0.33175957202911377, -0.30291175842285156, -0.27406394481658936, -0.24521613121032715, -0.21636831760406494, -0.18752050399780273, -0.15867269039154053, -0.12982487678527832, -0.10097706317901611, -0.0721292495727539, -0.0432814359664917, -0.014433622360229492, 0.014414191246032715, 0.04326200485229492, 0.07210981845855713, 0.10095763206481934, 0.12980544567108154, 0.15865325927734375, 0.18750107288360596, 0.21634888648986816, 0.24519670009613037, 0.2740445137023926, 0.3028923273086548, 0.331740140914917, 0.3605879545211792, 0.3894357681274414, 0.4182835817337036, 0.4471313953399658, 0.475979208946228, 0.5048270225524902, 0.5336748361587524, 0.5625226497650146, 0.5913704633712769, 0.6202182769775391, 0.6490660905838013, 0.6779139041900635, 0.7067617177963257, 0.7356095314025879, 0.7644573450088501, 0.7933051586151123, 0.8221529722213745, 0.8510007858276367, 0.8798485994338989, 0.9086964130401611, 0.9375442266464233, 0.9663920402526855, 0.9952398538589478, 1.02408766746521, 1.0529354810714722, 1.0817832946777344]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 10.0, 7.0, 5.0, 5.0, 12.0, 9.0, 23.0, 18.0, 22.0, 19.0, 21.0, 36.0, 27.0, 28.0, 30.0, 38.0, 40.0, 38.0, 46.0, 44.0, 47.0, 32.0, 39.0, 35.0, 29.0, 45.0, 40.0, 34.0, 35.0, 35.0, 31.0, 16.0, 20.0, 13.0, 21.0, 10.0, 6.0, 7.0, 9.0, 5.0, 6.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3800247311592102, -0.3687201142311096, -0.35741546750068665, -0.34611085057258606, -0.3348062038421631, -0.3235015869140625, -0.3121969699859619, -0.30089232325553894, -0.28958767652511597, -0.2782830595970154, -0.2669784128665924, -0.2556737959384918, -0.24436914920806885, -0.23306453227996826, -0.22175990045070648, -0.2104552686214447, -0.19915065169334412, -0.18784601986408234, -0.17654138803482056, -0.16523677110671997, -0.153932124376297, -0.1426275074481964, -0.13132287561893463, -0.12001824378967285, -0.10871361196041107, -0.09740898013114929, -0.08610434830188751, -0.07479972392320633, -0.06349509209394455, -0.05219046026468277, -0.04088583588600159, -0.029581204056739807, -0.018276572227478027, -0.006971942260861397, 0.004332687705755234, 0.015637315809726715, 0.026941947638988495, 0.038246579468250275, 0.04955120384693146, 0.06085583567619324, 0.07216046750545502, 0.0834650993347168, 0.09476973116397858, 0.10607435554265976, 0.11737898737192154, 0.12868362665176392, 0.1399882435798645, 0.15129287540912628, 0.16259750723838806, 0.17390213906764984, 0.18520677089691162, 0.1965113878250122, 0.20781603455543518, 0.21912065148353577, 0.23042528331279755, 0.24172991514205933, 0.2530345320701599, 0.2643391489982605, 0.27564379572868347, 0.28694841265678406, 0.29825305938720703, 0.3095576763153076, 0.3208622932434082, 0.3321669399738312, 0.34347158670425415]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 9.0, 15.0, 16.0, 40.0, 44.0, 97.0, 131.0, 288.0, 611.0, 1787.0, 6866.0, 50388.0, 910813.0, 65977.0, 7944.0, 2024.0, 764.0, 352.0, 156.0, 74.0, 47.0, 38.0, 21.0, 21.0, 9.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41943359375, -0.4061393737792969, -0.39284515380859375, -0.3795509338378906, -0.3662567138671875, -0.3529624938964844, -0.33966827392578125, -0.3263740539550781, -0.313079833984375, -0.2997856140136719, -0.28649139404296875, -0.2731971740722656, -0.2599029541015625, -0.24660873413085938, -0.23331451416015625, -0.22002029418945312, -0.20672607421875, -0.19343185424804688, -0.18013763427734375, -0.16684341430664062, -0.1535491943359375, -0.14025497436523438, -0.12696075439453125, -0.11366653442382812, -0.100372314453125, -0.08707809448242188, -0.07378387451171875, -0.060489654541015625, -0.0471954345703125, -0.033901214599609375, -0.02060699462890625, -0.007312774658203125, 0.0059814453125, 0.019275665283203125, 0.03256988525390625, 0.045864105224609375, 0.0591583251953125, 0.07245254516601562, 0.08574676513671875, 0.09904098510742188, 0.112335205078125, 0.12562942504882812, 0.13892364501953125, 0.15221786499023438, 0.1655120849609375, 0.17880630493164062, 0.19210052490234375, 0.20539474487304688, 0.21868896484375, 0.23198318481445312, 0.24527740478515625, 0.2585716247558594, 0.2718658447265625, 0.2851600646972656, 0.29845428466796875, 0.3117485046386719, 0.325042724609375, 0.3383369445800781, 0.35163116455078125, 0.3649253845214844, 0.3782196044921875, 0.3915138244628906, 0.40480804443359375, 0.4181022644042969, 0.431396484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 7.0, 13.0, 20.0, 25.0, 55.0, 90.0, 89.0, 121.0, 116.0, 118.0, 97.0, 76.0, 58.0, 36.0, 20.0, 21.0, 17.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09857177734375, -0.09554195404052734, -0.09251213073730469, -0.08948230743408203, -0.08645248413085938, -0.08342266082763672, -0.08039283752441406, -0.0773630142211914, -0.07433319091796875, -0.0713033676147461, -0.06827354431152344, -0.06524372100830078, -0.062213897705078125, -0.05918407440185547, -0.05615425109863281, -0.053124427795410156, -0.0500946044921875, -0.047064781188964844, -0.04403495788574219, -0.04100513458251953, -0.037975311279296875, -0.03494548797607422, -0.03191566467285156, -0.028885841369628906, -0.02585601806640625, -0.022826194763183594, -0.019796371459960938, -0.01676654815673828, -0.013736724853515625, -0.010706901550292969, -0.0076770782470703125, -0.004647254943847656, -0.001617431640625, 0.0014123916625976562, 0.0044422149658203125, 0.007472038269042969, 0.010501861572265625, 0.013531684875488281, 0.016561508178710938, 0.019591331481933594, 0.02262115478515625, 0.025650978088378906, 0.028680801391601562, 0.03171062469482422, 0.034740447998046875, 0.03777027130126953, 0.04080009460449219, 0.043829917907714844, 0.0468597412109375, 0.049889564514160156, 0.05291938781738281, 0.05594921112060547, 0.058979034423828125, 0.06200885772705078, 0.06503868103027344, 0.0680685043334961, 0.07109832763671875, 0.0741281509399414, 0.07715797424316406, 0.08018779754638672, 0.08321762084960938, 0.08624744415283203, 0.08927726745605469, 0.09230709075927734, 0.0953369140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 10.0, 29.0, 27.0, 35.0, 62.0, 73.0, 119.0, 162.0, 336.0, 663.0, 1460.0, 3972.0, 14290.0, 109056.0, 856077.0, 48096.0, 8905.0, 2773.0, 1139.0, 498.0, 283.0, 155.0, 93.0, 66.0, 36.0, 23.0, 32.0, 14.0, 7.0, 8.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33251953125, -0.3225440979003906, -0.31256866455078125, -0.3025932312011719, -0.2926177978515625, -0.2826423645019531, -0.27266693115234375, -0.2626914978027344, -0.252716064453125, -0.24274063110351562, -0.23276519775390625, -0.22278976440429688, -0.2128143310546875, -0.20283889770507812, -0.19286346435546875, -0.18288803100585938, -0.17291259765625, -0.16293716430664062, -0.15296173095703125, -0.14298629760742188, -0.1330108642578125, -0.12303543090820312, -0.11305999755859375, -0.10308456420898438, -0.093109130859375, -0.08313369750976562, -0.07315826416015625, -0.06318283081054688, -0.0532073974609375, -0.043231964111328125, -0.03325653076171875, -0.023281097412109375, -0.0133056640625, -0.003330230712890625, 0.00664520263671875, 0.016620635986328125, 0.0265960693359375, 0.036571502685546875, 0.04654693603515625, 0.056522369384765625, 0.066497802734375, 0.07647323608398438, 0.08644866943359375, 0.09642410278320312, 0.1063995361328125, 0.11637496948242188, 0.12635040283203125, 0.13632583618164062, 0.14630126953125, 0.15627670288085938, 0.16625213623046875, 0.17622756958007812, 0.1862030029296875, 0.19617843627929688, 0.20615386962890625, 0.21612930297851562, 0.226104736328125, 0.23608016967773438, 0.24605560302734375, 0.2560310363769531, 0.2660064697265625, 0.2759819030761719, 0.28595733642578125, 0.2959327697753906, 0.305908203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 0.0, 3.0, 11.0, 6.0, 13.0, 16.0, 22.0, 29.0, 35.0, 40.0, 31.0, 50.0, 80.0, 82.0, 82.0, 72.0, 66.0, 63.0, 48.0, 65.0, 50.0, 39.0, 23.0, 15.0, 14.0, 8.0, 14.0, 5.0, 5.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.3832244873046875, -0.372650146484375, -0.3620758056640625, -0.35150146484375, -0.3409271240234375, -0.330352783203125, -0.3197784423828125, -0.3092041015625, -0.2986297607421875, -0.288055419921875, -0.2774810791015625, -0.26690673828125, -0.2563323974609375, -0.245758056640625, -0.2351837158203125, -0.224609375, -0.2140350341796875, -0.203460693359375, -0.1928863525390625, -0.18231201171875, -0.1717376708984375, -0.161163330078125, -0.1505889892578125, -0.1400146484375, -0.1294403076171875, -0.118865966796875, -0.1082916259765625, -0.09771728515625, -0.0871429443359375, -0.076568603515625, -0.0659942626953125, -0.055419921875, -0.0448455810546875, -0.034271240234375, -0.0236968994140625, -0.01312255859375, -0.0025482177734375, 0.008026123046875, 0.0186004638671875, 0.0291748046875, 0.0397491455078125, 0.050323486328125, 0.0608978271484375, 0.07147216796875, 0.0820465087890625, 0.092620849609375, 0.1031951904296875, 0.11376953125, 0.1243438720703125, 0.134918212890625, 0.1454925537109375, 0.15606689453125, 0.1666412353515625, 0.177215576171875, 0.1877899169921875, 0.1983642578125, 0.2089385986328125, 0.219512939453125, 0.2300872802734375, 0.24066162109375, 0.2512359619140625, 0.261810302734375, 0.2723846435546875, 0.282958984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 13.0, 17.0, 23.0, 25.0, 58.0, 108.0, 157.0, 407.0, 1029.0, 5020.0, 65001.0, 927842.0, 43109.0, 4058.0, 933.0, 354.0, 175.0, 68.0, 43.0, 44.0, 19.0, 5.0, 9.0, 14.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2034912109375, -0.19758224487304688, -0.19167327880859375, -0.18576431274414062, -0.1798553466796875, -0.17394638061523438, -0.16803741455078125, -0.16212844848632812, -0.156219482421875, -0.15031051635742188, -0.14440155029296875, -0.13849258422851562, -0.1325836181640625, -0.12667465209960938, -0.12076568603515625, -0.11485671997070312, -0.10894775390625, -0.10303878784179688, -0.09712982177734375, -0.09122085571289062, -0.0853118896484375, -0.07940292358398438, -0.07349395751953125, -0.06758499145507812, -0.061676025390625, -0.055767059326171875, -0.04985809326171875, -0.043949127197265625, -0.0380401611328125, -0.032131195068359375, -0.02622222900390625, -0.020313262939453125, -0.014404296875, -0.008495330810546875, -0.00258636474609375, 0.003322601318359375, 0.0092315673828125, 0.015140533447265625, 0.02104949951171875, 0.026958465576171875, 0.032867431640625, 0.038776397705078125, 0.04468536376953125, 0.050594329833984375, 0.0565032958984375, 0.062412261962890625, 0.06832122802734375, 0.07423019409179688, 0.08013916015625, 0.08604812622070312, 0.09195709228515625, 0.09786605834960938, 0.1037750244140625, 0.10968399047851562, 0.11559295654296875, 0.12150192260742188, 0.127410888671875, 0.13331985473632812, 0.13922882080078125, 0.14513778686523438, 0.1510467529296875, 0.15695571899414062, 0.16286468505859375, 0.16877365112304688, 0.1746826171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 9.0, 9.0, 18.0, 24.0, 36.0, 45.0, 76.0, 115.0, 151.0, 145.0, 113.0, 70.0, 43.0, 32.0, 18.0, 19.0, 15.0, 8.0, 10.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.435415267944336e-05, -9.129848331212997e-05, -8.824281394481659e-05, -8.51871445775032e-05, -8.213147521018982e-05, -7.907580584287643e-05, -7.602013647556305e-05, -7.296446710824966e-05, -6.990879774093628e-05, -6.68531283736229e-05, -6.379745900630951e-05, -6.0741789638996124e-05, -5.768612027168274e-05, -5.4630450904369354e-05, -5.157478153705597e-05, -4.8519112169742584e-05, -4.54634428024292e-05, -4.2407773435115814e-05, -3.935210406780243e-05, -3.6296434700489044e-05, -3.324076533317566e-05, -3.0185095965862274e-05, -2.712942659854889e-05, -2.4073757231235504e-05, -2.101808786392212e-05, -1.7962418496608734e-05, -1.4906749129295349e-05, -1.1851079761981964e-05, -8.795410394668579e-06, -5.739741027355194e-06, -2.684071660041809e-06, 3.7159770727157593e-07, 3.427267074584961e-06, 6.482936441898346e-06, 9.538605809211731e-06, 1.2594275176525116e-05, 1.56499445438385e-05, 1.8705613911151886e-05, 2.176128327846527e-05, 2.4816952645778656e-05, 2.787262201309204e-05, 3.0928291380405426e-05, 3.398396074771881e-05, 3.7039630115032196e-05, 4.009529948234558e-05, 4.3150968849658966e-05, 4.620663821697235e-05, 4.9262307584285736e-05, 5.231797695159912e-05, 5.5373646318912506e-05, 5.842931568622589e-05, 6.148498505353928e-05, 6.454065442085266e-05, 6.759632378816605e-05, 7.065199315547943e-05, 7.370766252279282e-05, 7.67633318901062e-05, 7.981900125741959e-05, 8.287467062473297e-05, 8.593033999204636e-05, 8.898600935935974e-05, 9.204167872667313e-05, 9.509734809398651e-05, 9.81530174612999e-05, 0.00010120868682861328]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 15.0, 11.0, 17.0, 16.0, 33.0, 57.0, 88.0, 140.0, 257.0, 442.0, 935.0, 2887.0, 15500.0, 216035.0, 780499.0, 25326.0, 3824.0, 1227.0, 520.0, 278.0, 146.0, 98.0, 66.0, 45.0, 28.0, 16.0, 10.0, 9.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2137451171875, -0.20841598510742188, -0.20308685302734375, -0.19775772094726562, -0.1924285888671875, -0.18709945678710938, -0.18177032470703125, -0.17644119262695312, -0.171112060546875, -0.16578292846679688, -0.16045379638671875, -0.15512466430664062, -0.1497955322265625, -0.14446640014648438, -0.13913726806640625, -0.13380813598632812, -0.12847900390625, -0.12314987182617188, -0.11782073974609375, -0.11249160766601562, -0.1071624755859375, -0.10183334350585938, -0.09650421142578125, -0.09117507934570312, -0.085845947265625, -0.08051681518554688, -0.07518768310546875, -0.06985855102539062, -0.0645294189453125, -0.059200286865234375, -0.05387115478515625, -0.048542022705078125, -0.043212890625, -0.037883758544921875, -0.03255462646484375, -0.027225494384765625, -0.0218963623046875, -0.016567230224609375, -0.01123809814453125, -0.005908966064453125, -0.000579833984375, 0.004749298095703125, 0.01007843017578125, 0.015407562255859375, 0.0207366943359375, 0.026065826416015625, 0.03139495849609375, 0.036724090576171875, 0.04205322265625, 0.047382354736328125, 0.05271148681640625, 0.058040618896484375, 0.0633697509765625, 0.06869888305664062, 0.07402801513671875, 0.07935714721679688, 0.084686279296875, 0.09001541137695312, 0.09534454345703125, 0.10067367553710938, 0.1060028076171875, 0.11133193969726562, 0.11666107177734375, 0.12199020385742188, 0.1273193359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 11.0, 12.0, 15.0, 22.0, 20.0, 23.0, 25.0, 43.0, 58.0, 218.0, 266.0, 52.0, 33.0, 25.0, 34.0, 25.0, 10.0, 15.0, 11.0, 12.0, 8.0, 5.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1099853515625, -0.10632896423339844, -0.10267257690429688, -0.09901618957519531, -0.09535980224609375, -0.09170341491699219, -0.08804702758789062, -0.08439064025878906, -0.0807342529296875, -0.07707786560058594, -0.07342147827148438, -0.06976509094238281, -0.06610870361328125, -0.06245231628417969, -0.058795928955078125, -0.05513954162597656, -0.051483154296875, -0.04782676696777344, -0.044170379638671875, -0.04051399230957031, -0.03685760498046875, -0.03320121765136719, -0.029544830322265625, -0.025888442993164062, -0.0222320556640625, -0.018575668334960938, -0.014919281005859375, -0.011262893676757812, -0.00760650634765625, -0.0039501190185546875, -0.000293731689453125, 0.0033626556396484375, 0.00701904296875, 0.010675430297851562, 0.014331817626953125, 0.017988204956054688, 0.02164459228515625, 0.025300979614257812, 0.028957366943359375, 0.03261375427246094, 0.0362701416015625, 0.03992652893066406, 0.043582916259765625, 0.04723930358886719, 0.05089569091796875, 0.05455207824707031, 0.058208465576171875, 0.06186485290527344, 0.065521240234375, 0.06917762756347656, 0.07283401489257812, 0.07649040222167969, 0.08014678955078125, 0.08380317687988281, 0.08745956420898438, 0.09111595153808594, 0.0947723388671875, 0.09842872619628906, 0.10208511352539062, 0.10574150085449219, 0.10939788818359375, 0.11305427551269531, 0.11671066284179688, 0.12036705017089844, 0.1240234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 859.0, 146.0, 6.0], "bins": [-34.48314666748047, -33.9256477355957, -33.36814880371094, -32.810646057128906, -32.25314712524414, -31.695648193359375, -31.13814926147461, -30.58064842224121, -30.023149490356445, -29.46565055847168, -28.90814971923828, -28.350650787353516, -27.79315185546875, -27.23565101623535, -26.678152084350586, -26.120651245117188, -25.563152313232422, -25.005653381347656, -24.448152542114258, -23.890653610229492, -23.333152770996094, -22.775653839111328, -22.218154907226562, -21.660654067993164, -21.1031551361084, -20.545656204223633, -19.988155364990234, -19.43065643310547, -18.873157501220703, -18.315656661987305, -17.75815773010254, -17.20065689086914, -16.643157958984375, -16.08565902709961, -15.528158187866211, -14.970659255981445, -14.413159370422363, -13.855659484863281, -13.298160552978516, -12.740660667419434, -12.183160781860352, -11.62566089630127, -11.068161010742188, -10.510662078857422, -9.95316219329834, -9.395662307739258, -8.838163375854492, -8.28066349029541, -7.72316312789917, -7.165663719177246, -6.608163833618164, -6.050663948059082, -5.493164539337158, -4.935665130615234, -4.378165245056152, -3.8206655979156494, -3.2631659507751465, -2.7056663036346436, -2.1481666564941406, -1.5906670093536377, -1.0331673622131348, -0.47566771507263184, 0.0818319320678711, 0.639331579208374, 1.1968311071395874]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 6.0, 9.0, 9.0, 8.0, 16.0, 13.0, 25.0, 20.0, 29.0, 27.0, 39.0, 21.0, 32.0, 40.0, 48.0, 44.0, 61.0, 50.0, 47.0, 53.0, 32.0, 54.0, 41.0, 32.0, 39.0, 33.0, 22.0, 21.0, 22.0, 14.0, 20.0, 8.0, 12.0, 15.0, 11.0, 6.0, 6.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2465689182281494, -1.2084039449691772, -1.1702390909194946, -1.1320741176605225, -1.0939092636108398, -1.0557442903518677, -1.0175793170928955, -0.9794144630432129, -0.9412494897842407, -0.9030845761299133, -0.8649196624755859, -0.8267546892166138, -0.7885897755622864, -0.750424861907959, -0.7122599482536316, -0.6740950345993042, -0.6359301209449768, -0.5977652072906494, -0.559600293636322, -0.5214353799819946, -0.48327040672302246, -0.44510549306869507, -0.4069405794143677, -0.3687756359577179, -0.3306107223033905, -0.2924458086490631, -0.25428086519241333, -0.21611595153808594, -0.17795102298259735, -0.13978609442710876, -0.10162118077278137, -0.06345623731613159, -0.0252913236618042, 0.012873601168394089, 0.05103852599859238, 0.08920344710350037, 0.12736837565898895, 0.16553330421447754, 0.20369821786880493, 0.2418631613254547, 0.2800280749797821, 0.3181929886341095, 0.3563579320907593, 0.39452284574508667, 0.43268775939941406, 0.47085270285606384, 0.5090175867080688, 0.547182559967041, 0.5853474736213684, 0.6235123872756958, 0.6616773009300232, 0.6998422145843506, 0.7380071878433228, 0.7761721014976501, 0.8143370151519775, 0.8525019884109497, 0.8906668424606323, 0.9288317561149597, 0.9669966697692871, 1.0051616430282593, 1.043326497077942, 1.081491470336914, 1.1196563243865967, 1.1578212976455688, 1.195986270904541]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 7.0, 11.0, 24.0, 28.0, 32.0, 93.0, 244.0, 753.0, 3201.0, 33354.0, 4099736.0, 51174.0, 4197.0, 873.0, 295.0, 114.0, 54.0, 35.0, 24.0, 11.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498291015625, -0.4825019836425781, -0.46671295166015625, -0.4509239196777344, -0.4351348876953125, -0.4193458557128906, -0.40355682373046875, -0.3877677917480469, -0.371978759765625, -0.3561897277832031, -0.34040069580078125, -0.3246116638183594, -0.3088226318359375, -0.2930335998535156, -0.27724456787109375, -0.2614555358886719, -0.24566650390625, -0.22987747192382812, -0.21408843994140625, -0.19829940795898438, -0.1825103759765625, -0.16672134399414062, -0.15093231201171875, -0.13514328002929688, -0.119354248046875, -0.10356521606445312, -0.08777618408203125, -0.07198715209960938, -0.0561981201171875, -0.040409088134765625, -0.02462005615234375, -0.008831024169921875, 0.0069580078125, 0.022747039794921875, 0.03853607177734375, 0.054325103759765625, 0.0701141357421875, 0.08590316772460938, 0.10169219970703125, 0.11748123168945312, 0.133270263671875, 0.14905929565429688, 0.16484832763671875, 0.18063735961914062, 0.1964263916015625, 0.21221542358398438, 0.22800445556640625, 0.24379348754882812, 0.25958251953125, 0.2753715515136719, 0.29116058349609375, 0.3069496154785156, 0.3227386474609375, 0.3385276794433594, 0.35431671142578125, 0.3701057434082031, 0.385894775390625, 0.4016838073730469, 0.41747283935546875, 0.4332618713378906, 0.4490509033203125, 0.4648399353027344, 0.48062896728515625, 0.4964179992675781, 0.51220703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 10.0, 9.0, 9.0, 20.0, 33.0, 43.0, 70.0, 82.0, 102.0, 119.0, 107.0, 105.0, 78.0, 68.0, 50.0, 23.0, 19.0, 25.0, 14.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1007080078125, -0.09765243530273438, -0.09459686279296875, -0.09154129028320312, -0.0884857177734375, -0.08543014526367188, -0.08237457275390625, -0.07931900024414062, -0.076263427734375, -0.07320785522460938, -0.07015228271484375, -0.06709671020507812, -0.0640411376953125, -0.060985565185546875, -0.05792999267578125, -0.054874420166015625, -0.05181884765625, -0.048763275146484375, -0.04570770263671875, -0.042652130126953125, -0.0395965576171875, -0.036540985107421875, -0.03348541259765625, -0.030429840087890625, -0.027374267578125, -0.024318695068359375, -0.02126312255859375, -0.018207550048828125, -0.0151519775390625, -0.012096405029296875, -0.00904083251953125, -0.005985260009765625, -0.0029296875, 0.000125885009765625, 0.00318145751953125, 0.006237030029296875, 0.0092926025390625, 0.012348175048828125, 0.01540374755859375, 0.018459320068359375, 0.021514892578125, 0.024570465087890625, 0.02762603759765625, 0.030681610107421875, 0.0337371826171875, 0.036792755126953125, 0.03984832763671875, 0.042903900146484375, 0.04595947265625, 0.049015045166015625, 0.05207061767578125, 0.055126190185546875, 0.0581817626953125, 0.061237335205078125, 0.06429290771484375, 0.06734848022460938, 0.070404052734375, 0.07345962524414062, 0.07651519775390625, 0.07957077026367188, 0.0826263427734375, 0.08568191528320312, 0.08873748779296875, 0.09179306030273438, 0.0948486328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 18.0, 22.0, 33.0, 68.0, 89.0, 177.0, 294.0, 496.0, 904.0, 2091.0, 7983.0, 83395.0, 4032252.0, 56045.0, 6706.0, 1786.0, 823.0, 461.0, 276.0, 139.0, 93.0, 57.0, 31.0, 17.0, 9.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.390380859375, -0.3779640197753906, -0.36554718017578125, -0.3531303405761719, -0.3407135009765625, -0.3282966613769531, -0.31587982177734375, -0.3034629821777344, -0.291046142578125, -0.2786293029785156, -0.26621246337890625, -0.2537956237792969, -0.2413787841796875, -0.22896194458007812, -0.21654510498046875, -0.20412826538085938, -0.19171142578125, -0.17929458618164062, -0.16687774658203125, -0.15446090698242188, -0.1420440673828125, -0.12962722778320312, -0.11721038818359375, -0.10479354858398438, -0.092376708984375, -0.07995986938476562, -0.06754302978515625, -0.055126190185546875, -0.0427093505859375, -0.030292510986328125, -0.01787567138671875, -0.005458831787109375, 0.0069580078125, 0.019374847412109375, 0.03179168701171875, 0.044208526611328125, 0.0566253662109375, 0.06904220581054688, 0.08145904541015625, 0.09387588500976562, 0.106292724609375, 0.11870956420898438, 0.13112640380859375, 0.14354324340820312, 0.1559600830078125, 0.16837692260742188, 0.18079376220703125, 0.19321060180664062, 0.20562744140625, 0.21804428100585938, 0.23046112060546875, 0.24287796020507812, 0.2552947998046875, 0.2677116394042969, 0.28012847900390625, 0.2925453186035156, 0.304962158203125, 0.3173789978027344, 0.32979583740234375, 0.3422126770019531, 0.3546295166015625, 0.3670463562011719, 0.37946319580078125, 0.3918800354003906, 0.404296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 11.0, 13.0, 28.0, 56.0, 225.0, 2719.0, 819.0, 102.0, 45.0, 21.0, 12.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2066650390625, -0.20037269592285156, -0.19408035278320312, -0.1877880096435547, -0.18149566650390625, -0.1752033233642578, -0.16891098022460938, -0.16261863708496094, -0.1563262939453125, -0.15003395080566406, -0.14374160766601562, -0.1374492645263672, -0.13115692138671875, -0.12486457824707031, -0.11857223510742188, -0.11227989196777344, -0.105987548828125, -0.09969520568847656, -0.09340286254882812, -0.08711051940917969, -0.08081817626953125, -0.07452583312988281, -0.06823348999023438, -0.06194114685058594, -0.0556488037109375, -0.04935646057128906, -0.043064117431640625, -0.03677177429199219, -0.03047943115234375, -0.024187088012695312, -0.017894744873046875, -0.011602401733398438, -0.00531005859375, 0.0009822845458984375, 0.007274627685546875, 0.013566970825195312, 0.01985931396484375, 0.026151657104492188, 0.032444000244140625, 0.03873634338378906, 0.0450286865234375, 0.05132102966308594, 0.057613372802734375, 0.06390571594238281, 0.07019805908203125, 0.07649040222167969, 0.08278274536132812, 0.08907508850097656, 0.095367431640625, 0.10165977478027344, 0.10795211791992188, 0.11424446105957031, 0.12053680419921875, 0.1268291473388672, 0.13312149047851562, 0.13941383361816406, 0.1457061767578125, 0.15199851989746094, 0.15829086303710938, 0.1645832061767578, 0.17087554931640625, 0.1771678924560547, 0.18346023559570312, 0.18975257873535156, 0.196044921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 12.0, 15.0, 47.0, 65.0, 174.0, 297.0, 212.0, 93.0, 51.0, 14.0, 10.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49684569239616394, -0.4729893207550049, -0.4491329491138458, -0.42527657747268677, -0.4014201760292053, -0.37756383419036865, -0.3537074327468872, -0.32985106110572815, -0.3059946894645691, -0.28213831782341003, -0.258281946182251, -0.23442555963993073, -0.21056918799877167, -0.1867128163576126, -0.16285642981529236, -0.1390000581741333, -0.11514368653297424, -0.09128731489181519, -0.06743093580007553, -0.043574556708335876, -0.01971818506717682, 0.004138186573982239, 0.02799457311630249, 0.05185094475746155, 0.0757073163986206, 0.09956368803977966, 0.12342006713151932, 0.14727644622325897, 0.17113281786441803, 0.1949891895055771, 0.21884557604789734, 0.2427019476890564, 0.26655828952789307, 0.2904146611690521, 0.3142710328102112, 0.3381274342536926, 0.3619837760925293, 0.38584017753601074, 0.4096965491771698, 0.43355292081832886, 0.4574092924594879, 0.481265664100647, 0.5051220655441284, 0.5289784073829651, 0.5528348088264465, 0.5766911506652832, 0.6005475521087646, 0.6244039535522461, 0.6482602953910828, 0.6721166968345642, 0.6959730386734009, 0.7198294401168823, 0.743685781955719, 0.7675421833992004, 0.7913985252380371, 0.8152549266815186, 0.839111328125, 0.8629677295684814, 0.8868240714073181, 0.9106804728507996, 0.9345368146896362, 0.9583932161331177, 0.9822496175765991, 1.006105899810791, 1.0299623012542725]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 6.0, 14.0, 19.0, 12.0, 13.0, 28.0, 31.0, 28.0, 36.0, 46.0, 48.0, 47.0, 61.0, 70.0, 70.0, 66.0, 61.0, 49.0, 55.0, 53.0, 50.0, 36.0, 29.0, 19.0, 17.0, 13.0, 9.0, 3.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36349231004714966, -0.34973224997520447, -0.3359721899032593, -0.3222121298313141, -0.3084520697593689, -0.2946920096874237, -0.2809319496154785, -0.2671718895435333, -0.25341182947158813, -0.23965176939964294, -0.22589170932769775, -0.21213164925575256, -0.19837158918380737, -0.18461152911186218, -0.170851469039917, -0.1570914089679718, -0.1433313637971878, -0.12957130372524261, -0.11581124365329742, -0.10205118358135223, -0.08829112350940704, -0.07453107088804245, -0.06077101081609726, -0.04701095074415207, -0.03325089067220688, -0.019490830600261688, -0.005730772390961647, 0.008029285818338394, 0.021789345890283585, 0.03554940223693848, 0.04930946230888367, 0.06306952238082886, 0.07682958245277405, 0.09058964252471924, 0.10434970259666443, 0.11810976266860962, 0.1318698227405548, 0.1456298828125, 0.1593899428844452, 0.17315000295639038, 0.18691006302833557, 0.20067012310028076, 0.21443018317222595, 0.22819024324417114, 0.24195030331611633, 0.2557103633880615, 0.2694704234600067, 0.2832304835319519, 0.2969905138015747, 0.3107505738735199, 0.3245106339454651, 0.3382706940174103, 0.35203075408935547, 0.36579081416130066, 0.37955087423324585, 0.39331093430519104, 0.40707099437713623, 0.4208310544490814, 0.4345911145210266, 0.4483511745929718, 0.462111234664917, 0.4758712947368622, 0.4896313548088074, 0.5033913850784302, 0.5171514749526978]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 9.0, 14.0, 22.0, 30.0, 45.0, 79.0, 109.0, 179.0, 299.0, 529.0, 1141.0, 2583.0, 7776.0, 29681.0, 264451.0, 675588.0, 48622.0, 10878.0, 3557.0, 1382.0, 642.0, 338.0, 215.0, 118.0, 73.0, 41.0, 33.0, 27.0, 25.0, 19.0, 15.0, 5.0, 2.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.217529296875, -0.2109661102294922, -0.20440292358398438, -0.19783973693847656, -0.19127655029296875, -0.18471336364746094, -0.17815017700195312, -0.1715869903564453, -0.1650238037109375, -0.1584606170654297, -0.15189743041992188, -0.14533424377441406, -0.13877105712890625, -0.13220787048339844, -0.12564468383789062, -0.11908149719238281, -0.112518310546875, -0.10595512390136719, -0.09939193725585938, -0.09282875061035156, -0.08626556396484375, -0.07970237731933594, -0.07313919067382812, -0.06657600402832031, -0.0600128173828125, -0.05344963073730469, -0.046886444091796875, -0.04032325744628906, -0.03376007080078125, -0.027196884155273438, -0.020633697509765625, -0.014070510864257812, -0.00750732421875, -0.0009441375732421875, 0.005619049072265625, 0.012182235717773438, 0.01874542236328125, 0.025308609008789062, 0.031871795654296875, 0.03843498229980469, 0.0449981689453125, 0.05156135559082031, 0.058124542236328125, 0.06468772888183594, 0.07125091552734375, 0.07781410217285156, 0.08437728881835938, 0.09094047546386719, 0.097503662109375, 0.10406684875488281, 0.11063003540039062, 0.11719322204589844, 0.12375640869140625, 0.13031959533691406, 0.13688278198242188, 0.1434459686279297, 0.1500091552734375, 0.1565723419189453, 0.16313552856445312, 0.16969871520996094, 0.17626190185546875, 0.18282508850097656, 0.18938827514648438, 0.1959514617919922, 0.2025146484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 13.0, 12.0, 18.0, 36.0, 36.0, 61.0, 99.0, 101.0, 105.0, 108.0, 98.0, 88.0, 67.0, 43.0, 33.0, 20.0, 20.0, 14.0, 14.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.103515625, -0.10038471221923828, -0.09725379943847656, -0.09412288665771484, -0.09099197387695312, -0.0878610610961914, -0.08473014831542969, -0.08159923553466797, -0.07846832275390625, -0.07533740997314453, -0.07220649719238281, -0.0690755844116211, -0.06594467163085938, -0.06281375885009766, -0.05968284606933594, -0.05655193328857422, -0.0534210205078125, -0.05029010772705078, -0.04715919494628906, -0.044028282165527344, -0.040897369384765625, -0.037766456604003906, -0.03463554382324219, -0.03150463104248047, -0.02837371826171875, -0.02524280548095703, -0.022111892700195312, -0.018980979919433594, -0.015850067138671875, -0.012719154357910156, -0.009588241577148438, -0.006457328796386719, -0.003326416015625, -0.00019550323486328125, 0.0029354095458984375, 0.006066322326660156, 0.009197235107421875, 0.012328147888183594, 0.015459060668945312, 0.01858997344970703, 0.02172088623046875, 0.02485179901123047, 0.027982711791992188, 0.031113624572753906, 0.034244537353515625, 0.037375450134277344, 0.04050636291503906, 0.04363727569580078, 0.0467681884765625, 0.04989910125732422, 0.05303001403808594, 0.056160926818847656, 0.059291839599609375, 0.062422752380371094, 0.06555366516113281, 0.06868457794189453, 0.07181549072265625, 0.07494640350341797, 0.07807731628417969, 0.0812082290649414, 0.08433914184570312, 0.08747005462646484, 0.09060096740722656, 0.09373188018798828, 0.09686279296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 6.0, 11.0, 22.0, 25.0, 35.0, 50.0, 73.0, 132.0, 228.0, 400.0, 867.0, 2081.0, 6551.0, 26575.0, 186767.0, 742393.0, 62874.0, 12956.0, 3651.0, 1428.0, 630.0, 300.0, 170.0, 106.0, 80.0, 37.0, 23.0, 18.0, 18.0, 17.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2271728515625, -0.22072982788085938, -0.21428680419921875, -0.20784378051757812, -0.2014007568359375, -0.19495773315429688, -0.18851470947265625, -0.18207168579101562, -0.175628662109375, -0.16918563842773438, -0.16274261474609375, -0.15629959106445312, -0.1498565673828125, -0.14341354370117188, -0.13697052001953125, -0.13052749633789062, -0.12408447265625, -0.11764144897460938, -0.11119842529296875, -0.10475540161132812, -0.0983123779296875, -0.09186935424804688, -0.08542633056640625, -0.07898330688476562, -0.072540283203125, -0.06609725952148438, -0.05965423583984375, -0.053211212158203125, -0.0467681884765625, -0.040325164794921875, -0.03388214111328125, -0.027439117431640625, -0.02099609375, -0.014553070068359375, -0.00811004638671875, -0.001667022705078125, 0.0047760009765625, 0.011219024658203125, 0.01766204833984375, 0.024105072021484375, 0.030548095703125, 0.036991119384765625, 0.04343414306640625, 0.049877166748046875, 0.0563201904296875, 0.06276321411132812, 0.06920623779296875, 0.07564926147460938, 0.08209228515625, 0.08853530883789062, 0.09497833251953125, 0.10142135620117188, 0.1078643798828125, 0.11430740356445312, 0.12075042724609375, 0.12719345092773438, 0.133636474609375, 0.14007949829101562, 0.14652252197265625, 0.15296554565429688, 0.1594085693359375, 0.16585159301757812, 0.17229461669921875, 0.17873764038085938, 0.1851806640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 6.0, 7.0, 11.0, 13.0, 15.0, 13.0, 22.0, 26.0, 32.0, 48.0, 44.0, 41.0, 43.0, 60.0, 59.0, 49.0, 54.0, 45.0, 44.0, 35.0, 37.0, 36.0, 34.0, 39.0, 43.0, 24.0, 18.0, 17.0, 17.0, 10.0, 13.0, 4.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.27587890625, -0.2677764892578125, -0.259674072265625, -0.2515716552734375, -0.24346923828125, -0.2353668212890625, -0.227264404296875, -0.2191619873046875, -0.2110595703125, -0.2029571533203125, -0.194854736328125, -0.1867523193359375, -0.17864990234375, -0.1705474853515625, -0.162445068359375, -0.1543426513671875, -0.146240234375, -0.1381378173828125, -0.130035400390625, -0.1219329833984375, -0.11383056640625, -0.1057281494140625, -0.097625732421875, -0.0895233154296875, -0.0814208984375, -0.0733184814453125, -0.065216064453125, -0.0571136474609375, -0.04901123046875, -0.0409088134765625, -0.032806396484375, -0.0247039794921875, -0.0166015625, -0.0084991455078125, -0.000396728515625, 0.0077056884765625, 0.01580810546875, 0.0239105224609375, 0.032012939453125, 0.0401153564453125, 0.0482177734375, 0.0563201904296875, 0.064422607421875, 0.0725250244140625, 0.08062744140625, 0.0887298583984375, 0.096832275390625, 0.1049346923828125, 0.113037109375, 0.1211395263671875, 0.129241943359375, 0.1373443603515625, 0.14544677734375, 0.1535491943359375, 0.161651611328125, 0.1697540283203125, 0.1778564453125, 0.1859588623046875, 0.194061279296875, 0.2021636962890625, 0.21026611328125, 0.2183685302734375, 0.226470947265625, 0.2345733642578125, 0.24267578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 5.0, 3.0, 10.0, 12.0, 13.0, 21.0, 28.0, 66.0, 100.0, 232.0, 541.0, 1723.0, 9890.0, 188998.0, 820126.0, 22581.0, 2848.0, 731.0, 287.0, 124.0, 59.0, 45.0, 28.0, 21.0, 12.0, 8.0, 9.0, 5.0, 5.0, 8.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1407470703125, -0.1365032196044922, -0.13225936889648438, -0.12801551818847656, -0.12377166748046875, -0.11952781677246094, -0.11528396606445312, -0.11104011535644531, -0.1067962646484375, -0.10255241394042969, -0.09830856323242188, -0.09406471252441406, -0.08982086181640625, -0.08557701110839844, -0.08133316040039062, -0.07708930969238281, -0.072845458984375, -0.06860160827636719, -0.06435775756835938, -0.06011390686035156, -0.05587005615234375, -0.05162620544433594, -0.047382354736328125, -0.04313850402832031, -0.0388946533203125, -0.03465080261230469, -0.030406951904296875, -0.026163101196289062, -0.02191925048828125, -0.017675399780273438, -0.013431549072265625, -0.009187698364257812, -0.00494384765625, -0.0006999969482421875, 0.003543853759765625, 0.0077877044677734375, 0.01203155517578125, 0.016275405883789062, 0.020519256591796875, 0.024763107299804688, 0.0290069580078125, 0.03325080871582031, 0.037494659423828125, 0.04173851013183594, 0.04598236083984375, 0.05022621154785156, 0.054470062255859375, 0.05871391296386719, 0.062957763671875, 0.06720161437988281, 0.07144546508789062, 0.07568931579589844, 0.07993316650390625, 0.08417701721191406, 0.08842086791992188, 0.09266471862792969, 0.0969085693359375, 0.10115242004394531, 0.10539627075195312, 0.10964012145996094, 0.11388397216796875, 0.11812782287597656, 0.12237167358398438, 0.1266155242919922, 0.130859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 1.0, 10.0, 15.0, 20.0, 30.0, 25.0, 61.0, 71.0, 88.0, 134.0, 135.0, 123.0, 81.0, 51.0, 37.0, 24.0, 19.0, 13.0, 9.0, 4.0, 8.0, 1.0, 5.0, 12.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18235969543457e-05, -6.908830255270004e-05, -6.635300815105438e-05, -6.361771374940872e-05, -6.088241934776306e-05, -5.81471249461174e-05, -5.541183054447174e-05, -5.267653614282608e-05, -4.994124174118042e-05, -4.720594733953476e-05, -4.44706529378891e-05, -4.173535853624344e-05, -3.900006413459778e-05, -3.626476973295212e-05, -3.352947533130646e-05, -3.07941809296608e-05, -2.8058886528015137e-05, -2.5323592126369476e-05, -2.2588297724723816e-05, -1.9853003323078156e-05, -1.7117708921432495e-05, -1.4382414519786835e-05, -1.1647120118141174e-05, -8.911825716495514e-06, -6.1765313148498535e-06, -3.441236913204193e-06, -7.059425115585327e-07, 2.0293518900871277e-06, 4.764646291732788e-06, 7.4999406933784485e-06, 1.0235235095024109e-05, 1.297052949666977e-05, 1.570582389831543e-05, 1.844111829996109e-05, 2.117641270160675e-05, 2.391170710325241e-05, 2.664700150489807e-05, 2.938229590654373e-05, 3.211759030818939e-05, 3.485288470983505e-05, 3.758817911148071e-05, 4.032347351312637e-05, 4.3058767914772034e-05, 4.5794062316417694e-05, 4.8529356718063354e-05, 5.1264651119709015e-05, 5.3999945521354675e-05, 5.6735239923000336e-05, 5.9470534324645996e-05, 6.220582872629166e-05, 6.494112312793732e-05, 6.767641752958298e-05, 7.041171193122864e-05, 7.31470063328743e-05, 7.588230073451996e-05, 7.861759513616562e-05, 8.135288953781128e-05, 8.408818393945694e-05, 8.68234783411026e-05, 8.955877274274826e-05, 9.229406714439392e-05, 9.502936154603958e-05, 9.776465594768524e-05, 0.0001004999503493309, 0.00010323524475097656]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 7.0, 17.0, 32.0, 60.0, 95.0, 227.0, 551.0, 2060.0, 15387.0, 770148.0, 247639.0, 9890.0, 1552.0, 493.0, 170.0, 93.0, 50.0, 21.0, 22.0, 11.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103271484375, -0.09833335876464844, -0.09339523315429688, -0.08845710754394531, -0.08351898193359375, -0.07858085632324219, -0.07364273071289062, -0.06870460510253906, -0.0637664794921875, -0.05882835388183594, -0.053890228271484375, -0.04895210266113281, -0.04401397705078125, -0.03907585144042969, -0.034137725830078125, -0.029199600219726562, -0.024261474609375, -0.019323348999023438, -0.014385223388671875, -0.009447097778320312, -0.00450897216796875, 0.0004291534423828125, 0.005367279052734375, 0.010305404663085938, 0.0152435302734375, 0.020181655883789062, 0.025119781494140625, 0.030057907104492188, 0.03499603271484375, 0.03993415832519531, 0.044872283935546875, 0.04981040954589844, 0.05474853515625, 0.05968666076660156, 0.06462478637695312, 0.06956291198730469, 0.07450103759765625, 0.07943916320800781, 0.08437728881835938, 0.08931541442871094, 0.0942535400390625, 0.09919166564941406, 0.10412979125976562, 0.10906791687011719, 0.11400604248046875, 0.11894416809082031, 0.12388229370117188, 0.12882041931152344, 0.133758544921875, 0.13869667053222656, 0.14363479614257812, 0.1485729217529297, 0.15351104736328125, 0.1584491729736328, 0.16338729858398438, 0.16832542419433594, 0.1732635498046875, 0.17820167541503906, 0.18313980102539062, 0.1880779266357422, 0.19301605224609375, 0.1979541778564453, 0.20289230346679688, 0.20783042907714844, 0.2127685546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 7.0, 9.0, 7.0, 8.0, 20.0, 33.0, 50.0, 51.0, 88.0, 274.0, 183.0, 74.0, 50.0, 39.0, 29.0, 13.0, 15.0, 10.0, 7.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08233642578125, -0.0787210464477539, -0.07510566711425781, -0.07149028778076172, -0.06787490844726562, -0.06425952911376953, -0.06064414978027344, -0.057028770446777344, -0.05341339111328125, -0.049798011779785156, -0.04618263244628906, -0.04256725311279297, -0.038951873779296875, -0.03533649444580078, -0.03172111511230469, -0.028105735778808594, -0.0244903564453125, -0.020874977111816406, -0.017259597778320312, -0.013644218444824219, -0.010028839111328125, -0.006413459777832031, -0.0027980804443359375, 0.0008172988891601562, 0.00443267822265625, 0.008048057556152344, 0.011663436889648438, 0.015278816223144531, 0.018894195556640625, 0.02250957489013672, 0.026124954223632812, 0.029740333557128906, 0.033355712890625, 0.036971092224121094, 0.04058647155761719, 0.04420185089111328, 0.047817230224609375, 0.05143260955810547, 0.05504798889160156, 0.058663368225097656, 0.06227874755859375, 0.06589412689208984, 0.06950950622558594, 0.07312488555908203, 0.07674026489257812, 0.08035564422607422, 0.08397102355957031, 0.0875864028930664, 0.0912017822265625, 0.0948171615600586, 0.09843254089355469, 0.10204792022705078, 0.10566329956054688, 0.10927867889404297, 0.11289405822753906, 0.11650943756103516, 0.12012481689453125, 0.12374019622802734, 0.12735557556152344, 0.13097095489501953, 0.13458633422851562, 0.13820171356201172, 0.1418170928955078, 0.1454324722290039, 0.1490478515625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 573.0, 421.0, 12.0, 4.0], "bins": [-16.600149154663086, -16.327838897705078, -16.055530548095703, -15.783220291137695, -15.510910987854004, -15.238601684570312, -14.966291427612305, -14.693982124328613, -14.421672821044922, -14.14936351776123, -13.877053260803223, -13.604743957519531, -13.33243465423584, -13.060125350952148, -12.78781509399414, -12.51550579071045, -12.243196487426758, -11.970887184143066, -11.698576927185059, -11.426267623901367, -11.153958320617676, -10.881649017333984, -10.609338760375977, -10.337029457092285, -10.064719200134277, -9.792409896850586, -9.520099639892578, -9.247790336608887, -8.975481033325195, -8.703171730041504, -8.430861473083496, -8.158552169799805, -7.8862433433532715, -7.613933563232422, -7.3416242599487305, -7.069314479827881, -6.7970051765441895, -6.52469539642334, -6.252386093139648, -5.980076313018799, -5.707766532897949, -5.4354567527771, -5.163147449493408, -4.890837669372559, -4.618528366088867, -4.346218585968018, -4.073908805847168, -3.8015995025634766, -3.529290199279785, -3.2569806575775146, -2.984671115875244, -2.7123613357543945, -2.440052032470703, -2.1677422523498535, -1.895432710647583, -1.6231231689453125, -1.350813627243042, -1.0785040855407715, -0.8061944842338562, -0.5338848829269409, -0.2615753412246704, 0.010734200477600098, 0.28304386138916016, 0.5553534030914307, 0.827663004398346]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 6.0, 1.0, 5.0, 5.0, 3.0, 8.0, 11.0, 7.0, 14.0, 9.0, 12.0, 13.0, 20.0, 18.0, 24.0, 28.0, 33.0, 21.0, 30.0, 32.0, 32.0, 31.0, 28.0, 42.0, 39.0, 38.0, 45.0, 38.0, 46.0, 38.0, 30.0, 40.0, 32.0, 23.0, 23.0, 18.0, 26.0, 27.0, 13.0, 26.0, 18.0, 10.0, 8.0, 10.0, 6.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9027281999588013, -0.8719969391822815, -0.8412656188011169, -0.8105343580245972, -0.7798030376434326, -0.7490717768669128, -0.7183405160903931, -0.6876091957092285, -0.6568779349327087, -0.626146674156189, -0.5954153537750244, -0.5646840929985046, -0.5339527726173401, -0.5032215118408203, -0.47249022126197815, -0.441758930683136, -0.4110276401042938, -0.38029634952545166, -0.3495650589466095, -0.31883376836776733, -0.28810250759124756, -0.2573712170124054, -0.22663992643356323, -0.19590865075588226, -0.1651773601770401, -0.13444606959819794, -0.10371479392051697, -0.0729835033416748, -0.04225222021341324, -0.011520937085151672, 0.01921035349369049, 0.04994162917137146, 0.08067291975021362, 0.11140420287847519, 0.14213548600673676, 0.17286677658557892, 0.2035980522632599, 0.23432934284210205, 0.2650606334209442, 0.2957919239997864, 0.32652318477630615, 0.3572544753551483, 0.3879857659339905, 0.41871702671051025, 0.4494483172893524, 0.4801796078681946, 0.5109108686447144, 0.5416421890258789, 0.5723735094070435, 0.6031047701835632, 0.6338360905647278, 0.6645673513412476, 0.6952986717224121, 0.7260299324989319, 0.7567611932754517, 0.7874925136566162, 0.818223774433136, 0.8489550352096558, 0.8796863555908203, 0.9104176163673401, 0.9411489367485046, 0.9718801975250244, 1.002611517906189, 1.033342719078064, 1.0640740394592285]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 15.0, 10.0, 15.0, 27.0, 102.0, 254.0, 931.0, 7670.0, 4042339.0, 138076.0, 3841.0, 650.0, 189.0, 71.0, 34.0, 22.0, 9.0, 11.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.0216293334960938, -0.9905242919921875, -0.9594192504882812, -0.928314208984375, -0.8972091674804688, -0.8661041259765625, -0.8349990844726562, -0.80389404296875, -0.7727890014648438, -0.7416839599609375, -0.7105789184570312, -0.679473876953125, -0.6483688354492188, -0.6172637939453125, -0.5861587524414062, -0.5550537109375, -0.5239486694335938, -0.4928436279296875, -0.46173858642578125, -0.430633544921875, -0.39952850341796875, -0.3684234619140625, -0.33731842041015625, -0.30621337890625, -0.27510833740234375, -0.2440032958984375, -0.21289825439453125, -0.181793212890625, -0.15068817138671875, -0.1195831298828125, -0.08847808837890625, -0.057373046875, -0.02626800537109375, 0.0048370361328125, 0.03594207763671875, 0.067047119140625, 0.09815216064453125, 0.1292572021484375, 0.16036224365234375, 0.19146728515625, 0.22257232666015625, 0.2536773681640625, 0.28478240966796875, 0.315887451171875, 0.34699249267578125, 0.3780975341796875, 0.40920257568359375, 0.4403076171875, 0.47141265869140625, 0.5025177001953125, 0.5336227416992188, 0.564727783203125, 0.5958328247070312, 0.6269378662109375, 0.6580429077148438, 0.68914794921875, 0.7202529907226562, 0.7513580322265625, 0.7824630737304688, 0.813568115234375, 0.8446731567382812, 0.8757781982421875, 0.9068832397460938, 0.93798828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 8.0, 15.0, 29.0, 31.0, 63.0, 67.0, 105.0, 108.0, 115.0, 109.0, 90.0, 70.0, 51.0, 43.0, 23.0, 21.0, 16.0, 9.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.10394287109375, -0.10083866119384766, -0.09773445129394531, -0.09463024139404297, -0.09152603149414062, -0.08842182159423828, -0.08531761169433594, -0.0822134017944336, -0.07910919189453125, -0.0760049819946289, -0.07290077209472656, -0.06979656219482422, -0.06669235229492188, -0.06358814239501953, -0.06048393249511719, -0.057379722595214844, -0.0542755126953125, -0.051171302795410156, -0.04806709289550781, -0.04496288299560547, -0.041858673095703125, -0.03875446319580078, -0.03565025329589844, -0.032546043395996094, -0.02944183349609375, -0.026337623596191406, -0.023233413696289062, -0.02012920379638672, -0.017024993896484375, -0.013920783996582031, -0.010816574096679688, -0.007712364196777344, -0.004608154296875, -0.0015039443969726562, 0.0016002655029296875, 0.004704475402832031, 0.007808685302734375, 0.010912895202636719, 0.014017105102539062, 0.017121315002441406, 0.02022552490234375, 0.023329734802246094, 0.026433944702148438, 0.02953815460205078, 0.032642364501953125, 0.03574657440185547, 0.03885078430175781, 0.041954994201660156, 0.0450592041015625, 0.048163414001464844, 0.05126762390136719, 0.05437183380126953, 0.057476043701171875, 0.06058025360107422, 0.06368446350097656, 0.0667886734008789, 0.06989288330078125, 0.0729970932006836, 0.07610130310058594, 0.07920551300048828, 0.08230972290039062, 0.08541393280029297, 0.08851814270019531, 0.09162235260009766, 0.0947265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 6.0, 16.0, 20.0, 30.0, 30.0, 47.0, 71.0, 73.0, 105.0, 162.0, 269.0, 387.0, 693.0, 1213.0, 2525.0, 7550.0, 44504.0, 3855720.0, 255311.0, 16880.0, 4449.0, 1724.0, 903.0, 563.0, 314.0, 219.0, 124.0, 110.0, 69.0, 46.0, 40.0, 34.0, 21.0, 11.0, 12.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.375396728515625, -0.36187744140625, -0.348358154296875, -0.3348388671875, -0.321319580078125, -0.30780029296875, -0.294281005859375, -0.28076171875, -0.267242431640625, -0.25372314453125, -0.240203857421875, -0.2266845703125, -0.213165283203125, -0.19964599609375, -0.186126708984375, -0.172607421875, -0.159088134765625, -0.14556884765625, -0.132049560546875, -0.1185302734375, -0.105010986328125, -0.09149169921875, -0.077972412109375, -0.064453125, -0.050933837890625, -0.03741455078125, -0.023895263671875, -0.0103759765625, 0.003143310546875, 0.01666259765625, 0.030181884765625, 0.043701171875, 0.057220458984375, 0.07073974609375, 0.084259033203125, 0.0977783203125, 0.111297607421875, 0.12481689453125, 0.138336181640625, 0.15185546875, 0.165374755859375, 0.17889404296875, 0.192413330078125, 0.2059326171875, 0.219451904296875, 0.23297119140625, 0.246490478515625, 0.260009765625, 0.273529052734375, 0.28704833984375, 0.300567626953125, 0.3140869140625, 0.327606201171875, 0.34112548828125, 0.354644775390625, 0.3681640625, 0.381683349609375, 0.39520263671875, 0.408721923828125, 0.4222412109375, 0.435760498046875, 0.44927978515625, 0.462799072265625, 0.476318359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 7.0, 7.0, 21.0, 37.0, 173.0, 3066.0, 615.0, 80.0, 27.0, 16.0, 11.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322265625, -0.31180572509765625, -0.3013458251953125, -0.29088592529296875, -0.280426025390625, -0.26996612548828125, -0.2595062255859375, -0.24904632568359375, -0.23858642578125, -0.22812652587890625, -0.2176666259765625, -0.20720672607421875, -0.196746826171875, -0.18628692626953125, -0.1758270263671875, -0.16536712646484375, -0.1549072265625, -0.14444732666015625, -0.1339874267578125, -0.12352752685546875, -0.113067626953125, -0.10260772705078125, -0.0921478271484375, -0.08168792724609375, -0.07122802734375, -0.06076812744140625, -0.0503082275390625, -0.03984832763671875, -0.029388427734375, -0.01892852783203125, -0.0084686279296875, 0.00199127197265625, 0.012451171875, 0.02291107177734375, 0.0333709716796875, 0.04383087158203125, 0.054290771484375, 0.06475067138671875, 0.0752105712890625, 0.08567047119140625, 0.09613037109375, 0.10659027099609375, 0.1170501708984375, 0.12751007080078125, 0.137969970703125, 0.14842987060546875, 0.1588897705078125, 0.16934967041015625, 0.1798095703125, 0.19026947021484375, 0.2007293701171875, 0.21118927001953125, 0.221649169921875, 0.23210906982421875, 0.2425689697265625, 0.25302886962890625, 0.26348876953125, 0.27394866943359375, 0.2844085693359375, 0.29486846923828125, 0.305328369140625, 0.31578826904296875, 0.3262481689453125, 0.33670806884765625, 0.34716796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 10.0, 7.0, 19.0, 25.0, 39.0, 52.0, 99.0, 143.0, 172.0, 144.0, 123.0, 68.0, 36.0, 17.0, 11.0, 12.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.7999388575553894, -0.7821212410926819, -0.7643036246299744, -0.7464860081672668, -0.7286684513092041, -0.7108508348464966, -0.6930332183837891, -0.6752156019210815, -0.657397985458374, -0.6395803689956665, -0.621762752532959, -0.6039451360702515, -0.586127519607544, -0.5683099627494812, -0.5504923462867737, -0.5326747298240662, -0.5148571133613586, -0.4970394968986511, -0.4792218804359436, -0.46140429377555847, -0.44358667731285095, -0.42576906085014343, -0.4079514741897583, -0.3901338577270508, -0.37231624126434326, -0.35449862480163574, -0.3366810083389282, -0.3188634216785431, -0.30104580521583557, -0.28322818875312805, -0.2654106020927429, -0.2475929856300354, -0.2297753095626831, -0.21195769309997559, -0.19414009153842926, -0.17632248997688293, -0.15850487351417542, -0.1406872570514679, -0.12286965548992157, -0.10505204647779465, -0.08723443746566772, -0.0694168284535408, -0.05159921944141388, -0.03378161042928696, -0.015964001417160034, 0.0018536075949668884, 0.01967121660709381, 0.037488825619220734, 0.055306434631347656, 0.07312404364347458, 0.0909416526556015, 0.10875926166772842, 0.12657687067985535, 0.14439448714256287, 0.1622120887041092, 0.18002969026565552, 0.19784730672836304, 0.21566492319107056, 0.23348252475261688, 0.2513001263141632, 0.2691177427768707, 0.28693535923957825, 0.3047529458999634, 0.3225705623626709, 0.3403881788253784]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 7.0, 17.0, 17.0, 27.0, 20.0, 39.0, 35.0, 53.0, 51.0, 65.0, 59.0, 57.0, 57.0, 77.0, 67.0, 53.0, 46.0, 40.0, 34.0, 35.0, 24.0, 24.0, 20.0, 21.0, 14.0, 16.0, 2.0, 6.0, 3.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4931862950325012, -0.4745917022228241, -0.45599713921546936, -0.43740254640579224, -0.4188079833984375, -0.4002133905887604, -0.38161879777908325, -0.3630242347717285, -0.3444296419620514, -0.32583504915237427, -0.30724048614501953, -0.2886458933353424, -0.2700513005256653, -0.25145673751831055, -0.23286214470863342, -0.2142675668001175, -0.19567298889160156, -0.17707841098308563, -0.1584838330745697, -0.13988924026489258, -0.12129466235637665, -0.10270008444786072, -0.08410549908876419, -0.06551091372966766, -0.04691633582115173, -0.028321754187345505, -0.009727172553539276, 0.008867409080266953, 0.02746199071407318, 0.04605656862258911, 0.06465115398168564, 0.08324573934078217, 0.1018403172492981, 0.12043489515781403, 0.13902947306632996, 0.15762406587600708, 0.176218643784523, 0.19481322169303894, 0.21340781450271606, 0.232002392411232, 0.2505969703197479, 0.26919156312942505, 0.2877861261367798, 0.3063807189464569, 0.32497531175613403, 0.34356987476348877, 0.3621644675731659, 0.380759060382843, 0.39935362339019775, 0.4179482161998749, 0.4365427792072296, 0.45513737201690674, 0.4737319350242615, 0.4923265278339386, 0.5109211206436157, 0.5295156836509705, 0.5481102466583252, 0.5667048096656799, 0.5852994322776794, 0.6038939952850342, 0.6224885582923889, 0.6410831212997437, 0.6596777439117432, 0.6782723069190979, 0.6968669295310974]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 6.0, 12.0, 20.0, 27.0, 54.0, 66.0, 124.0, 219.0, 470.0, 1084.0, 3153.0, 15151.0, 150078.0, 780443.0, 83253.0, 10291.0, 2371.0, 873.0, 364.0, 213.0, 102.0, 70.0, 36.0, 22.0, 14.0, 13.0, 7.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4668159484863281, -0.45145416259765625, -0.4360923767089844, -0.4207305908203125, -0.4053688049316406, -0.39000701904296875, -0.3746452331542969, -0.359283447265625, -0.3439216613769531, -0.32855987548828125, -0.3131980895996094, -0.2978363037109375, -0.2824745178222656, -0.26711273193359375, -0.2517509460449219, -0.23638916015625, -0.22102737426757812, -0.20566558837890625, -0.19030380249023438, -0.1749420166015625, -0.15958023071289062, -0.14421844482421875, -0.12885665893554688, -0.113494873046875, -0.09813308715820312, -0.08277130126953125, -0.06740951538085938, -0.0520477294921875, -0.036685943603515625, -0.02132415771484375, -0.005962371826171875, 0.0093994140625, 0.024761199951171875, 0.04012298583984375, 0.055484771728515625, 0.0708465576171875, 0.08620834350585938, 0.10157012939453125, 0.11693191528320312, 0.132293701171875, 0.14765548706054688, 0.16301727294921875, 0.17837905883789062, 0.1937408447265625, 0.20910263061523438, 0.22446441650390625, 0.23982620239257812, 0.25518798828125, 0.2705497741699219, 0.28591156005859375, 0.3012733459472656, 0.3166351318359375, 0.3319969177246094, 0.34735870361328125, 0.3627204895019531, 0.378082275390625, 0.3934440612792969, 0.40880584716796875, 0.4241676330566406, 0.4395294189453125, 0.4548912048339844, 0.47025299072265625, 0.4856147766113281, 0.5009765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 13.0, 16.0, 21.0, 41.0, 58.0, 73.0, 108.0, 99.0, 112.0, 97.0, 80.0, 68.0, 56.0, 45.0, 36.0, 30.0, 17.0, 11.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1090087890625, -0.10567378997802734, -0.10233879089355469, -0.09900379180908203, -0.09566879272460938, -0.09233379364013672, -0.08899879455566406, -0.0856637954711914, -0.08232879638671875, -0.0789937973022461, -0.07565879821777344, -0.07232379913330078, -0.06898880004882812, -0.06565380096435547, -0.06231880187988281, -0.058983802795410156, -0.0556488037109375, -0.052313804626464844, -0.04897880554199219, -0.04564380645751953, -0.042308807373046875, -0.03897380828857422, -0.03563880920410156, -0.032303810119628906, -0.02896881103515625, -0.025633811950683594, -0.022298812866210938, -0.01896381378173828, -0.015628814697265625, -0.012293815612792969, -0.008958816528320312, -0.005623817443847656, -0.002288818359375, 0.0010461807250976562, 0.0043811798095703125, 0.007716178894042969, 0.011051177978515625, 0.014386177062988281, 0.017721176147460938, 0.021056175231933594, 0.02439117431640625, 0.027726173400878906, 0.031061172485351562, 0.03439617156982422, 0.037731170654296875, 0.04106616973876953, 0.04440116882324219, 0.047736167907714844, 0.0510711669921875, 0.054406166076660156, 0.05774116516113281, 0.06107616424560547, 0.06441116333007812, 0.06774616241455078, 0.07108116149902344, 0.0744161605834961, 0.07775115966796875, 0.0810861587524414, 0.08442115783691406, 0.08775615692138672, 0.09109115600585938, 0.09442615509033203, 0.09776115417480469, 0.10109615325927734, 0.10443115234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 11.0, 5.0, 13.0, 21.0, 17.0, 25.0, 40.0, 48.0, 97.0, 146.0, 199.0, 373.0, 705.0, 1532.0, 3224.0, 9062.0, 39620.0, 451851.0, 484211.0, 41631.0, 9288.0, 3253.0, 1441.0, 717.0, 367.0, 220.0, 132.0, 100.0, 49.0, 40.0, 32.0, 22.0, 13.0, 8.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.423095703125, -0.4110107421875, -0.39892578125, -0.3868408203125, -0.374755859375, -0.3626708984375, -0.3505859375, -0.3385009765625, -0.326416015625, -0.3143310546875, -0.30224609375, -0.2901611328125, -0.278076171875, -0.2659912109375, -0.25390625, -0.2418212890625, -0.229736328125, -0.2176513671875, -0.20556640625, -0.1934814453125, -0.181396484375, -0.1693115234375, -0.1572265625, -0.1451416015625, -0.133056640625, -0.1209716796875, -0.10888671875, -0.0968017578125, -0.084716796875, -0.0726318359375, -0.060546875, -0.0484619140625, -0.036376953125, -0.0242919921875, -0.01220703125, -0.0001220703125, 0.011962890625, 0.0240478515625, 0.0361328125, 0.0482177734375, 0.060302734375, 0.0723876953125, 0.08447265625, 0.0965576171875, 0.108642578125, 0.1207275390625, 0.1328125, 0.1448974609375, 0.156982421875, 0.1690673828125, 0.18115234375, 0.1932373046875, 0.205322265625, 0.2174072265625, 0.2294921875, 0.2415771484375, 0.253662109375, 0.2657470703125, 0.27783203125, 0.2899169921875, 0.302001953125, 0.3140869140625, 0.326171875, 0.3382568359375, 0.350341796875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 1.0, 9.0, 15.0, 6.0, 17.0, 16.0, 24.0, 22.0, 41.0, 36.0, 44.0, 80.0, 55.0, 56.0, 61.0, 67.0, 63.0, 65.0, 54.0, 46.0, 40.0, 35.0, 32.0, 26.0, 14.0, 18.0, 12.0, 7.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.384521484375, -0.372802734375, -0.361083984375, -0.349365234375, -0.337646484375, -0.325927734375, -0.314208984375, -0.302490234375, -0.290771484375, -0.279052734375, -0.267333984375, -0.255615234375, -0.243896484375, -0.232177734375, -0.220458984375, -0.208740234375, -0.197021484375, -0.185302734375, -0.173583984375, -0.161865234375, -0.150146484375, -0.138427734375, -0.126708984375, -0.114990234375, -0.103271484375, -0.091552734375, -0.079833984375, -0.068115234375, -0.056396484375, -0.044677734375, -0.032958984375, -0.021240234375, -0.009521484375, 0.002197265625, 0.013916015625, 0.025634765625, 0.037353515625, 0.049072265625, 0.060791015625, 0.072509765625, 0.084228515625, 0.095947265625, 0.107666015625, 0.119384765625, 0.131103515625, 0.142822265625, 0.154541015625, 0.166259765625, 0.177978515625, 0.189697265625, 0.201416015625, 0.213134765625, 0.224853515625, 0.236572265625, 0.248291015625, 0.260009765625, 0.271728515625, 0.283447265625, 0.295166015625, 0.306884765625, 0.318603515625, 0.330322265625, 0.342041015625, 0.353759765625, 0.365478515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 3.0, 10.0, 11.0, 13.0, 22.0, 29.0, 52.0, 53.0, 84.0, 135.0, 211.0, 337.0, 673.0, 1321.0, 3301.0, 13476.0, 752050.0, 261560.0, 9687.0, 2841.0, 1217.0, 585.0, 306.0, 178.0, 129.0, 78.0, 44.0, 49.0, 38.0, 21.0, 15.0, 15.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.441650390625, -0.42862701416015625, -0.4156036376953125, -0.40258026123046875, -0.389556884765625, -0.37653350830078125, -0.3635101318359375, -0.35048675537109375, -0.33746337890625, -0.32444000244140625, -0.3114166259765625, -0.29839324951171875, -0.285369873046875, -0.27234649658203125, -0.2593231201171875, -0.24629974365234375, -0.2332763671875, -0.22025299072265625, -0.2072296142578125, -0.19420623779296875, -0.181182861328125, -0.16815948486328125, -0.1551361083984375, -0.14211273193359375, -0.12908935546875, -0.11606597900390625, -0.1030426025390625, -0.09001922607421875, -0.076995849609375, -0.06397247314453125, -0.0509490966796875, -0.03792572021484375, -0.02490234375, -0.01187896728515625, 0.0011444091796875, 0.01416778564453125, 0.027191162109375, 0.04021453857421875, 0.0532379150390625, 0.06626129150390625, 0.07928466796875, 0.09230804443359375, 0.1053314208984375, 0.11835479736328125, 0.131378173828125, 0.14440155029296875, 0.1574249267578125, 0.17044830322265625, 0.1834716796875, 0.19649505615234375, 0.2095184326171875, 0.22254180908203125, 0.235565185546875, 0.24858856201171875, 0.2616119384765625, 0.27463531494140625, 0.28765869140625, 0.30068206787109375, 0.3137054443359375, 0.32672882080078125, 0.339752197265625, 0.35277557373046875, 0.3657989501953125, 0.37882232666015625, 0.391845703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 5.0, 10.0, 16.0, 17.0, 36.0, 48.0, 55.0, 70.0, 131.0, 137.0, 125.0, 101.0, 64.0, 42.0, 39.0, 30.0, 19.0, 18.0, 6.0, 5.0, 6.0, 9.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015151500701904297, -0.00014660321176052094, -0.0001416914165019989, -0.00013677962124347687, -0.00013186782598495483, -0.0001269560307264328, -0.00012204423546791077, -0.00011713244020938873, -0.0001122206449508667, -0.00010730884969234467, -0.00010239705443382263, -9.74852591753006e-05, -9.257346391677856e-05, -8.766166865825653e-05, -8.27498733997345e-05, -7.783807814121246e-05, -7.292628288269043e-05, -6.80144876241684e-05, -6.310269236564636e-05, -5.819089710712433e-05, -5.3279101848602295e-05, -4.836730659008026e-05, -4.345551133155823e-05, -3.8543716073036194e-05, -3.363192081451416e-05, -2.8720125555992126e-05, -2.3808330297470093e-05, -1.889653503894806e-05, -1.3984739780426025e-05, -9.072944521903992e-06, -4.161149263381958e-06, 7.506459951400757e-07, 5.662441253662109e-06, 1.0574236512184143e-05, 1.5486031770706177e-05, 2.039782702922821e-05, 2.5309622287750244e-05, 3.0221417546272278e-05, 3.513321280479431e-05, 4.0045008063316345e-05, 4.495680332183838e-05, 4.986859858036041e-05, 5.4780393838882446e-05, 5.969218909740448e-05, 6.460398435592651e-05, 6.951577961444855e-05, 7.442757487297058e-05, 7.933937013149261e-05, 8.425116539001465e-05, 8.916296064853668e-05, 9.407475590705872e-05, 9.898655116558075e-05, 0.00010389834642410278, 0.00010881014168262482, 0.00011372193694114685, 0.00011863373219966888, 0.00012354552745819092, 0.00012845732271671295, 0.00013336911797523499, 0.00013828091323375702, 0.00014319270849227905, 0.00014810450375080109, 0.00015301629900932312, 0.00015792809426784515, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 11.0, 22.0, 23.0, 73.0, 154.0, 411.0, 1543.0, 22925.0, 1011717.0, 9942.0, 1105.0, 352.0, 137.0, 64.0, 25.0, 11.0, 6.0, 4.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7578125, -0.7344207763671875, -0.711029052734375, -0.6876373291015625, -0.66424560546875, -0.6408538818359375, -0.617462158203125, -0.5940704345703125, -0.5706787109375, -0.5472869873046875, -0.523895263671875, -0.5005035400390625, -0.47711181640625, -0.4537200927734375, -0.430328369140625, -0.4069366455078125, -0.383544921875, -0.3601531982421875, -0.336761474609375, -0.3133697509765625, -0.28997802734375, -0.2665863037109375, -0.243194580078125, -0.2198028564453125, -0.1964111328125, -0.1730194091796875, -0.149627685546875, -0.1262359619140625, -0.10284423828125, -0.0794525146484375, -0.056060791015625, -0.0326690673828125, -0.00927734375, 0.0141143798828125, 0.037506103515625, 0.0608978271484375, 0.08428955078125, 0.1076812744140625, 0.131072998046875, 0.1544647216796875, 0.1778564453125, 0.2012481689453125, 0.224639892578125, 0.2480316162109375, 0.27142333984375, 0.2948150634765625, 0.318206787109375, 0.3415985107421875, 0.364990234375, 0.3883819580078125, 0.411773681640625, 0.4351654052734375, 0.45855712890625, 0.4819488525390625, 0.505340576171875, 0.5287322998046875, 0.5521240234375, 0.5755157470703125, 0.598907470703125, 0.6222991943359375, 0.64569091796875, 0.6690826416015625, 0.692474365234375, 0.7158660888671875, 0.7392578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 10.0, 10.0, 15.0, 46.0, 141.0, 512.0, 169.0, 45.0, 23.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5220947265625, -0.495361328125, -0.4686279296875, -0.44189453125, -0.4151611328125, -0.388427734375, -0.3616943359375, -0.3349609375, -0.3082275390625, -0.281494140625, -0.2547607421875, -0.22802734375, -0.2012939453125, -0.174560546875, -0.1478271484375, -0.12109375, -0.0943603515625, -0.067626953125, -0.0408935546875, -0.01416015625, 0.0125732421875, 0.039306640625, 0.0660400390625, 0.0927734375, 0.1195068359375, 0.146240234375, 0.1729736328125, 0.19970703125, 0.2264404296875, 0.253173828125, 0.2799072265625, 0.306640625, 0.3333740234375, 0.360107421875, 0.3868408203125, 0.41357421875, 0.4403076171875, 0.467041015625, 0.4937744140625, 0.5205078125, 0.5472412109375, 0.573974609375, 0.6007080078125, 0.62744140625, 0.6541748046875, 0.680908203125, 0.7076416015625, 0.734375, 0.7611083984375, 0.787841796875, 0.8145751953125, 0.84130859375, 0.8680419921875, 0.894775390625, 0.9215087890625, 0.9482421875, 0.9749755859375, 1.001708984375, 1.0284423828125, 1.05517578125, 1.0819091796875, 1.108642578125, 1.1353759765625, 1.162109375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 9.0, 17.0, 29.0, 59.0, 118.0, 194.0, 235.0, 176.0, 83.0, 36.0, 15.0, 8.0, 9.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.157985687255859, -4.037571430206299, -3.917156934738159, -3.7967426776885986, -3.676328182220459, -3.5559139251708984, -3.435499429702759, -3.3150851726531982, -3.1946706771850586, -3.074256420135498, -2.9538419246673584, -2.833427667617798, -2.713013172149658, -2.5925989151000977, -2.472184419631958, -2.3517701625823975, -2.231355667114258, -2.1109414100646973, -1.9905269145965576, -1.8701125383377075, -1.7496981620788574, -1.6292839050292969, -1.5088694095611572, -1.3884551525115967, -1.2680408954620361, -1.147626519203186, -1.027212142944336, -0.9067977666854858, -0.7863833904266357, -0.6659690737724304, -0.5455546975135803, -0.4251403212547302, -0.30472588539123535, -0.18431150913238525, -0.06389714777469635, 0.056517213582992554, 0.17693158984184265, 0.29734593629837036, 0.41776031255722046, 0.5381746888160706, 0.6585890650749207, 0.7790034413337708, 0.8994178175926208, 1.0198321342468262, 1.1402465105056763, 1.2606608867645264, 1.3810752630233765, 1.5014896392822266, 1.6219040155410767, 1.7423183917999268, 1.8627327680587769, 1.983147144317627, 2.1035614013671875, 2.223975896835327, 2.3443901538848877, 2.4648046493530273, 2.585218906402588, 2.7056331634521484, 2.826047658920288, 2.9464619159698486, 3.0668764114379883, 3.187290668487549, 3.3077051639556885, 3.428119421005249, 3.5485339164733887]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 6.0, 9.0, 6.0, 4.0, 8.0, 13.0, 17.0, 20.0, 18.0, 28.0, 34.0, 45.0, 45.0, 41.0, 59.0, 45.0, 53.0, 53.0, 53.0, 44.0, 48.0, 41.0, 54.0, 43.0, 32.0, 27.0, 34.0, 24.0, 23.0, 20.0, 18.0, 13.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.561328887939453, -2.4870734214782715, -2.41281795501709, -2.338562488555908, -2.2643070220947266, -2.190051555633545, -2.1157960891723633, -2.0415403842926025, -1.967284917831421, -1.8930294513702393, -1.8187739849090576, -1.744518518447876, -1.6702629327774048, -1.5960074663162231, -1.5217519998550415, -1.4474964141845703, -1.3732410669326782, -1.2989856004714966, -1.224730134010315, -1.1504745483398438, -1.076219081878662, -1.0019636154174805, -0.9277081489562988, -0.8534526228904724, -0.7791971564292908, -0.7049416899681091, -0.6306861639022827, -0.5564306974411011, -0.48217520117759705, -0.407919704914093, -0.3336642384529114, -0.25940871238708496, -0.18515324592590332, -0.11089775711297989, -0.03664226830005646, 0.03761321306228638, 0.1118687093257904, 0.18612420558929443, 0.2603796720504761, 0.3346351981163025, 0.40889066457748413, 0.48314616084098816, 0.5574016571044922, 0.6316571235656738, 0.7059125900268555, 0.7801681160926819, 0.8544235825538635, 0.9286791086196899, 1.0029345750808716, 1.0771900415420532, 1.1514455080032349, 1.225701093673706, 1.2999565601348877, 1.3742120265960693, 1.448467493057251, 1.5227229595184326, 1.5969784259796143, 1.671233892440796, 1.7454893589019775, 1.8197448253631592, 1.8940004110336304, 1.968255877494812, 2.042511463165283, 2.116766929626465, 2.1910223960876465]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 13.0, 11.0, 22.0, 17.0, 38.0, 58.0, 104.0, 185.0, 234.0, 486.0, 909.0, 1835.0, 4201.0, 11720.0, 50951.0, 2982629.0, 1078251.0, 43814.0, 10908.0, 4004.0, 1767.0, 919.0, 490.0, 280.0, 170.0, 85.0, 53.0, 37.0, 24.0, 19.0, 8.0, 7.0, 11.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.2596549987792969, -0.25002288818359375, -0.24039077758789062, -0.2307586669921875, -0.22112655639648438, -0.21149444580078125, -0.20186233520507812, -0.192230224609375, -0.18259811401367188, -0.17296600341796875, -0.16333389282226562, -0.1537017822265625, -0.14406967163085938, -0.13443756103515625, -0.12480545043945312, -0.11517333984375, -0.10554122924804688, -0.09590911865234375, -0.08627700805664062, -0.0766448974609375, -0.06701278686523438, -0.05738067626953125, -0.047748565673828125, -0.038116455078125, -0.028484344482421875, -0.01885223388671875, -0.009220123291015625, 0.0004119873046875, 0.010044097900390625, 0.01967620849609375, 0.029308319091796875, 0.0389404296875, 0.048572540283203125, 0.05820465087890625, 0.06783676147460938, 0.0774688720703125, 0.08710098266601562, 0.09673309326171875, 0.10636520385742188, 0.115997314453125, 0.12562942504882812, 0.13526153564453125, 0.14489364624023438, 0.1545257568359375, 0.16415786743164062, 0.17378997802734375, 0.18342208862304688, 0.19305419921875, 0.20268630981445312, 0.21231842041015625, 0.22195053100585938, 0.2315826416015625, 0.24121475219726562, 0.25084686279296875, 0.2604789733886719, 0.270111083984375, 0.2797431945800781, 0.28937530517578125, 0.2990074157714844, 0.3086395263671875, 0.3182716369628906, 0.32790374755859375, 0.3375358581542969, 0.34716796875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 15.0, 7.0, 11.0, 16.0, 20.0, 30.0, 42.0, 50.0, 67.0, 72.0, 72.0, 79.0, 84.0, 74.0, 87.0, 53.0, 49.0, 40.0, 30.0, 26.0, 27.0, 18.0, 13.0, 10.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10955810546875, -0.10634708404541016, -0.10313606262207031, -0.09992504119873047, -0.09671401977539062, -0.09350299835205078, -0.09029197692871094, -0.0870809555053711, -0.08386993408203125, -0.0806589126586914, -0.07744789123535156, -0.07423686981201172, -0.07102584838867188, -0.06781482696533203, -0.06460380554199219, -0.061392784118652344, -0.0581817626953125, -0.054970741271972656, -0.05175971984863281, -0.04854869842529297, -0.045337677001953125, -0.04212665557861328, -0.03891563415527344, -0.035704612731933594, -0.03249359130859375, -0.029282569885253906, -0.026071548461914062, -0.02286052703857422, -0.019649505615234375, -0.01643848419189453, -0.013227462768554688, -0.010016441345214844, -0.006805419921875, -0.0035943984985351562, -0.0003833770751953125, 0.0028276443481445312, 0.006038665771484375, 0.009249687194824219, 0.012460708618164062, 0.015671730041503906, 0.01888275146484375, 0.022093772888183594, 0.025304794311523438, 0.02851581573486328, 0.031726837158203125, 0.03493785858154297, 0.03814888000488281, 0.041359901428222656, 0.0445709228515625, 0.047781944274902344, 0.05099296569824219, 0.05420398712158203, 0.057415008544921875, 0.06062602996826172, 0.06383705139160156, 0.0670480728149414, 0.07025909423828125, 0.0734701156616211, 0.07668113708496094, 0.07989215850830078, 0.08310317993164062, 0.08631420135498047, 0.08952522277832031, 0.09273624420166016, 0.095947265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 10.0, 7.0, 22.0, 25.0, 27.0, 68.0, 107.0, 172.0, 297.0, 460.0, 884.0, 1654.0, 3581.0, 11512.0, 94162.0, 3877589.0, 179242.0, 15842.0, 4316.0, 1891.0, 1049.0, 549.0, 319.0, 165.0, 101.0, 73.0, 33.0, 47.0, 18.0, 10.0, 15.0, 9.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.476318359375, -0.4625511169433594, -0.44878387451171875, -0.4350166320800781, -0.4212493896484375, -0.4074821472167969, -0.39371490478515625, -0.3799476623535156, -0.366180419921875, -0.3524131774902344, -0.33864593505859375, -0.3248786926269531, -0.3111114501953125, -0.2973442077636719, -0.28357696533203125, -0.2698097229003906, -0.25604248046875, -0.24227523803710938, -0.22850799560546875, -0.21474075317382812, -0.2009735107421875, -0.18720626831054688, -0.17343902587890625, -0.15967178344726562, -0.145904541015625, -0.13213729858398438, -0.11837005615234375, -0.10460281372070312, -0.0908355712890625, -0.07706832885742188, -0.06330108642578125, -0.049533843994140625, -0.0357666015625, -0.021999359130859375, -0.00823211669921875, 0.005535125732421875, 0.0193023681640625, 0.033069610595703125, 0.04683685302734375, 0.060604095458984375, 0.074371337890625, 0.08813858032226562, 0.10190582275390625, 0.11567306518554688, 0.1294403076171875, 0.14320755004882812, 0.15697479248046875, 0.17074203491210938, 0.18450927734375, 0.19827651977539062, 0.21204376220703125, 0.22581100463867188, 0.2395782470703125, 0.2533454895019531, 0.26711273193359375, 0.2808799743652344, 0.294647216796875, 0.3084144592285156, 0.32218170166015625, 0.3359489440917969, 0.3497161865234375, 0.3634834289550781, 0.37725067138671875, 0.3910179138183594, 0.40478515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 15.0, 14.0, 42.0, 130.0, 510.0, 2775.0, 397.0, 108.0, 24.0, 18.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.431640625, -0.42170143127441406, -0.4117622375488281, -0.4018230438232422, -0.39188385009765625, -0.3819446563720703, -0.3720054626464844, -0.36206626892089844, -0.3521270751953125, -0.34218788146972656, -0.3322486877441406, -0.3223094940185547, -0.31237030029296875, -0.3024311065673828, -0.2924919128417969, -0.28255271911621094, -0.272613525390625, -0.26267433166503906, -0.2527351379394531, -0.2427959442138672, -0.23285675048828125, -0.2229175567626953, -0.21297836303710938, -0.20303916931152344, -0.1930999755859375, -0.18316078186035156, -0.17322158813476562, -0.1632823944091797, -0.15334320068359375, -0.1434040069580078, -0.13346481323242188, -0.12352561950683594, -0.11358642578125, -0.10364723205566406, -0.09370803833007812, -0.08376884460449219, -0.07382965087890625, -0.06389045715332031, -0.053951263427734375, -0.04401206970214844, -0.0340728759765625, -0.024133682250976562, -0.014194488525390625, -0.0042552947998046875, 0.00568389892578125, 0.015623092651367188, 0.025562286376953125, 0.03550148010253906, 0.045440673828125, 0.05537986755371094, 0.06531906127929688, 0.07525825500488281, 0.08519744873046875, 0.09513664245605469, 0.10507583618164062, 0.11501502990722656, 0.1249542236328125, 0.13489341735839844, 0.14483261108398438, 0.1547718048095703, 0.16471099853515625, 0.1746501922607422, 0.18458938598632812, 0.19452857971191406, 0.2044677734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 16.0, 100.0, 348.0, 442.0, 79.0, 14.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.101809024810791, -4.994061470031738, -4.8863139152526855, -4.778566360473633, -4.670818328857422, -4.563070774078369, -4.455323219299316, -4.347575664520264, -4.239828109741211, -4.132080554962158, -4.0243330001831055, -3.9165852069854736, -3.808837652206421, -3.701089859008789, -3.5933423042297363, -3.4855947494506836, -3.3778469562530518, -3.270099401473999, -3.162351608276367, -3.0546040534973145, -2.9468564987182617, -2.839108943939209, -2.731361150741577, -2.6236135959625244, -2.5158658027648926, -2.40811824798584, -2.300370454788208, -2.1926229000091553, -2.0848753452301025, -1.9771276712417603, -1.869379997253418, -1.7616324424743652, -1.6538846492767334, -1.5461369752883911, -1.4383894205093384, -1.330641746520996, -1.2228941917419434, -1.115146517753601, -1.0073988437652588, -0.8996512293815613, -0.7919036149978638, -0.6841560006141663, -0.5764083862304688, -0.46866071224212646, -0.36091309785842896, -0.25316548347473145, -0.14541780948638916, -0.03767019510269165, 0.07007741928100586, 0.17782504856586456, 0.28557267785072327, 0.39332032203674316, 0.5010679364204407, 0.6088155508041382, 0.7165632247924805, 0.824310839176178, 0.9320584535598755, 1.0398061275482178, 1.1475536823272705, 1.2553013563156128, 1.363049030303955, 1.4707965850830078, 1.57854425907135, 1.6862919330596924, 1.7940394878387451]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 10.0, 7.0, 11.0, 11.0, 13.0, 13.0, 18.0, 21.0, 18.0, 20.0, 28.0, 32.0, 44.0, 49.0, 45.0, 50.0, 43.0, 39.0, 46.0, 41.0, 46.0, 51.0, 43.0, 35.0, 27.0, 34.0, 31.0, 29.0, 23.0, 26.0, 13.0, 24.0, 12.0, 11.0, 5.0, 7.0, 8.0, 6.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0], "bins": [-0.8993347883224487, -0.8758382797241211, -0.8523417711257935, -0.8288452625274658, -0.8053486943244934, -0.7818521857261658, -0.7583556771278381, -0.7348591685295105, -0.7113626003265381, -0.6878660917282104, -0.6643695831298828, -0.6408730745315552, -0.6173765063285828, -0.5938799977302551, -0.5703834891319275, -0.5468869805335999, -0.5233904719352722, -0.4998939633369446, -0.47639742493629456, -0.4529009163379669, -0.4294043779373169, -0.40590786933898926, -0.3824113607406616, -0.358914852142334, -0.33541831374168396, -0.3119218051433563, -0.2884252667427063, -0.26492875814437866, -0.24143223464488983, -0.217935711145401, -0.19443920254707336, -0.17094267904758453, -0.14744609594345093, -0.1239495724439621, -0.10045305639505386, -0.07695654034614563, -0.0534600168466568, -0.02996349334716797, -0.006466984748840332, 0.0170295387506485, 0.04052606225013733, 0.06402258574962616, 0.0875191017985344, 0.11101561784744263, 0.13451214134693146, 0.1580086648464203, 0.18150517344474792, 0.20500169694423676, 0.22849822044372559, 0.2519947290420532, 0.27549126744270325, 0.2989877760410309, 0.3224843144416809, 0.34598082304000854, 0.3694773316383362, 0.3929738402366638, 0.41647037863731384, 0.4399668872356415, 0.4634634256362915, 0.48695993423461914, 0.5104564428329468, 0.5339529514312744, 0.557449460029602, 0.5809460282325745, 0.6044425368309021]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 12.0, 19.0, 36.0, 43.0, 90.0, 137.0, 247.0, 442.0, 954.0, 2180.0, 6229.0, 23835.0, 146770.0, 653325.0, 175509.0, 27232.0, 6954.0, 2392.0, 1017.0, 494.0, 266.0, 145.0, 74.0, 48.0, 27.0, 20.0, 12.0, 9.0, 10.0, 7.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37890625, -0.365631103515625, -0.35235595703125, -0.339080810546875, -0.3258056640625, -0.312530517578125, -0.29925537109375, -0.285980224609375, -0.272705078125, -0.259429931640625, -0.24615478515625, -0.232879638671875, -0.2196044921875, -0.206329345703125, -0.19305419921875, -0.179779052734375, -0.16650390625, -0.153228759765625, -0.13995361328125, -0.126678466796875, -0.1134033203125, -0.100128173828125, -0.08685302734375, -0.073577880859375, -0.060302734375, -0.047027587890625, -0.03375244140625, -0.020477294921875, -0.0072021484375, 0.006072998046875, 0.01934814453125, 0.032623291015625, 0.0458984375, 0.059173583984375, 0.07244873046875, 0.085723876953125, 0.0989990234375, 0.112274169921875, 0.12554931640625, 0.138824462890625, 0.152099609375, 0.165374755859375, 0.17864990234375, 0.191925048828125, 0.2052001953125, 0.218475341796875, 0.23175048828125, 0.245025634765625, 0.25830078125, 0.271575927734375, 0.28485107421875, 0.298126220703125, 0.3114013671875, 0.324676513671875, 0.33795166015625, 0.351226806640625, 0.364501953125, 0.377777099609375, 0.39105224609375, 0.404327392578125, 0.4176025390625, 0.430877685546875, 0.44415283203125, 0.457427978515625, 0.470703125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 7.0, 8.0, 10.0, 13.0, 11.0, 20.0, 32.0, 34.0, 40.0, 51.0, 47.0, 69.0, 78.0, 56.0, 77.0, 69.0, 59.0, 54.0, 53.0, 46.0, 43.0, 24.0, 25.0, 16.0, 21.0, 10.0, 8.0, 13.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11181640625, -0.10854911804199219, -0.10528182983398438, -0.10201454162597656, -0.09874725341796875, -0.09547996520996094, -0.09221267700195312, -0.08894538879394531, -0.0856781005859375, -0.08241081237792969, -0.07914352416992188, -0.07587623596191406, -0.07260894775390625, -0.06934165954589844, -0.06607437133789062, -0.06280708312988281, -0.059539794921875, -0.05627250671386719, -0.053005218505859375, -0.04973793029785156, -0.04647064208984375, -0.04320335388183594, -0.039936065673828125, -0.03666877746582031, -0.0334014892578125, -0.030134201049804688, -0.026866912841796875, -0.023599624633789062, -0.02033233642578125, -0.017065048217773438, -0.013797760009765625, -0.010530471801757812, -0.00726318359375, -0.0039958953857421875, -0.000728607177734375, 0.0025386810302734375, 0.00580596923828125, 0.009073257446289062, 0.012340545654296875, 0.015607833862304688, 0.0188751220703125, 0.022142410278320312, 0.025409698486328125, 0.028676986694335938, 0.03194427490234375, 0.03521156311035156, 0.038478851318359375, 0.04174613952636719, 0.045013427734375, 0.04828071594238281, 0.051548004150390625, 0.05481529235839844, 0.05808258056640625, 0.06134986877441406, 0.06461715698242188, 0.06788444519042969, 0.0711517333984375, 0.07441902160644531, 0.07768630981445312, 0.08095359802246094, 0.08422088623046875, 0.08748817443847656, 0.09075546264648438, 0.09402275085449219, 0.0972900390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 7.0, 6.0, 7.0, 12.0, 15.0, 22.0, 47.0, 70.0, 87.0, 159.0, 247.0, 421.0, 787.0, 1874.0, 4854.0, 17872.0, 117831.0, 752276.0, 124993.0, 18097.0, 4956.0, 1930.0, 883.0, 435.0, 233.0, 133.0, 82.0, 58.0, 44.0, 37.0, 21.0, 17.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 4.0, 2.0], "bins": [-0.66552734375, -0.6477851867675781, -0.6300430297851562, -0.6123008728027344, -0.5945587158203125, -0.5768165588378906, -0.5590744018554688, -0.5413322448730469, -0.523590087890625, -0.5058479309082031, -0.48810577392578125, -0.4703636169433594, -0.4526214599609375, -0.4348793029785156, -0.41713714599609375, -0.3993949890136719, -0.38165283203125, -0.3639106750488281, -0.34616851806640625, -0.3284263610839844, -0.3106842041015625, -0.2929420471191406, -0.27519989013671875, -0.2574577331542969, -0.239715576171875, -0.22197341918945312, -0.20423126220703125, -0.18648910522460938, -0.1687469482421875, -0.15100479125976562, -0.13326263427734375, -0.11552047729492188, -0.0977783203125, -0.08003616333007812, -0.06229400634765625, -0.044551849365234375, -0.0268096923828125, -0.009067535400390625, 0.00867462158203125, 0.026416778564453125, 0.044158935546875, 0.061901092529296875, 0.07964324951171875, 0.09738540649414062, 0.1151275634765625, 0.13286972045898438, 0.15061187744140625, 0.16835403442382812, 0.18609619140625, 0.20383834838867188, 0.22158050537109375, 0.23932266235351562, 0.2570648193359375, 0.2748069763183594, 0.29254913330078125, 0.3102912902832031, 0.328033447265625, 0.3457756042480469, 0.36351776123046875, 0.3812599182128906, 0.3990020751953125, 0.4167442321777344, 0.43448638916015625, 0.4522285461425781, 0.469970703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 10.0, 13.0, 16.0, 18.0, 29.0, 32.0, 44.0, 53.0, 47.0, 41.0, 53.0, 63.0, 55.0, 72.0, 46.0, 41.0, 56.0, 60.0, 43.0, 33.0, 36.0, 29.0, 26.0, 11.0, 7.0, 7.0, 7.0, 10.0, 10.0, 8.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6171875, -0.5978469848632812, -0.5785064697265625, -0.5591659545898438, -0.539825439453125, -0.5204849243164062, -0.5011444091796875, -0.48180389404296875, -0.46246337890625, -0.44312286376953125, -0.4237823486328125, -0.40444183349609375, -0.385101318359375, -0.36576080322265625, -0.3464202880859375, -0.32707977294921875, -0.3077392578125, -0.28839874267578125, -0.2690582275390625, -0.24971771240234375, -0.230377197265625, -0.21103668212890625, -0.1916961669921875, -0.17235565185546875, -0.15301513671875, -0.13367462158203125, -0.1143341064453125, -0.09499359130859375, -0.075653076171875, -0.05631256103515625, -0.0369720458984375, -0.01763153076171875, 0.001708984375, 0.02104949951171875, 0.0403900146484375, 0.05973052978515625, 0.079071044921875, 0.09841156005859375, 0.1177520751953125, 0.13709259033203125, 0.15643310546875, 0.17577362060546875, 0.1951141357421875, 0.21445465087890625, 0.233795166015625, 0.25313568115234375, 0.2724761962890625, 0.29181671142578125, 0.3111572265625, 0.33049774169921875, 0.3498382568359375, 0.36917877197265625, 0.388519287109375, 0.40785980224609375, 0.4272003173828125, 0.44654083251953125, 0.46588134765625, 0.48522186279296875, 0.5045623779296875, 0.5239028930664062, 0.543243408203125, 0.5625839233398438, 0.5819244384765625, 0.6012649536132812, 0.62060546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 13.0, 13.0, 26.0, 33.0, 58.0, 117.0, 150.0, 313.0, 667.0, 1720.0, 6164.0, 49868.0, 813363.0, 159395.0, 12210.0, 2583.0, 888.0, 441.0, 205.0, 121.0, 65.0, 36.0, 48.0, 11.0, 13.0, 9.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.384765625, -0.37334442138671875, -0.3619232177734375, -0.35050201416015625, -0.339080810546875, -0.32765960693359375, -0.3162384033203125, -0.30481719970703125, -0.29339599609375, -0.28197479248046875, -0.2705535888671875, -0.25913238525390625, -0.247711181640625, -0.23628997802734375, -0.2248687744140625, -0.21344757080078125, -0.2020263671875, -0.19060516357421875, -0.1791839599609375, -0.16776275634765625, -0.156341552734375, -0.14492034912109375, -0.1334991455078125, -0.12207794189453125, -0.11065673828125, -0.09923553466796875, -0.0878143310546875, -0.07639312744140625, -0.064971923828125, -0.05355072021484375, -0.0421295166015625, -0.03070831298828125, -0.019287109375, -0.00786590576171875, 0.0035552978515625, 0.01497650146484375, 0.026397705078125, 0.03781890869140625, 0.0492401123046875, 0.06066131591796875, 0.07208251953125, 0.08350372314453125, 0.0949249267578125, 0.10634613037109375, 0.117767333984375, 0.12918853759765625, 0.1406097412109375, 0.15203094482421875, 0.1634521484375, 0.17487335205078125, 0.1862945556640625, 0.19771575927734375, 0.209136962890625, 0.22055816650390625, 0.2319793701171875, 0.24340057373046875, 0.25482177734375, 0.26624298095703125, 0.2776641845703125, 0.28908538818359375, 0.300506591796875, 0.31192779541015625, 0.3233489990234375, 0.33477020263671875, 0.34619140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 12.0, 19.0, 28.0, 24.0, 45.0, 59.0, 72.0, 87.0, 115.0, 92.0, 88.0, 88.0, 59.0, 56.0, 33.0, 28.0, 20.0, 15.0, 13.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.952617645263672e-05, -8.549727499485016e-05, -8.14683735370636e-05, -7.743947207927704e-05, -7.341057062149048e-05, -6.938166916370392e-05, -6.535276770591736e-05, -6.13238662481308e-05, -5.729496479034424e-05, -5.326606333255768e-05, -4.923716187477112e-05, -4.520826041698456e-05, -4.1179358959198e-05, -3.715045750141144e-05, -3.312155604362488e-05, -2.9092654585838318e-05, -2.5063753128051758e-05, -2.1034851670265198e-05, -1.7005950212478638e-05, -1.2977048754692078e-05, -8.948147296905518e-06, -4.9192458391189575e-06, -8.903443813323975e-07, 3.1385570764541626e-06, 7.167458534240723e-06, 1.1196359992027283e-05, 1.5225261449813843e-05, 1.9254162907600403e-05, 2.3283064365386963e-05, 2.7311965823173523e-05, 3.134086728096008e-05, 3.536976873874664e-05, 3.93986701965332e-05, 4.342757165431976e-05, 4.745647311210632e-05, 5.148537456989288e-05, 5.551427602767944e-05, 5.9543177485466003e-05, 6.357207894325256e-05, 6.760098040103912e-05, 7.162988185882568e-05, 7.565878331661224e-05, 7.96876847743988e-05, 8.371658623218536e-05, 8.774548768997192e-05, 9.177438914775848e-05, 9.580329060554504e-05, 9.98321920633316e-05, 0.00010386109352111816, 0.00010788999497890472, 0.00011191889643669128, 0.00011594779789447784, 0.0001199766993522644, 0.00012400560081005096, 0.00012803450226783752, 0.00013206340372562408, 0.00013609230518341064, 0.0001401212066411972, 0.00014415010809898376, 0.00014817900955677032, 0.00015220791101455688, 0.00015623681247234344, 0.00016026571393013, 0.00016429461538791656, 0.00016832351684570312]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 9.0, 11.0, 15.0, 23.0, 46.0, 81.0, 143.0, 262.0, 415.0, 872.0, 2362.0, 10599.0, 100646.0, 821192.0, 97352.0, 10352.0, 2293.0, 860.0, 414.0, 218.0, 156.0, 89.0, 52.0, 33.0, 13.0, 13.0, 5.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31103515625, -0.3011589050292969, -0.29128265380859375, -0.2814064025878906, -0.2715301513671875, -0.2616539001464844, -0.25177764892578125, -0.24190139770507812, -0.232025146484375, -0.22214889526367188, -0.21227264404296875, -0.20239639282226562, -0.1925201416015625, -0.18264389038085938, -0.17276763916015625, -0.16289138793945312, -0.15301513671875, -0.14313888549804688, -0.13326263427734375, -0.12338638305664062, -0.1135101318359375, -0.10363388061523438, -0.09375762939453125, -0.08388137817382812, -0.074005126953125, -0.06412887573242188, -0.05425262451171875, -0.044376373291015625, -0.0345001220703125, -0.024623870849609375, -0.01474761962890625, -0.004871368408203125, 0.0050048828125, 0.014881134033203125, 0.02475738525390625, 0.034633636474609375, 0.0445098876953125, 0.054386138916015625, 0.06426239013671875, 0.07413864135742188, 0.084014892578125, 0.09389114379882812, 0.10376739501953125, 0.11364364624023438, 0.1235198974609375, 0.13339614868164062, 0.14327239990234375, 0.15314865112304688, 0.16302490234375, 0.17290115356445312, 0.18277740478515625, 0.19265365600585938, 0.2025299072265625, 0.21240615844726562, 0.22228240966796875, 0.23215866088867188, 0.242034912109375, 0.2519111633300781, 0.26178741455078125, 0.2716636657714844, 0.2815399169921875, 0.2914161682128906, 0.30129241943359375, 0.3111686706542969, 0.321044921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 9.0, 6.0, 12.0, 22.0, 25.0, 34.0, 56.0, 87.0, 146.0, 206.0, 147.0, 88.0, 51.0, 45.0, 21.0, 14.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4208984375, -0.4070167541503906, -0.39313507080078125, -0.3792533874511719, -0.3653717041015625, -0.3514900207519531, -0.33760833740234375, -0.3237266540527344, -0.309844970703125, -0.2959632873535156, -0.28208160400390625, -0.2681999206542969, -0.2543182373046875, -0.24043655395507812, -0.22655487060546875, -0.21267318725585938, -0.19879150390625, -0.18490982055664062, -0.17102813720703125, -0.15714645385742188, -0.1432647705078125, -0.12938308715820312, -0.11550140380859375, -0.10161972045898438, -0.087738037109375, -0.07385635375976562, -0.05997467041015625, -0.046092987060546875, -0.0322113037109375, -0.018329620361328125, -0.00444793701171875, 0.009433746337890625, 0.0233154296875, 0.037197113037109375, 0.05107879638671875, 0.06496047973632812, 0.0788421630859375, 0.09272384643554688, 0.10660552978515625, 0.12048721313476562, 0.134368896484375, 0.14825057983398438, 0.16213226318359375, 0.17601394653320312, 0.1898956298828125, 0.20377731323242188, 0.21765899658203125, 0.23154067993164062, 0.24542236328125, 0.2593040466308594, 0.27318572998046875, 0.2870674133300781, 0.3009490966796875, 0.3148307800292969, 0.32871246337890625, 0.3425941467285156, 0.356475830078125, 0.3703575134277344, 0.38423919677734375, 0.3981208801269531, 0.4120025634765625, 0.4258842468261719, 0.43976593017578125, 0.4536476135253906, 0.467529296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 29.0, 114.0, 413.0, 360.0, 66.0, 14.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-18.472187042236328, -18.136234283447266, -17.800283432006836, -17.464330673217773, -17.128379821777344, -16.79242706298828, -16.45647621154785, -16.12052345275879, -15.784571647644043, -15.448619842529297, -15.11266803741455, -14.776716232299805, -14.440764427185059, -14.104812622070312, -13.76885986328125, -13.432908058166504, -13.096956253051758, -12.761004447937012, -12.425052642822266, -12.08910083770752, -11.753149032592773, -11.417196273803711, -11.081245422363281, -10.745292663574219, -10.409341812133789, -10.073390007019043, -9.737438201904297, -9.40148639678955, -9.065534591674805, -8.729581832885742, -8.393630981445312, -8.05767822265625, -7.721726417541504, -7.385774612426758, -7.049822807312012, -6.713871002197266, -6.377918720245361, -6.041966915130615, -5.706015110015869, -5.370062828063965, -5.034111022949219, -4.698159217834473, -4.362207412719727, -4.0262556076049805, -3.690303325653076, -3.35435152053833, -3.018399715423584, -2.682447671890259, -2.346496105194092, -2.0105443000793457, -1.6745922565460205, -1.3386404514312744, -1.0026885271072388, -0.6667366027832031, -0.33078479766845703, 0.005167245864868164, 0.34111905097961426, 0.6770709753036499, 1.0130228996276855, 1.3489747047424316, 1.6849266290664673, 2.020878553390503, 2.356830358505249, 2.692782402038574, 3.0287342071533203]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 3.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 32.0, 20.0, 30.0, 23.0, 28.0, 32.0, 51.0, 41.0, 30.0, 47.0, 60.0, 41.0, 41.0, 42.0, 47.0, 41.0, 35.0, 57.0, 43.0, 31.0, 29.0, 28.0, 15.0, 30.0, 14.0, 12.0, 13.0, 7.0, 10.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1834774017333984, -3.0944883823394775, -3.0054993629455566, -2.916510581970215, -2.827521562576294, -2.738532543182373, -2.649543523788452, -2.5605545043945312, -2.4715657234191895, -2.3825767040252686, -2.2935876846313477, -2.204598903656006, -2.115609884262085, -2.026620864868164, -1.9376318454742432, -1.8486428260803223, -1.7596538066864014, -1.6706647872924805, -1.5816758871078491, -1.4926868677139282, -1.4036979675292969, -1.314708948135376, -1.225719928741455, -1.1367309093475342, -1.0477420091629028, -0.9587530493736267, -0.8697640895843506, -0.7807750701904297, -0.6917861104011536, -0.6027971506118774, -0.5138081312179565, -0.4248191714286804, -0.3358302116394043, -0.24684123694896698, -0.15785226225852966, -0.06886327266693115, 0.02012568712234497, 0.1091146469116211, 0.198103666305542, 0.2870926260948181, 0.37608158588409424, 0.46507054567337036, 0.5540595054626465, 0.6430485248565674, 0.7320374846458435, 0.8210264444351196, 0.9100154638290405, 0.9990044236183167, 1.0879933834075928, 1.1769824028015137, 1.265971302986145, 1.354960322380066, 1.4439492225646973, 1.5329382419586182, 1.621927261352539, 1.71091628074646, 1.7999051809310913, 1.8888942003250122, 1.9778831005096436, 2.0668721199035645, 2.1558611392974854, 2.2448501586914062, 2.333838939666748, 2.422827959060669, 2.51181697845459]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 5.0, 8.0, 17.0, 18.0, 37.0, 60.0, 89.0, 143.0, 230.0, 358.0, 714.0, 1549.0, 4371.0, 21955.0, 3997562.0, 151801.0, 10216.0, 2729.0, 1069.0, 533.0, 300.0, 202.0, 106.0, 80.0, 47.0, 26.0, 18.0, 14.0, 11.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6250038146972656, -0.6088943481445312, -0.5927848815917969, -0.5766754150390625, -0.5605659484863281, -0.5444564819335938, -0.5283470153808594, -0.512237548828125, -0.4961280822753906, -0.48001861572265625, -0.4639091491699219, -0.4477996826171875, -0.4316902160644531, -0.41558074951171875, -0.3994712829589844, -0.38336181640625, -0.3672523498535156, -0.35114288330078125, -0.3350334167480469, -0.3189239501953125, -0.3028144836425781, -0.28670501708984375, -0.2705955505371094, -0.254486083984375, -0.23837661743164062, -0.22226715087890625, -0.20615768432617188, -0.1900482177734375, -0.17393875122070312, -0.15782928466796875, -0.14171981811523438, -0.1256103515625, -0.10950088500976562, -0.09339141845703125, -0.07728195190429688, -0.0611724853515625, -0.045063018798828125, -0.02895355224609375, -0.012844085693359375, 0.003265380859375, 0.019374847412109375, 0.03548431396484375, 0.051593780517578125, 0.0677032470703125, 0.08381271362304688, 0.09992218017578125, 0.11603164672851562, 0.13214111328125, 0.14825057983398438, 0.16436004638671875, 0.18046951293945312, 0.1965789794921875, 0.21268844604492188, 0.22879791259765625, 0.24490737915039062, 0.261016845703125, 0.2771263122558594, 0.29323577880859375, 0.3093452453613281, 0.3254547119140625, 0.3415641784667969, 0.35767364501953125, 0.3737831115722656, 0.389892578125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 10.0, 6.0, 15.0, 20.0, 22.0, 29.0, 25.0, 39.0, 65.0, 58.0, 79.0, 79.0, 72.0, 65.0, 63.0, 71.0, 54.0, 46.0, 45.0, 37.0, 28.0, 27.0, 16.0, 8.0, 8.0, 5.0, 10.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1572265625, -0.15317344665527344, -0.14912033081054688, -0.1450672149658203, -0.14101409912109375, -0.1369609832763672, -0.13290786743164062, -0.12885475158691406, -0.1248016357421875, -0.12074851989746094, -0.11669540405273438, -0.11264228820800781, -0.10858917236328125, -0.10453605651855469, -0.10048294067382812, -0.09642982482910156, -0.092376708984375, -0.08832359313964844, -0.08427047729492188, -0.08021736145019531, -0.07616424560546875, -0.07211112976074219, -0.06805801391601562, -0.06400489807128906, -0.0599517822265625, -0.05589866638183594, -0.051845550537109375, -0.04779243469238281, -0.04373931884765625, -0.03968620300292969, -0.035633087158203125, -0.03157997131347656, -0.02752685546875, -0.023473739624023438, -0.019420623779296875, -0.015367507934570312, -0.01131439208984375, -0.0072612762451171875, -0.003208160400390625, 0.0008449554443359375, 0.0048980712890625, 0.008951187133789062, 0.013004302978515625, 0.017057418823242188, 0.02111053466796875, 0.025163650512695312, 0.029216766357421875, 0.03326988220214844, 0.037322998046875, 0.04137611389160156, 0.045429229736328125, 0.04948234558105469, 0.05353546142578125, 0.05758857727050781, 0.061641693115234375, 0.06569480895996094, 0.0697479248046875, 0.07380104064941406, 0.07785415649414062, 0.08190727233886719, 0.08596038818359375, 0.09001350402832031, 0.09406661987304688, 0.09811973571777344, 0.1021728515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 8.0, 12.0, 12.0, 28.0, 35.0, 24.0, 54.0, 66.0, 107.0, 148.0, 180.0, 249.0, 359.0, 508.0, 764.0, 1123.0, 2091.0, 4964.0, 15430.0, 110436.0, 3958032.0, 76783.0, 13005.0, 4427.0, 1967.0, 1111.0, 700.0, 458.0, 309.0, 216.0, 170.0, 149.0, 98.0, 48.0, 53.0, 49.0, 19.0, 24.0, 23.0, 6.0, 14.0, 1.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4658203125, -0.4510002136230469, -0.43618011474609375, -0.4213600158691406, -0.4065399169921875, -0.3917198181152344, -0.37689971923828125, -0.3620796203613281, -0.347259521484375, -0.3324394226074219, -0.31761932373046875, -0.3027992248535156, -0.2879791259765625, -0.2731590270996094, -0.25833892822265625, -0.24351882934570312, -0.22869873046875, -0.21387863159179688, -0.19905853271484375, -0.18423843383789062, -0.1694183349609375, -0.15459823608398438, -0.13977813720703125, -0.12495803833007812, -0.110137939453125, -0.09531784057617188, -0.08049774169921875, -0.06567764282226562, -0.0508575439453125, -0.036037445068359375, -0.02121734619140625, -0.006397247314453125, 0.0084228515625, 0.023242950439453125, 0.03806304931640625, 0.052883148193359375, 0.0677032470703125, 0.08252334594726562, 0.09734344482421875, 0.11216354370117188, 0.126983642578125, 0.14180374145507812, 0.15662384033203125, 0.17144393920898438, 0.1862640380859375, 0.20108413696289062, 0.21590423583984375, 0.23072433471679688, 0.24554443359375, 0.2603645324707031, 0.27518463134765625, 0.2900047302246094, 0.3048248291015625, 0.3196449279785156, 0.33446502685546875, 0.3492851257324219, 0.364105224609375, 0.3789253234863281, 0.39374542236328125, 0.4085655212402344, 0.4233856201171875, 0.4382057189941406, 0.45302581787109375, 0.4678459167480469, 0.482666015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 19.0, 72.0, 445.0, 3269.0, 149.0, 62.0, 15.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1943359375, -0.18881607055664062, -0.18329620361328125, -0.17777633666992188, -0.1722564697265625, -0.16673660278320312, -0.16121673583984375, -0.15569686889648438, -0.150177001953125, -0.14465713500976562, -0.13913726806640625, -0.13361740112304688, -0.1280975341796875, -0.12257766723632812, -0.11705780029296875, -0.11153793334960938, -0.10601806640625, -0.10049819946289062, -0.09497833251953125, -0.08945846557617188, -0.0839385986328125, -0.07841873168945312, -0.07289886474609375, -0.06737899780273438, -0.061859130859375, -0.056339263916015625, -0.05081939697265625, -0.045299530029296875, -0.0397796630859375, -0.034259796142578125, -0.02873992919921875, -0.023220062255859375, -0.0177001953125, -0.012180328369140625, -0.00666046142578125, -0.001140594482421875, 0.0043792724609375, 0.009899139404296875, 0.01541900634765625, 0.020938873291015625, 0.026458740234375, 0.031978607177734375, 0.03749847412109375, 0.043018341064453125, 0.0485382080078125, 0.054058074951171875, 0.05957794189453125, 0.06509780883789062, 0.07061767578125, 0.07613754272460938, 0.08165740966796875, 0.08717727661132812, 0.0926971435546875, 0.09821701049804688, 0.10373687744140625, 0.10925674438476562, 0.114776611328125, 0.12029647827148438, 0.12581634521484375, 0.13133621215820312, 0.1368560791015625, 0.14237594604492188, 0.14789581298828125, 0.15341567993164062, 0.158935546875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 17.0, 14.0, 24.0, 55.0, 107.0, 140.0, 157.0, 149.0, 136.0, 72.0, 53.0, 28.0, 12.0, 12.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6229955554008484, -0.6078831553459167, -0.5927706956863403, -0.5776582956314087, -0.562545895576477, -0.5474334359169006, -0.532321035861969, -0.5172086358070374, -0.5020961761474609, -0.4869837462902069, -0.47187134623527527, -0.45675891637802124, -0.4416464865207672, -0.42653408646583557, -0.41142165660858154, -0.3963092565536499, -0.38119685649871826, -0.36608442664146423, -0.3509720265865326, -0.33585959672927856, -0.32074716687202454, -0.3056347668170929, -0.29052233695983887, -0.2754099369049072, -0.2602974772453308, -0.24518506228923798, -0.23007263243198395, -0.2149602174758911, -0.19984780251979828, -0.18473538756370544, -0.16962295770645142, -0.15451054275035858, -0.13939812779426575, -0.12428570538759232, -0.10917329043149948, -0.09406086802482605, -0.07894845306873322, -0.06383603066205978, -0.04872360825538635, -0.03361119329929352, -0.018498770892620087, -0.003386351279914379, 0.011726068332791328, 0.02683848887681961, 0.041950907558202744, 0.057063326239585876, 0.07217574864625931, 0.08728816360235214, 0.10240058600902557, 0.117513008415699, 0.13262543082237244, 0.14773784577846527, 0.1628502607345581, 0.17796269059181213, 0.19307510554790497, 0.2081875205039978, 0.22329995036125183, 0.23841236531734467, 0.2535247802734375, 0.26863721013069153, 0.28374963998794556, 0.2988620400428772, 0.3139744699001312, 0.32908689975738525, 0.3441992998123169]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 4.0, 15.0, 7.0, 13.0, 11.0, 15.0, 29.0, 20.0, 29.0, 28.0, 35.0, 38.0, 39.0, 36.0, 48.0, 40.0, 43.0, 45.0, 42.0, 42.0, 42.0, 40.0, 34.0, 34.0, 44.0, 30.0, 34.0, 25.0, 18.0, 26.0, 20.0, 12.0, 14.0, 8.0, 8.0, 5.0, 1.0, 10.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25805431604385376, -0.24963845312595367, -0.2412225902080536, -0.2328067272901535, -0.22439086437225342, -0.21597498655319214, -0.20755912363529205, -0.19914326071739197, -0.19072739779949188, -0.1823115348815918, -0.1738956719636917, -0.16547980904579163, -0.15706393122673035, -0.14864808320999146, -0.14023220539093018, -0.1318163424730301, -0.12340047955513, -0.11498461663722992, -0.10656875371932983, -0.09815288335084915, -0.08973702043294907, -0.08132115751504898, -0.0729052871465683, -0.06448942422866821, -0.05607356131076813, -0.04765769839286804, -0.03924183174967766, -0.030825966969132423, -0.02241010218858719, -0.013994239270687103, -0.005578372627496719, 0.0028374940156936646, 0.01125335693359375, 0.019669221714138985, 0.02808508649468422, 0.0365009531378746, 0.04491681605577469, 0.053332678973674774, 0.06174854561686516, 0.07016441226005554, 0.07858027517795563, 0.08699613809585571, 0.0954120010137558, 0.10382787138223648, 0.11224373430013657, 0.12065959721803665, 0.12907546758651733, 0.13749133050441742, 0.1459071934223175, 0.1543230563402176, 0.16273891925811768, 0.17115478217601776, 0.17957064509391785, 0.18798652291297913, 0.1964023858308792, 0.2048182487487793, 0.21323411166667938, 0.22164997458457947, 0.23006583750247955, 0.23848170042037964, 0.24689757823944092, 0.2553134262561798, 0.2637293040752411, 0.27214515209198, 0.28056102991104126]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 4.0, 8.0, 9.0, 13.0, 30.0, 31.0, 70.0, 126.0, 190.0, 368.0, 784.0, 1656.0, 3779.0, 10519.0, 35390.0, 188160.0, 602514.0, 157818.0, 30978.0, 9590.0, 3486.0, 1497.0, 695.0, 378.0, 183.0, 114.0, 66.0, 31.0, 17.0, 17.0, 9.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4077873229980469, -0.39345550537109375, -0.3791236877441406, -0.3647918701171875, -0.3504600524902344, -0.33612823486328125, -0.3217964172363281, -0.307464599609375, -0.2931327819824219, -0.27880096435546875, -0.2644691467285156, -0.2501373291015625, -0.23580551147460938, -0.22147369384765625, -0.20714187622070312, -0.19281005859375, -0.17847824096679688, -0.16414642333984375, -0.14981460571289062, -0.1354827880859375, -0.12115097045898438, -0.10681915283203125, -0.09248733520507812, -0.078155517578125, -0.06382369995117188, -0.04949188232421875, -0.035160064697265625, -0.0208282470703125, -0.006496429443359375, 0.00783538818359375, 0.022167205810546875, 0.0364990234375, 0.050830841064453125, 0.06516265869140625, 0.07949447631835938, 0.0938262939453125, 0.10815811157226562, 0.12248992919921875, 0.13682174682617188, 0.151153564453125, 0.16548538208007812, 0.17981719970703125, 0.19414901733398438, 0.2084808349609375, 0.22281265258789062, 0.23714447021484375, 0.2514762878417969, 0.26580810546875, 0.2801399230957031, 0.29447174072265625, 0.3088035583496094, 0.3231353759765625, 0.3374671936035156, 0.35179901123046875, 0.3661308288574219, 0.380462646484375, 0.3947944641113281, 0.40912628173828125, 0.4234580993652344, 0.4377899169921875, 0.4521217346191406, 0.46645355224609375, 0.4807853698730469, 0.4951171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 10.0, 19.0, 18.0, 23.0, 29.0, 23.0, 27.0, 41.0, 63.0, 53.0, 81.0, 64.0, 86.0, 70.0, 62.0, 53.0, 56.0, 48.0, 38.0, 40.0, 27.0, 17.0, 11.0, 14.0, 12.0, 7.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1629638671875, -0.15884017944335938, -0.15471649169921875, -0.15059280395507812, -0.1464691162109375, -0.14234542846679688, -0.13822174072265625, -0.13409805297851562, -0.129974365234375, -0.12585067749023438, -0.12172698974609375, -0.11760330200195312, -0.1134796142578125, -0.10935592651367188, -0.10523223876953125, -0.10110855102539062, -0.09698486328125, -0.09286117553710938, -0.08873748779296875, -0.08461380004882812, -0.0804901123046875, -0.07636642456054688, -0.07224273681640625, -0.06811904907226562, -0.063995361328125, -0.059871673583984375, -0.05574798583984375, -0.051624298095703125, -0.0475006103515625, -0.043376922607421875, -0.03925323486328125, -0.035129547119140625, -0.031005859375, -0.026882171630859375, -0.02275848388671875, -0.018634796142578125, -0.0145111083984375, -0.010387420654296875, -0.00626373291015625, -0.002140045166015625, 0.001983642578125, 0.006107330322265625, 0.01023101806640625, 0.014354705810546875, 0.0184783935546875, 0.022602081298828125, 0.02672576904296875, 0.030849456787109375, 0.03497314453125, 0.039096832275390625, 0.04322052001953125, 0.047344207763671875, 0.0514678955078125, 0.055591583251953125, 0.05971527099609375, 0.06383895874023438, 0.067962646484375, 0.07208633422851562, 0.07621002197265625, 0.08033370971679688, 0.0844573974609375, 0.08858108520507812, 0.09270477294921875, 0.09682846069335938, 0.1009521484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 7.0, 4.0, 12.0, 10.0, 23.0, 20.0, 26.0, 35.0, 55.0, 99.0, 134.0, 230.0, 333.0, 556.0, 921.0, 1707.0, 3545.0, 8304.0, 27038.0, 147167.0, 654281.0, 159162.0, 28331.0, 8665.0, 3636.0, 1730.0, 959.0, 575.0, 357.0, 195.0, 134.0, 97.0, 51.0, 53.0, 20.0, 20.0, 12.0, 9.0, 13.0, 8.0, 7.0, 2.0, 1.0, 6.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4716796875, -0.4567146301269531, -0.44174957275390625, -0.4267845153808594, -0.4118194580078125, -0.3968544006347656, -0.38188934326171875, -0.3669242858886719, -0.351959228515625, -0.3369941711425781, -0.32202911376953125, -0.3070640563964844, -0.2920989990234375, -0.2771339416503906, -0.26216888427734375, -0.24720382690429688, -0.23223876953125, -0.21727371215820312, -0.20230865478515625, -0.18734359741210938, -0.1723785400390625, -0.15741348266601562, -0.14244842529296875, -0.12748336791992188, -0.112518310546875, -0.09755325317382812, -0.08258819580078125, -0.06762313842773438, -0.0526580810546875, -0.037693023681640625, -0.02272796630859375, -0.007762908935546875, 0.0072021484375, 0.022167205810546875, 0.03713226318359375, 0.052097320556640625, 0.0670623779296875, 0.08202743530273438, 0.09699249267578125, 0.11195755004882812, 0.126922607421875, 0.14188766479492188, 0.15685272216796875, 0.17181777954101562, 0.1867828369140625, 0.20174789428710938, 0.21671295166015625, 0.23167800903320312, 0.24664306640625, 0.2616081237792969, 0.27657318115234375, 0.2915382385253906, 0.3065032958984375, 0.3214683532714844, 0.33643341064453125, 0.3513984680175781, 0.366363525390625, 0.3813285827636719, 0.39629364013671875, 0.4112586975097656, 0.4262237548828125, 0.4411888122558594, 0.45615386962890625, 0.4711189270019531, 0.486083984375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 6.0, 10.0, 15.0, 13.0, 37.0, 34.0, 35.0, 48.0, 48.0, 54.0, 69.0, 72.0, 59.0, 74.0, 65.0, 65.0, 49.0, 49.0, 42.0, 30.0, 28.0, 25.0, 19.0, 14.0, 10.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68994140625, -0.6648635864257812, -0.6397857666015625, -0.6147079467773438, -0.589630126953125, -0.5645523071289062, -0.5394744873046875, -0.5143966674804688, -0.48931884765625, -0.46424102783203125, -0.4391632080078125, -0.41408538818359375, -0.389007568359375, -0.36392974853515625, -0.3388519287109375, -0.31377410888671875, -0.2886962890625, -0.26361846923828125, -0.2385406494140625, -0.21346282958984375, -0.188385009765625, -0.16330718994140625, -0.1382293701171875, -0.11315155029296875, -0.08807373046875, -0.06299591064453125, -0.0379180908203125, -0.01284027099609375, 0.012237548828125, 0.03731536865234375, 0.0623931884765625, 0.08747100830078125, 0.112548828125, 0.13762664794921875, 0.1627044677734375, 0.18778228759765625, 0.212860107421875, 0.23793792724609375, 0.2630157470703125, 0.28809356689453125, 0.31317138671875, 0.33824920654296875, 0.3633270263671875, 0.38840484619140625, 0.413482666015625, 0.43856048583984375, 0.4636383056640625, 0.48871612548828125, 0.5137939453125, 0.5388717651367188, 0.5639495849609375, 0.5890274047851562, 0.614105224609375, 0.6391830444335938, 0.6642608642578125, 0.6893386840820312, 0.71441650390625, 0.7394943237304688, 0.7645721435546875, 0.7896499633789062, 0.814727783203125, 0.8398056030273438, 0.8648834228515625, 0.8899612426757812, 0.9150390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 4.0, 21.0, 21.0, 30.0, 68.0, 132.0, 243.0, 736.0, 2845.0, 32082.0, 969000.0, 39054.0, 3006.0, 755.0, 283.0, 113.0, 72.0, 33.0, 24.0, 11.0, 9.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.41339874267578125, -0.3922271728515625, -0.37105560302734375, -0.349884033203125, -0.32871246337890625, -0.3075408935546875, -0.28636932373046875, -0.26519775390625, -0.24402618408203125, -0.2228546142578125, -0.20168304443359375, -0.180511474609375, -0.15933990478515625, -0.1381683349609375, -0.11699676513671875, -0.0958251953125, -0.07465362548828125, -0.0534820556640625, -0.03231048583984375, -0.011138916015625, 0.01003265380859375, 0.0312042236328125, 0.05237579345703125, 0.07354736328125, 0.09471893310546875, 0.1158905029296875, 0.13706207275390625, 0.158233642578125, 0.17940521240234375, 0.2005767822265625, 0.22174835205078125, 0.242919921875, 0.26409149169921875, 0.2852630615234375, 0.30643463134765625, 0.327606201171875, 0.34877777099609375, 0.3699493408203125, 0.39112091064453125, 0.41229248046875, 0.43346405029296875, 0.4546356201171875, 0.47580718994140625, 0.496978759765625, 0.5181503295898438, 0.5393218994140625, 0.5604934692382812, 0.5816650390625, 0.6028366088867188, 0.6240081787109375, 0.6451797485351562, 0.666351318359375, 0.6875228881835938, 0.7086944580078125, 0.7298660278320312, 0.75103759765625, 0.7722091674804688, 0.7933807373046875, 0.8145523071289062, 0.835723876953125, 0.8568954467773438, 0.8780670166015625, 0.8992385864257812, 0.92041015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 14.0, 10.0, 29.0, 53.0, 62.0, 102.0, 146.0, 186.0, 144.0, 108.0, 62.0, 29.0, 18.0, 17.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020694732666015625, -0.00020056962966918945, -0.00019419193267822266, -0.00018781423568725586, -0.00018143653869628906, -0.00017505884170532227, -0.00016868114471435547, -0.00016230344772338867, -0.00015592575073242188, -0.00014954805374145508, -0.00014317035675048828, -0.00013679265975952148, -0.0001304149627685547, -0.0001240372657775879, -0.0001176595687866211, -0.0001112818717956543, -0.0001049041748046875, -9.85264778137207e-05, -9.21487808227539e-05, -8.577108383178711e-05, -7.939338684082031e-05, -7.301568984985352e-05, -6.663799285888672e-05, -6.026029586791992e-05, -5.3882598876953125e-05, -4.750490188598633e-05, -4.112720489501953e-05, -3.4749507904052734e-05, -2.8371810913085938e-05, -2.199411392211914e-05, -1.5616416931152344e-05, -9.238719940185547e-06, -2.86102294921875e-06, 3.516674041748047e-06, 9.894371032714844e-06, 1.627206802368164e-05, 2.2649765014648438e-05, 2.9027462005615234e-05, 3.540515899658203e-05, 4.178285598754883e-05, 4.8160552978515625e-05, 5.453824996948242e-05, 6.091594696044922e-05, 6.729364395141602e-05, 7.367134094238281e-05, 8.004903793334961e-05, 8.64267349243164e-05, 9.28044319152832e-05, 9.918212890625e-05, 0.0001055598258972168, 0.0001119375228881836, 0.00011831521987915039, 0.0001246929168701172, 0.00013107061386108398, 0.00013744831085205078, 0.00014382600784301758, 0.00015020370483398438, 0.00015658140182495117, 0.00016295909881591797, 0.00016933679580688477, 0.00017571449279785156, 0.00018209218978881836, 0.00018846988677978516, 0.00019484758377075195, 0.00020122528076171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 6.0, 2.0, 8.0, 9.0, 19.0, 20.0, 33.0, 49.0, 83.0, 164.0, 280.0, 564.0, 1280.0, 3651.0, 16292.0, 219629.0, 750166.0, 45604.0, 6929.0, 2033.0, 833.0, 398.0, 185.0, 114.0, 69.0, 46.0, 21.0, 16.0, 12.0, 10.0, 12.0, 9.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.32464599609375, -0.3145751953125, -0.30450439453125, -0.29443359375, -0.28436279296875, -0.2742919921875, -0.26422119140625, -0.254150390625, -0.24407958984375, -0.2340087890625, -0.22393798828125, -0.2138671875, -0.20379638671875, -0.1937255859375, -0.18365478515625, -0.173583984375, -0.16351318359375, -0.1534423828125, -0.14337158203125, -0.13330078125, -0.12322998046875, -0.1131591796875, -0.10308837890625, -0.093017578125, -0.08294677734375, -0.0728759765625, -0.06280517578125, -0.052734375, -0.04266357421875, -0.0325927734375, -0.02252197265625, -0.012451171875, -0.00238037109375, 0.0076904296875, 0.01776123046875, 0.02783203125, 0.03790283203125, 0.0479736328125, 0.05804443359375, 0.068115234375, 0.07818603515625, 0.0882568359375, 0.09832763671875, 0.1083984375, 0.11846923828125, 0.1285400390625, 0.13861083984375, 0.148681640625, 0.15875244140625, 0.1688232421875, 0.17889404296875, 0.18896484375, 0.19903564453125, 0.2091064453125, 0.21917724609375, 0.229248046875, 0.23931884765625, 0.2493896484375, 0.25946044921875, 0.26953125, 0.27960205078125, 0.2896728515625, 0.29974365234375, 0.309814453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 11.0, 9.0, 15.0, 23.0, 22.0, 25.0, 36.0, 56.0, 88.0, 128.0, 130.0, 133.0, 81.0, 57.0, 45.0, 34.0, 29.0, 21.0, 10.0, 10.0, 5.0, 2.0, 11.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37158203125, -0.3608589172363281, -0.35013580322265625, -0.3394126892089844, -0.3286895751953125, -0.3179664611816406, -0.30724334716796875, -0.2965202331542969, -0.285797119140625, -0.2750740051269531, -0.26435089111328125, -0.2536277770996094, -0.2429046630859375, -0.23218154907226562, -0.22145843505859375, -0.21073532104492188, -0.20001220703125, -0.18928909301757812, -0.17856597900390625, -0.16784286499023438, -0.1571197509765625, -0.14639663696289062, -0.13567352294921875, -0.12495040893554688, -0.114227294921875, -0.10350418090820312, -0.09278106689453125, -0.08205795288085938, -0.0713348388671875, -0.060611724853515625, -0.04988861083984375, -0.039165496826171875, -0.0284423828125, -0.017719268798828125, -0.00699615478515625, 0.003726959228515625, 0.0144500732421875, 0.025173187255859375, 0.03589630126953125, 0.046619415283203125, 0.057342529296875, 0.06806564331054688, 0.07878875732421875, 0.08951187133789062, 0.1002349853515625, 0.11095809936523438, 0.12168121337890625, 0.13240432739257812, 0.14312744140625, 0.15385055541992188, 0.16457366943359375, 0.17529678344726562, 0.1860198974609375, 0.19674301147460938, 0.20746612548828125, 0.21818923950195312, 0.228912353515625, 0.23963546752929688, 0.25035858154296875, 0.2610816955566406, 0.2718048095703125, 0.2825279235839844, 0.29325103759765625, 0.3039741516113281, 0.314697265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 4.0, 20.0, 53.0, 119.0, 222.0, 278.0, 177.0, 75.0, 28.0, 13.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.642379760742188, -9.41045093536377, -9.178521156311035, -8.946592330932617, -8.714662551879883, -8.482733726501465, -8.25080394744873, -8.018875122070312, -7.786945343017578, -7.555016040802002, -7.323086738586426, -7.09115743637085, -6.859228134155273, -6.627298831939697, -6.395369529724121, -6.163440704345703, -5.931511402130127, -5.699582099914551, -5.467652797698975, -5.235723495483398, -5.003794193267822, -4.771864891052246, -4.539936065673828, -4.308006286621094, -4.076077461242676, -3.8441481590270996, -3.6122188568115234, -3.3802895545959473, -3.148360252380371, -2.916430950164795, -2.684501886367798, -2.4525725841522217, -2.2206435203552246, -1.9887142181396484, -1.7567849159240723, -1.5248557329177856, -1.2929264307022095, -1.0609971284866333, -0.8290679454803467, -0.5971386432647705, -0.36520934104919434, -0.13328006863594055, 0.09864920377731323, 0.33057844638824463, 0.5625077486038208, 0.794437050819397, 1.0263662338256836, 1.2582955360412598, 1.490224838256836, 1.722154140472412, 1.9540834426879883, 2.1860127449035645, 2.4179420471191406, 2.649871349334717, 2.881800413131714, 3.11372971534729, 3.345659017562866, 3.5775883197784424, 3.8095176219940186, 4.041446685791016, 4.273375988006592, 4.505305290222168, 4.737234592437744, 4.96916389465332, 5.2010931968688965]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 6.0, 4.0, 3.0, 12.0, 12.0, 12.0, 6.0, 17.0, 19.0, 21.0, 30.0, 30.0, 28.0, 44.0, 42.0, 46.0, 48.0, 44.0, 46.0, 49.0, 61.0, 47.0, 59.0, 42.0, 46.0, 44.0, 28.0, 23.0, 20.0, 21.0, 18.0, 14.0, 13.0, 10.0, 7.0, 5.0, 6.0, 6.0, 2.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1959125995635986, -3.0993895530700684, -3.002866268157959, -2.9063432216644287, -2.8098199367523193, -2.713296890258789, -2.6167736053466797, -2.5202505588531494, -2.423727512359619, -2.327204465866089, -2.2306811809539795, -2.134158134460449, -2.03763484954834, -1.9411118030548096, -1.8445886373519897, -1.74806547164917, -1.6515421867370605, -1.5550190210342407, -1.458495855331421, -1.3619728088378906, -1.2654495239257812, -1.168926477432251, -1.0724033117294312, -0.9758801460266113, -0.8793569803237915, -0.7828338146209717, -0.6863106489181519, -0.5897875428199768, -0.493264377117157, -0.39674121141433716, -0.3002181053161621, -0.20369493961334229, -0.10717201232910156, -0.010648861527442932, 0.0858742892742157, 0.18239742517471313, 0.27892059087753296, 0.3754437565803528, 0.47196686267852783, 0.5684900283813477, 0.6650131940841675, 0.7615363597869873, 0.8580595254898071, 0.9545826315879822, 1.0511057376861572, 1.1476290225982666, 1.2441520690917969, 1.3406752347946167, 1.4371984004974365, 1.5337215662002563, 1.6302447319030762, 1.7267677783966064, 1.8232910633087158, 1.919814109802246, 2.0163373947143555, 2.1128604412078857, 2.209383487701416, 2.3059065341949463, 2.4024298191070557, 2.498952865600586, 2.5954761505126953, 2.6919991970062256, 2.788522243499756, 2.8850455284118652, 2.9815688133239746]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 6.0, 7.0, 8.0, 14.0, 14.0, 23.0, 33.0, 61.0, 80.0, 110.0, 220.0, 332.0, 611.0, 1188.0, 2708.0, 7137.0, 31063.0, 3952858.0, 173193.0, 15834.0, 4709.0, 1974.0, 922.0, 467.0, 287.0, 142.0, 92.0, 74.0, 35.0, 21.0, 17.0, 12.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7001953125, -0.6830329895019531, -0.6658706665039062, -0.6487083435058594, -0.6315460205078125, -0.6143836975097656, -0.5972213745117188, -0.5800590515136719, -0.562896728515625, -0.5457344055175781, -0.5285720825195312, -0.5114097595214844, -0.4942474365234375, -0.4770851135253906, -0.45992279052734375, -0.4427604675292969, -0.42559814453125, -0.4084358215332031, -0.39127349853515625, -0.3741111755371094, -0.3569488525390625, -0.3397865295410156, -0.32262420654296875, -0.3054618835449219, -0.288299560546875, -0.2711372375488281, -0.25397491455078125, -0.23681259155273438, -0.2196502685546875, -0.20248794555664062, -0.18532562255859375, -0.16816329956054688, -0.1510009765625, -0.13383865356445312, -0.11667633056640625, -0.09951400756835938, -0.0823516845703125, -0.06518936157226562, -0.04802703857421875, -0.030864715576171875, -0.013702392578125, 0.003459930419921875, 0.02062225341796875, 0.037784576416015625, 0.0549468994140625, 0.07210922241210938, 0.08927154541015625, 0.10643386840820312, 0.12359619140625, 0.14075851440429688, 0.15792083740234375, 0.17508316040039062, 0.1922454833984375, 0.20940780639648438, 0.22657012939453125, 0.24373245239257812, 0.260894775390625, 0.2780570983886719, 0.29521942138671875, 0.3123817443847656, 0.3295440673828125, 0.3467063903808594, 0.36386871337890625, 0.3810310363769531, 0.398193359375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 7.0, 13.0, 17.0, 23.0, 31.0, 35.0, 46.0, 49.0, 70.0, 74.0, 84.0, 83.0, 63.0, 75.0, 71.0, 59.0, 46.0, 42.0, 24.0, 27.0, 19.0, 11.0, 12.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.212158203125, -0.20728492736816406, -0.20241165161132812, -0.1975383758544922, -0.19266510009765625, -0.1877918243408203, -0.18291854858398438, -0.17804527282714844, -0.1731719970703125, -0.16829872131347656, -0.16342544555664062, -0.1585521697998047, -0.15367889404296875, -0.1488056182861328, -0.14393234252929688, -0.13905906677246094, -0.134185791015625, -0.12931251525878906, -0.12443923950195312, -0.11956596374511719, -0.11469268798828125, -0.10981941223144531, -0.10494613647460938, -0.10007286071777344, -0.0951995849609375, -0.09032630920410156, -0.08545303344726562, -0.08057975769042969, -0.07570648193359375, -0.07083320617675781, -0.06595993041992188, -0.06108665466308594, -0.05621337890625, -0.05134010314941406, -0.046466827392578125, -0.04159355163574219, -0.03672027587890625, -0.03184700012207031, -0.026973724365234375, -0.022100448608398438, -0.0172271728515625, -0.012353897094726562, -0.007480621337890625, -0.0026073455810546875, 0.00226593017578125, 0.0071392059326171875, 0.012012481689453125, 0.016885757446289062, 0.021759033203125, 0.026632308959960938, 0.031505584716796875, 0.03637886047363281, 0.04125213623046875, 0.04612541198730469, 0.050998687744140625, 0.05587196350097656, 0.0607452392578125, 0.06561851501464844, 0.07049179077148438, 0.07536506652832031, 0.08023834228515625, 0.08511161804199219, 0.08998489379882812, 0.09485816955566406, 0.0997314453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 6.0, 12.0, 7.0, 25.0, 21.0, 46.0, 51.0, 68.0, 100.0, 145.0, 187.0, 250.0, 434.0, 606.0, 966.0, 1687.0, 3049.0, 6478.0, 19508.0, 124772.0, 3913656.0, 92330.0, 16845.0, 5885.0, 2788.0, 1518.0, 886.0, 605.0, 413.0, 242.0, 205.0, 101.0, 107.0, 79.0, 60.0, 35.0, 30.0, 19.0, 19.0, 14.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.57470703125, -0.5569915771484375, -0.539276123046875, -0.5215606689453125, -0.50384521484375, -0.4861297607421875, -0.468414306640625, -0.4506988525390625, -0.4329833984375, -0.4152679443359375, -0.397552490234375, -0.3798370361328125, -0.36212158203125, -0.3444061279296875, -0.326690673828125, -0.3089752197265625, -0.291259765625, -0.2735443115234375, -0.255828857421875, -0.2381134033203125, -0.22039794921875, -0.2026824951171875, -0.184967041015625, -0.1672515869140625, -0.1495361328125, -0.1318206787109375, -0.114105224609375, -0.0963897705078125, -0.07867431640625, -0.0609588623046875, -0.043243408203125, -0.0255279541015625, -0.0078125, 0.0099029541015625, 0.027618408203125, 0.0453338623046875, 0.06304931640625, 0.0807647705078125, 0.098480224609375, 0.1161956787109375, 0.1339111328125, 0.1516265869140625, 0.169342041015625, 0.1870574951171875, 0.20477294921875, 0.2224884033203125, 0.240203857421875, 0.2579193115234375, 0.275634765625, 0.2933502197265625, 0.311065673828125, 0.3287811279296875, 0.34649658203125, 0.3642120361328125, 0.381927490234375, 0.3996429443359375, 0.4173583984375, 0.4350738525390625, 0.452789306640625, 0.4705047607421875, 0.48822021484375, 0.5059356689453125, 0.523651123046875, 0.5413665771484375, 0.55908203125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 11.0, 28.0, 70.0, 208.0, 3332.0, 278.0, 66.0, 31.0, 10.0, 11.0, 7.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3038444519042969, -0.29616546630859375, -0.2884864807128906, -0.2808074951171875, -0.2731285095214844, -0.26544952392578125, -0.2577705383300781, -0.250091552734375, -0.24241256713867188, -0.23473358154296875, -0.22705459594726562, -0.2193756103515625, -0.21169662475585938, -0.20401763916015625, -0.19633865356445312, -0.18865966796875, -0.18098068237304688, -0.17330169677734375, -0.16562271118164062, -0.1579437255859375, -0.15026473999023438, -0.14258575439453125, -0.13490676879882812, -0.127227783203125, -0.11954879760742188, -0.11186981201171875, -0.10419082641601562, -0.0965118408203125, -0.08883285522460938, -0.08115386962890625, -0.07347488403320312, -0.0657958984375, -0.058116912841796875, -0.05043792724609375, -0.042758941650390625, -0.0350799560546875, -0.027400970458984375, -0.01972198486328125, -0.012042999267578125, -0.004364013671875, 0.003314971923828125, 0.01099395751953125, 0.018672943115234375, 0.0263519287109375, 0.034030914306640625, 0.04170989990234375, 0.049388885498046875, 0.05706787109375, 0.06474685668945312, 0.07242584228515625, 0.08010482788085938, 0.0877838134765625, 0.09546279907226562, 0.10314178466796875, 0.11082077026367188, 0.118499755859375, 0.12617874145507812, 0.13385772705078125, 0.14153671264648438, 0.1492156982421875, 0.15689468383789062, 0.16457366943359375, 0.17225265502929688, 0.179931640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 9.0, 18.0, 44.0, 51.0, 153.0, 167.0, 219.0, 167.0, 80.0, 50.0, 29.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7165275812149048, -1.682455062866211, -1.6483824253082275, -1.6143099069595337, -1.5802373886108398, -1.5461647510528564, -1.5120922327041626, -1.4780197143554688, -1.4439470767974854, -1.4098745584487915, -1.375801920890808, -1.3417294025421143, -1.3076568841934204, -1.2735843658447266, -1.2395117282867432, -1.2054392099380493, -1.1713666915893555, -1.1372941732406616, -1.1032215356826782, -1.0691490173339844, -1.0350764989852905, -1.0010039806365967, -0.9669313430786133, -0.9328588247299194, -0.8987862467765808, -0.8647136688232422, -0.8306411504745483, -0.7965685725212097, -0.7624959945678711, -0.7284234762191772, -0.6943508982658386, -0.6602783203125, -0.6262056827545166, -0.592133104801178, -0.5580605864524841, -0.5239880084991455, -0.4899154603481293, -0.45584291219711304, -0.4217703342437744, -0.3876977860927582, -0.35362523794174194, -0.3195526897907257, -0.2854801416397095, -0.25140756368637085, -0.21733501553535461, -0.18326246738433838, -0.14918990433216095, -0.11511734127998352, -0.08104479312896729, -0.04697223752737045, -0.01289968192577362, 0.02117287367582321, 0.055245429277420044, 0.08931797742843628, 0.12339054048061371, 0.15746310353279114, 0.19153565168380737, 0.2256081998348236, 0.25968074798583984, 0.29375332593917847, 0.3278258740901947, 0.36189842224121094, 0.39597100019454956, 0.4300435483455658, 0.46411609649658203]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 6.0, 9.0, 6.0, 12.0, 21.0, 21.0, 21.0, 21.0, 23.0, 26.0, 22.0, 26.0, 47.0, 53.0, 45.0, 39.0, 39.0, 45.0, 44.0, 55.0, 55.0, 35.0, 40.0, 32.0, 45.0, 34.0, 31.0, 20.0, 27.0, 21.0, 16.0, 12.0, 12.0, 9.0, 11.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.45489203929901123, -0.4417952001094818, -0.4286983609199524, -0.41560155153274536, -0.40250471234321594, -0.3894078731536865, -0.3763110339641571, -0.3632141947746277, -0.35011738538742065, -0.33702054619789124, -0.3239237070083618, -0.3108268976211548, -0.29773005843162537, -0.28463321924209595, -0.27153638005256653, -0.2584395408630371, -0.24534271657466888, -0.23224587738513947, -0.21914905309677124, -0.20605221390724182, -0.1929553896188736, -0.17985855042934418, -0.16676172614097595, -0.15366488695144653, -0.14056804776191711, -0.1274712085723877, -0.11437438428401947, -0.10127754509449005, -0.08818072080612183, -0.07508388161659241, -0.061987049877643585, -0.04889021813869476, -0.03579339385032654, -0.022696562111377716, -0.009599728509783745, 0.0034971050918102264, 0.01659393683075905, 0.02969077229499817, 0.04278760403394699, 0.05588443577289581, 0.06898126751184464, 0.08207809925079346, 0.09517493098974228, 0.1082717627286911, 0.12136860191822052, 0.13446542620658875, 0.14756226539611816, 0.16065910458564758, 0.1737559288740158, 0.18685276806354523, 0.19994959235191345, 0.21304643154144287, 0.2261432558298111, 0.23924009501934052, 0.25233691930770874, 0.26543375849723816, 0.2785305976867676, 0.291627436876297, 0.3047242760658264, 0.31782108545303345, 0.33091792464256287, 0.3440147638320923, 0.3571116030216217, 0.3702084422111511, 0.38330525159835815]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 11.0, 9.0, 10.0, 16.0, 22.0, 49.0, 88.0, 152.0, 299.0, 522.0, 1137.0, 2294.0, 5345.0, 14581.0, 54679.0, 318271.0, 516207.0, 99080.0, 22287.0, 7444.0, 3089.0, 1390.0, 751.0, 380.0, 201.0, 97.0, 58.0, 33.0, 14.0, 3.0, 14.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.484375, -0.4697761535644531, -0.45517730712890625, -0.4405784606933594, -0.4259796142578125, -0.4113807678222656, -0.39678192138671875, -0.3821830749511719, -0.367584228515625, -0.3529853820800781, -0.33838653564453125, -0.3237876892089844, -0.3091888427734375, -0.2945899963378906, -0.27999114990234375, -0.2653923034667969, -0.25079345703125, -0.23619461059570312, -0.22159576416015625, -0.20699691772460938, -0.1923980712890625, -0.17779922485351562, -0.16320037841796875, -0.14860153198242188, -0.134002685546875, -0.11940383911132812, -0.10480499267578125, -0.09020614624023438, -0.0756072998046875, -0.061008453369140625, -0.04640960693359375, -0.031810760498046875, -0.0172119140625, -0.002613067626953125, 0.01198577880859375, 0.026584625244140625, 0.0411834716796875, 0.055782318115234375, 0.07038116455078125, 0.08498001098632812, 0.099578857421875, 0.11417770385742188, 0.12877655029296875, 0.14337539672851562, 0.1579742431640625, 0.17257308959960938, 0.18717193603515625, 0.20177078247070312, 0.21636962890625, 0.23096847534179688, 0.24556732177734375, 0.2601661682128906, 0.2747650146484375, 0.2893638610839844, 0.30396270751953125, 0.3185615539550781, 0.333160400390625, 0.3477592468261719, 0.36235809326171875, 0.3769569396972656, 0.3915557861328125, 0.4061546325683594, 0.42075347900390625, 0.4353523254394531, 0.449951171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 9.0, 9.0, 8.0, 19.0, 25.0, 21.0, 28.0, 38.0, 43.0, 46.0, 62.0, 60.0, 52.0, 75.0, 71.0, 62.0, 63.0, 55.0, 57.0, 44.0, 34.0, 20.0, 24.0, 17.0, 15.0, 15.0, 13.0, 8.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.189208984375, -0.1845846176147461, -0.1799602508544922, -0.17533588409423828, -0.17071151733398438, -0.16608715057373047, -0.16146278381347656, -0.15683841705322266, -0.15221405029296875, -0.14758968353271484, -0.14296531677246094, -0.13834095001220703, -0.13371658325195312, -0.12909221649169922, -0.12446784973144531, -0.1198434829711914, -0.1152191162109375, -0.1105947494506836, -0.10597038269042969, -0.10134601593017578, -0.09672164916992188, -0.09209728240966797, -0.08747291564941406, -0.08284854888916016, -0.07822418212890625, -0.07359981536865234, -0.06897544860839844, -0.06435108184814453, -0.059726715087890625, -0.05510234832763672, -0.05047798156738281, -0.045853614807128906, -0.041229248046875, -0.036604881286621094, -0.03198051452636719, -0.02735614776611328, -0.022731781005859375, -0.01810741424560547, -0.013483047485351562, -0.008858680725097656, -0.00423431396484375, 0.00039005279541015625, 0.0050144195556640625, 0.009638786315917969, 0.014263153076171875, 0.01888751983642578, 0.023511886596679688, 0.028136253356933594, 0.0327606201171875, 0.037384986877441406, 0.04200935363769531, 0.04663372039794922, 0.051258087158203125, 0.05588245391845703, 0.06050682067871094, 0.06513118743896484, 0.06975555419921875, 0.07437992095947266, 0.07900428771972656, 0.08362865447998047, 0.08825302124023438, 0.09287738800048828, 0.09750175476074219, 0.1021261215209961, 0.10675048828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 6.0, 13.0, 18.0, 23.0, 37.0, 59.0, 107.0, 208.0, 350.0, 800.0, 2434.0, 12181.0, 402013.0, 611154.0, 14658.0, 2747.0, 878.0, 356.0, 203.0, 106.0, 68.0, 50.0, 21.0, 14.0, 16.0, 8.0, 4.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99169921875, -0.9536209106445312, -0.9155426025390625, -0.8774642944335938, -0.839385986328125, -0.8013076782226562, -0.7632293701171875, -0.7251510620117188, -0.68707275390625, -0.6489944458007812, -0.6109161376953125, -0.5728378295898438, -0.534759521484375, -0.49668121337890625, -0.4586029052734375, -0.42052459716796875, -0.3824462890625, -0.34436798095703125, -0.3062896728515625, -0.26821136474609375, -0.230133056640625, -0.19205474853515625, -0.1539764404296875, -0.11589813232421875, -0.07781982421875, -0.03974151611328125, -0.0016632080078125, 0.03641510009765625, 0.074493408203125, 0.11257171630859375, 0.1506500244140625, 0.18872833251953125, 0.226806640625, 0.26488494873046875, 0.3029632568359375, 0.34104156494140625, 0.379119873046875, 0.41719818115234375, 0.4552764892578125, 0.49335479736328125, 0.53143310546875, 0.5695114135742188, 0.6075897216796875, 0.6456680297851562, 0.683746337890625, 0.7218246459960938, 0.7599029541015625, 0.7979812622070312, 0.8360595703125, 0.8741378784179688, 0.9122161865234375, 0.9502944946289062, 0.988372802734375, 1.0264511108398438, 1.0645294189453125, 1.1026077270507812, 1.14068603515625, 1.1787643432617188, 1.2168426513671875, 1.2549209594726562, 1.292999267578125, 1.3310775756835938, 1.3691558837890625, 1.4072341918945312, 1.4453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 7.0, 10.0, 17.0, 10.0, 25.0, 28.0, 33.0, 35.0, 46.0, 61.0, 50.0, 57.0, 72.0, 67.0, 65.0, 69.0, 55.0, 45.0, 59.0, 50.0, 30.0, 21.0, 18.0, 18.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7767257690429688, -0.7472991943359375, -0.7178726196289062, -0.688446044921875, -0.6590194702148438, -0.6295928955078125, -0.6001663208007812, -0.57073974609375, -0.5413131713867188, -0.5118865966796875, -0.48246002197265625, -0.453033447265625, -0.42360687255859375, -0.3941802978515625, -0.36475372314453125, -0.3353271484375, -0.30590057373046875, -0.2764739990234375, -0.24704742431640625, -0.217620849609375, -0.18819427490234375, -0.1587677001953125, -0.12934112548828125, -0.09991455078125, -0.07048797607421875, -0.0410614013671875, -0.01163482666015625, 0.017791748046875, 0.04721832275390625, 0.0766448974609375, 0.10607147216796875, 0.135498046875, 0.16492462158203125, 0.1943511962890625, 0.22377777099609375, 0.253204345703125, 0.28263092041015625, 0.3120574951171875, 0.34148406982421875, 0.37091064453125, 0.40033721923828125, 0.4297637939453125, 0.45919036865234375, 0.488616943359375, 0.5180435180664062, 0.5474700927734375, 0.5768966674804688, 0.6063232421875, 0.6357498168945312, 0.6651763916015625, 0.6946029663085938, 0.724029541015625, 0.7534561157226562, 0.7828826904296875, 0.8123092651367188, 0.84173583984375, 0.8711624145507812, 0.9005889892578125, 0.9300155639648438, 0.959442138671875, 0.9888687133789062, 1.0182952880859375, 1.0477218627929688, 1.0771484375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 10.0, 13.0, 31.0, 65.0, 144.0, 393.0, 1447.0, 18329.0, 1016425.0, 10015.0, 1084.0, 298.0, 143.0, 78.0, 23.0, 17.0, 10.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.3265380859375, -1.272216796875, -1.2178955078125, -1.16357421875, -1.1092529296875, -1.054931640625, -1.0006103515625, -0.9462890625, -0.8919677734375, -0.837646484375, -0.7833251953125, -0.72900390625, -0.6746826171875, -0.620361328125, -0.5660400390625, -0.51171875, -0.4573974609375, -0.403076171875, -0.3487548828125, -0.29443359375, -0.2401123046875, -0.185791015625, -0.1314697265625, -0.0771484375, -0.0228271484375, 0.031494140625, 0.0858154296875, 0.14013671875, 0.1944580078125, 0.248779296875, 0.3031005859375, 0.357421875, 0.4117431640625, 0.466064453125, 0.5203857421875, 0.57470703125, 0.6290283203125, 0.683349609375, 0.7376708984375, 0.7919921875, 0.8463134765625, 0.900634765625, 0.9549560546875, 1.00927734375, 1.0635986328125, 1.117919921875, 1.1722412109375, 1.2265625, 1.2808837890625, 1.335205078125, 1.3895263671875, 1.44384765625, 1.4981689453125, 1.552490234375, 1.6068115234375, 1.6611328125, 1.7154541015625, 1.769775390625, 1.8240966796875, 1.87841796875, 1.9327392578125, 1.987060546875, 2.0413818359375, 2.095703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 10.0, 14.0, 17.0, 19.0, 27.0, 35.0, 51.0, 41.0, 75.0, 67.0, 76.0, 114.0, 93.0, 68.0, 64.0, 51.0, 42.0, 25.0, 28.0, 15.0, 16.0, 12.0, 11.0, 8.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.08970832824707e-05, -8.780695497989655e-05, -8.471682667732239e-05, -8.162669837474823e-05, -7.853657007217407e-05, -7.544644176959991e-05, -7.235631346702576e-05, -6.92661851644516e-05, -6.617605686187744e-05, -6.308592855930328e-05, -5.9995800256729126e-05, -5.690567195415497e-05, -5.381554365158081e-05, -5.072541534900665e-05, -4.7635287046432495e-05, -4.454515874385834e-05, -4.145503044128418e-05, -3.836490213871002e-05, -3.5274773836135864e-05, -3.2184645533561707e-05, -2.909451723098755e-05, -2.600438892841339e-05, -2.2914260625839233e-05, -1.9824132323265076e-05, -1.6734004020690918e-05, -1.364387571811676e-05, -1.0553747415542603e-05, -7.463619112968445e-06, -4.373490810394287e-06, -1.2833625078201294e-06, 1.8067657947540283e-06, 4.896894097328186e-06, 7.987022399902344e-06, 1.1077150702476501e-05, 1.416727900505066e-05, 1.7257407307624817e-05, 2.0347535610198975e-05, 2.3437663912773132e-05, 2.652779221534729e-05, 2.9617920517921448e-05, 3.2708048820495605e-05, 3.579817712306976e-05, 3.888830542564392e-05, 4.197843372821808e-05, 4.5068562030792236e-05, 4.8158690333366394e-05, 5.124881863594055e-05, 5.433894693851471e-05, 5.742907524108887e-05, 6.0519203543663025e-05, 6.360933184623718e-05, 6.669946014881134e-05, 6.97895884513855e-05, 7.287971675395966e-05, 7.596984505653381e-05, 7.905997335910797e-05, 8.215010166168213e-05, 8.524022996425629e-05, 8.833035826683044e-05, 9.14204865694046e-05, 9.451061487197876e-05, 9.760074317455292e-05, 0.00010069087147712708, 0.00010378099977970123, 0.00010687112808227539]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 9.0, 15.0, 15.0, 33.0, 73.0, 138.0, 305.0, 762.0, 2849.0, 40938.0, 978501.0, 21482.0, 2274.0, 630.0, 246.0, 118.0, 63.0, 31.0, 17.0, 12.0, 3.0, 6.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9033203125, -0.8691253662109375, -0.834930419921875, -0.8007354736328125, -0.76654052734375, -0.7323455810546875, -0.698150634765625, -0.6639556884765625, -0.6297607421875, -0.5955657958984375, -0.561370849609375, -0.5271759033203125, -0.49298095703125, -0.4587860107421875, -0.424591064453125, -0.3903961181640625, -0.356201171875, -0.3220062255859375, -0.287811279296875, -0.2536163330078125, -0.21942138671875, -0.1852264404296875, -0.151031494140625, -0.1168365478515625, -0.0826416015625, -0.0484466552734375, -0.014251708984375, 0.0199432373046875, 0.05413818359375, 0.0883331298828125, 0.122528076171875, 0.1567230224609375, 0.19091796875, 0.2251129150390625, 0.259307861328125, 0.2935028076171875, 0.32769775390625, 0.3618927001953125, 0.396087646484375, 0.4302825927734375, 0.4644775390625, 0.4986724853515625, 0.532867431640625, 0.5670623779296875, 0.60125732421875, 0.6354522705078125, 0.669647216796875, 0.7038421630859375, 0.738037109375, 0.7722320556640625, 0.806427001953125, 0.8406219482421875, 0.87481689453125, 0.9090118408203125, 0.943206787109375, 0.9774017333984375, 1.0115966796875, 1.0457916259765625, 1.079986572265625, 1.1141815185546875, 1.14837646484375, 1.1825714111328125, 1.216766357421875, 1.2509613037109375, 1.28515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 20.0, 21.0, 21.0, 65.0, 111.0, 299.0, 248.0, 86.0, 47.0, 28.0, 22.0, 8.0, 6.0, 6.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.1816558837890625, -1.144561767578125, -1.1074676513671875, -1.07037353515625, -1.0332794189453125, -0.996185302734375, -0.9590911865234375, -0.9219970703125, -0.8849029541015625, -0.847808837890625, -0.8107147216796875, -0.77362060546875, -0.7365264892578125, -0.699432373046875, -0.6623382568359375, -0.625244140625, -0.5881500244140625, -0.551055908203125, -0.5139617919921875, -0.47686767578125, -0.4397735595703125, -0.402679443359375, -0.3655853271484375, -0.3284912109375, -0.2913970947265625, -0.254302978515625, -0.2172088623046875, -0.18011474609375, -0.1430206298828125, -0.105926513671875, -0.0688323974609375, -0.03173828125, 0.0053558349609375, 0.042449951171875, 0.0795440673828125, 0.11663818359375, 0.1537322998046875, 0.190826416015625, 0.2279205322265625, 0.2650146484375, 0.3021087646484375, 0.339202880859375, 0.3762969970703125, 0.41339111328125, 0.4504852294921875, 0.487579345703125, 0.5246734619140625, 0.561767578125, 0.5988616943359375, 0.635955810546875, 0.6730499267578125, 0.71014404296875, 0.7472381591796875, 0.784332275390625, 0.8214263916015625, 0.8585205078125, 0.8956146240234375, 0.932708740234375, 0.9698028564453125, 1.00689697265625, 1.0439910888671875, 1.081085205078125, 1.1181793212890625, 1.1552734375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 34.0, 179.0, 582.0, 188.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.54459762573242, -31.744001388549805, -30.943405151367188, -30.14280891418457, -29.342212677001953, -28.54161834716797, -27.74102210998535, -26.940425872802734, -26.139829635620117, -25.3392333984375, -24.538637161254883, -23.738040924072266, -22.93744659423828, -22.13684844970703, -21.336254119873047, -20.53565788269043, -19.735061645507812, -18.934465408325195, -18.133869171142578, -17.33327293395996, -16.532676696777344, -15.732081413269043, -14.931486129760742, -14.130889892578125, -13.330293655395508, -12.52969741821289, -11.729101181030273, -10.928505897521973, -10.127909660339355, -9.327313423156738, -8.526718139648438, -7.72612190246582, -6.925527572631836, -6.124931335449219, -5.32433557510376, -4.523739814758301, -3.7231435775756836, -2.9225473403930664, -2.1219515800476074, -1.3213558197021484, -0.5207595825195312, 0.27983641624450684, 1.080432415008545, 1.881028413772583, 2.681624412536621, 3.4822206497192383, 4.282816410064697, 5.083412170410156, 5.884008407592773, 6.684604644775391, 7.48520040512085, 8.285796165466309, 9.086392402648926, 9.886988639831543, 10.687583923339844, 11.488180160522461, 12.288776397705078, 13.089372634887695, 13.889968872070312, 14.690564155578613, 15.49116039276123, 16.29175567626953, 17.09235191345215, 17.892948150634766, 18.693544387817383]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 4.0, 5.0, 2.0, 8.0, 6.0, 14.0, 14.0, 16.0, 25.0, 20.0, 31.0, 38.0, 31.0, 45.0, 52.0, 50.0, 56.0, 65.0, 63.0, 52.0, 59.0, 50.0, 47.0, 37.0, 38.0, 23.0, 29.0, 32.0, 19.0, 7.0, 17.0, 12.0, 3.0, 10.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.801705360412598, -4.664665222167969, -4.527624607086182, -4.390584468841553, -4.253543853759766, -4.116503715515137, -3.979463577270508, -3.8424232006073, -3.705382823944092, -3.568342447280884, -3.431302070617676, -3.294261932373047, -3.157221555709839, -3.020181179046631, -2.883141040802002, -2.746100664138794, -2.609060287475586, -2.472019910812378, -2.33497953414917, -2.197939395904541, -2.060899019241333, -1.923858642578125, -1.7868183851242065, -1.649778127670288, -1.51273775100708, -1.375697374343872, -1.2386571168899536, -1.1016168594360352, -0.9645764827728271, -0.8275361657142639, -0.6904958486557007, -0.5534555315971375, -0.4164149761199951, -0.2793746590614319, -0.14233434200286865, -0.00529402494430542, 0.1317462921142578, 0.26878660917282104, 0.4058269262313843, 0.5428672432899475, 0.6799075603485107, 0.816947877407074, 0.9539881944656372, 1.0910284519195557, 1.2280688285827637, 1.3651092052459717, 1.5021494626998901, 1.6391897201538086, 1.7762300968170166, 1.9132704734802246, 2.0503106117248535, 2.1873509883880615, 2.3243913650512695, 2.4614317417144775, 2.5984721183776855, 2.7355122566223145, 2.8725526332855225, 3.0095930099487305, 3.1466331481933594, 3.2836735248565674, 3.4207139015197754, 3.5577542781829834, 3.6947946548461914, 3.8318347930908203, 3.9688751697540283]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 9.0, 22.0, 34.0, 74.0, 125.0, 283.0, 555.0, 2165.0, 18343.0, 4149482.0, 19641.0, 2367.0, 646.0, 250.0, 111.0, 62.0, 34.0, 14.0, 21.0, 9.0, 9.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.131591796875, -2.07763671875, -2.023681640625, -1.9697265625, -1.915771484375, -1.86181640625, -1.807861328125, -1.75390625, -1.699951171875, -1.64599609375, -1.592041015625, -1.5380859375, -1.484130859375, -1.43017578125, -1.376220703125, -1.322265625, -1.268310546875, -1.21435546875, -1.160400390625, -1.1064453125, -1.052490234375, -0.99853515625, -0.944580078125, -0.890625, -0.836669921875, -0.78271484375, -0.728759765625, -0.6748046875, -0.620849609375, -0.56689453125, -0.512939453125, -0.458984375, -0.405029296875, -0.35107421875, -0.297119140625, -0.2431640625, -0.189208984375, -0.13525390625, -0.081298828125, -0.02734375, 0.026611328125, 0.08056640625, 0.134521484375, 0.1884765625, 0.242431640625, 0.29638671875, 0.350341796875, 0.404296875, 0.458251953125, 0.51220703125, 0.566162109375, 0.6201171875, 0.674072265625, 0.72802734375, 0.781982421875, 0.8359375, 0.889892578125, 0.94384765625, 0.997802734375, 1.0517578125, 1.105712890625, 1.15966796875, 1.213623046875, 1.267578125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 10.0, 5.0, 11.0, 16.0, 17.0, 22.0, 25.0, 29.0, 35.0, 50.0, 52.0, 51.0, 54.0, 61.0, 59.0, 59.0, 58.0, 59.0, 44.0, 57.0, 46.0, 30.0, 37.0, 20.0, 22.0, 14.0, 16.0, 10.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1588134765625, -0.15386199951171875, -0.1489105224609375, -0.14395904541015625, -0.139007568359375, -0.13405609130859375, -0.1291046142578125, -0.12415313720703125, -0.11920166015625, -0.11425018310546875, -0.1092987060546875, -0.10434722900390625, -0.099395751953125, -0.09444427490234375, -0.0894927978515625, -0.08454132080078125, -0.07958984375, -0.07463836669921875, -0.0696868896484375, -0.06473541259765625, -0.059783935546875, -0.05483245849609375, -0.0498809814453125, -0.04492950439453125, -0.03997802734375, -0.03502655029296875, -0.0300750732421875, -0.02512359619140625, -0.020172119140625, -0.01522064208984375, -0.0102691650390625, -0.00531768798828125, -0.0003662109375, 0.00458526611328125, 0.0095367431640625, 0.01448822021484375, 0.019439697265625, 0.02439117431640625, 0.0293426513671875, 0.03429412841796875, 0.03924560546875, 0.04419708251953125, 0.0491485595703125, 0.05410003662109375, 0.059051513671875, 0.06400299072265625, 0.0689544677734375, 0.07390594482421875, 0.078857421875, 0.08380889892578125, 0.0887603759765625, 0.09371185302734375, 0.098663330078125, 0.10361480712890625, 0.1085662841796875, 0.11351776123046875, 0.11846923828125, 0.12342071533203125, 0.1283721923828125, 0.13332366943359375, 0.138275146484375, 0.14322662353515625, 0.1481781005859375, 0.15312957763671875, 0.1580810546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 8.0, 9.0, 6.0, 23.0, 20.0, 34.0, 61.0, 70.0, 115.0, 206.0, 351.0, 644.0, 1355.0, 3387.0, 13231.0, 3602592.0, 554068.0, 12094.0, 3139.0, 1295.0, 622.0, 362.0, 211.0, 125.0, 74.0, 49.0, 41.0, 21.0, 19.0, 12.0, 7.0, 11.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7158203125, -1.6706390380859375, -1.625457763671875, -1.5802764892578125, -1.53509521484375, -1.4899139404296875, -1.444732666015625, -1.3995513916015625, -1.3543701171875, -1.3091888427734375, -1.264007568359375, -1.2188262939453125, -1.17364501953125, -1.1284637451171875, -1.083282470703125, -1.0381011962890625, -0.992919921875, -0.9477386474609375, -0.902557373046875, -0.8573760986328125, -0.81219482421875, -0.7670135498046875, -0.721832275390625, -0.6766510009765625, -0.6314697265625, -0.5862884521484375, -0.541107177734375, -0.4959259033203125, -0.45074462890625, -0.4055633544921875, -0.360382080078125, -0.3152008056640625, -0.27001953125, -0.2248382568359375, -0.179656982421875, -0.1344757080078125, -0.08929443359375, -0.0441131591796875, 0.001068115234375, 0.0462493896484375, 0.0914306640625, 0.1366119384765625, 0.181793212890625, 0.2269744873046875, 0.27215576171875, 0.3173370361328125, 0.362518310546875, 0.4076995849609375, 0.452880859375, 0.4980621337890625, 0.543243408203125, 0.5884246826171875, 0.63360595703125, 0.6787872314453125, 0.723968505859375, 0.7691497802734375, 0.8143310546875, 0.8595123291015625, 0.904693603515625, 0.9498748779296875, 0.99505615234375, 1.0402374267578125, 1.085418701171875, 1.1305999755859375, 1.17578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 4.0, 7.0, 12.0, 26.0, 36.0, 92.0, 450.0, 3201.0, 140.0, 46.0, 21.0, 9.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33203125, -0.3241539001464844, -0.31627655029296875, -0.3083992004394531, -0.3005218505859375, -0.2926445007324219, -0.28476715087890625, -0.2768898010253906, -0.269012451171875, -0.2611351013183594, -0.25325775146484375, -0.24538040161132812, -0.2375030517578125, -0.22962570190429688, -0.22174835205078125, -0.21387100219726562, -0.20599365234375, -0.19811630249023438, -0.19023895263671875, -0.18236160278320312, -0.1744842529296875, -0.16660690307617188, -0.15872955322265625, -0.15085220336914062, -0.142974853515625, -0.13509750366210938, -0.12722015380859375, -0.11934280395507812, -0.1114654541015625, -0.10358810424804688, -0.09571075439453125, -0.08783340454101562, -0.0799560546875, -0.07207870483398438, -0.06420135498046875, -0.056324005126953125, -0.0484466552734375, -0.040569305419921875, -0.03269195556640625, -0.024814605712890625, -0.016937255859375, -0.009059906005859375, -0.00118255615234375, 0.006694793701171875, 0.0145721435546875, 0.022449493408203125, 0.03032684326171875, 0.038204193115234375, 0.04608154296875, 0.053958892822265625, 0.06183624267578125, 0.06971359252929688, 0.0775909423828125, 0.08546829223632812, 0.09334564208984375, 0.10122299194335938, 0.109100341796875, 0.11697769165039062, 0.12485504150390625, 0.13273239135742188, 0.1406097412109375, 0.14848709106445312, 0.15636444091796875, 0.16424179077148438, 0.172119140625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 8.0, 16.0, 24.0, 52.0, 95.0, 143.0, 205.0, 184.0, 135.0, 69.0, 38.0, 17.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3066192865371704, -1.2592202425003052, -1.2118213176727295, -1.1644222736358643, -1.117023229598999, -1.0696241855621338, -1.022225260734558, -0.9748262166976929, -0.9274272322654724, -0.880028247833252, -0.8326292037963867, -0.7852302193641663, -0.7378312349319458, -0.6904321908950806, -0.6430332064628601, -0.5956342220306396, -0.5482351779937744, -0.500836193561554, -0.4534371495246887, -0.40603816509246826, -0.3586391508579254, -0.31124013662338257, -0.2638411521911621, -0.21644213795661926, -0.16904312372207642, -0.12164411693811417, -0.07424511015415192, -0.026846110820770264, 0.020552903413772583, 0.06795191764831543, 0.11535090208053589, 0.16274991631507874, 0.21014904975891113, 0.257548063993454, 0.3049470782279968, 0.3523460626602173, 0.39974507689476013, 0.447144091129303, 0.49454307556152344, 0.5419421195983887, 0.5893411040306091, 0.6367400884628296, 0.6841391324996948, 0.7315381169319153, 0.7789371013641357, 0.826336145401001, 0.8737351298332214, 0.9211341142654419, 0.9685331583023071, 1.0159322023391724, 1.063331127166748, 1.1107301712036133, 1.1581292152404785, 1.2055282592773438, 1.2529271841049194, 1.3003262281417847, 1.3477251529693604, 1.3951241970062256, 1.4425231218338013, 1.4899221658706665, 1.5373212099075317, 1.5847201347351074, 1.6321191787719727, 1.679518222808838, 1.7269172668457031]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 12.0, 13.0, 13.0, 7.0, 10.0, 15.0, 23.0, 24.0, 25.0, 29.0, 31.0, 35.0, 31.0, 24.0, 43.0, 40.0, 40.0, 39.0, 49.0, 46.0, 44.0, 39.0, 38.0, 28.0, 45.0, 26.0, 35.0, 26.0, 25.0, 25.0, 27.0, 13.0, 20.0, 14.0, 14.0, 7.0, 9.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6180504560470581, -0.5989565849304199, -0.5798627138137817, -0.5607688426971436, -0.5416749715805054, -0.5225811004638672, -0.503487229347229, -0.48439332842826843, -0.46529945731163025, -0.44620558619499207, -0.4271117150783539, -0.4080178439617157, -0.3889239430427551, -0.36983007192611694, -0.35073620080947876, -0.3316423296928406, -0.3125484585762024, -0.2934545874595642, -0.274360716342926, -0.25526684522628784, -0.23617295920848846, -0.21707908809185028, -0.1979852020740509, -0.17889133095741272, -0.15979745984077454, -0.14070358872413635, -0.12160971015691757, -0.10251583158969879, -0.08342196047306061, -0.06432808935642242, -0.045234210789203644, -0.026140332221984863, -0.007046401500701904, 0.012047473341226578, 0.03114134818315506, 0.05023522302508354, 0.06932909786701202, 0.08842296898365021, 0.10751684755086899, 0.12661072611808777, 0.14570459723472595, 0.16479846835136414, 0.18389233946800232, 0.2029862254858017, 0.22208009660243988, 0.24117396771907806, 0.26026785373687744, 0.2793617248535156, 0.2984555959701538, 0.317549467086792, 0.3366433382034302, 0.35573720932006836, 0.37483108043670654, 0.3939249515533447, 0.4130188524723053, 0.4321127235889435, 0.45120659470558167, 0.47030046582221985, 0.48939433693885803, 0.5084882378578186, 0.5275821089744568, 0.546675980091095, 0.5657698512077332, 0.5848637223243713, 0.6039575934410095]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 18.0, 13.0, 19.0, 41.0, 56.0, 80.0, 161.0, 360.0, 629.0, 1598.0, 5181.0, 27970.0, 337749.0, 614470.0, 48735.0, 7682.0, 2183.0, 779.0, 385.0, 171.0, 115.0, 54.0, 43.0, 13.0, 16.0, 6.0, 8.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8076171875, -0.7852630615234375, -0.762908935546875, -0.7405548095703125, -0.71820068359375, -0.6958465576171875, -0.673492431640625, -0.6511383056640625, -0.6287841796875, -0.6064300537109375, -0.584075927734375, -0.5617218017578125, -0.53936767578125, -0.5170135498046875, -0.494659423828125, -0.4723052978515625, -0.449951171875, -0.4275970458984375, -0.405242919921875, -0.3828887939453125, -0.36053466796875, -0.3381805419921875, -0.315826416015625, -0.2934722900390625, -0.2711181640625, -0.2487640380859375, -0.226409912109375, -0.2040557861328125, -0.18170166015625, -0.1593475341796875, -0.136993408203125, -0.1146392822265625, -0.09228515625, -0.0699310302734375, -0.047576904296875, -0.0252227783203125, -0.00286865234375, 0.0194854736328125, 0.041839599609375, 0.0641937255859375, 0.0865478515625, 0.1089019775390625, 0.131256103515625, 0.1536102294921875, 0.17596435546875, 0.1983184814453125, 0.220672607421875, 0.2430267333984375, 0.265380859375, 0.2877349853515625, 0.310089111328125, 0.3324432373046875, 0.35479736328125, 0.3771514892578125, 0.399505615234375, 0.4218597412109375, 0.4442138671875, 0.4665679931640625, 0.488922119140625, 0.5112762451171875, 0.53363037109375, 0.5559844970703125, 0.578338623046875, 0.6006927490234375, 0.623046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 7.0, 11.0, 16.0, 22.0, 22.0, 20.0, 33.0, 41.0, 39.0, 62.0, 48.0, 58.0, 58.0, 62.0, 57.0, 57.0, 52.0, 45.0, 45.0, 46.0, 36.0, 31.0, 27.0, 17.0, 17.0, 12.0, 11.0, 4.0, 9.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.169921875, -0.16457176208496094, -0.15922164916992188, -0.1538715362548828, -0.14852142333984375, -0.1431713104248047, -0.13782119750976562, -0.13247108459472656, -0.1271209716796875, -0.12177085876464844, -0.11642074584960938, -0.11107063293457031, -0.10572052001953125, -0.10037040710449219, -0.09502029418945312, -0.08967018127441406, -0.084320068359375, -0.07896995544433594, -0.07361984252929688, -0.06826972961425781, -0.06291961669921875, -0.05756950378417969, -0.052219390869140625, -0.04686927795410156, -0.0415191650390625, -0.03616905212402344, -0.030818939208984375, -0.025468826293945312, -0.02011871337890625, -0.014768600463867188, -0.009418487548828125, -0.0040683746337890625, 0.00128173828125, 0.0066318511962890625, 0.011981964111328125, 0.017332077026367188, 0.02268218994140625, 0.028032302856445312, 0.033382415771484375, 0.03873252868652344, 0.0440826416015625, 0.04943275451660156, 0.054782867431640625, 0.06013298034667969, 0.06548309326171875, 0.07083320617675781, 0.07618331909179688, 0.08153343200683594, 0.086883544921875, 0.09223365783691406, 0.09758377075195312, 0.10293388366699219, 0.10828399658203125, 0.11363410949707031, 0.11898422241210938, 0.12433433532714844, 0.1296844482421875, 0.13503456115722656, 0.14038467407226562, 0.1457347869873047, 0.15108489990234375, 0.1564350128173828, 0.16178512573242188, 0.16713523864746094, 0.1724853515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 6.0, 9.0, 9.0, 23.0, 32.0, 30.0, 67.0, 86.0, 150.0, 283.0, 695.0, 2126.0, 10374.0, 305979.0, 707410.0, 16910.0, 2726.0, 857.0, 332.0, 174.0, 105.0, 58.0, 37.0, 16.0, 17.0, 7.0, 8.0, 10.0, 6.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.416015625, -1.3831634521484375, -1.350311279296875, -1.3174591064453125, -1.28460693359375, -1.2517547607421875, -1.218902587890625, -1.1860504150390625, -1.1531982421875, -1.1203460693359375, -1.087493896484375, -1.0546417236328125, -1.02178955078125, -0.9889373779296875, -0.956085205078125, -0.9232330322265625, -0.890380859375, -0.8575286865234375, -0.824676513671875, -0.7918243408203125, -0.75897216796875, -0.7261199951171875, -0.693267822265625, -0.6604156494140625, -0.6275634765625, -0.5947113037109375, -0.561859130859375, -0.5290069580078125, -0.49615478515625, -0.4633026123046875, -0.430450439453125, -0.3975982666015625, -0.36474609375, -0.3318939208984375, -0.299041748046875, -0.2661895751953125, -0.23333740234375, -0.2004852294921875, -0.167633056640625, -0.1347808837890625, -0.1019287109375, -0.0690765380859375, -0.036224365234375, -0.0033721923828125, 0.02947998046875, 0.0623321533203125, 0.095184326171875, 0.1280364990234375, 0.160888671875, 0.1937408447265625, 0.226593017578125, 0.2594451904296875, 0.29229736328125, 0.3251495361328125, 0.358001708984375, 0.3908538818359375, 0.4237060546875, 0.4565582275390625, 0.489410400390625, 0.5222625732421875, 0.55511474609375, 0.5879669189453125, 0.620819091796875, 0.6536712646484375, 0.6865234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 17.0, 13.0, 13.0, 30.0, 29.0, 27.0, 35.0, 58.0, 57.0, 68.0, 65.0, 66.0, 77.0, 65.0, 62.0, 44.0, 40.0, 51.0, 36.0, 27.0, 30.0, 20.0, 23.0, 13.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94384765625, -0.9093399047851562, -0.8748321533203125, -0.8403244018554688, -0.805816650390625, -0.7713088989257812, -0.7368011474609375, -0.7022933959960938, -0.66778564453125, -0.6332778930664062, -0.5987701416015625, -0.5642623901367188, -0.529754638671875, -0.49524688720703125, -0.4607391357421875, -0.42623138427734375, -0.3917236328125, -0.35721588134765625, -0.3227081298828125, -0.28820037841796875, -0.253692626953125, -0.21918487548828125, -0.1846771240234375, -0.15016937255859375, -0.11566162109375, -0.08115386962890625, -0.0466461181640625, -0.01213836669921875, 0.022369384765625, 0.05687713623046875, 0.0913848876953125, 0.12589263916015625, 0.160400390625, 0.19490814208984375, 0.2294158935546875, 0.26392364501953125, 0.298431396484375, 0.33293914794921875, 0.3674468994140625, 0.40195465087890625, 0.43646240234375, 0.47097015380859375, 0.5054779052734375, 0.5399856567382812, 0.574493408203125, 0.6090011596679688, 0.6435089111328125, 0.6780166625976562, 0.7125244140625, 0.7470321655273438, 0.7815399169921875, 0.8160476684570312, 0.850555419921875, 0.8850631713867188, 0.9195709228515625, 0.9540786743164062, 0.98858642578125, 1.0230941772460938, 1.0576019287109375, 1.0921096801757812, 1.126617431640625, 1.1611251831054688, 1.1956329345703125, 1.2301406860351562, 1.2646484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 10.0, 16.0, 28.0, 100.0, 223.0, 785.0, 5090.0, 918788.0, 120327.0, 2382.0, 503.0, 152.0, 73.0, 35.0, 11.0, 15.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08203125, -1.041717529296875, -1.00140380859375, -0.961090087890625, -0.9207763671875, -0.880462646484375, -0.84014892578125, -0.799835205078125, -0.759521484375, -0.719207763671875, -0.67889404296875, -0.638580322265625, -0.5982666015625, -0.557952880859375, -0.51763916015625, -0.477325439453125, -0.43701171875, -0.396697998046875, -0.35638427734375, -0.316070556640625, -0.2757568359375, -0.235443115234375, -0.19512939453125, -0.154815673828125, -0.114501953125, -0.074188232421875, -0.03387451171875, 0.006439208984375, 0.0467529296875, 0.087066650390625, 0.12738037109375, 0.167694091796875, 0.2080078125, 0.248321533203125, 0.28863525390625, 0.328948974609375, 0.3692626953125, 0.409576416015625, 0.44989013671875, 0.490203857421875, 0.530517578125, 0.570831298828125, 0.61114501953125, 0.651458740234375, 0.6917724609375, 0.732086181640625, 0.77239990234375, 0.812713623046875, 0.85302734375, 0.893341064453125, 0.93365478515625, 0.973968505859375, 1.0142822265625, 1.054595947265625, 1.09490966796875, 1.135223388671875, 1.175537109375, 1.215850830078125, 1.25616455078125, 1.296478271484375, 1.3367919921875, 1.377105712890625, 1.41741943359375, 1.457733154296875, 1.498046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 10.0, 15.0, 15.0, 19.0, 30.0, 30.0, 45.0, 63.0, 81.0, 111.0, 119.0, 104.0, 75.0, 81.0, 53.0, 38.0, 32.0, 24.0, 14.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00012874603271484375, -0.00012563727796077728, -0.00012252852320671082, -0.00011941976845264435, -0.00011631101369857788, -0.00011320225894451141, -0.00011009350419044495, -0.00010698474943637848, -0.00010387599468231201, -0.00010076723992824554, -9.765848517417908e-05, -9.454973042011261e-05, -9.144097566604614e-05, -8.833222091197968e-05, -8.522346615791321e-05, -8.211471140384674e-05, -7.900595664978027e-05, -7.58972018957138e-05, -7.278844714164734e-05, -6.967969238758087e-05, -6.65709376335144e-05, -6.346218287944794e-05, -6.035342812538147e-05, -5.7244673371315e-05, -5.4135918617248535e-05, -5.102716386318207e-05, -4.79184091091156e-05, -4.480965435504913e-05, -4.1700899600982666e-05, -3.85921448469162e-05, -3.548339009284973e-05, -3.2374635338783264e-05, -2.9265880584716797e-05, -2.615712583065033e-05, -2.3048371076583862e-05, -1.9939616322517395e-05, -1.6830861568450928e-05, -1.372210681438446e-05, -1.0613352060317993e-05, -7.504597306251526e-06, -4.395842552185059e-06, -1.2870877981185913e-06, 1.821666955947876e-06, 4.930421710014343e-06, 8.03917646408081e-06, 1.1147931218147278e-05, 1.4256685972213745e-05, 1.7365440726280212e-05, 2.047419548034668e-05, 2.3582950234413147e-05, 2.6691704988479614e-05, 2.980045974254608e-05, 3.290921449661255e-05, 3.6017969250679016e-05, 3.9126724004745483e-05, 4.223547875881195e-05, 4.534423351287842e-05, 4.8452988266944885e-05, 5.156174302101135e-05, 5.467049777507782e-05, 5.777925252914429e-05, 6.0888007283210754e-05, 6.399676203727722e-05, 6.710551679134369e-05, 7.021427154541016e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 4.0, 4.0, 13.0, 22.0, 47.0, 95.0, 174.0, 470.0, 1713.0, 14816.0, 907970.0, 117352.0, 4384.0, 877.0, 331.0, 116.0, 78.0, 38.0, 21.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1337890625, -1.1059722900390625, -1.078155517578125, -1.0503387451171875, -1.02252197265625, -0.9947052001953125, -0.966888427734375, -0.9390716552734375, -0.9112548828125, -0.8834381103515625, -0.855621337890625, -0.8278045654296875, -0.79998779296875, -0.7721710205078125, -0.744354248046875, -0.7165374755859375, -0.688720703125, -0.6609039306640625, -0.633087158203125, -0.6052703857421875, -0.57745361328125, -0.5496368408203125, -0.521820068359375, -0.4940032958984375, -0.4661865234375, -0.4383697509765625, -0.410552978515625, -0.3827362060546875, -0.35491943359375, -0.3271026611328125, -0.299285888671875, -0.2714691162109375, -0.24365234375, -0.2158355712890625, -0.188018798828125, -0.1602020263671875, -0.13238525390625, -0.1045684814453125, -0.076751708984375, -0.0489349365234375, -0.0211181640625, 0.0066986083984375, 0.034515380859375, 0.0623321533203125, 0.09014892578125, 0.1179656982421875, 0.145782470703125, 0.1735992431640625, 0.201416015625, 0.2292327880859375, 0.257049560546875, 0.2848663330078125, 0.31268310546875, 0.3404998779296875, 0.368316650390625, 0.3961334228515625, 0.4239501953125, 0.4517669677734375, 0.479583740234375, 0.5074005126953125, 0.53521728515625, 0.5630340576171875, 0.590850830078125, 0.6186676025390625, 0.646484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 8.0, 19.0, 29.0, 28.0, 48.0, 90.0, 132.0, 156.0, 169.0, 102.0, 71.0, 41.0, 44.0, 21.0, 16.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6992645263671875, -0.680755615234375, -0.6622467041015625, -0.64373779296875, -0.6252288818359375, -0.606719970703125, -0.5882110595703125, -0.5697021484375, -0.5511932373046875, -0.532684326171875, -0.5141754150390625, -0.49566650390625, -0.4771575927734375, -0.458648681640625, -0.4401397705078125, -0.421630859375, -0.4031219482421875, -0.384613037109375, -0.3661041259765625, -0.34759521484375, -0.3290863037109375, -0.310577392578125, -0.2920684814453125, -0.2735595703125, -0.2550506591796875, -0.236541748046875, -0.2180328369140625, -0.19952392578125, -0.1810150146484375, -0.162506103515625, -0.1439971923828125, -0.12548828125, -0.1069793701171875, -0.088470458984375, -0.0699615478515625, -0.05145263671875, -0.0329437255859375, -0.014434814453125, 0.0040740966796875, 0.0225830078125, 0.0410919189453125, 0.059600830078125, 0.0781097412109375, 0.09661865234375, 0.1151275634765625, 0.133636474609375, 0.1521453857421875, 0.170654296875, 0.1891632080078125, 0.207672119140625, 0.2261810302734375, 0.24468994140625, 0.2631988525390625, 0.281707763671875, 0.3002166748046875, 0.3187255859375, 0.3372344970703125, 0.355743408203125, 0.3742523193359375, 0.39276123046875, 0.4112701416015625, 0.429779052734375, 0.4482879638671875, 0.466796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 9.0, 11.0, 63.0, 296.0, 433.0, 162.0, 26.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.198760986328125, -26.678014755249023, -26.157270431518555, -25.636524200439453, -25.115779876708984, -24.595033645629883, -24.07428741455078, -23.553543090820312, -23.03279685974121, -22.51205062866211, -21.99130630493164, -21.47056007385254, -20.94981575012207, -20.42906951904297, -19.9083251953125, -19.3875789642334, -18.866832733154297, -18.346086502075195, -17.825342178344727, -17.304595947265625, -16.783851623535156, -16.263105392456055, -15.74236011505127, -15.221614837646484, -14.700870513916016, -14.18012523651123, -13.659379959106445, -13.138633728027344, -12.617888450622559, -12.097143173217773, -11.576397895812988, -11.055652618408203, -10.534905433654785, -10.01416015625, -9.493414878845215, -8.97266960144043, -8.451923370361328, -7.931178092956543, -7.410432815551758, -6.889687538146973, -6.368941783905029, -5.848196506500244, -5.327450752258301, -4.806705474853516, -4.2859601974487305, -3.765214443206787, -3.244469165802002, -2.7237236499786377, -2.2029781341552734, -1.6822326183319092, -1.1614872217178345, -0.6407418251037598, -0.11999630928039551, 0.40074920654296875, 0.9214944839477539, 1.4422399997711182, 1.9629855155944824, 2.4837310314178467, 3.004476547241211, 3.525221824645996, 4.045967102050781, 4.566712856292725, 5.08745813369751, 5.608203887939453, 6.128949165344238]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 2.0, 12.0, 6.0, 10.0, 2.0, 13.0, 11.0, 14.0, 17.0, 17.0, 17.0, 27.0, 35.0, 27.0, 31.0, 24.0, 50.0, 32.0, 42.0, 49.0, 40.0, 46.0, 55.0, 37.0, 39.0, 54.0, 41.0, 30.0, 28.0, 28.0, 32.0, 20.0, 21.0, 17.0, 12.0, 17.0, 8.0, 9.0, 5.0, 6.0, 3.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.625253915786743, -3.512847900390625, -3.400442123413086, -3.288036346435547, -3.1756303310394287, -3.0632243156433105, -2.9508185386657715, -2.8384127616882324, -2.7260067462921143, -2.613600730895996, -2.501194953918457, -2.388789176940918, -2.2763831615448, -2.1639771461486816, -2.0515713691711426, -1.939165472984314, -1.8267595767974854, -1.7143536806106567, -1.6019477844238281, -1.4895418882369995, -1.377135992050171, -1.2647300958633423, -1.1523241996765137, -1.039918303489685, -0.9275124073028564, -0.8151065111160278, -0.7027006149291992, -0.5902947187423706, -0.477888822555542, -0.3654829263687134, -0.25307703018188477, -0.14067113399505615, -0.02826523780822754, 0.08414065837860107, 0.1965465545654297, 0.3089524507522583, 0.4213583469390869, 0.5337642431259155, 0.6461701393127441, 0.7585760354995728, 0.8709819316864014, 0.98338782787323, 1.0957937240600586, 1.2081996202468872, 1.3206055164337158, 1.4330114126205444, 1.545417308807373, 1.6578232049942017, 1.7702291011810303, 1.8826349973678589, 1.9950408935546875, 2.1074466705322266, 2.2198526859283447, 2.332258701324463, 2.444664478302002, 2.557070255279541, 2.669476270675659, 2.7818822860717773, 2.8942880630493164, 3.0066938400268555, 3.1190998554229736, 3.231505870819092, 3.343911647796631, 3.45631742477417, 3.568723440170288]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 5.0, 2.0, 11.0, 4.0, 8.0, 15.0, 18.0, 34.0, 45.0, 77.0, 106.0, 193.0, 324.0, 561.0, 1241.0, 3367.0, 15033.0, 318368.0, 3823686.0, 23414.0, 4701.0, 1561.0, 662.0, 323.0, 186.0, 117.0, 78.0, 49.0, 33.0, 22.0, 16.0, 13.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.1328125, -1.105255126953125, -1.07769775390625, -1.050140380859375, -1.0225830078125, -0.995025634765625, -0.96746826171875, -0.939910888671875, -0.912353515625, -0.884796142578125, -0.85723876953125, -0.829681396484375, -0.8021240234375, -0.774566650390625, -0.74700927734375, -0.719451904296875, -0.69189453125, -0.664337158203125, -0.63677978515625, -0.609222412109375, -0.5816650390625, -0.554107666015625, -0.52655029296875, -0.498992919921875, -0.471435546875, -0.443878173828125, -0.41632080078125, -0.388763427734375, -0.3612060546875, -0.333648681640625, -0.30609130859375, -0.278533935546875, -0.2509765625, -0.223419189453125, -0.19586181640625, -0.168304443359375, -0.1407470703125, -0.113189697265625, -0.08563232421875, -0.058074951171875, -0.030517578125, -0.002960205078125, 0.02459716796875, 0.052154541015625, 0.0797119140625, 0.107269287109375, 0.13482666015625, 0.162384033203125, 0.18994140625, 0.217498779296875, 0.24505615234375, 0.272613525390625, 0.3001708984375, 0.327728271484375, 0.35528564453125, 0.382843017578125, 0.410400390625, 0.437957763671875, 0.46551513671875, 0.493072509765625, 0.5206298828125, 0.548187255859375, 0.57574462890625, 0.603302001953125, 0.630859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 3.0, 8.0, 8.0, 12.0, 9.0, 19.0, 14.0, 35.0, 24.0, 31.0, 46.0, 62.0, 35.0, 56.0, 61.0, 66.0, 76.0, 64.0, 78.0, 40.0, 35.0, 50.0, 37.0, 29.0, 30.0, 18.0, 12.0, 9.0, 5.0, 4.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.20751953125, -0.2017230987548828, -0.19592666625976562, -0.19013023376464844, -0.18433380126953125, -0.17853736877441406, -0.17274093627929688, -0.1669445037841797, -0.1611480712890625, -0.1553516387939453, -0.14955520629882812, -0.14375877380371094, -0.13796234130859375, -0.13216590881347656, -0.12636947631835938, -0.12057304382324219, -0.114776611328125, -0.10898017883300781, -0.10318374633789062, -0.09738731384277344, -0.09159088134765625, -0.08579444885253906, -0.07999801635742188, -0.07420158386230469, -0.0684051513671875, -0.06260871887207031, -0.056812286376953125, -0.05101585388183594, -0.04521942138671875, -0.03942298889160156, -0.033626556396484375, -0.027830123901367188, -0.02203369140625, -0.016237258911132812, -0.010440826416015625, -0.0046443939208984375, 0.00115203857421875, 0.0069484710693359375, 0.012744903564453125, 0.018541336059570312, 0.0243377685546875, 0.030134201049804688, 0.035930633544921875, 0.04172706604003906, 0.04752349853515625, 0.05331993103027344, 0.059116363525390625, 0.06491279602050781, 0.070709228515625, 0.07650566101074219, 0.08230209350585938, 0.08809852600097656, 0.09389495849609375, 0.09969139099121094, 0.10548782348632812, 0.11128425598144531, 0.1170806884765625, 0.12287712097167969, 0.12867355346679688, 0.13446998596191406, 0.14026641845703125, 0.14606285095214844, 0.15185928344726562, 0.1576557159423828, 0.1634521484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 18.0, 8.0, 15.0, 34.0, 41.0, 79.0, 114.0, 250.0, 657.0, 2326.0, 10367.0, 173912.0, 3974481.0, 25913.0, 4043.0, 1109.0, 422.0, 171.0, 94.0, 59.0, 45.0, 36.0, 15.0, 13.0, 11.0, 11.0, 2.0, 9.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.634765625, -1.589630126953125, -1.54449462890625, -1.499359130859375, -1.4542236328125, -1.409088134765625, -1.36395263671875, -1.318817138671875, -1.273681640625, -1.228546142578125, -1.18341064453125, -1.138275146484375, -1.0931396484375, -1.048004150390625, -1.00286865234375, -0.957733154296875, -0.91259765625, -0.867462158203125, -0.82232666015625, -0.777191162109375, -0.7320556640625, -0.686920166015625, -0.64178466796875, -0.596649169921875, -0.551513671875, -0.506378173828125, -0.46124267578125, -0.416107177734375, -0.3709716796875, -0.325836181640625, -0.28070068359375, -0.235565185546875, -0.1904296875, -0.145294189453125, -0.10015869140625, -0.055023193359375, -0.0098876953125, 0.035247802734375, 0.08038330078125, 0.125518798828125, 0.170654296875, 0.215789794921875, 0.26092529296875, 0.306060791015625, 0.3511962890625, 0.396331787109375, 0.44146728515625, 0.486602783203125, 0.53173828125, 0.576873779296875, 0.62200927734375, 0.667144775390625, 0.7122802734375, 0.757415771484375, 0.80255126953125, 0.847686767578125, 0.892822265625, 0.937957763671875, 0.98309326171875, 1.028228759765625, 1.0733642578125, 1.118499755859375, 1.16363525390625, 1.208770751953125, 1.25390625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 8.0, 25.0, 34.0, 46.0, 115.0, 353.0, 2960.0, 282.0, 93.0, 61.0, 30.0, 14.0, 17.0, 7.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 3.0], "bins": [-0.638671875, -0.6257495880126953, -0.6128273010253906, -0.5999050140380859, -0.5869827270507812, -0.5740604400634766, -0.5611381530761719, -0.5482158660888672, -0.5352935791015625, -0.5223712921142578, -0.5094490051269531, -0.49652671813964844, -0.48360443115234375, -0.47068214416503906, -0.4577598571777344, -0.4448375701904297, -0.431915283203125, -0.4189929962158203, -0.4060707092285156, -0.39314842224121094, -0.38022613525390625, -0.36730384826660156, -0.3543815612792969, -0.3414592742919922, -0.3285369873046875, -0.3156147003173828, -0.3026924133300781, -0.28977012634277344, -0.27684783935546875, -0.26392555236816406, -0.2510032653808594, -0.2380809783935547, -0.22515869140625, -0.2122364044189453, -0.19931411743164062, -0.18639183044433594, -0.17346954345703125, -0.16054725646972656, -0.14762496948242188, -0.1347026824951172, -0.1217803955078125, -0.10885810852050781, -0.09593582153320312, -0.08301353454589844, -0.07009124755859375, -0.05716896057128906, -0.044246673583984375, -0.03132438659667969, -0.018402099609375, -0.0054798126220703125, 0.007442474365234375, 0.020364761352539062, 0.03328704833984375, 0.04620933532714844, 0.059131622314453125, 0.07205390930175781, 0.0849761962890625, 0.09789848327636719, 0.11082077026367188, 0.12374305725097656, 0.13666534423828125, 0.14958763122558594, 0.16250991821289062, 0.1754322052001953, 0.1883544921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 7.0, 13.0, 12.0, 16.0, 37.0, 45.0, 85.0, 147.0, 169.0, 155.0, 128.0, 76.0, 46.0, 26.0, 15.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.813605785369873, -1.7510530948638916, -1.6885004043579102, -1.6259477138519287, -1.5633951425552368, -1.5008424520492554, -1.438289761543274, -1.3757370710372925, -1.3131844997406006, -1.2506318092346191, -1.1880791187286377, -1.1255264282226562, -1.0629738569259644, -1.000421166419983, -0.9378684759140015, -0.87531578540802, -0.8127630949020386, -0.7502104043960571, -0.6876577734947205, -0.625105082988739, -0.5625524520874023, -0.4999997615814209, -0.43744707107543945, -0.3748944103717804, -0.31234174966812134, -0.24978908896446228, -0.18723641335964203, -0.12468373775482178, -0.06213107705116272, 0.0004215836524963379, 0.06297427415847778, 0.12552693486213684, 0.1880795955657959, 0.25063225626945496, 0.313184916973114, 0.37573760747909546, 0.4382902681827545, 0.5008429288864136, 0.563395619392395, 0.6259483098983765, 0.6885009407997131, 0.7510536313056946, 0.8136062622070312, 0.8761589527130127, 0.9387116432189941, 1.0012643337249756, 1.063817024230957, 1.126369595527649, 1.1889222860336304, 1.2514749765396118, 1.3140276670455933, 1.3765802383422852, 1.4391329288482666, 1.501685619354248, 1.5642383098602295, 1.626791000366211, 1.6893436908721924, 1.7518963813781738, 1.8144490718841553, 1.8770017623901367, 1.9395543336868286, 2.0021071434020996, 2.064659595489502, 2.1272122859954834, 2.189764976501465]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 2.0, 11.0, 5.0, 8.0, 13.0, 17.0, 17.0, 17.0, 30.0, 24.0, 28.0, 37.0, 45.0, 48.0, 49.0, 69.0, 62.0, 52.0, 57.0, 54.0, 46.0, 57.0, 34.0, 38.0, 34.0, 26.0, 25.0, 21.0, 22.0, 11.0, 12.0, 8.0, 8.0, 2.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9570510983467102, -0.918036162853241, -0.8790212273597717, -0.8400062918663025, -0.8009912967681885, -0.7619763612747192, -0.72296142578125, -0.6839464902877808, -0.6449315547943115, -0.6059166193008423, -0.566901683807373, -0.5278867483139038, -0.4888717830181122, -0.44985684752464294, -0.4108418822288513, -0.3718269467353821, -0.33281201124191284, -0.2937970757484436, -0.25478214025497437, -0.21576717495918274, -0.1767522394657135, -0.13773730397224426, -0.09872235357761383, -0.0597074031829834, -0.02069246768951416, 0.018322475254535675, 0.05733741819858551, 0.09635236114263535, 0.13536730408668518, 0.17438223958015442, 0.21339718997478485, 0.2524121403694153, 0.2914271354675293, 0.33044207096099854, 0.3694570064544678, 0.4084719717502594, 0.44748690724372864, 0.4865018427371979, 0.5255168080329895, 0.5645317435264587, 0.603546679019928, 0.6425616145133972, 0.6815765500068665, 0.7205914855003357, 0.7596064805984497, 0.798621416091919, 0.8376363515853882, 0.8766512870788574, 0.9156662225723267, 0.9546811580657959, 0.9936960935592651, 1.0327110290527344, 1.0717259645462036, 1.1107409000396729, 1.149755835533142, 1.1887707710266113, 1.2277858257293701, 1.2668007612228394, 1.3058156967163086, 1.3448306322097778, 1.383845567703247, 1.4228605031967163, 1.4618754386901855, 1.5008904933929443, 1.539905309677124]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 9.0, 7.0, 13.0, 20.0, 33.0, 78.0, 109.0, 276.0, 518.0, 1302.0, 3795.0, 14472.0, 75954.0, 488421.0, 388131.0, 58453.0, 11688.0, 3278.0, 1041.0, 470.0, 224.0, 118.0, 53.0, 35.0, 14.0, 17.0, 6.0, 8.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5131072998046875, -0.492523193359375, -0.4719390869140625, -0.45135498046875, -0.4307708740234375, -0.410186767578125, -0.3896026611328125, -0.3690185546875, -0.3484344482421875, -0.327850341796875, -0.3072662353515625, -0.28668212890625, -0.2660980224609375, -0.245513916015625, -0.2249298095703125, -0.204345703125, -0.1837615966796875, -0.163177490234375, -0.1425933837890625, -0.12200927734375, -0.1014251708984375, -0.080841064453125, -0.0602569580078125, -0.0396728515625, -0.0190887451171875, 0.001495361328125, 0.0220794677734375, 0.04266357421875, 0.0632476806640625, 0.083831787109375, 0.1044158935546875, 0.125, 0.1455841064453125, 0.166168212890625, 0.1867523193359375, 0.20733642578125, 0.2279205322265625, 0.248504638671875, 0.2690887451171875, 0.2896728515625, 0.3102569580078125, 0.330841064453125, 0.3514251708984375, 0.37200927734375, 0.3925933837890625, 0.413177490234375, 0.4337615966796875, 0.454345703125, 0.4749298095703125, 0.495513916015625, 0.5160980224609375, 0.53668212890625, 0.5572662353515625, 0.577850341796875, 0.5984344482421875, 0.6190185546875, 0.6396026611328125, 0.660186767578125, 0.6807708740234375, 0.70135498046875, 0.7219390869140625, 0.742523193359375, 0.7631072998046875, 0.78369140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 10.0, 5.0, 6.0, 9.0, 12.0, 14.0, 23.0, 20.0, 23.0, 34.0, 48.0, 47.0, 53.0, 65.0, 60.0, 60.0, 66.0, 79.0, 54.0, 42.0, 38.0, 40.0, 25.0, 40.0, 35.0, 32.0, 16.0, 12.0, 12.0, 5.0, 5.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.231201171875, -0.2251148223876953, -0.21902847290039062, -0.21294212341308594, -0.20685577392578125, -0.20076942443847656, -0.19468307495117188, -0.1885967254638672, -0.1825103759765625, -0.1764240264892578, -0.17033767700195312, -0.16425132751464844, -0.15816497802734375, -0.15207862854003906, -0.14599227905273438, -0.1399059295654297, -0.133819580078125, -0.1277332305908203, -0.12164688110351562, -0.11556053161621094, -0.10947418212890625, -0.10338783264160156, -0.09730148315429688, -0.09121513366699219, -0.0851287841796875, -0.07904243469238281, -0.07295608520507812, -0.06686973571777344, -0.06078338623046875, -0.05469703674316406, -0.048610687255859375, -0.04252433776855469, -0.03643798828125, -0.030351638793945312, -0.024265289306640625, -0.018178939819335938, -0.01209259033203125, -0.0060062408447265625, 8.0108642578125e-05, 0.0061664581298828125, 0.0122528076171875, 0.018339157104492188, 0.024425506591796875, 0.030511856079101562, 0.03659820556640625, 0.04268455505371094, 0.048770904541015625, 0.05485725402832031, 0.060943603515625, 0.06702995300292969, 0.07311630249023438, 0.07920265197753906, 0.08528900146484375, 0.09137535095214844, 0.09746170043945312, 0.10354804992675781, 0.1096343994140625, 0.11572074890136719, 0.12180709838867188, 0.12789344787597656, 0.13397979736328125, 0.14006614685058594, 0.14615249633789062, 0.1522388458251953, 0.1583251953125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 11.0, 14.0, 18.0, 18.0, 25.0, 43.0, 38.0, 72.0, 107.0, 155.0, 217.0, 392.0, 678.0, 1470.0, 4229.0, 22178.0, 301824.0, 663196.0, 43415.0, 6399.0, 1936.0, 863.0, 429.0, 267.0, 160.0, 126.0, 81.0, 41.0, 39.0, 24.0, 18.0, 22.0, 6.0, 10.0, 6.0, 8.0, 2.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.96484375, -0.9365921020507812, -0.9083404541015625, -0.8800888061523438, -0.851837158203125, -0.8235855102539062, -0.7953338623046875, -0.7670822143554688, -0.73883056640625, -0.7105789184570312, -0.6823272705078125, -0.6540756225585938, -0.625823974609375, -0.5975723266601562, -0.5693206787109375, -0.5410690307617188, -0.5128173828125, -0.48456573486328125, -0.4563140869140625, -0.42806243896484375, -0.399810791015625, -0.37155914306640625, -0.3433074951171875, -0.31505584716796875, -0.28680419921875, -0.25855255126953125, -0.2303009033203125, -0.20204925537109375, -0.173797607421875, -0.14554595947265625, -0.1172943115234375, -0.08904266357421875, -0.060791015625, -0.03253936767578125, -0.0042877197265625, 0.02396392822265625, 0.052215576171875, 0.08046722412109375, 0.1087188720703125, 0.13697052001953125, 0.16522216796875, 0.19347381591796875, 0.2217254638671875, 0.24997711181640625, 0.278228759765625, 0.30648040771484375, 0.3347320556640625, 0.36298370361328125, 0.3912353515625, 0.41948699951171875, 0.4477386474609375, 0.47599029541015625, 0.504241943359375, 0.5324935913085938, 0.5607452392578125, 0.5889968872070312, 0.61724853515625, 0.6455001831054688, 0.6737518310546875, 0.7020034790039062, 0.730255126953125, 0.7585067749023438, 0.7867584228515625, 0.8150100708007812, 0.84326171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 4.0, 4.0, 9.0, 6.0, 12.0, 8.0, 20.0, 17.0, 17.0, 28.0, 30.0, 29.0, 40.0, 42.0, 35.0, 60.0, 60.0, 60.0, 67.0, 56.0, 61.0, 60.0, 42.0, 35.0, 19.0, 42.0, 28.0, 25.0, 17.0, 8.0, 12.0, 9.0, 10.0, 6.0, 11.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.1005859375, -1.0703506469726562, -1.0401153564453125, -1.0098800659179688, -0.979644775390625, -0.9494094848632812, -0.9191741943359375, -0.8889389038085938, -0.85870361328125, -0.8284683227539062, -0.7982330322265625, -0.7679977416992188, -0.737762451171875, -0.7075271606445312, -0.6772918701171875, -0.6470565795898438, -0.6168212890625, -0.5865859985351562, -0.5563507080078125, -0.5261154174804688, -0.495880126953125, -0.46564483642578125, -0.4354095458984375, -0.40517425537109375, -0.37493896484375, -0.34470367431640625, -0.3144683837890625, -0.28423309326171875, -0.253997802734375, -0.22376251220703125, -0.1935272216796875, -0.16329193115234375, -0.133056640625, -0.10282135009765625, -0.0725860595703125, -0.04235076904296875, -0.012115478515625, 0.01811981201171875, 0.0483551025390625, 0.07859039306640625, 0.10882568359375, 0.13906097412109375, 0.1692962646484375, 0.19953155517578125, 0.229766845703125, 0.26000213623046875, 0.2902374267578125, 0.32047271728515625, 0.3507080078125, 0.38094329833984375, 0.4111785888671875, 0.44141387939453125, 0.471649169921875, 0.5018844604492188, 0.5321197509765625, 0.5623550415039062, 0.59259033203125, 0.6228256225585938, 0.6530609130859375, 0.6832962036132812, 0.713531494140625, 0.7437667846679688, 0.7740020751953125, 0.8042373657226562, 0.83447265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 14.0, 20.0, 39.0, 61.0, 143.0, 235.0, 701.0, 2586.0, 32533.0, 972247.0, 35882.0, 2757.0, 727.0, 278.0, 148.0, 66.0, 40.0, 24.0, 12.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.88330078125, -0.858428955078125, -0.83355712890625, -0.808685302734375, -0.7838134765625, -0.758941650390625, -0.73406982421875, -0.709197998046875, -0.684326171875, -0.659454345703125, -0.63458251953125, -0.609710693359375, -0.5848388671875, -0.559967041015625, -0.53509521484375, -0.510223388671875, -0.4853515625, -0.460479736328125, -0.43560791015625, -0.410736083984375, -0.3858642578125, -0.360992431640625, -0.33612060546875, -0.311248779296875, -0.286376953125, -0.261505126953125, -0.23663330078125, -0.211761474609375, -0.1868896484375, -0.162017822265625, -0.13714599609375, -0.112274169921875, -0.08740234375, -0.062530517578125, -0.03765869140625, -0.012786865234375, 0.0120849609375, 0.036956787109375, 0.06182861328125, 0.086700439453125, 0.111572265625, 0.136444091796875, 0.16131591796875, 0.186187744140625, 0.2110595703125, 0.235931396484375, 0.26080322265625, 0.285675048828125, 0.310546875, 0.335418701171875, 0.36029052734375, 0.385162353515625, 0.4100341796875, 0.434906005859375, 0.45977783203125, 0.484649658203125, 0.509521484375, 0.534393310546875, 0.55926513671875, 0.584136962890625, 0.6090087890625, 0.633880615234375, 0.65875244140625, 0.683624267578125, 0.70849609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 10.0, 10.0, 21.0, 16.0, 37.0, 33.0, 51.0, 50.0, 69.0, 114.0, 149.0, 106.0, 78.0, 57.0, 51.0, 40.0, 26.0, 23.0, 11.0, 13.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012046098709106445, -0.00011662300676107407, -0.00011278502643108368, -0.00010894704610109329, -0.0001051090657711029, -0.00010127108544111252, -9.743310511112213e-05, -9.359512478113174e-05, -8.975714445114136e-05, -8.591916412115097e-05, -8.208118379116058e-05, -7.82432034611702e-05, -7.440522313117981e-05, -7.056724280118942e-05, -6.672926247119904e-05, -6.289128214120865e-05, -5.905330181121826e-05, -5.5215321481227875e-05, -5.137734115123749e-05, -4.75393608212471e-05, -4.3701380491256714e-05, -3.986340016126633e-05, -3.602541983127594e-05, -3.218743950128555e-05, -2.8349459171295166e-05, -2.451147884130478e-05, -2.0673498511314392e-05, -1.6835518181324005e-05, -1.2997537851333618e-05, -9.159557521343231e-06, -5.321577191352844e-06, -1.4835968613624573e-06, 2.3543834686279297e-06, 6.192363798618317e-06, 1.0030344128608704e-05, 1.386832445859909e-05, 1.7706304788589478e-05, 2.1544285118579865e-05, 2.538226544857025e-05, 2.922024577856064e-05, 3.3058226108551025e-05, 3.689620643854141e-05, 4.07341867685318e-05, 4.4572167098522186e-05, 4.841014742851257e-05, 5.224812775850296e-05, 5.608610808849335e-05, 5.9924088418483734e-05, 6.376206874847412e-05, 6.760004907846451e-05, 7.14380294084549e-05, 7.527600973844528e-05, 7.911399006843567e-05, 8.295197039842606e-05, 8.678995072841644e-05, 9.062793105840683e-05, 9.446591138839722e-05, 9.83038917183876e-05, 0.00010214187204837799, 0.00010597985237836838, 0.00010981783270835876, 0.00011365581303834915, 0.00011749379336833954, 0.00012133177369832993, 0.0001251697540283203]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 13.0, 16.0, 25.0, 39.0, 83.0, 147.0, 288.0, 712.0, 2463.0, 20264.0, 849496.0, 165694.0, 6994.0, 1311.0, 486.0, 223.0, 135.0, 62.0, 42.0, 27.0, 8.0, 8.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5466690063476562, -0.5254669189453125, -0.5042648315429688, -0.483062744140625, -0.46186065673828125, -0.4406585693359375, -0.41945648193359375, -0.39825439453125, -0.37705230712890625, -0.3558502197265625, -0.33464813232421875, -0.313446044921875, -0.29224395751953125, -0.2710418701171875, -0.24983978271484375, -0.2286376953125, -0.20743560791015625, -0.1862335205078125, -0.16503143310546875, -0.143829345703125, -0.12262725830078125, -0.1014251708984375, -0.08022308349609375, -0.05902099609375, -0.03781890869140625, -0.0166168212890625, 0.00458526611328125, 0.025787353515625, 0.04698944091796875, 0.0681915283203125, 0.08939361572265625, 0.110595703125, 0.13179779052734375, 0.1529998779296875, 0.17420196533203125, 0.195404052734375, 0.21660614013671875, 0.2378082275390625, 0.25901031494140625, 0.28021240234375, 0.30141448974609375, 0.3226165771484375, 0.34381866455078125, 0.365020751953125, 0.38622283935546875, 0.4074249267578125, 0.42862701416015625, 0.4498291015625, 0.47103118896484375, 0.4922332763671875, 0.5134353637695312, 0.534637451171875, 0.5558395385742188, 0.5770416259765625, 0.5982437133789062, 0.61944580078125, 0.6406478881835938, 0.6618499755859375, 0.6830520629882812, 0.704254150390625, 0.7254562377929688, 0.7466583251953125, 0.7678604125976562, 0.7890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 5.0, 16.0, 22.0, 27.0, 58.0, 65.0, 136.0, 168.0, 172.0, 124.0, 77.0, 43.0, 32.0, 22.0, 11.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.471923828125, -0.4530067443847656, -0.43408966064453125, -0.4151725769042969, -0.3962554931640625, -0.3773384094238281, -0.35842132568359375, -0.3395042419433594, -0.320587158203125, -0.3016700744628906, -0.28275299072265625, -0.2638359069824219, -0.2449188232421875, -0.22600173950195312, -0.20708465576171875, -0.18816757202148438, -0.16925048828125, -0.15033340454101562, -0.13141632080078125, -0.11249923706054688, -0.0935821533203125, -0.07466506958007812, -0.05574798583984375, -0.036830902099609375, -0.017913818359375, 0.001003265380859375, 0.01992034912109375, 0.038837432861328125, 0.0577545166015625, 0.07667160034179688, 0.09558868408203125, 0.11450576782226562, 0.1334228515625, 0.15233993530273438, 0.17125701904296875, 0.19017410278320312, 0.2090911865234375, 0.22800827026367188, 0.24692535400390625, 0.2658424377441406, 0.284759521484375, 0.3036766052246094, 0.32259368896484375, 0.3415107727050781, 0.3604278564453125, 0.3793449401855469, 0.39826202392578125, 0.4171791076660156, 0.43609619140625, 0.4550132751464844, 0.47393035888671875, 0.4928474426269531, 0.5117645263671875, 0.5306816101074219, 0.5495986938476562, 0.5685157775878906, 0.587432861328125, 0.6063499450683594, 0.6252670288085938, 0.6441841125488281, 0.6631011962890625, 0.6820182800292969, 0.7009353637695312, 0.7198524475097656, 0.73876953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 34.0, 175.0, 456.0, 269.0, 52.0, 7.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.47958755493164, -17.929616928100586, -17.37964630126953, -16.829673767089844, -16.27970314025879, -15.729732513427734, -15.17976188659668, -14.629790306091309, -14.079818725585938, -13.529848098754883, -12.979876518249512, -12.429905891418457, -11.879934310913086, -11.329963684082031, -10.779993057250977, -10.230021476745605, -9.68005084991455, -9.130080223083496, -8.580108642578125, -8.03013801574707, -7.480166435241699, -6.9301958084106445, -6.380224704742432, -5.830253601074219, -5.280282497406006, -4.730311393737793, -4.18034029006958, -3.6303694248199463, -3.0803983211517334, -2.5304272174835205, -1.9804563522338867, -1.4304852485656738, -0.8805141448974609, -0.3305431008338928, 0.2194279432296753, 0.7693989276885986, 1.3193700313568115, 1.8693411350250244, 2.419312000274658, 2.969283103942871, 3.519254207611084, 4.069225311279297, 4.61919641494751, 5.169167518615723, 5.719138145446777, 6.269109725952148, 6.819080352783203, 7.369051456451416, 7.919022560119629, 8.468993186950684, 9.018964767456055, 9.56893539428711, 10.11890697479248, 10.668877601623535, 11.218849182128906, 11.768819808959961, 12.318790435791016, 12.86876106262207, 13.418732643127441, 13.968703269958496, 14.518674850463867, 15.068645477294922, 15.618616104125977, 16.16858673095703, 16.71855926513672]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 5.0, 6.0, 9.0, 6.0, 11.0, 11.0, 9.0, 15.0, 27.0, 28.0, 38.0, 33.0, 44.0, 49.0, 50.0, 50.0, 62.0, 51.0, 47.0, 59.0, 54.0, 39.0, 39.0, 40.0, 29.0, 31.0, 29.0, 20.0, 16.0, 11.0, 13.0, 10.0, 9.0, 11.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0], "bins": [-4.85911750793457, -4.733467102050781, -4.607816696166992, -4.482166290283203, -4.356515884399414, -4.230865478515625, -4.105215072631836, -3.979564666748047, -3.853914260864258, -3.7282638549804688, -3.6026134490966797, -3.4769630432128906, -3.3513126373291016, -3.2256622314453125, -3.1000118255615234, -2.9743614196777344, -2.8487110137939453, -2.7230606079101562, -2.597410202026367, -2.471759796142578, -2.346109390258789, -2.220458984375, -2.094808578491211, -1.9691581726074219, -1.8435077667236328, -1.7178573608398438, -1.5922069549560547, -1.4665565490722656, -1.3409061431884766, -1.2152557373046875, -1.0896053314208984, -0.9639549255371094, -0.8383049964904785, -0.7126545906066895, -0.5870041847229004, -0.46135377883911133, -0.33570337295532227, -0.2100529670715332, -0.08440256118774414, 0.04124784469604492, 0.16689825057983398, 0.29254865646362305, 0.4181990623474121, 0.5438494682312012, 0.6694998741149902, 0.7951502799987793, 0.9208006858825684, 1.0464510917663574, 1.1721014976501465, 1.2977519035339355, 1.4234023094177246, 1.5490527153015137, 1.6747031211853027, 1.8003535270690918, 1.9260039329528809, 2.05165433883667, 2.177304744720459, 2.302955150604248, 2.428605556488037, 2.554255962371826, 2.6799063682556152, 2.8055567741394043, 2.9312071800231934, 3.0568575859069824, 3.1825079917907715]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 5.0, 6.0, 3.0, 13.0, 6.0, 14.0, 11.0, 11.0, 15.0, 34.0, 48.0, 74.0, 99.0, 165.0, 284.0, 516.0, 824.0, 1455.0, 3198.0, 7884.0, 25760.0, 170495.0, 3578722.0, 347712.0, 38791.0, 10644.0, 3794.0, 1749.0, 861.0, 464.0, 244.0, 162.0, 79.0, 56.0, 31.0, 15.0, 12.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.56640625, -0.5513496398925781, -0.5362930297851562, -0.5212364196777344, -0.5061798095703125, -0.4911231994628906, -0.47606658935546875, -0.4610099792480469, -0.445953369140625, -0.4308967590332031, -0.41584014892578125, -0.4007835388183594, -0.3857269287109375, -0.3706703186035156, -0.35561370849609375, -0.3405570983886719, -0.32550048828125, -0.3104438781738281, -0.29538726806640625, -0.2803306579589844, -0.2652740478515625, -0.2502174377441406, -0.23516082763671875, -0.22010421752929688, -0.205047607421875, -0.18999099731445312, -0.17493438720703125, -0.15987777709960938, -0.1448211669921875, -0.12976455688476562, -0.11470794677734375, -0.09965133666992188, -0.0845947265625, -0.06953811645507812, -0.05448150634765625, -0.039424896240234375, -0.0243682861328125, -0.009311676025390625, 0.00574493408203125, 0.020801544189453125, 0.035858154296875, 0.050914764404296875, 0.06597137451171875, 0.08102798461914062, 0.0960845947265625, 0.11114120483398438, 0.12619781494140625, 0.14125442504882812, 0.15631103515625, 0.17136764526367188, 0.18642425537109375, 0.20148086547851562, 0.2165374755859375, 0.23159408569335938, 0.24665069580078125, 0.2617073059082031, 0.276763916015625, 0.2918205261230469, 0.30687713623046875, 0.3219337463378906, 0.3369903564453125, 0.3520469665527344, 0.36710357666015625, 0.3821601867675781, 0.397216796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 8.0, 10.0, 12.0, 19.0, 20.0, 46.0, 56.0, 70.0, 75.0, 85.0, 94.0, 95.0, 77.0, 76.0, 50.0, 47.0, 54.0, 33.0, 29.0, 12.0, 10.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.3583984375, -0.35002708435058594, -0.3416557312011719, -0.3332843780517578, -0.32491302490234375, -0.3165416717529297, -0.3081703186035156, -0.29979896545410156, -0.2914276123046875, -0.28305625915527344, -0.2746849060058594, -0.2663135528564453, -0.25794219970703125, -0.2495708465576172, -0.24119949340820312, -0.23282814025878906, -0.224456787109375, -0.21608543395996094, -0.20771408081054688, -0.1993427276611328, -0.19097137451171875, -0.1826000213623047, -0.17422866821289062, -0.16585731506347656, -0.1574859619140625, -0.14911460876464844, -0.14074325561523438, -0.1323719024658203, -0.12400054931640625, -0.11562919616699219, -0.10725784301757812, -0.09888648986816406, -0.09051513671875, -0.08214378356933594, -0.07377243041992188, -0.06540107727050781, -0.05702972412109375, -0.04865837097167969, -0.040287017822265625, -0.03191566467285156, -0.0235443115234375, -0.015172958374023438, -0.006801605224609375, 0.0015697479248046875, 0.00994110107421875, 0.018312454223632812, 0.026683807373046875, 0.03505516052246094, 0.043426513671875, 0.05179786682128906, 0.060169219970703125, 0.06854057312011719, 0.07691192626953125, 0.08528327941894531, 0.09365463256835938, 0.10202598571777344, 0.1103973388671875, 0.11876869201660156, 0.12714004516601562, 0.1355113983154297, 0.14388275146484375, 0.1522541046142578, 0.16062545776367188, 0.16899681091308594, 0.1773681640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 4.0, 17.0, 15.0, 26.0, 46.0, 67.0, 122.0, 224.0, 425.0, 1032.0, 2828.0, 9604.0, 57120.0, 3151320.0, 924665.0, 35539.0, 7232.0, 2227.0, 858.0, 397.0, 195.0, 112.0, 66.0, 45.0, 26.0, 15.0, 15.0, 8.0, 7.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.802734375, -0.7783279418945312, -0.7539215087890625, -0.7295150756835938, -0.705108642578125, -0.6807022094726562, -0.6562957763671875, -0.6318893432617188, -0.60748291015625, -0.5830764770507812, -0.5586700439453125, -0.5342636108398438, -0.509857177734375, -0.48545074462890625, -0.4610443115234375, -0.43663787841796875, -0.4122314453125, -0.38782501220703125, -0.3634185791015625, -0.33901214599609375, -0.314605712890625, -0.29019927978515625, -0.2657928466796875, -0.24138641357421875, -0.21697998046875, -0.19257354736328125, -0.1681671142578125, -0.14376068115234375, -0.119354248046875, -0.09494781494140625, -0.0705413818359375, -0.04613494873046875, -0.021728515625, 0.00267791748046875, 0.0270843505859375, 0.05149078369140625, 0.075897216796875, 0.10030364990234375, 0.1247100830078125, 0.14911651611328125, 0.17352294921875, 0.19792938232421875, 0.2223358154296875, 0.24674224853515625, 0.271148681640625, 0.29555511474609375, 0.3199615478515625, 0.34436798095703125, 0.3687744140625, 0.39318084716796875, 0.4175872802734375, 0.44199371337890625, 0.466400146484375, 0.49080657958984375, 0.5152130126953125, 0.5396194458007812, 0.56402587890625, 0.5884323120117188, 0.6128387451171875, 0.6372451782226562, 0.661651611328125, 0.6860580444335938, 0.7104644775390625, 0.7348709106445312, 0.75927734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 3.0, 8.0, 13.0, 14.0, 19.0, 32.0, 54.0, 88.0, 168.0, 349.0, 971.0, 1362.0, 489.0, 214.0, 94.0, 75.0, 27.0, 21.0, 20.0, 12.0, 12.0, 5.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7548828125, -0.7327651977539062, -0.7106475830078125, -0.6885299682617188, -0.666412353515625, -0.6442947387695312, -0.6221771240234375, -0.6000595092773438, -0.57794189453125, -0.5558242797851562, -0.5337066650390625, -0.5115890502929688, -0.489471435546875, -0.46735382080078125, -0.4452362060546875, -0.42311859130859375, -0.4010009765625, -0.37888336181640625, -0.3567657470703125, -0.33464813232421875, -0.312530517578125, -0.29041290283203125, -0.2682952880859375, -0.24617767333984375, -0.22406005859375, -0.20194244384765625, -0.1798248291015625, -0.15770721435546875, -0.135589599609375, -0.11347198486328125, -0.0913543701171875, -0.06923675537109375, -0.047119140625, -0.02500152587890625, -0.0028839111328125, 0.01923370361328125, 0.041351318359375, 0.06346893310546875, 0.0855865478515625, 0.10770416259765625, 0.12982177734375, 0.15193939208984375, 0.1740570068359375, 0.19617462158203125, 0.218292236328125, 0.24040985107421875, 0.2625274658203125, 0.28464508056640625, 0.3067626953125, 0.32888031005859375, 0.3509979248046875, 0.37311553955078125, 0.395233154296875, 0.41735076904296875, 0.4394683837890625, 0.46158599853515625, 0.48370361328125, 0.5058212280273438, 0.5279388427734375, 0.5500564575195312, 0.572174072265625, 0.5942916870117188, 0.6164093017578125, 0.6385269165039062, 0.66064453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 22.0, 94.0, 288.0, 386.0, 148.0, 34.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.180972099304199, -6.842856407165527, -6.5047407150268555, -6.166625022888184, -5.828509330749512, -5.49039363861084, -5.15227746963501, -4.814161777496338, -4.476046085357666, -4.137930393218994, -3.7998147010803223, -3.4616987705230713, -3.1235830783843994, -2.7854673862457275, -2.4473514556884766, -2.1092357635498047, -1.7711200714111328, -1.433004379272461, -1.0948885679244995, -0.7567727565765381, -0.4186570644378662, -0.08054137229919434, 0.25757455825805664, 0.5956902503967285, 0.9338059425354004, 1.2719216346740723, 1.6100374460220337, 1.9481532573699951, 2.286268949508667, 2.624384641647339, 2.96250057220459, 3.3006162643432617, 3.638731002807617, 3.976846694946289, 4.314962387084961, 4.653078079223633, 4.991193771362305, 5.329309463500977, 5.667425632476807, 6.0055413246154785, 6.34365701675415, 6.681772708892822, 7.019888401031494, 7.358004570007324, 7.696120262145996, 8.034235954284668, 8.37235164642334, 8.710467338562012, 9.048583030700684, 9.386698722839355, 9.724814414978027, 10.0629301071167, 10.401045799255371, 10.739161491394043, 11.077278137207031, 11.415393829345703, 11.753509521484375, 12.091625213623047, 12.429740905761719, 12.76785659790039, 13.105972290039062, 13.444087982177734, 13.782203674316406, 14.120319366455078, 14.45843505859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 9.0, 12.0, 11.0, 14.0, 21.0, 19.0, 27.0, 31.0, 30.0, 49.0, 36.0, 27.0, 33.0, 45.0, 32.0, 49.0, 44.0, 50.0, 58.0, 43.0, 40.0, 37.0, 36.0, 24.0, 28.0, 20.0, 29.0, 26.0, 18.0, 18.0, 7.0, 14.0, 8.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.060170888900757, -1.991247296333313, -1.9223237037658691, -1.8534002304077148, -1.784476637840271, -1.7155530452728271, -1.6466295719146729, -1.577705979347229, -1.5087823867797852, -1.4398587942123413, -1.3709352016448975, -1.3020117282867432, -1.2330881357192993, -1.1641645431518555, -1.0952410697937012, -1.0263174772262573, -0.9573938846588135, -0.8884702920913696, -0.8195467591285706, -0.7506232261657715, -0.6816996335983276, -0.6127760410308838, -0.5438525080680847, -0.47492894530296326, -0.4060053825378418, -0.33708181977272034, -0.2681582570075989, -0.19923469424247742, -0.13031113147735596, -0.0613875687122345, 0.007535994052886963, 0.07645955681800842, 0.14538335800170898, 0.21430692076683044, 0.2832304835319519, 0.35215404629707336, 0.4210776090621948, 0.4900011718273163, 0.5589247345924377, 0.6278482675552368, 0.6967718601226807, 0.7656954526901245, 0.8346189856529236, 0.9035425186157227, 0.9724661111831665, 1.0413897037506104, 1.1103131771087646, 1.1792367696762085, 1.2481603622436523, 1.3170839548110962, 1.38600754737854, 1.4549310207366943, 1.5238546133041382, 1.592778205871582, 1.6617016792297363, 1.7306252717971802, 1.799548864364624, 1.8684724569320679, 1.9373960494995117, 2.006319522857666, 2.0752429962158203, 2.1441667079925537, 2.213090181350708, 2.2820138931274414, 2.3509373664855957]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 9.0, 19.0, 17.0, 33.0, 58.0, 96.0, 150.0, 241.0, 425.0, 773.0, 1536.0, 3157.0, 7367.0, 20199.0, 69340.0, 315976.0, 474402.0, 107676.0, 28874.0, 10054.0, 4095.0, 1875.0, 882.0, 546.0, 289.0, 159.0, 109.0, 65.0, 48.0, 25.0, 16.0, 7.0, 11.0, 7.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6328697204589844, -0.6158370971679688, -0.5988044738769531, -0.5817718505859375, -0.5647392272949219, -0.5477066040039062, -0.5306739807128906, -0.513641357421875, -0.4966087341308594, -0.47957611083984375, -0.4625434875488281, -0.4455108642578125, -0.4284782409667969, -0.41144561767578125, -0.3944129943847656, -0.37738037109375, -0.3603477478027344, -0.34331512451171875, -0.3262825012207031, -0.3092498779296875, -0.2922172546386719, -0.27518463134765625, -0.2581520080566406, -0.241119384765625, -0.22408676147460938, -0.20705413818359375, -0.19002151489257812, -0.1729888916015625, -0.15595626831054688, -0.13892364501953125, -0.12189102172851562, -0.1048583984375, -0.08782577514648438, -0.07079315185546875, -0.053760528564453125, -0.0367279052734375, -0.019695281982421875, -0.00266265869140625, 0.014369964599609375, 0.031402587890625, 0.048435211181640625, 0.06546783447265625, 0.08250045776367188, 0.0995330810546875, 0.11656570434570312, 0.13359832763671875, 0.15063095092773438, 0.16766357421875, 0.18469619750976562, 0.20172882080078125, 0.21876144409179688, 0.2357940673828125, 0.2528266906738281, 0.26985931396484375, 0.2868919372558594, 0.303924560546875, 0.3209571838378906, 0.33798980712890625, 0.3550224304199219, 0.3720550537109375, 0.3890876770019531, 0.40612030029296875, 0.4231529235839844, 0.440185546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 11.0, 21.0, 15.0, 27.0, 32.0, 60.0, 49.0, 65.0, 59.0, 76.0, 89.0, 69.0, 70.0, 67.0, 52.0, 49.0, 33.0, 35.0, 27.0, 29.0, 23.0, 4.0, 6.0, 6.0, 0.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.2538928985595703, -0.24655532836914062, -0.23921775817871094, -0.23188018798828125, -0.22454261779785156, -0.21720504760742188, -0.2098674774169922, -0.2025299072265625, -0.1951923370361328, -0.18785476684570312, -0.18051719665527344, -0.17317962646484375, -0.16584205627441406, -0.15850448608398438, -0.1511669158935547, -0.143829345703125, -0.1364917755126953, -0.12915420532226562, -0.12181663513183594, -0.11447906494140625, -0.10714149475097656, -0.09980392456054688, -0.09246635437011719, -0.0851287841796875, -0.07779121398925781, -0.07045364379882812, -0.06311607360839844, -0.05577850341796875, -0.04844093322753906, -0.041103363037109375, -0.03376579284667969, -0.02642822265625, -0.019090652465820312, -0.011753082275390625, -0.0044155120849609375, 0.00292205810546875, 0.010259628295898438, 0.017597198486328125, 0.024934768676757812, 0.0322723388671875, 0.03960990905761719, 0.046947479248046875, 0.05428504943847656, 0.06162261962890625, 0.06896018981933594, 0.07629776000976562, 0.08363533020019531, 0.090972900390625, 0.09831047058105469, 0.10564804077148438, 0.11298561096191406, 0.12032318115234375, 0.12766075134277344, 0.13499832153320312, 0.1423358917236328, 0.1496734619140625, 0.1570110321044922, 0.16434860229492188, 0.17168617248535156, 0.17902374267578125, 0.18636131286621094, 0.19369888305664062, 0.2010364532470703, 0.2083740234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 9.0, 17.0, 21.0, 28.0, 44.0, 65.0, 119.0, 199.0, 392.0, 955.0, 2641.0, 13089.0, 433675.0, 578056.0, 14616.0, 2718.0, 933.0, 437.0, 199.0, 125.0, 79.0, 28.0, 32.0, 13.0, 16.0, 7.0, 7.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1689453125, -1.1240234375, -1.0791015625, -1.0341796875, -0.9892578125, -0.9443359375, -0.8994140625, -0.8544921875, -0.8095703125, -0.7646484375, -0.7197265625, -0.6748046875, -0.6298828125, -0.5849609375, -0.5400390625, -0.4951171875, -0.4501953125, -0.4052734375, -0.3603515625, -0.3154296875, -0.2705078125, -0.2255859375, -0.1806640625, -0.1357421875, -0.0908203125, -0.0458984375, -0.0009765625, 0.0439453125, 0.0888671875, 0.1337890625, 0.1787109375, 0.2236328125, 0.2685546875, 0.3134765625, 0.3583984375, 0.4033203125, 0.4482421875, 0.4931640625, 0.5380859375, 0.5830078125, 0.6279296875, 0.6728515625, 0.7177734375, 0.7626953125, 0.8076171875, 0.8525390625, 0.8974609375, 0.9423828125, 0.9873046875, 1.0322265625, 1.0771484375, 1.1220703125, 1.1669921875, 1.2119140625, 1.2568359375, 1.3017578125, 1.3466796875, 1.3916015625, 1.4365234375, 1.4814453125, 1.5263671875, 1.5712890625, 1.6162109375, 1.6611328125, 1.7060546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 12.0, 9.0, 11.0, 18.0, 26.0, 19.0, 22.0, 32.0, 42.0, 51.0, 63.0, 52.0, 63.0, 86.0, 71.0, 58.0, 62.0, 57.0, 44.0, 42.0, 32.0, 25.0, 15.0, 27.0, 17.0, 17.0, 9.0, 8.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9423828125, -0.9064178466796875, -0.870452880859375, -0.8344879150390625, -0.79852294921875, -0.7625579833984375, -0.726593017578125, -0.6906280517578125, -0.6546630859375, -0.6186981201171875, -0.582733154296875, -0.5467681884765625, -0.51080322265625, -0.4748382568359375, -0.438873291015625, -0.4029083251953125, -0.366943359375, -0.3309783935546875, -0.295013427734375, -0.2590484619140625, -0.22308349609375, -0.1871185302734375, -0.151153564453125, -0.1151885986328125, -0.0792236328125, -0.0432586669921875, -0.007293701171875, 0.0286712646484375, 0.06463623046875, 0.1006011962890625, 0.136566162109375, 0.1725311279296875, 0.20849609375, 0.2444610595703125, 0.280426025390625, 0.3163909912109375, 0.35235595703125, 0.3883209228515625, 0.424285888671875, 0.4602508544921875, 0.4962158203125, 0.5321807861328125, 0.568145751953125, 0.6041107177734375, 0.64007568359375, 0.6760406494140625, 0.712005615234375, 0.7479705810546875, 0.783935546875, 0.8199005126953125, 0.855865478515625, 0.8918304443359375, 0.92779541015625, 0.9637603759765625, 0.999725341796875, 1.0356903076171875, 1.0716552734375, 1.1076202392578125, 1.143585205078125, 1.1795501708984375, 1.21551513671875, 1.2514801025390625, 1.287445068359375, 1.3234100341796875, 1.359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 12.0, 16.0, 7.0, 10.0, 34.0, 59.0, 111.0, 249.0, 663.0, 2142.0, 14385.0, 868329.0, 154152.0, 6203.0, 1287.0, 445.0, 181.0, 120.0, 51.0, 29.0, 24.0, 14.0, 5.0, 8.0, 1.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.7785797119140625, -0.749542236328125, -0.7205047607421875, -0.69146728515625, -0.6624298095703125, -0.633392333984375, -0.6043548583984375, -0.5753173828125, -0.5462799072265625, -0.517242431640625, -0.4882049560546875, -0.45916748046875, -0.4301300048828125, -0.401092529296875, -0.3720550537109375, -0.343017578125, -0.3139801025390625, -0.284942626953125, -0.2559051513671875, -0.22686767578125, -0.1978302001953125, -0.168792724609375, -0.1397552490234375, -0.1107177734375, -0.0816802978515625, -0.052642822265625, -0.0236053466796875, 0.00543212890625, 0.0344696044921875, 0.063507080078125, 0.0925445556640625, 0.12158203125, 0.1506195068359375, 0.179656982421875, 0.2086944580078125, 0.23773193359375, 0.2667694091796875, 0.295806884765625, 0.3248443603515625, 0.3538818359375, 0.3829193115234375, 0.411956787109375, 0.4409942626953125, 0.47003173828125, 0.4990692138671875, 0.528106689453125, 0.5571441650390625, 0.586181640625, 0.6152191162109375, 0.644256591796875, 0.6732940673828125, 0.70233154296875, 0.7313690185546875, 0.760406494140625, 0.7894439697265625, 0.8184814453125, 0.8475189208984375, 0.876556396484375, 0.9055938720703125, 0.93463134765625, 0.9636688232421875, 0.992706298828125, 1.0217437744140625, 1.05078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 17.0, 20.0, 40.0, 62.0, 86.0, 107.0, 146.0, 128.0, 104.0, 79.0, 60.0, 46.0, 25.0, 21.0, 10.0, 12.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021529197692871094, -0.00020461156964302063, -0.00019393116235733032, -0.00018325075507164001, -0.0001725703477859497, -0.0001618899405002594, -0.0001512095332145691, -0.00014052912592887878, -0.00012984871864318848, -0.00011916831135749817, -0.00010848790407180786, -9.780749678611755e-05, -8.712708950042725e-05, -7.644668221473694e-05, -6.576627492904663e-05, -5.508586764335632e-05, -4.4405460357666016e-05, -3.372505307197571e-05, -2.30446457862854e-05, -1.2364238500595093e-05, -1.6838312149047852e-06, 8.996576070785522e-06, 1.967698335647583e-05, 3.0357390642166138e-05, 4.1037797927856445e-05, 5.171820521354675e-05, 6.239861249923706e-05, 7.307901978492737e-05, 8.375942707061768e-05, 9.443983435630798e-05, 0.00010512024164199829, 0.0001158006489276886, 0.0001264810562133789, 0.00013716146349906921, 0.00014784187078475952, 0.00015852227807044983, 0.00016920268535614014, 0.00017988309264183044, 0.00019056349992752075, 0.00020124390721321106, 0.00021192431449890137, 0.00022260472178459167, 0.00023328512907028198, 0.0002439655363559723, 0.0002546459436416626, 0.0002653263509273529, 0.0002760067582130432, 0.0002866871654987335, 0.00029736757278442383, 0.00030804798007011414, 0.00031872838735580444, 0.00032940879464149475, 0.00034008920192718506, 0.00035076960921287537, 0.0003614500164985657, 0.000372130423784256, 0.0003828108310699463, 0.0003934912383556366, 0.0004041716456413269, 0.0004148520529270172, 0.0004255324602127075, 0.00043621286749839783, 0.00044689327478408813, 0.00045757368206977844, 0.00046825408935546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 4.0, 16.0, 23.0, 38.0, 37.0, 77.0, 90.0, 162.0, 270.0, 505.0, 1018.0, 2762.0, 13351.0, 219298.0, 773084.0, 30374.0, 4470.0, 1408.0, 700.0, 329.0, 186.0, 127.0, 62.0, 51.0, 30.0, 28.0, 13.0, 10.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5458984375, -0.52581787109375, -0.5057373046875, -0.48565673828125, -0.465576171875, -0.44549560546875, -0.4254150390625, -0.40533447265625, -0.38525390625, -0.36517333984375, -0.3450927734375, -0.32501220703125, -0.304931640625, -0.28485107421875, -0.2647705078125, -0.24468994140625, -0.224609375, -0.20452880859375, -0.1844482421875, -0.16436767578125, -0.144287109375, -0.12420654296875, -0.1041259765625, -0.08404541015625, -0.06396484375, -0.04388427734375, -0.0238037109375, -0.00372314453125, 0.016357421875, 0.03643798828125, 0.0565185546875, 0.07659912109375, 0.0966796875, 0.11676025390625, 0.1368408203125, 0.15692138671875, 0.177001953125, 0.19708251953125, 0.2171630859375, 0.23724365234375, 0.25732421875, 0.27740478515625, 0.2974853515625, 0.31756591796875, 0.337646484375, 0.35772705078125, 0.3778076171875, 0.39788818359375, 0.41796875, 0.43804931640625, 0.4581298828125, 0.47821044921875, 0.498291015625, 0.51837158203125, 0.5384521484375, 0.55853271484375, 0.57861328125, 0.59869384765625, 0.6187744140625, 0.63885498046875, 0.658935546875, 0.67901611328125, 0.6990966796875, 0.71917724609375, 0.7392578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 6.0, 8.0, 14.0, 8.0, 23.0, 34.0, 33.0, 48.0, 58.0, 63.0, 72.0, 98.0, 87.0, 78.0, 67.0, 67.0, 44.0, 47.0, 32.0, 26.0, 13.0, 10.0, 16.0, 9.0, 4.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32421875, -0.3105316162109375, -0.296844482421875, -0.2831573486328125, -0.26947021484375, -0.2557830810546875, -0.242095947265625, -0.2284088134765625, -0.2147216796875, -0.2010345458984375, -0.187347412109375, -0.1736602783203125, -0.15997314453125, -0.1462860107421875, -0.132598876953125, -0.1189117431640625, -0.105224609375, -0.0915374755859375, -0.077850341796875, -0.0641632080078125, -0.05047607421875, -0.0367889404296875, -0.023101806640625, -0.0094146728515625, 0.0042724609375, 0.0179595947265625, 0.031646728515625, 0.0453338623046875, 0.05902099609375, 0.0727081298828125, 0.086395263671875, 0.1000823974609375, 0.11376953125, 0.1274566650390625, 0.141143798828125, 0.1548309326171875, 0.16851806640625, 0.1822052001953125, 0.195892333984375, 0.2095794677734375, 0.2232666015625, 0.2369537353515625, 0.250640869140625, 0.2643280029296875, 0.27801513671875, 0.2917022705078125, 0.305389404296875, 0.3190765380859375, 0.332763671875, 0.3464508056640625, 0.360137939453125, 0.3738250732421875, 0.38751220703125, 0.4011993408203125, 0.414886474609375, 0.4285736083984375, 0.4422607421875, 0.4559478759765625, 0.469635009765625, 0.4833221435546875, 0.49700927734375, 0.5106964111328125, 0.524383544921875, 0.5380706787109375, 0.5517578125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 52.0, 164.0, 389.0, 244.0, 96.0, 26.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.409454345703125, -10.003876686096191, -9.598299026489258, -9.192720413208008, -8.787142753601074, -8.38156509399414, -7.975986957550049, -7.570408821105957, -7.164831161499023, -6.75925350189209, -6.353675365447998, -5.948097229003906, -5.542519569396973, -5.136941909790039, -4.731363773345947, -4.3257856369018555, -3.920207977294922, -3.514630079269409, -3.1090521812438965, -2.703474283218384, -2.297896385192871, -1.8923184871673584, -1.4867405891418457, -1.081162691116333, -0.6755847930908203, -0.2700068950653076, 0.13557100296020508, 0.5411489009857178, 0.9467267990112305, 1.3523046970367432, 1.7578825950622559, 2.1634604930877686, 2.5690383911132812, 2.974616289138794, 3.3801941871643066, 3.7857720851898193, 4.191349983215332, 4.596927642822266, 5.002505779266357, 5.408083915710449, 5.813661575317383, 6.219239234924316, 6.624817371368408, 7.0303955078125, 7.435973167419434, 7.841550827026367, 8.247129440307617, 8.65270709991455, 9.058284759521484, 9.463862419128418, 9.869440078735352, 10.275018692016602, 10.680596351623535, 11.086174011230469, 11.491752624511719, 11.897330284118652, 12.302907943725586, 12.70848560333252, 13.114063262939453, 13.519641876220703, 13.925219535827637, 14.33079719543457, 14.73637580871582, 15.141953468322754, 15.547531127929688]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 10.0, 4.0, 5.0, 14.0, 9.0, 15.0, 12.0, 24.0, 30.0, 27.0, 40.0, 38.0, 52.0, 49.0, 62.0, 60.0, 64.0, 61.0, 53.0, 47.0, 54.0, 54.0, 35.0, 29.0, 30.0, 26.0, 16.0, 14.0, 16.0, 12.0, 8.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-4.932521343231201, -4.801183223724365, -4.669845104217529, -4.538506984710693, -4.407168388366699, -4.275830268859863, -4.144492149353027, -4.013154029846191, -3.8818159103393555, -3.7504777908325195, -3.6191396713256836, -3.4878013134002686, -3.3564631938934326, -3.2251250743865967, -3.0937867164611816, -2.9624485969543457, -2.8311104774475098, -2.699772357940674, -2.568434238433838, -2.437095880508423, -2.305757761001587, -2.174419641494751, -2.043081283569336, -1.9117431640625, -1.780405044555664, -1.6490669250488281, -1.5177286863327026, -1.3863904476165771, -1.2550523281097412, -1.1237142086029053, -0.9923759698867798, -0.8610377907752991, -0.7296993732452393, -0.5983611941337585, -0.46702301502227783, -0.3356848359107971, -0.2043466567993164, -0.0730084776878357, 0.05832970142364502, 0.18966788053512573, 0.32100605964660645, 0.45234423875808716, 0.5836824178695679, 0.7150205969810486, 0.8463587760925293, 0.97769695520401, 1.1090351343154907, 1.2403733730316162, 1.3717114925384521, 1.503049612045288, 1.6343878507614136, 1.765726089477539, 1.897064208984375, 2.028402328491211, 2.159740447998047, 2.291078805923462, 2.422416925430298, 2.553755044937134, 2.685093402862549, 2.8164315223693848, 2.9477696418762207, 3.0791077613830566, 3.2104458808898926, 3.3417842388153076, 3.4731223583221436]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 13.0, 8.0, 10.0, 17.0, 16.0, 29.0, 34.0, 68.0, 140.0, 414.0, 4166860.0, 26001.0, 344.0, 153.0, 78.0, 35.0, 22.0, 12.0, 10.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.23394775390625, -7.9835205078125, -7.73309326171875, -7.482666015625, -7.23223876953125, -6.9818115234375, -6.73138427734375, -6.48095703125, -6.23052978515625, -5.9801025390625, -5.72967529296875, -5.479248046875, -5.22882080078125, -4.9783935546875, -4.72796630859375, -4.4775390625, -4.22711181640625, -3.9766845703125, -3.72625732421875, -3.475830078125, -3.22540283203125, -2.9749755859375, -2.72454833984375, -2.47412109375, -2.22369384765625, -1.9732666015625, -1.72283935546875, -1.472412109375, -1.22198486328125, -0.9715576171875, -0.72113037109375, -0.470703125, -0.22027587890625, 0.0301513671875, 0.28057861328125, 0.531005859375, 0.78143310546875, 1.0318603515625, 1.28228759765625, 1.53271484375, 1.78314208984375, 2.0335693359375, 2.28399658203125, 2.534423828125, 2.78485107421875, 3.0352783203125, 3.28570556640625, 3.5361328125, 3.78656005859375, 4.0369873046875, 4.28741455078125, 4.537841796875, 4.78826904296875, 5.0386962890625, 5.28912353515625, 5.53955078125, 5.78997802734375, 6.0404052734375, 6.29083251953125, 6.541259765625, 6.79168701171875, 7.0421142578125, 7.29254150390625, 7.54296875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 8.0, 10.0, 20.0, 16.0, 21.0, 39.0, 66.0, 77.0, 90.0, 108.0, 113.0, 88.0, 73.0, 67.0, 58.0, 46.0, 36.0, 17.0, 12.0, 8.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.45654296875, -0.4466590881347656, -0.43677520751953125, -0.4268913269042969, -0.4170074462890625, -0.4071235656738281, -0.39723968505859375, -0.3873558044433594, -0.377471923828125, -0.3675880432128906, -0.35770416259765625, -0.3478202819824219, -0.3379364013671875, -0.3280525207519531, -0.31816864013671875, -0.3082847595214844, -0.29840087890625, -0.2885169982910156, -0.27863311767578125, -0.2687492370605469, -0.2588653564453125, -0.24898147583007812, -0.23909759521484375, -0.22921371459960938, -0.219329833984375, -0.20944595336914062, -0.19956207275390625, -0.18967819213867188, -0.1797943115234375, -0.16991043090820312, -0.16002655029296875, -0.15014266967773438, -0.1402587890625, -0.13037490844726562, -0.12049102783203125, -0.11060714721679688, -0.1007232666015625, -0.09083938598632812, -0.08095550537109375, -0.07107162475585938, -0.061187744140625, -0.051303863525390625, -0.04141998291015625, -0.031536102294921875, -0.0216522216796875, -0.011768341064453125, -0.00188446044921875, 0.007999420166015625, 0.01788330078125, 0.027767181396484375, 0.03765106201171875, 0.047534942626953125, 0.0574188232421875, 0.06730270385742188, 0.07718658447265625, 0.08707046508789062, 0.096954345703125, 0.10683822631835938, 0.11672210693359375, 0.12660598754882812, 0.1364898681640625, 0.14637374877929688, 0.15625762939453125, 0.16614151000976562, 0.176025390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 13.0, 19.0, 27.0, 42.0, 62.0, 117.0, 182.0, 320.0, 583.0, 1057.0, 2172.0, 4560.0, 11104.0, 33615.0, 144002.0, 1693643.0, 2090298.0, 157754.0, 34820.0, 11418.0, 4292.0, 2041.0, 907.0, 484.0, 275.0, 154.0, 99.0, 51.0, 50.0, 23.0, 16.0, 21.0, 11.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.468017578125, -0.45571136474609375, -0.4434051513671875, -0.43109893798828125, -0.418792724609375, -0.40648651123046875, -0.3941802978515625, -0.38187408447265625, -0.36956787109375, -0.35726165771484375, -0.3449554443359375, -0.33264923095703125, -0.320343017578125, -0.30803680419921875, -0.2957305908203125, -0.28342437744140625, -0.2711181640625, -0.25881195068359375, -0.2465057373046875, -0.23419952392578125, -0.221893310546875, -0.20958709716796875, -0.1972808837890625, -0.18497467041015625, -0.17266845703125, -0.16036224365234375, -0.1480560302734375, -0.13574981689453125, -0.123443603515625, -0.11113739013671875, -0.0988311767578125, -0.08652496337890625, -0.07421875, -0.06191253662109375, -0.0496063232421875, -0.03730010986328125, -0.024993896484375, -0.01268768310546875, -0.0003814697265625, 0.01192474365234375, 0.02423095703125, 0.03653717041015625, 0.0488433837890625, 0.06114959716796875, 0.073455810546875, 0.08576202392578125, 0.0980682373046875, 0.11037445068359375, 0.1226806640625, 0.13498687744140625, 0.1472930908203125, 0.15959930419921875, 0.171905517578125, 0.18421173095703125, 0.1965179443359375, 0.20882415771484375, 0.22113037109375, 0.23343658447265625, 0.2457427978515625, 0.25804901123046875, 0.270355224609375, 0.28266143798828125, 0.2949676513671875, 0.30727386474609375, 0.319580078125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 9.0, 17.0, 30.0, 23.0, 37.0, 58.0, 123.0, 218.0, 308.0, 668.0, 1123.0, 644.0, 361.0, 149.0, 105.0, 54.0, 46.0, 21.0, 15.0, 10.0, 4.0, 11.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460693359375, -0.4444999694824219, -0.42830657958984375, -0.4121131896972656, -0.3959197998046875, -0.3797264099121094, -0.36353302001953125, -0.3473396301269531, -0.331146240234375, -0.3149528503417969, -0.29875946044921875, -0.2825660705566406, -0.2663726806640625, -0.2501792907714844, -0.23398590087890625, -0.21779251098632812, -0.20159912109375, -0.18540573120117188, -0.16921234130859375, -0.15301895141601562, -0.1368255615234375, -0.12063217163085938, -0.10443878173828125, -0.08824539184570312, -0.072052001953125, -0.055858612060546875, -0.03966522216796875, -0.023471832275390625, -0.0072784423828125, 0.008914947509765625, 0.02510833740234375, 0.041301727294921875, 0.0574951171875, 0.07368850708007812, 0.08988189697265625, 0.10607528686523438, 0.1222686767578125, 0.13846206665039062, 0.15465545654296875, 0.17084884643554688, 0.187042236328125, 0.20323562622070312, 0.21942901611328125, 0.23562240600585938, 0.2518157958984375, 0.2680091857910156, 0.28420257568359375, 0.3003959655761719, 0.31658935546875, 0.3327827453613281, 0.34897613525390625, 0.3651695251464844, 0.3813629150390625, 0.3975563049316406, 0.41374969482421875, 0.4299430847167969, 0.446136474609375, 0.4623298645019531, 0.47852325439453125, 0.4947166442871094, 0.5109100341796875, 0.5271034240722656, 0.5432968139648438, 0.5594902038574219, 0.57568359375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 4.0, 2.0, 4.0, 9.0, 8.0, 14.0, 63.0, 133.0, 269.0, 260.0, 153.0, 56.0, 11.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.224889755249023, -9.033588409423828, -8.842286109924316, -8.650983810424805, -8.45968246459961, -8.268381118774414, -8.077078819274902, -7.885776996612549, -7.694475173950195, -7.503173351287842, -7.311871528625488, -7.120569705963135, -6.929267883300781, -6.737966060638428, -6.546664237976074, -6.355362415313721, -6.164060592651367, -5.972758769989014, -5.78145694732666, -5.590155124664307, -5.398853302001953, -5.2075514793396, -5.016249656677246, -4.824947834014893, -4.633646011352539, -4.4423441886901855, -4.251042366027832, -4.0597405433654785, -3.868438720703125, -3.6771368980407715, -3.485835075378418, -3.2945332527160645, -3.10323166847229, -2.9119298458099365, -2.720628023147583, -2.5293262004852295, -2.338024377822876, -2.1467225551605225, -1.955420732498169, -1.7641189098358154, -1.572817087173462, -1.3815152645111084, -1.1902134418487549, -0.9989116191864014, -0.8076097965240479, -0.6163079738616943, -0.4250061511993408, -0.2337043285369873, -0.04240250587463379, 0.14889931678771973, 0.34020113945007324, 0.5315029621124268, 0.7228047847747803, 0.9141066074371338, 1.1054084300994873, 1.2967102527618408, 1.4880120754241943, 1.6793138980865479, 1.8706157207489014, 2.061917543411255, 2.2532193660736084, 2.444521188735962, 2.6358230113983154, 2.827124834060669, 3.0184266567230225]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 9.0, 13.0, 16.0, 14.0, 10.0, 27.0, 30.0, 27.0, 35.0, 42.0, 51.0, 48.0, 50.0, 57.0, 54.0, 51.0, 59.0, 54.0, 49.0, 42.0, 48.0, 32.0, 35.0, 28.0, 29.0, 20.0, 22.0, 13.0, 15.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1493704319000244, -2.072101593017578, -1.9948326349258423, -1.917563796043396, -1.8402948379516602, -1.7630259990692139, -1.6857571601867676, -1.6084883213043213, -1.5312193632125854, -1.4539505243301392, -1.3766815662384033, -1.299412727355957, -1.2221438884735107, -1.144874930381775, -1.0676060914993286, -0.9903371930122375, -0.9130682945251465, -0.8357993960380554, -0.7585304975509644, -0.6812616586685181, -0.603992760181427, -0.5267238616943359, -0.44945499300956726, -0.3721861243247986, -0.2949172258377075, -0.21764834225177765, -0.14037945866584778, -0.06311057507991791, 0.014158308506011963, 0.09142720699310303, 0.1686960756778717, 0.24596494436264038, 0.32323408126831055, 0.4005029797554016, 0.4777718484401703, 0.555040717124939, 0.63230961561203, 0.7095785140991211, 0.7868473529815674, 0.8641162514686584, 0.9413851499557495, 1.0186539888381958, 1.0959229469299316, 1.173191785812378, 1.2504606246948242, 1.32772958278656, 1.4049984216690063, 1.4822673797607422, 1.5595362186431885, 1.6368050575256348, 1.7140740156173706, 1.791342854499817, 1.8686118125915527, 1.945880651473999, 2.0231494903564453, 2.1004183292388916, 2.177687168121338, 2.254956007003784, 2.3322248458862305, 2.409493923187256, 2.486762762069702, 2.5640316009521484, 2.6413004398345947, 2.718569278717041, 2.7958383560180664]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 9.0, 9.0, 10.0, 17.0, 17.0, 41.0, 56.0, 86.0, 154.0, 226.0, 402.0, 742.0, 1244.0, 2476.0, 4875.0, 10753.0, 27938.0, 85719.0, 311572.0, 416518.0, 121543.0, 37714.0, 13917.0, 5928.0, 2880.0, 1535.0, 859.0, 494.0, 313.0, 185.0, 116.0, 65.0, 42.0, 36.0, 19.0, 17.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.5107421875, -0.49620819091796875, -0.4816741943359375, -0.46714019775390625, -0.452606201171875, -0.43807220458984375, -0.4235382080078125, -0.40900421142578125, -0.39447021484375, -0.37993621826171875, -0.3654022216796875, -0.35086822509765625, -0.336334228515625, -0.32180023193359375, -0.3072662353515625, -0.29273223876953125, -0.2781982421875, -0.26366424560546875, -0.2491302490234375, -0.23459625244140625, -0.220062255859375, -0.20552825927734375, -0.1909942626953125, -0.17646026611328125, -0.16192626953125, -0.14739227294921875, -0.1328582763671875, -0.11832427978515625, -0.103790283203125, -0.08925628662109375, -0.0747222900390625, -0.06018829345703125, -0.045654296875, -0.03112030029296875, -0.0165863037109375, -0.00205230712890625, 0.012481689453125, 0.02701568603515625, 0.0415496826171875, 0.05608367919921875, 0.07061767578125, 0.08515167236328125, 0.0996856689453125, 0.11421966552734375, 0.128753662109375, 0.14328765869140625, 0.1578216552734375, 0.17235565185546875, 0.1868896484375, 0.20142364501953125, 0.2159576416015625, 0.23049163818359375, 0.245025634765625, 0.25955963134765625, 0.2740936279296875, 0.28862762451171875, 0.30316162109375, 0.31769561767578125, 0.3322296142578125, 0.34676361083984375, 0.361297607421875, 0.37583160400390625, 0.3903656005859375, 0.40489959716796875, 0.41943359375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 6.0, 5.0, 10.0, 15.0, 14.0, 15.0, 28.0, 40.0, 32.0, 41.0, 59.0, 37.0, 71.0, 73.0, 73.0, 79.0, 54.0, 54.0, 51.0, 44.0, 33.0, 30.0, 27.0, 22.0, 26.0, 10.0, 11.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24365234375, -0.2369537353515625, -0.230255126953125, -0.2235565185546875, -0.21685791015625, -0.2101593017578125, -0.203460693359375, -0.1967620849609375, -0.1900634765625, -0.1833648681640625, -0.176666259765625, -0.1699676513671875, -0.16326904296875, -0.1565704345703125, -0.149871826171875, -0.1431732177734375, -0.136474609375, -0.1297760009765625, -0.123077392578125, -0.1163787841796875, -0.10968017578125, -0.1029815673828125, -0.096282958984375, -0.0895843505859375, -0.0828857421875, -0.0761871337890625, -0.069488525390625, -0.0627899169921875, -0.05609130859375, -0.0493927001953125, -0.042694091796875, -0.0359954833984375, -0.029296875, -0.0225982666015625, -0.015899658203125, -0.0092010498046875, -0.00250244140625, 0.0041961669921875, 0.010894775390625, 0.0175933837890625, 0.0242919921875, 0.0309906005859375, 0.037689208984375, 0.0443878173828125, 0.05108642578125, 0.0577850341796875, 0.064483642578125, 0.0711822509765625, 0.077880859375, 0.0845794677734375, 0.091278076171875, 0.0979766845703125, 0.10467529296875, 0.1113739013671875, 0.118072509765625, 0.1247711181640625, 0.1314697265625, 0.1381683349609375, 0.144866943359375, 0.1515655517578125, 0.15826416015625, 0.1649627685546875, 0.171661376953125, 0.1783599853515625, 0.18505859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 9.0, 12.0, 19.0, 38.0, 54.0, 86.0, 119.0, 238.0, 501.0, 1154.0, 3395.0, 16267.0, 178315.0, 776068.0, 60576.0, 7893.0, 2134.0, 838.0, 387.0, 169.0, 107.0, 59.0, 36.0, 23.0, 13.0, 15.0, 5.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8017578125, -0.7700653076171875, -0.738372802734375, -0.7066802978515625, -0.67498779296875, -0.6432952880859375, -0.611602783203125, -0.5799102783203125, -0.5482177734375, -0.5165252685546875, -0.484832763671875, -0.4531402587890625, -0.42144775390625, -0.3897552490234375, -0.358062744140625, -0.3263702392578125, -0.294677734375, -0.2629852294921875, -0.231292724609375, -0.1996002197265625, -0.16790771484375, -0.1362152099609375, -0.104522705078125, -0.0728302001953125, -0.0411376953125, -0.0094451904296875, 0.022247314453125, 0.0539398193359375, 0.08563232421875, 0.1173248291015625, 0.149017333984375, 0.1807098388671875, 0.21240234375, 0.2440948486328125, 0.275787353515625, 0.3074798583984375, 0.33917236328125, 0.3708648681640625, 0.402557373046875, 0.4342498779296875, 0.4659423828125, 0.4976348876953125, 0.529327392578125, 0.5610198974609375, 0.59271240234375, 0.6244049072265625, 0.656097412109375, 0.6877899169921875, 0.719482421875, 0.7511749267578125, 0.782867431640625, 0.8145599365234375, 0.84625244140625, 0.8779449462890625, 0.909637451171875, 0.9413299560546875, 0.9730224609375, 1.0047149658203125, 1.036407470703125, 1.0680999755859375, 1.09979248046875, 1.1314849853515625, 1.163177490234375, 1.1948699951171875, 1.2265625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 6.0, 1.0, 4.0, 9.0, 5.0, 17.0, 19.0, 25.0, 28.0, 44.0, 46.0, 45.0, 53.0, 67.0, 67.0, 73.0, 60.0, 77.0, 50.0, 58.0, 46.0, 43.0, 43.0, 33.0, 29.0, 11.0, 13.0, 11.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7060546875, -0.672393798828125, -0.63873291015625, -0.605072021484375, -0.5714111328125, -0.537750244140625, -0.50408935546875, -0.470428466796875, -0.436767578125, -0.403106689453125, -0.36944580078125, -0.335784912109375, -0.3021240234375, -0.268463134765625, -0.23480224609375, -0.201141357421875, -0.16748046875, -0.133819580078125, -0.10015869140625, -0.066497802734375, -0.0328369140625, 0.000823974609375, 0.03448486328125, 0.068145751953125, 0.101806640625, 0.135467529296875, 0.16912841796875, 0.202789306640625, 0.2364501953125, 0.270111083984375, 0.30377197265625, 0.337432861328125, 0.37109375, 0.404754638671875, 0.43841552734375, 0.472076416015625, 0.5057373046875, 0.539398193359375, 0.57305908203125, 0.606719970703125, 0.640380859375, 0.674041748046875, 0.70770263671875, 0.741363525390625, 0.7750244140625, 0.808685302734375, 0.84234619140625, 0.876007080078125, 0.90966796875, 0.943328857421875, 0.97698974609375, 1.010650634765625, 1.0443115234375, 1.077972412109375, 1.11163330078125, 1.145294189453125, 1.178955078125, 1.212615966796875, 1.24627685546875, 1.279937744140625, 1.3135986328125, 1.347259521484375, 1.38092041015625, 1.414581298828125, 1.4482421875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 5.0, 4.0, 9.0, 4.0, 8.0, 28.0, 20.0, 36.0, 69.0, 125.0, 218.0, 437.0, 1011.0, 3180.0, 20365.0, 833644.0, 177482.0, 8594.0, 1823.0, 724.0, 327.0, 167.0, 80.0, 70.0, 35.0, 22.0, 18.0, 16.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.8161392211914062, -0.7904815673828125, -0.7648239135742188, -0.739166259765625, -0.7135086059570312, -0.6878509521484375, -0.6621932983398438, -0.63653564453125, -0.6108779907226562, -0.5852203369140625, -0.5595626831054688, -0.533905029296875, -0.5082473754882812, -0.4825897216796875, -0.45693206787109375, -0.4312744140625, -0.40561676025390625, -0.3799591064453125, -0.35430145263671875, -0.328643798828125, -0.30298614501953125, -0.2773284912109375, -0.25167083740234375, -0.22601318359375, -0.20035552978515625, -0.1746978759765625, -0.14904022216796875, -0.123382568359375, -0.09772491455078125, -0.0720672607421875, -0.04640960693359375, -0.020751953125, 0.00490570068359375, 0.0305633544921875, 0.05622100830078125, 0.081878662109375, 0.10753631591796875, 0.1331939697265625, 0.15885162353515625, 0.18450927734375, 0.21016693115234375, 0.2358245849609375, 0.26148223876953125, 0.287139892578125, 0.31279754638671875, 0.3384552001953125, 0.36411285400390625, 0.3897705078125, 0.41542816162109375, 0.4410858154296875, 0.46674346923828125, 0.492401123046875, 0.5180587768554688, 0.5437164306640625, 0.5693740844726562, 0.59503173828125, 0.6206893920898438, 0.6463470458984375, 0.6720046997070312, 0.697662353515625, 0.7233200073242188, 0.7489776611328125, 0.7746353149414062, 0.80029296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 3.0, 11.0, 8.0, 18.0, 9.0, 23.0, 24.0, 28.0, 28.0, 37.0, 52.0, 81.0, 103.0, 119.0, 100.0, 88.0, 62.0, 43.0, 34.0, 24.0, 15.0, 16.0, 16.0, 7.0, 4.0, 4.0, 7.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013399124145507812, -0.0001301141455769539, -0.00012623704969882965, -0.00012235995382070541, -0.00011848285794258118, -0.00011460576206445694, -0.0001107286661863327, -0.00010685157030820847, -0.00010297447443008423, -9.909737855195999e-05, -9.522028267383575e-05, -9.134318679571152e-05, -8.746609091758728e-05, -8.358899503946304e-05, -7.97118991613388e-05, -7.583480328321457e-05, -7.195770740509033e-05, -6.80806115269661e-05, -6.420351564884186e-05, -6.032641977071762e-05, -5.6449323892593384e-05, -5.257222801446915e-05, -4.869513213634491e-05, -4.481803625822067e-05, -4.0940940380096436e-05, -3.70638445019722e-05, -3.318674862384796e-05, -2.9309652745723724e-05, -2.5432556867599487e-05, -2.155546098947525e-05, -1.7678365111351013e-05, -1.3801269233226776e-05, -9.924173355102539e-06, -6.047077476978302e-06, -2.169981598854065e-06, 1.7071142792701721e-06, 5.584210157394409e-06, 9.461306035518646e-06, 1.3338401913642883e-05, 1.721549779176712e-05, 2.1092593669891357e-05, 2.4969689548015594e-05, 2.884678542613983e-05, 3.272388130426407e-05, 3.6600977182388306e-05, 4.047807306051254e-05, 4.435516893863678e-05, 4.823226481676102e-05, 5.2109360694885254e-05, 5.598645657300949e-05, 5.986355245113373e-05, 6.374064832925797e-05, 6.76177442073822e-05, 7.149484008550644e-05, 7.537193596363068e-05, 7.924903184175491e-05, 8.312612771987915e-05, 8.700322359800339e-05, 9.088031947612762e-05, 9.475741535425186e-05, 9.86345112323761e-05, 0.00010251160711050034, 0.00010638870298862457, 0.00011026579886674881, 0.00011414289474487305]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 8.0, 14.0, 17.0, 38.0, 41.0, 61.0, 85.0, 146.0, 285.0, 483.0, 1091.0, 3219.0, 14736.0, 229280.0, 762668.0, 28458.0, 4949.0, 1538.0, 613.0, 304.0, 190.0, 91.0, 63.0, 44.0, 40.0, 27.0, 9.0, 12.0, 10.0, 5.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6992568969726562, -0.6787872314453125, -0.6583175659179688, -0.637847900390625, -0.6173782348632812, -0.5969085693359375, -0.5764389038085938, -0.55596923828125, -0.5354995727539062, -0.5150299072265625, -0.49456024169921875, -0.474090576171875, -0.45362091064453125, -0.4331512451171875, -0.41268157958984375, -0.3922119140625, -0.37174224853515625, -0.3512725830078125, -0.33080291748046875, -0.310333251953125, -0.28986358642578125, -0.2693939208984375, -0.24892425537109375, -0.22845458984375, -0.20798492431640625, -0.1875152587890625, -0.16704559326171875, -0.146575927734375, -0.12610626220703125, -0.1056365966796875, -0.08516693115234375, -0.064697265625, -0.04422760009765625, -0.0237579345703125, -0.00328826904296875, 0.017181396484375, 0.03765106201171875, 0.0581207275390625, 0.07859039306640625, 0.09906005859375, 0.11952972412109375, 0.1399993896484375, 0.16046905517578125, 0.180938720703125, 0.20140838623046875, 0.2218780517578125, 0.24234771728515625, 0.2628173828125, 0.28328704833984375, 0.3037567138671875, 0.32422637939453125, 0.344696044921875, 0.36516571044921875, 0.3856353759765625, 0.40610504150390625, 0.42657470703125, 0.44704437255859375, 0.4675140380859375, 0.48798370361328125, 0.508453369140625, 0.5289230346679688, 0.5493927001953125, 0.5698623657226562, 0.59033203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 6.0, 10.0, 11.0, 8.0, 11.0, 14.0, 18.0, 23.0, 38.0, 45.0, 80.0, 99.0, 125.0, 117.0, 123.0, 70.0, 41.0, 53.0, 21.0, 17.0, 19.0, 15.0, 4.0, 10.0, 7.0, 7.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.52685546875, -0.5129890441894531, -0.49912261962890625, -0.4852561950683594, -0.4713897705078125, -0.4575233459472656, -0.44365692138671875, -0.4297904968261719, -0.415924072265625, -0.4020576477050781, -0.38819122314453125, -0.3743247985839844, -0.3604583740234375, -0.3465919494628906, -0.33272552490234375, -0.3188591003417969, -0.30499267578125, -0.2911262512207031, -0.27725982666015625, -0.2633934020996094, -0.2495269775390625, -0.23566055297851562, -0.22179412841796875, -0.20792770385742188, -0.194061279296875, -0.18019485473632812, -0.16632843017578125, -0.15246200561523438, -0.1385955810546875, -0.12472915649414062, -0.11086273193359375, -0.09699630737304688, -0.0831298828125, -0.06926345825195312, -0.05539703369140625, -0.041530609130859375, -0.0276641845703125, -0.013797760009765625, 6.866455078125e-05, 0.013935089111328125, 0.027801513671875, 0.041667938232421875, 0.05553436279296875, 0.06940078735351562, 0.0832672119140625, 0.09713363647460938, 0.11100006103515625, 0.12486648559570312, 0.13873291015625, 0.15259933471679688, 0.16646575927734375, 0.18033218383789062, 0.1941986083984375, 0.20806503295898438, 0.22193145751953125, 0.23579788208007812, 0.249664306640625, 0.2635307312011719, 0.27739715576171875, 0.2912635803222656, 0.3051300048828125, 0.3189964294433594, 0.33286285400390625, 0.3467292785644531, 0.360595703125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 8.0, 29.0, 66.0, 159.0, 274.0, 243.0, 125.0, 37.0, 23.0, 10.0, 8.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.0038423538208, -11.729766845703125, -11.45569133758545, -11.181615829467773, -10.907540321350098, -10.633464813232422, -10.359389305114746, -10.08531379699707, -9.811239242553711, -9.537163734436035, -9.26308822631836, -8.989012718200684, -8.714937210083008, -8.440861701965332, -8.166786193847656, -7.892711162567139, -7.618635177612305, -7.344559669494629, -7.070484161376953, -6.796408653259277, -6.522333145141602, -6.248257637023926, -5.974182605743408, -5.700107097625732, -5.426031589508057, -5.151956081390381, -4.877880573272705, -4.603805065155029, -4.329730033874512, -4.055654525756836, -3.78157901763916, -3.5075035095214844, -3.2334280014038086, -2.959352493286133, -2.685276985168457, -2.4112017154693604, -2.1371262073516846, -1.8630506992340088, -1.5889753103256226, -1.3148999214172363, -1.0408244132995605, -0.7667489647865295, -0.49267351627349854, -0.21859806776046753, 0.05547738075256348, 0.32955288887023926, 0.6036282777786255, 0.8777036666870117, 1.1517791748046875, 1.4258546829223633, 1.6999300718307495, 1.9740054607391357, 2.2480809688568115, 2.5221564769744873, 2.796231746673584, 3.0703072547912598, 3.3443827629089355, 3.6184582710266113, 3.892533779144287, 4.166609287261963, 4.4406843185424805, 4.714759826660156, 4.988835334777832, 5.262910842895508, 5.536986351013184]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 11.0, 7.0, 5.0, 9.0, 11.0, 11.0, 9.0, 22.0, 27.0, 23.0, 33.0, 38.0, 33.0, 32.0, 34.0, 57.0, 62.0, 57.0, 67.0, 61.0, 60.0, 50.0, 32.0, 37.0, 42.0, 19.0, 33.0, 20.0, 24.0, 13.0, 17.0, 11.0, 8.0, 10.0, 9.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.661123752593994, -3.5503969192504883, -3.4396703243255615, -3.3289434909820557, -3.21821665763855, -3.107490062713623, -2.996763229370117, -2.8860363960266113, -2.7753095626831055, -2.6645827293395996, -2.553856134414673, -2.443129301071167, -2.332402467727661, -2.2216758728027344, -2.1109490394592285, -2.0002222061157227, -1.8894954919815063, -1.77876877784729, -1.6680419445037842, -1.5573152303695679, -1.446588397026062, -1.3358616828918457, -1.2251348495483398, -1.1144081354141235, -1.0036814212799072, -0.8929546475410461, -0.7822278738021851, -0.6715011596679688, -0.5607743263244629, -0.4500476121902466, -0.3393208384513855, -0.22859406471252441, -0.11786723136901855, -0.007140465080738068, 0.10358630120754242, 0.2143130600452423, 0.3250398337841034, 0.4357665777206421, 0.5464933514595032, 0.6572201251983643, 0.7679468989372253, 0.8786736726760864, 0.9894004464149475, 1.1001272201538086, 1.210853934288025, 1.3215806484222412, 1.432307481765747, 1.543034315109253, 1.6537610292434692, 1.7644877433776855, 1.8752145767211914, 1.9859412908554077, 2.096668004989624, 2.20739483833313, 2.3181216716766357, 2.4288482666015625, 2.5395750999450684, 2.650301933288574, 2.761028528213501, 2.871755361557007, 2.9824821949005127, 3.0932087898254395, 3.2039356231689453, 3.314662456512451, 3.425389289855957]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 20.0, 17.0, 21.0, 28.0, 49.0, 74.0, 174.0, 620.0, 3348.0, 36471.0, 3619891.0, 518704.0, 12440.0, 1680.0, 383.0, 148.0, 71.0, 36.0, 32.0, 19.0, 14.0, 7.0, 7.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.904296875, -0.8775482177734375, -0.850799560546875, -0.8240509033203125, -0.79730224609375, -0.7705535888671875, -0.743804931640625, -0.7170562744140625, -0.6903076171875, -0.6635589599609375, -0.636810302734375, -0.6100616455078125, -0.58331298828125, -0.5565643310546875, -0.529815673828125, -0.5030670166015625, -0.476318359375, -0.4495697021484375, -0.422821044921875, -0.3960723876953125, -0.36932373046875, -0.3425750732421875, -0.315826416015625, -0.2890777587890625, -0.2623291015625, -0.2355804443359375, -0.208831787109375, -0.1820831298828125, -0.15533447265625, -0.1285858154296875, -0.101837158203125, -0.0750885009765625, -0.04833984375, -0.0215911865234375, 0.005157470703125, 0.0319061279296875, 0.05865478515625, 0.0854034423828125, 0.112152099609375, 0.1389007568359375, 0.1656494140625, 0.1923980712890625, 0.219146728515625, 0.2458953857421875, 0.27264404296875, 0.2993927001953125, 0.326141357421875, 0.3528900146484375, 0.379638671875, 0.4063873291015625, 0.433135986328125, 0.4598846435546875, 0.48663330078125, 0.5133819580078125, 0.540130615234375, 0.5668792724609375, 0.5936279296875, 0.6203765869140625, 0.647125244140625, 0.6738739013671875, 0.70062255859375, 0.7273712158203125, 0.754119873046875, 0.7808685302734375, 0.8076171875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 10.0, 5.0, 9.0, 8.0, 11.0, 14.0, 37.0, 46.0, 29.0, 49.0, 63.0, 59.0, 55.0, 75.0, 72.0, 65.0, 57.0, 55.0, 49.0, 44.0, 33.0, 29.0, 35.0, 16.0, 16.0, 12.0, 11.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201904296875, -0.1954517364501953, -0.18899917602539062, -0.18254661560058594, -0.17609405517578125, -0.16964149475097656, -0.16318893432617188, -0.1567363739013672, -0.1502838134765625, -0.1438312530517578, -0.13737869262695312, -0.13092613220214844, -0.12447357177734375, -0.11802101135253906, -0.11156845092773438, -0.10511589050292969, -0.098663330078125, -0.09221076965332031, -0.08575820922851562, -0.07930564880371094, -0.07285308837890625, -0.06640052795410156, -0.059947967529296875, -0.05349540710449219, -0.0470428466796875, -0.04059028625488281, -0.034137725830078125, -0.027685165405273438, -0.02123260498046875, -0.014780044555664062, -0.008327484130859375, -0.0018749237060546875, 0.00457763671875, 0.011030197143554688, 0.017482757568359375, 0.023935317993164062, 0.03038787841796875, 0.03684043884277344, 0.043292999267578125, 0.04974555969238281, 0.0561981201171875, 0.06265068054199219, 0.06910324096679688, 0.07555580139160156, 0.08200836181640625, 0.08846092224121094, 0.09491348266601562, 0.10136604309082031, 0.107818603515625, 0.11427116394042969, 0.12072372436523438, 0.12717628479003906, 0.13362884521484375, 0.14008140563964844, 0.14653396606445312, 0.1529865264892578, 0.1594390869140625, 0.1658916473388672, 0.17234420776367188, 0.17879676818847656, 0.18524932861328125, 0.19170188903808594, 0.19815444946289062, 0.2046070098876953, 0.2110595703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 1.0, 7.0, 5.0, 14.0, 9.0, 15.0, 20.0, 32.0, 51.0, 83.0, 136.0, 223.0, 380.0, 773.0, 1910.0, 5772.0, 21823.0, 136969.0, 2683311.0, 1242836.0, 79484.0, 14073.0, 3795.0, 1338.0, 534.0, 260.0, 160.0, 74.0, 63.0, 41.0, 15.0, 19.0, 16.0, 11.0, 6.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43017578125, -0.415283203125, -0.400390625, -0.385498046875, -0.37060546875, -0.355712890625, -0.3408203125, -0.325927734375, -0.31103515625, -0.296142578125, -0.28125, -0.266357421875, -0.25146484375, -0.236572265625, -0.2216796875, -0.206787109375, -0.19189453125, -0.177001953125, -0.162109375, -0.147216796875, -0.13232421875, -0.117431640625, -0.1025390625, -0.087646484375, -0.07275390625, -0.057861328125, -0.04296875, -0.028076171875, -0.01318359375, 0.001708984375, 0.0166015625, 0.031494140625, 0.04638671875, 0.061279296875, 0.076171875, 0.091064453125, 0.10595703125, 0.120849609375, 0.1357421875, 0.150634765625, 0.16552734375, 0.180419921875, 0.1953125, 0.210205078125, 0.22509765625, 0.239990234375, 0.2548828125, 0.269775390625, 0.28466796875, 0.299560546875, 0.314453125, 0.329345703125, 0.34423828125, 0.359130859375, 0.3740234375, 0.388916015625, 0.40380859375, 0.418701171875, 0.43359375, 0.448486328125, 0.46337890625, 0.478271484375, 0.4931640625, 0.508056640625, 0.52294921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 3.0, 11.0, 15.0, 12.0, 21.0, 28.0, 22.0, 30.0, 40.0, 47.0, 82.0, 165.0, 196.0, 260.0, 455.0, 641.0, 654.0, 489.0, 280.0, 177.0, 118.0, 98.0, 63.0, 36.0, 31.0, 30.0, 12.0, 12.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419921875, -0.4068260192871094, -0.39373016357421875, -0.3806343078613281, -0.3675384521484375, -0.3544425964355469, -0.34134674072265625, -0.3282508850097656, -0.315155029296875, -0.3020591735839844, -0.28896331787109375, -0.2758674621582031, -0.2627716064453125, -0.24967575073242188, -0.23657989501953125, -0.22348403930664062, -0.21038818359375, -0.19729232788085938, -0.18419647216796875, -0.17110061645507812, -0.1580047607421875, -0.14490890502929688, -0.13181304931640625, -0.11871719360351562, -0.105621337890625, -0.09252548217773438, -0.07942962646484375, -0.06633377075195312, -0.0532379150390625, -0.040142059326171875, -0.02704620361328125, -0.013950347900390625, -0.0008544921875, 0.012241363525390625, 0.02533721923828125, 0.038433074951171875, 0.0515289306640625, 0.06462478637695312, 0.07772064208984375, 0.09081649780273438, 0.103912353515625, 0.11700820922851562, 0.13010406494140625, 0.14319992065429688, 0.1562957763671875, 0.16939163208007812, 0.18248748779296875, 0.19558334350585938, 0.20867919921875, 0.22177505493164062, 0.23487091064453125, 0.24796676635742188, 0.2610626220703125, 0.2741584777832031, 0.28725433349609375, 0.3003501892089844, 0.313446044921875, 0.3265419006347656, 0.33963775634765625, 0.3527336120605469, 0.3658294677734375, 0.3789253234863281, 0.39202117919921875, 0.4051170349121094, 0.418212890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 12.0, 34.0, 150.0, 413.0, 301.0, 63.0, 14.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.2432918548584, -16.897762298583984, -16.55223274230957, -16.206703186035156, -15.861173629760742, -15.515644073486328, -15.170114517211914, -14.8245849609375, -14.479055404663086, -14.133525848388672, -13.787996292114258, -13.442466735839844, -13.09693717956543, -12.751407623291016, -12.405878067016602, -12.060348510742188, -11.714818954467773, -11.36928939819336, -11.023759841918945, -10.678230285644531, -10.332700729370117, -9.987171173095703, -9.641641616821289, -9.296112060546875, -8.950581550598145, -8.60505199432373, -8.259522438049316, -7.913992881774902, -7.568463325500488, -7.222933769226074, -6.87740421295166, -6.531874656677246, -6.186345100402832, -5.840815544128418, -5.495285987854004, -5.14975643157959, -4.804226875305176, -4.458697319030762, -4.113167762756348, -3.7676379680633545, -3.4221084117889404, -3.0765788555145264, -2.7310492992401123, -2.385519504547119, -2.039989948272705, -1.6944605112075806, -1.348930835723877, -1.003401279449463, -0.6578717231750488, -0.3123421370983124, 0.03318744897842407, 0.3787170648574829, 0.724246621131897, 1.069776177406311, 1.4153058528900146, 1.7608354091644287, 2.1063649654388428, 2.451894521713257, 2.797424077987671, 3.142953872680664, 3.488483428955078, 3.834012985229492, 4.179542541503906, 4.52507209777832, 4.870601654052734]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 5.0, 2.0, 4.0, 7.0, 7.0, 10.0, 10.0, 20.0, 21.0, 33.0, 22.0, 30.0, 24.0, 32.0, 43.0, 40.0, 27.0, 37.0, 44.0, 45.0, 52.0, 33.0, 52.0, 51.0, 44.0, 43.0, 33.0, 26.0, 33.0, 21.0, 21.0, 17.0, 17.0, 26.0, 9.0, 12.0, 8.0, 5.0, 7.0, 9.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.052689790725708, -1.9804867506027222, -1.9082838296890259, -1.83608078956604, -1.7638778686523438, -1.691674828529358, -1.619471788406372, -1.5472688674926758, -1.47506582736969, -1.402862787246704, -1.3306598663330078, -1.258456826210022, -1.1862537860870361, -1.1140508651733398, -1.041847825050354, -0.9696448445320129, -0.8974418640136719, -0.8252388834953308, -0.7530359029769897, -0.6808328628540039, -0.6086298823356628, -0.5364269018173218, -0.4642238914966583, -0.3920208811759949, -0.3198179006576538, -0.24761490523815155, -0.1754119098186493, -0.10320891439914703, -0.031005918979644775, 0.04119706153869629, 0.11340007185935974, 0.1856030821800232, 0.25780582427978516, 0.3300088047981262, 0.4022118151187897, 0.4744148254394531, 0.5466178059577942, 0.6188207864761353, 0.6910238265991211, 0.7632268071174622, 0.8354297876358032, 0.9076327681541443, 0.9798357486724854, 1.0520387887954712, 1.124241828918457, 1.1964447498321533, 1.2686477899551392, 1.340850830078125, 1.4130537509918213, 1.4852567911148071, 1.5574597120285034, 1.6296627521514893, 1.7018656730651855, 1.7740687131881714, 1.8462717533111572, 1.9184746742248535, 1.9906777143478394, 2.062880754470825, 2.1350836753845215, 2.2072865962982178, 2.279489755630493, 2.3516926765441895, 2.4238955974578857, 2.496098756790161, 2.5683016777038574]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 11.0, 4.0, 8.0, 6.0, 23.0, 23.0, 32.0, 49.0, 61.0, 106.0, 166.0, 299.0, 516.0, 882.0, 1697.0, 3578.0, 8014.0, 19844.0, 52870.0, 151186.0, 385726.0, 271309.0, 94513.0, 33467.0, 12974.0, 5640.0, 2578.0, 1279.0, 648.0, 393.0, 225.0, 132.0, 88.0, 77.0, 44.0, 30.0, 22.0, 8.0, 12.0, 5.0, 3.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364501953125, -0.35137939453125, -0.3382568359375, -0.32513427734375, -0.31201171875, -0.29888916015625, -0.2857666015625, -0.27264404296875, -0.259521484375, -0.24639892578125, -0.2332763671875, -0.22015380859375, -0.20703125, -0.19390869140625, -0.1807861328125, -0.16766357421875, -0.154541015625, -0.14141845703125, -0.1282958984375, -0.11517333984375, -0.10205078125, -0.08892822265625, -0.0758056640625, -0.06268310546875, -0.049560546875, -0.03643798828125, -0.0233154296875, -0.01019287109375, 0.0029296875, 0.01605224609375, 0.0291748046875, 0.04229736328125, 0.055419921875, 0.06854248046875, 0.0816650390625, 0.09478759765625, 0.10791015625, 0.12103271484375, 0.1341552734375, 0.14727783203125, 0.160400390625, 0.17352294921875, 0.1866455078125, 0.19976806640625, 0.212890625, 0.22601318359375, 0.2391357421875, 0.25225830078125, 0.265380859375, 0.27850341796875, 0.2916259765625, 0.30474853515625, 0.31787109375, 0.33099365234375, 0.3441162109375, 0.35723876953125, 0.370361328125, 0.38348388671875, 0.3966064453125, 0.40972900390625, 0.4228515625, 0.43597412109375, 0.4490966796875, 0.46221923828125, 0.475341796875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 2.0, 5.0, 3.0, 8.0, 10.0, 13.0, 10.0, 17.0, 31.0, 35.0, 32.0, 53.0, 53.0, 58.0, 69.0, 77.0, 61.0, 55.0, 42.0, 53.0, 56.0, 43.0, 39.0, 35.0, 30.0, 16.0, 26.0, 19.0, 7.0, 10.0, 8.0, 4.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.193603515625, -0.187255859375, -0.180908203125, -0.174560546875, -0.168212890625, -0.161865234375, -0.155517578125, -0.149169921875, -0.142822265625, -0.136474609375, -0.130126953125, -0.123779296875, -0.117431640625, -0.111083984375, -0.104736328125, -0.098388671875, -0.092041015625, -0.085693359375, -0.079345703125, -0.072998046875, -0.066650390625, -0.060302734375, -0.053955078125, -0.047607421875, -0.041259765625, -0.034912109375, -0.028564453125, -0.022216796875, -0.015869140625, -0.009521484375, -0.003173828125, 0.003173828125, 0.009521484375, 0.015869140625, 0.022216796875, 0.028564453125, 0.034912109375, 0.041259765625, 0.047607421875, 0.053955078125, 0.060302734375, 0.066650390625, 0.072998046875, 0.079345703125, 0.085693359375, 0.092041015625, 0.098388671875, 0.104736328125, 0.111083984375, 0.117431640625, 0.123779296875, 0.130126953125, 0.136474609375, 0.142822265625, 0.149169921875, 0.155517578125, 0.161865234375, 0.168212890625, 0.174560546875, 0.180908203125, 0.187255859375, 0.193603515625, 0.199951171875, 0.206298828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 9.0, 7.0, 18.0, 33.0, 44.0, 69.0, 144.0, 264.0, 531.0, 1187.0, 3430.0, 17867.0, 485431.0, 515788.0, 17827.0, 3453.0, 1271.0, 523.0, 277.0, 159.0, 94.0, 45.0, 29.0, 24.0, 12.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2138671875, -1.1720123291015625, -1.130157470703125, -1.0883026123046875, -1.04644775390625, -1.0045928955078125, -0.962738037109375, -0.9208831787109375, -0.8790283203125, -0.8371734619140625, -0.795318603515625, -0.7534637451171875, -0.71160888671875, -0.6697540283203125, -0.627899169921875, -0.5860443115234375, -0.544189453125, -0.5023345947265625, -0.460479736328125, -0.4186248779296875, -0.37677001953125, -0.3349151611328125, -0.293060302734375, -0.2512054443359375, -0.2093505859375, -0.1674957275390625, -0.125640869140625, -0.0837860107421875, -0.04193115234375, -7.62939453125e-05, 0.041778564453125, 0.0836334228515625, 0.12548828125, 0.1673431396484375, 0.209197998046875, 0.2510528564453125, 0.29290771484375, 0.3347625732421875, 0.376617431640625, 0.4184722900390625, 0.4603271484375, 0.5021820068359375, 0.544036865234375, 0.5858917236328125, 0.62774658203125, 0.6696014404296875, 0.711456298828125, 0.7533111572265625, 0.795166015625, 0.8370208740234375, 0.878875732421875, 0.9207305908203125, 0.96258544921875, 1.0044403076171875, 1.046295166015625, 1.0881500244140625, 1.1300048828125, 1.1718597412109375, 1.213714599609375, 1.2555694580078125, 1.29742431640625, 1.3392791748046875, 1.381134033203125, 1.4229888916015625, 1.46484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 13.0, 10.0, 15.0, 17.0, 21.0, 44.0, 52.0, 61.0, 54.0, 49.0, 52.0, 76.0, 75.0, 67.0, 79.0, 73.0, 50.0, 38.0, 30.0, 21.0, 24.0, 22.0, 11.0, 5.0, 6.0, 9.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.5966796875, -1.5577545166015625, -1.518829345703125, -1.4799041748046875, -1.44097900390625, -1.4020538330078125, -1.363128662109375, -1.3242034912109375, -1.2852783203125, -1.2463531494140625, -1.207427978515625, -1.1685028076171875, -1.12957763671875, -1.0906524658203125, -1.051727294921875, -1.0128021240234375, -0.973876953125, -0.9349517822265625, -0.896026611328125, -0.8571014404296875, -0.81817626953125, -0.7792510986328125, -0.740325927734375, -0.7014007568359375, -0.6624755859375, -0.6235504150390625, -0.584625244140625, -0.5457000732421875, -0.50677490234375, -0.4678497314453125, -0.428924560546875, -0.3899993896484375, -0.35107421875, -0.3121490478515625, -0.273223876953125, -0.2342987060546875, -0.19537353515625, -0.1564483642578125, -0.117523193359375, -0.0785980224609375, -0.0396728515625, -0.0007476806640625, 0.038177490234375, 0.0771026611328125, 0.11602783203125, 0.1549530029296875, 0.193878173828125, 0.2328033447265625, 0.271728515625, 0.3106536865234375, 0.349578857421875, 0.3885040283203125, 0.42742919921875, 0.4663543701171875, 0.505279541015625, 0.5442047119140625, 0.5831298828125, 0.6220550537109375, 0.660980224609375, 0.6999053955078125, 0.73883056640625, 0.7777557373046875, 0.816680908203125, 0.8556060791015625, 0.89453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 9.0, 4.0, 12.0, 19.0, 14.0, 32.0, 32.0, 65.0, 134.0, 225.0, 467.0, 1055.0, 3202.0, 15121.0, 174019.0, 800635.0, 43811.0, 6448.0, 1758.0, 695.0, 315.0, 190.0, 103.0, 63.0, 34.0, 29.0, 18.0, 11.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.609375, -0.591583251953125, -0.57379150390625, -0.555999755859375, -0.5382080078125, -0.520416259765625, -0.50262451171875, -0.484832763671875, -0.467041015625, -0.449249267578125, -0.43145751953125, -0.413665771484375, -0.3958740234375, -0.378082275390625, -0.36029052734375, -0.342498779296875, -0.32470703125, -0.306915283203125, -0.28912353515625, -0.271331787109375, -0.2535400390625, -0.235748291015625, -0.21795654296875, -0.200164794921875, -0.182373046875, -0.164581298828125, -0.14678955078125, -0.128997802734375, -0.1112060546875, -0.093414306640625, -0.07562255859375, -0.057830810546875, -0.0400390625, -0.022247314453125, -0.00445556640625, 0.013336181640625, 0.0311279296875, 0.048919677734375, 0.06671142578125, 0.084503173828125, 0.102294921875, 0.120086669921875, 0.13787841796875, 0.155670166015625, 0.1734619140625, 0.191253662109375, 0.20904541015625, 0.226837158203125, 0.24462890625, 0.262420654296875, 0.28021240234375, 0.298004150390625, 0.3157958984375, 0.333587646484375, 0.35137939453125, 0.369171142578125, 0.386962890625, 0.404754638671875, 0.42254638671875, 0.440338134765625, 0.4581298828125, 0.475921630859375, 0.49371337890625, 0.511505126953125, 0.529296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 5.0, 9.0, 5.0, 12.0, 8.0, 16.0, 15.0, 19.0, 21.0, 35.0, 30.0, 47.0, 44.0, 59.0, 71.0, 75.0, 77.0, 62.0, 70.0, 62.0, 56.0, 33.0, 29.0, 30.0, 23.0, 14.0, 16.0, 14.0, 15.0, 4.0, 9.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0001323223114013672, -0.0001287553459405899, -0.00012518838047981262, -0.00012162141501903534, -0.00011805444955825806, -0.00011448748409748077, -0.00011092051863670349, -0.00010735355317592621, -0.00010378658771514893, -0.00010021962225437164, -9.665265679359436e-05, -9.308569133281708e-05, -8.95187258720398e-05, -8.595176041126251e-05, -8.238479495048523e-05, -7.881782948970795e-05, -7.525086402893066e-05, -7.168389856815338e-05, -6.81169331073761e-05, -6.454996764659882e-05, -6.098300218582153e-05, -5.741603672504425e-05, -5.384907126426697e-05, -5.0282105803489685e-05, -4.67151403427124e-05, -4.314817488193512e-05, -3.958120942115784e-05, -3.6014243960380554e-05, -3.244727849960327e-05, -2.888031303882599e-05, -2.5313347578048706e-05, -2.1746382117271423e-05, -1.817941665649414e-05, -1.4612451195716858e-05, -1.1045485734939575e-05, -7.4785202741622925e-06, -3.91155481338501e-06, -3.4458935260772705e-07, 3.2223761081695557e-06, 6.789341568946838e-06, 1.0356307029724121e-05, 1.3923272490501404e-05, 1.7490237951278687e-05, 2.105720341205597e-05, 2.4624168872833252e-05, 2.8191134333610535e-05, 3.175809979438782e-05, 3.53250652551651e-05, 3.889203071594238e-05, 4.2458996176719666e-05, 4.602596163749695e-05, 4.959292709827423e-05, 5.3159892559051514e-05, 5.6726858019828796e-05, 6.029382348060608e-05, 6.386078894138336e-05, 6.742775440216064e-05, 7.099471986293793e-05, 7.456168532371521e-05, 7.812865078449249e-05, 8.169561624526978e-05, 8.526258170604706e-05, 8.882954716682434e-05, 9.239651262760162e-05, 9.59634780883789e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 0.0, 8.0, 8.0, 9.0, 10.0, 15.0, 32.0, 54.0, 83.0, 173.0, 257.0, 686.0, 2007.0, 8895.0, 135885.0, 870459.0, 24248.0, 3801.0, 1047.0, 425.0, 187.0, 97.0, 52.0, 38.0, 25.0, 19.0, 10.0, 9.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.87939453125, -0.8551254272460938, -0.8308563232421875, -0.8065872192382812, -0.782318115234375, -0.7580490112304688, -0.7337799072265625, -0.7095108032226562, -0.68524169921875, -0.6609725952148438, -0.6367034912109375, -0.6124343872070312, -0.588165283203125, -0.5638961791992188, -0.5396270751953125, -0.5153579711914062, -0.4910888671875, -0.46681976318359375, -0.4425506591796875, -0.41828155517578125, -0.394012451171875, -0.36974334716796875, -0.3454742431640625, -0.32120513916015625, -0.29693603515625, -0.27266693115234375, -0.2483978271484375, -0.22412872314453125, -0.199859619140625, -0.17559051513671875, -0.1513214111328125, -0.12705230712890625, -0.102783203125, -0.07851409912109375, -0.0542449951171875, -0.02997589111328125, -0.005706787109375, 0.01856231689453125, 0.0428314208984375, 0.06710052490234375, 0.09136962890625, 0.11563873291015625, 0.1399078369140625, 0.16417694091796875, 0.188446044921875, 0.21271514892578125, 0.2369842529296875, 0.26125335693359375, 0.2855224609375, 0.30979156494140625, 0.3340606689453125, 0.35832977294921875, 0.382598876953125, 0.40686798095703125, 0.4311370849609375, 0.45540618896484375, 0.47967529296875, 0.5039443969726562, 0.5282135009765625, 0.5524826049804688, 0.576751708984375, 0.6010208129882812, 0.6252899169921875, 0.6495590209960938, 0.673828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 13.0, 15.0, 22.0, 30.0, 34.0, 47.0, 61.0, 83.0, 108.0, 99.0, 105.0, 98.0, 78.0, 62.0, 37.0, 21.0, 13.0, 13.0, 9.0, 11.0, 8.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.54296875, -0.5287208557128906, -0.5144729614257812, -0.5002250671386719, -0.4859771728515625, -0.4717292785644531, -0.45748138427734375, -0.4432334899902344, -0.428985595703125, -0.4147377014160156, -0.40048980712890625, -0.3862419128417969, -0.3719940185546875, -0.3577461242675781, -0.34349822998046875, -0.3292503356933594, -0.31500244140625, -0.3007545471191406, -0.28650665283203125, -0.2722587585449219, -0.2580108642578125, -0.24376296997070312, -0.22951507568359375, -0.21526718139648438, -0.201019287109375, -0.18677139282226562, -0.17252349853515625, -0.15827560424804688, -0.1440277099609375, -0.12977981567382812, -0.11553192138671875, -0.10128402709960938, -0.0870361328125, -0.07278823852539062, -0.05854034423828125, -0.044292449951171875, -0.0300445556640625, -0.015796661376953125, -0.00154876708984375, 0.012699127197265625, 0.026947021484375, 0.041194915771484375, 0.05544281005859375, 0.06969070434570312, 0.0839385986328125, 0.09818649291992188, 0.11243438720703125, 0.12668228149414062, 0.14093017578125, 0.15517807006835938, 0.16942596435546875, 0.18367385864257812, 0.1979217529296875, 0.21216964721679688, 0.22641754150390625, 0.24066543579101562, 0.254913330078125, 0.2691612243652344, 0.28340911865234375, 0.2976570129394531, 0.3119049072265625, 0.3261528015136719, 0.34040069580078125, 0.3546485900878906, 0.368896484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 9.0, 15.0, 31.0, 72.0, 110.0, 196.0, 250.0, 134.0, 75.0, 35.0, 25.0, 15.0, 9.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.048914909362793, -5.83397102355957, -5.619027137756348, -5.404083251953125, -5.189139366149902, -4.97419548034668, -4.759251594543457, -4.544307708740234, -4.329363822937012, -4.114419937133789, -3.8994760513305664, -3.6845321655273438, -3.469588279724121, -3.2546443939208984, -3.0397002696990967, -2.824756383895874, -2.6098122596740723, -2.3948683738708496, -2.179924488067627, -1.9649804830551147, -1.750036597251892, -1.5350927114486694, -1.3201487064361572, -1.1052048206329346, -0.8902609348297119, -0.6753170490264893, -0.4603731036186218, -0.2454291582107544, -0.03048527240753174, 0.18445861339569092, 0.3994026184082031, 0.6143465042114258, 0.8292899131774902, 1.044233798980713, 1.2591776847839355, 1.4741216897964478, 1.6890655755996704, 1.904009461402893, 2.1189534664154053, 2.333897352218628, 2.5488412380218506, 2.7637851238250732, 2.978729009628296, 3.1936731338500977, 3.4086170196533203, 3.623560905456543, 3.8385047912597656, 4.053448677062988, 4.268392562866211, 4.483336448669434, 4.698280334472656, 4.913224220275879, 5.128168106079102, 5.343111991882324, 5.558055877685547, 5.7729997634887695, 5.987943649291992, 6.202887535095215, 6.4178314208984375, 6.63277530670166, 6.847719192504883, 7.0626630783081055, 7.277606964111328, 7.492550849914551, 7.707495212554932]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 3.0, 4.0, 13.0, 5.0, 9.0, 21.0, 15.0, 19.0, 25.0, 25.0, 23.0, 34.0, 39.0, 40.0, 37.0, 42.0, 40.0, 57.0, 65.0, 56.0, 37.0, 54.0, 37.0, 29.0, 40.0, 39.0, 32.0, 20.0, 14.0, 20.0, 13.0, 15.0, 16.0, 15.0, 9.0, 9.0, 10.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.35766339302063, -3.2456111907958984, -3.133558988571167, -3.0215067863464355, -2.909454822540283, -2.7974026203155518, -2.6853504180908203, -2.573298215866089, -2.4612460136413574, -2.349193811416626, -2.2371416091918945, -2.125089645385742, -2.0130374431610107, -1.9009852409362793, -1.7889330387115479, -1.6768808364868164, -1.564828872680664, -1.4527766704559326, -1.3407245874404907, -1.2286723852157593, -1.1166203022003174, -1.004568099975586, -0.8925158977508545, -0.7804637551307678, -0.6684116125106812, -0.5563594698905945, -0.4443072974681854, -0.33225512504577637, -0.2202029824256897, -0.10815083980560303, 0.003901362419128418, 0.11595350503921509, 0.22800588607788086, 0.34005802869796753, 0.4521102011203766, 0.5641623735427856, 0.6762145161628723, 0.788266658782959, 0.9003188610076904, 1.0123710632324219, 1.1244231462478638, 1.2364753484725952, 1.348527431488037, 1.4605796337127686, 1.5726318359375, 1.684683918952942, 1.7967361211776733, 1.9087882041931152, 2.0208404064178467, 2.132892608642578, 2.2449448108673096, 2.356997013092041, 2.4690489768981934, 2.581101179122925, 2.6931533813476562, 2.8052055835723877, 2.917257785797119, 3.0293099880218506, 3.141362190246582, 3.2534141540527344, 3.365466356277466, 3.4775185585021973, 3.5895707607269287, 3.70162296295166, 3.8136749267578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 13.0, 13.0, 15.0, 29.0, 49.0, 79.0, 157.0, 317.0, 726.0, 1666.0, 4762.0, 17324.0, 111431.0, 2894953.0, 1092376.0, 54001.0, 10574.0, 3231.0, 1248.0, 573.0, 282.0, 196.0, 91.0, 47.0, 37.0, 14.0, 23.0, 14.0, 16.0, 3.0, 5.0, 1.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.33251953125, -0.3191375732421875, -0.305755615234375, -0.2923736572265625, -0.27899169921875, -0.2656097412109375, -0.252227783203125, -0.2388458251953125, -0.2254638671875, -0.2120819091796875, -0.198699951171875, -0.1853179931640625, -0.17193603515625, -0.1585540771484375, -0.145172119140625, -0.1317901611328125, -0.118408203125, -0.1050262451171875, -0.091644287109375, -0.0782623291015625, -0.06488037109375, -0.0514984130859375, -0.038116455078125, -0.0247344970703125, -0.0113525390625, 0.0020294189453125, 0.015411376953125, 0.0287933349609375, 0.04217529296875, 0.0555572509765625, 0.068939208984375, 0.0823211669921875, 0.095703125, 0.1090850830078125, 0.122467041015625, 0.1358489990234375, 0.14923095703125, 0.1626129150390625, 0.175994873046875, 0.1893768310546875, 0.2027587890625, 0.2161407470703125, 0.229522705078125, 0.2429046630859375, 0.25628662109375, 0.2696685791015625, 0.283050537109375, 0.2964324951171875, 0.309814453125, 0.3231964111328125, 0.336578369140625, 0.3499603271484375, 0.36334228515625, 0.3767242431640625, 0.390106201171875, 0.4034881591796875, 0.4168701171875, 0.4302520751953125, 0.443634033203125, 0.4570159912109375, 0.47039794921875, 0.4837799072265625, 0.497161865234375, 0.5105438232421875, 0.52392578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 2.0, 4.0, 4.0, 14.0, 13.0, 12.0, 16.0, 30.0, 30.0, 36.0, 49.0, 53.0, 53.0, 70.0, 62.0, 65.0, 55.0, 74.0, 65.0, 56.0, 37.0, 47.0, 31.0, 27.0, 25.0, 15.0, 15.0, 13.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.186279296875, -0.17932510375976562, -0.17237091064453125, -0.16541671752929688, -0.1584625244140625, -0.15150833129882812, -0.14455413818359375, -0.13759994506835938, -0.130645751953125, -0.12369155883789062, -0.11673736572265625, -0.10978317260742188, -0.1028289794921875, -0.09587478637695312, -0.08892059326171875, -0.08196640014648438, -0.07501220703125, -0.06805801391601562, -0.06110382080078125, -0.054149627685546875, -0.0471954345703125, -0.040241241455078125, -0.03328704833984375, -0.026332855224609375, -0.019378662109375, -0.012424468994140625, -0.00547027587890625, 0.001483917236328125, 0.0084381103515625, 0.015392303466796875, 0.02234649658203125, 0.029300689697265625, 0.0362548828125, 0.043209075927734375, 0.05016326904296875, 0.057117462158203125, 0.0640716552734375, 0.07102584838867188, 0.07798004150390625, 0.08493423461914062, 0.091888427734375, 0.09884262084960938, 0.10579681396484375, 0.11275100708007812, 0.1197052001953125, 0.12665939331054688, 0.13361358642578125, 0.14056777954101562, 0.14752197265625, 0.15447616577148438, 0.16143035888671875, 0.16838455200195312, 0.1753387451171875, 0.18229293823242188, 0.18924713134765625, 0.19620132446289062, 0.203155517578125, 0.21010971069335938, 0.21706390380859375, 0.22401809692382812, 0.2309722900390625, 0.23792648315429688, 0.24488067626953125, 0.2518348693847656, 0.2587890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 7.0, 15.0, 14.0, 34.0, 37.0, 64.0, 104.0, 144.0, 256.0, 497.0, 1019.0, 2422.0, 7580.0, 34120.0, 324734.0, 3518839.0, 265292.0, 29104.0, 6101.0, 1956.0, 816.0, 461.0, 241.0, 125.0, 110.0, 53.0, 32.0, 22.0, 16.0, 9.0, 10.0, 7.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4140625, -0.39898681640625, -0.3839111328125, -0.36883544921875, -0.353759765625, -0.33868408203125, -0.3236083984375, -0.30853271484375, -0.29345703125, -0.27838134765625, -0.2633056640625, -0.24822998046875, -0.233154296875, -0.21807861328125, -0.2030029296875, -0.18792724609375, -0.1728515625, -0.15777587890625, -0.1427001953125, -0.12762451171875, -0.112548828125, -0.09747314453125, -0.0823974609375, -0.06732177734375, -0.05224609375, -0.03717041015625, -0.0220947265625, -0.00701904296875, 0.008056640625, 0.02313232421875, 0.0382080078125, 0.05328369140625, 0.068359375, 0.08343505859375, 0.0985107421875, 0.11358642578125, 0.128662109375, 0.14373779296875, 0.1588134765625, 0.17388916015625, 0.18896484375, 0.20404052734375, 0.2191162109375, 0.23419189453125, 0.249267578125, 0.26434326171875, 0.2794189453125, 0.29449462890625, 0.3095703125, 0.32464599609375, 0.3397216796875, 0.35479736328125, 0.369873046875, 0.38494873046875, 0.4000244140625, 0.41510009765625, 0.43017578125, 0.44525146484375, 0.4603271484375, 0.47540283203125, 0.490478515625, 0.50555419921875, 0.5206298828125, 0.53570556640625, 0.55078125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 2.0, 6.0, 8.0, 14.0, 23.0, 38.0, 47.0, 76.0, 115.0, 215.0, 392.0, 913.0, 1033.0, 534.0, 272.0, 140.0, 71.0, 58.0, 34.0, 28.0, 20.0, 8.0, 10.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66015625, -0.6413803100585938, -0.6226043701171875, -0.6038284301757812, -0.585052490234375, -0.5662765502929688, -0.5475006103515625, -0.5287246704101562, -0.50994873046875, -0.49117279052734375, -0.4723968505859375, -0.45362091064453125, -0.434844970703125, -0.41606903076171875, -0.3972930908203125, -0.37851715087890625, -0.3597412109375, -0.34096527099609375, -0.3221893310546875, -0.30341339111328125, -0.284637451171875, -0.26586151123046875, -0.2470855712890625, -0.22830963134765625, -0.20953369140625, -0.19075775146484375, -0.1719818115234375, -0.15320587158203125, -0.134429931640625, -0.11565399169921875, -0.0968780517578125, -0.07810211181640625, -0.059326171875, -0.04055023193359375, -0.0217742919921875, -0.00299835205078125, 0.015777587890625, 0.03455352783203125, 0.0533294677734375, 0.07210540771484375, 0.09088134765625, 0.10965728759765625, 0.1284332275390625, 0.14720916748046875, 0.165985107421875, 0.18476104736328125, 0.2035369873046875, 0.22231292724609375, 0.2410888671875, 0.25986480712890625, 0.2786407470703125, 0.29741668701171875, 0.316192626953125, 0.33496856689453125, 0.3537445068359375, 0.37252044677734375, 0.39129638671875, 0.41007232666015625, 0.4288482666015625, 0.44762420654296875, 0.466400146484375, 0.48517608642578125, 0.5039520263671875, 0.5227279663085938, 0.54150390625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 6.0, 26.0, 64.0, 161.0, 313.0, 258.0, 102.0, 31.0, 11.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21705961227417, -5.012783527374268, -4.808507919311523, -4.604231834411621, -4.399955749511719, -4.195680141448975, -3.9914040565490723, -3.787128210067749, -3.582852363586426, -3.3785765171051025, -3.1743004322052, -2.970024585723877, -2.7657487392425537, -2.5614728927612305, -2.357196807861328, -2.152920961380005, -1.9486448764801025, -1.7443689107894897, -1.5400930643081665, -1.3358170986175537, -1.1315412521362305, -0.9272652864456177, -0.7229893207550049, -0.5187134742736816, -0.31443750858306885, -0.11016158759593964, 0.09411433339118958, 0.29839026927948, 0.502666175365448, 0.706942081451416, 0.9112180471420288, 1.115493893623352, 1.3197698593139648, 1.5240458250045776, 1.7283216714859009, 1.9325976371765137, 2.136873483657837, 2.34114933013916, 2.5454254150390625, 2.7497012615203857, 2.953977108001709, 3.1582529544830322, 3.3625290393829346, 3.566804885864258, 3.771080732345581, 3.9753565788269043, 4.179632663726807, 4.383908271789551, 4.588184356689453, 4.7924604415893555, 4.9967360496521, 5.201012134552002, 5.405288219451904, 5.609563827514648, 5.813839912414551, 6.018115997314453, 6.2223920822143555, 6.426668167114258, 6.630943775177002, 6.835219860076904, 7.039495944976807, 7.243771553039551, 7.448047637939453, 7.6523237228393555, 7.8565993309021]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 2.0, 8.0, 3.0, 8.0, 11.0, 10.0, 10.0, 15.0, 19.0, 17.0, 16.0, 25.0, 26.0, 34.0, 30.0, 37.0, 33.0, 45.0, 54.0, 42.0, 59.0, 49.0, 44.0, 38.0, 45.0, 43.0, 36.0, 39.0, 28.0, 32.0, 24.0, 25.0, 19.0, 16.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.229215621948242, -2.1623589992523193, -2.0955023765563965, -2.0286459922790527, -1.9617893695831299, -1.894932746887207, -1.8280762434005737, -1.7612197399139404, -1.6943631172180176, -1.6275064945220947, -1.5606499910354614, -1.4937934875488281, -1.4269368648529053, -1.3600802421569824, -1.2932237386703491, -1.2263672351837158, -1.159510612487793, -1.0926539897918701, -1.0257974863052368, -0.9589409232139587, -0.8920843601226807, -0.8252277970314026, -0.7583712339401245, -0.6915146708488464, -0.6246581077575684, -0.5578015446662903, -0.4909449815750122, -0.42408841848373413, -0.35723185539245605, -0.290375292301178, -0.2235187292098999, -0.15666216611862183, -0.08980584144592285, -0.022949278354644775, 0.0439072847366333, 0.11076384782791138, 0.17762041091918945, 0.24447697401046753, 0.3113335371017456, 0.3781901001930237, 0.44504666328430176, 0.5119032263755798, 0.5787597894668579, 0.645616352558136, 0.7124729156494141, 0.7793294787406921, 0.8461860418319702, 0.9130426049232483, 0.9798991680145264, 1.0467557907104492, 1.1136122941970825, 1.1804687976837158, 1.2473254203796387, 1.3141820430755615, 1.3810385465621948, 1.4478950500488281, 1.514751672744751, 1.5816082954406738, 1.6484647989273071, 1.7153213024139404, 1.7821779251098633, 1.8490345478057861, 1.9158910512924194, 1.9827475547790527, 2.0496041774749756]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 9.0, 20.0, 28.0, 47.0, 84.0, 131.0, 237.0, 472.0, 970.0, 2544.0, 6826.0, 23086.0, 99484.0, 492421.0, 334327.0, 63401.0, 15831.0, 5059.0, 1867.0, 799.0, 400.0, 208.0, 96.0, 66.0, 45.0, 21.0, 16.0, 13.0, 13.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5927734375, -0.5735626220703125, -0.554351806640625, -0.5351409912109375, -0.51593017578125, -0.4967193603515625, -0.477508544921875, -0.4582977294921875, -0.4390869140625, -0.4198760986328125, -0.400665283203125, -0.3814544677734375, -0.36224365234375, -0.3430328369140625, -0.323822021484375, -0.3046112060546875, -0.285400390625, -0.2661895751953125, -0.246978759765625, -0.2277679443359375, -0.20855712890625, -0.1893463134765625, -0.170135498046875, -0.1509246826171875, -0.1317138671875, -0.1125030517578125, -0.093292236328125, -0.0740814208984375, -0.05487060546875, -0.0356597900390625, -0.016448974609375, 0.0027618408203125, 0.02197265625, 0.0411834716796875, 0.060394287109375, 0.0796051025390625, 0.09881591796875, 0.1180267333984375, 0.137237548828125, 0.1564483642578125, 0.1756591796875, 0.1948699951171875, 0.214080810546875, 0.2332916259765625, 0.25250244140625, 0.2717132568359375, 0.290924072265625, 0.3101348876953125, 0.329345703125, 0.3485565185546875, 0.367767333984375, 0.3869781494140625, 0.40618896484375, 0.4253997802734375, 0.444610595703125, 0.4638214111328125, 0.4830322265625, 0.5022430419921875, 0.521453857421875, 0.5406646728515625, 0.55987548828125, 0.5790863037109375, 0.598297119140625, 0.6175079345703125, 0.63671875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 3.0, 5.0, 4.0, 9.0, 18.0, 15.0, 22.0, 35.0, 36.0, 37.0, 51.0, 55.0, 62.0, 48.0, 62.0, 60.0, 75.0, 56.0, 68.0, 54.0, 44.0, 34.0, 33.0, 26.0, 17.0, 17.0, 15.0, 13.0, 7.0, 4.0, 7.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1907958984375, -0.18406295776367188, -0.17733001708984375, -0.17059707641601562, -0.1638641357421875, -0.15713119506835938, -0.15039825439453125, -0.14366531372070312, -0.136932373046875, -0.13019943237304688, -0.12346649169921875, -0.11673355102539062, -0.1100006103515625, -0.10326766967773438, -0.09653472900390625, -0.08980178833007812, -0.08306884765625, -0.07633590698242188, -0.06960296630859375, -0.06287002563476562, -0.0561370849609375, -0.049404144287109375, -0.04267120361328125, -0.035938262939453125, -0.029205322265625, -0.022472381591796875, -0.01573944091796875, -0.009006500244140625, -0.0022735595703125, 0.004459381103515625, 0.01119232177734375, 0.017925262451171875, 0.024658203125, 0.031391143798828125, 0.03812408447265625, 0.044857025146484375, 0.0515899658203125, 0.058322906494140625, 0.06505584716796875, 0.07178878784179688, 0.078521728515625, 0.08525466918945312, 0.09198760986328125, 0.09872055053710938, 0.1054534912109375, 0.11218643188476562, 0.11891937255859375, 0.12565231323242188, 0.13238525390625, 0.13911819458007812, 0.14585113525390625, 0.15258407592773438, 0.1593170166015625, 0.16604995727539062, 0.17278289794921875, 0.17951583862304688, 0.186248779296875, 0.19298171997070312, 0.19971466064453125, 0.20644760131835938, 0.2131805419921875, 0.21991348266601562, 0.22664642333984375, 0.23337936401367188, 0.2401123046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 15.0, 4.0, 26.0, 26.0, 55.0, 87.0, 138.0, 270.0, 604.0, 1554.0, 6946.0, 88050.0, 904599.0, 39638.0, 4354.0, 1174.0, 490.0, 189.0, 121.0, 68.0, 50.0, 22.0, 24.0, 11.0, 10.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.5316162109375, -1.487060546875, -1.4425048828125, -1.39794921875, -1.3533935546875, -1.308837890625, -1.2642822265625, -1.2197265625, -1.1751708984375, -1.130615234375, -1.0860595703125, -1.04150390625, -0.9969482421875, -0.952392578125, -0.9078369140625, -0.86328125, -0.8187255859375, -0.774169921875, -0.7296142578125, -0.68505859375, -0.6405029296875, -0.595947265625, -0.5513916015625, -0.5068359375, -0.4622802734375, -0.417724609375, -0.3731689453125, -0.32861328125, -0.2840576171875, -0.239501953125, -0.1949462890625, -0.150390625, -0.1058349609375, -0.061279296875, -0.0167236328125, 0.02783203125, 0.0723876953125, 0.116943359375, 0.1614990234375, 0.2060546875, 0.2506103515625, 0.295166015625, 0.3397216796875, 0.38427734375, 0.4288330078125, 0.473388671875, 0.5179443359375, 0.5625, 0.6070556640625, 0.651611328125, 0.6961669921875, 0.74072265625, 0.7852783203125, 0.829833984375, 0.8743896484375, 0.9189453125, 0.9635009765625, 1.008056640625, 1.0526123046875, 1.09716796875, 1.1417236328125, 1.186279296875, 1.2308349609375, 1.275390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 4.0, 5.0, 4.0, 4.0, 9.0, 11.0, 6.0, 11.0, 15.0, 17.0, 28.0, 31.0, 44.0, 44.0, 45.0, 54.0, 73.0, 74.0, 61.0, 79.0, 43.0, 63.0, 48.0, 40.0, 40.0, 33.0, 28.0, 12.0, 20.0, 6.0, 10.0, 12.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0185546875, -0.9913482666015625, -0.964141845703125, -0.9369354248046875, -0.90972900390625, -0.8825225830078125, -0.855316162109375, -0.8281097412109375, -0.8009033203125, -0.7736968994140625, -0.746490478515625, -0.7192840576171875, -0.69207763671875, -0.6648712158203125, -0.637664794921875, -0.6104583740234375, -0.583251953125, -0.5560455322265625, -0.528839111328125, -0.5016326904296875, -0.47442626953125, -0.4472198486328125, -0.420013427734375, -0.3928070068359375, -0.3656005859375, -0.3383941650390625, -0.311187744140625, -0.2839813232421875, -0.25677490234375, -0.2295684814453125, -0.202362060546875, -0.1751556396484375, -0.14794921875, -0.1207427978515625, -0.093536376953125, -0.0663299560546875, -0.03912353515625, -0.0119171142578125, 0.015289306640625, 0.0424957275390625, 0.0697021484375, 0.0969085693359375, 0.124114990234375, 0.1513214111328125, 0.17852783203125, 0.2057342529296875, 0.232940673828125, 0.2601470947265625, 0.287353515625, 0.3145599365234375, 0.341766357421875, 0.3689727783203125, 0.39617919921875, 0.4233856201171875, 0.450592041015625, 0.4777984619140625, 0.5050048828125, 0.5322113037109375, 0.559417724609375, 0.5866241455078125, 0.61383056640625, 0.6410369873046875, 0.668243408203125, 0.6954498291015625, 0.72265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 2.0, 4.0, 5.0, 8.0, 15.0, 19.0, 35.0, 47.0, 81.0, 157.0, 377.0, 1017.0, 4009.0, 40631.0, 920899.0, 73268.0, 5811.0, 1293.0, 453.0, 174.0, 98.0, 57.0, 33.0, 24.0, 11.0, 3.0, 6.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66064453125, -0.6397323608398438, -0.6188201904296875, -0.5979080200195312, -0.576995849609375, -0.5560836791992188, -0.5351715087890625, -0.5142593383789062, -0.49334716796875, -0.47243499755859375, -0.4515228271484375, -0.43061065673828125, -0.409698486328125, -0.38878631591796875, -0.3678741455078125, -0.34696197509765625, -0.3260498046875, -0.30513763427734375, -0.2842254638671875, -0.26331329345703125, -0.242401123046875, -0.22148895263671875, -0.2005767822265625, -0.17966461181640625, -0.15875244140625, -0.13784027099609375, -0.1169281005859375, -0.09601593017578125, -0.075103759765625, -0.05419158935546875, -0.0332794189453125, -0.01236724853515625, 0.008544921875, 0.02945709228515625, 0.0503692626953125, 0.07128143310546875, 0.092193603515625, 0.11310577392578125, 0.1340179443359375, 0.15493011474609375, 0.17584228515625, 0.19675445556640625, 0.2176666259765625, 0.23857879638671875, 0.259490966796875, 0.28040313720703125, 0.3013153076171875, 0.32222747802734375, 0.3431396484375, 0.36405181884765625, 0.3849639892578125, 0.40587615966796875, 0.426788330078125, 0.44770050048828125, 0.4686126708984375, 0.48952484130859375, 0.51043701171875, 0.5313491821289062, 0.5522613525390625, 0.5731735229492188, 0.594085693359375, 0.6149978637695312, 0.6359100341796875, 0.6568222045898438, 0.677734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 6.0, 9.0, 6.0, 13.0, 16.0, 17.0, 23.0, 37.0, 39.0, 53.0, 70.0, 117.0, 144.0, 142.0, 76.0, 54.0, 36.0, 29.0, 20.0, 16.0, 17.0, 12.0, 11.0, 6.0, 8.0, 6.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.910894393920898e-05, -8.535105735063553e-05, -8.159317076206207e-05, -7.783528417348862e-05, -7.407739758491516e-05, -7.03195109963417e-05, -6.656162440776825e-05, -6.28037378191948e-05, -5.904585123062134e-05, -5.528796464204788e-05, -5.1530078053474426e-05, -4.777219146490097e-05, -4.4014304876327515e-05, -4.025641828775406e-05, -3.64985316991806e-05, -3.274064511060715e-05, -2.898275852203369e-05, -2.5224871933460236e-05, -2.146698534488678e-05, -1.7709098756313324e-05, -1.3951212167739868e-05, -1.0193325579166412e-05, -6.4354389905929565e-06, -2.6775524020195007e-06, 1.080334186553955e-06, 4.838220775127411e-06, 8.596107363700867e-06, 1.2353993952274323e-05, 1.611188054084778e-05, 1.9869767129421234e-05, 2.362765371799469e-05, 2.7385540306568146e-05, 3.11434268951416e-05, 3.490131348371506e-05, 3.865920007228851e-05, 4.241708666086197e-05, 4.6174973249435425e-05, 4.993285983800888e-05, 5.3690746426582336e-05, 5.744863301515579e-05, 6.120651960372925e-05, 6.49644061923027e-05, 6.872229278087616e-05, 7.248017936944962e-05, 7.623806595802307e-05, 7.999595254659653e-05, 8.375383913516998e-05, 8.751172572374344e-05, 9.12696123123169e-05, 9.502749890089035e-05, 9.87853854894638e-05, 0.00010254327207803726, 0.00010630115866661072, 0.00011005904525518417, 0.00011381693184375763, 0.00011757481843233109, 0.00012133270502090454, 0.000125090591609478, 0.00012884847819805145, 0.0001326063647866249, 0.00013636425137519836, 0.00014012213796377182, 0.00014388002455234528, 0.00014763791114091873, 0.0001513957977294922]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 7.0, 18.0, 25.0, 41.0, 67.0, 106.0, 229.0, 407.0, 978.0, 3479.0, 19025.0, 522602.0, 477111.0, 19075.0, 3493.0, 964.0, 431.0, 221.0, 107.0, 51.0, 36.0, 20.0, 14.0, 8.0, 9.0, 6.0, 8.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64404296875, -0.625640869140625, -0.60723876953125, -0.588836669921875, -0.5704345703125, -0.552032470703125, -0.53363037109375, -0.515228271484375, -0.496826171875, -0.478424072265625, -0.46002197265625, -0.441619873046875, -0.4232177734375, -0.404815673828125, -0.38641357421875, -0.368011474609375, -0.349609375, -0.331207275390625, -0.31280517578125, -0.294403076171875, -0.2760009765625, -0.257598876953125, -0.23919677734375, -0.220794677734375, -0.202392578125, -0.183990478515625, -0.16558837890625, -0.147186279296875, -0.1287841796875, -0.110382080078125, -0.09197998046875, -0.073577880859375, -0.05517578125, -0.036773681640625, -0.01837158203125, 3.0517578125e-05, 0.0184326171875, 0.036834716796875, 0.05523681640625, 0.073638916015625, 0.092041015625, 0.110443115234375, 0.12884521484375, 0.147247314453125, 0.1656494140625, 0.184051513671875, 0.20245361328125, 0.220855712890625, 0.2392578125, 0.257659912109375, 0.27606201171875, 0.294464111328125, 0.3128662109375, 0.331268310546875, 0.34967041015625, 0.368072509765625, 0.386474609375, 0.404876708984375, 0.42327880859375, 0.441680908203125, 0.4600830078125, 0.478485107421875, 0.49688720703125, 0.515289306640625, 0.53369140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 6.0, 10.0, 8.0, 14.0, 13.0, 9.0, 21.0, 30.0, 39.0, 54.0, 81.0, 106.0, 136.0, 121.0, 92.0, 77.0, 46.0, 23.0, 23.0, 22.0, 13.0, 10.0, 9.0, 5.0, 6.0, 3.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.3099098205566406, -0.29779815673828125, -0.2856864929199219, -0.2735748291015625, -0.2614631652832031, -0.24935150146484375, -0.23723983764648438, -0.225128173828125, -0.21301651000976562, -0.20090484619140625, -0.18879318237304688, -0.1766815185546875, -0.16456985473632812, -0.15245819091796875, -0.14034652709960938, -0.12823486328125, -0.11612319946289062, -0.10401153564453125, -0.09189987182617188, -0.0797882080078125, -0.06767654418945312, -0.05556488037109375, -0.043453216552734375, -0.031341552734375, -0.019229888916015625, -0.00711822509765625, 0.004993438720703125, 0.0171051025390625, 0.029216766357421875, 0.04132843017578125, 0.053440093994140625, 0.0655517578125, 0.07766342163085938, 0.08977508544921875, 0.10188674926757812, 0.1139984130859375, 0.12611007690429688, 0.13822174072265625, 0.15033340454101562, 0.162445068359375, 0.17455673217773438, 0.18666839599609375, 0.19878005981445312, 0.2108917236328125, 0.22300338745117188, 0.23511505126953125, 0.24722671508789062, 0.25933837890625, 0.2714500427246094, 0.28356170654296875, 0.2956733703613281, 0.3077850341796875, 0.3198966979980469, 0.33200836181640625, 0.3441200256347656, 0.356231689453125, 0.3683433532714844, 0.38045501708984375, 0.3925666809082031, 0.4046783447265625, 0.4167900085449219, 0.42890167236328125, 0.4410133361816406, 0.453125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 8.0, 17.0, 43.0, 66.0, 119.0, 197.0, 251.0, 156.0, 70.0, 28.0, 15.0, 9.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.248492240905762, -7.053330421447754, -6.858168125152588, -6.66300630569458, -6.467844009399414, -6.272682189941406, -6.077520370483398, -5.882358551025391, -5.687196254730225, -5.492034435272217, -5.296872138977051, -5.101710319519043, -4.906548500061035, -4.711386203765869, -4.516224384307861, -4.321062088012695, -4.1259002685546875, -3.9307382106781006, -3.7355761528015137, -3.540414333343506, -3.345252275466919, -3.150090217590332, -2.954928398132324, -2.7597663402557373, -2.5646042823791504, -2.3694422245025635, -2.1742801666259766, -1.9791183471679688, -1.7839562892913818, -1.588794231414795, -1.3936322927474976, -1.1984703540802002, -1.0033082962036133, -0.8081462979316711, -0.612984299659729, -0.41782230138778687, -0.22266030311584473, -0.027498304843902588, 0.16766369342803955, 0.3628256320953369, 0.5579876899719238, 0.753149688243866, 0.9483116865158081, 1.1434736251831055, 1.3386356830596924, 1.5337977409362793, 1.7289596796035767, 1.924121618270874, 2.119283676147461, 2.314445734024048, 2.5096077919006348, 2.7047696113586426, 2.8999316692352295, 3.0950937271118164, 3.290255546569824, 3.485417604446411, 3.680579662322998, 3.875741720199585, 4.070903778076172, 4.26606559753418, 4.4612274169921875, 4.6563897132873535, 4.851551532745361, 5.046713829040527, 5.241875648498535]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 13.0, 6.0, 13.0, 10.0, 10.0, 20.0, 35.0, 32.0, 36.0, 43.0, 41.0, 69.0, 80.0, 66.0, 61.0, 72.0, 60.0, 46.0, 46.0, 28.0, 39.0, 34.0, 28.0, 22.0, 18.0, 17.0, 12.0, 5.0, 12.0, 3.0, 4.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5050852298736572, -3.396188735961914, -3.287292242050171, -3.1783957481384277, -3.0694992542266846, -2.9606027603149414, -2.8517065048217773, -2.742809772491455, -2.633913516998291, -2.525017023086548, -2.4161205291748047, -2.3072240352630615, -2.1983275413513184, -2.089431047439575, -1.9805346727371216, -1.8716381788253784, -1.7627415657043457, -1.6538450717926025, -1.5449485778808594, -1.4360520839691162, -1.327155590057373, -1.2182590961456299, -1.1093627214431763, -1.000466227531433, -0.8915697336196899, -0.7826732397079468, -0.6737767457962036, -0.5648803114891052, -0.45598381757736206, -0.3470873236656189, -0.2381908893585205, -0.12929439544677734, -0.020397663116455078, 0.08849881589412689, 0.19739529490470886, 0.30629175901412964, 0.4151882529258728, 0.524084746837616, 0.6329811811447144, 0.7418776750564575, 0.8507741689682007, 0.9596706628799438, 1.068567156791687, 1.1774635314941406, 1.2863600254058838, 1.395256519317627, 1.5041530132293701, 1.6130495071411133, 1.7219460010528564, 1.8308424949645996, 1.9397389888763428, 2.048635482788086, 2.157531976699829, 2.2664284706115723, 2.3753247261047363, 2.4842214584350586, 2.5931177139282227, 2.702014207839966, 2.810910701751709, 2.919807195663452, 3.0287036895751953, 3.1376001834869385, 3.2464966773986816, 3.3553929328918457, 3.464289665222168]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 10.0, 17.0, 14.0, 23.0, 48.0, 71.0, 117.0, 250.0, 512.0, 1323.0, 3936.0, 17400.0, 344443.0, 3757122.0, 56495.0, 8276.0, 2429.0, 902.0, 398.0, 168.0, 107.0, 66.0, 41.0, 20.0, 28.0, 12.0, 11.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.552734375, -0.5338516235351562, -0.5149688720703125, -0.49608612060546875, -0.477203369140625, -0.45832061767578125, -0.4394378662109375, -0.42055511474609375, -0.40167236328125, -0.38278961181640625, -0.3639068603515625, -0.34502410888671875, -0.326141357421875, -0.30725860595703125, -0.2883758544921875, -0.26949310302734375, -0.2506103515625, -0.23172760009765625, -0.2128448486328125, -0.19396209716796875, -0.175079345703125, -0.15619659423828125, -0.1373138427734375, -0.11843109130859375, -0.09954833984375, -0.08066558837890625, -0.0617828369140625, -0.04290008544921875, -0.024017333984375, -0.00513458251953125, 0.0137481689453125, 0.03263092041015625, 0.051513671875, 0.07039642333984375, 0.0892791748046875, 0.10816192626953125, 0.127044677734375, 0.14592742919921875, 0.1648101806640625, 0.18369293212890625, 0.20257568359375, 0.22145843505859375, 0.2403411865234375, 0.25922393798828125, 0.278106689453125, 0.29698944091796875, 0.3158721923828125, 0.33475494384765625, 0.3536376953125, 0.37252044677734375, 0.3914031982421875, 0.41028594970703125, 0.429168701171875, 0.44805145263671875, 0.4669342041015625, 0.48581695556640625, 0.50469970703125, 0.5235824584960938, 0.5424652099609375, 0.5613479614257812, 0.580230712890625, 0.5991134643554688, 0.6179962158203125, 0.6368789672851562, 0.65576171875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 13.0, 23.0, 31.0, 52.0, 63.0, 73.0, 97.0, 96.0, 89.0, 112.0, 103.0, 66.0, 55.0, 46.0, 41.0, 12.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396484375, -0.3861656188964844, -0.37584686279296875, -0.3655281066894531, -0.3552093505859375, -0.3448905944824219, -0.33457183837890625, -0.3242530822753906, -0.313934326171875, -0.3036155700683594, -0.29329681396484375, -0.2829780578613281, -0.2726593017578125, -0.2623405456542969, -0.25202178955078125, -0.24170303344726562, -0.23138427734375, -0.22106552124023438, -0.21074676513671875, -0.20042800903320312, -0.1901092529296875, -0.17979049682617188, -0.16947174072265625, -0.15915298461914062, -0.148834228515625, -0.13851547241210938, -0.12819671630859375, -0.11787796020507812, -0.1075592041015625, -0.09724044799804688, -0.08692169189453125, -0.07660293579101562, -0.0662841796875, -0.055965423583984375, -0.04564666748046875, -0.035327911376953125, -0.0250091552734375, -0.014690399169921875, -0.00437164306640625, 0.005947113037109375, 0.016265869140625, 0.026584625244140625, 0.03690338134765625, 0.047222137451171875, 0.0575408935546875, 0.06785964965820312, 0.07817840576171875, 0.08849716186523438, 0.09881591796875, 0.10913467407226562, 0.11945343017578125, 0.12977218627929688, 0.1400909423828125, 0.15040969848632812, 0.16072845458984375, 0.17104721069335938, 0.181365966796875, 0.19168472290039062, 0.20200347900390625, 0.21232223510742188, 0.2226409912109375, 0.23295974731445312, 0.24327850341796875, 0.2535972595214844, 0.263916015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 11.0, 4.0, 8.0, 18.0, 24.0, 17.0, 36.0, 30.0, 58.0, 80.0, 114.0, 196.0, 264.0, 448.0, 799.0, 1565.0, 3700.0, 11946.0, 62166.0, 1745370.0, 2281030.0, 66937.0, 12028.0, 3646.0, 1708.0, 822.0, 423.0, 268.0, 164.0, 128.0, 87.0, 45.0, 42.0, 27.0, 9.0, 22.0, 12.0, 5.0, 8.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.5068359375, -0.4919395446777344, -0.47704315185546875, -0.4621467590332031, -0.4472503662109375, -0.4323539733886719, -0.41745758056640625, -0.4025611877441406, -0.387664794921875, -0.3727684020996094, -0.35787200927734375, -0.3429756164550781, -0.3280792236328125, -0.3131828308105469, -0.29828643798828125, -0.2833900451660156, -0.26849365234375, -0.2535972595214844, -0.23870086669921875, -0.22380447387695312, -0.2089080810546875, -0.19401168823242188, -0.17911529541015625, -0.16421890258789062, -0.149322509765625, -0.13442611694335938, -0.11952972412109375, -0.10463333129882812, -0.0897369384765625, -0.07484054565429688, -0.05994415283203125, -0.045047760009765625, -0.0301513671875, -0.015254974365234375, -0.00035858154296875, 0.014537811279296875, 0.0294342041015625, 0.044330596923828125, 0.05922698974609375, 0.07412338256835938, 0.089019775390625, 0.10391616821289062, 0.11881256103515625, 0.13370895385742188, 0.1486053466796875, 0.16350173950195312, 0.17839813232421875, 0.19329452514648438, 0.20819091796875, 0.22308731079101562, 0.23798370361328125, 0.2528800964355469, 0.2677764892578125, 0.2826728820800781, 0.29756927490234375, 0.3124656677246094, 0.327362060546875, 0.3422584533691406, 0.35715484619140625, 0.3720512390136719, 0.3869476318359375, 0.4018440246582031, 0.41674041748046875, 0.4316368103027344, 0.446533203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 9.0, 12.0, 12.0, 18.0, 23.0, 53.0, 45.0, 87.0, 99.0, 199.0, 502.0, 1024.0, 980.0, 433.0, 203.0, 116.0, 72.0, 53.0, 33.0, 28.0, 12.0, 8.0, 15.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.43750762939453125, -0.4233551025390625, -0.40920257568359375, -0.395050048828125, -0.38089752197265625, -0.3667449951171875, -0.35259246826171875, -0.33843994140625, -0.32428741455078125, -0.3101348876953125, -0.29598236083984375, -0.281829833984375, -0.26767730712890625, -0.2535247802734375, -0.23937225341796875, -0.2252197265625, -0.21106719970703125, -0.1969146728515625, -0.18276214599609375, -0.168609619140625, -0.15445709228515625, -0.1403045654296875, -0.12615203857421875, -0.11199951171875, -0.09784698486328125, -0.0836944580078125, -0.06954193115234375, -0.055389404296875, -0.04123687744140625, -0.0270843505859375, -0.01293182373046875, 0.001220703125, 0.01537322998046875, 0.0295257568359375, 0.04367828369140625, 0.057830810546875, 0.07198333740234375, 0.0861358642578125, 0.10028839111328125, 0.11444091796875, 0.12859344482421875, 0.1427459716796875, 0.15689849853515625, 0.171051025390625, 0.18520355224609375, 0.1993560791015625, 0.21350860595703125, 0.2276611328125, 0.24181365966796875, 0.2559661865234375, 0.27011871337890625, 0.284271240234375, 0.29842376708984375, 0.3125762939453125, 0.32672882080078125, 0.34088134765625, 0.35503387451171875, 0.3691864013671875, 0.38333892822265625, 0.397491455078125, 0.41164398193359375, 0.4257965087890625, 0.43994903564453125, 0.4541015625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 10.0, 16.0, 49.0, 135.0, 283.0, 304.0, 122.0, 47.0, 14.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.207853317260742, -6.019106388092041, -5.83035945892334, -5.6416120529174805, -5.452865123748779, -5.264118194580078, -5.075370788574219, -4.886623859405518, -4.697876930236816, -4.509130001068115, -4.320383071899414, -4.131635665893555, -3.9428887367248535, -3.7541418075561523, -3.565394639968872, -3.376647472381592, -3.1879005432128906, -2.9991536140441895, -2.810406446456909, -2.621659278869629, -2.4329123497009277, -2.2441654205322266, -2.0554182529449463, -1.8666712045669556, -1.6779241561889648, -1.4891771078109741, -1.3004300594329834, -1.1116830110549927, -0.922935962677002, -0.7341889142990112, -0.5454418659210205, -0.3566948175430298, -0.16794776916503906, 0.02079927921295166, 0.20954632759094238, 0.3982933759689331, 0.5870404243469238, 0.7757874727249146, 0.9645345211029053, 1.153281569480896, 1.3420286178588867, 1.5307756662368774, 1.7195227146148682, 1.9082697629928589, 2.0970168113708496, 2.285763740539551, 2.474510908126831, 2.6632580757141113, 2.8520050048828125, 3.0407519340515137, 3.229499101638794, 3.418246269226074, 3.6069931983947754, 3.7957401275634766, 3.984487295150757, 4.173234462738037, 4.361981391906738, 4.5507283210754395, 4.739475250244141, 4.92822265625, 5.116969585418701, 5.305716514587402, 5.494463920593262, 5.683210849761963, 5.871957778930664]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 12.0, 10.0, 11.0, 15.0, 21.0, 16.0, 32.0, 32.0, 15.0, 31.0, 36.0, 37.0, 45.0, 37.0, 47.0, 43.0, 41.0, 54.0, 46.0, 35.0, 43.0, 33.0, 29.0, 42.0, 36.0, 34.0, 22.0, 23.0, 16.0, 14.0, 16.0, 8.0, 14.0, 4.0, 8.0, 7.0, 2.0, 3.0, 0.0, 3.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5050184726715088, -1.4553773403167725, -1.4057360887527466, -1.3560948371887207, -1.3064537048339844, -1.256812572479248, -1.2071713209152222, -1.1575300693511963, -1.10788893699646, -1.0582478046417236, -1.0086065530776978, -0.9589653611183167, -0.9093241691589355, -0.8596829771995544, -0.8100417852401733, -0.7604005932807922, -0.7107594013214111, -0.66111820936203, -0.6114770174026489, -0.5618358254432678, -0.5121946334838867, -0.4625534415245056, -0.4129122495651245, -0.3632710576057434, -0.3136298656463623, -0.2639886736869812, -0.2143474817276001, -0.164706289768219, -0.11506509780883789, -0.06542390584945679, -0.015782713890075684, 0.03385847806930542, 0.08349967002868652, 0.13314086198806763, 0.18278205394744873, 0.23242324590682983, 0.28206443786621094, 0.33170562982559204, 0.38134682178497314, 0.43098801374435425, 0.48062920570373535, 0.5302703976631165, 0.5799115896224976, 0.6295527815818787, 0.6791939735412598, 0.7288351655006409, 0.778476357460022, 0.8281175494194031, 0.8777587413787842, 0.9273999333381653, 0.9770411252975464, 1.0266823768615723, 1.0763235092163086, 1.125964641571045, 1.1756058931350708, 1.2252471446990967, 1.274888277053833, 1.3245294094085693, 1.3741706609725952, 1.423811912536621, 1.4734530448913574, 1.5230941772460938, 1.5727354288101196, 1.6223766803741455, 1.6720178127288818]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 8.0, 7.0, 13.0, 30.0, 36.0, 58.0, 102.0, 201.0, 444.0, 1398.0, 5727.0, 45333.0, 669596.0, 300414.0, 20293.0, 3228.0, 926.0, 341.0, 165.0, 101.0, 35.0, 29.0, 24.0, 11.0, 11.0, 8.0, 7.0, 5.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.712890625, -0.6863174438476562, -0.6597442626953125, -0.6331710815429688, -0.606597900390625, -0.5800247192382812, -0.5534515380859375, -0.5268783569335938, -0.50030517578125, -0.47373199462890625, -0.4471588134765625, -0.42058563232421875, -0.394012451171875, -0.36743927001953125, -0.3408660888671875, -0.31429290771484375, -0.2877197265625, -0.26114654541015625, -0.2345733642578125, -0.20800018310546875, -0.181427001953125, -0.15485382080078125, -0.1282806396484375, -0.10170745849609375, -0.07513427734375, -0.04856109619140625, -0.0219879150390625, 0.00458526611328125, 0.031158447265625, 0.05773162841796875, 0.0843048095703125, 0.11087799072265625, 0.137451171875, 0.16402435302734375, 0.1905975341796875, 0.21717071533203125, 0.243743896484375, 0.27031707763671875, 0.2968902587890625, 0.32346343994140625, 0.35003662109375, 0.37660980224609375, 0.4031829833984375, 0.42975616455078125, 0.456329345703125, 0.48290252685546875, 0.5094757080078125, 0.5360488891601562, 0.5626220703125, 0.5891952514648438, 0.6157684326171875, 0.6423416137695312, 0.668914794921875, 0.6954879760742188, 0.7220611572265625, 0.7486343383789062, 0.77520751953125, 0.8017807006835938, 0.8283538818359375, 0.8549270629882812, 0.881500244140625, 0.9080734252929688, 0.9346466064453125, 0.9612197875976562, 0.98779296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 11.0, 14.0, 21.0, 29.0, 48.0, 59.0, 82.0, 87.0, 109.0, 107.0, 82.0, 78.0, 73.0, 71.0, 42.0, 31.0, 27.0, 9.0, 12.0, 6.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.376708984375, -0.366668701171875, -0.35662841796875, -0.346588134765625, -0.3365478515625, -0.326507568359375, -0.31646728515625, -0.306427001953125, -0.29638671875, -0.286346435546875, -0.27630615234375, -0.266265869140625, -0.2562255859375, -0.246185302734375, -0.23614501953125, -0.226104736328125, -0.216064453125, -0.206024169921875, -0.19598388671875, -0.185943603515625, -0.1759033203125, -0.165863037109375, -0.15582275390625, -0.145782470703125, -0.1357421875, -0.125701904296875, -0.11566162109375, -0.105621337890625, -0.0955810546875, -0.085540771484375, -0.07550048828125, -0.065460205078125, -0.055419921875, -0.045379638671875, -0.03533935546875, -0.025299072265625, -0.0152587890625, -0.005218505859375, 0.00482177734375, 0.014862060546875, 0.02490234375, 0.034942626953125, 0.04498291015625, 0.055023193359375, 0.0650634765625, 0.075103759765625, 0.08514404296875, 0.095184326171875, 0.105224609375, 0.115264892578125, 0.12530517578125, 0.135345458984375, 0.1453857421875, 0.155426025390625, 0.16546630859375, 0.175506591796875, 0.185546875, 0.195587158203125, 0.20562744140625, 0.215667724609375, 0.2257080078125, 0.235748291015625, 0.24578857421875, 0.255828857421875, 0.265869140625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 5.0, 9.0, 12.0, 12.0, 13.0, 25.0, 38.0, 56.0, 71.0, 114.0, 155.0, 333.0, 784.0, 2113.0, 7827.0, 53837.0, 703657.0, 248922.0, 23514.0, 4439.0, 1371.0, 551.0, 224.0, 167.0, 67.0, 64.0, 38.0, 31.0, 25.0, 15.0, 12.0, 8.0, 11.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7236328125, -0.7039718627929688, -0.6843109130859375, -0.6646499633789062, -0.644989013671875, -0.6253280639648438, -0.6056671142578125, -0.5860061645507812, -0.56634521484375, -0.5466842651367188, -0.5270233154296875, -0.5073623657226562, -0.487701416015625, -0.46804046630859375, -0.4483795166015625, -0.42871856689453125, -0.4090576171875, -0.38939666748046875, -0.3697357177734375, -0.35007476806640625, -0.330413818359375, -0.31075286865234375, -0.2910919189453125, -0.27143096923828125, -0.25177001953125, -0.23210906982421875, -0.2124481201171875, -0.19278717041015625, -0.173126220703125, -0.15346527099609375, -0.1338043212890625, -0.11414337158203125, -0.094482421875, -0.07482147216796875, -0.0551605224609375, -0.03549957275390625, -0.015838623046875, 0.00382232666015625, 0.0234832763671875, 0.04314422607421875, 0.06280517578125, 0.08246612548828125, 0.1021270751953125, 0.12178802490234375, 0.141448974609375, 0.16110992431640625, 0.1807708740234375, 0.20043182373046875, 0.2200927734375, 0.23975372314453125, 0.2594146728515625, 0.27907562255859375, 0.298736572265625, 0.31839752197265625, 0.3380584716796875, 0.35771942138671875, 0.37738037109375, 0.39704132080078125, 0.4167022705078125, 0.43636322021484375, 0.456024169921875, 0.47568511962890625, 0.4953460693359375, 0.5150070190429688, 0.53466796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 11.0, 21.0, 29.0, 43.0, 46.0, 47.0, 54.0, 65.0, 66.0, 72.0, 78.0, 77.0, 62.0, 74.0, 53.0, 47.0, 42.0, 28.0, 21.0, 20.0, 12.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93603515625, -0.9078140258789062, -0.8795928955078125, -0.8513717651367188, -0.823150634765625, -0.7949295043945312, -0.7667083740234375, -0.7384872436523438, -0.71026611328125, -0.6820449829101562, -0.6538238525390625, -0.6256027221679688, -0.597381591796875, -0.5691604614257812, -0.5409393310546875, -0.5127182006835938, -0.4844970703125, -0.45627593994140625, -0.4280548095703125, -0.39983367919921875, -0.371612548828125, -0.34339141845703125, -0.3151702880859375, -0.28694915771484375, -0.25872802734375, -0.23050689697265625, -0.2022857666015625, -0.17406463623046875, -0.145843505859375, -0.11762237548828125, -0.0894012451171875, -0.06118011474609375, -0.032958984375, -0.00473785400390625, 0.0234832763671875, 0.05170440673828125, 0.079925537109375, 0.10814666748046875, 0.1363677978515625, 0.16458892822265625, 0.19281005859375, 0.22103118896484375, 0.2492523193359375, 0.27747344970703125, 0.305694580078125, 0.33391571044921875, 0.3621368408203125, 0.39035797119140625, 0.4185791015625, 0.44680023193359375, 0.4750213623046875, 0.5032424926757812, 0.531463623046875, 0.5596847534179688, 0.5879058837890625, 0.6161270141601562, 0.64434814453125, 0.6725692749023438, 0.7007904052734375, 0.7290115356445312, 0.757232666015625, 0.7854537963867188, 0.8136749267578125, 0.8418960571289062, 0.8701171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 9.0, 14.0, 17.0, 44.0, 80.0, 178.0, 474.0, 1778.0, 10743.0, 142688.0, 850764.0, 35758.0, 4511.0, 911.0, 325.0, 109.0, 47.0, 26.0, 21.0, 16.0, 10.0, 10.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3798828125, -0.3684654235839844, -0.35704803466796875, -0.3456306457519531, -0.3342132568359375, -0.3227958679199219, -0.31137847900390625, -0.2999610900878906, -0.288543701171875, -0.2771263122558594, -0.26570892333984375, -0.2542915344238281, -0.2428741455078125, -0.23145675659179688, -0.22003936767578125, -0.20862197875976562, -0.19720458984375, -0.18578720092773438, -0.17436981201171875, -0.16295242309570312, -0.1515350341796875, -0.14011764526367188, -0.12870025634765625, -0.11728286743164062, -0.105865478515625, -0.09444808959960938, -0.08303070068359375, -0.07161331176757812, -0.0601959228515625, -0.048778533935546875, -0.03736114501953125, -0.025943756103515625, -0.0145263671875, -0.003108978271484375, 0.00830841064453125, 0.019725799560546875, 0.0311431884765625, 0.042560577392578125, 0.05397796630859375, 0.06539535522460938, 0.076812744140625, 0.08823013305664062, 0.09964752197265625, 0.11106491088867188, 0.1224822998046875, 0.13389968872070312, 0.14531707763671875, 0.15673446655273438, 0.16815185546875, 0.17956924438476562, 0.19098663330078125, 0.20240402221679688, 0.2138214111328125, 0.22523880004882812, 0.23665618896484375, 0.24807357788085938, 0.259490966796875, 0.2709083557128906, 0.28232574462890625, 0.2937431335449219, 0.3051605224609375, 0.3165779113769531, 0.32799530029296875, 0.3394126892089844, 0.350830078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 6.0, 7.0, 2.0, 10.0, 11.0, 19.0, 31.0, 58.0, 74.0, 101.0, 114.0, 153.0, 136.0, 75.0, 59.0, 32.0, 24.0, 24.0, 17.0, 8.0, 7.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010478496551513672, -0.00010211393237113953, -9.944289922714233e-05, -9.677186608314514e-05, -9.410083293914795e-05, -9.142979979515076e-05, -8.875876665115356e-05, -8.608773350715637e-05, -8.341670036315918e-05, -8.074566721916199e-05, -7.80746340751648e-05, -7.54036009311676e-05, -7.273256778717041e-05, -7.006153464317322e-05, -6.739050149917603e-05, -6.471946835517883e-05, -6.204843521118164e-05, -5.937740206718445e-05, -5.6706368923187256e-05, -5.4035335779190063e-05, -5.136430263519287e-05, -4.869326949119568e-05, -4.6022236347198486e-05, -4.3351203203201294e-05, -4.06801700592041e-05, -3.800913691520691e-05, -3.533810377120972e-05, -3.2667070627212524e-05, -2.9996037483215332e-05, -2.732500433921814e-05, -2.4653971195220947e-05, -2.1982938051223755e-05, -1.9311904907226562e-05, -1.664087176322937e-05, -1.3969838619232178e-05, -1.1298805475234985e-05, -8.627772331237793e-06, -5.956739187240601e-06, -3.285706043243408e-06, -6.146728992462158e-07, 2.0563602447509766e-06, 4.727393388748169e-06, 7.398426532745361e-06, 1.0069459676742554e-05, 1.2740492820739746e-05, 1.541152596473694e-05, 1.808255910873413e-05, 2.0753592252731323e-05, 2.3424625396728516e-05, 2.6095658540725708e-05, 2.87666916847229e-05, 3.143772482872009e-05, 3.4108757972717285e-05, 3.677979111671448e-05, 3.945082426071167e-05, 4.212185740470886e-05, 4.4792890548706055e-05, 4.746392369270325e-05, 5.013495683670044e-05, 5.280598998069763e-05, 5.5477023124694824e-05, 5.8148056268692017e-05, 6.081908941268921e-05, 6.34901225566864e-05, 6.61611557006836e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 5.0, 6.0, 11.0, 16.0, 39.0, 54.0, 167.0, 571.0, 2757.0, 25498.0, 920559.0, 92083.0, 5431.0, 926.0, 252.0, 81.0, 38.0, 25.0, 9.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.373779296875, -0.3579978942871094, -0.34221649169921875, -0.3264350891113281, -0.3106536865234375, -0.2948722839355469, -0.27909088134765625, -0.2633094787597656, -0.247528076171875, -0.23174667358398438, -0.21596527099609375, -0.20018386840820312, -0.1844024658203125, -0.16862106323242188, -0.15283966064453125, -0.13705825805664062, -0.12127685546875, -0.10549545288085938, -0.08971405029296875, -0.07393264770507812, -0.0581512451171875, -0.042369842529296875, -0.02658843994140625, -0.010807037353515625, 0.004974365234375, 0.020755767822265625, 0.03653717041015625, 0.052318572998046875, 0.0680999755859375, 0.08388137817382812, 0.09966278076171875, 0.11544418334960938, 0.1312255859375, 0.14700698852539062, 0.16278839111328125, 0.17856979370117188, 0.1943511962890625, 0.21013259887695312, 0.22591400146484375, 0.24169540405273438, 0.257476806640625, 0.2732582092285156, 0.28903961181640625, 0.3048210144042969, 0.3206024169921875, 0.3363838195800781, 0.35216522216796875, 0.3679466247558594, 0.38372802734375, 0.3995094299316406, 0.41529083251953125, 0.4310722351074219, 0.4468536376953125, 0.4626350402832031, 0.47841644287109375, 0.4941978454589844, 0.509979248046875, 0.5257606506347656, 0.5415420532226562, 0.5573234558105469, 0.5731048583984375, 0.5888862609863281, 0.6046676635742188, 0.6204490661621094, 0.63623046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 7.0, 8.0, 7.0, 19.0, 28.0, 44.0, 45.0, 107.0, 125.0, 132.0, 145.0, 114.0, 72.0, 28.0, 39.0, 20.0, 16.0, 10.0, 7.0, 1.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.315185546875, -0.30636024475097656, -0.2975349426269531, -0.2887096405029297, -0.27988433837890625, -0.2710590362548828, -0.2622337341308594, -0.25340843200683594, -0.2445831298828125, -0.23575782775878906, -0.22693252563476562, -0.2181072235107422, -0.20928192138671875, -0.2004566192626953, -0.19163131713867188, -0.18280601501464844, -0.173980712890625, -0.16515541076660156, -0.15633010864257812, -0.1475048065185547, -0.13867950439453125, -0.1298542022705078, -0.12102890014648438, -0.11220359802246094, -0.1033782958984375, -0.09455299377441406, -0.08572769165039062, -0.07690238952636719, -0.06807708740234375, -0.05925178527832031, -0.050426483154296875, -0.04160118103027344, -0.03277587890625, -0.023950576782226562, -0.015125274658203125, -0.0062999725341796875, 0.00252532958984375, 0.011350631713867188, 0.020175933837890625, 0.029001235961914062, 0.0378265380859375, 0.04665184020996094, 0.055477142333984375, 0.06430244445800781, 0.07312774658203125, 0.08195304870605469, 0.09077835083007812, 0.09960365295410156, 0.108428955078125, 0.11725425720214844, 0.12607955932617188, 0.1349048614501953, 0.14373016357421875, 0.1525554656982422, 0.16138076782226562, 0.17020606994628906, 0.1790313720703125, 0.18785667419433594, 0.19668197631835938, 0.2055072784423828, 0.21433258056640625, 0.2231578826904297, 0.23198318481445312, 0.24080848693847656, 0.2496337890625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 10.0, 5.0, 10.0, 18.0, 30.0, 68.0, 105.0, 145.0, 202.0, 144.0, 98.0, 64.0, 34.0, 22.0, 14.0, 5.0, 2.0, 4.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.164175033569336, -3.0608623027801514, -2.9575493335723877, -2.854236602783203, -2.7509236335754395, -2.647610902786255, -2.5442981719970703, -2.4409852027893066, -2.337672472000122, -2.2343597412109375, -2.131046772003174, -2.0277340412139893, -1.9244211912155151, -1.821108341217041, -1.7177956104278564, -1.6144827604293823, -1.5111699104309082, -1.407857060432434, -1.30454421043396, -1.2012314796447754, -1.0979186296463013, -0.9946057796478271, -0.8912929892539978, -0.7879801988601685, -0.6846673488616943, -0.5813544988632202, -0.47804170846939087, -0.37472888827323914, -0.2714160680770874, -0.16810321807861328, -0.06479042768478394, 0.03852236270904541, 0.14183497428894043, 0.24514779448509216, 0.3484606146812439, 0.45177343487739563, 0.5550862550735474, 0.6583991050720215, 0.7617118954658508, 0.8650246858596802, 0.9683375358581543, 1.0716503858566284, 1.1749632358551025, 1.278275966644287, 1.3815888166427612, 1.4849016666412354, 1.58821439743042, 1.691527247428894, 1.7948400974273682, 1.8981529474258423, 2.0014657974243164, 2.104778528213501, 2.2080912590026855, 2.311404228210449, 2.414716958999634, 2.5180296897888184, 2.621342658996582, 2.7246553897857666, 2.8279683589935303, 2.931281089782715, 3.0345940589904785, 3.137906789779663, 3.2412195205688477, 3.3445324897766113, 3.447845220565796]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 5.0, 6.0, 3.0, 11.0, 7.0, 20.0, 15.0, 15.0, 23.0, 28.0, 21.0, 38.0, 35.0, 54.0, 50.0, 61.0, 66.0, 74.0, 62.0, 61.0, 46.0, 41.0, 31.0, 22.0, 30.0, 38.0, 22.0, 16.0, 16.0, 19.0, 16.0, 9.0, 9.0, 5.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.1785826683044434, -3.0959415435791016, -3.0133001804351807, -2.930659055709839, -2.848017692565918, -2.765376567840576, -2.6827352046966553, -2.6000940799713135, -2.5174527168273926, -2.434811592102051, -2.35217022895813, -2.269529104232788, -2.186887741088867, -2.1042466163635254, -2.0216052532196045, -1.9389641284942627, -1.856323003768921, -1.7736817598342896, -1.6910405158996582, -1.6083992719650269, -1.5257580280303955, -1.4431169033050537, -1.3604756593704224, -1.277834415435791, -1.1951931715011597, -1.1125519275665283, -1.029910683631897, -0.9472694993019104, -0.864628255367279, -0.7819870114326477, -0.6993458271026611, -0.6167045831680298, -0.5340631008148193, -0.451421856880188, -0.36878064274787903, -0.28613942861557007, -0.20349818468093872, -0.12085694074630737, -0.03821572661399841, 0.04442548751831055, 0.1270667314529419, 0.20970796048641205, 0.2923491895198822, 0.37499040365219116, 0.4576316475868225, 0.5402728915214539, 0.6229140758514404, 0.7055553197860718, 0.7881965637207031, 0.8708378076553345, 0.9534790515899658, 1.0361202955245972, 1.1187615394592285, 1.2014026641845703, 1.2840439081192017, 1.366685152053833, 1.4493263959884644, 1.5319676399230957, 1.614608883857727, 1.6972501277923584, 1.7798912525177002, 1.862532615661621, 1.945173740386963, 2.0278148651123047, 2.1104562282562256]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 3.0, 12.0, 10.0, 7.0, 18.0, 34.0, 40.0, 63.0, 93.0, 171.0, 318.0, 674.0, 1662.0, 4597.0, 16369.0, 115491.0, 3390179.0, 613094.0, 37682.0, 8345.0, 2914.0, 1220.0, 521.0, 289.0, 177.0, 79.0, 64.0, 51.0, 24.0, 18.0, 12.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.359130859375, -0.3478202819824219, -0.33650970458984375, -0.3251991271972656, -0.3138885498046875, -0.3025779724121094, -0.29126739501953125, -0.2799568176269531, -0.268646240234375, -0.2573356628417969, -0.24602508544921875, -0.23471450805664062, -0.2234039306640625, -0.21209335327148438, -0.20078277587890625, -0.18947219848632812, -0.17816162109375, -0.16685104370117188, -0.15554046630859375, -0.14422988891601562, -0.1329193115234375, -0.12160873413085938, -0.11029815673828125, -0.09898757934570312, -0.087677001953125, -0.07636642456054688, -0.06505584716796875, -0.053745269775390625, -0.0424346923828125, -0.031124114990234375, -0.01981353759765625, -0.008502960205078125, 0.0028076171875, 0.014118194580078125, 0.02542877197265625, 0.036739349365234375, 0.0480499267578125, 0.059360504150390625, 0.07067108154296875, 0.08198165893554688, 0.093292236328125, 0.10460281372070312, 0.11591339111328125, 0.12722396850585938, 0.1385345458984375, 0.14984512329101562, 0.16115570068359375, 0.17246627807617188, 0.18377685546875, 0.19508743286132812, 0.20639801025390625, 0.21770858764648438, 0.2290191650390625, 0.24032974243164062, 0.25164031982421875, 0.2629508972167969, 0.274261474609375, 0.2855720520019531, 0.29688262939453125, 0.3081932067871094, 0.3195037841796875, 0.3308143615722656, 0.34212493896484375, 0.3534355163574219, 0.36474609375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 18.0, 23.0, 40.0, 57.0, 86.0, 93.0, 112.0, 117.0, 89.0, 79.0, 71.0, 62.0, 53.0, 28.0, 27.0, 12.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382080078125, -0.3721656799316406, -0.36225128173828125, -0.3523368835449219, -0.3424224853515625, -0.3325080871582031, -0.32259368896484375, -0.3126792907714844, -0.302764892578125, -0.2928504943847656, -0.28293609619140625, -0.2730216979980469, -0.2631072998046875, -0.2531929016113281, -0.24327850341796875, -0.23336410522460938, -0.22344970703125, -0.21353530883789062, -0.20362091064453125, -0.19370651245117188, -0.1837921142578125, -0.17387771606445312, -0.16396331787109375, -0.15404891967773438, -0.144134521484375, -0.13422012329101562, -0.12430572509765625, -0.11439132690429688, -0.1044769287109375, -0.09456253051757812, -0.08464813232421875, -0.07473373413085938, -0.0648193359375, -0.054904937744140625, -0.04499053955078125, -0.035076141357421875, -0.0251617431640625, -0.015247344970703125, -0.00533294677734375, 0.004581451416015625, 0.014495849609375, 0.024410247802734375, 0.03432464599609375, 0.044239044189453125, 0.0541534423828125, 0.06406784057617188, 0.07398223876953125, 0.08389663696289062, 0.09381103515625, 0.10372543334960938, 0.11363983154296875, 0.12355422973632812, 0.1334686279296875, 0.14338302612304688, 0.15329742431640625, 0.16321182250976562, 0.173126220703125, 0.18304061889648438, 0.19295501708984375, 0.20286941528320312, 0.2127838134765625, 0.22269821166992188, 0.23261260986328125, 0.24252700805664062, 0.25244140625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 16.0, 17.0, 38.0, 51.0, 87.0, 144.0, 232.0, 535.0, 1763.0, 13596.0, 349777.0, 3777382.0, 44856.0, 4156.0, 861.0, 335.0, 179.0, 92.0, 52.0, 33.0, 26.0, 21.0, 14.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.712890625, -0.691436767578125, -0.66998291015625, -0.648529052734375, -0.6270751953125, -0.605621337890625, -0.58416748046875, -0.562713623046875, -0.541259765625, -0.519805908203125, -0.49835205078125, -0.476898193359375, -0.4554443359375, -0.433990478515625, -0.41253662109375, -0.391082763671875, -0.36962890625, -0.348175048828125, -0.32672119140625, -0.305267333984375, -0.2838134765625, -0.262359619140625, -0.24090576171875, -0.219451904296875, -0.197998046875, -0.176544189453125, -0.15509033203125, -0.133636474609375, -0.1121826171875, -0.090728759765625, -0.06927490234375, -0.047821044921875, -0.0263671875, -0.004913330078125, 0.01654052734375, 0.037994384765625, 0.0594482421875, 0.080902099609375, 0.10235595703125, 0.123809814453125, 0.145263671875, 0.166717529296875, 0.18817138671875, 0.209625244140625, 0.2310791015625, 0.252532958984375, 0.27398681640625, 0.295440673828125, 0.31689453125, 0.338348388671875, 0.35980224609375, 0.381256103515625, 0.4027099609375, 0.424163818359375, 0.44561767578125, 0.467071533203125, 0.488525390625, 0.509979248046875, 0.53143310546875, 0.552886962890625, 0.5743408203125, 0.595794677734375, 0.61724853515625, 0.638702392578125, 0.66015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 15.0, 12.0, 19.0, 23.0, 31.0, 38.0, 63.0, 120.0, 210.0, 411.0, 1007.0, 1075.0, 503.0, 184.0, 121.0, 62.0, 41.0, 39.0, 29.0, 13.0, 10.0, 10.0, 8.0, 2.0, 2.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.433837890625, -0.421112060546875, -0.40838623046875, -0.395660400390625, -0.3829345703125, -0.370208740234375, -0.35748291015625, -0.344757080078125, -0.33203125, -0.319305419921875, -0.30657958984375, -0.293853759765625, -0.2811279296875, -0.268402099609375, -0.25567626953125, -0.242950439453125, -0.230224609375, -0.217498779296875, -0.20477294921875, -0.192047119140625, -0.1793212890625, -0.166595458984375, -0.15386962890625, -0.141143798828125, -0.12841796875, -0.115692138671875, -0.10296630859375, -0.090240478515625, -0.0775146484375, -0.064788818359375, -0.05206298828125, -0.039337158203125, -0.026611328125, -0.013885498046875, -0.00115966796875, 0.011566162109375, 0.0242919921875, 0.037017822265625, 0.04974365234375, 0.062469482421875, 0.0751953125, 0.087921142578125, 0.10064697265625, 0.113372802734375, 0.1260986328125, 0.138824462890625, 0.15155029296875, 0.164276123046875, 0.177001953125, 0.189727783203125, 0.20245361328125, 0.215179443359375, 0.2279052734375, 0.240631103515625, 0.25335693359375, 0.266082763671875, 0.27880859375, 0.291534423828125, 0.30426025390625, 0.316986083984375, 0.3297119140625, 0.342437744140625, 0.35516357421875, 0.367889404296875, 0.380615234375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 16.0, 31.0, 67.0, 138.0, 206.0, 206.0, 154.0, 91.0, 40.0, 15.0, 10.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.637744188308716, -3.5208239555358887, -3.4039037227630615, -3.2869834899902344, -3.1700632572174072, -3.05314302444458, -2.936222553253174, -2.819302558898926, -2.7023820877075195, -2.5854618549346924, -2.4685416221618652, -2.351621389389038, -2.234701156616211, -2.117780923843384, -2.0008606910705566, -1.88394033908844, -1.7670202255249023, -1.6500999927520752, -1.533179759979248, -1.416259527206421, -1.2993392944335938, -1.1824190616607666, -1.06549870967865, -0.9485784769058228, -0.8316582441329956, -0.7147380113601685, -0.5978177785873413, -0.4808974862098694, -0.36397725343704224, -0.2470570206642151, -0.13013672828674316, -0.013216495513916016, 0.10370397567749023, 0.22062422335147858, 0.3375444710254669, 0.45446473360061646, 0.5713849663734436, 0.6883051991462708, 0.8052254915237427, 0.9221457242965698, 1.039065957069397, 1.1559861898422241, 1.2729064226150513, 1.389826774597168, 1.5067470073699951, 1.6236672401428223, 1.7405874729156494, 1.8575077056884766, 1.9744279384613037, 2.091348171234131, 2.208268404006958, 2.325188636779785, 2.4421088695526123, 2.5590291023254395, 2.6759495735168457, 2.7928695678710938, 2.9097900390625, 3.026710271835327, 3.1436305046081543, 3.2605507373809814, 3.3774709701538086, 3.4943912029266357, 3.611311435699463, 3.728231906890869, 3.845151901245117]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 3.0, 6.0, 6.0, 9.0, 5.0, 9.0, 11.0, 21.0, 20.0, 17.0, 23.0, 22.0, 37.0, 26.0, 38.0, 31.0, 41.0, 39.0, 43.0, 46.0, 44.0, 45.0, 58.0, 42.0, 29.0, 30.0, 43.0, 33.0, 36.0, 28.0, 21.0, 15.0, 23.0, 13.0, 14.0, 16.0, 11.0, 9.0, 10.0, 6.0, 12.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1957745552062988, -1.1551610231399536, -1.1145474910736084, -1.0739339590072632, -1.033320426940918, -0.9927068948745728, -0.9520934224128723, -0.9114798903465271, -0.8708663582801819, -0.8302528262138367, -0.7896392941474915, -0.7490257620811462, -0.7084122896194458, -0.6677987575531006, -0.6271852254867554, -0.5865716934204102, -0.5459581613540649, -0.5053446292877197, -0.4647310972213745, -0.4241175949573517, -0.38350406289100647, -0.34289053082466125, -0.3022770285606384, -0.2616634964942932, -0.221049964427948, -0.18043643236160278, -0.13982291519641876, -0.09920939058065414, -0.058595865964889526, -0.01798233389854431, 0.02263118326663971, 0.06324470043182373, 0.10385823249816895, 0.14447176456451416, 0.18508528172969818, 0.2256987988948822, 0.2663123309612274, 0.30692586302757263, 0.34753936529159546, 0.3881528973579407, 0.4287664294242859, 0.4693799614906311, 0.5099934935569763, 0.5506070256233215, 0.591220498085022, 0.6318340301513672, 0.6724475622177124, 0.7130610942840576, 0.7536746263504028, 0.794288158416748, 0.8349016904830933, 0.8755152225494385, 0.9161287546157837, 0.9567422866821289, 0.9973557591438293, 1.0379693508148193, 1.078582763671875, 1.1191962957382202, 1.1598098278045654, 1.2004233598709106, 1.2410368919372559, 1.281650424003601, 1.3222639560699463, 1.362877368927002, 1.4034910202026367]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 20.0, 20.0, 47.0, 88.0, 141.0, 320.0, 867.0, 3034.0, 16633.0, 177840.0, 741914.0, 93769.0, 10408.0, 2171.0, 687.0, 283.0, 139.0, 75.0, 35.0, 15.0, 13.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84814453125, -0.8271408081054688, -0.8061370849609375, -0.7851333618164062, -0.764129638671875, -0.7431259155273438, -0.7221221923828125, -0.7011184692382812, -0.68011474609375, -0.6591110229492188, -0.6381072998046875, -0.6171035766601562, -0.596099853515625, -0.5750961303710938, -0.5540924072265625, -0.5330886840820312, -0.5120849609375, -0.49108123779296875, -0.4700775146484375, -0.44907379150390625, -0.428070068359375, -0.40706634521484375, -0.3860626220703125, -0.36505889892578125, -0.34405517578125, -0.32305145263671875, -0.3020477294921875, -0.28104400634765625, -0.260040283203125, -0.23903656005859375, -0.2180328369140625, -0.19702911376953125, -0.176025390625, -0.15502166748046875, -0.1340179443359375, -0.11301422119140625, -0.092010498046875, -0.07100677490234375, -0.0500030517578125, -0.02899932861328125, -0.00799560546875, 0.01300811767578125, 0.0340118408203125, 0.05501556396484375, 0.076019287109375, 0.09702301025390625, 0.1180267333984375, 0.13903045654296875, 0.1600341796875, 0.18103790283203125, 0.2020416259765625, 0.22304534912109375, 0.244049072265625, 0.26505279541015625, 0.2860565185546875, 0.30706024169921875, 0.32806396484375, 0.34906768798828125, 0.3700714111328125, 0.39107513427734375, 0.412078857421875, 0.43308258056640625, 0.4540863037109375, 0.47509002685546875, 0.49609375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 11.0, 11.0, 17.0, 30.0, 47.0, 65.0, 71.0, 92.0, 104.0, 96.0, 100.0, 79.0, 76.0, 62.0, 45.0, 29.0, 22.0, 23.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380859375, -0.3709678649902344, -0.36107635498046875, -0.3511848449707031, -0.3412933349609375, -0.3314018249511719, -0.32151031494140625, -0.3116188049316406, -0.301727294921875, -0.2918357849121094, -0.28194427490234375, -0.2720527648925781, -0.2621612548828125, -0.2522697448730469, -0.24237823486328125, -0.23248672485351562, -0.22259521484375, -0.21270370483398438, -0.20281219482421875, -0.19292068481445312, -0.1830291748046875, -0.17313766479492188, -0.16324615478515625, -0.15335464477539062, -0.143463134765625, -0.13357162475585938, -0.12368011474609375, -0.11378860473632812, -0.1038970947265625, -0.09400558471679688, -0.08411407470703125, -0.07422256469726562, -0.0643310546875, -0.054439544677734375, -0.04454803466796875, -0.034656524658203125, -0.0247650146484375, -0.014873504638671875, -0.00498199462890625, 0.004909515380859375, 0.014801025390625, 0.024692535400390625, 0.03458404541015625, 0.044475555419921875, 0.0543670654296875, 0.06425857543945312, 0.07415008544921875, 0.08404159545898438, 0.09393310546875, 0.10382461547851562, 0.11371612548828125, 0.12360763549804688, 0.1334991455078125, 0.14339065551757812, 0.15328216552734375, 0.16317367553710938, 0.173065185546875, 0.18295669555664062, 0.19284820556640625, 0.20273971557617188, 0.2126312255859375, 0.22252273559570312, 0.23241424560546875, 0.24230575561523438, 0.252197265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 5.0, 7.0, 17.0, 15.0, 32.0, 50.0, 53.0, 98.0, 161.0, 286.0, 656.0, 1777.0, 7553.0, 64893.0, 862603.0, 97198.0, 9488.0, 2082.0, 736.0, 322.0, 172.0, 101.0, 64.0, 64.0, 35.0, 17.0, 15.0, 10.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7041015625, -0.6810684204101562, -0.6580352783203125, -0.6350021362304688, -0.611968994140625, -0.5889358520507812, -0.5659027099609375, -0.5428695678710938, -0.51983642578125, -0.49680328369140625, -0.4737701416015625, -0.45073699951171875, -0.427703857421875, -0.40467071533203125, -0.3816375732421875, -0.35860443115234375, -0.3355712890625, -0.31253814697265625, -0.2895050048828125, -0.26647186279296875, -0.243438720703125, -0.22040557861328125, -0.1973724365234375, -0.17433929443359375, -0.15130615234375, -0.12827301025390625, -0.1052398681640625, -0.08220672607421875, -0.059173583984375, -0.03614044189453125, -0.0131072998046875, 0.00992584228515625, 0.032958984375, 0.05599212646484375, 0.0790252685546875, 0.10205841064453125, 0.125091552734375, 0.14812469482421875, 0.1711578369140625, 0.19419097900390625, 0.21722412109375, 0.24025726318359375, 0.2632904052734375, 0.28632354736328125, 0.309356689453125, 0.33238983154296875, 0.3554229736328125, 0.37845611572265625, 0.4014892578125, 0.42452239990234375, 0.4475555419921875, 0.47058868408203125, 0.493621826171875, 0.5166549682617188, 0.5396881103515625, 0.5627212524414062, 0.58575439453125, 0.6087875366210938, 0.6318206787109375, 0.6548538208007812, 0.677886962890625, 0.7009201049804688, 0.7239532470703125, 0.7469863891601562, 0.77001953125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 5.0, 1.0, 4.0, 9.0, 8.0, 6.0, 14.0, 22.0, 25.0, 42.0, 39.0, 45.0, 59.0, 44.0, 74.0, 65.0, 73.0, 78.0, 66.0, 60.0, 43.0, 53.0, 28.0, 29.0, 23.0, 21.0, 9.0, 8.0, 9.0, 6.0, 3.0, 5.0, 3.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.71435546875, -0.6890487670898438, -0.6637420654296875, -0.6384353637695312, -0.613128662109375, -0.5878219604492188, -0.5625152587890625, -0.5372085571289062, -0.51190185546875, -0.48659515380859375, -0.4612884521484375, -0.43598175048828125, -0.410675048828125, -0.38536834716796875, -0.3600616455078125, -0.33475494384765625, -0.3094482421875, -0.28414154052734375, -0.2588348388671875, -0.23352813720703125, -0.208221435546875, -0.18291473388671875, -0.1576080322265625, -0.13230133056640625, -0.10699462890625, -0.08168792724609375, -0.0563812255859375, -0.03107452392578125, -0.005767822265625, 0.01953887939453125, 0.0448455810546875, 0.07015228271484375, 0.095458984375, 0.12076568603515625, 0.1460723876953125, 0.17137908935546875, 0.196685791015625, 0.22199249267578125, 0.2472991943359375, 0.27260589599609375, 0.29791259765625, 0.32321929931640625, 0.3485260009765625, 0.37383270263671875, 0.399139404296875, 0.42444610595703125, 0.4497528076171875, 0.47505950927734375, 0.5003662109375, 0.5256729125976562, 0.5509796142578125, 0.5762863159179688, 0.601593017578125, 0.6268997192382812, 0.6522064208984375, 0.6775131225585938, 0.70281982421875, 0.7281265258789062, 0.7534332275390625, 0.7787399291992188, 0.804046630859375, 0.8293533325195312, 0.8546600341796875, 0.8799667358398438, 0.9052734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 11.0, 7.0, 19.0, 19.0, 30.0, 60.0, 92.0, 180.0, 415.0, 1041.0, 3900.0, 19236.0, 286148.0, 705022.0, 25461.0, 4679.0, 1293.0, 460.0, 194.0, 110.0, 55.0, 42.0, 21.0, 12.0, 14.0, 10.0, 5.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2261962890625, -0.21751976013183594, -0.20884323120117188, -0.2001667022705078, -0.19149017333984375, -0.1828136444091797, -0.17413711547851562, -0.16546058654785156, -0.1567840576171875, -0.14810752868652344, -0.13943099975585938, -0.1307544708251953, -0.12207794189453125, -0.11340141296386719, -0.10472488403320312, -0.09604835510253906, -0.087371826171875, -0.07869529724121094, -0.07001876831054688, -0.06134223937988281, -0.05266571044921875, -0.04398918151855469, -0.035312652587890625, -0.026636123657226562, -0.0179595947265625, -0.009283065795898438, -0.000606536865234375, 0.008069992065429688, 0.01674652099609375, 0.025423049926757812, 0.034099578857421875, 0.04277610778808594, 0.05145263671875, 0.06012916564941406, 0.06880569458007812, 0.07748222351074219, 0.08615875244140625, 0.09483528137207031, 0.10351181030273438, 0.11218833923339844, 0.1208648681640625, 0.12954139709472656, 0.13821792602539062, 0.1468944549560547, 0.15557098388671875, 0.1642475128173828, 0.17292404174804688, 0.18160057067871094, 0.190277099609375, 0.19895362854003906, 0.20763015747070312, 0.2163066864013672, 0.22498321533203125, 0.2336597442626953, 0.24233627319335938, 0.25101280212402344, 0.2596893310546875, 0.26836585998535156, 0.2770423889160156, 0.2857189178466797, 0.29439544677734375, 0.3030719757080078, 0.3117485046386719, 0.32042503356933594, 0.3291015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 9.0, 8.0, 15.0, 11.0, 14.0, 24.0, 30.0, 39.0, 65.0, 68.0, 106.0, 131.0, 128.0, 100.0, 45.0, 53.0, 32.0, 20.0, 19.0, 16.0, 14.0, 7.0, 7.0, 7.0, 7.0, 3.0, 0.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3882598876953125e-05, -5.207117646932602e-05, -5.0259754061698914e-05, -4.844833165407181e-05, -4.66369092464447e-05, -4.4825486838817596e-05, -4.301406443119049e-05, -4.1202642023563385e-05, -3.939121961593628e-05, -3.7579797208309174e-05, -3.576837480068207e-05, -3.395695239305496e-05, -3.2145529985427856e-05, -3.033410757780075e-05, -2.8522685170173645e-05, -2.671126276254654e-05, -2.4899840354919434e-05, -2.3088417947292328e-05, -2.1276995539665222e-05, -1.9465573132038116e-05, -1.765415072441101e-05, -1.5842728316783905e-05, -1.40313059091568e-05, -1.2219883501529694e-05, -1.0408461093902588e-05, -8.597038686275482e-06, -6.7856162786483765e-06, -4.974193871021271e-06, -3.162771463394165e-06, -1.3513490557670593e-06, 4.600733518600464e-07, 2.271495759487152e-06, 4.082918167114258e-06, 5.8943405747413635e-06, 7.70576298236847e-06, 9.517185389995575e-06, 1.132860779762268e-05, 1.3140030205249786e-05, 1.4951452612876892e-05, 1.6762875020503998e-05, 1.8574297428131104e-05, 2.038571983575821e-05, 2.2197142243385315e-05, 2.400856465101242e-05, 2.5819987058639526e-05, 2.7631409466266632e-05, 2.9442831873893738e-05, 3.1254254281520844e-05, 3.306567668914795e-05, 3.4877099096775055e-05, 3.668852150440216e-05, 3.8499943912029266e-05, 4.031136631965637e-05, 4.212278872728348e-05, 4.3934211134910583e-05, 4.574563354253769e-05, 4.7557055950164795e-05, 4.93684783577919e-05, 5.1179900765419006e-05, 5.299132317304611e-05, 5.480274558067322e-05, 5.6614167988300323e-05, 5.842559039592743e-05, 6.0237012803554535e-05, 6.204843521118164e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 9.0, 11.0, 12.0, 16.0, 38.0, 30.0, 65.0, 68.0, 117.0, 203.0, 355.0, 747.0, 1546.0, 4044.0, 12658.0, 51933.0, 656707.0, 267466.0, 36784.0, 9591.0, 3272.0, 1322.0, 710.0, 337.0, 181.0, 103.0, 82.0, 52.0, 23.0, 13.0, 15.0, 8.0, 7.0, 9.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.1324939727783203, -0.12717056274414062, -0.12184715270996094, -0.11652374267578125, -0.11120033264160156, -0.10587692260742188, -0.10055351257324219, -0.0952301025390625, -0.08990669250488281, -0.08458328247070312, -0.07925987243652344, -0.07393646240234375, -0.06861305236816406, -0.06328964233398438, -0.05796623229980469, -0.052642822265625, -0.04731941223144531, -0.041996002197265625, -0.03667259216308594, -0.03134918212890625, -0.026025772094726562, -0.020702362060546875, -0.015378952026367188, -0.0100555419921875, -0.0047321319580078125, 0.000591278076171875, 0.0059146881103515625, 0.01123809814453125, 0.016561508178710938, 0.021884918212890625, 0.027208328247070312, 0.03253173828125, 0.03785514831542969, 0.043178558349609375, 0.04850196838378906, 0.05382537841796875, 0.05914878845214844, 0.06447219848632812, 0.06979560852050781, 0.0751190185546875, 0.08044242858886719, 0.08576583862304688, 0.09108924865722656, 0.09641265869140625, 0.10173606872558594, 0.10705947875976562, 0.11238288879394531, 0.117706298828125, 0.12302970886230469, 0.12835311889648438, 0.13367652893066406, 0.13899993896484375, 0.14432334899902344, 0.14964675903320312, 0.1549701690673828, 0.1602935791015625, 0.1656169891357422, 0.17094039916992188, 0.17626380920410156, 0.18158721923828125, 0.18691062927246094, 0.19223403930664062, 0.1975574493408203, 0.202880859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 7.0, 6.0, 8.0, 12.0, 15.0, 17.0, 26.0, 35.0, 45.0, 57.0, 97.0, 108.0, 117.0, 124.0, 82.0, 53.0, 39.0, 35.0, 14.0, 17.0, 15.0, 24.0, 6.0, 6.0, 4.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127197265625, -0.12171554565429688, -0.11623382568359375, -0.11075210571289062, -0.1052703857421875, -0.09978866577148438, -0.09430694580078125, -0.08882522583007812, -0.083343505859375, -0.07786178588867188, -0.07238006591796875, -0.06689834594726562, -0.0614166259765625, -0.055934906005859375, -0.05045318603515625, -0.044971466064453125, -0.03948974609375, -0.034008026123046875, -0.02852630615234375, -0.023044586181640625, -0.0175628662109375, -0.012081146240234375, -0.00659942626953125, -0.001117706298828125, 0.004364013671875, 0.009845733642578125, 0.01532745361328125, 0.020809173583984375, 0.0262908935546875, 0.031772613525390625, 0.03725433349609375, 0.042736053466796875, 0.0482177734375, 0.053699493408203125, 0.05918121337890625, 0.06466293334960938, 0.0701446533203125, 0.07562637329101562, 0.08110809326171875, 0.08658981323242188, 0.092071533203125, 0.09755325317382812, 0.10303497314453125, 0.10851669311523438, 0.1139984130859375, 0.11948013305664062, 0.12496185302734375, 0.13044357299804688, 0.13592529296875, 0.14140701293945312, 0.14688873291015625, 0.15237045288085938, 0.1578521728515625, 0.16333389282226562, 0.16881561279296875, 0.17429733276367188, 0.179779052734375, 0.18526077270507812, 0.19074249267578125, 0.19622421264648438, 0.2017059326171875, 0.20718765258789062, 0.21266937255859375, 0.21815109252929688, 0.2236328125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 14.0, 44.0, 141.0, 446.0, 219.0, 81.0, 17.0, 15.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.024956703186035, -8.797606468200684, -8.570255279541016, -8.342905044555664, -8.115553855895996, -7.888203144073486, -7.660852432250977, -7.433501720428467, -7.206151008605957, -6.978800296783447, -6.7514495849609375, -6.524098873138428, -6.296748161315918, -6.069397449493408, -5.842046737670898, -5.614696025848389, -5.387345314025879, -5.159994602203369, -4.932643890380859, -4.70529317855835, -4.47794246673584, -4.25059175491333, -4.02324104309082, -3.7958903312683105, -3.568540096282959, -3.341189384460449, -3.1138386726379395, -2.8864879608154297, -2.65913724899292, -2.43178653717041, -2.2044358253479004, -1.9770852327346802, -1.7497344017028809, -1.522383689880371, -1.2950329780578613, -1.0676822662353516, -0.8403316140174866, -0.6129809617996216, -0.3856302499771118, -0.15827953815460205, 0.06907117366790771, 0.2964218854904175, 0.5237725973129272, 0.7511232495307922, 0.978473961353302, 1.205824613571167, 1.4331753253936768, 1.6605260372161865, 1.8878767490386963, 2.115227460861206, 2.342578172683716, 2.5699288845062256, 2.7972795963287354, 3.024630069732666, 3.251980781555176, 3.4793314933776855, 3.7066822052001953, 3.934032917022705, 4.161383628845215, 4.388734340667725, 4.616085052490234, 4.843435764312744, 5.070786476135254, 5.298137187957764, 5.525487899780273]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 12.0, 3.0, 13.0, 10.0, 9.0, 18.0, 14.0, 19.0, 21.0, 27.0, 26.0, 37.0, 40.0, 41.0, 43.0, 60.0, 67.0, 85.0, 71.0, 50.0, 55.0, 36.0, 21.0, 25.0, 26.0, 31.0, 27.0, 15.0, 16.0, 11.0, 8.0, 11.0, 12.0, 11.0, 4.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.055661201477051, -1.980941891670227, -1.9062225818634033, -1.8315033912658691, -1.7567840814590454, -1.6820647716522217, -1.6073455810546875, -1.5326262712478638, -1.45790696144104, -1.3831876516342163, -1.3084683418273926, -1.2337491512298584, -1.1590298414230347, -1.084310531616211, -1.0095913410186768, -0.934872031211853, -0.8601527214050293, -0.7854334115982056, -0.7107141613960266, -0.6359949111938477, -0.5612756013870239, -0.4865563213825226, -0.41183704137802124, -0.3371177911758423, -0.26239848136901855, -0.1876792013645172, -0.11295992136001587, -0.038240641355514526, 0.036478638648986816, 0.11119791865348816, 0.1859171986579895, 0.26063644886016846, 0.3353555202484131, 0.41007480025291443, 0.48479408025741577, 0.5595133304595947, 0.6342326402664185, 0.7089519500732422, 0.7836712002754211, 0.8583904504776001, 0.9331097602844238, 1.0078290700912476, 1.0825483798980713, 1.1572675704956055, 1.2319868803024292, 1.306706190109253, 1.381425380706787, 1.4561446905136108, 1.5308640003204346, 1.6055833101272583, 1.680302619934082, 1.7550218105316162, 1.82974112033844, 1.9044604301452637, 1.9791796207427979, 2.053898811340332, 2.1286182403564453, 2.2033374309539795, 2.2780568599700928, 2.352776050567627, 2.4274954795837402, 2.5022146701812744, 2.5769338607788086, 2.651653289794922, 2.726372480392456]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 13.0, 9.0, 22.0, 39.0, 48.0, 83.0, 123.0, 232.0, 476.0, 829.0, 1833.0, 4947.0, 15595.0, 78996.0, 1862591.0, 2121040.0, 81630.0, 16362.0, 5117.0, 2055.0, 948.0, 505.0, 286.0, 152.0, 112.0, 68.0, 49.0, 22.0, 19.0, 12.0, 15.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.3469886779785156, -0.33460235595703125, -0.3222160339355469, -0.3098297119140625, -0.2974433898925781, -0.28505706787109375, -0.2726707458496094, -0.260284423828125, -0.24789810180664062, -0.23551177978515625, -0.22312545776367188, -0.2107391357421875, -0.19835281372070312, -0.18596649169921875, -0.17358016967773438, -0.16119384765625, -0.14880752563476562, -0.13642120361328125, -0.12403488159179688, -0.1116485595703125, -0.09926223754882812, -0.08687591552734375, -0.07448959350585938, -0.062103271484375, -0.049716949462890625, -0.03733062744140625, -0.024944305419921875, -0.0125579833984375, -0.000171661376953125, 0.01221466064453125, 0.024600982666015625, 0.0369873046875, 0.049373626708984375, 0.06175994873046875, 0.07414627075195312, 0.0865325927734375, 0.09891891479492188, 0.11130523681640625, 0.12369155883789062, 0.136077880859375, 0.14846420288085938, 0.16085052490234375, 0.17323684692382812, 0.1856231689453125, 0.19800949096679688, 0.21039581298828125, 0.22278213500976562, 0.23516845703125, 0.24755477905273438, 0.25994110107421875, 0.2723274230957031, 0.2847137451171875, 0.2971000671386719, 0.30948638916015625, 0.3218727111816406, 0.334259033203125, 0.3466453552246094, 0.35903167724609375, 0.3714179992675781, 0.3838043212890625, 0.3961906433105469, 0.40857696533203125, 0.4209632873535156, 0.433349609375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 10.0, 9.0, 14.0, 24.0, 31.0, 32.0, 51.0, 58.0, 55.0, 78.0, 100.0, 95.0, 90.0, 56.0, 65.0, 59.0, 46.0, 33.0, 24.0, 23.0, 19.0, 13.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.282958984375, -0.2747344970703125, -0.266510009765625, -0.2582855224609375, -0.25006103515625, -0.2418365478515625, -0.233612060546875, -0.2253875732421875, -0.2171630859375, -0.2089385986328125, -0.200714111328125, -0.1924896240234375, -0.18426513671875, -0.1760406494140625, -0.167816162109375, -0.1595916748046875, -0.1513671875, -0.1431427001953125, -0.134918212890625, -0.1266937255859375, -0.11846923828125, -0.1102447509765625, -0.102020263671875, -0.0937957763671875, -0.0855712890625, -0.0773468017578125, -0.069122314453125, -0.0608978271484375, -0.05267333984375, -0.0444488525390625, -0.036224365234375, -0.0279998779296875, -0.019775390625, -0.0115509033203125, -0.003326416015625, 0.0048980712890625, 0.01312255859375, 0.0213470458984375, 0.029571533203125, 0.0377960205078125, 0.0460205078125, 0.0542449951171875, 0.062469482421875, 0.0706939697265625, 0.07891845703125, 0.0871429443359375, 0.095367431640625, 0.1035919189453125, 0.11181640625, 0.1200408935546875, 0.128265380859375, 0.1364898681640625, 0.14471435546875, 0.1529388427734375, 0.161163330078125, 0.1693878173828125, 0.1776123046875, 0.1858367919921875, 0.194061279296875, 0.2022857666015625, 0.21051025390625, 0.2187347412109375, 0.226959228515625, 0.2351837158203125, 0.243408203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 10.0, 18.0, 20.0, 23.0, 29.0, 55.0, 88.0, 102.0, 207.0, 395.0, 982.0, 3606.0, 19123.0, 223546.0, 3786054.0, 140549.0, 14654.0, 2971.0, 918.0, 346.0, 192.0, 114.0, 79.0, 44.0, 33.0, 27.0, 15.0, 17.0, 14.0, 12.0, 8.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5478515625, -0.52984619140625, -0.5118408203125, -0.49383544921875, -0.475830078125, -0.45782470703125, -0.4398193359375, -0.42181396484375, -0.40380859375, -0.38580322265625, -0.3677978515625, -0.34979248046875, -0.331787109375, -0.31378173828125, -0.2957763671875, -0.27777099609375, -0.259765625, -0.24176025390625, -0.2237548828125, -0.20574951171875, -0.187744140625, -0.16973876953125, -0.1517333984375, -0.13372802734375, -0.11572265625, -0.09771728515625, -0.0797119140625, -0.06170654296875, -0.043701171875, -0.02569580078125, -0.0076904296875, 0.01031494140625, 0.0283203125, 0.04632568359375, 0.0643310546875, 0.08233642578125, 0.100341796875, 0.11834716796875, 0.1363525390625, 0.15435791015625, 0.17236328125, 0.19036865234375, 0.2083740234375, 0.22637939453125, 0.244384765625, 0.26239013671875, 0.2803955078125, 0.29840087890625, 0.31640625, 0.33441162109375, 0.3524169921875, 0.37042236328125, 0.388427734375, 0.40643310546875, 0.4244384765625, 0.44244384765625, 0.46044921875, 0.47845458984375, 0.4964599609375, 0.51446533203125, 0.532470703125, 0.55047607421875, 0.5684814453125, 0.58648681640625, 0.6044921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 5.0, 6.0, 6.0, 11.0, 8.0, 19.0, 25.0, 35.0, 42.0, 46.0, 82.0, 108.0, 226.0, 387.0, 707.0, 912.0, 579.0, 306.0, 187.0, 81.0, 79.0, 53.0, 31.0, 36.0, 15.0, 13.0, 13.0, 10.0, 3.0, 5.0, 6.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32177734375, -0.3099822998046875, -0.298187255859375, -0.2863922119140625, -0.27459716796875, -0.2628021240234375, -0.251007080078125, -0.2392120361328125, -0.2274169921875, -0.2156219482421875, -0.203826904296875, -0.1920318603515625, -0.18023681640625, -0.1684417724609375, -0.156646728515625, -0.1448516845703125, -0.133056640625, -0.1212615966796875, -0.109466552734375, -0.0976715087890625, -0.08587646484375, -0.0740814208984375, -0.062286376953125, -0.0504913330078125, -0.0386962890625, -0.0269012451171875, -0.015106201171875, -0.0033111572265625, 0.00848388671875, 0.0202789306640625, 0.032073974609375, 0.0438690185546875, 0.0556640625, 0.0674591064453125, 0.079254150390625, 0.0910491943359375, 0.10284423828125, 0.1146392822265625, 0.126434326171875, 0.1382293701171875, 0.1500244140625, 0.1618194580078125, 0.173614501953125, 0.1854095458984375, 0.19720458984375, 0.2089996337890625, 0.220794677734375, 0.2325897216796875, 0.244384765625, 0.2561798095703125, 0.267974853515625, 0.2797698974609375, 0.29156494140625, 0.3033599853515625, 0.315155029296875, 0.3269500732421875, 0.3387451171875, 0.3505401611328125, 0.362335205078125, 0.3741302490234375, 0.38592529296875, 0.3977203369140625, 0.409515380859375, 0.4213104248046875, 0.43310546875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 9.0, 31.0, 58.0, 156.0, 205.0, 197.0, 147.0, 92.0, 38.0, 23.0, 13.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564911365509033, -2.437615394592285, -2.310319185256958, -2.183022975921631, -2.055727005004883, -1.9284309148788452, -1.8011348247528076, -1.67383873462677, -1.5465426445007324, -1.4192465543746948, -1.2919504642486572, -1.1646543741226196, -1.037358283996582, -0.9100621938705444, -0.7827661037445068, -0.6554700136184692, -0.5281739234924316, -0.40087783336639404, -0.27358174324035645, -0.14628565311431885, -0.01898956298828125, 0.10830652713775635, 0.23560261726379395, 0.36289870738983154, 0.49019479751586914, 0.6174908876419067, 0.7447869777679443, 0.8720830678939819, 0.9993791580200195, 1.1266752481460571, 1.2539713382720947, 1.3812674283981323, 1.50856351852417, 1.6358596086502075, 1.7631556987762451, 1.8904517889022827, 2.0177478790283203, 2.1450438499450684, 2.2723400592803955, 2.3996362686157227, 2.5269322395324707, 2.6542282104492188, 2.781524419784546, 2.908820629119873, 3.036116600036621, 3.163412570953369, 3.2907087802886963, 3.4180049896240234, 3.5453009605407715, 3.6725969314575195, 3.7998931407928467, 3.927189350128174, 4.054485321044922, 4.18178129196167, 4.309077262878418, 4.436373710632324, 4.563669681549072, 4.69096565246582, 4.818262100219727, 4.945558071136475, 5.072854042053223, 5.200150012969971, 5.327445983886719, 5.454742431640625, 5.582038402557373]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 18.0, 20.0, 17.0, 18.0, 28.0, 25.0, 30.0, 37.0, 38.0, 37.0, 45.0, 51.0, 52.0, 50.0, 53.0, 60.0, 46.0, 36.0, 32.0, 45.0, 23.0, 26.0, 25.0, 21.0, 23.0, 13.0, 18.0, 19.0, 16.0, 5.0, 8.0, 8.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-1.9096438884735107, -1.860107183456421, -1.8105703592300415, -1.7610336542129517, -1.7114969491958618, -1.661960244178772, -1.6124234199523926, -1.5628867149353027, -1.513350009918213, -1.463813304901123, -1.4142764806747437, -1.3647397756576538, -1.315203070640564, -1.2656663656234741, -1.2161295413970947, -1.1665928363800049, -1.117056131362915, -1.0675194263458252, -1.0179826021194458, -0.968445897102356, -0.9189091920852661, -0.8693724274635315, -0.8198356628417969, -0.770298957824707, -0.7207621335983276, -0.671225368976593, -0.6216886639595032, -0.5721518993377686, -0.5226151943206787, -0.4730784296989441, -0.42354169487953186, -0.37400496006011963, -0.3244682550430298, -0.27493152022361755, -0.22539478540420532, -0.1758580356836319, -0.12632130086421967, -0.07678456604480743, -0.02724781632423401, 0.022288918495178223, 0.07182565331459045, 0.12136238813400269, 0.17089912295341492, 0.22043587267398834, 0.26997262239456177, 0.3195093274116516, 0.36904609203338623, 0.41858282685279846, 0.4681195616722107, 0.5176563262939453, 0.5671930313110352, 0.6167297959327698, 0.6662665009498596, 0.7158032655715942, 0.7653399705886841, 0.8148767352104187, 0.8644134998321533, 0.9139502644538879, 0.9634869694709778, 1.0130237340927124, 1.0625604391098022, 1.112097144126892, 1.1616339683532715, 1.2111706733703613, 1.2607073783874512]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 16.0, 17.0, 27.0, 40.0, 63.0, 121.0, 211.0, 382.0, 730.0, 1748.0, 4312.0, 13260.0, 49967.0, 262569.0, 557631.0, 118241.0, 26329.0, 7650.0, 2839.0, 1185.0, 519.0, 257.0, 157.0, 83.0, 53.0, 38.0, 27.0, 16.0, 13.0, 10.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.55908203125, -0.5432319641113281, -0.5273818969726562, -0.5115318298339844, -0.4956817626953125, -0.4798316955566406, -0.46398162841796875, -0.4481315612792969, -0.432281494140625, -0.4164314270019531, -0.40058135986328125, -0.3847312927246094, -0.3688812255859375, -0.3530311584472656, -0.33718109130859375, -0.3213310241699219, -0.30548095703125, -0.2896308898925781, -0.27378082275390625, -0.2579307556152344, -0.2420806884765625, -0.22623062133789062, -0.21038055419921875, -0.19453048706054688, -0.178680419921875, -0.16283035278320312, -0.14698028564453125, -0.13113021850585938, -0.1152801513671875, -0.09943008422851562, -0.08358001708984375, -0.06772994995117188, -0.0518798828125, -0.036029815673828125, -0.02017974853515625, -0.004329681396484375, 0.0115203857421875, 0.027370452880859375, 0.04322052001953125, 0.059070587158203125, 0.074920654296875, 0.09077072143554688, 0.10662078857421875, 0.12247085571289062, 0.1383209228515625, 0.15417098999023438, 0.17002105712890625, 0.18587112426757812, 0.20172119140625, 0.21757125854492188, 0.23342132568359375, 0.24927139282226562, 0.2651214599609375, 0.2809715270996094, 0.29682159423828125, 0.3126716613769531, 0.328521728515625, 0.3443717956542969, 0.36022186279296875, 0.3760719299316406, 0.3919219970703125, 0.4077720642089844, 0.42362213134765625, 0.4394721984863281, 0.455322265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 10.0, 6.0, 25.0, 26.0, 31.0, 27.0, 56.0, 57.0, 71.0, 73.0, 74.0, 93.0, 85.0, 66.0, 60.0, 44.0, 42.0, 38.0, 40.0, 25.0, 20.0, 17.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28271484375, -0.2745037078857422, -0.2662925720214844, -0.25808143615722656, -0.24987030029296875, -0.24165916442871094, -0.23344802856445312, -0.2252368927001953, -0.2170257568359375, -0.2088146209716797, -0.20060348510742188, -0.19239234924316406, -0.18418121337890625, -0.17597007751464844, -0.16775894165039062, -0.1595478057861328, -0.151336669921875, -0.1431255340576172, -0.13491439819335938, -0.12670326232910156, -0.11849212646484375, -0.11028099060058594, -0.10206985473632812, -0.09385871887207031, -0.0856475830078125, -0.07743644714355469, -0.06922531127929688, -0.06101417541503906, -0.05280303955078125, -0.04459190368652344, -0.036380767822265625, -0.028169631958007812, -0.01995849609375, -0.011747360229492188, -0.003536224365234375, 0.0046749114990234375, 0.01288604736328125, 0.021097183227539062, 0.029308319091796875, 0.03751945495605469, 0.0457305908203125, 0.05394172668457031, 0.062152862548828125, 0.07036399841308594, 0.07857513427734375, 0.08678627014160156, 0.09499740600585938, 0.10320854187011719, 0.111419677734375, 0.11963081359863281, 0.12784194946289062, 0.13605308532714844, 0.14426422119140625, 0.15247535705566406, 0.16068649291992188, 0.1688976287841797, 0.1771087646484375, 0.1853199005126953, 0.19353103637695312, 0.20174217224121094, 0.20995330810546875, 0.21816444396972656, 0.22637557983398438, 0.2345867156982422, 0.2427978515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 3.0, 1.0, 9.0, 7.0, 11.0, 15.0, 26.0, 23.0, 42.0, 83.0, 136.0, 250.0, 541.0, 1324.0, 3884.0, 16296.0, 171782.0, 803394.0, 40124.0, 6954.0, 1986.0, 787.0, 374.0, 200.0, 95.0, 70.0, 39.0, 29.0, 17.0, 11.0, 10.0, 5.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.79931640625, -0.7759628295898438, -0.7526092529296875, -0.7292556762695312, -0.705902099609375, -0.6825485229492188, -0.6591949462890625, -0.6358413696289062, -0.61248779296875, -0.5891342163085938, -0.5657806396484375, -0.5424270629882812, -0.519073486328125, -0.49571990966796875, -0.4723663330078125, -0.44901275634765625, -0.4256591796875, -0.40230560302734375, -0.3789520263671875, -0.35559844970703125, -0.332244873046875, -0.30889129638671875, -0.2855377197265625, -0.26218414306640625, -0.23883056640625, -0.21547698974609375, -0.1921234130859375, -0.16876983642578125, -0.145416259765625, -0.12206268310546875, -0.0987091064453125, -0.07535552978515625, -0.052001953125, -0.02864837646484375, -0.0052947998046875, 0.01805877685546875, 0.041412353515625, 0.06476593017578125, 0.0881195068359375, 0.11147308349609375, 0.13482666015625, 0.15818023681640625, 0.1815338134765625, 0.20488739013671875, 0.228240966796875, 0.25159454345703125, 0.2749481201171875, 0.29830169677734375, 0.3216552734375, 0.34500885009765625, 0.3683624267578125, 0.39171600341796875, 0.415069580078125, 0.43842315673828125, 0.4617767333984375, 0.48513031005859375, 0.50848388671875, 0.5318374633789062, 0.5551910400390625, 0.5785446166992188, 0.601898193359375, 0.6252517700195312, 0.6486053466796875, 0.6719589233398438, 0.6953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 9.0, 6.0, 8.0, 14.0, 18.0, 23.0, 36.0, 26.0, 27.0, 48.0, 52.0, 54.0, 60.0, 68.0, 67.0, 72.0, 69.0, 56.0, 51.0, 47.0, 35.0, 27.0, 25.0, 17.0, 13.0, 16.0, 11.0, 9.0, 3.0, 5.0, 2.0, 3.0, 5.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.73974609375, -0.7147140502929688, -0.6896820068359375, -0.6646499633789062, -0.639617919921875, -0.6145858764648438, -0.5895538330078125, -0.5645217895507812, -0.53948974609375, -0.5144577026367188, -0.4894256591796875, -0.46439361572265625, -0.439361572265625, -0.41432952880859375, -0.3892974853515625, -0.36426544189453125, -0.3392333984375, -0.31420135498046875, -0.2891693115234375, -0.26413726806640625, -0.239105224609375, -0.21407318115234375, -0.1890411376953125, -0.16400909423828125, -0.13897705078125, -0.11394500732421875, -0.0889129638671875, -0.06388092041015625, -0.038848876953125, -0.01381683349609375, 0.0112152099609375, 0.03624725341796875, 0.061279296875, 0.08631134033203125, 0.1113433837890625, 0.13637542724609375, 0.161407470703125, 0.18643951416015625, 0.2114715576171875, 0.23650360107421875, 0.26153564453125, 0.28656768798828125, 0.3115997314453125, 0.33663177490234375, 0.361663818359375, 0.38669586181640625, 0.4117279052734375, 0.43675994873046875, 0.4617919921875, 0.48682403564453125, 0.5118560791015625, 0.5368881225585938, 0.561920166015625, 0.5869522094726562, 0.6119842529296875, 0.6370162963867188, 0.66204833984375, 0.6870803833007812, 0.7121124267578125, 0.7371444702148438, 0.762176513671875, 0.7872085571289062, 0.8122406005859375, 0.8372726440429688, 0.8623046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 6.0, 7.0, 3.0, 14.0, 16.0, 19.0, 30.0, 53.0, 103.0, 212.0, 497.0, 1451.0, 5098.0, 33994.0, 946305.0, 51821.0, 6161.0, 1601.0, 624.0, 219.0, 107.0, 55.0, 42.0, 19.0, 14.0, 11.0, 11.0, 7.0, 8.0, 6.0, 3.0, 1.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.351806640625, -0.3390464782714844, -0.32628631591796875, -0.3135261535644531, -0.3007659912109375, -0.2880058288574219, -0.27524566650390625, -0.2624855041503906, -0.249725341796875, -0.23696517944335938, -0.22420501708984375, -0.21144485473632812, -0.1986846923828125, -0.18592453002929688, -0.17316436767578125, -0.16040420532226562, -0.14764404296875, -0.13488388061523438, -0.12212371826171875, -0.10936355590820312, -0.0966033935546875, -0.08384323120117188, -0.07108306884765625, -0.058322906494140625, -0.045562744140625, -0.032802581787109375, -0.02004241943359375, -0.007282257080078125, 0.0054779052734375, 0.018238067626953125, 0.03099822998046875, 0.043758392333984375, 0.0565185546875, 0.06927871704101562, 0.08203887939453125, 0.09479904174804688, 0.1075592041015625, 0.12031936645507812, 0.13307952880859375, 0.14583969116210938, 0.158599853515625, 0.17136001586914062, 0.18412017822265625, 0.19688034057617188, 0.2096405029296875, 0.22240066528320312, 0.23516082763671875, 0.24792098999023438, 0.26068115234375, 0.2734413146972656, 0.28620147705078125, 0.2989616394042969, 0.3117218017578125, 0.3244819641113281, 0.33724212646484375, 0.3500022888183594, 0.362762451171875, 0.3755226135253906, 0.38828277587890625, 0.4010429382324219, 0.4138031005859375, 0.4265632629394531, 0.43932342529296875, 0.4520835876464844, 0.46484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 9.0, 10.0, 8.0, 15.0, 18.0, 14.0, 25.0, 23.0, 29.0, 23.0, 41.0, 69.0, 76.0, 97.0, 105.0, 90.0, 71.0, 44.0, 34.0, 35.0, 23.0, 20.0, 19.0, 14.0, 11.0, 11.0, 12.0, 8.0, 13.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.61611557006836e-05, -6.39650970697403e-05, -6.1769038438797e-05, -5.95729798078537e-05, -5.73769211769104e-05, -5.51808625459671e-05, -5.2984803915023804e-05, -5.0788745284080505e-05, -4.859268665313721e-05, -4.639662802219391e-05, -4.420056939125061e-05, -4.200451076030731e-05, -3.9808452129364014e-05, -3.7612393498420715e-05, -3.541633486747742e-05, -3.322027623653412e-05, -3.102421760559082e-05, -2.8828158974647522e-05, -2.6632100343704224e-05, -2.4436041712760925e-05, -2.2239983081817627e-05, -2.004392445087433e-05, -1.784786581993103e-05, -1.5651807188987732e-05, -1.3455748558044434e-05, -1.1259689927101135e-05, -9.063631296157837e-06, -6.8675726652145386e-06, -4.67151403427124e-06, -2.475455403327942e-06, -2.7939677238464355e-07, 1.9166618585586548e-06, 4.112720489501953e-06, 6.3087791204452515e-06, 8.50483775138855e-06, 1.0700896382331848e-05, 1.2896955013275146e-05, 1.5093013644218445e-05, 1.7289072275161743e-05, 1.948513090610504e-05, 2.168118953704834e-05, 2.3877248167991638e-05, 2.6073306798934937e-05, 2.8269365429878235e-05, 3.0465424060821533e-05, 3.266148269176483e-05, 3.485754132270813e-05, 3.705359995365143e-05, 3.9249658584594727e-05, 4.1445717215538025e-05, 4.364177584648132e-05, 4.583783447742462e-05, 4.803389310836792e-05, 5.022995173931122e-05, 5.2426010370254517e-05, 5.4622069001197815e-05, 5.681812763214111e-05, 5.901418626308441e-05, 6.121024489402771e-05, 6.340630352497101e-05, 6.56023621559143e-05, 6.77984207868576e-05, 6.99944794178009e-05, 7.21905380487442e-05, 7.43865966796875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 2.0, 8.0, 9.0, 11.0, 20.0, 29.0, 33.0, 46.0, 61.0, 92.0, 137.0, 213.0, 390.0, 713.0, 1347.0, 2838.0, 8134.0, 51867.0, 906066.0, 61419.0, 8757.0, 3008.0, 1469.0, 716.0, 409.0, 229.0, 148.0, 104.0, 53.0, 66.0, 34.0, 21.0, 16.0, 13.0, 9.0, 11.0, 12.0, 6.0, 1.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.334228515625, -0.3242607116699219, -0.31429290771484375, -0.3043251037597656, -0.2943572998046875, -0.2843894958496094, -0.27442169189453125, -0.2644538879394531, -0.254486083984375, -0.24451828002929688, -0.23455047607421875, -0.22458267211914062, -0.2146148681640625, -0.20464706420898438, -0.19467926025390625, -0.18471145629882812, -0.17474365234375, -0.16477584838867188, -0.15480804443359375, -0.14484024047851562, -0.1348724365234375, -0.12490463256835938, -0.11493682861328125, -0.10496902465820312, -0.095001220703125, -0.08503341674804688, -0.07506561279296875, -0.06509780883789062, -0.0551300048828125, -0.045162200927734375, -0.03519439697265625, -0.025226593017578125, -0.0152587890625, -0.005290985107421875, 0.00467681884765625, 0.014644622802734375, 0.0246124267578125, 0.034580230712890625, 0.04454803466796875, 0.054515838623046875, 0.064483642578125, 0.07445144653320312, 0.08441925048828125, 0.09438705444335938, 0.1043548583984375, 0.11432266235351562, 0.12429046630859375, 0.13425827026367188, 0.14422607421875, 0.15419387817382812, 0.16416168212890625, 0.17412948608398438, 0.1840972900390625, 0.19406509399414062, 0.20403289794921875, 0.21400070190429688, 0.223968505859375, 0.23393630981445312, 0.24390411376953125, 0.2538719177246094, 0.2638397216796875, 0.2738075256347656, 0.28377532958984375, 0.2937431335449219, 0.3037109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 8.0, 13.0, 17.0, 33.0, 50.0, 114.0, 218.0, 233.0, 127.0, 73.0, 36.0, 16.0, 15.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.3840599060058594, -0.37212371826171875, -0.3601875305175781, -0.3482513427734375, -0.3363151550292969, -0.32437896728515625, -0.3124427795410156, -0.300506591796875, -0.2885704040527344, -0.27663421630859375, -0.2646980285644531, -0.2527618408203125, -0.24082565307617188, -0.22888946533203125, -0.21695327758789062, -0.20501708984375, -0.19308090209960938, -0.18114471435546875, -0.16920852661132812, -0.1572723388671875, -0.14533615112304688, -0.13339996337890625, -0.12146377563476562, -0.109527587890625, -0.09759140014648438, -0.08565521240234375, -0.07371902465820312, -0.0617828369140625, -0.049846649169921875, -0.03791046142578125, -0.025974273681640625, -0.0140380859375, -0.002101898193359375, 0.00983428955078125, 0.021770477294921875, 0.0337066650390625, 0.045642852783203125, 0.05757904052734375, 0.06951522827148438, 0.081451416015625, 0.09338760375976562, 0.10532379150390625, 0.11725997924804688, 0.1291961669921875, 0.14113235473632812, 0.15306854248046875, 0.16500473022460938, 0.17694091796875, 0.18887710571289062, 0.20081329345703125, 0.21274948120117188, 0.2246856689453125, 0.23662185668945312, 0.24855804443359375, 0.2604942321777344, 0.272430419921875, 0.2843666076660156, 0.29630279541015625, 0.3082389831542969, 0.3201751708984375, 0.3321113586425781, 0.34404754638671875, 0.3559837341308594, 0.367919921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 4.0, 17.0, 73.0, 295.0, 436.0, 120.0, 26.0, 10.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.787864685058594, -11.461349487304688, -11.134834289550781, -10.808319091796875, -10.481803894042969, -10.155288696289062, -9.828773498535156, -9.50225830078125, -9.175743103027344, -8.849227905273438, -8.522712707519531, -8.196197509765625, -7.869682312011719, -7.5431671142578125, -7.2166523933410645, -6.890137195587158, -6.56362247467041, -6.237107276916504, -5.910592079162598, -5.584076881408691, -5.257561683654785, -4.931046485900879, -4.604531764984131, -4.278016567230225, -3.9515013694763184, -3.624986171722412, -3.298470973968506, -2.9719560146331787, -2.6454408168792725, -2.318925619125366, -1.9924105405807495, -1.6658954620361328, -1.3393802642822266, -1.0128650665283203, -0.6863499879837036, -0.35983484983444214, -0.033319711685180664, 0.2931954860687256, 0.6197105646133423, 0.946225643157959, 1.2727408409118652, 1.5992560386657715, 1.9257711172103882, 2.252286195755005, 2.578801393508911, 2.9053165912628174, 3.2318315505981445, 3.558346748352051, 3.884861946105957, 4.211377143859863, 4.5378923416137695, 4.864407539367676, 5.190922737121582, 5.517437934875488, 5.843952655792236, 6.170467853546143, 6.496983051300049, 6.823498249053955, 7.150013446807861, 7.476528644561768, 7.803043365478516, 8.129558563232422, 8.456073760986328, 8.782588958740234, 9.10910415649414]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 15.0, 9.0, 17.0, 27.0, 26.0, 29.0, 28.0, 46.0, 56.0, 57.0, 84.0, 130.0, 106.0, 81.0, 55.0, 42.0, 32.0, 29.0, 32.0, 24.0, 14.0, 10.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1053006649017334, -2.9970927238464355, -2.8888845443725586, -2.7806766033172607, -2.672468423843384, -2.564260482788086, -2.456052303314209, -2.347844362258911, -2.2396364212036133, -2.1314284801483154, -2.0232203006744385, -1.9150123596191406, -1.8068042993545532, -1.6985962390899658, -1.5903881788253784, -1.482180118560791, -1.3739720582962036, -1.2657639980316162, -1.1575559377670288, -1.0493478775024414, -0.9411399364471436, -0.8329318761825562, -0.7247238159179688, -0.6165158152580261, -0.5083077549934387, -0.4000997245311737, -0.2918916940689087, -0.1836836338043213, -0.07547560334205627, 0.03273242712020874, 0.14094048738479614, 0.24914848804473877, 0.35735654830932617, 0.4655645787715912, 0.5737726092338562, 0.6819806694984436, 0.7901886701583862, 0.8983967304229736, 1.006604790687561, 1.1148128509521484, 1.2230207920074463, 1.3312288522720337, 1.439436912536621, 1.547644853591919, 1.6558529138565063, 1.7640609741210938, 1.8722690343856812, 1.9804770946502686, 2.0886850357055664, 2.1968929767608643, 2.305101156234741, 2.413309097290039, 2.521517276763916, 2.629725217819214, 2.7379331588745117, 2.8461413383483887, 2.9543495178222656, 3.0625574588775635, 3.1707656383514404, 3.2789735794067383, 3.3871817588806152, 3.495389699935913, 3.603597640991211, 3.711805820465088, 3.8200137615203857]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 8.0, 2.0, 4.0, 6.0, 7.0, 21.0, 12.0, 32.0, 53.0, 81.0, 159.0, 286.0, 649.0, 1619.0, 5699.0, 30079.0, 479366.0, 3471106.0, 180894.0, 17869.0, 3916.0, 1294.0, 530.0, 258.0, 128.0, 68.0, 46.0, 33.0, 26.0, 11.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89111328125, -0.8651809692382812, -0.8392486572265625, -0.8133163452148438, -0.787384033203125, -0.7614517211914062, -0.7355194091796875, -0.7095870971679688, -0.68365478515625, -0.6577224731445312, -0.6317901611328125, -0.6058578491210938, -0.579925537109375, -0.5539932250976562, -0.5280609130859375, -0.5021286010742188, -0.4761962890625, -0.45026397705078125, -0.4243316650390625, -0.39839935302734375, -0.372467041015625, -0.34653472900390625, -0.3206024169921875, -0.29467010498046875, -0.26873779296875, -0.24280548095703125, -0.2168731689453125, -0.19094085693359375, -0.165008544921875, -0.13907623291015625, -0.1131439208984375, -0.08721160888671875, -0.061279296875, -0.03534698486328125, -0.0094146728515625, 0.01651763916015625, 0.042449951171875, 0.06838226318359375, 0.0943145751953125, 0.12024688720703125, 0.14617919921875, 0.17211151123046875, 0.1980438232421875, 0.22397613525390625, 0.249908447265625, 0.27584075927734375, 0.3017730712890625, 0.32770538330078125, 0.3536376953125, 0.37957000732421875, 0.4055023193359375, 0.43143463134765625, 0.457366943359375, 0.48329925537109375, 0.5092315673828125, 0.5351638793945312, 0.56109619140625, 0.5870285034179688, 0.6129608154296875, 0.6388931274414062, 0.664825439453125, 0.6907577514648438, 0.7166900634765625, 0.7426223754882812, 0.7685546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 10.0, 11.0, 18.0, 29.0, 21.0, 19.0, 32.0, 41.0, 50.0, 57.0, 62.0, 78.0, 62.0, 74.0, 74.0, 56.0, 47.0, 58.0, 34.0, 37.0, 35.0, 22.0, 22.0, 14.0, 13.0, 12.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15185546875, -0.1450042724609375, -0.138153076171875, -0.1313018798828125, -0.12445068359375, -0.1175994873046875, -0.110748291015625, -0.1038970947265625, -0.0970458984375, -0.0901947021484375, -0.083343505859375, -0.0764923095703125, -0.06964111328125, -0.0627899169921875, -0.055938720703125, -0.0490875244140625, -0.042236328125, -0.0353851318359375, -0.028533935546875, -0.0216827392578125, -0.01483154296875, -0.0079803466796875, -0.001129150390625, 0.0057220458984375, 0.0125732421875, 0.0194244384765625, 0.026275634765625, 0.0331268310546875, 0.03997802734375, 0.0468292236328125, 0.053680419921875, 0.0605316162109375, 0.0673828125, 0.0742340087890625, 0.081085205078125, 0.0879364013671875, 0.09478759765625, 0.1016387939453125, 0.108489990234375, 0.1153411865234375, 0.1221923828125, 0.1290435791015625, 0.135894775390625, 0.1427459716796875, 0.14959716796875, 0.1564483642578125, 0.163299560546875, 0.1701507568359375, 0.177001953125, 0.1838531494140625, 0.190704345703125, 0.1975555419921875, 0.20440673828125, 0.2112579345703125, 0.218109130859375, 0.2249603271484375, 0.2318115234375, 0.2386627197265625, 0.245513916015625, 0.2523651123046875, 0.25921630859375, 0.2660675048828125, 0.272918701171875, 0.2797698974609375, 0.28662109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 11.0, 8.0, 16.0, 11.0, 33.0, 37.0, 68.0, 126.0, 190.0, 354.0, 730.0, 1801.0, 4852.0, 27935.0, 2342841.0, 1780808.0, 26325.0, 4745.0, 1677.0, 797.0, 357.0, 199.0, 103.0, 76.0, 42.0, 22.0, 17.0, 15.0, 12.0, 10.0, 10.0, 4.0, 7.0, 4.0, 1.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3681640625, -1.3290557861328125, -1.289947509765625, -1.2508392333984375, -1.21173095703125, -1.1726226806640625, -1.133514404296875, -1.0944061279296875, -1.0552978515625, -1.0161895751953125, -0.977081298828125, -0.9379730224609375, -0.89886474609375, -0.8597564697265625, -0.820648193359375, -0.7815399169921875, -0.742431640625, -0.7033233642578125, -0.664215087890625, -0.6251068115234375, -0.58599853515625, -0.5468902587890625, -0.507781982421875, -0.4686737060546875, -0.4295654296875, -0.3904571533203125, -0.351348876953125, -0.3122406005859375, -0.27313232421875, -0.2340240478515625, -0.194915771484375, -0.1558074951171875, -0.11669921875, -0.0775909423828125, -0.038482666015625, 0.0006256103515625, 0.03973388671875, 0.0788421630859375, 0.117950439453125, 0.1570587158203125, 0.1961669921875, 0.2352752685546875, 0.274383544921875, 0.3134918212890625, 0.35260009765625, 0.3917083740234375, 0.430816650390625, 0.4699249267578125, 0.509033203125, 0.5481414794921875, 0.587249755859375, 0.6263580322265625, 0.66546630859375, 0.7045745849609375, 0.743682861328125, 0.7827911376953125, 0.8218994140625, 0.8610076904296875, 0.900115966796875, 0.9392242431640625, 0.97833251953125, 1.0174407958984375, 1.056549072265625, 1.0956573486328125, 1.134765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 4.0, 7.0, 22.0, 22.0, 44.0, 74.0, 118.0, 207.0, 425.0, 787.0, 998.0, 607.0, 322.0, 176.0, 113.0, 48.0, 36.0, 15.0, 10.0, 10.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89697265625, -0.8599014282226562, -0.8228302001953125, -0.7857589721679688, -0.748687744140625, -0.7116165161132812, -0.6745452880859375, -0.6374740600585938, -0.60040283203125, -0.5633316040039062, -0.5262603759765625, -0.48918914794921875, -0.452117919921875, -0.41504669189453125, -0.3779754638671875, -0.34090423583984375, -0.3038330078125, -0.26676177978515625, -0.2296905517578125, -0.19261932373046875, -0.155548095703125, -0.11847686767578125, -0.0814056396484375, -0.04433441162109375, -0.00726318359375, 0.02980804443359375, 0.0668792724609375, 0.10395050048828125, 0.141021728515625, 0.17809295654296875, 0.2151641845703125, 0.25223541259765625, 0.289306640625, 0.32637786865234375, 0.3634490966796875, 0.40052032470703125, 0.437591552734375, 0.47466278076171875, 0.5117340087890625, 0.5488052368164062, 0.58587646484375, 0.6229476928710938, 0.6600189208984375, 0.6970901489257812, 0.734161376953125, 0.7712326049804688, 0.8083038330078125, 0.8453750610351562, 0.8824462890625, 0.9195175170898438, 0.9565887451171875, 0.9936599731445312, 1.030731201171875, 1.0678024291992188, 1.1048736572265625, 1.1419448852539062, 1.17901611328125, 1.2160873413085938, 1.2531585693359375, 1.2902297973632812, 1.327301025390625, 1.3643722534179688, 1.4014434814453125, 1.4385147094726562, 1.4755859375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 10.0, 13.0, 35.0, 48.0, 151.0, 269.0, 233.0, 117.0, 54.0, 27.0, 8.0, 9.0, 2.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.487607955932617, -14.043328285217285, -13.599048614501953, -13.154767990112305, -12.710488319396973, -12.26620864868164, -11.821928977966309, -11.377649307250977, -10.933368682861328, -10.489089012145996, -10.044809341430664, -9.600528717041016, -9.156249046325684, -8.711969375610352, -8.26768970489502, -7.8234100341796875, -7.3791303634643555, -6.934850692749023, -6.490570545196533, -6.046290874481201, -5.602010726928711, -5.157731056213379, -4.713451385498047, -4.269171714782715, -3.8248915672302246, -3.3806116580963135, -2.9363317489624023, -2.4920520782470703, -2.047772169113159, -1.603492259979248, -1.159212589263916, -0.7149326801300049, -0.27065181732177734, 0.173628032207489, 0.6179078817367554, 1.062187671661377, 1.506467580795288, 1.9507474899291992, 2.3950271606445312, 2.8393070697784424, 3.2835869789123535, 3.7278668880462646, 4.172146797180176, 4.616426467895508, 5.06070613861084, 5.50498628616333, 5.949265956878662, 6.393546104431152, 6.837825775146484, 7.282105445861816, 7.726385593414307, 8.170665740966797, 8.614945411682129, 9.059225082397461, 9.503504753112793, 9.947784423828125, 10.392065048217773, 10.836344718933105, 11.280624389648438, 11.724905014038086, 12.169184684753418, 12.61346435546875, 13.057744026184082, 13.502023696899414, 13.946303367614746]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 3.0, 12.0, 17.0, 19.0, 22.0, 24.0, 43.0, 45.0, 54.0, 70.0, 72.0, 87.0, 87.0, 91.0, 77.0, 70.0, 53.0, 38.0, 31.0, 25.0, 14.0, 20.0, 6.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.083523750305176, -7.839505672454834, -7.595487117767334, -7.351469039916992, -7.10745096206665, -6.863432884216309, -6.619414329528809, -6.375396251678467, -6.131378173828125, -5.887360095977783, -5.643341541290283, -5.399323463439941, -5.1553053855896, -4.911287307739258, -4.667268753051758, -4.423250675201416, -4.179232120513916, -3.935213804244995, -3.6911957263946533, -3.4471774101257324, -3.2031593322753906, -2.9591410160064697, -2.715122699737549, -2.471104621887207, -2.227086305618286, -1.9830681085586548, -1.7390499114990234, -1.4950315952301025, -1.2510133981704712, -1.0069952011108398, -0.762976884841919, -0.5189586877822876, -0.27494049072265625, -0.030922263860702515, 0.21309596300125122, 0.45711421966552734, 0.7011324167251587, 0.94515061378479, 1.189168930053711, 1.4331871271133423, 1.6772053241729736, 1.921223521232605, 2.1652417182922363, 2.4092600345611572, 2.653278350830078, 2.89729642868042, 3.141314744949341, 3.3853330612182617, 3.6293511390686035, 3.8733694553375244, 4.117387771606445, 4.361405849456787, 4.605423927307129, 4.849442481994629, 5.093460559844971, 5.3374786376953125, 5.5814971923828125, 5.825515270233154, 6.069533824920654, 6.313551902770996, 6.557569980621338, 6.80158805847168, 7.04560661315918, 7.2896246910095215, 7.533642768859863]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 17.0, 17.0, 30.0, 26.0, 44.0, 77.0, 160.0, 210.0, 353.0, 740.0, 1579.0, 3722.0, 11115.0, 41219.0, 243979.0, 604639.0, 106388.0, 22605.0, 6593.0, 2595.0, 1139.0, 550.0, 303.0, 158.0, 107.0, 56.0, 32.0, 24.0, 23.0, 18.0, 9.0, 10.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.414306640625, -0.40256500244140625, -0.3908233642578125, -0.37908172607421875, -0.367340087890625, -0.35559844970703125, -0.3438568115234375, -0.33211517333984375, -0.32037353515625, -0.30863189697265625, -0.2968902587890625, -0.28514862060546875, -0.273406982421875, -0.26166534423828125, -0.2499237060546875, -0.23818206787109375, -0.2264404296875, -0.21469879150390625, -0.2029571533203125, -0.19121551513671875, -0.179473876953125, -0.16773223876953125, -0.1559906005859375, -0.14424896240234375, -0.13250732421875, -0.12076568603515625, -0.1090240478515625, -0.09728240966796875, -0.085540771484375, -0.07379913330078125, -0.0620574951171875, -0.05031585693359375, -0.03857421875, -0.02683258056640625, -0.0150909423828125, -0.00334930419921875, 0.008392333984375, 0.02013397216796875, 0.0318756103515625, 0.04361724853515625, 0.05535888671875, 0.06710052490234375, 0.0788421630859375, 0.09058380126953125, 0.102325439453125, 0.11406707763671875, 0.1258087158203125, 0.13755035400390625, 0.1492919921875, 0.16103363037109375, 0.1727752685546875, 0.18451690673828125, 0.196258544921875, 0.20800018310546875, 0.2197418212890625, 0.23148345947265625, 0.24322509765625, 0.25496673583984375, 0.2667083740234375, 0.27845001220703125, 0.290191650390625, 0.30193328857421875, 0.3136749267578125, 0.32541656494140625, 0.337158203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 9.0, 9.0, 20.0, 24.0, 34.0, 52.0, 50.0, 69.0, 81.0, 73.0, 73.0, 110.0, 96.0, 67.0, 64.0, 52.0, 34.0, 31.0, 20.0, 16.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.34853363037109375, -0.3359832763671875, -0.32343292236328125, -0.310882568359375, -0.29833221435546875, -0.2857818603515625, -0.27323150634765625, -0.26068115234375, -0.24813079833984375, -0.2355804443359375, -0.22303009033203125, -0.210479736328125, -0.19792938232421875, -0.1853790283203125, -0.17282867431640625, -0.1602783203125, -0.14772796630859375, -0.1351776123046875, -0.12262725830078125, -0.110076904296875, -0.09752655029296875, -0.0849761962890625, -0.07242584228515625, -0.05987548828125, -0.04732513427734375, -0.0347747802734375, -0.02222442626953125, -0.009674072265625, 0.00287628173828125, 0.0154266357421875, 0.02797698974609375, 0.04052734375, 0.05307769775390625, 0.0656280517578125, 0.07817840576171875, 0.090728759765625, 0.10327911376953125, 0.1158294677734375, 0.12837982177734375, 0.14093017578125, 0.15348052978515625, 0.1660308837890625, 0.17858123779296875, 0.191131591796875, 0.20368194580078125, 0.2162322998046875, 0.22878265380859375, 0.2413330078125, 0.25388336181640625, 0.2664337158203125, 0.27898406982421875, 0.291534423828125, 0.30408477783203125, 0.3166351318359375, 0.32918548583984375, 0.34173583984375, 0.35428619384765625, 0.3668365478515625, 0.37938690185546875, 0.391937255859375, 0.40448760986328125, 0.4170379638671875, 0.42958831787109375, 0.442138671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 9.0, 5.0, 11.0, 18.0, 21.0, 57.0, 65.0, 111.0, 217.0, 494.0, 1269.0, 4957.0, 41759.0, 927159.0, 63294.0, 6406.0, 1576.0, 532.0, 257.0, 125.0, 68.0, 54.0, 27.0, 20.0, 15.0, 12.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6595535278320312, -0.6399078369140625, -0.6202621459960938, -0.600616455078125, -0.5809707641601562, -0.5613250732421875, -0.5416793823242188, -0.52203369140625, -0.5023880004882812, -0.4827423095703125, -0.46309661865234375, -0.443450927734375, -0.42380523681640625, -0.4041595458984375, -0.38451385498046875, -0.3648681640625, -0.34522247314453125, -0.3255767822265625, -0.30593109130859375, -0.286285400390625, -0.26663970947265625, -0.2469940185546875, -0.22734832763671875, -0.20770263671875, -0.18805694580078125, -0.1684112548828125, -0.14876556396484375, -0.129119873046875, -0.10947418212890625, -0.0898284912109375, -0.07018280029296875, -0.050537109375, -0.03089141845703125, -0.0112457275390625, 0.00839996337890625, 0.028045654296875, 0.04769134521484375, 0.0673370361328125, 0.08698272705078125, 0.10662841796875, 0.12627410888671875, 0.1459197998046875, 0.16556549072265625, 0.185211181640625, 0.20485687255859375, 0.2245025634765625, 0.24414825439453125, 0.2637939453125, 0.28343963623046875, 0.3030853271484375, 0.32273101806640625, 0.342376708984375, 0.36202239990234375, 0.3816680908203125, 0.40131378173828125, 0.42095947265625, 0.44060516357421875, 0.4602508544921875, 0.47989654541015625, 0.499542236328125, 0.5191879272460938, 0.5388336181640625, 0.5584793090820312, 0.578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 11.0, 5.0, 4.0, 10.0, 14.0, 26.0, 29.0, 33.0, 28.0, 43.0, 80.0, 86.0, 109.0, 120.0, 83.0, 90.0, 54.0, 46.0, 32.0, 27.0, 21.0, 11.0, 10.0, 14.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.44403076171875, -1.3978271484375, -1.35162353515625, -1.305419921875, -1.25921630859375, -1.2130126953125, -1.16680908203125, -1.12060546875, -1.07440185546875, -1.0281982421875, -0.98199462890625, -0.935791015625, -0.88958740234375, -0.8433837890625, -0.79718017578125, -0.7509765625, -0.70477294921875, -0.6585693359375, -0.61236572265625, -0.566162109375, -0.51995849609375, -0.4737548828125, -0.42755126953125, -0.38134765625, -0.33514404296875, -0.2889404296875, -0.24273681640625, -0.196533203125, -0.15032958984375, -0.1041259765625, -0.05792236328125, -0.01171875, 0.03448486328125, 0.0806884765625, 0.12689208984375, 0.173095703125, 0.21929931640625, 0.2655029296875, 0.31170654296875, 0.35791015625, 0.40411376953125, 0.4503173828125, 0.49652099609375, 0.542724609375, 0.58892822265625, 0.6351318359375, 0.68133544921875, 0.7275390625, 0.77374267578125, 0.8199462890625, 0.86614990234375, 0.912353515625, 0.95855712890625, 1.0047607421875, 1.05096435546875, 1.09716796875, 1.14337158203125, 1.1895751953125, 1.23577880859375, 1.281982421875, 1.32818603515625, 1.3743896484375, 1.42059326171875, 1.466796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 7.0, 11.0, 14.0, 15.0, 24.0, 43.0, 31.0, 63.0, 89.0, 149.0, 223.0, 389.0, 735.0, 1512.0, 3619.0, 9903.0, 39305.0, 779845.0, 175079.0, 24639.0, 7394.0, 2721.0, 1173.0, 594.0, 361.0, 202.0, 138.0, 69.0, 51.0, 42.0, 33.0, 20.0, 6.0, 13.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06195068359375, -0.05987548828125, -0.05780029296875, -0.05572509765625, -0.05364990234375, -0.05157470703125, -0.04949951171875, -0.04742431640625, -0.04534912109375, -0.04327392578125, -0.04119873046875, -0.03912353515625, -0.03704833984375, -0.03497314453125, -0.03289794921875, -0.03082275390625, -0.02874755859375, -0.02667236328125, -0.02459716796875, -0.02252197265625, -0.02044677734375, -0.01837158203125, -0.01629638671875, -0.01422119140625, -0.01214599609375, -0.01007080078125, -0.00799560546875, -0.00592041015625, -0.00384521484375, -0.00177001953125, 0.00030517578125, 0.00238037109375, 0.00445556640625, 0.00653076171875, 0.00860595703125, 0.01068115234375, 0.01275634765625, 0.01483154296875, 0.01690673828125, 0.01898193359375, 0.02105712890625, 0.02313232421875, 0.02520751953125, 0.02728271484375, 0.02935791015625, 0.03143310546875, 0.03350830078125, 0.03558349609375, 0.03765869140625, 0.03973388671875, 0.04180908203125, 0.04388427734375, 0.04595947265625, 0.04803466796875, 0.05010986328125, 0.05218505859375, 0.05426025390625, 0.05633544921875, 0.05841064453125, 0.06048583984375, 0.06256103515625, 0.06463623046875, 0.06671142578125, 0.06878662109375, 0.07086181640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 5.0, 4.0, 8.0, 5.0, 14.0, 14.0, 20.0, 27.0, 33.0, 59.0, 73.0, 87.0, 92.0, 87.0, 95.0, 89.0, 58.0, 51.0, 29.0, 30.0, 16.0, 14.0, 18.0, 9.0, 9.0, 9.0, 8.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3543834686279297e-05, -2.2739171981811523e-05, -2.193450927734375e-05, -2.1129846572875977e-05, -2.0325183868408203e-05, -1.952052116394043e-05, -1.8715858459472656e-05, -1.7911195755004883e-05, -1.710653305053711e-05, -1.6301870346069336e-05, -1.5497207641601562e-05, -1.4692544937133789e-05, -1.3887882232666016e-05, -1.3083219528198242e-05, -1.2278556823730469e-05, -1.1473894119262695e-05, -1.0669231414794922e-05, -9.864568710327148e-06, -9.059906005859375e-06, -8.255243301391602e-06, -7.450580596923828e-06, -6.645917892456055e-06, -5.841255187988281e-06, -5.036592483520508e-06, -4.231929779052734e-06, -3.427267074584961e-06, -2.6226043701171875e-06, -1.817941665649414e-06, -1.0132789611816406e-06, -2.086162567138672e-07, 5.960464477539062e-07, 1.4007091522216797e-06, 2.205371856689453e-06, 3.0100345611572266e-06, 3.814697265625e-06, 4.6193599700927734e-06, 5.424022674560547e-06, 6.22868537902832e-06, 7.033348083496094e-06, 7.838010787963867e-06, 8.64267349243164e-06, 9.447336196899414e-06, 1.0251998901367188e-05, 1.1056661605834961e-05, 1.1861324310302734e-05, 1.2665987014770508e-05, 1.3470649719238281e-05, 1.4275312423706055e-05, 1.5079975128173828e-05, 1.58846378326416e-05, 1.6689300537109375e-05, 1.749396324157715e-05, 1.8298625946044922e-05, 1.9103288650512695e-05, 1.990795135498047e-05, 2.0712614059448242e-05, 2.1517276763916016e-05, 2.232193946838379e-05, 2.3126602172851562e-05, 2.3931264877319336e-05, 2.473592758178711e-05, 2.5540590286254883e-05, 2.6345252990722656e-05, 2.714991569519043e-05, 2.7954578399658203e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 10.0, 15.0, 12.0, 22.0, 32.0, 47.0, 76.0, 122.0, 217.0, 323.0, 697.0, 1242.0, 2780.0, 6594.0, 20306.0, 93633.0, 819907.0, 73873.0, 17553.0, 6072.0, 2501.0, 1131.0, 586.0, 305.0, 177.0, 106.0, 69.0, 41.0, 20.0, 20.0, 14.0, 11.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07025146484375, -0.06815052032470703, -0.06604957580566406, -0.0639486312866211, -0.061847686767578125, -0.059746742248535156, -0.05764579772949219, -0.05554485321044922, -0.05344390869140625, -0.05134296417236328, -0.04924201965332031, -0.047141075134277344, -0.045040130615234375, -0.042939186096191406, -0.04083824157714844, -0.03873729705810547, -0.0366363525390625, -0.03453540802001953, -0.03243446350097656, -0.030333518981933594, -0.028232574462890625, -0.026131629943847656, -0.024030685424804688, -0.02192974090576172, -0.01982879638671875, -0.01772785186767578, -0.015626907348632812, -0.013525962829589844, -0.011425018310546875, -0.009324073791503906, -0.0072231292724609375, -0.005122184753417969, -0.003021240234375, -0.0009202957153320312, 0.0011806488037109375, 0.0032815933227539062, 0.005382537841796875, 0.007483482360839844, 0.009584426879882812, 0.011685371398925781, 0.01378631591796875, 0.01588726043701172, 0.017988204956054688, 0.020089149475097656, 0.022190093994140625, 0.024291038513183594, 0.026391983032226562, 0.02849292755126953, 0.0305938720703125, 0.03269481658935547, 0.03479576110839844, 0.036896705627441406, 0.038997650146484375, 0.041098594665527344, 0.04319953918457031, 0.04530048370361328, 0.04740142822265625, 0.04950237274169922, 0.05160331726074219, 0.053704261779785156, 0.055805206298828125, 0.057906150817871094, 0.06000709533691406, 0.06210803985595703, 0.064208984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 2.0, 5.0, 4.0, 11.0, 11.0, 9.0, 16.0, 22.0, 33.0, 38.0, 60.0, 123.0, 168.0, 156.0, 114.0, 68.0, 45.0, 26.0, 23.0, 13.0, 18.0, 4.0, 8.0, 4.0, 3.0, 1.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13427734375, -0.1302051544189453, -0.12613296508789062, -0.12206077575683594, -0.11798858642578125, -0.11391639709472656, -0.10984420776367188, -0.10577201843261719, -0.1016998291015625, -0.09762763977050781, -0.09355545043945312, -0.08948326110839844, -0.08541107177734375, -0.08133888244628906, -0.07726669311523438, -0.07319450378417969, -0.069122314453125, -0.06505012512207031, -0.060977935791015625, -0.05690574645996094, -0.05283355712890625, -0.04876136779785156, -0.044689178466796875, -0.04061698913574219, -0.0365447998046875, -0.03247261047363281, -0.028400421142578125, -0.024328231811523438, -0.02025604248046875, -0.016183853149414062, -0.012111663818359375, -0.008039474487304688, -0.00396728515625, 0.0001049041748046875, 0.004177093505859375, 0.008249282836914062, 0.01232147216796875, 0.016393661499023438, 0.020465850830078125, 0.024538040161132812, 0.0286102294921875, 0.03268241882324219, 0.036754608154296875, 0.04082679748535156, 0.04489898681640625, 0.04897117614746094, 0.053043365478515625, 0.05711555480957031, 0.061187744140625, 0.06525993347167969, 0.06933212280273438, 0.07340431213378906, 0.07747650146484375, 0.08154869079589844, 0.08562088012695312, 0.08969306945800781, 0.0937652587890625, 0.09783744812011719, 0.10190963745117188, 0.10598182678222656, 0.11005401611328125, 0.11412620544433594, 0.11819839477539062, 0.12227058410644531, 0.1263427734375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 15.0, 32.0, 70.0, 232.0, 488.0, 104.0, 32.0, 10.0, 9.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5393590927124023, -3.2913997173309326, -3.043440341949463, -2.7954812049865723, -2.5475218296051025, -2.299562454223633, -2.051603317260742, -1.8036439418792725, -1.5556845664978027, -1.307725191116333, -1.0597659349441528, -0.8118066191673279, -0.5638473033905029, -0.3158879280090332, -0.06792867183685303, 0.18003058433532715, 0.4279899597167969, 0.6759492754936218, 0.9239085912704468, 1.171867847442627, 1.4198272228240967, 1.6677865982055664, 1.9157458543777466, 2.1637051105499268, 2.4116644859313965, 2.659623861312866, 2.907583236694336, 3.1555423736572266, 3.4035017490386963, 3.651461124420166, 3.8994202613830566, 4.1473798751831055, 4.395339012145996, 4.643298149108887, 4.8912577629089355, 5.139216899871826, 5.387176513671875, 5.635135650634766, 5.883094787597656, 6.131053924560547, 6.379013538360596, 6.626972675323486, 6.874932289123535, 7.122891426086426, 7.370850563049316, 7.618810176849365, 7.866769313812256, 8.114728927612305, 8.362688064575195, 8.610647201538086, 8.858606338500977, 9.106566429138184, 9.354525566101074, 9.602484703063965, 9.850443840026855, 10.098402976989746, 10.346363067626953, 10.594322204589844, 10.842281341552734, 11.090241432189941, 11.338200569152832, 11.586159706115723, 11.834118843078613, 12.082077980041504, 12.330037117004395]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 27.0, 22.0, 37.0, 33.0, 47.0, 88.0, 137.0, 181.0, 170.0, 65.0, 51.0, 24.0, 18.0, 15.0, 16.0, 10.0, 14.0, 12.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.862760543823242, -3.698683738708496, -3.53460693359375, -3.370530128479004, -3.206453323364258, -3.0423765182495117, -2.8782994747161865, -2.7142226696014404, -2.5501458644866943, -2.3860690593719482, -2.221992254257202, -2.057915449142456, -1.8938385248184204, -1.7297617197036743, -1.5656847953796387, -1.4016079902648926, -1.2375311851501465, -1.0734543800354004, -0.9093775153160095, -0.7453006505966187, -0.5812238454818726, -0.41714704036712646, -0.2530701756477356, -0.08899331092834473, 0.07508349418640137, 0.23916032910346985, 0.40323716402053833, 0.5673140287399292, 0.7313908338546753, 0.8954676389694214, 1.059544563293457, 1.2236213684082031, 1.3876981735229492, 1.5517749786376953, 1.7158517837524414, 1.879928708076477, 2.0440053939819336, 2.2080821990966797, 2.372159242630005, 2.536236047744751, 2.700312852859497, 2.864389657974243, 3.0284664630889893, 3.1925432682037354, 3.3566203117370605, 3.5206971168518066, 3.6847739219665527, 3.848850727081299, 4.012927532196045, 4.177004337310791, 4.341081142425537, 4.505157947540283, 4.669234752655029, 4.833311557769775, 4.9973883628845215, 5.161465644836426, 5.325542449951172, 5.489619255065918, 5.653696060180664, 5.81777286529541, 5.981849670410156, 6.145926475524902, 6.310003280639648, 6.4740800857543945, 6.638156890869141]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 12.0, 12.0, 9.0, 20.0, 26.0, 27.0, 42.0, 49.0, 55.0, 193.0, 260.0, 63.0, 48.0, 49.0, 43.0, 19.0, 18.0, 12.0, 18.0, 11.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.4104042053222656, -0.39868927001953125, -0.3869743347167969, -0.3752593994140625, -0.3635444641113281, -0.35182952880859375, -0.3401145935058594, -0.328399658203125, -0.3166847229003906, -0.30496978759765625, -0.2932548522949219, -0.2815399169921875, -0.2698249816894531, -0.25811004638671875, -0.24639511108398438, -0.23468017578125, -0.22296524047851562, -0.21125030517578125, -0.19953536987304688, -0.1878204345703125, -0.17610549926757812, -0.16439056396484375, -0.15267562866210938, -0.140960693359375, -0.12924575805664062, -0.11753082275390625, -0.10581588745117188, -0.0941009521484375, -0.08238601684570312, -0.07067108154296875, -0.058956146240234375, -0.0472412109375, -0.035526275634765625, -0.02381134033203125, -0.012096405029296875, -0.0003814697265625, 0.011333465576171875, 0.02304840087890625, 0.034763336181640625, 0.046478271484375, 0.058193206787109375, 0.06990814208984375, 0.08162307739257812, 0.0933380126953125, 0.10505294799804688, 0.11676788330078125, 0.12848281860351562, 0.14019775390625, 0.15191268920898438, 0.16362762451171875, 0.17534255981445312, 0.1870574951171875, 0.19877243041992188, 0.21048736572265625, 0.22220230102539062, 0.233917236328125, 0.24563217163085938, 0.25734710693359375, 0.2690620422363281, 0.2807769775390625, 0.2924919128417969, 0.30420684814453125, 0.3159217834472656, 0.32763671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 6.0, 20.0, 22.0, 47.0, 50.0, 94.0, 205.0, 469.0, 1528.0, 7696.0, 8334815.0, 38486.0, 3495.0, 904.0, 330.0, 151.0, 89.0, 56.0, 32.0, 23.0, 18.0, 8.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.9818265438079834, -3.879146099090576, -3.77646541595459, -3.6737849712371826, -3.5711042881011963, -3.468423843383789, -3.3657431602478027, -3.2630627155303955, -3.1603822708129883, -3.057701826095581, -2.9550211429595947, -2.8523406982421875, -2.749660015106201, -2.646979570388794, -2.5442991256713867, -2.4416184425354004, -2.338937759399414, -2.236257314682007, -2.1335766315460205, -2.0308961868286133, -1.9282156229019165, -1.8255350589752197, -1.722854495048523, -1.6201739311218262, -1.517493486404419, -1.4148129224777222, -1.3121323585510254, -1.2094519138336182, -1.1067713499069214, -1.0040907859802246, -0.9014102220535278, -0.7987297177314758, -0.6960492134094238, -0.593368649482727, -0.49068814516067505, -0.38800758123397827, -0.2853270471096039, -0.1826465129852295, -0.07996594905853271, 0.022714555263519287, 0.12539511919021606, 0.22807565331459045, 0.33075618743896484, 0.4334367513656616, 0.5361173152923584, 0.6387978196144104, 0.7414783835411072, 0.8441588878631592, 0.946839451789856, 1.0495200157165527, 1.1522005796432495, 1.2548811435699463, 1.3575615882873535, 1.4602421522140503, 1.562922716140747, 1.6656031608581543, 1.7682838439941406, 1.8709644079208374, 1.9736449718475342, 2.0763254165649414, 2.1790060997009277, 2.281686544418335, 2.384366989135742, 2.4870476722717285, 2.5897281169891357]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 1.0, 1.0, 3.0, 8.0, 1.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.363250732421875, -4.21594762802124, -4.068645000457764, -3.921341896057129, -3.7740390300750732, -3.6267361640930176, -3.479433059692383, -3.332130193710327, -3.1848273277282715, -3.037524461746216, -2.89022159576416, -2.7429184913635254, -2.5956156253814697, -2.448312759399414, -2.3010096549987793, -2.1537067890167236, -2.006403923034668, -1.8591010570526123, -1.711798071861267, -1.5644950866699219, -1.4171922206878662, -1.2698893547058105, -1.1225863695144653, -0.9752833843231201, -0.8279805183410645, -0.680677592754364, -0.5333746671676636, -0.38607174158096313, -0.2387688159942627, -0.09146589040756226, 0.055837035179138184, 0.2031400203704834, 0.35044240951538086, 0.4977453351020813, 0.6450482606887817, 0.7923511862754822, 0.9396541118621826, 1.0869569778442383, 1.2342599630355835, 1.3815629482269287, 1.5288658142089844, 1.67616868019104, 1.8234716653823853, 1.9707746505737305, 2.118077516555786, 2.265380382537842, 2.4126834869384766, 2.5599863529205322, 2.707289218902588, 2.8545920848846436, 3.001894950866699, 3.149198055267334, 3.2965009212493896, 3.4438037872314453, 3.59110689163208, 3.7384097576141357, 3.8857126235961914, 4.033015727996826, 4.180318355560303, 4.3276214599609375, 4.474924087524414, 4.622227191925049, 4.769530296325684, 4.91683292388916, 5.064136028289795]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 9.0, 6.0, 17.0, 18.0, 18.0, 33.0, 38.0, 74.0, 104.0, 136.0, 238.0, 417.0, 679.0, 1239.0, 2526.0, 5244.0, 11636.0, 25904.0, 58287.0, 122839.0, 148148.0, 80688.0, 35853.0, 15720.0, 7145.0, 3309.0, 1691.0, 896.0, 474.0, 289.0, 180.0, 108.0, 85.0, 46.0, 37.0, 38.0, 22.0, 23.0, 15.0, 14.0, 8.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.3087158203125, -1.263916015625, -1.2191162109375, -1.17431640625, -1.1295166015625, -1.084716796875, -1.0399169921875, -0.9951171875, -0.9503173828125, -0.905517578125, -0.8607177734375, -0.81591796875, -0.7711181640625, -0.726318359375, -0.6815185546875, -0.63671875, -0.5919189453125, -0.547119140625, -0.5023193359375, -0.45751953125, -0.4127197265625, -0.367919921875, -0.3231201171875, -0.2783203125, -0.2335205078125, -0.188720703125, -0.1439208984375, -0.09912109375, -0.0543212890625, -0.009521484375, 0.0352783203125, 0.080078125, 0.1248779296875, 0.169677734375, 0.2144775390625, 0.25927734375, 0.3040771484375, 0.348876953125, 0.3936767578125, 0.4384765625, 0.4832763671875, 0.528076171875, 0.5728759765625, 0.61767578125, 0.6624755859375, 0.707275390625, 0.7520751953125, 0.796875, 0.8416748046875, 0.886474609375, 0.9312744140625, 0.97607421875, 1.0208740234375, 1.065673828125, 1.1104736328125, 1.1552734375, 1.2000732421875, 1.244873046875, 1.2896728515625, 1.33447265625, 1.3792724609375, 1.424072265625, 1.4688720703125, 1.513671875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 9.0, 25.0, 27.0, 43.0, 65.0, 116.0, 99.0, 120.0, 144.0, 89.0, 78.0, 55.0, 34.0, 28.0, 26.0, 12.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67041015625, -0.652801513671875, -0.63519287109375, -0.617584228515625, -0.5999755859375, -0.582366943359375, -0.56475830078125, -0.547149658203125, -0.529541015625, -0.511932373046875, -0.49432373046875, -0.476715087890625, -0.4591064453125, -0.441497802734375, -0.42388916015625, -0.406280517578125, -0.388671875, -0.371063232421875, -0.35345458984375, -0.335845947265625, -0.3182373046875, -0.300628662109375, -0.28302001953125, -0.265411376953125, -0.247802734375, -0.230194091796875, -0.21258544921875, -0.194976806640625, -0.1773681640625, -0.159759521484375, -0.14215087890625, -0.124542236328125, -0.10693359375, -0.089324951171875, -0.07171630859375, -0.054107666015625, -0.0364990234375, -0.018890380859375, -0.00128173828125, 0.016326904296875, 0.033935546875, 0.051544189453125, 0.06915283203125, 0.086761474609375, 0.1043701171875, 0.121978759765625, 0.13958740234375, 0.157196044921875, 0.1748046875, 0.192413330078125, 0.21002197265625, 0.227630615234375, 0.2452392578125, 0.262847900390625, 0.28045654296875, 0.298065185546875, 0.315673828125, 0.333282470703125, 0.35089111328125, 0.368499755859375, 0.3861083984375, 0.403717041015625, 0.42132568359375, 0.438934326171875, 0.45654296875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 19.0, 25.0, 63.0, 84.0, 109.0, 62.0, 32.0, 29.0, 16.0, 16.0, 8.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640334129333496, -4.501906394958496, -4.363478183746338, -4.225050449371338, -4.086622714996338, -3.948194742202759, -3.8097667694091797, -3.6713390350341797, -3.5329113006591797, -3.3944833278656006, -3.2560555934906006, -3.1176276206970215, -2.9791998863220215, -2.8407719135284424, -2.7023439407348633, -2.5639162063598633, -2.425488233566284, -2.287060260772705, -2.148632526397705, -2.010204553604126, -1.871776819229126, -1.7333488464355469, -1.5949209928512573, -1.4564931392669678, -1.3180652856826782, -1.1796374320983887, -1.0412095785140991, -0.9027816653251648, -0.7643538117408752, -0.6259259581565857, -0.48749804496765137, -0.3490701913833618, -0.21064233779907227, -0.07221446931362152, 0.06621339917182922, 0.20464128255844116, 0.3430691361427307, 0.48149698972702026, 0.6199249029159546, 0.7583527565002441, 0.8967806100845337, 1.0352084636688232, 1.1736363172531128, 1.3120641708374023, 1.4504921436309814, 1.5889198780059814, 1.7273478507995605, 1.86577570438385, 2.0042035579681396, 2.1426315307617188, 2.2810592651367188, 2.419487237930298, 2.557914972305298, 2.696342945098877, 2.834770679473877, 2.973198652267456, 3.111626625061035, 3.2500545978546143, 3.3884823322296143, 3.5269103050231934, 3.6653380393981934, 3.8037660121917725, 3.9421939849853516, 4.080621719360352, 4.219049453735352]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 1.0, 7.0, 8.0, 19.0, 15.0, 28.0, 32.0, 32.0, 52.0, 45.0, 42.0, 51.0, 33.0, 23.0, 17.0, 17.0, 13.0, 11.0, 10.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310678005218506, -3.2163918018341064, -3.122105598449707, -3.0278191566467285, -2.933532953262329, -2.8392467498779297, -2.7449605464935303, -2.650674343109131, -2.5563879013061523, -2.462101697921753, -2.3678154945373535, -2.273529052734375, -2.1792428493499756, -2.084956645965576, -1.9906704425811768, -1.8963841199874878, -1.8020979166030884, -1.707811713218689, -1.613525390625, -1.5192391872406006, -1.4249528646469116, -1.3306666612625122, -1.2363803386688232, -1.1420941352844238, -1.0478079319000244, -0.9535216689109802, -0.859235405921936, -0.7649492025375366, -0.6706628799438477, -0.5763766765594482, -0.48209041357040405, -0.38780415058135986, -0.2935178279876709, -0.1992315649986267, -0.10494531691074371, -0.010659068822860718, 0.08362719416618347, 0.17791345715522766, 0.27219969034194946, 0.36648595333099365, 0.46077221632003784, 0.555058479309082, 0.6493447422981262, 0.7436310052871704, 0.8379172086715698, 0.9322035312652588, 1.0264897346496582, 1.1207759380340576, 1.2150622606277466, 1.309348464012146, 1.403634786605835, 1.4979209899902344, 1.5922073125839233, 1.6864935159683228, 1.7807798385620117, 1.8750660419464111, 1.9693522453308105, 2.06363844871521, 2.1579246520996094, 2.252211093902588, 2.3464972972869873, 2.4407835006713867, 2.535069704055786, 2.6293559074401855, 2.723642349243164]}, "eval/loss": 4.82772970199585, "eval/wer": 2.4284212614042047, "eval/runtime": 1118.0617, "eval/samples_per_second": 2.363, "eval/steps_per_second": 0.296, "train/train_runtime": 6324.9374, "train/train_samples_per_second": 4.512, "train/train_steps_per_second": 0.141, "train/total_flos": 0.0, "train/train_loss": 4.944881099221952, "_wandb": {"runtime": 7800}} \ No newline at end of file