diff --git "a/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" "b/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 3.4828, "train/learning_rate": 9.11163895486936e-05, "train/epoch": 2.8, "train/global_step": 2500, "_runtime": 15842, "_timestamp": 1647609720, "_step": 2500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 29.0, 55.0, 108.0, 194.0, 237.0, 180.0, 107.0, 59.0, 26.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.772192001342773, -19.59417152404785, -18.41615104675293, -17.238130569458008, -16.060108184814453, -14.882088661193848, -13.70406723022461, -12.526046752929688, -11.348026275634766, -10.170005798339844, -8.991985321044922, -7.813963890075684, -6.635943412780762, -5.45792293548584, -4.27990198135376, -3.1018810272216797, -1.9238605499267578, -0.7458398342132568, 0.43218088150024414, 1.6102015972137451, 2.788222312927246, 3.966242790222168, 5.144263744354248, 6.322284698486328, 7.50030517578125, 8.678325653076172, 9.856346130371094, 11.034367561340332, 12.212388038635254, 13.390408515930176, 14.568429946899414, 15.746450424194336, 16.924468994140625, 18.102489471435547, 19.28050994873047, 20.45853042602539, 21.636550903320312, 22.814571380615234, 23.99259376525879, 25.17061424255371, 26.348634719848633, 27.526655197143555, 28.704675674438477, 29.8826961517334, 31.060718536376953, 32.238739013671875, 33.4167594909668, 34.59477996826172, 35.77280044555664, 36.95082092285156, 38.128841400146484, 39.306861877441406, 40.48488235473633, 41.66290283203125, 42.84092330932617, 44.018943786621094, 45.19696807861328, 46.3749885559082, 47.553009033203125, 48.73102951049805, 49.90904998779297, 51.08707046508789, 52.26509094238281, 53.443115234375, 54.621131896972656]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 7.0, 7.0, 8.0, 18.0, 21.0, 23.0, 20.0, 32.0, 34.0, 35.0, 43.0, 58.0, 54.0, 56.0, 76.0, 61.0, 60.0, 64.0, 50.0, 45.0, 43.0, 34.0, 31.0, 26.0, 20.0, 12.0, 13.0, 11.0, 14.0, 15.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.710323333740234, -42.62649917602539, -41.54267120361328, -40.45884704589844, -39.375022888183594, -38.291194915771484, -37.20737075805664, -36.1235466003418, -35.03971862792969, -33.955894470214844, -32.872066497802734, -31.78824234008789, -30.704416275024414, -29.620590209960938, -28.536766052246094, -27.452939987182617, -26.369115829467773, -25.285289764404297, -24.201465606689453, -23.117639541625977, -22.0338134765625, -20.949989318847656, -19.86616325378418, -18.782337188720703, -17.69851303100586, -16.614686965942383, -15.530861854553223, -14.447036743164062, -13.363210678100586, -12.279385566711426, -11.195560455322266, -10.111734390258789, -9.02790641784668, -7.944080829620361, -6.860255241394043, -5.776430130004883, -4.6926045417785645, -3.608778953552246, -2.524953842163086, -1.4411282539367676, -0.3573026657104492, 0.7265228033065796, 1.8103482723236084, 2.8941736221313477, 3.977999210357666, 5.061824798583984, 6.1456499099731445, 7.229475498199463, 8.313301086425781, 9.397126197814941, 10.480952262878418, 11.564777374267578, 12.648603439331055, 13.732428550720215, 14.816253662109375, 15.900079727172852, 16.983905792236328, 18.067731857299805, 19.15155601501465, 20.235382080078125, 21.3192081451416, 22.403034210205078, 23.486858367919922, 24.5706844329834, 25.654508590698242]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 9.0, 11.0, 10.0, 10.0, 13.0, 10.0, 21.0, 10.0, 24.0, 34.0, 33.0, 29.0, 31.0, 48.0, 38.0, 50.0, 42.0, 51.0, 52.0, 51.0, 40.0, 39.0, 48.0, 44.0, 45.0, 29.0, 34.0, 15.0, 11.0, 21.0, 13.0, 19.0, 8.0, 12.0, 10.0, 6.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3212890625, -1.280242919921875, -1.23919677734375, -1.198150634765625, -1.1571044921875, -1.116058349609375, -1.07501220703125, -1.033966064453125, -0.992919921875, -0.951873779296875, -0.91082763671875, -0.869781494140625, -0.8287353515625, -0.787689208984375, -0.74664306640625, -0.705596923828125, -0.66455078125, -0.623504638671875, -0.58245849609375, -0.541412353515625, -0.5003662109375, -0.459320068359375, -0.41827392578125, -0.377227783203125, -0.336181640625, -0.295135498046875, -0.25408935546875, -0.213043212890625, -0.1719970703125, -0.130950927734375, -0.08990478515625, -0.048858642578125, -0.0078125, 0.033233642578125, 0.07427978515625, 0.115325927734375, 0.1563720703125, 0.197418212890625, 0.23846435546875, 0.279510498046875, 0.320556640625, 0.361602783203125, 0.40264892578125, 0.443695068359375, 0.4847412109375, 0.525787353515625, 0.56683349609375, 0.607879638671875, 0.64892578125, 0.689971923828125, 0.73101806640625, 0.772064208984375, 0.8131103515625, 0.854156494140625, 0.89520263671875, 0.936248779296875, 0.977294921875, 1.018341064453125, 1.05938720703125, 1.100433349609375, 1.1414794921875, 1.182525634765625, 1.22357177734375, 1.264617919921875, 1.3056640625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 4.0, 10.0, 12.0, 25.0, 31.0, 44.0, 73.0, 114.0, 151.0, 296.0, 536.0, 1098.0, 2758.0, 8539.0, 43977.0, 475710.0, 3115904.0, 489514.0, 42823.0, 7803.0, 2439.0, 1061.0, 539.0, 291.0, 179.0, 114.0, 67.0, 57.0, 30.0, 30.0, 18.0, 9.0, 10.0, 7.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.5374755859375, -4.352294921875, -4.1671142578125, -3.98193359375, -3.7967529296875, -3.611572265625, -3.4263916015625, -3.2412109375, -3.0560302734375, -2.870849609375, -2.6856689453125, -2.50048828125, -2.3153076171875, -2.130126953125, -1.9449462890625, -1.759765625, -1.5745849609375, -1.389404296875, -1.2042236328125, -1.01904296875, -0.8338623046875, -0.648681640625, -0.4635009765625, -0.2783203125, -0.0931396484375, 0.092041015625, 0.2772216796875, 0.46240234375, 0.6475830078125, 0.832763671875, 1.0179443359375, 1.203125, 1.3883056640625, 1.573486328125, 1.7586669921875, 1.94384765625, 2.1290283203125, 2.314208984375, 2.4993896484375, 2.6845703125, 2.8697509765625, 3.054931640625, 3.2401123046875, 3.42529296875, 3.6104736328125, 3.795654296875, 3.9808349609375, 4.166015625, 4.3511962890625, 4.536376953125, 4.7215576171875, 4.90673828125, 5.0919189453125, 5.277099609375, 5.4622802734375, 5.6474609375, 5.8326416015625, 6.017822265625, 6.2030029296875, 6.38818359375, 6.5733642578125, 6.758544921875, 6.9437255859375, 7.12890625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 15.0, 9.0, 18.0, 29.0, 30.0, 48.0, 78.0, 128.0, 206.0, 294.0, 447.0, 552.0, 627.0, 496.0, 338.0, 220.0, 206.0, 109.0, 78.0, 56.0, 32.0, 20.0, 17.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.859375, -4.66558837890625, -4.4718017578125, -4.27801513671875, -4.084228515625, -3.89044189453125, -3.6966552734375, -3.50286865234375, -3.30908203125, -3.11529541015625, -2.9215087890625, -2.72772216796875, -2.533935546875, -2.34014892578125, -2.1463623046875, -1.95257568359375, -1.7587890625, -1.56500244140625, -1.3712158203125, -1.17742919921875, -0.983642578125, -0.78985595703125, -0.5960693359375, -0.40228271484375, -0.20849609375, -0.01470947265625, 0.1790771484375, 0.37286376953125, 0.566650390625, 0.76043701171875, 0.9542236328125, 1.14801025390625, 1.341796875, 1.53558349609375, 1.7293701171875, 1.92315673828125, 2.116943359375, 2.31072998046875, 2.5045166015625, 2.69830322265625, 2.89208984375, 3.08587646484375, 3.2796630859375, 3.47344970703125, 3.667236328125, 3.86102294921875, 4.0548095703125, 4.24859619140625, 4.4423828125, 4.63616943359375, 4.8299560546875, 5.02374267578125, 5.217529296875, 5.41131591796875, 5.6051025390625, 5.79888916015625, 5.99267578125, 6.18646240234375, 6.3802490234375, 6.57403564453125, 6.767822265625, 6.96160888671875, 7.1553955078125, 7.34918212890625, 7.54296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 8.0, 13.0, 31.0, 28.0, 71.0, 88.0, 162.0, 352.0, 615.0, 1309.0, 3353.0, 28007.0, 3100188.0, 1043290.0, 11843.0, 2565.0, 1175.0, 539.0, 262.0, 155.0, 82.0, 55.0, 39.0, 16.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.375, -17.759765625, -17.14453125, -16.529296875, -15.9140625, -15.298828125, -14.68359375, -14.068359375, -13.453125, -12.837890625, -12.22265625, -11.607421875, -10.9921875, -10.376953125, -9.76171875, -9.146484375, -8.53125, -7.916015625, -7.30078125, -6.685546875, -6.0703125, -5.455078125, -4.83984375, -4.224609375, -3.609375, -2.994140625, -2.37890625, -1.763671875, -1.1484375, -0.533203125, 0.08203125, 0.697265625, 1.3125, 1.927734375, 2.54296875, 3.158203125, 3.7734375, 4.388671875, 5.00390625, 5.619140625, 6.234375, 6.849609375, 7.46484375, 8.080078125, 8.6953125, 9.310546875, 9.92578125, 10.541015625, 11.15625, 11.771484375, 12.38671875, 13.001953125, 13.6171875, 14.232421875, 14.84765625, 15.462890625, 16.078125, 16.693359375, 17.30859375, 17.923828125, 18.5390625, 19.154296875, 19.76953125, 20.384765625, 21.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 140.0, 567.0, 281.0, 19.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-158.06431579589844, -155.22000122070312, -152.37570190429688, -149.53138732910156, -146.68707275390625, -143.84275817871094, -140.99844360351562, -138.15414428710938, -135.30982971191406, -132.46551513671875, -129.6212158203125, -126.77690124511719, -123.93258666992188, -121.08827209472656, -118.24396514892578, -115.399658203125, -112.55534362792969, -109.71102905273438, -106.8667221069336, -104.02241516113281, -101.1781005859375, -98.33378601074219, -95.4894790649414, -92.64517211914062, -89.80085754394531, -86.95654296875, -84.11223602294922, -81.26792907714844, -78.42361450195312, -75.57929992675781, -72.73499298095703, -69.89068603515625, -67.04637908935547, -64.20207214355469, -61.357757568359375, -58.51344680786133, -55.66913604736328, -52.824825286865234, -49.98051452636719, -47.13620376586914, -44.291893005371094, -41.44758224487305, -38.603271484375, -35.75896072387695, -32.914649963378906, -30.07033920288086, -27.226028442382812, -24.381717681884766, -21.53740692138672, -18.693096160888672, -15.848785400390625, -13.004474639892578, -10.160163879394531, -7.315853118896484, -4.4715423583984375, -1.6272315979003906, 1.2170791625976562, 4.061389923095703, 6.90570068359375, 9.750011444091797, 12.594322204589844, 15.43863296508789, 18.282943725585938, 21.127254486083984, 23.97156524658203]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 2.0, 9.0, 11.0, 12.0, 13.0, 20.0, 12.0, 16.0, 28.0, 36.0, 27.0, 33.0, 46.0, 40.0, 53.0, 45.0, 35.0, 39.0, 55.0, 51.0, 51.0, 46.0, 48.0, 31.0, 36.0, 32.0, 34.0, 16.0, 18.0, 26.0, 15.0, 15.0, 9.0, 11.0, 8.0, 5.0, 0.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.13239860534668, -20.489225387573242, -19.846052169799805, -19.202880859375, -18.559707641601562, -17.916534423828125, -17.273361206054688, -16.63018798828125, -15.987015724182129, -15.343842506408691, -14.70067024230957, -14.057497024536133, -13.414323806762695, -12.771151542663574, -12.127978324890137, -11.484806060791016, -10.841632843017578, -10.19845962524414, -9.55528736114502, -8.912114143371582, -8.268941879272461, -7.625768661499023, -6.982595443725586, -6.339422702789307, -5.696249961853027, -5.053077220916748, -4.409904479980469, -3.7667312622070312, -3.123558521270752, -2.4803857803344727, -1.8372128009796143, -1.1940398216247559, -0.5508670806884766, 0.09230577945709229, 0.7354786396026611, 1.37865149974823, 2.021824359893799, 2.664997100830078, 3.3081700801849365, 3.951343059539795, 4.594515800476074, 5.2376885414123535, 5.880861282348633, 6.52403450012207, 7.16720724105835, 7.810379981994629, 8.453553199768066, 9.096725463867188, 9.739898681640625, 10.383071899414062, 11.026244163513184, 11.669417381286621, 12.312589645385742, 12.95576286315918, 13.598936080932617, 14.242109298706055, 14.885281562805176, 15.528454780578613, 16.171627044677734, 16.814800262451172, 17.45797348022461, 18.101146697998047, 18.74431800842285, 19.38749122619629, 20.030664443969727]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 10.0, 4.0, 11.0, 16.0, 14.0, 16.0, 22.0, 18.0, 27.0, 28.0, 38.0, 35.0, 46.0, 39.0, 48.0, 58.0, 64.0, 58.0, 56.0, 50.0, 47.0, 45.0, 33.0, 45.0, 32.0, 26.0, 32.0, 15.0, 19.0, 15.0, 11.0, 12.0, 5.0, 3.0, 3.0, 2.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9833984375, -1.9329986572265625, -1.882598876953125, -1.8321990966796875, -1.78179931640625, -1.7313995361328125, -1.680999755859375, -1.6305999755859375, -1.5802001953125, -1.5298004150390625, -1.479400634765625, -1.4290008544921875, -1.37860107421875, -1.3282012939453125, -1.277801513671875, -1.2274017333984375, -1.177001953125, -1.1266021728515625, -1.076202392578125, -1.0258026123046875, -0.97540283203125, -0.9250030517578125, -0.874603271484375, -0.8242034912109375, -0.7738037109375, -0.7234039306640625, -0.673004150390625, -0.6226043701171875, -0.57220458984375, -0.5218048095703125, -0.471405029296875, -0.4210052490234375, -0.37060546875, -0.3202056884765625, -0.269805908203125, -0.2194061279296875, -0.16900634765625, -0.1186065673828125, -0.068206787109375, -0.0178070068359375, 0.0325927734375, 0.0829925537109375, 0.133392333984375, 0.1837921142578125, 0.23419189453125, 0.2845916748046875, 0.334991455078125, 0.3853912353515625, 0.435791015625, 0.4861907958984375, 0.536590576171875, 0.5869903564453125, 0.63739013671875, 0.6877899169921875, 0.738189697265625, 0.7885894775390625, 0.8389892578125, 0.8893890380859375, 0.939788818359375, 0.9901885986328125, 1.04058837890625, 1.0909881591796875, 1.141387939453125, 1.1917877197265625, 1.2421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 0.0, 5.0, 8.0, 8.0, 5.0, 22.0, 25.0, 28.0, 59.0, 116.0, 178.0, 326.0, 668.0, 1151.0, 2248.0, 4448.0, 8958.0, 17844.0, 35124.0, 64971.0, 109892.0, 162367.0, 196122.0, 171154.0, 120044.0, 72318.0, 39257.0, 20371.0, 10309.0, 5048.0, 2627.0, 1306.0, 698.0, 368.0, 193.0, 107.0, 62.0, 42.0, 29.0, 22.0, 10.0, 5.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.533203125, -0.513153076171875, -0.49310302734375, -0.473052978515625, -0.4530029296875, -0.432952880859375, -0.41290283203125, -0.392852783203125, -0.372802734375, -0.352752685546875, -0.33270263671875, -0.312652587890625, -0.2926025390625, -0.272552490234375, -0.25250244140625, -0.232452392578125, -0.21240234375, -0.192352294921875, -0.17230224609375, -0.152252197265625, -0.1322021484375, -0.112152099609375, -0.09210205078125, -0.072052001953125, -0.052001953125, -0.031951904296875, -0.01190185546875, 0.008148193359375, 0.0281982421875, 0.048248291015625, 0.06829833984375, 0.088348388671875, 0.1083984375, 0.128448486328125, 0.14849853515625, 0.168548583984375, 0.1885986328125, 0.208648681640625, 0.22869873046875, 0.248748779296875, 0.268798828125, 0.288848876953125, 0.30889892578125, 0.328948974609375, 0.3489990234375, 0.369049072265625, 0.38909912109375, 0.409149169921875, 0.42919921875, 0.449249267578125, 0.46929931640625, 0.489349365234375, 0.5093994140625, 0.529449462890625, 0.54949951171875, 0.569549560546875, 0.589599609375, 0.609649658203125, 0.62969970703125, 0.649749755859375, 0.6697998046875, 0.689849853515625, 0.70989990234375, 0.729949951171875, 0.75]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 5.0, 4.0, 5.0, 9.0, 5.0, 14.0, 14.0, 10.0, 21.0, 21.0, 26.0, 26.0, 28.0, 34.0, 34.0, 45.0, 32.0, 51.0, 39.0, 53.0, 1072.0, 34.0, 45.0, 37.0, 36.0, 33.0, 42.0, 28.0, 30.0, 19.0, 25.0, 19.0, 20.0, 15.0, 14.0, 20.0, 14.0, 11.0, 5.0, 4.0, 8.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.265625, -1.2303466796875, -1.195068359375, -1.1597900390625, -1.12451171875, -1.0892333984375, -1.053955078125, -1.0186767578125, -0.9833984375, -0.9481201171875, -0.912841796875, -0.8775634765625, -0.84228515625, -0.8070068359375, -0.771728515625, -0.7364501953125, -0.701171875, -0.6658935546875, -0.630615234375, -0.5953369140625, -0.56005859375, -0.5247802734375, -0.489501953125, -0.4542236328125, -0.4189453125, -0.3836669921875, -0.348388671875, -0.3131103515625, -0.27783203125, -0.2425537109375, -0.207275390625, -0.1719970703125, -0.13671875, -0.1014404296875, -0.066162109375, -0.0308837890625, 0.00439453125, 0.0396728515625, 0.074951171875, 0.1102294921875, 0.1455078125, 0.1807861328125, 0.216064453125, 0.2513427734375, 0.28662109375, 0.3218994140625, 0.357177734375, 0.3924560546875, 0.427734375, 0.4630126953125, 0.498291015625, 0.5335693359375, 0.56884765625, 0.6041259765625, 0.639404296875, 0.6746826171875, 0.7099609375, 0.7452392578125, 0.780517578125, 0.8157958984375, 0.85107421875, 0.8863525390625, 0.921630859375, 0.9569091796875, 0.9921875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 15.0, 23.0, 37.0, 39.0, 59.0, 87.0, 115.0, 165.0, 205.0, 305.0, 455.0, 539.0, 880.0, 1199.0, 1717.0, 2383.0, 3252.0, 4466.0, 6341.0, 8935.0, 13004.0, 20869.0, 42505.0, 1838350.0, 73839.0, 26161.0, 15606.0, 10383.0, 7198.0, 5139.0, 3617.0, 2715.0, 1907.0, 1283.0, 965.0, 656.0, 501.0, 358.0, 256.0, 163.0, 115.0, 97.0, 72.0, 36.0, 38.0, 30.0, 17.0, 5.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.7177734375, -0.69512939453125, -0.6724853515625, -0.64984130859375, -0.627197265625, -0.60455322265625, -0.5819091796875, -0.55926513671875, -0.53662109375, -0.51397705078125, -0.4913330078125, -0.46868896484375, -0.446044921875, -0.42340087890625, -0.4007568359375, -0.37811279296875, -0.35546875, -0.33282470703125, -0.3101806640625, -0.28753662109375, -0.264892578125, -0.24224853515625, -0.2196044921875, -0.19696044921875, -0.17431640625, -0.15167236328125, -0.1290283203125, -0.10638427734375, -0.083740234375, -0.06109619140625, -0.0384521484375, -0.01580810546875, 0.0068359375, 0.02947998046875, 0.0521240234375, 0.07476806640625, 0.097412109375, 0.12005615234375, 0.1427001953125, 0.16534423828125, 0.18798828125, 0.21063232421875, 0.2332763671875, 0.25592041015625, 0.278564453125, 0.30120849609375, 0.3238525390625, 0.34649658203125, 0.369140625, 0.39178466796875, 0.4144287109375, 0.43707275390625, 0.459716796875, 0.48236083984375, 0.5050048828125, 0.52764892578125, 0.55029296875, 0.57293701171875, 0.5955810546875, 0.61822509765625, 0.640869140625, 0.66351318359375, 0.6861572265625, 0.70880126953125, 0.7314453125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 7.0, 3.0, 1.0, 12.0, 6.0, 5.0, 8.0, 13.0, 18.0, 16.0, 16.0, 19.0, 25.0, 31.0, 44.0, 44.0, 53.0, 62.0, 84.0, 65.0, 73.0, 75.0, 64.0, 56.0, 43.0, 22.0, 22.0, 16.0, 15.0, 17.0, 12.0, 8.0, 3.0, 6.0, 5.0, 3.0, 5.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.03851318359375, -0.037320613861083984, -0.03612804412841797, -0.03493547439575195, -0.03374290466308594, -0.03255033493041992, -0.031357765197753906, -0.03016519546508789, -0.028972625732421875, -0.02778005599975586, -0.026587486267089844, -0.025394916534423828, -0.024202346801757812, -0.023009777069091797, -0.02181720733642578, -0.020624637603759766, -0.01943206787109375, -0.018239498138427734, -0.01704692840576172, -0.015854358673095703, -0.014661788940429688, -0.013469219207763672, -0.012276649475097656, -0.01108407974243164, -0.009891510009765625, -0.00869894027709961, -0.007506370544433594, -0.006313800811767578, -0.0051212310791015625, -0.003928661346435547, -0.0027360916137695312, -0.0015435218811035156, -0.0003509521484375, 0.0008416175842285156, 0.0020341873168945312, 0.003226757049560547, 0.0044193267822265625, 0.005611896514892578, 0.006804466247558594, 0.00799703598022461, 0.009189605712890625, 0.01038217544555664, 0.011574745178222656, 0.012767314910888672, 0.013959884643554688, 0.015152454376220703, 0.01634502410888672, 0.017537593841552734, 0.01873016357421875, 0.019922733306884766, 0.02111530303955078, 0.022307872772216797, 0.023500442504882812, 0.024693012237548828, 0.025885581970214844, 0.02707815170288086, 0.028270721435546875, 0.02946329116821289, 0.030655860900878906, 0.03184843063354492, 0.03304100036621094, 0.03423357009887695, 0.03542613983154297, 0.036618709564208984, 0.037811279296875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 1.0, 7.0, 9.0, 9.0, 9.0, 10.0, 20.0, 17.0, 28.0, 20.0, 24.0, 38.0, 62.0, 58.0, 55.0, 96.0, 92.0, 170.0, 201.0, 291.0, 478.0, 1883.0, 827912.0, 214411.0, 1082.0, 426.0, 277.0, 204.0, 135.0, 89.0, 63.0, 73.0, 56.0, 44.0, 32.0, 26.0, 22.0, 21.0, 14.0, 10.0, 14.0, 18.0, 15.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.65576171875, -0.6345291137695312, -0.6132965087890625, -0.5920639038085938, -0.570831298828125, -0.5495986938476562, -0.5283660888671875, -0.5071334838867188, -0.48590087890625, -0.46466827392578125, -0.4434356689453125, -0.42220306396484375, -0.400970458984375, -0.37973785400390625, -0.3585052490234375, -0.33727264404296875, -0.3160400390625, -0.29480743408203125, -0.2735748291015625, -0.25234222412109375, -0.231109619140625, -0.20987701416015625, -0.1886444091796875, -0.16741180419921875, -0.14617919921875, -0.12494659423828125, -0.1037139892578125, -0.08248138427734375, -0.061248779296875, -0.04001617431640625, -0.0187835693359375, 0.00244903564453125, 0.023681640625, 0.04491424560546875, 0.0661468505859375, 0.08737945556640625, 0.108612060546875, 0.12984466552734375, 0.1510772705078125, 0.17230987548828125, 0.19354248046875, 0.21477508544921875, 0.2360076904296875, 0.25724029541015625, 0.278472900390625, 0.29970550537109375, 0.3209381103515625, 0.34217071533203125, 0.3634033203125, 0.38463592529296875, 0.4058685302734375, 0.42710113525390625, 0.448333740234375, 0.46956634521484375, 0.4907989501953125, 0.5120315551757812, 0.53326416015625, 0.5544967651367188, 0.5757293701171875, 0.5969619750976562, 0.618194580078125, 0.6394271850585938, 0.6606597900390625, 0.6818923950195312, 0.703125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 38.0, 140.0, 618.0, 162.0, 30.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.078096866607666, -1.0469329357147217, -1.015769124031067, -0.9846051931381226, -0.9534412622451782, -0.9222773909568787, -0.8911135196685791, -0.8599495887756348, -0.8287856578826904, -0.7976217865943909, -0.7664578557014465, -0.735293984413147, -0.7041300535202026, -0.6729661822319031, -0.6418023109436035, -0.6106383800506592, -0.5794745087623596, -0.5483106374740601, -0.5171467065811157, -0.48598283529281616, -0.4548189043998718, -0.42365503311157227, -0.3924911320209503, -0.36132723093032837, -0.3301633298397064, -0.2989994287490845, -0.2678355276584625, -0.23667164146900177, -0.20550774037837982, -0.17434383928775787, -0.14317995309829712, -0.11201605200767517, -0.08085215091705322, -0.04968825355172157, -0.018524356186389923, 0.012639537453651428, 0.043803438544273376, 0.07496733963489532, 0.10613122582435608, 0.13729512691497803, 0.16845902800559998, 0.19962292909622192, 0.23078683018684387, 0.2619507312774658, 0.2931146025657654, 0.3242785334587097, 0.3554424047470093, 0.3866063058376312, 0.4177702069282532, 0.4489341080188751, 0.48009800910949707, 0.5112618803977966, 0.542425811290741, 0.5735896825790405, 0.6047536134719849, 0.6359174847602844, 0.667081356048584, 0.6982452273368835, 0.7294091582298279, 0.7605730295181274, 0.7917369604110718, 0.8229008316993713, 0.8540647029876709, 0.8852286338806152, 0.9163925647735596]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 8.0, 17.0, 18.0, 21.0, 32.0, 32.0, 46.0, 63.0, 59.0, 71.0, 73.0, 94.0, 80.0, 81.0, 69.0, 55.0, 50.0, 53.0, 24.0, 15.0, 26.0, 10.0, 9.0, 2.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2161928415298462, -0.20954003930091858, -0.20288723707199097, -0.19623443484306335, -0.18958163261413574, -0.18292883038520813, -0.17627601325511932, -0.1696232110261917, -0.1629704087972641, -0.1563176065683365, -0.14966480433940887, -0.14301200211048126, -0.13635918498039246, -0.12970638275146484, -0.12305358052253723, -0.11640077829360962, -0.109747976064682, -0.1030951738357544, -0.09644237160682678, -0.08978956192731857, -0.08313675969839096, -0.07648395746946335, -0.06983114778995514, -0.06317834556102753, -0.056525543332099915, -0.0498727411031723, -0.04321993514895439, -0.03656712919473648, -0.02991432696580887, -0.023261524736881256, -0.016608718782663345, -0.009955912828445435, -0.0033031105995178223, 0.0033496934920549393, 0.0100024975836277, 0.016655301675200462, 0.023308105766773224, 0.029960907995700836, 0.03661371394991875, 0.04326651990413666, 0.04991932213306427, 0.05657212436199188, 0.0632249265909195, 0.0698777362704277, 0.07653053849935532, 0.08318334072828293, 0.08983615040779114, 0.09648895263671875, 0.10314175486564636, 0.10979455709457397, 0.11644735932350159, 0.1231001690030098, 0.1297529637813568, 0.13640576601028442, 0.14305858314037323, 0.14971138536930084, 0.15636418759822845, 0.16301698982715607, 0.16966979205608368, 0.1763225942850113, 0.1829754114151001, 0.1896282136440277, 0.19628101587295532, 0.20293381810188293, 0.20958662033081055]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 9.0, 6.0, 4.0, 10.0, 20.0, 16.0, 19.0, 25.0, 30.0, 34.0, 41.0, 32.0, 58.0, 51.0, 53.0, 60.0, 52.0, 53.0, 47.0, 55.0, 50.0, 42.0, 49.0, 33.0, 23.0, 21.0, 18.0, 23.0, 14.0, 18.0, 14.0, 7.0, 3.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.7686614990234375, -1.717987060546875, -1.6673126220703125, -1.61663818359375, -1.5659637451171875, -1.515289306640625, -1.4646148681640625, -1.4139404296875, -1.3632659912109375, -1.312591552734375, -1.2619171142578125, -1.21124267578125, -1.1605682373046875, -1.109893798828125, -1.0592193603515625, -1.008544921875, -0.9578704833984375, -0.907196044921875, -0.8565216064453125, -0.80584716796875, -0.7551727294921875, -0.704498291015625, -0.6538238525390625, -0.6031494140625, -0.5524749755859375, -0.501800537109375, -0.4511260986328125, -0.40045166015625, -0.3497772216796875, -0.299102783203125, -0.2484283447265625, -0.19775390625, -0.1470794677734375, -0.096405029296875, -0.0457305908203125, 0.00494384765625, 0.0556182861328125, 0.106292724609375, 0.1569671630859375, 0.2076416015625, 0.2583160400390625, 0.308990478515625, 0.3596649169921875, 0.41033935546875, 0.4610137939453125, 0.511688232421875, 0.5623626708984375, 0.613037109375, 0.6637115478515625, 0.714385986328125, 0.7650604248046875, 0.81573486328125, 0.8664093017578125, 0.917083740234375, 0.9677581787109375, 1.0184326171875, 1.0691070556640625, 1.119781494140625, 1.1704559326171875, 1.22113037109375, 1.2718048095703125, 1.322479248046875, 1.3731536865234375, 1.423828125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 12.0, 14.0, 26.0, 56.0, 76.0, 97.0, 154.0, 235.0, 387.0, 615.0, 940.0, 1664.0, 2994.0, 6128.0, 14001.0, 37013.0, 112340.0, 321122.0, 350635.0, 128177.0, 41915.0, 15506.0, 6640.0, 3275.0, 1750.0, 1041.0, 614.0, 374.0, 274.0, 152.0, 111.0, 66.0, 39.0, 40.0, 26.0, 16.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.82421875, -3.704925537109375, -3.58563232421875, -3.466339111328125, -3.3470458984375, -3.227752685546875, -3.10845947265625, -2.989166259765625, -2.869873046875, -2.750579833984375, -2.63128662109375, -2.511993408203125, -2.3927001953125, -2.273406982421875, -2.15411376953125, -2.034820556640625, -1.91552734375, -1.796234130859375, -1.67694091796875, -1.557647705078125, -1.4383544921875, -1.319061279296875, -1.19976806640625, -1.080474853515625, -0.961181640625, -0.841888427734375, -0.72259521484375, -0.603302001953125, -0.4840087890625, -0.364715576171875, -0.24542236328125, -0.126129150390625, -0.0068359375, 0.112457275390625, 0.23175048828125, 0.351043701171875, 0.4703369140625, 0.589630126953125, 0.70892333984375, 0.828216552734375, 0.947509765625, 1.066802978515625, 1.18609619140625, 1.305389404296875, 1.4246826171875, 1.543975830078125, 1.66326904296875, 1.782562255859375, 1.90185546875, 2.021148681640625, 2.14044189453125, 2.259735107421875, 2.3790283203125, 2.498321533203125, 2.61761474609375, 2.736907958984375, 2.856201171875, 2.975494384765625, 3.09478759765625, 3.214080810546875, 3.3333740234375, 3.452667236328125, 3.57196044921875, 3.691253662109375, 3.810546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 7.0, 3.0, 7.0, 13.0, 11.0, 11.0, 12.0, 19.0, 18.0, 27.0, 27.0, 33.0, 36.0, 38.0, 42.0, 53.0, 87.0, 122.0, 214.0, 1352.0, 285.0, 144.0, 80.0, 54.0, 44.0, 42.0, 39.0, 42.0, 26.0, 25.0, 19.0, 22.0, 23.0, 10.0, 16.0, 14.0, 8.0, 10.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.10650634765625, -3.9630126953125, -3.81951904296875, -3.676025390625, -3.53253173828125, -3.3890380859375, -3.24554443359375, -3.10205078125, -2.95855712890625, -2.8150634765625, -2.67156982421875, -2.528076171875, -2.38458251953125, -2.2410888671875, -2.09759521484375, -1.9541015625, -1.81060791015625, -1.6671142578125, -1.52362060546875, -1.380126953125, -1.23663330078125, -1.0931396484375, -0.94964599609375, -0.80615234375, -0.66265869140625, -0.5191650390625, -0.37567138671875, -0.232177734375, -0.08868408203125, 0.0548095703125, 0.19830322265625, 0.341796875, 0.48529052734375, 0.6287841796875, 0.77227783203125, 0.915771484375, 1.05926513671875, 1.2027587890625, 1.34625244140625, 1.48974609375, 1.63323974609375, 1.7767333984375, 1.92022705078125, 2.063720703125, 2.20721435546875, 2.3507080078125, 2.49420166015625, 2.6376953125, 2.78118896484375, 2.9246826171875, 3.06817626953125, 3.211669921875, 3.35516357421875, 3.4986572265625, 3.64215087890625, 3.78564453125, 3.92913818359375, 4.0726318359375, 4.21612548828125, 4.359619140625, 4.50311279296875, 4.6466064453125, 4.79010009765625, 4.93359375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 6.0, 9.0, 6.0, 10.0, 10.0, 11.0, 15.0, 26.0, 14.0, 33.0, 34.0, 34.0, 29.0, 57.0, 87.0, 164.0, 485.0, 3707.0, 1625574.0, 1510831.0, 3493.0, 527.0, 167.0, 92.0, 52.0, 42.0, 37.0, 23.0, 25.0, 24.0, 18.0, 9.0, 13.0, 6.0, 10.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.4375, -18.86572265625, -18.2939453125, -17.72216796875, -17.150390625, -16.57861328125, -16.0068359375, -15.43505859375, -14.86328125, -14.29150390625, -13.7197265625, -13.14794921875, -12.576171875, -12.00439453125, -11.4326171875, -10.86083984375, -10.2890625, -9.71728515625, -9.1455078125, -8.57373046875, -8.001953125, -7.43017578125, -6.8583984375, -6.28662109375, -5.71484375, -5.14306640625, -4.5712890625, -3.99951171875, -3.427734375, -2.85595703125, -2.2841796875, -1.71240234375, -1.140625, -0.56884765625, 0.0029296875, 0.57470703125, 1.146484375, 1.71826171875, 2.2900390625, 2.86181640625, 3.43359375, 4.00537109375, 4.5771484375, 5.14892578125, 5.720703125, 6.29248046875, 6.8642578125, 7.43603515625, 8.0078125, 8.57958984375, 9.1513671875, 9.72314453125, 10.294921875, 10.86669921875, 11.4384765625, 12.01025390625, 12.58203125, 13.15380859375, 13.7255859375, 14.29736328125, 14.869140625, 15.44091796875, 16.0126953125, 16.58447265625, 17.15625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 26.0, 274.0, 549.0, 149.0, 14.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.7537899017334, -19.397438049316406, -18.041088104248047, -16.684736251831055, -15.328385353088379, -13.972034454345703, -12.615682601928711, -11.259331703186035, -9.90298080444336, -8.546629905700684, -7.19027853012085, -5.833927154541016, -4.47757625579834, -3.121225357055664, -1.7648735046386719, -0.4085226058959961, 0.9478282928466797, 2.3041794300079346, 3.6605305671691895, 5.016881942749023, 6.373232841491699, 7.729583740234375, 9.085935592651367, 10.442286491394043, 11.798637390136719, 13.154988288879395, 14.51133918762207, 15.867691040039062, 17.224040985107422, 18.580392837524414, 19.936744689941406, 21.293094635009766, 22.649444580078125, 24.005796432495117, 25.362146377563477, 26.71849822998047, 28.074848175048828, 29.43120002746582, 30.787551879882812, 32.14390182495117, 33.50025177001953, 34.85660171508789, 36.212955474853516, 37.569305419921875, 38.925655364990234, 40.282005310058594, 41.63835906982422, 42.99470901489258, 44.3510627746582, 45.70741271972656, 47.06376647949219, 48.42011642456055, 49.776466369628906, 51.13282012939453, 52.48917007446289, 53.84552001953125, 55.201873779296875, 56.558223724365234, 57.91457748413086, 59.27092742919922, 60.62727737426758, 61.98362731933594, 63.33998107910156, 64.69633483886719, 66.05268096923828]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 3.0, 5.0, 8.0, 8.0, 9.0, 15.0, 15.0, 13.0, 32.0, 22.0, 28.0, 28.0, 37.0, 29.0, 33.0, 35.0, 47.0, 54.0, 41.0, 40.0, 55.0, 44.0, 46.0, 43.0, 49.0, 42.0, 36.0, 27.0, 18.0, 27.0, 15.0, 26.0, 21.0, 17.0, 10.0, 7.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.851982116699219, -14.342965126037598, -13.833948135375977, -13.324932098388672, -12.81591510772705, -12.30689811706543, -11.797882080078125, -11.288865089416504, -10.779848098754883, -10.270831108093262, -9.76181411743164, -9.252798080444336, -8.743781089782715, -8.234764099121094, -7.725747585296631, -7.216731071472168, -6.707714080810547, -6.198697090148926, -5.689680576324463, -5.1806640625, -4.671647071838379, -4.162630081176758, -3.653613567352295, -3.144596815109253, -2.635580062866211, -2.126563310623169, -1.617546558380127, -1.108529806137085, -0.599513053894043, -0.09049630165100098, 0.418520450592041, 0.927537202835083, 1.4365558624267578, 1.9455726146697998, 2.454589366912842, 2.963606119155884, 3.472622871398926, 3.9816396236419678, 4.49065637588501, 4.999672889709473, 5.508689880371094, 6.017706871032715, 6.526723384857178, 7.035739898681641, 7.544756889343262, 8.053773880004883, 8.562789916992188, 9.071806907653809, 9.58082389831543, 10.08984088897705, 10.598857879638672, 11.107873916625977, 11.616890907287598, 12.125907897949219, 12.634923934936523, 13.143940925598145, 13.652957916259766, 14.161974906921387, 14.670991897583008, 15.180007934570312, 15.689024925231934, 16.198041915893555, 16.70705795288086, 17.216075897216797, 17.7250919342041]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 11.0, 8.0, 11.0, 8.0, 20.0, 16.0, 22.0, 20.0, 42.0, 34.0, 41.0, 36.0, 35.0, 53.0, 44.0, 47.0, 46.0, 62.0, 42.0, 49.0, 37.0, 36.0, 40.0, 31.0, 22.0, 35.0, 29.0, 23.0, 18.0, 20.0, 10.0, 13.0, 9.0, 5.0, 6.0, 7.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.646484375, -1.59808349609375, -1.5496826171875, -1.50128173828125, -1.452880859375, -1.40447998046875, -1.3560791015625, -1.30767822265625, -1.25927734375, -1.21087646484375, -1.1624755859375, -1.11407470703125, -1.065673828125, -1.01727294921875, -0.9688720703125, -0.92047119140625, -0.8720703125, -0.82366943359375, -0.7752685546875, -0.72686767578125, -0.678466796875, -0.63006591796875, -0.5816650390625, -0.53326416015625, -0.48486328125, -0.43646240234375, -0.3880615234375, -0.33966064453125, -0.291259765625, -0.24285888671875, -0.1944580078125, -0.14605712890625, -0.09765625, -0.04925537109375, -0.0008544921875, 0.04754638671875, 0.095947265625, 0.14434814453125, 0.1927490234375, 0.24114990234375, 0.28955078125, 0.33795166015625, 0.3863525390625, 0.43475341796875, 0.483154296875, 0.53155517578125, 0.5799560546875, 0.62835693359375, 0.6767578125, 0.72515869140625, 0.7735595703125, 0.82196044921875, 0.870361328125, 0.91876220703125, 0.9671630859375, 1.01556396484375, 1.06396484375, 1.11236572265625, 1.1607666015625, 1.20916748046875, 1.257568359375, 1.30596923828125, 1.3543701171875, 1.40277099609375, 1.451171875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 4.0, 10.0, 9.0, 22.0, 19.0, 30.0, 44.0, 56.0, 103.0, 133.0, 209.0, 425.0, 922.0, 3035.0, 17513.0, 223707.0, 3348960.0, 562024.0, 30831.0, 3977.0, 1063.0, 456.0, 248.0, 146.0, 99.0, 82.0, 44.0, 23.0, 29.0, 22.0, 17.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.75, -8.4898681640625, -8.229736328125, -7.9696044921875, -7.70947265625, -7.4493408203125, -7.189208984375, -6.9290771484375, -6.6689453125, -6.4088134765625, -6.148681640625, -5.8885498046875, -5.62841796875, -5.3682861328125, -5.108154296875, -4.8480224609375, -4.587890625, -4.3277587890625, -4.067626953125, -3.8074951171875, -3.54736328125, -3.2872314453125, -3.027099609375, -2.7669677734375, -2.5068359375, -2.2467041015625, -1.986572265625, -1.7264404296875, -1.46630859375, -1.2061767578125, -0.946044921875, -0.6859130859375, -0.42578125, -0.1656494140625, 0.094482421875, 0.3546142578125, 0.61474609375, 0.8748779296875, 1.135009765625, 1.3951416015625, 1.6552734375, 1.9154052734375, 2.175537109375, 2.4356689453125, 2.69580078125, 2.9559326171875, 3.216064453125, 3.4761962890625, 3.736328125, 3.9964599609375, 4.256591796875, 4.5167236328125, 4.77685546875, 5.0369873046875, 5.297119140625, 5.5572509765625, 5.8173828125, 6.0775146484375, 6.337646484375, 6.5977783203125, 6.85791015625, 7.1180419921875, 7.378173828125, 7.6383056640625, 7.8984375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 9.0, 21.0, 48.0, 99.0, 205.0, 387.0, 753.0, 1023.0, 738.0, 431.0, 175.0, 97.0, 45.0, 24.0, 8.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.2041015625, -9.869140625, -9.5341796875, -9.19921875, -8.8642578125, -8.529296875, -8.1943359375, -7.859375, -7.5244140625, -7.189453125, -6.8544921875, -6.51953125, -6.1845703125, -5.849609375, -5.5146484375, -5.1796875, -4.8447265625, -4.509765625, -4.1748046875, -3.83984375, -3.5048828125, -3.169921875, -2.8349609375, -2.5, -2.1650390625, -1.830078125, -1.4951171875, -1.16015625, -0.8251953125, -0.490234375, -0.1552734375, 0.1796875, 0.5146484375, 0.849609375, 1.1845703125, 1.51953125, 1.8544921875, 2.189453125, 2.5244140625, 2.859375, 3.1943359375, 3.529296875, 3.8642578125, 4.19921875, 4.5341796875, 4.869140625, 5.2041015625, 5.5390625, 5.8740234375, 6.208984375, 6.5439453125, 6.87890625, 7.2138671875, 7.548828125, 7.8837890625, 8.21875, 8.5537109375, 8.888671875, 9.2236328125, 9.55859375, 9.8935546875, 10.228515625, 10.5634765625, 10.8984375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 17.0, 38.0, 91.0, 195.0, 467.0, 1331.0, 7003.0, 207172.0, 3700790.0, 266905.0, 7989.0, 1393.0, 475.0, 205.0, 106.0, 46.0, 31.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.515625, -18.950439453125, -18.38525390625, -17.820068359375, -17.2548828125, -16.689697265625, -16.12451171875, -15.559326171875, -14.994140625, -14.428955078125, -13.86376953125, -13.298583984375, -12.7333984375, -12.168212890625, -11.60302734375, -11.037841796875, -10.47265625, -9.907470703125, -9.34228515625, -8.777099609375, -8.2119140625, -7.646728515625, -7.08154296875, -6.516357421875, -5.951171875, -5.385986328125, -4.82080078125, -4.255615234375, -3.6904296875, -3.125244140625, -2.56005859375, -1.994873046875, -1.4296875, -0.864501953125, -0.29931640625, 0.265869140625, 0.8310546875, 1.396240234375, 1.96142578125, 2.526611328125, 3.091796875, 3.656982421875, 4.22216796875, 4.787353515625, 5.3525390625, 5.917724609375, 6.48291015625, 7.048095703125, 7.61328125, 8.178466796875, 8.74365234375, 9.308837890625, 9.8740234375, 10.439208984375, 11.00439453125, 11.569580078125, 12.134765625, 12.699951171875, 13.26513671875, 13.830322265625, 14.3955078125, 14.960693359375, 15.52587890625, 16.091064453125, 16.65625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 9.0, 130.0, 509.0, 331.0, 31.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.97829818725586, -54.709991455078125, -51.44168472290039, -48.173377990722656, -44.905067443847656, -41.63676452636719, -38.36845397949219, -35.10014724731445, -31.83184051513672, -28.563533782958984, -25.29522705078125, -22.026918411254883, -18.75861167907715, -15.490304946899414, -12.221996307373047, -8.953689575195312, -5.685382843017578, -2.4170756340026855, 0.851231575012207, 4.119539260864258, 7.387845993041992, 10.656152725219727, 13.924461364746094, 17.192768096923828, 20.461074829101562, 23.729381561279297, 26.99768829345703, 30.2659969329834, 33.5343017578125, 36.8026123046875, 40.070919036865234, 43.33922576904297, 46.60752868652344, 49.87583541870117, 53.144142150878906, 56.412452697753906, 59.680755615234375, 62.949066162109375, 66.21737670898438, 69.48567962646484, 72.75398254394531, 76.02229309082031, 79.29059600830078, 82.55890655517578, 85.82720947265625, 89.09552001953125, 92.36383056640625, 95.63213348388672, 98.90044403076172, 102.16875457763672, 105.43705749511719, 108.70536804199219, 111.97367095947266, 115.24198150634766, 118.51028442382812, 121.77859497070312, 125.04690551757812, 128.31521606445312, 131.58352661132812, 134.85182189941406, 138.12013244628906, 141.38844299316406, 144.65675354003906, 147.925048828125, 151.193359375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 8.0, 9.0, 9.0, 15.0, 12.0, 23.0, 21.0, 22.0, 26.0, 22.0, 27.0, 35.0, 34.0, 38.0, 33.0, 47.0, 46.0, 46.0, 45.0, 43.0, 44.0, 36.0, 25.0, 38.0, 33.0, 32.0, 25.0, 25.0, 30.0, 16.0, 18.0, 24.0, 14.0, 23.0, 9.0, 3.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.619977951049805, -18.075531005859375, -17.531085968017578, -16.98664093017578, -16.44219398498535, -15.897747993469238, -15.353302001953125, -14.808856010437012, -14.264410018920898, -13.719964027404785, -13.175518035888672, -12.631072044372559, -12.086626052856445, -11.542180061340332, -10.997734069824219, -10.453288078308105, -9.908842086791992, -9.364396095275879, -8.819950103759766, -8.275504112243652, -7.731058120727539, -7.186612129211426, -6.6421661376953125, -6.097720146179199, -5.553274154663086, -5.008828163146973, -4.464382171630859, -3.919936180114746, -3.375490188598633, -2.8310441970825195, -2.2865982055664062, -1.742152214050293, -1.1977062225341797, -0.6532602310180664, -0.10881423950195312, 0.43563175201416016, 0.9800777435302734, 1.5245237350463867, 2.0689697265625, 2.6134157180786133, 3.1578617095947266, 3.70230770111084, 4.246753692626953, 4.791199684143066, 5.33564567565918, 5.880091667175293, 6.424537658691406, 6.9689836502075195, 7.513429641723633, 8.057875633239746, 8.60232162475586, 9.146767616271973, 9.691213607788086, 10.2356595993042, 10.780105590820312, 11.324551582336426, 11.868997573852539, 12.413443565368652, 12.957889556884766, 13.502335548400879, 14.046781539916992, 14.591227531433105, 15.135673522949219, 15.680119514465332, 16.224565505981445]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 14.0, 14.0, 13.0, 28.0, 26.0, 37.0, 33.0, 35.0, 43.0, 45.0, 61.0, 55.0, 54.0, 64.0, 52.0, 49.0, 49.0, 36.0, 31.0, 40.0, 44.0, 30.0, 20.0, 26.0, 18.0, 5.0, 18.0, 7.0, 10.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8046875, -1.7506561279296875, -1.696624755859375, -1.6425933837890625, -1.58856201171875, -1.5345306396484375, -1.480499267578125, -1.4264678955078125, -1.3724365234375, -1.3184051513671875, -1.264373779296875, -1.2103424072265625, -1.15631103515625, -1.1022796630859375, -1.048248291015625, -0.9942169189453125, -0.940185546875, -0.8861541748046875, -0.832122802734375, -0.7780914306640625, -0.72406005859375, -0.6700286865234375, -0.615997314453125, -0.5619659423828125, -0.5079345703125, -0.4539031982421875, -0.399871826171875, -0.3458404541015625, -0.29180908203125, -0.2377777099609375, -0.183746337890625, -0.1297149658203125, -0.07568359375, -0.0216522216796875, 0.032379150390625, 0.0864105224609375, 0.14044189453125, 0.1944732666015625, 0.248504638671875, 0.3025360107421875, 0.3565673828125, 0.4105987548828125, 0.464630126953125, 0.5186614990234375, 0.57269287109375, 0.6267242431640625, 0.680755615234375, 0.7347869873046875, 0.788818359375, 0.8428497314453125, 0.896881103515625, 0.9509124755859375, 1.00494384765625, 1.0589752197265625, 1.113006591796875, 1.1670379638671875, 1.2210693359375, 1.2751007080078125, 1.329132080078125, 1.3831634521484375, 1.43719482421875, 1.4912261962890625, 1.545257568359375, 1.5992889404296875, 1.6533203125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 14.0, 12.0, 23.0, 27.0, 37.0, 48.0, 91.0, 143.0, 255.0, 438.0, 815.0, 1539.0, 3029.0, 5823.0, 11229.0, 21138.0, 40078.0, 71530.0, 117768.0, 166548.0, 190576.0, 161182.0, 111010.0, 66578.0, 37249.0, 19747.0, 10268.0, 5490.0, 2686.0, 1447.0, 756.0, 391.0, 227.0, 151.0, 80.0, 43.0, 25.0, 17.0, 22.0, 10.0, 5.0, 3.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.6875, -0.6663055419921875, -0.645111083984375, -0.6239166259765625, -0.60272216796875, -0.5815277099609375, -0.560333251953125, -0.5391387939453125, -0.5179443359375, -0.4967498779296875, -0.475555419921875, -0.4543609619140625, -0.43316650390625, -0.4119720458984375, -0.390777587890625, -0.3695831298828125, -0.348388671875, -0.3271942138671875, -0.305999755859375, -0.2848052978515625, -0.26361083984375, -0.2424163818359375, -0.221221923828125, -0.2000274658203125, -0.1788330078125, -0.1576385498046875, -0.136444091796875, -0.1152496337890625, -0.09405517578125, -0.0728607177734375, -0.051666259765625, -0.0304718017578125, -0.00927734375, 0.0119171142578125, 0.033111572265625, 0.0543060302734375, 0.07550048828125, 0.0966949462890625, 0.117889404296875, 0.1390838623046875, 0.1602783203125, 0.1814727783203125, 0.202667236328125, 0.2238616943359375, 0.24505615234375, 0.2662506103515625, 0.287445068359375, 0.3086395263671875, 0.329833984375, 0.3510284423828125, 0.372222900390625, 0.3934173583984375, 0.41461181640625, 0.4358062744140625, 0.457000732421875, 0.4781951904296875, 0.4993896484375, 0.5205841064453125, 0.541778564453125, 0.5629730224609375, 0.58416748046875, 0.6053619384765625, 0.626556396484375, 0.6477508544921875, 0.6689453125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 6.0, 9.0, 14.0, 7.0, 9.0, 7.0, 17.0, 21.0, 21.0, 25.0, 28.0, 20.0, 27.0, 32.0, 33.0, 50.0, 48.0, 34.0, 46.0, 46.0, 1057.0, 40.0, 42.0, 39.0, 35.0, 33.0, 29.0, 21.0, 36.0, 20.0, 21.0, 25.0, 19.0, 14.0, 17.0, 11.0, 10.0, 14.0, 10.0, 3.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9794769287109375, -0.946258544921875, -0.9130401611328125, -0.87982177734375, -0.8466033935546875, -0.813385009765625, -0.7801666259765625, -0.7469482421875, -0.7137298583984375, -0.680511474609375, -0.6472930908203125, -0.61407470703125, -0.5808563232421875, -0.547637939453125, -0.5144195556640625, -0.481201171875, -0.4479827880859375, -0.414764404296875, -0.3815460205078125, -0.34832763671875, -0.3151092529296875, -0.281890869140625, -0.2486724853515625, -0.2154541015625, -0.1822357177734375, -0.149017333984375, -0.1157989501953125, -0.08258056640625, -0.0493621826171875, -0.016143798828125, 0.0170745849609375, 0.05029296875, 0.0835113525390625, 0.116729736328125, 0.1499481201171875, 0.18316650390625, 0.2163848876953125, 0.249603271484375, 0.2828216552734375, 0.3160400390625, 0.3492584228515625, 0.382476806640625, 0.4156951904296875, 0.44891357421875, 0.4821319580078125, 0.515350341796875, 0.5485687255859375, 0.581787109375, 0.6150054931640625, 0.648223876953125, 0.6814422607421875, 0.71466064453125, 0.7478790283203125, 0.781097412109375, 0.8143157958984375, 0.8475341796875, 0.8807525634765625, 0.913970947265625, 0.9471893310546875, 0.98040771484375, 1.0136260986328125, 1.046844482421875, 1.0800628662109375, 1.11328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 7.0, 5.0, 26.0, 23.0, 52.0, 49.0, 90.0, 137.0, 249.0, 327.0, 537.0, 754.0, 1101.0, 1577.0, 2487.0, 3810.0, 5660.0, 8391.0, 13186.0, 21197.0, 41606.0, 1881107.0, 50609.0, 23239.0, 13957.0, 8837.0, 5883.0, 4071.0, 2750.0, 1734.0, 1241.0, 751.0, 568.0, 361.0, 239.0, 172.0, 96.0, 75.0, 63.0, 40.0, 21.0, 10.0, 15.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.91357421875, -0.8846511840820312, -0.8557281494140625, -0.8268051147460938, -0.797882080078125, -0.7689590454101562, -0.7400360107421875, -0.7111129760742188, -0.68218994140625, -0.6532669067382812, -0.6243438720703125, -0.5954208374023438, -0.566497802734375, -0.5375747680664062, -0.5086517333984375, -0.47972869873046875, -0.4508056640625, -0.42188262939453125, -0.3929595947265625, -0.36403656005859375, -0.335113525390625, -0.30619049072265625, -0.2772674560546875, -0.24834442138671875, -0.21942138671875, -0.19049835205078125, -0.1615753173828125, -0.13265228271484375, -0.103729248046875, -0.07480621337890625, -0.0458831787109375, -0.01696014404296875, 0.011962890625, 0.04088592529296875, 0.0698089599609375, 0.09873199462890625, 0.127655029296875, 0.15657806396484375, 0.1855010986328125, 0.21442413330078125, 0.24334716796875, 0.27227020263671875, 0.3011932373046875, 0.33011627197265625, 0.359039306640625, 0.38796234130859375, 0.4168853759765625, 0.44580841064453125, 0.4747314453125, 0.5036544799804688, 0.5325775146484375, 0.5615005493164062, 0.590423583984375, 0.6193466186523438, 0.6482696533203125, 0.6771926879882812, 0.70611572265625, 0.7350387573242188, 0.7639617919921875, 0.7928848266601562, 0.821807861328125, 0.8507308959960938, 0.8796539306640625, 0.9085769653320312, 0.9375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 6.0, 7.0, 5.0, 3.0, 4.0, 5.0, 7.0, 13.0, 11.0, 14.0, 14.0, 13.0, 28.0, 31.0, 28.0, 28.0, 44.0, 34.0, 53.0, 48.0, 53.0, 55.0, 56.0, 66.0, 49.0, 45.0, 37.0, 44.0, 34.0, 36.0, 15.0, 23.0, 17.0, 18.0, 19.0, 7.0, 8.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01531219482421875, -0.014769434928894043, -0.014226675033569336, -0.013683915138244629, -0.013141155242919922, -0.012598395347595215, -0.012055635452270508, -0.0115128755569458, -0.010970115661621094, -0.010427355766296387, -0.00988459587097168, -0.009341835975646973, -0.008799076080322266, -0.008256316184997559, -0.0077135562896728516, -0.0071707963943481445, -0.0066280364990234375, -0.0060852766036987305, -0.0055425167083740234, -0.004999756813049316, -0.004456996917724609, -0.003914237022399902, -0.0033714771270751953, -0.0028287172317504883, -0.0022859573364257812, -0.0017431974411010742, -0.0012004375457763672, -0.0006576776504516602, -0.00011491775512695312, 0.0004278421401977539, 0.0009706020355224609, 0.001513361930847168, 0.002056121826171875, 0.002598881721496582, 0.003141641616821289, 0.003684401512145996, 0.004227161407470703, 0.00476992130279541, 0.005312681198120117, 0.005855441093444824, 0.006398200988769531, 0.006940960884094238, 0.007483720779418945, 0.008026480674743652, 0.00856924057006836, 0.009112000465393066, 0.009654760360717773, 0.01019752025604248, 0.010740280151367188, 0.011283040046691895, 0.011825799942016602, 0.012368559837341309, 0.012911319732666016, 0.013454079627990723, 0.01399683952331543, 0.014539599418640137, 0.015082359313964844, 0.01562511920928955, 0.016167879104614258, 0.016710638999938965, 0.017253398895263672, 0.01779615879058838, 0.018338918685913086, 0.018881678581237793, 0.0194244384765625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 8.0, 5.0, 18.0, 9.0, 18.0, 26.0, 21.0, 32.0, 40.0, 40.0, 64.0, 91.0, 108.0, 122.0, 171.0, 207.0, 362.0, 1566.0, 43293.0, 878619.0, 119028.0, 3220.0, 434.0, 259.0, 191.0, 108.0, 102.0, 84.0, 68.0, 45.0, 44.0, 32.0, 31.0, 24.0, 18.0, 12.0, 9.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.291259765625, -0.2810859680175781, -0.27091217041015625, -0.2607383728027344, -0.2505645751953125, -0.24039077758789062, -0.23021697998046875, -0.22004318237304688, -0.209869384765625, -0.19969558715820312, -0.18952178955078125, -0.17934799194335938, -0.1691741943359375, -0.15900039672851562, -0.14882659912109375, -0.13865280151367188, -0.12847900390625, -0.11830520629882812, -0.10813140869140625, -0.09795761108398438, -0.0877838134765625, -0.07761001586914062, -0.06743621826171875, -0.057262420654296875, -0.047088623046875, -0.036914825439453125, -0.02674102783203125, -0.016567230224609375, -0.0063934326171875, 0.003780364990234375, 0.01395416259765625, 0.024127960205078125, 0.0343017578125, 0.044475555419921875, 0.05464935302734375, 0.06482315063476562, 0.0749969482421875, 0.08517074584960938, 0.09534454345703125, 0.10551834106445312, 0.115692138671875, 0.12586593627929688, 0.13603973388671875, 0.14621353149414062, 0.1563873291015625, 0.16656112670898438, 0.17673492431640625, 0.18690872192382812, 0.19708251953125, 0.20725631713867188, 0.21743011474609375, 0.22760391235351562, 0.2377777099609375, 0.24795150756835938, 0.25812530517578125, 0.2682991027832031, 0.278472900390625, 0.2886466979980469, 0.29882049560546875, 0.3089942932128906, 0.3191680908203125, 0.3293418884277344, 0.33951568603515625, 0.3496894836425781, 0.35986328125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 14.0, 12.0, 27.0, 74.0, 154.0, 448.0, 189.0, 56.0, 22.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22154544293880463, -0.2088887244462967, -0.19623200595378876, -0.18357528746128082, -0.1709185689687729, -0.15826185047626495, -0.14560513198375702, -0.13294841349124908, -0.12029169499874115, -0.10763497650623322, -0.09497825801372528, -0.08232153952121735, -0.06966482102870941, -0.05700810253620148, -0.04435138404369354, -0.03169466555118561, -0.019037947058677673, -0.006381228566169739, 0.006275489926338196, 0.01893220841884613, 0.031588926911354065, 0.044245645403862, 0.056902363896369934, 0.06955908238887787, 0.0822158008813858, 0.09487251937389374, 0.10752923786640167, 0.1201859563589096, 0.13284267485141754, 0.14549939334392548, 0.1581561118364334, 0.17081283032894135, 0.18346953392028809, 0.19612625241279602, 0.20878297090530396, 0.2214396893978119, 0.23409640789031982, 0.24675312638282776, 0.2594098448753357, 0.27206656336784363, 0.28472328186035156, 0.2973800003528595, 0.31003671884536743, 0.32269343733787537, 0.3353501558303833, 0.34800687432289124, 0.36066359281539917, 0.3733203113079071, 0.38597702980041504, 0.398633748292923, 0.4112904667854309, 0.42394718527793884, 0.4366039037704468, 0.4492606222629547, 0.46191734075546265, 0.4745740592479706, 0.4872307777404785, 0.49988749623298645, 0.5125442147254944, 0.5252009630203247, 0.5378576517105103, 0.5505143404006958, 0.5631710886955261, 0.5758278369903564, 0.588484525680542]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 7.0, 11.0, 15.0, 23.0, 18.0, 24.0, 26.0, 33.0, 33.0, 36.0, 43.0, 43.0, 54.0, 52.0, 57.0, 50.0, 53.0, 52.0, 44.0, 58.0, 39.0, 30.0, 35.0, 31.0, 25.0, 16.0, 15.0, 13.0, 15.0, 9.0, 10.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07489395141601562, -0.07259912043809891, -0.07030428946018219, -0.06800945103168488, -0.06571462005376816, -0.06341978907585144, -0.061124954372644424, -0.05883011966943741, -0.05653528869152069, -0.05424045771360397, -0.05194562301039696, -0.04965078830718994, -0.047355957329273224, -0.045061126351356506, -0.04276629164814949, -0.040471456944942474, -0.03817662596702576, -0.03588179498910904, -0.03358696028590202, -0.03129212558269501, -0.02899729460477829, -0.026702461764216423, -0.024407628923654556, -0.02211279608309269, -0.019817963242530823, -0.017523130401968956, -0.01522829756140709, -0.012933464720845222, -0.010638631880283356, -0.008343799039721489, -0.006048966199159622, -0.0037541333585977554, -0.0014593005180358887, 0.0008355323225259781, 0.003130365163087845, 0.005425198003649712, 0.007720030844211578, 0.010014863684773445, 0.012309696525335312, 0.014604529365897179, 0.016899362206459045, 0.019194195047020912, 0.02148902788758278, 0.023783860728144646, 0.026078693568706512, 0.02837352640926838, 0.030668359249830246, 0.03296319395303726, 0.03525802493095398, 0.0375528559088707, 0.03984769061207771, 0.04214252531528473, 0.04443735629320145, 0.046732187271118164, 0.04902702197432518, 0.051321856677532196, 0.053616687655448914, 0.05591151863336563, 0.05820635333657265, 0.06050118803977966, 0.06279601901769638, 0.0650908499956131, 0.06738568842411041, 0.06968051940202713, 0.07197535037994385]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 6.0, 8.0, 11.0, 9.0, 15.0, 22.0, 19.0, 22.0, 30.0, 30.0, 33.0, 36.0, 57.0, 32.0, 49.0, 49.0, 59.0, 49.0, 51.0, 52.0, 45.0, 41.0, 35.0, 36.0, 38.0, 30.0, 23.0, 17.0, 12.0, 16.0, 16.0, 12.0, 9.0, 8.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.7924957275390625, -1.741241455078125, -1.6899871826171875, -1.63873291015625, -1.5874786376953125, -1.536224365234375, -1.4849700927734375, -1.4337158203125, -1.3824615478515625, -1.331207275390625, -1.2799530029296875, -1.22869873046875, -1.1774444580078125, -1.126190185546875, -1.0749359130859375, -1.023681640625, -0.9724273681640625, -0.921173095703125, -0.8699188232421875, -0.81866455078125, -0.7674102783203125, -0.716156005859375, -0.6649017333984375, -0.6136474609375, -0.5623931884765625, -0.511138916015625, -0.4598846435546875, -0.40863037109375, -0.3573760986328125, -0.306121826171875, -0.2548675537109375, -0.20361328125, -0.1523590087890625, -0.101104736328125, -0.0498504638671875, 0.00140380859375, 0.0526580810546875, 0.103912353515625, 0.1551666259765625, 0.2064208984375, 0.2576751708984375, 0.308929443359375, 0.3601837158203125, 0.41143798828125, 0.4626922607421875, 0.513946533203125, 0.5652008056640625, 0.616455078125, 0.6677093505859375, 0.718963623046875, 0.7702178955078125, 0.82147216796875, 0.8727264404296875, 0.923980712890625, 0.9752349853515625, 1.0264892578125, 1.0777435302734375, 1.128997802734375, 1.1802520751953125, 1.23150634765625, 1.2827606201171875, 1.334014892578125, 1.3852691650390625, 1.4365234375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 1.0, 3.0, 7.0, 8.0, 18.0, 28.0, 43.0, 81.0, 173.0, 283.0, 485.0, 1093.0, 2469.0, 6139.0, 17418.0, 55866.0, 174064.0, 354356.0, 278356.0, 106728.0, 32749.0, 10841.0, 4039.0, 1679.0, 767.0, 372.0, 193.0, 108.0, 74.0, 42.0, 26.0, 16.0, 16.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.1334228515625, -2.061767578125, -1.9901123046875, -1.91845703125, -1.8468017578125, -1.775146484375, -1.7034912109375, -1.6318359375, -1.5601806640625, -1.488525390625, -1.4168701171875, -1.34521484375, -1.2735595703125, -1.201904296875, -1.1302490234375, -1.05859375, -0.9869384765625, -0.915283203125, -0.8436279296875, -0.77197265625, -0.7003173828125, -0.628662109375, -0.5570068359375, -0.4853515625, -0.4136962890625, -0.342041015625, -0.2703857421875, -0.19873046875, -0.1270751953125, -0.055419921875, 0.0162353515625, 0.087890625, 0.1595458984375, 0.231201171875, 0.3028564453125, 0.37451171875, 0.4461669921875, 0.517822265625, 0.5894775390625, 0.6611328125, 0.7327880859375, 0.804443359375, 0.8760986328125, 0.94775390625, 1.0194091796875, 1.091064453125, 1.1627197265625, 1.234375, 1.3060302734375, 1.377685546875, 1.4493408203125, 1.52099609375, 1.5926513671875, 1.664306640625, 1.7359619140625, 1.8076171875, 1.8792724609375, 1.950927734375, 2.0225830078125, 2.09423828125, 2.1658935546875, 2.237548828125, 2.3092041015625, 2.380859375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 8.0, 4.0, 8.0, 10.0, 10.0, 19.0, 9.0, 20.0, 26.0, 20.0, 21.0, 37.0, 33.0, 33.0, 39.0, 49.0, 72.0, 91.0, 216.0, 1362.0, 315.0, 152.0, 86.0, 65.0, 37.0, 40.0, 31.0, 36.0, 27.0, 26.0, 19.0, 27.0, 14.0, 15.0, 16.0, 10.0, 9.0, 8.0, 9.0, 3.0, 6.0, 2.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.68359375, -5.51544189453125, -5.3472900390625, -5.17913818359375, -5.010986328125, -4.84283447265625, -4.6746826171875, -4.50653076171875, -4.33837890625, -4.17022705078125, -4.0020751953125, -3.83392333984375, -3.665771484375, -3.49761962890625, -3.3294677734375, -3.16131591796875, -2.9931640625, -2.82501220703125, -2.6568603515625, -2.48870849609375, -2.320556640625, -2.15240478515625, -1.9842529296875, -1.81610107421875, -1.64794921875, -1.47979736328125, -1.3116455078125, -1.14349365234375, -0.975341796875, -0.80718994140625, -0.6390380859375, -0.47088623046875, -0.302734375, -0.13458251953125, 0.0335693359375, 0.20172119140625, 0.369873046875, 0.53802490234375, 0.7061767578125, 0.87432861328125, 1.04248046875, 1.21063232421875, 1.3787841796875, 1.54693603515625, 1.715087890625, 1.88323974609375, 2.0513916015625, 2.21954345703125, 2.3876953125, 2.55584716796875, 2.7239990234375, 2.89215087890625, 3.060302734375, 3.22845458984375, 3.3966064453125, 3.56475830078125, 3.73291015625, 3.90106201171875, 4.0692138671875, 4.23736572265625, 4.405517578125, 4.57366943359375, 4.7418212890625, 4.90997314453125, 5.078125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 8.0, 9.0, 9.0, 9.0, 13.0, 15.0, 13.0, 19.0, 23.0, 21.0, 31.0, 35.0, 48.0, 67.0, 127.0, 207.0, 479.0, 1546.0, 10000.0, 487935.0, 2585854.0, 54151.0, 3428.0, 833.0, 298.0, 168.0, 81.0, 53.0, 30.0, 40.0, 26.0, 15.0, 16.0, 23.0, 11.0, 10.0, 12.0, 12.0, 8.0, 6.0, 8.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.8525390625, -7.564453125, -7.2763671875, -6.98828125, -6.7001953125, -6.412109375, -6.1240234375, -5.8359375, -5.5478515625, -5.259765625, -4.9716796875, -4.68359375, -4.3955078125, -4.107421875, -3.8193359375, -3.53125, -3.2431640625, -2.955078125, -2.6669921875, -2.37890625, -2.0908203125, -1.802734375, -1.5146484375, -1.2265625, -0.9384765625, -0.650390625, -0.3623046875, -0.07421875, 0.2138671875, 0.501953125, 0.7900390625, 1.078125, 1.3662109375, 1.654296875, 1.9423828125, 2.23046875, 2.5185546875, 2.806640625, 3.0947265625, 3.3828125, 3.6708984375, 3.958984375, 4.2470703125, 4.53515625, 4.8232421875, 5.111328125, 5.3994140625, 5.6875, 5.9755859375, 6.263671875, 6.5517578125, 6.83984375, 7.1279296875, 7.416015625, 7.7041015625, 7.9921875, 8.2802734375, 8.568359375, 8.8564453125, 9.14453125, 9.4326171875, 9.720703125, 10.0087890625, 10.296875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 40.0, 261.0, 491.0, 193.0, 21.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.186340808868408, -6.068256378173828, -4.95017147064209, -3.8320868015289307, -2.7140021324157715, -1.5959172248840332, -0.4778327941894531, 0.640251636505127, 1.7583365440368652, 2.8764212131500244, 3.9945058822631836, 5.112590789794922, 6.230675220489502, 7.34876012802124, 8.46684455871582, 9.584928512573242, 10.703014373779297, 11.821099281311035, 12.939184188842773, 14.057268142700195, 15.175353050231934, 16.293437957763672, 17.411521911621094, 18.529605865478516, 19.64769172668457, 20.765775680541992, 21.883861541748047, 23.00194549560547, 24.12002944946289, 25.238115310668945, 26.356199264526367, 27.474285125732422, 28.592369079589844, 29.710453033447266, 30.82853889465332, 31.946622848510742, 33.0647087097168, 34.18279266357422, 35.30087661743164, 36.41896057128906, 37.53704833984375, 38.65513229370117, 39.773216247558594, 40.89130401611328, 42.0093879699707, 43.127471923828125, 44.24555587768555, 45.36363983154297, 46.48172378540039, 47.59980773925781, 48.717891693115234, 49.83597946166992, 50.954063415527344, 52.072147369384766, 53.19023132324219, 54.30831527709961, 55.42639923095703, 56.54448318481445, 57.662567138671875, 58.78065490722656, 59.898738861083984, 61.016822814941406, 62.13490676879883, 63.25299072265625, 64.37107849121094]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 4.0, 10.0, 8.0, 12.0, 7.0, 12.0, 17.0, 14.0, 15.0, 25.0, 27.0, 19.0, 22.0, 35.0, 22.0, 40.0, 31.0, 23.0, 34.0, 34.0, 27.0, 38.0, 36.0, 44.0, 50.0, 31.0, 36.0, 31.0, 44.0, 22.0, 32.0, 29.0, 21.0, 19.0, 14.0, 19.0, 9.0, 10.0, 8.0, 8.0, 12.0, 8.0, 11.0, 5.0, 7.0, 1.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-14.282691955566406, -13.827649116516113, -13.37260627746582, -12.917563438415527, -12.462520599365234, -12.007476806640625, -11.552433967590332, -11.097391128540039, -10.642348289489746, -10.187305450439453, -9.73226261138916, -9.277219772338867, -8.822175979614258, -8.367134094238281, -7.912090301513672, -7.457047462463379, -7.002004623413086, -6.546961784362793, -6.0919189453125, -5.636875629425049, -5.181832790374756, -4.726789951324463, -4.271746635437012, -3.8167037963867188, -3.361660957336426, -2.906618118286133, -2.4515750408172607, -1.9965320825576782, -1.5414891242980957, -1.0864462852478027, -0.6314032077789307, -0.1763601303100586, 0.2786836624145508, 0.7337266206741333, 1.1887695789337158, 1.6438125371932983, 2.098855495452881, 2.553898334503174, 3.008941411972046, 3.463984489440918, 3.919027328491211, 4.374070167541504, 4.829113006591797, 5.284156322479248, 5.739199161529541, 6.194242000579834, 6.649285316467285, 7.104328155517578, 7.559370994567871, 8.014413833618164, 8.469456672668457, 8.92449951171875, 9.37954330444336, 9.834585189819336, 10.289628982543945, 10.744671821594238, 11.199714660644531, 11.654757499694824, 12.109800338745117, 12.56484317779541, 13.019886016845703, 13.474929809570312, 13.929972648620605, 14.385015487670898, 14.840058326721191]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 10.0, 6.0, 8.0, 7.0, 17.0, 17.0, 22.0, 24.0, 24.0, 25.0, 31.0, 45.0, 44.0, 40.0, 38.0, 51.0, 49.0, 52.0, 61.0, 41.0, 55.0, 32.0, 35.0, 39.0, 31.0, 31.0, 21.0, 30.0, 24.0, 17.0, 11.0, 9.0, 9.0, 11.0, 5.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.796875, -1.744964599609375, -1.69305419921875, -1.641143798828125, -1.5892333984375, -1.537322998046875, -1.48541259765625, -1.433502197265625, -1.381591796875, -1.329681396484375, -1.27777099609375, -1.225860595703125, -1.1739501953125, -1.122039794921875, -1.07012939453125, -1.018218994140625, -0.96630859375, -0.914398193359375, -0.86248779296875, -0.810577392578125, -0.7586669921875, -0.706756591796875, -0.65484619140625, -0.602935791015625, -0.551025390625, -0.499114990234375, -0.44720458984375, -0.395294189453125, -0.3433837890625, -0.291473388671875, -0.23956298828125, -0.187652587890625, -0.1357421875, -0.083831787109375, -0.03192138671875, 0.019989013671875, 0.0718994140625, 0.123809814453125, 0.17572021484375, 0.227630615234375, 0.279541015625, 0.331451416015625, 0.38336181640625, 0.435272216796875, 0.4871826171875, 0.539093017578125, 0.59100341796875, 0.642913818359375, 0.69482421875, 0.746734619140625, 0.79864501953125, 0.850555419921875, 0.9024658203125, 0.954376220703125, 1.00628662109375, 1.058197021484375, 1.110107421875, 1.162017822265625, 1.21392822265625, 1.265838623046875, 1.3177490234375, 1.369659423828125, 1.42156982421875, 1.473480224609375, 1.525390625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 7.0, 12.0, 22.0, 22.0, 36.0, 38.0, 79.0, 97.0, 162.0, 391.0, 1079.0, 5737.0, 64932.0, 1896324.0, 2145355.0, 72548.0, 5609.0, 960.0, 323.0, 174.0, 111.0, 76.0, 52.0, 34.0, 23.0, 23.0, 24.0, 12.0, 7.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.36962890625, -8.0908203125, -7.81201171875, -7.533203125, -7.25439453125, -6.9755859375, -6.69677734375, -6.41796875, -6.13916015625, -5.8603515625, -5.58154296875, -5.302734375, -5.02392578125, -4.7451171875, -4.46630859375, -4.1875, -3.90869140625, -3.6298828125, -3.35107421875, -3.072265625, -2.79345703125, -2.5146484375, -2.23583984375, -1.95703125, -1.67822265625, -1.3994140625, -1.12060546875, -0.841796875, -0.56298828125, -0.2841796875, -0.00537109375, 0.2734375, 0.55224609375, 0.8310546875, 1.10986328125, 1.388671875, 1.66748046875, 1.9462890625, 2.22509765625, 2.50390625, 2.78271484375, 3.0615234375, 3.34033203125, 3.619140625, 3.89794921875, 4.1767578125, 4.45556640625, 4.734375, 5.01318359375, 5.2919921875, 5.57080078125, 5.849609375, 6.12841796875, 6.4072265625, 6.68603515625, 6.96484375, 7.24365234375, 7.5224609375, 7.80126953125, 8.080078125, 8.35888671875, 8.6376953125, 8.91650390625, 9.1953125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 12.0, 6.0, 15.0, 20.0, 20.0, 37.0, 37.0, 65.0, 82.0, 107.0, 175.0, 255.0, 332.0, 401.0, 432.0, 482.0, 411.0, 319.0, 232.0, 191.0, 145.0, 87.0, 69.0, 49.0, 26.0, 22.0, 16.0, 8.0, 9.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.02734375, -5.8726806640625, -5.718017578125, -5.5633544921875, -5.40869140625, -5.2540283203125, -5.099365234375, -4.9447021484375, -4.7900390625, -4.6353759765625, -4.480712890625, -4.3260498046875, -4.17138671875, -4.0167236328125, -3.862060546875, -3.7073974609375, -3.552734375, -3.3980712890625, -3.243408203125, -3.0887451171875, -2.93408203125, -2.7794189453125, -2.624755859375, -2.4700927734375, -2.3154296875, -2.1607666015625, -2.006103515625, -1.8514404296875, -1.69677734375, -1.5421142578125, -1.387451171875, -1.2327880859375, -1.078125, -0.9234619140625, -0.768798828125, -0.6141357421875, -0.45947265625, -0.3048095703125, -0.150146484375, 0.0045166015625, 0.1591796875, 0.3138427734375, 0.468505859375, 0.6231689453125, 0.77783203125, 0.9324951171875, 1.087158203125, 1.2418212890625, 1.396484375, 1.5511474609375, 1.705810546875, 1.8604736328125, 2.01513671875, 2.1697998046875, 2.324462890625, 2.4791259765625, 2.6337890625, 2.7884521484375, 2.943115234375, 3.0977783203125, 3.25244140625, 3.4071044921875, 3.561767578125, 3.7164306640625, 3.87109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 4.0, 13.0, 11.0, 20.0, 16.0, 24.0, 42.0, 74.0, 98.0, 166.0, 355.0, 595.0, 1279.0, 3644.0, 12854.0, 58655.0, 305119.0, 1577006.0, 1786196.0, 357928.0, 68360.0, 14791.0, 4108.0, 1463.0, 613.0, 360.0, 187.0, 110.0, 67.0, 44.0, 28.0, 18.0, 10.0, 15.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.28350830078125, -7.0631103515625, -6.84271240234375, -6.622314453125, -6.40191650390625, -6.1815185546875, -5.96112060546875, -5.74072265625, -5.52032470703125, -5.2999267578125, -5.07952880859375, -4.859130859375, -4.63873291015625, -4.4183349609375, -4.19793701171875, -3.9775390625, -3.75714111328125, -3.5367431640625, -3.31634521484375, -3.095947265625, -2.87554931640625, -2.6551513671875, -2.43475341796875, -2.21435546875, -1.99395751953125, -1.7735595703125, -1.55316162109375, -1.332763671875, -1.11236572265625, -0.8919677734375, -0.67156982421875, -0.451171875, -0.23077392578125, -0.0103759765625, 0.21002197265625, 0.430419921875, 0.65081787109375, 0.8712158203125, 1.09161376953125, 1.31201171875, 1.53240966796875, 1.7528076171875, 1.97320556640625, 2.193603515625, 2.41400146484375, 2.6343994140625, 2.85479736328125, 3.0751953125, 3.29559326171875, 3.5159912109375, 3.73638916015625, 3.956787109375, 4.17718505859375, 4.3975830078125, 4.61798095703125, 4.83837890625, 5.05877685546875, 5.2791748046875, 5.49957275390625, 5.719970703125, 5.94036865234375, 6.1607666015625, 6.38116455078125, 6.6015625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 13.0, 15.0, 28.0, 49.0, 84.0, 129.0, 127.0, 129.0, 145.0, 111.0, 82.0, 49.0, 25.0, 7.0, 9.0, 10.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.495967864990234, -39.54095458984375, -38.58594512939453, -37.63093185424805, -36.67591857910156, -35.720909118652344, -34.76589584350586, -33.810882568359375, -32.855873107910156, -31.900861740112305, -30.94584846496582, -29.99083709716797, -29.035825729370117, -28.080814361572266, -27.12580108642578, -26.17078971862793, -25.215778350830078, -24.260766983032227, -23.305753707885742, -22.35074234008789, -21.39573097229004, -20.440719604492188, -19.485706329345703, -18.53069496154785, -17.575681686401367, -16.620670318603516, -15.665657997131348, -14.71064567565918, -13.755634307861328, -12.80062198638916, -11.845609664916992, -10.89059829711914, -9.935586929321289, -8.980574607849121, -8.02556324005127, -7.070550918579102, -6.11553955078125, -5.160527229309082, -4.205515384674072, -3.2505035400390625, -2.2954916954040527, -1.340479850769043, -0.38546788692474365, 0.5695440769195557, 1.5245559215545654, 2.4795680046081543, 3.434579849243164, 4.389591693878174, 5.344603538513184, 6.299615383148193, 7.254627227783203, 8.209639549255371, 9.164650917053223, 10.11966323852539, 11.074674606323242, 12.02968692779541, 12.984699249267578, 13.939711570739746, 14.894722938537598, 15.849735260009766, 16.804746627807617, 17.75975799560547, 18.714771270751953, 19.669782638549805, 20.624794006347656]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 11.0, 12.0, 14.0, 12.0, 18.0, 17.0, 19.0, 21.0, 26.0, 20.0, 25.0, 33.0, 29.0, 28.0, 51.0, 36.0, 45.0, 29.0, 43.0, 48.0, 40.0, 40.0, 48.0, 34.0, 27.0, 30.0, 32.0, 24.0, 28.0, 20.0, 24.0, 24.0, 11.0, 11.0, 17.0, 5.0, 9.0, 8.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.24262523651123, -12.794083595275879, -12.345542907714844, -11.897001266479492, -11.44845962524414, -10.999917984008789, -10.551377296447754, -10.102835655212402, -9.654294967651367, -9.205753326416016, -8.75721263885498, -8.308670997619629, -7.860129356384277, -7.411588191986084, -6.963047027587891, -6.514505386352539, -6.0659637451171875, -5.617422580718994, -5.168880939483643, -4.720339775085449, -4.271798133850098, -3.8232569694519043, -3.374715805053711, -2.9261744022369385, -2.477632999420166, -2.0290915966033936, -1.5805503129959106, -1.1320090293884277, -0.6834676265716553, -0.2349262237548828, 0.21361494064331055, 0.662156343460083, 1.1106977462768555, 1.559239149093628, 2.0077805519104004, 2.4563217163085938, 2.904863119125366, 3.3534045219421387, 3.801945686340332, 4.250487327575684, 4.699028491973877, 5.14756965637207, 5.596111297607422, 6.044652462005615, 6.493193626403809, 6.94173526763916, 7.3902764320373535, 7.838817596435547, 8.287359237670898, 8.73590087890625, 9.184441566467285, 9.632983207702637, 10.081524848937988, 10.530065536499023, 10.978607177734375, 11.427148818969727, 11.875690460205078, 12.32423210144043, 12.772772789001465, 13.221314430236816, 13.669856071472168, 14.118396759033203, 14.566938400268555, 15.015480041503906, 15.464020729064941]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 13.0, 12.0, 7.0, 13.0, 30.0, 16.0, 21.0, 16.0, 22.0, 31.0, 16.0, 31.0, 29.0, 40.0, 41.0, 36.0, 39.0, 30.0, 46.0, 46.0, 45.0, 43.0, 31.0, 31.0, 36.0, 33.0, 26.0, 19.0, 28.0, 23.0, 16.0, 20.0, 13.0, 14.0, 11.0, 14.0, 5.0, 10.0, 9.0, 4.0, 7.0, 2.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3172607421875, -1.273193359375, -1.2291259765625, -1.18505859375, -1.1409912109375, -1.096923828125, -1.0528564453125, -1.0087890625, -0.9647216796875, -0.920654296875, -0.8765869140625, -0.83251953125, -0.7884521484375, -0.744384765625, -0.7003173828125, -0.65625, -0.6121826171875, -0.568115234375, -0.5240478515625, -0.47998046875, -0.4359130859375, -0.391845703125, -0.3477783203125, -0.3037109375, -0.2596435546875, -0.215576171875, -0.1715087890625, -0.12744140625, -0.0833740234375, -0.039306640625, 0.0047607421875, 0.048828125, 0.0928955078125, 0.136962890625, 0.1810302734375, 0.22509765625, 0.2691650390625, 0.313232421875, 0.3572998046875, 0.4013671875, 0.4454345703125, 0.489501953125, 0.5335693359375, 0.57763671875, 0.6217041015625, 0.665771484375, 0.7098388671875, 0.75390625, 0.7979736328125, 0.842041015625, 0.8861083984375, 0.93017578125, 0.9742431640625, 1.018310546875, 1.0623779296875, 1.1064453125, 1.1505126953125, 1.194580078125, 1.2386474609375, 1.28271484375, 1.3267822265625, 1.370849609375, 1.4149169921875, 1.458984375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 3.0, 18.0, 24.0, 41.0, 75.0, 131.0, 260.0, 404.0, 864.0, 1455.0, 2912.0, 5284.0, 9565.0, 17308.0, 30573.0, 52652.0, 85522.0, 124808.0, 159119.0, 167292.0, 139402.0, 100206.0, 63761.0, 38166.0, 21965.0, 12283.0, 6603.0, 3574.0, 1902.0, 1051.0, 593.0, 318.0, 177.0, 95.0, 56.0, 26.0, 25.0, 17.0, 6.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.642578125, -0.62261962890625, -0.6026611328125, -0.58270263671875, -0.562744140625, -0.54278564453125, -0.5228271484375, -0.50286865234375, -0.48291015625, -0.46295166015625, -0.4429931640625, -0.42303466796875, -0.403076171875, -0.38311767578125, -0.3631591796875, -0.34320068359375, -0.3232421875, -0.30328369140625, -0.2833251953125, -0.26336669921875, -0.243408203125, -0.22344970703125, -0.2034912109375, -0.18353271484375, -0.16357421875, -0.14361572265625, -0.1236572265625, -0.10369873046875, -0.083740234375, -0.06378173828125, -0.0438232421875, -0.02386474609375, -0.00390625, 0.01605224609375, 0.0360107421875, 0.05596923828125, 0.075927734375, 0.09588623046875, 0.1158447265625, 0.13580322265625, 0.15576171875, 0.17572021484375, 0.1956787109375, 0.21563720703125, 0.235595703125, 0.25555419921875, 0.2755126953125, 0.29547119140625, 0.3154296875, 0.33538818359375, 0.3553466796875, 0.37530517578125, 0.395263671875, 0.41522216796875, 0.4351806640625, 0.45513916015625, 0.47509765625, 0.49505615234375, 0.5150146484375, 0.53497314453125, 0.554931640625, 0.57489013671875, 0.5948486328125, 0.61480712890625, 0.634765625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 7.0, 5.0, 5.0, 8.0, 11.0, 8.0, 8.0, 10.0, 12.0, 19.0, 14.0, 26.0, 18.0, 34.0, 33.0, 24.0, 25.0, 22.0, 32.0, 28.0, 55.0, 32.0, 1065.0, 40.0, 47.0, 45.0, 49.0, 25.0, 29.0, 32.0, 21.0, 31.0, 22.0, 26.0, 22.0, 20.0, 17.0, 16.0, 9.0, 16.0, 11.0, 8.0, 11.0, 9.0, 5.0, 5.0, 2.0, 1.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.03125, -0.99859619140625, -0.9659423828125, -0.93328857421875, -0.900634765625, -0.86798095703125, -0.8353271484375, -0.80267333984375, -0.77001953125, -0.73736572265625, -0.7047119140625, -0.67205810546875, -0.639404296875, -0.60675048828125, -0.5740966796875, -0.54144287109375, -0.5087890625, -0.47613525390625, -0.4434814453125, -0.41082763671875, -0.378173828125, -0.34552001953125, -0.3128662109375, -0.28021240234375, -0.24755859375, -0.21490478515625, -0.1822509765625, -0.14959716796875, -0.116943359375, -0.08428955078125, -0.0516357421875, -0.01898193359375, 0.013671875, 0.04632568359375, 0.0789794921875, 0.11163330078125, 0.144287109375, 0.17694091796875, 0.2095947265625, 0.24224853515625, 0.27490234375, 0.30755615234375, 0.3402099609375, 0.37286376953125, 0.405517578125, 0.43817138671875, 0.4708251953125, 0.50347900390625, 0.5361328125, 0.56878662109375, 0.6014404296875, 0.63409423828125, 0.666748046875, 0.69940185546875, 0.7320556640625, 0.76470947265625, 0.79736328125, 0.83001708984375, 0.8626708984375, 0.89532470703125, 0.927978515625, 0.96063232421875, 0.9932861328125, 1.02593994140625, 1.05859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 13.0, 14.0, 23.0, 31.0, 42.0, 56.0, 67.0, 112.0, 122.0, 205.0, 284.0, 388.0, 482.0, 727.0, 990.0, 1557.0, 2084.0, 2953.0, 4004.0, 5688.0, 7982.0, 11552.0, 17698.0, 30128.0, 1635769.0, 288440.0, 29288.0, 17471.0, 11458.0, 7992.0, 5672.0, 3946.0, 2844.0, 2059.0, 1506.0, 1044.0, 724.0, 488.0, 359.0, 236.0, 192.0, 144.0, 79.0, 56.0, 49.0, 30.0, 29.0, 21.0, 9.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.83984375, -0.81512451171875, -0.7904052734375, -0.76568603515625, -0.740966796875, -0.71624755859375, -0.6915283203125, -0.66680908203125, -0.64208984375, -0.61737060546875, -0.5926513671875, -0.56793212890625, -0.543212890625, -0.51849365234375, -0.4937744140625, -0.46905517578125, -0.4443359375, -0.41961669921875, -0.3948974609375, -0.37017822265625, -0.345458984375, -0.32073974609375, -0.2960205078125, -0.27130126953125, -0.24658203125, -0.22186279296875, -0.1971435546875, -0.17242431640625, -0.147705078125, -0.12298583984375, -0.0982666015625, -0.07354736328125, -0.048828125, -0.02410888671875, 0.0006103515625, 0.02532958984375, 0.050048828125, 0.07476806640625, 0.0994873046875, 0.12420654296875, 0.14892578125, 0.17364501953125, 0.1983642578125, 0.22308349609375, 0.247802734375, 0.27252197265625, 0.2972412109375, 0.32196044921875, 0.3466796875, 0.37139892578125, 0.3961181640625, 0.42083740234375, 0.445556640625, 0.47027587890625, 0.4949951171875, 0.51971435546875, 0.54443359375, 0.56915283203125, 0.5938720703125, 0.61859130859375, 0.643310546875, 0.66802978515625, 0.6927490234375, 0.71746826171875, 0.7421875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 4.0, 5.0, 5.0, 16.0, 11.0, 13.0, 9.0, 13.0, 18.0, 25.0, 35.0, 31.0, 43.0, 33.0, 58.0, 60.0, 63.0, 63.0, 56.0, 64.0, 56.0, 56.0, 42.0, 31.0, 40.0, 14.0, 17.0, 16.0, 14.0, 16.0, 8.0, 9.0, 5.0, 7.0, 8.0, 4.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0232696533203125, -0.022517681121826172, -0.021765708923339844, -0.021013736724853516, -0.020261764526367188, -0.01950979232788086, -0.01875782012939453, -0.018005847930908203, -0.017253875732421875, -0.016501903533935547, -0.01574993133544922, -0.01499795913696289, -0.014245986938476562, -0.013494014739990234, -0.012742042541503906, -0.011990070343017578, -0.01123809814453125, -0.010486125946044922, -0.009734153747558594, -0.008982181549072266, -0.008230209350585938, -0.007478237152099609, -0.006726264953613281, -0.005974292755126953, -0.005222320556640625, -0.004470348358154297, -0.0037183761596679688, -0.0029664039611816406, -0.0022144317626953125, -0.0014624595642089844, -0.0007104873657226562, 4.1484832763671875e-05, 0.00079345703125, 0.0015454292297363281, 0.0022974014282226562, 0.0030493736267089844, 0.0038013458251953125, 0.004553318023681641, 0.005305290222167969, 0.006057262420654297, 0.006809234619140625, 0.007561206817626953, 0.008313179016113281, 0.00906515121459961, 0.009817123413085938, 0.010569095611572266, 0.011321067810058594, 0.012073040008544922, 0.01282501220703125, 0.013576984405517578, 0.014328956604003906, 0.015080928802490234, 0.015832901000976562, 0.01658487319946289, 0.01733684539794922, 0.018088817596435547, 0.018840789794921875, 0.019592761993408203, 0.02034473419189453, 0.02109670639038086, 0.021848678588867188, 0.022600650787353516, 0.023352622985839844, 0.024104595184326172, 0.0248565673828125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 5.0, 4.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 11.0, 22.0, 16.0, 25.0, 17.0, 20.0, 33.0, 45.0, 45.0, 57.0, 52.0, 72.0, 121.0, 150.0, 156.0, 220.0, 330.0, 1110.0, 22547.0, 754490.0, 260960.0, 6186.0, 572.0, 274.0, 202.0, 156.0, 110.0, 96.0, 72.0, 52.0, 48.0, 41.0, 28.0, 37.0, 33.0, 23.0, 22.0, 17.0, 6.0, 10.0, 13.0, 3.0, 4.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.34765625, -0.3363761901855469, -0.32509613037109375, -0.3138160705566406, -0.3025360107421875, -0.2912559509277344, -0.27997589111328125, -0.2686958312988281, -0.257415771484375, -0.24613571166992188, -0.23485565185546875, -0.22357559204101562, -0.2122955322265625, -0.20101547241210938, -0.18973541259765625, -0.17845535278320312, -0.16717529296875, -0.15589523315429688, -0.14461517333984375, -0.13333511352539062, -0.1220550537109375, -0.11077499389648438, -0.09949493408203125, -0.08821487426757812, -0.076934814453125, -0.06565475463867188, -0.05437469482421875, -0.043094635009765625, -0.0318145751953125, -0.020534515380859375, -0.00925445556640625, 0.002025604248046875, 0.0133056640625, 0.024585723876953125, 0.03586578369140625, 0.047145843505859375, 0.0584259033203125, 0.06970596313476562, 0.08098602294921875, 0.09226608276367188, 0.103546142578125, 0.11482620239257812, 0.12610626220703125, 0.13738632202148438, 0.1486663818359375, 0.15994644165039062, 0.17122650146484375, 0.18250656127929688, 0.19378662109375, 0.20506668090820312, 0.21634674072265625, 0.22762680053710938, 0.2389068603515625, 0.2501869201660156, 0.26146697998046875, 0.2727470397949219, 0.284027099609375, 0.2953071594238281, 0.30658721923828125, 0.3178672790527344, 0.3291473388671875, 0.3404273986816406, 0.35170745849609375, 0.3629875183105469, 0.374267578125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 36.0, 89.0, 355.0, 414.0, 73.0, 31.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6278042793273926, -0.6117056012153625, -0.5956069231033325, -0.5795082449913025, -0.5634095668792725, -0.5473108291625977, -0.5312122106552124, -0.5151134729385376, -0.49901479482650757, -0.48291611671447754, -0.4668174386024475, -0.4507187604904175, -0.43462005257606506, -0.41852137446403503, -0.402422696352005, -0.386324018239975, -0.37022534012794495, -0.3541266620159149, -0.3380279839038849, -0.32192927598953247, -0.30583059787750244, -0.2897319197654724, -0.2736332416534424, -0.25753456354141235, -0.24143587052822113, -0.2253371924161911, -0.20923849940299988, -0.19313982129096985, -0.17704114317893982, -0.1609424501657486, -0.14484377205371857, -0.12874507904052734, -0.1126464307308197, -0.09654774516820908, -0.08044905960559845, -0.06435038149356842, -0.048251695930957794, -0.03215301036834717, -0.01605433225631714, 4.435330629348755e-05, 0.016143038868904114, 0.03224172443151474, 0.04834040626883507, 0.0644390881061554, 0.08053777366876602, 0.09663645923137665, 0.11273513734340668, 0.1288338303565979, 0.14493250846862793, 0.16103118658065796, 0.17712987959384918, 0.1932285577058792, 0.20932725071907043, 0.22542592883110046, 0.2415246069431305, 0.2576232850551605, 0.27372199296951294, 0.28982067108154297, 0.305919349193573, 0.322018027305603, 0.33811673521995544, 0.3542154133319855, 0.3703140914440155, 0.38641276955604553, 0.40251144766807556]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 7.0, 8.0, 7.0, 10.0, 8.0, 15.0, 15.0, 30.0, 28.0, 32.0, 38.0, 44.0, 39.0, 42.0, 42.0, 46.0, 44.0, 53.0, 47.0, 58.0, 63.0, 52.0, 51.0, 42.0, 32.0, 35.0, 23.0, 24.0, 16.0, 14.0, 8.0, 9.0, 11.0, 5.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039926111698150635, -0.0380634069442749, -0.03620069846510887, -0.03433798998594284, -0.03247528523206711, -0.030612578615546227, -0.028749871999025345, -0.026887165382504463, -0.02502445876598358, -0.0231617521494627, -0.021299045532941818, -0.019436338916420937, -0.017573632299900055, -0.015710925683379173, -0.013848219066858292, -0.01198551245033741, -0.010122805833816528, -0.008260099217295647, -0.006397392600774765, -0.004534685984253883, -0.0026719793677330017, -0.0008092727512121201, 0.0010534338653087616, 0.0029161404818296432, 0.004778847098350525, 0.0066415537148714066, 0.008504260331392288, 0.01036696694791317, 0.012229673564434052, 0.014092380180954933, 0.015955086797475815, 0.017817793413996696, 0.019680500030517578, 0.02154320664703846, 0.02340591326355934, 0.025268619880080223, 0.027131326496601105, 0.028994033113121986, 0.030856739729642868, 0.0327194482088089, 0.03458215296268463, 0.036444857716560364, 0.038307566195726395, 0.040170274674892426, 0.04203297942876816, 0.04389568418264389, 0.04575839266180992, 0.04762110114097595, 0.049483805894851685, 0.05134651064872742, 0.05320921912789345, 0.05507192760705948, 0.05693463236093521, 0.058797337114810944, 0.060660045593976974, 0.062522754073143, 0.06438545882701874, 0.06624816358089447, 0.0681108683347702, 0.06997358053922653, 0.07183628529310226, 0.073698990046978, 0.07556170225143433, 0.07742440700531006, 0.07928711175918579]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 2.0, 13.0, 10.0, 14.0, 7.0, 14.0, 21.0, 17.0, 14.0, 24.0, 36.0, 32.0, 30.0, 30.0, 29.0, 33.0, 34.0, 47.0, 37.0, 44.0, 52.0, 39.0, 47.0, 33.0, 36.0, 33.0, 34.0, 32.0, 28.0, 23.0, 23.0, 22.0, 23.0, 16.0, 16.0, 13.0, 3.0, 7.0, 10.0, 7.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.6630859375, -1.6154632568359375, -1.567840576171875, -1.5202178955078125, -1.47259521484375, -1.4249725341796875, -1.377349853515625, -1.3297271728515625, -1.2821044921875, -1.2344818115234375, -1.186859130859375, -1.1392364501953125, -1.09161376953125, -1.0439910888671875, -0.996368408203125, -0.9487457275390625, -0.901123046875, -0.8535003662109375, -0.805877685546875, -0.7582550048828125, -0.71063232421875, -0.6630096435546875, -0.615386962890625, -0.5677642822265625, -0.5201416015625, -0.4725189208984375, -0.424896240234375, -0.3772735595703125, -0.32965087890625, -0.2820281982421875, -0.234405517578125, -0.1867828369140625, -0.13916015625, -0.0915374755859375, -0.043914794921875, 0.0037078857421875, 0.05133056640625, 0.0989532470703125, 0.146575927734375, 0.1941986083984375, 0.2418212890625, 0.2894439697265625, 0.337066650390625, 0.3846893310546875, 0.43231201171875, 0.4799346923828125, 0.527557373046875, 0.5751800537109375, 0.622802734375, 0.6704254150390625, 0.718048095703125, 0.7656707763671875, 0.81329345703125, 0.8609161376953125, 0.908538818359375, 0.9561614990234375, 1.0037841796875, 1.0514068603515625, 1.099029541015625, 1.1466522216796875, 1.19427490234375, 1.2418975830078125, 1.289520263671875, 1.3371429443359375, 1.384765625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 12.0, 9.0, 20.0, 22.0, 51.0, 68.0, 131.0, 233.0, 489.0, 939.0, 1898.0, 4102.0, 9302.0, 23410.0, 78699.0, 417437.0, 396889.0, 75427.0, 22549.0, 9060.0, 3966.0, 1884.0, 943.0, 470.0, 238.0, 116.0, 70.0, 31.0, 25.0, 24.0, 11.0, 8.0, 4.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.952606201171875, -2.86029052734375, -2.767974853515625, -2.6756591796875, -2.583343505859375, -2.49102783203125, -2.398712158203125, -2.306396484375, -2.214080810546875, -2.12176513671875, -2.029449462890625, -1.9371337890625, -1.844818115234375, -1.75250244140625, -1.660186767578125, -1.56787109375, -1.475555419921875, -1.38323974609375, -1.290924072265625, -1.1986083984375, -1.106292724609375, -1.01397705078125, -0.921661376953125, -0.829345703125, -0.737030029296875, -0.64471435546875, -0.552398681640625, -0.4600830078125, -0.367767333984375, -0.27545166015625, -0.183135986328125, -0.0908203125, 0.001495361328125, 0.09381103515625, 0.186126708984375, 0.2784423828125, 0.370758056640625, 0.46307373046875, 0.555389404296875, 0.647705078125, 0.740020751953125, 0.83233642578125, 0.924652099609375, 1.0169677734375, 1.109283447265625, 1.20159912109375, 1.293914794921875, 1.38623046875, 1.478546142578125, 1.57086181640625, 1.663177490234375, 1.7554931640625, 1.847808837890625, 1.94012451171875, 2.032440185546875, 2.124755859375, 2.217071533203125, 2.30938720703125, 2.401702880859375, 2.4940185546875, 2.586334228515625, 2.67864990234375, 2.770965576171875, 2.86328125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 12.0, 7.0, 11.0, 15.0, 19.0, 20.0, 26.0, 27.0, 41.0, 35.0, 38.0, 33.0, 40.0, 40.0, 59.0, 108.0, 212.0, 1554.0, 215.0, 104.0, 53.0, 46.0, 36.0, 32.0, 48.0, 34.0, 29.0, 24.0, 17.0, 22.0, 19.0, 14.0, 10.0, 6.0, 8.0, 6.0, 3.0, 6.0, 1.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.96875, -5.7850341796875, -5.601318359375, -5.4176025390625, -5.23388671875, -5.0501708984375, -4.866455078125, -4.6827392578125, -4.4990234375, -4.3153076171875, -4.131591796875, -3.9478759765625, -3.76416015625, -3.5804443359375, -3.396728515625, -3.2130126953125, -3.029296875, -2.8455810546875, -2.661865234375, -2.4781494140625, -2.29443359375, -2.1107177734375, -1.927001953125, -1.7432861328125, -1.5595703125, -1.3758544921875, -1.192138671875, -1.0084228515625, -0.82470703125, -0.6409912109375, -0.457275390625, -0.2735595703125, -0.08984375, 0.0938720703125, 0.277587890625, 0.4613037109375, 0.64501953125, 0.8287353515625, 1.012451171875, 1.1961669921875, 1.3798828125, 1.5635986328125, 1.747314453125, 1.9310302734375, 2.11474609375, 2.2984619140625, 2.482177734375, 2.6658935546875, 2.849609375, 3.0333251953125, 3.217041015625, 3.4007568359375, 3.58447265625, 3.7681884765625, 3.951904296875, 4.1356201171875, 4.3193359375, 4.5030517578125, 4.686767578125, 4.8704833984375, 5.05419921875, 5.2379150390625, 5.421630859375, 5.6053466796875, 5.7890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 6.0, 13.0, 13.0, 21.0, 20.0, 28.0, 30.0, 37.0, 73.0, 83.0, 129.0, 185.0, 378.0, 998.0, 4330.0, 39725.0, 2030998.0, 1035808.0, 27494.0, 3466.0, 846.0, 348.0, 192.0, 101.0, 95.0, 57.0, 45.0, 36.0, 25.0, 24.0, 18.0, 16.0, 10.0, 10.0, 6.0, 4.0, 4.0, 6.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.2578125, -7.9908447265625, -7.723876953125, -7.4569091796875, -7.18994140625, -6.9229736328125, -6.656005859375, -6.3890380859375, -6.1220703125, -5.8551025390625, -5.588134765625, -5.3211669921875, -5.05419921875, -4.7872314453125, -4.520263671875, -4.2532958984375, -3.986328125, -3.7193603515625, -3.452392578125, -3.1854248046875, -2.91845703125, -2.6514892578125, -2.384521484375, -2.1175537109375, -1.8505859375, -1.5836181640625, -1.316650390625, -1.0496826171875, -0.78271484375, -0.5157470703125, -0.248779296875, 0.0181884765625, 0.28515625, 0.5521240234375, 0.819091796875, 1.0860595703125, 1.35302734375, 1.6199951171875, 1.886962890625, 2.1539306640625, 2.4208984375, 2.6878662109375, 2.954833984375, 3.2218017578125, 3.48876953125, 3.7557373046875, 4.022705078125, 4.2896728515625, 4.556640625, 4.8236083984375, 5.090576171875, 5.3575439453125, 5.62451171875, 5.8914794921875, 6.158447265625, 6.4254150390625, 6.6923828125, 6.9593505859375, 7.226318359375, 7.4932861328125, 7.76025390625, 8.0272216796875, 8.294189453125, 8.5611572265625, 8.828125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 169.0, 753.0, 96.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.90784454345703, -114.67567443847656, -112.44349670410156, -110.2113265991211, -107.97915649414062, -105.74697875976562, -103.51480865478516, -101.28263854980469, -99.05046081542969, -96.81829071044922, -94.58611297607422, -92.35394287109375, -90.12177276611328, -87.88959503173828, -85.65742492675781, -83.42525482177734, -81.19308471679688, -78.9609146118164, -76.7287368774414, -74.49656677246094, -72.26439666748047, -70.03221893310547, -67.800048828125, -65.56787872314453, -63.33570098876953, -61.1035270690918, -58.87135696411133, -56.639183044433594, -54.40700912475586, -52.174835205078125, -49.942665100097656, -47.71049118041992, -45.47831344604492, -43.24613952636719, -41.01396942138672, -38.781795501708984, -36.54962158203125, -34.31745147705078, -32.08527755737305, -29.853103637695312, -27.62093162536621, -25.38875961303711, -23.156585693359375, -20.924413681030273, -18.692241668701172, -16.460067749023438, -14.227895736694336, -11.995722770690918, -9.7635498046875, -7.531376838684082, -5.299204349517822, -3.0670318603515625, -0.8348588943481445, 1.3973140716552734, 3.629486083984375, 5.861659049987793, 8.093832015991211, 10.326004981994629, 12.558177947998047, 14.790349960327148, 17.02252197265625, 19.254695892333984, 21.486867904663086, 23.719039916992188, 25.951213836669922]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 7.0, 8.0, 7.0, 14.0, 15.0, 15.0, 16.0, 16.0, 19.0, 29.0, 32.0, 29.0, 36.0, 30.0, 38.0, 52.0, 41.0, 37.0, 36.0, 32.0, 35.0, 36.0, 50.0, 33.0, 37.0, 33.0, 29.0, 33.0, 25.0, 23.0, 25.0, 17.0, 17.0, 18.0, 23.0, 10.0, 11.0, 9.0, 7.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-22.23246192932129, -21.618980407714844, -21.00550079345703, -20.392019271850586, -19.778539657592773, -19.165058135986328, -18.551578521728516, -17.93809700012207, -17.324617385864258, -16.711135864257812, -16.09765625, -15.484175682067871, -14.870695114135742, -14.257214546203613, -13.643733978271484, -13.030252456665039, -12.41677188873291, -11.803291320800781, -11.189810752868652, -10.576330184936523, -9.962849617004395, -9.349369049072266, -8.73588752746582, -8.122407913208008, -7.508926868438721, -6.895446300506592, -6.281965732574463, -5.668484687805176, -5.055004119873047, -4.441523551940918, -3.828042984008789, -3.21456241607666, -2.6010818481445312, -1.9876012802124023, -1.3741205930709839, -0.7606399059295654, -0.14715933799743652, 0.4663212299346924, 1.0798020362854004, 1.6932826042175293, 2.306763172149658, 2.920243740081787, 3.533724308013916, 4.147205352783203, 4.760685920715332, 5.374166488647461, 5.98764705657959, 6.601127624511719, 7.214608192443848, 7.828088760375977, 8.441569328308105, 9.055049896240234, 9.668530464172363, 10.282011032104492, 10.895492553710938, 11.50897216796875, 12.122453689575195, 12.735934257507324, 13.349414825439453, 13.962895393371582, 14.576375961303711, 15.18985652923584, 15.803337097167969, 16.416818618774414, 17.030298233032227]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 2.0, 8.0, 8.0, 17.0, 5.0, 14.0, 19.0, 23.0, 24.0, 25.0, 21.0, 30.0, 31.0, 34.0, 30.0, 25.0, 35.0, 38.0, 42.0, 48.0, 36.0, 36.0, 47.0, 41.0, 39.0, 30.0, 33.0, 29.0, 39.0, 22.0, 23.0, 17.0, 26.0, 21.0, 14.0, 9.0, 13.0, 9.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.62890625, -1.5800628662109375, -1.531219482421875, -1.4823760986328125, -1.43353271484375, -1.3846893310546875, -1.335845947265625, -1.2870025634765625, -1.2381591796875, -1.1893157958984375, -1.140472412109375, -1.0916290283203125, -1.04278564453125, -0.9939422607421875, -0.945098876953125, -0.8962554931640625, -0.847412109375, -0.7985687255859375, -0.749725341796875, -0.7008819580078125, -0.65203857421875, -0.6031951904296875, -0.554351806640625, -0.5055084228515625, -0.4566650390625, -0.4078216552734375, -0.358978271484375, -0.3101348876953125, -0.26129150390625, -0.2124481201171875, -0.163604736328125, -0.1147613525390625, -0.06591796875, -0.0170745849609375, 0.031768798828125, 0.0806121826171875, 0.12945556640625, 0.1782989501953125, 0.227142333984375, 0.2759857177734375, 0.3248291015625, 0.3736724853515625, 0.422515869140625, 0.4713592529296875, 0.52020263671875, 0.5690460205078125, 0.617889404296875, 0.6667327880859375, 0.715576171875, 0.7644195556640625, 0.813262939453125, 0.8621063232421875, 0.91094970703125, 0.9597930908203125, 1.008636474609375, 1.0574798583984375, 1.1063232421875, 1.1551666259765625, 1.204010009765625, 1.2528533935546875, 1.30169677734375, 1.3505401611328125, 1.399383544921875, 1.4482269287109375, 1.4970703125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 8.0, 8.0, 10.0, 18.0, 14.0, 20.0, 37.0, 32.0, 69.0, 73.0, 132.0, 252.0, 567.0, 2177.0, 11776.0, 106380.0, 1989775.0, 1962775.0, 105883.0, 11058.0, 1974.0, 564.0, 230.0, 118.0, 80.0, 69.0, 47.0, 38.0, 35.0, 15.0, 13.0, 3.0, 7.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5078125, -5.268310546875, -5.02880859375, -4.789306640625, -4.5498046875, -4.310302734375, -4.07080078125, -3.831298828125, -3.591796875, -3.352294921875, -3.11279296875, -2.873291015625, -2.6337890625, -2.394287109375, -2.15478515625, -1.915283203125, -1.67578125, -1.436279296875, -1.19677734375, -0.957275390625, -0.7177734375, -0.478271484375, -0.23876953125, 0.000732421875, 0.240234375, 0.479736328125, 0.71923828125, 0.958740234375, 1.1982421875, 1.437744140625, 1.67724609375, 1.916748046875, 2.15625, 2.395751953125, 2.63525390625, 2.874755859375, 3.1142578125, 3.353759765625, 3.59326171875, 3.832763671875, 4.072265625, 4.311767578125, 4.55126953125, 4.790771484375, 5.0302734375, 5.269775390625, 5.50927734375, 5.748779296875, 5.98828125, 6.227783203125, 6.46728515625, 6.706787109375, 6.9462890625, 7.185791015625, 7.42529296875, 7.664794921875, 7.904296875, 8.143798828125, 8.38330078125, 8.622802734375, 8.8623046875, 9.101806640625, 9.34130859375, 9.580810546875, 9.8203125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 15.0, 16.0, 18.0, 46.0, 40.0, 59.0, 85.0, 151.0, 204.0, 265.0, 372.0, 503.0, 504.0, 485.0, 369.0, 264.0, 202.0, 147.0, 100.0, 57.0, 53.0, 30.0, 22.0, 21.0, 15.0, 8.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.81561279296875, -4.6468505859375, -4.47808837890625, -4.309326171875, -4.14056396484375, -3.9718017578125, -3.80303955078125, -3.63427734375, -3.46551513671875, -3.2967529296875, -3.12799072265625, -2.959228515625, -2.79046630859375, -2.6217041015625, -2.45294189453125, -2.2841796875, -2.11541748046875, -1.9466552734375, -1.77789306640625, -1.609130859375, -1.44036865234375, -1.2716064453125, -1.10284423828125, -0.93408203125, -0.76531982421875, -0.5965576171875, -0.42779541015625, -0.259033203125, -0.09027099609375, 0.0784912109375, 0.24725341796875, 0.416015625, 0.58477783203125, 0.7535400390625, 0.92230224609375, 1.091064453125, 1.25982666015625, 1.4285888671875, 1.59735107421875, 1.76611328125, 1.93487548828125, 2.1036376953125, 2.27239990234375, 2.441162109375, 2.60992431640625, 2.7786865234375, 2.94744873046875, 3.1162109375, 3.28497314453125, 3.4537353515625, 3.62249755859375, 3.791259765625, 3.96002197265625, 4.1287841796875, 4.29754638671875, 4.46630859375, 4.63507080078125, 4.8038330078125, 4.97259521484375, 5.141357421875, 5.31011962890625, 5.4788818359375, 5.64764404296875, 5.81640625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 10.0, 24.0, 42.0, 41.0, 77.0, 126.0, 234.0, 443.0, 854.0, 2283.0, 8421.0, 51065.0, 439548.0, 2613093.0, 951979.0, 105228.0, 14964.0, 3439.0, 1215.0, 474.0, 279.0, 153.0, 102.0, 56.0, 36.0, 19.0, 21.0, 14.0, 3.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.1796875, -9.8861083984375, -9.592529296875, -9.2989501953125, -9.00537109375, -8.7117919921875, -8.418212890625, -8.1246337890625, -7.8310546875, -7.5374755859375, -7.243896484375, -6.9503173828125, -6.65673828125, -6.3631591796875, -6.069580078125, -5.7760009765625, -5.482421875, -5.1888427734375, -4.895263671875, -4.6016845703125, -4.30810546875, -4.0145263671875, -3.720947265625, -3.4273681640625, -3.1337890625, -2.8402099609375, -2.546630859375, -2.2530517578125, -1.95947265625, -1.6658935546875, -1.372314453125, -1.0787353515625, -0.78515625, -0.4915771484375, -0.197998046875, 0.0955810546875, 0.38916015625, 0.6827392578125, 0.976318359375, 1.2698974609375, 1.5634765625, 1.8570556640625, 2.150634765625, 2.4442138671875, 2.73779296875, 3.0313720703125, 3.324951171875, 3.6185302734375, 3.912109375, 4.2056884765625, 4.499267578125, 4.7928466796875, 5.08642578125, 5.3800048828125, 5.673583984375, 5.9671630859375, 6.2607421875, 6.5543212890625, 6.847900390625, 7.1414794921875, 7.43505859375, 7.7286376953125, 8.022216796875, 8.3157958984375, 8.609375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 13.0, 25.0, 57.0, 73.0, 107.0, 130.0, 145.0, 161.0, 117.0, 77.0, 47.0, 21.0, 14.0, 8.0, 4.0, 3.0, 2.0], "bins": [-56.57752990722656, -55.51911544799805, -54.46070098876953, -53.402286529541016, -52.3438720703125, -51.28545379638672, -50.2270393371582, -49.16862487792969, -48.11021041870117, -47.051795959472656, -45.99338150024414, -44.934967041015625, -43.876548767089844, -42.81813430786133, -41.75971984863281, -40.7013053894043, -39.64289093017578, -38.584476470947266, -37.52606201171875, -36.467647552490234, -35.40923309326172, -34.35081481933594, -33.29240036010742, -32.233985900878906, -31.17557144165039, -30.117156982421875, -29.05874252319336, -28.00032615661621, -26.941911697387695, -25.88349723815918, -24.82508087158203, -23.766666412353516, -22.708251953125, -21.649837493896484, -20.59142303466797, -19.53300666809082, -18.474592208862305, -17.41617774963379, -16.35776138305664, -15.299346923828125, -14.24093246459961, -13.182518005371094, -12.124102592468262, -11.06568717956543, -10.007272720336914, -8.948858261108398, -7.890442848205566, -6.832027912139893, -5.773612976074219, -4.715198040008545, -3.656783103942871, -2.5983681678771973, -1.5399532318115234, -0.4815382957458496, 0.5768766403198242, 1.635291576385498, 2.693706512451172, 3.7521214485168457, 4.8105363845825195, 5.868951320648193, 6.927366256713867, 7.985781192779541, 9.044196128845215, 10.102611541748047, 11.161026000976562]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 15.0, 9.0, 12.0, 13.0, 20.0, 23.0, 41.0, 22.0, 25.0, 44.0, 41.0, 34.0, 40.0, 47.0, 50.0, 54.0, 56.0, 46.0, 41.0, 40.0, 43.0, 41.0, 40.0, 28.0, 26.0, 25.0, 24.0, 17.0, 13.0, 10.0, 16.0, 13.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.550176620483398, -13.98268985748291, -13.415204048156738, -12.84771728515625, -12.280230522155762, -11.712743759155273, -11.145257949829102, -10.577771186828613, -10.010284423828125, -9.442797660827637, -8.875311851501465, -8.307825088500977, -7.740338325500488, -7.172852039337158, -6.605365753173828, -6.03787899017334, -5.470393180847168, -4.902906894683838, -4.33542013168335, -3.7679338455200195, -3.2004473209381104, -2.632960796356201, -2.065474510192871, -1.497987985610962, -0.9305014610290527, -0.36301499605178833, 0.20447146892547607, 0.7719578742980957, 1.3394443988800049, 1.906930923461914, 2.474417209625244, 3.0419037342071533, 3.6093902587890625, 4.176876544952393, 4.744363307952881, 5.311849594116211, 5.879336357116699, 6.446822643280029, 7.014308929443359, 7.581795692443848, 8.149282455444336, 8.716769218444824, 9.284255027770996, 9.851741790771484, 10.419228553771973, 10.986715316772461, 11.554201126098633, 12.121687889099121, 12.689173698425293, 13.256660461425781, 13.824146270751953, 14.391633033752441, 14.95911979675293, 15.526605606079102, 16.094093322753906, 16.661579132080078, 17.22906494140625, 17.796550750732422, 18.364038467407227, 18.9315242767334, 19.49901008605957, 20.066497802734375, 20.633983612060547, 21.20146942138672, 21.768957138061523]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 9.0, 10.0, 15.0, 17.0, 20.0, 17.0, 18.0, 28.0, 31.0, 34.0, 35.0, 46.0, 44.0, 43.0, 37.0, 54.0, 43.0, 36.0, 53.0, 46.0, 55.0, 41.0, 35.0, 31.0, 27.0, 30.0, 28.0, 16.0, 16.0, 21.0, 8.0, 11.0, 6.0, 12.0, 11.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.9669342041015625, -1.908477783203125, -1.8500213623046875, -1.79156494140625, -1.7331085205078125, -1.674652099609375, -1.6161956787109375, -1.5577392578125, -1.4992828369140625, -1.440826416015625, -1.3823699951171875, -1.32391357421875, -1.2654571533203125, -1.207000732421875, -1.1485443115234375, -1.090087890625, -1.0316314697265625, -0.973175048828125, -0.9147186279296875, -0.85626220703125, -0.7978057861328125, -0.739349365234375, -0.6808929443359375, -0.6224365234375, -0.5639801025390625, -0.505523681640625, -0.4470672607421875, -0.38861083984375, -0.3301544189453125, -0.271697998046875, -0.2132415771484375, -0.15478515625, -0.0963287353515625, -0.037872314453125, 0.0205841064453125, 0.07904052734375, 0.1374969482421875, 0.195953369140625, 0.2544097900390625, 0.3128662109375, 0.3713226318359375, 0.429779052734375, 0.4882354736328125, 0.54669189453125, 0.6051483154296875, 0.663604736328125, 0.7220611572265625, 0.780517578125, 0.8389739990234375, 0.897430419921875, 0.9558868408203125, 1.01434326171875, 1.0727996826171875, 1.131256103515625, 1.1897125244140625, 1.2481689453125, 1.3066253662109375, 1.365081787109375, 1.4235382080078125, 1.48199462890625, 1.5404510498046875, 1.598907470703125, 1.6573638916015625, 1.7158203125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 11.0, 11.0, 28.0, 34.0, 56.0, 90.0, 115.0, 201.0, 348.0, 536.0, 900.0, 1461.0, 2539.0, 4078.0, 6768.0, 11405.0, 18632.0, 30199.0, 47440.0, 70757.0, 101073.0, 130409.0, 148042.0, 138443.0, 110928.0, 79534.0, 54336.0, 34463.0, 21649.0, 13507.0, 8132.0, 4902.0, 2983.0, 1813.0, 1062.0, 610.0, 415.0, 237.0, 152.0, 82.0, 52.0, 33.0, 31.0, 19.0, 8.0, 9.0, 4.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.51416015625, -0.4973907470703125, -0.480621337890625, -0.4638519287109375, -0.44708251953125, -0.4303131103515625, -0.413543701171875, -0.3967742919921875, -0.3800048828125, -0.3632354736328125, -0.346466064453125, -0.3296966552734375, -0.31292724609375, -0.2961578369140625, -0.279388427734375, -0.2626190185546875, -0.245849609375, -0.2290802001953125, -0.212310791015625, -0.1955413818359375, -0.17877197265625, -0.1620025634765625, -0.145233154296875, -0.1284637451171875, -0.1116943359375, -0.0949249267578125, -0.078155517578125, -0.0613861083984375, -0.04461669921875, -0.0278472900390625, -0.011077880859375, 0.0056915283203125, 0.0224609375, 0.0392303466796875, 0.055999755859375, 0.0727691650390625, 0.08953857421875, 0.1063079833984375, 0.123077392578125, 0.1398468017578125, 0.1566162109375, 0.1733856201171875, 0.190155029296875, 0.2069244384765625, 0.22369384765625, 0.2404632568359375, 0.257232666015625, 0.2740020751953125, 0.290771484375, 0.3075408935546875, 0.324310302734375, 0.3410797119140625, 0.35784912109375, 0.3746185302734375, 0.391387939453125, 0.4081573486328125, 0.4249267578125, 0.4416961669921875, 0.458465576171875, 0.4752349853515625, 0.49200439453125, 0.5087738037109375, 0.525543212890625, 0.5423126220703125, 0.55908203125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 3.0, 5.0, 13.0, 14.0, 12.0, 11.0, 24.0, 17.0, 26.0, 35.0, 35.0, 35.0, 43.0, 38.0, 35.0, 54.0, 47.0, 1073.0, 45.0, 38.0, 57.0, 42.0, 44.0, 38.0, 38.0, 34.0, 29.0, 29.0, 29.0, 11.0, 14.0, 10.0, 11.0, 8.0, 11.0, 5.0, 2.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4267578125, -1.37860107421875, -1.3304443359375, -1.28228759765625, -1.234130859375, -1.18597412109375, -1.1378173828125, -1.08966064453125, -1.04150390625, -0.99334716796875, -0.9451904296875, -0.89703369140625, -0.848876953125, -0.80072021484375, -0.7525634765625, -0.70440673828125, -0.65625, -0.60809326171875, -0.5599365234375, -0.51177978515625, -0.463623046875, -0.41546630859375, -0.3673095703125, -0.31915283203125, -0.27099609375, -0.22283935546875, -0.1746826171875, -0.12652587890625, -0.078369140625, -0.03021240234375, 0.0179443359375, 0.06610107421875, 0.1142578125, 0.16241455078125, 0.2105712890625, 0.25872802734375, 0.306884765625, 0.35504150390625, 0.4031982421875, 0.45135498046875, 0.49951171875, 0.54766845703125, 0.5958251953125, 0.64398193359375, 0.692138671875, 0.74029541015625, 0.7884521484375, 0.83660888671875, 0.884765625, 0.93292236328125, 0.9810791015625, 1.02923583984375, 1.077392578125, 1.12554931640625, 1.1737060546875, 1.22186279296875, 1.27001953125, 1.31817626953125, 1.3663330078125, 1.41448974609375, 1.462646484375, 1.51080322265625, 1.5589599609375, 1.60711669921875, 1.6552734375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 16.0, 4.0, 13.0, 22.0, 29.0, 28.0, 61.0, 68.0, 92.0, 142.0, 187.0, 255.0, 420.0, 608.0, 909.0, 1256.0, 1941.0, 2785.0, 4129.0, 6215.0, 9403.0, 14044.0, 23695.0, 51002.0, 1878737.0, 40749.0, 21123.0, 12837.0, 8549.0, 5765.0, 3819.0, 2617.0, 1799.0, 1240.0, 771.0, 560.0, 382.0, 275.0, 174.0, 117.0, 89.0, 65.0, 37.0, 35.0, 19.0, 17.0, 7.0, 6.0, 8.0, 10.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.91650390625, -0.888214111328125, -0.85992431640625, -0.831634521484375, -0.8033447265625, -0.775054931640625, -0.74676513671875, -0.718475341796875, -0.690185546875, -0.661895751953125, -0.63360595703125, -0.605316162109375, -0.5770263671875, -0.548736572265625, -0.52044677734375, -0.492156982421875, -0.4638671875, -0.435577392578125, -0.40728759765625, -0.378997802734375, -0.3507080078125, -0.322418212890625, -0.29412841796875, -0.265838623046875, -0.237548828125, -0.209259033203125, -0.18096923828125, -0.152679443359375, -0.1243896484375, -0.096099853515625, -0.06781005859375, -0.039520263671875, -0.01123046875, 0.017059326171875, 0.04534912109375, 0.073638916015625, 0.1019287109375, 0.130218505859375, 0.15850830078125, 0.186798095703125, 0.215087890625, 0.243377685546875, 0.27166748046875, 0.299957275390625, 0.3282470703125, 0.356536865234375, 0.38482666015625, 0.413116455078125, 0.44140625, 0.469696044921875, 0.49798583984375, 0.526275634765625, 0.5545654296875, 0.582855224609375, 0.61114501953125, 0.639434814453125, 0.667724609375, 0.696014404296875, 0.72430419921875, 0.752593994140625, 0.7808837890625, 0.809173583984375, 0.83746337890625, 0.865753173828125, 0.89404296875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 4.0, 3.0, 9.0, 10.0, 11.0, 11.0, 14.0, 18.0, 23.0, 17.0, 20.0, 24.0, 33.0, 32.0, 51.0, 46.0, 43.0, 61.0, 56.0, 39.0, 52.0, 50.0, 47.0, 34.0, 36.0, 33.0, 33.0, 31.0, 20.0, 20.0, 17.0, 18.0, 13.0, 13.0, 12.0, 5.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.02081298828125, -0.020227670669555664, -0.019642353057861328, -0.019057035446166992, -0.018471717834472656, -0.01788640022277832, -0.017301082611083984, -0.01671576499938965, -0.016130447387695312, -0.015545129776000977, -0.01495981216430664, -0.014374494552612305, -0.013789176940917969, -0.013203859329223633, -0.012618541717529297, -0.012033224105834961, -0.011447906494140625, -0.010862588882446289, -0.010277271270751953, -0.009691953659057617, -0.009106636047363281, -0.008521318435668945, -0.00793600082397461, -0.0073506832122802734, -0.0067653656005859375, -0.0061800479888916016, -0.005594730377197266, -0.00500941276550293, -0.004424095153808594, -0.003838777542114258, -0.003253459930419922, -0.002668142318725586, -0.00208282470703125, -0.001497507095336914, -0.0009121894836425781, -0.0003268718719482422, 0.00025844573974609375, 0.0008437633514404297, 0.0014290809631347656, 0.0020143985748291016, 0.0025997161865234375, 0.0031850337982177734, 0.0037703514099121094, 0.004355669021606445, 0.004940986633300781, 0.005526304244995117, 0.006111621856689453, 0.006696939468383789, 0.007282257080078125, 0.007867574691772461, 0.008452892303466797, 0.009038209915161133, 0.009623527526855469, 0.010208845138549805, 0.01079416275024414, 0.011379480361938477, 0.011964797973632812, 0.012550115585327148, 0.013135433197021484, 0.01372075080871582, 0.014306068420410156, 0.014891386032104492, 0.015476703643798828, 0.016062021255493164, 0.0166473388671875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 2.0, 7.0, 8.0, 9.0, 16.0, 26.0, 28.0, 32.0, 60.0, 76.0, 91.0, 142.0, 221.0, 536.0, 1957.0, 35986.0, 905271.0, 99319.0, 3258.0, 710.0, 269.0, 115.0, 112.0, 94.0, 62.0, 42.0, 37.0, 19.0, 18.0, 12.0, 6.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46923828125, -0.453399658203125, -0.43756103515625, -0.421722412109375, -0.4058837890625, -0.390045166015625, -0.37420654296875, -0.358367919921875, -0.342529296875, -0.326690673828125, -0.31085205078125, -0.295013427734375, -0.2791748046875, -0.263336181640625, -0.24749755859375, -0.231658935546875, -0.2158203125, -0.199981689453125, -0.18414306640625, -0.168304443359375, -0.1524658203125, -0.136627197265625, -0.12078857421875, -0.104949951171875, -0.089111328125, -0.073272705078125, -0.05743408203125, -0.041595458984375, -0.0257568359375, -0.009918212890625, 0.00592041015625, 0.021759033203125, 0.03759765625, 0.053436279296875, 0.06927490234375, 0.085113525390625, 0.1009521484375, 0.116790771484375, 0.13262939453125, 0.148468017578125, 0.164306640625, 0.180145263671875, 0.19598388671875, 0.211822509765625, 0.2276611328125, 0.243499755859375, 0.25933837890625, 0.275177001953125, 0.291015625, 0.306854248046875, 0.32269287109375, 0.338531494140625, 0.3543701171875, 0.370208740234375, 0.38604736328125, 0.401885986328125, 0.417724609375, 0.433563232421875, 0.44940185546875, 0.465240478515625, 0.4810791015625, 0.496917724609375, 0.51275634765625, 0.528594970703125, 0.54443359375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 5.0, 11.0, 18.0, 19.0, 46.0, 64.0, 123.0, 200.0, 205.0, 130.0, 60.0, 44.0, 28.0, 21.0, 8.0, 9.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16217677295207977, -0.15677574276924133, -0.1513747125864029, -0.14597368240356445, -0.1405726671218872, -0.13517163693904877, -0.12977060675621033, -0.12436957657337189, -0.11896854639053345, -0.11356751620769501, -0.10816649347543716, -0.10276546329259872, -0.09736443310976028, -0.09196341037750244, -0.086562380194664, -0.08116135001182556, -0.07576032727956772, -0.07035929709672928, -0.06495827436447144, -0.059557244181632996, -0.054156213998794556, -0.048755187541246414, -0.04335416108369827, -0.03795313090085983, -0.03255210444331169, -0.0271510761231184, -0.02175004780292511, -0.01634902134537697, -0.010947993025183678, -0.005546964704990387, -0.00014593824744224548, 0.0052550919353961945, 0.010656118392944336, 0.016057146713137627, 0.021458175033330917, 0.02685920149087906, 0.0322602316737175, 0.03766125813126564, 0.04306228458881378, 0.04846331477165222, 0.05386434122920036, 0.059265367686748505, 0.06466639786958694, 0.07006742060184479, 0.07546845078468323, 0.08086948096752167, 0.08627051115036011, 0.09167154133319855, 0.09707256406545639, 0.10247359424829483, 0.10787461698055267, 0.11327564716339111, 0.11867667734622955, 0.124077707529068, 0.12947872281074524, 0.13487976789474487, 0.14028078317642212, 0.14568181335926056, 0.151082843542099, 0.15648385882377625, 0.16188488900661469, 0.16728591918945312, 0.17268694937229156, 0.17808797955513, 0.18348900973796844]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 11.0, 17.0, 17.0, 16.0, 15.0, 28.0, 27.0, 24.0, 42.0, 48.0, 51.0, 64.0, 48.0, 42.0, 47.0, 53.0, 54.0, 35.0, 64.0, 41.0, 37.0, 37.0, 34.0, 33.0, 22.0, 17.0, 14.0, 17.0, 15.0, 3.0, 7.0, 6.0, 2.0, 6.0, 0.0, 3.0, 1.0], "bins": [-0.03917878866195679, -0.038234733045101166, -0.037290677428245544, -0.03634662553668022, -0.0354025699198246, -0.03445851430296898, -0.033514462411403656, -0.032570406794548035, -0.03162635117769241, -0.030682295560836792, -0.02973824180662632, -0.028794188052415848, -0.027850132435560226, -0.026906076818704605, -0.025962023064494133, -0.02501796931028366, -0.02407391369342804, -0.023129858076572418, -0.022185804322361946, -0.021241750568151474, -0.020297694951295853, -0.01935363933444023, -0.01840958558022976, -0.017465531826019287, -0.016521476209163666, -0.015577421523630619, -0.014633366838097572, -0.013689312152564526, -0.012745257467031479, -0.011801202781498432, -0.010857148095965385, -0.009913093410432339, -0.008969038724899292, -0.008024984039366245, -0.0070809293538331985, -0.006136874668300152, -0.005192819982767105, -0.004248765297234058, -0.0033047106117010117, -0.002360655926167965, -0.0014166012406349182, -0.0004725465551018715, 0.00047150813043117523, 0.001415562815964222, 0.0023596175014972687, 0.0033036721870303154, 0.004247726872563362, 0.005191781558096409, 0.006135836243629456, 0.007079890929162502, 0.008023945614695549, 0.008968000300228596, 0.009912054985761642, 0.01085610967129469, 0.011800164356827736, 0.012744219042360783, 0.01368827372789383, 0.014632328413426876, 0.015576383098959923, 0.016520436853170395, 0.017464492470026016, 0.018408548086881638, 0.01935260184109211, 0.020296655595302582, 0.021240711212158203]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 4.0, 6.0, 13.0, 14.0, 8.0, 21.0, 19.0, 21.0, 21.0, 24.0, 24.0, 29.0, 28.0, 35.0, 36.0, 39.0, 40.0, 30.0, 41.0, 40.0, 37.0, 43.0, 38.0, 33.0, 25.0, 54.0, 40.0, 27.0, 18.0, 26.0, 17.0, 20.0, 22.0, 18.0, 12.0, 14.0, 9.0, 10.0, 12.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.6552734375, -1.6046600341796875, -1.554046630859375, -1.5034332275390625, -1.45281982421875, -1.4022064208984375, -1.351593017578125, -1.3009796142578125, -1.2503662109375, -1.1997528076171875, -1.149139404296875, -1.0985260009765625, -1.04791259765625, -0.9972991943359375, -0.946685791015625, -0.8960723876953125, -0.845458984375, -0.7948455810546875, -0.744232177734375, -0.6936187744140625, -0.64300537109375, -0.5923919677734375, -0.541778564453125, -0.4911651611328125, -0.4405517578125, -0.3899383544921875, -0.339324951171875, -0.2887115478515625, -0.23809814453125, -0.1874847412109375, -0.136871337890625, -0.0862579345703125, -0.03564453125, 0.0149688720703125, 0.065582275390625, 0.1161956787109375, 0.16680908203125, 0.2174224853515625, 0.268035888671875, 0.3186492919921875, 0.3692626953125, 0.4198760986328125, 0.470489501953125, 0.5211029052734375, 0.57171630859375, 0.6223297119140625, 0.672943115234375, 0.7235565185546875, 0.774169921875, 0.8247833251953125, 0.875396728515625, 0.9260101318359375, 0.97662353515625, 1.0272369384765625, 1.077850341796875, 1.1284637451171875, 1.1790771484375, 1.2296905517578125, 1.280303955078125, 1.3309173583984375, 1.38153076171875, 1.4321441650390625, 1.482757568359375, 1.5333709716796875, 1.583984375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 14.0, 25.0, 34.0, 48.0, 75.0, 129.0, 221.0, 296.0, 495.0, 779.0, 1233.0, 2001.0, 3274.0, 5315.0, 8755.0, 15286.0, 27231.0, 49289.0, 89797.0, 158928.0, 231850.0, 193986.0, 114362.0, 62998.0, 34769.0, 19410.0, 11001.0, 6512.0, 3938.0, 2485.0, 1447.0, 967.0, 572.0, 361.0, 257.0, 149.0, 82.0, 70.0, 38.0, 19.0, 17.0, 11.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.01763916015625, -0.9844970703125, -0.95135498046875, -0.918212890625, -0.88507080078125, -0.8519287109375, -0.81878662109375, -0.78564453125, -0.75250244140625, -0.7193603515625, -0.68621826171875, -0.653076171875, -0.61993408203125, -0.5867919921875, -0.55364990234375, -0.5205078125, -0.48736572265625, -0.4542236328125, -0.42108154296875, -0.387939453125, -0.35479736328125, -0.3216552734375, -0.28851318359375, -0.25537109375, -0.22222900390625, -0.1890869140625, -0.15594482421875, -0.122802734375, -0.08966064453125, -0.0565185546875, -0.02337646484375, 0.009765625, 0.04290771484375, 0.0760498046875, 0.10919189453125, 0.142333984375, 0.17547607421875, 0.2086181640625, 0.24176025390625, 0.27490234375, 0.30804443359375, 0.3411865234375, 0.37432861328125, 0.407470703125, 0.44061279296875, 0.4737548828125, 0.50689697265625, 0.5400390625, 0.57318115234375, 0.6063232421875, 0.63946533203125, 0.672607421875, 0.70574951171875, 0.7388916015625, 0.77203369140625, 0.80517578125, 0.83831787109375, 0.8714599609375, 0.90460205078125, 0.937744140625, 0.97088623046875, 1.0040283203125, 1.03717041015625, 1.0703125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 8.0, 3.0, 3.0, 10.0, 11.0, 14.0, 12.0, 14.0, 13.0, 13.0, 23.0, 23.0, 17.0, 28.0, 27.0, 28.0, 31.0, 28.0, 40.0, 49.0, 58.0, 114.0, 319.0, 1468.0, 161.0, 71.0, 52.0, 50.0, 47.0, 26.0, 37.0, 32.0, 28.0, 30.0, 27.0, 15.0, 20.0, 15.0, 13.0, 14.0, 10.0, 8.0, 5.0, 9.0, 4.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-5.70703125, -5.53497314453125, -5.3629150390625, -5.19085693359375, -5.018798828125, -4.84674072265625, -4.6746826171875, -4.50262451171875, -4.33056640625, -4.15850830078125, -3.9864501953125, -3.81439208984375, -3.642333984375, -3.47027587890625, -3.2982177734375, -3.12615966796875, -2.9541015625, -2.78204345703125, -2.6099853515625, -2.43792724609375, -2.265869140625, -2.09381103515625, -1.9217529296875, -1.74969482421875, -1.57763671875, -1.40557861328125, -1.2335205078125, -1.06146240234375, -0.889404296875, -0.71734619140625, -0.5452880859375, -0.37322998046875, -0.201171875, -0.02911376953125, 0.1429443359375, 0.31500244140625, 0.487060546875, 0.65911865234375, 0.8311767578125, 1.00323486328125, 1.17529296875, 1.34735107421875, 1.5194091796875, 1.69146728515625, 1.863525390625, 2.03558349609375, 2.2076416015625, 2.37969970703125, 2.5517578125, 2.72381591796875, 2.8958740234375, 3.06793212890625, 3.239990234375, 3.41204833984375, 3.5841064453125, 3.75616455078125, 3.92822265625, 4.10028076171875, 4.2723388671875, 4.44439697265625, 4.616455078125, 4.78851318359375, 4.9605712890625, 5.13262939453125, 5.3046875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 7.0, 9.0, 5.0, 7.0, 10.0, 11.0, 14.0, 11.0, 14.0, 19.0, 35.0, 32.0, 44.0, 69.0, 75.0, 130.0, 225.0, 369.0, 857.0, 3157.0, 21779.0, 403272.0, 2616002.0, 87898.0, 8529.0, 1622.0, 586.0, 284.0, 187.0, 110.0, 63.0, 41.0, 37.0, 33.0, 26.0, 28.0, 16.0, 15.0, 10.0, 11.0, 15.0, 12.0, 5.0, 5.0, 2.0, 6.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.1484375, -6.919921875, -6.69140625, -6.462890625, -6.234375, -6.005859375, -5.77734375, -5.548828125, -5.3203125, -5.091796875, -4.86328125, -4.634765625, -4.40625, -4.177734375, -3.94921875, -3.720703125, -3.4921875, -3.263671875, -3.03515625, -2.806640625, -2.578125, -2.349609375, -2.12109375, -1.892578125, -1.6640625, -1.435546875, -1.20703125, -0.978515625, -0.75, -0.521484375, -0.29296875, -0.064453125, 0.1640625, 0.392578125, 0.62109375, 0.849609375, 1.078125, 1.306640625, 1.53515625, 1.763671875, 1.9921875, 2.220703125, 2.44921875, 2.677734375, 2.90625, 3.134765625, 3.36328125, 3.591796875, 3.8203125, 4.048828125, 4.27734375, 4.505859375, 4.734375, 4.962890625, 5.19140625, 5.419921875, 5.6484375, 5.876953125, 6.10546875, 6.333984375, 6.5625, 6.791015625, 7.01953125, 7.248046875, 7.4765625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 196.0, 784.0, 38.0, 0.0, 0.0, 1.0], "bins": [-163.405029296875, -160.64833068847656, -157.89161682128906, -155.13491821289062, -152.3782196044922, -149.6215057373047, -146.86480712890625, -144.10809326171875, -141.3513946533203, -138.59469604492188, -135.83798217773438, -133.08128356933594, -130.3245849609375, -127.56787109375, -124.81117248535156, -122.0544662475586, -119.29776000976562, -116.54105377197266, -113.78435516357422, -111.02764892578125, -108.27094268798828, -105.51423645019531, -102.75753784179688, -100.0008316040039, -97.24413299560547, -94.4874267578125, -91.73072814941406, -88.9740219116211, -86.21731567382812, -83.46060943603516, -80.70391082763672, -77.94720458984375, -75.19049072265625, -72.43378448486328, -69.67708587646484, -66.92037963867188, -64.1636734008789, -61.4069709777832, -58.6502685546875, -55.89356231689453, -53.13685989379883, -50.380157470703125, -47.623451232910156, -44.86674880981445, -42.110042572021484, -39.35334014892578, -36.59663391113281, -33.83993148803711, -31.083229064941406, -28.32652473449707, -25.569820404052734, -22.81311798095703, -20.056411743164062, -17.29970932006836, -14.543004989624023, -11.786300659179688, -9.029595375061035, -6.272891044616699, -3.5161871910095215, -0.7594833374023438, 1.9972209930419922, 4.753925323486328, 7.510628700256348, 10.267333030700684, 13.02403736114502]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 11.0, 3.0, 14.0, 13.0, 11.0, 25.0, 16.0, 19.0, 23.0, 28.0, 32.0, 28.0, 35.0, 33.0, 32.0, 33.0, 44.0, 34.0, 41.0, 38.0, 34.0, 42.0, 43.0, 24.0, 35.0, 30.0, 24.0, 29.0, 31.0, 24.0, 24.0, 18.0, 10.0, 17.0, 14.0, 10.0, 6.0, 7.0, 11.0, 4.0, 5.0, 7.0, 5.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-18.224695205688477, -17.638294219970703, -17.05189323425293, -16.465492248535156, -15.879091262817383, -15.29269027709961, -14.706289291381836, -14.119888305664062, -13.533487319946289, -12.947086334228516, -12.360685348510742, -11.774284362792969, -11.187883377075195, -10.601482391357422, -10.015081405639648, -9.428680419921875, -8.842279434204102, -8.255878448486328, -7.669477462768555, -7.083076477050781, -6.496675491333008, -5.910274505615234, -5.323873519897461, -4.7374725341796875, -4.151071548461914, -3.5646705627441406, -2.978269577026367, -2.3918685913085938, -1.8054676055908203, -1.2190666198730469, -0.6326656341552734, -0.0462646484375, 0.5401382446289062, 1.1265392303466797, 1.7129402160644531, 2.2993412017822266, 2.8857421875, 3.4721431732177734, 4.058544158935547, 4.64494514465332, 5.231346130371094, 5.817747116088867, 6.404148101806641, 6.990549087524414, 7.5769500732421875, 8.163351058959961, 8.749752044677734, 9.336153030395508, 9.922554016113281, 10.508955001831055, 11.095355987548828, 11.681756973266602, 12.268157958984375, 12.854558944702148, 13.440959930419922, 14.027360916137695, 14.613761901855469, 15.200162887573242, 15.786563873291016, 16.37296485900879, 16.959365844726562, 17.545766830444336, 18.13216781616211, 18.718568801879883, 19.304969787597656]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 7.0, 8.0, 12.0, 13.0, 17.0, 15.0, 16.0, 24.0, 32.0, 28.0, 29.0, 45.0, 45.0, 43.0, 36.0, 39.0, 46.0, 43.0, 43.0, 54.0, 49.0, 47.0, 43.0, 46.0, 34.0, 27.0, 32.0, 16.0, 24.0, 15.0, 12.0, 12.0, 9.0, 12.0, 8.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.287109375, -2.22467041015625, -2.1622314453125, -2.09979248046875, -2.037353515625, -1.97491455078125, -1.9124755859375, -1.85003662109375, -1.78759765625, -1.72515869140625, -1.6627197265625, -1.60028076171875, -1.537841796875, -1.47540283203125, -1.4129638671875, -1.35052490234375, -1.2880859375, -1.22564697265625, -1.1632080078125, -1.10076904296875, -1.038330078125, -0.97589111328125, -0.9134521484375, -0.85101318359375, -0.78857421875, -0.72613525390625, -0.6636962890625, -0.60125732421875, -0.538818359375, -0.47637939453125, -0.4139404296875, -0.35150146484375, -0.2890625, -0.22662353515625, -0.1641845703125, -0.10174560546875, -0.039306640625, 0.02313232421875, 0.0855712890625, 0.14801025390625, 0.21044921875, 0.27288818359375, 0.3353271484375, 0.39776611328125, 0.460205078125, 0.52264404296875, 0.5850830078125, 0.64752197265625, 0.7099609375, 0.77239990234375, 0.8348388671875, 0.89727783203125, 0.959716796875, 1.02215576171875, 1.0845947265625, 1.14703369140625, 1.20947265625, 1.27191162109375, 1.3343505859375, 1.39678955078125, 1.459228515625, 1.52166748046875, 1.5841064453125, 1.64654541015625, 1.708984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 14.0, 15.0, 12.0, 21.0, 36.0, 35.0, 60.0, 109.0, 147.0, 248.0, 412.0, 832.0, 1930.0, 5979.0, 21957.0, 98762.0, 616951.0, 2503039.0, 786547.0, 121530.0, 25284.0, 6606.0, 2022.0, 762.0, 409.0, 213.0, 96.0, 86.0, 47.0, 38.0, 24.0, 22.0, 14.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.79296875, -5.642730712890625, -5.49249267578125, -5.342254638671875, -5.1920166015625, -5.041778564453125, -4.89154052734375, -4.741302490234375, -4.591064453125, -4.440826416015625, -4.29058837890625, -4.140350341796875, -3.9901123046875, -3.839874267578125, -3.68963623046875, -3.539398193359375, -3.38916015625, -3.238922119140625, -3.08868408203125, -2.938446044921875, -2.7882080078125, -2.637969970703125, -2.48773193359375, -2.337493896484375, -2.187255859375, -2.037017822265625, -1.88677978515625, -1.736541748046875, -1.5863037109375, -1.436065673828125, -1.28582763671875, -1.135589599609375, -0.9853515625, -0.835113525390625, -0.68487548828125, -0.534637451171875, -0.3843994140625, -0.234161376953125, -0.08392333984375, 0.066314697265625, 0.216552734375, 0.366790771484375, 0.51702880859375, 0.667266845703125, 0.8175048828125, 0.967742919921875, 1.11798095703125, 1.268218994140625, 1.41845703125, 1.568695068359375, 1.71893310546875, 1.869171142578125, 2.0194091796875, 2.169647216796875, 2.31988525390625, 2.470123291015625, 2.620361328125, 2.770599365234375, 2.92083740234375, 3.071075439453125, 3.2213134765625, 3.371551513671875, 3.52178955078125, 3.672027587890625, 3.822265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 5.0, 7.0, 10.0, 19.0, 25.0, 32.0, 39.0, 59.0, 70.0, 89.0, 132.0, 163.0, 195.0, 252.0, 338.0, 395.0, 415.0, 387.0, 338.0, 289.0, 182.0, 169.0, 130.0, 79.0, 72.0, 50.0, 36.0, 28.0, 23.0, 9.0, 7.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.87890625, -4.73736572265625, -4.5958251953125, -4.45428466796875, -4.312744140625, -4.17120361328125, -4.0296630859375, -3.88812255859375, -3.74658203125, -3.60504150390625, -3.4635009765625, -3.32196044921875, -3.180419921875, -3.03887939453125, -2.8973388671875, -2.75579833984375, -2.6142578125, -2.47271728515625, -2.3311767578125, -2.18963623046875, -2.048095703125, -1.90655517578125, -1.7650146484375, -1.62347412109375, -1.48193359375, -1.34039306640625, -1.1988525390625, -1.05731201171875, -0.915771484375, -0.77423095703125, -0.6326904296875, -0.49114990234375, -0.349609375, -0.20806884765625, -0.0665283203125, 0.07501220703125, 0.216552734375, 0.35809326171875, 0.4996337890625, 0.64117431640625, 0.78271484375, 0.92425537109375, 1.0657958984375, 1.20733642578125, 1.348876953125, 1.49041748046875, 1.6319580078125, 1.77349853515625, 1.9150390625, 2.05657958984375, 2.1981201171875, 2.33966064453125, 2.481201171875, 2.62274169921875, 2.7642822265625, 2.90582275390625, 3.04736328125, 3.18890380859375, 3.3304443359375, 3.47198486328125, 3.613525390625, 3.75506591796875, 3.8966064453125, 4.03814697265625, 4.1796875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 5.0, 11.0, 22.0, 36.0, 41.0, 63.0, 88.0, 141.0, 282.0, 455.0, 875.0, 1925.0, 4616.0, 12468.0, 38485.0, 131501.0, 471330.0, 1550040.0, 1401491.0, 412268.0, 114934.0, 34286.0, 11153.0, 4142.0, 1721.0, 813.0, 441.0, 227.0, 143.0, 89.0, 59.0, 31.0, 24.0, 21.0, 6.0, 8.0, 9.0, 7.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.9453125, -4.77447509765625, -4.6036376953125, -4.43280029296875, -4.261962890625, -4.09112548828125, -3.9202880859375, -3.74945068359375, -3.57861328125, -3.40777587890625, -3.2369384765625, -3.06610107421875, -2.895263671875, -2.72442626953125, -2.5535888671875, -2.38275146484375, -2.2119140625, -2.04107666015625, -1.8702392578125, -1.69940185546875, -1.528564453125, -1.35772705078125, -1.1868896484375, -1.01605224609375, -0.84521484375, -0.67437744140625, -0.5035400390625, -0.33270263671875, -0.161865234375, 0.00897216796875, 0.1798095703125, 0.35064697265625, 0.521484375, 0.69232177734375, 0.8631591796875, 1.03399658203125, 1.204833984375, 1.37567138671875, 1.5465087890625, 1.71734619140625, 1.88818359375, 2.05902099609375, 2.2298583984375, 2.40069580078125, 2.571533203125, 2.74237060546875, 2.9132080078125, 3.08404541015625, 3.2548828125, 3.42572021484375, 3.5965576171875, 3.76739501953125, 3.938232421875, 4.10906982421875, 4.2799072265625, 4.45074462890625, 4.62158203125, 4.79241943359375, 4.9632568359375, 5.13409423828125, 5.304931640625, 5.47576904296875, 5.6466064453125, 5.81744384765625, 5.98828125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 12.0, 22.0, 53.0, 68.0, 112.0, 158.0, 186.0, 142.0, 106.0, 64.0, 48.0, 23.0, 9.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.400115966796875, -28.201679229736328, -27.003244400024414, -25.804807662963867, -24.60637092590332, -23.407936096191406, -22.20949935913086, -21.011062622070312, -19.812625885009766, -18.61418914794922, -17.415754318237305, -16.217317581176758, -15.018880844116211, -13.82044506072998, -12.62200927734375, -11.423572540283203, -10.225137710571289, -9.026701927185059, -7.828265190124512, -6.629829406738281, -5.431393146514893, -4.232956886291504, -3.0345211029052734, -1.8360843658447266, -0.6376485824584961, 0.560787558555603, 1.7592236995697021, 2.9576597213745117, 4.1560959815979, 5.354532241821289, 6.5529680252075195, 7.751404762268066, 8.949840545654297, 10.148276329040527, 11.346713066101074, 12.545148849487305, 13.743585586547852, 14.942021369934082, 16.140457153320312, 17.33889389038086, 18.537330627441406, 19.735767364501953, 20.934202194213867, 22.132638931274414, 23.33107566833496, 24.529510498046875, 25.727947235107422, 26.92638397216797, 28.124818801879883, 29.32325553894043, 30.521690368652344, 31.72012710571289, 32.91856384277344, 34.117000579833984, 35.31543731689453, 36.51387023925781, 37.71230697631836, 38.910743713378906, 40.10918045043945, 41.3076171875, 42.50605010986328, 43.70448684692383, 44.902923583984375, 46.10136032104492, 47.29979705810547]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 12.0, 9.0, 20.0, 15.0, 18.0, 16.0, 31.0, 39.0, 39.0, 36.0, 37.0, 36.0, 34.0, 46.0, 59.0, 58.0, 55.0, 40.0, 43.0, 46.0, 42.0, 36.0, 39.0, 31.0, 18.0, 17.0, 21.0, 23.0, 13.0, 13.0, 9.0, 13.0, 8.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.001651763916016, -18.42219352722168, -17.84273338317871, -17.263275146484375, -16.683815002441406, -16.10435676574707, -15.524896621704102, -14.945438385009766, -14.365978240966797, -13.786519050598145, -13.207059860229492, -12.62760066986084, -12.048141479492188, -11.468682289123535, -10.889223098754883, -10.309764862060547, -9.730305671691895, -9.150846481323242, -8.57138729095459, -7.9919281005859375, -7.412468910217285, -6.833009719848633, -6.253551006317139, -5.674091815948486, -5.094632625579834, -4.515173435211182, -3.9357142448425293, -3.356255292892456, -2.7767961025238037, -2.1973369121551514, -1.6178779602050781, -1.0384187698364258, -0.45895957946777344, 0.12049955129623413, 0.6999586820602417, 1.2794177532196045, 1.8588769435882568, 2.438336133956909, 3.0177950859069824, 3.5972542762756348, 4.176713466644287, 4.7561726570129395, 5.335631847381592, 5.915090560913086, 6.494549751281738, 7.074008941650391, 7.653468132019043, 8.232927322387695, 8.812386512756348, 9.391845703125, 9.971304893493652, 10.550764083862305, 11.130223274230957, 11.70968246459961, 12.289140701293945, 12.868600845336914, 13.44805908203125, 14.027518272399902, 14.606977462768555, 15.186436653137207, 15.76589584350586, 16.345354080200195, 16.924814224243164, 17.5042724609375, 18.08373260498047]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 8.0, 12.0, 11.0, 15.0, 11.0, 13.0, 15.0, 16.0, 23.0, 32.0, 26.0, 42.0, 29.0, 22.0, 39.0, 48.0, 41.0, 43.0, 42.0, 30.0, 37.0, 38.0, 43.0, 23.0, 33.0, 36.0, 29.0, 25.0, 30.0, 20.0, 27.0, 17.0, 17.0, 12.0, 18.0, 17.0, 7.0, 12.0, 3.0, 6.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.8447265625, -1.7895050048828125, -1.734283447265625, -1.6790618896484375, -1.62384033203125, -1.5686187744140625, -1.513397216796875, -1.4581756591796875, -1.4029541015625, -1.3477325439453125, -1.292510986328125, -1.2372894287109375, -1.18206787109375, -1.1268463134765625, -1.071624755859375, -1.0164031982421875, -0.961181640625, -0.9059600830078125, -0.850738525390625, -0.7955169677734375, -0.74029541015625, -0.6850738525390625, -0.629852294921875, -0.5746307373046875, -0.5194091796875, -0.4641876220703125, -0.408966064453125, -0.3537445068359375, -0.29852294921875, -0.2433013916015625, -0.188079833984375, -0.1328582763671875, -0.07763671875, -0.0224151611328125, 0.032806396484375, 0.0880279541015625, 0.14324951171875, 0.1984710693359375, 0.253692626953125, 0.3089141845703125, 0.3641357421875, 0.4193572998046875, 0.474578857421875, 0.5298004150390625, 0.58502197265625, 0.6402435302734375, 0.695465087890625, 0.7506866455078125, 0.805908203125, 0.8611297607421875, 0.916351318359375, 0.9715728759765625, 1.02679443359375, 1.0820159912109375, 1.137237548828125, 1.1924591064453125, 1.2476806640625, 1.3029022216796875, 1.358123779296875, 1.4133453369140625, 1.46856689453125, 1.5237884521484375, 1.579010009765625, 1.6342315673828125, 1.689453125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 9.0, 4.0, 15.0, 22.0, 18.0, 37.0, 54.0, 72.0, 152.0, 199.0, 302.0, 385.0, 672.0, 1033.0, 1682.0, 2776.0, 4144.0, 6784.0, 10553.0, 16527.0, 24821.0, 37520.0, 54289.0, 75006.0, 97213.0, 116257.0, 125884.0, 118579.0, 100806.0, 78719.0, 57627.0, 40247.0, 26898.0, 17747.0, 11404.0, 7217.0, 4705.0, 2983.0, 1806.0, 1169.0, 755.0, 504.0, 338.0, 210.0, 137.0, 90.0, 56.0, 44.0, 30.0, 21.0, 11.0, 12.0, 7.0, 3.0, 4.0, 2.0], "bins": [-0.5966796875, -0.5794296264648438, -0.5621795654296875, -0.5449295043945312, -0.527679443359375, -0.5104293823242188, -0.4931793212890625, -0.47592926025390625, -0.45867919921875, -0.44142913818359375, -0.4241790771484375, -0.40692901611328125, -0.389678955078125, -0.37242889404296875, -0.3551788330078125, -0.33792877197265625, -0.3206787109375, -0.30342864990234375, -0.2861785888671875, -0.26892852783203125, -0.251678466796875, -0.23442840576171875, -0.2171783447265625, -0.19992828369140625, -0.18267822265625, -0.16542816162109375, -0.1481781005859375, -0.13092803955078125, -0.113677978515625, -0.09642791748046875, -0.0791778564453125, -0.06192779541015625, -0.044677734375, -0.02742767333984375, -0.0101776123046875, 0.00707244873046875, 0.024322509765625, 0.04157257080078125, 0.0588226318359375, 0.07607269287109375, 0.09332275390625, 0.11057281494140625, 0.1278228759765625, 0.14507293701171875, 0.162322998046875, 0.17957305908203125, 0.1968231201171875, 0.21407318115234375, 0.2313232421875, 0.24857330322265625, 0.2658233642578125, 0.28307342529296875, 0.300323486328125, 0.31757354736328125, 0.3348236083984375, 0.35207366943359375, 0.36932373046875, 0.38657379150390625, 0.4038238525390625, 0.42107391357421875, 0.438323974609375, 0.45557403564453125, 0.4728240966796875, 0.49007415771484375, 0.50732421875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 7.0, 4.0, 8.0, 9.0, 12.0, 10.0, 13.0, 23.0, 23.0, 19.0, 15.0, 31.0, 21.0, 38.0, 35.0, 36.0, 22.0, 47.0, 56.0, 35.0, 1061.0, 42.0, 58.0, 38.0, 32.0, 31.0, 35.0, 33.0, 30.0, 42.0, 23.0, 24.0, 15.0, 16.0, 19.0, 11.0, 10.0, 7.0, 12.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.41015625, -1.3653106689453125, -1.320465087890625, -1.2756195068359375, -1.23077392578125, -1.1859283447265625, -1.141082763671875, -1.0962371826171875, -1.0513916015625, -1.0065460205078125, -0.961700439453125, -0.9168548583984375, -0.87200927734375, -0.8271636962890625, -0.782318115234375, -0.7374725341796875, -0.692626953125, -0.6477813720703125, -0.602935791015625, -0.5580902099609375, -0.51324462890625, -0.4683990478515625, -0.423553466796875, -0.3787078857421875, -0.3338623046875, -0.2890167236328125, -0.244171142578125, -0.1993255615234375, -0.15447998046875, -0.1096343994140625, -0.064788818359375, -0.0199432373046875, 0.02490234375, 0.0697479248046875, 0.114593505859375, 0.1594390869140625, 0.20428466796875, 0.2491302490234375, 0.293975830078125, 0.3388214111328125, 0.3836669921875, 0.4285125732421875, 0.473358154296875, 0.5182037353515625, 0.56304931640625, 0.6078948974609375, 0.652740478515625, 0.6975860595703125, 0.742431640625, 0.7872772216796875, 0.832122802734375, 0.8769683837890625, 0.92181396484375, 0.9666595458984375, 1.011505126953125, 1.0563507080078125, 1.1011962890625, 1.1460418701171875, 1.190887451171875, 1.2357330322265625, 1.28057861328125, 1.3254241943359375, 1.370269775390625, 1.4151153564453125, 1.4599609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 9.0, 14.0, 14.0, 29.0, 45.0, 78.0, 111.0, 172.0, 228.0, 425.0, 620.0, 889.0, 1419.0, 2354.0, 3647.0, 5623.0, 8837.0, 14125.0, 24250.0, 55732.0, 1887877.0, 38021.0, 19777.0, 12014.0, 7526.0, 4767.0, 3043.0, 1953.0, 1281.0, 766.0, 511.0, 343.0, 219.0, 132.0, 87.0, 70.0, 41.0, 21.0, 17.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.074371337890625, -1.03643798828125, -0.998504638671875, -0.9605712890625, -0.922637939453125, -0.88470458984375, -0.846771240234375, -0.808837890625, -0.770904541015625, -0.73297119140625, -0.695037841796875, -0.6571044921875, -0.619171142578125, -0.58123779296875, -0.543304443359375, -0.50537109375, -0.467437744140625, -0.42950439453125, -0.391571044921875, -0.3536376953125, -0.315704345703125, -0.27777099609375, -0.239837646484375, -0.201904296875, -0.163970947265625, -0.12603759765625, -0.088104248046875, -0.0501708984375, -0.012237548828125, 0.02569580078125, 0.063629150390625, 0.1015625, 0.139495849609375, 0.17742919921875, 0.215362548828125, 0.2532958984375, 0.291229248046875, 0.32916259765625, 0.367095947265625, 0.405029296875, 0.442962646484375, 0.48089599609375, 0.518829345703125, 0.5567626953125, 0.594696044921875, 0.63262939453125, 0.670562744140625, 0.70849609375, 0.746429443359375, 0.78436279296875, 0.822296142578125, 0.8602294921875, 0.898162841796875, 0.93609619140625, 0.974029541015625, 1.011962890625, 1.049896240234375, 1.08782958984375, 1.125762939453125, 1.1636962890625, 1.201629638671875, 1.23956298828125, 1.277496337890625, 1.3154296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 9.0, 13.0, 7.0, 14.0, 20.0, 35.0, 37.0, 65.0, 67.0, 73.0, 81.0, 73.0, 73.0, 77.0, 78.0, 48.0, 53.0, 50.0, 29.0, 16.0, 15.0, 9.0, 6.0, 9.0, 8.0, 3.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02264404296875, -0.021770954132080078, -0.020897865295410156, -0.020024776458740234, -0.019151687622070312, -0.01827859878540039, -0.01740550994873047, -0.016532421112060547, -0.015659332275390625, -0.014786243438720703, -0.013913154602050781, -0.01304006576538086, -0.012166976928710938, -0.011293888092041016, -0.010420799255371094, -0.009547710418701172, -0.00867462158203125, -0.007801532745361328, -0.006928443908691406, -0.006055355072021484, -0.0051822662353515625, -0.004309177398681641, -0.0034360885620117188, -0.002562999725341797, -0.001689910888671875, -0.0008168220520019531, 5.626678466796875e-05, 0.0009293556213378906, 0.0018024444580078125, 0.0026755332946777344, 0.0035486221313476562, 0.004421710968017578, 0.0052947998046875, 0.006167888641357422, 0.007040977478027344, 0.007914066314697266, 0.008787155151367188, 0.00966024398803711, 0.010533332824707031, 0.011406421661376953, 0.012279510498046875, 0.013152599334716797, 0.014025688171386719, 0.01489877700805664, 0.015771865844726562, 0.016644954681396484, 0.017518043518066406, 0.018391132354736328, 0.01926422119140625, 0.020137310028076172, 0.021010398864746094, 0.021883487701416016, 0.022756576538085938, 0.02362966537475586, 0.02450275421142578, 0.025375843048095703, 0.026248931884765625, 0.027122020721435547, 0.02799510955810547, 0.02886819839477539, 0.029741287231445312, 0.030614376068115234, 0.031487464904785156, 0.03236055374145508, 0.033233642578125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 10.0, 8.0, 5.0, 17.0, 23.0, 26.0, 43.0, 85.0, 124.0, 195.0, 352.0, 984.0, 25929.0, 929553.0, 88437.0, 1659.0, 446.0, 242.0, 132.0, 89.0, 54.0, 36.0, 25.0, 19.0, 11.0, 12.0, 7.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.6044921875, -0.5884284973144531, -0.5723648071289062, -0.5563011169433594, -0.5402374267578125, -0.5241737365722656, -0.5081100463867188, -0.4920463562011719, -0.475982666015625, -0.4599189758300781, -0.44385528564453125, -0.4277915954589844, -0.4117279052734375, -0.3956642150878906, -0.37960052490234375, -0.3635368347167969, -0.34747314453125, -0.3314094543457031, -0.31534576416015625, -0.2992820739746094, -0.2832183837890625, -0.2671546936035156, -0.25109100341796875, -0.23502731323242188, -0.218963623046875, -0.20289993286132812, -0.18683624267578125, -0.17077255249023438, -0.1547088623046875, -0.13864517211914062, -0.12258148193359375, -0.10651779174804688, -0.0904541015625, -0.07439041137695312, -0.05832672119140625, -0.042263031005859375, -0.0261993408203125, -0.010135650634765625, 0.00592803955078125, 0.021991729736328125, 0.038055419921875, 0.054119110107421875, 0.07018280029296875, 0.08624649047851562, 0.1023101806640625, 0.11837387084960938, 0.13443756103515625, 0.15050125122070312, 0.16656494140625, 0.18262863159179688, 0.19869232177734375, 0.21475601196289062, 0.2308197021484375, 0.24688339233398438, 0.26294708251953125, 0.2790107727050781, 0.295074462890625, 0.3111381530761719, 0.32720184326171875, 0.3432655334472656, 0.3593292236328125, 0.3753929138183594, 0.39145660400390625, 0.4075202941894531, 0.423583984375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 1.0, 4.0, 8.0, 9.0, 10.0, 27.0, 56.0, 94.0, 161.0, 240.0, 177.0, 85.0, 54.0, 22.0, 24.0, 12.0, 6.0, 5.0, 0.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31456997990608215, -0.3080880343914032, -0.30160608887672424, -0.2951241433620453, -0.28864219784736633, -0.2821602523326874, -0.2756783068180084, -0.26919636130332947, -0.2627144157886505, -0.25623247027397156, -0.2497505247592926, -0.24326857924461365, -0.2367866337299347, -0.23030468821525574, -0.22382274270057678, -0.21734079718589783, -0.21085883677005768, -0.20437689125537872, -0.19789494574069977, -0.1914130002260208, -0.18493105471134186, -0.1784491091966629, -0.17196714878082275, -0.1654852032661438, -0.15900325775146484, -0.1525213122367859, -0.14603936672210693, -0.13955742120742798, -0.13307547569274902, -0.12659353017807007, -0.12011157721281052, -0.11362963169813156, -0.1071477085351944, -0.10066576302051544, -0.09418381750583649, -0.08770187199115753, -0.08121992647647858, -0.07473798096179962, -0.06825602799654007, -0.061774082481861115, -0.05529213696718216, -0.048810191452503204, -0.04232824593782425, -0.035846296697854996, -0.02936435118317604, -0.022882405668497086, -0.016400456428527832, -0.009918510913848877, -0.003436565399169922, 0.003045381046831608, 0.009527327492833138, 0.016009274870157242, 0.022491220384836197, 0.028973165899515152, 0.035455115139484406, 0.04193706065416336, 0.048419006168842316, 0.05490095168352127, 0.061382897198200226, 0.06786485016345978, 0.07434679567813873, 0.08082874119281769, 0.08731068670749664, 0.0937926322221756, 0.10027457773685455]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 5.0, 5.0, 6.0, 6.0, 13.0, 8.0, 9.0, 12.0, 23.0, 23.0, 20.0, 18.0, 30.0, 33.0, 41.0, 35.0, 39.0, 45.0, 41.0, 44.0, 41.0, 37.0, 39.0, 44.0, 55.0, 44.0, 45.0, 48.0, 29.0, 34.0, 23.0, 24.0, 18.0, 16.0, 9.0, 13.0, 7.0, 9.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.039283037185668945, -0.038230814039707184, -0.037178587168455124, -0.036126360297203064, -0.0350741371512413, -0.03402191400527954, -0.03296968713402748, -0.03191746026277542, -0.03086523711681366, -0.02981301210820675, -0.028760787099599838, -0.027708562090992928, -0.026656337082386017, -0.025604112073779106, -0.024551887065172195, -0.023499662056565285, -0.022447437047958374, -0.021395212039351463, -0.020342987030744553, -0.019290762022137642, -0.01823853701353073, -0.01718631200492382, -0.01613408699631691, -0.015081861987709999, -0.014029636979103088, -0.012977411970496178, -0.011925186961889267, -0.010872961953282356, -0.009820736944675446, -0.008768511936068535, -0.007716286927461624, -0.0066640619188547134, -0.005611836910247803, -0.004559611901640892, -0.0035073868930339813, -0.0024551618844270706, -0.00140293687582016, -0.0003507118672132492, 0.0007015131413936615, 0.0017537381500005722, 0.002805963158607483, 0.0038581881672143936, 0.004910413175821304, 0.005962638184428215, 0.007014863193035126, 0.008067088201642036, 0.009119313210248947, 0.010171538218855858, 0.011223763227462769, 0.01227598823606968, 0.01332821324467659, 0.0143804382532835, 0.015432663261890411, 0.016484888270497322, 0.017537113279104233, 0.018589338287711143, 0.019641563296318054, 0.020693788304924965, 0.021746013313531876, 0.022798238322138786, 0.023850463330745697, 0.024902688339352608, 0.02595491334795952, 0.02700713835656643, 0.02805936336517334]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 5.0, 13.0, 11.0, 16.0, 14.0, 9.0, 19.0, 24.0, 24.0, 27.0, 28.0, 35.0, 28.0, 25.0, 46.0, 35.0, 38.0, 39.0, 49.0, 41.0, 40.0, 41.0, 40.0, 34.0, 43.0, 34.0, 28.0, 24.0, 27.0, 27.0, 20.0, 16.0, 18.0, 15.0, 15.0, 8.0, 9.0, 7.0, 7.0, 7.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.810546875, -1.7525634765625, -1.694580078125, -1.6365966796875, -1.57861328125, -1.5206298828125, -1.462646484375, -1.4046630859375, -1.3466796875, -1.2886962890625, -1.230712890625, -1.1727294921875, -1.11474609375, -1.0567626953125, -0.998779296875, -0.9407958984375, -0.8828125, -0.8248291015625, -0.766845703125, -0.7088623046875, -0.65087890625, -0.5928955078125, -0.534912109375, -0.4769287109375, -0.4189453125, -0.3609619140625, -0.302978515625, -0.2449951171875, -0.18701171875, -0.1290283203125, -0.071044921875, -0.0130615234375, 0.044921875, 0.1029052734375, 0.160888671875, 0.2188720703125, 0.27685546875, 0.3348388671875, 0.392822265625, 0.4508056640625, 0.5087890625, 0.5667724609375, 0.624755859375, 0.6827392578125, 0.74072265625, 0.7987060546875, 0.856689453125, 0.9146728515625, 0.97265625, 1.0306396484375, 1.088623046875, 1.1466064453125, 1.20458984375, 1.2625732421875, 1.320556640625, 1.3785400390625, 1.4365234375, 1.4945068359375, 1.552490234375, 1.6104736328125, 1.66845703125, 1.7264404296875, 1.784423828125, 1.8424072265625, 1.900390625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 13.0, 13.0, 27.0, 56.0, 63.0, 121.0, 191.0, 294.0, 505.0, 816.0, 1377.0, 2289.0, 3751.0, 6367.0, 10863.0, 18403.0, 31695.0, 57227.0, 107735.0, 207046.0, 259333.0, 155858.0, 80278.0, 43902.0, 24583.0, 14508.0, 8546.0, 5001.0, 3008.0, 1840.0, 1096.0, 666.0, 440.0, 238.0, 152.0, 105.0, 68.0, 26.0, 18.0, 5.0, 11.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.5302734375, -1.4868927001953125, -1.443511962890625, -1.4001312255859375, -1.35675048828125, -1.3133697509765625, -1.269989013671875, -1.2266082763671875, -1.1832275390625, -1.1398468017578125, -1.096466064453125, -1.0530853271484375, -1.00970458984375, -0.9663238525390625, -0.922943115234375, -0.8795623779296875, -0.836181640625, -0.7928009033203125, -0.749420166015625, -0.7060394287109375, -0.66265869140625, -0.6192779541015625, -0.575897216796875, -0.5325164794921875, -0.4891357421875, -0.4457550048828125, -0.402374267578125, -0.3589935302734375, -0.31561279296875, -0.2722320556640625, -0.228851318359375, -0.1854705810546875, -0.14208984375, -0.0987091064453125, -0.055328369140625, -0.0119476318359375, 0.03143310546875, 0.0748138427734375, 0.118194580078125, 0.1615753173828125, 0.2049560546875, 0.2483367919921875, 0.291717529296875, 0.3350982666015625, 0.37847900390625, 0.4218597412109375, 0.465240478515625, 0.5086212158203125, 0.552001953125, 0.5953826904296875, 0.638763427734375, 0.6821441650390625, 0.72552490234375, 0.7689056396484375, 0.812286376953125, 0.8556671142578125, 0.8990478515625, 0.9424285888671875, 0.985809326171875, 1.0291900634765625, 1.07257080078125, 1.1159515380859375, 1.159332275390625, 1.2027130126953125, 1.24609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 10.0, 5.0, 8.0, 11.0, 19.0, 19.0, 23.0, 24.0, 31.0, 37.0, 47.0, 46.0, 64.0, 88.0, 207.0, 1521.0, 349.0, 118.0, 71.0, 51.0, 53.0, 45.0, 39.0, 26.0, 24.0, 27.0, 22.0, 15.0, 11.0, 11.0, 12.0, 3.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.1953125, -10.9139404296875, -10.632568359375, -10.3511962890625, -10.06982421875, -9.7884521484375, -9.507080078125, -9.2257080078125, -8.9443359375, -8.6629638671875, -8.381591796875, -8.1002197265625, -7.81884765625, -7.5374755859375, -7.256103515625, -6.9747314453125, -6.693359375, -6.4119873046875, -6.130615234375, -5.8492431640625, -5.56787109375, -5.2864990234375, -5.005126953125, -4.7237548828125, -4.4423828125, -4.1610107421875, -3.879638671875, -3.5982666015625, -3.31689453125, -3.0355224609375, -2.754150390625, -2.4727783203125, -2.19140625, -1.9100341796875, -1.628662109375, -1.3472900390625, -1.06591796875, -0.7845458984375, -0.503173828125, -0.2218017578125, 0.0595703125, 0.3409423828125, 0.622314453125, 0.9036865234375, 1.18505859375, 1.4664306640625, 1.747802734375, 2.0291748046875, 2.310546875, 2.5919189453125, 2.873291015625, 3.1546630859375, 3.43603515625, 3.7174072265625, 3.998779296875, 4.2801513671875, 4.5615234375, 4.8428955078125, 5.124267578125, 5.4056396484375, 5.68701171875, 5.9683837890625, 6.249755859375, 6.5311279296875, 6.8125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 9.0, 10.0, 8.0, 12.0, 21.0, 23.0, 21.0, 33.0, 51.0, 70.0, 104.0, 158.0, 338.0, 971.0, 6204.0, 197205.0, 2869962.0, 65680.0, 3465.0, 631.0, 259.0, 147.0, 91.0, 54.0, 30.0, 37.0, 27.0, 28.0, 15.0, 9.0, 7.0, 10.0, 2.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.712158203125, -8.32275390625, -7.933349609375, -7.5439453125, -7.154541015625, -6.76513671875, -6.375732421875, -5.986328125, -5.596923828125, -5.20751953125, -4.818115234375, -4.4287109375, -4.039306640625, -3.64990234375, -3.260498046875, -2.87109375, -2.481689453125, -2.09228515625, -1.702880859375, -1.3134765625, -0.924072265625, -0.53466796875, -0.145263671875, 0.244140625, 0.633544921875, 1.02294921875, 1.412353515625, 1.8017578125, 2.191162109375, 2.58056640625, 2.969970703125, 3.359375, 3.748779296875, 4.13818359375, 4.527587890625, 4.9169921875, 5.306396484375, 5.69580078125, 6.085205078125, 6.474609375, 6.864013671875, 7.25341796875, 7.642822265625, 8.0322265625, 8.421630859375, 8.81103515625, 9.200439453125, 9.58984375, 9.979248046875, 10.36865234375, 10.758056640625, 11.1474609375, 11.536865234375, 11.92626953125, 12.315673828125, 12.705078125, 13.094482421875, 13.48388671875, 13.873291015625, 14.2626953125, 14.652099609375, 15.04150390625, 15.430908203125, 15.8203125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [7.0, 74.0, 326.0, 447.0, 152.0, 11.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265303611755371, -3.6457877159118652, -2.0262715816497803, -0.4067554473876953, 1.2127604484558105, 2.8322763442993164, 4.4517927169799805, 6.071308135986328, 7.690824508666992, 9.310340881347656, 10.929856300354004, 12.549372673034668, 14.168888092041016, 15.78840446472168, 17.407920837402344, 19.027435302734375, 20.646953582763672, 22.266469955444336, 23.885986328125, 25.50550079345703, 27.125017166137695, 28.74453353881836, 30.364049911499023, 31.983566284179688, 33.60308074951172, 35.22259521484375, 36.84211349487305, 38.46162796020508, 40.081146240234375, 41.700660705566406, 43.32017517089844, 44.939693450927734, 46.559207916259766, 48.1787223815918, 49.798240661621094, 51.417755126953125, 53.03727340698242, 54.65678787231445, 56.27630615234375, 57.89582061767578, 59.51533508300781, 61.134849548339844, 62.75436782836914, 64.37388610839844, 65.99340057373047, 67.6129150390625, 69.23242950439453, 70.85194396972656, 72.47146606445312, 74.09098052978516, 75.71049499511719, 77.33001708984375, 78.94953155517578, 80.56904602050781, 82.18856048583984, 83.80807495117188, 85.4275894165039, 87.04710388183594, 88.66661834716797, 90.28614044189453, 91.90565490722656, 93.5251693725586, 95.14468383789062, 96.76419830322266, 98.38372039794922]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 6.0, 4.0, 14.0, 7.0, 8.0, 11.0, 17.0, 12.0, 11.0, 18.0, 21.0, 25.0, 22.0, 25.0, 25.0, 34.0, 34.0, 33.0, 34.0, 48.0, 36.0, 41.0, 38.0, 52.0, 36.0, 32.0, 30.0, 29.0, 39.0, 31.0, 29.0, 25.0, 28.0, 18.0, 12.0, 23.0, 14.0, 9.0, 10.0, 11.0, 12.0, 6.0, 5.0, 7.0, 6.0, 3.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.150758743286133, -18.50597381591797, -17.861186981201172, -17.216400146484375, -16.57161521911621, -15.92682933807373, -15.28204345703125, -14.63725757598877, -13.992471694946289, -13.347685813903809, -12.702899932861328, -12.058114051818848, -11.413328170776367, -10.768542289733887, -10.123756408691406, -9.478970527648926, -8.834184646606445, -8.189398765563965, -7.544612884521484, -6.899827003479004, -6.255041122436523, -5.610255241394043, -4.9654693603515625, -4.320683479309082, -3.6758975982666016, -3.031111717224121, -2.3863258361816406, -1.7415399551391602, -1.0967540740966797, -0.4519681930541992, 0.19281768798828125, 0.8376035690307617, 1.4823875427246094, 2.12717342376709, 2.7719593048095703, 3.416745185852051, 4.061531066894531, 4.706316947937012, 5.351102828979492, 5.995888710021973, 6.640674591064453, 7.285460472106934, 7.930246353149414, 8.575032234191895, 9.219818115234375, 9.864603996276855, 10.509389877319336, 11.154175758361816, 11.798961639404297, 12.443747520446777, 13.088533401489258, 13.733319282531738, 14.378105163574219, 15.0228910446167, 15.66767692565918, 16.312461853027344, 16.95724868774414, 17.602035522460938, 18.2468204498291, 18.891605377197266, 19.536392211914062, 20.18117904663086, 20.825963973999023, 21.470748901367188, 22.115535736083984]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 6.0, 4.0, 18.0, 14.0, 14.0, 12.0, 26.0, 19.0, 27.0, 23.0, 33.0, 29.0, 29.0, 28.0, 36.0, 46.0, 39.0, 46.0, 38.0, 54.0, 43.0, 36.0, 32.0, 28.0, 34.0, 33.0, 28.0, 27.0, 25.0, 24.0, 16.0, 23.0, 12.0, 19.0, 17.0, 13.0, 7.0, 7.0, 8.0, 9.0, 1.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9326171875, -1.8726043701171875, -1.812591552734375, -1.7525787353515625, -1.69256591796875, -1.6325531005859375, -1.572540283203125, -1.5125274658203125, -1.4525146484375, -1.3925018310546875, -1.332489013671875, -1.2724761962890625, -1.21246337890625, -1.1524505615234375, -1.092437744140625, -1.0324249267578125, -0.972412109375, -0.9123992919921875, -0.852386474609375, -0.7923736572265625, -0.73236083984375, -0.6723480224609375, -0.612335205078125, -0.5523223876953125, -0.4923095703125, -0.4322967529296875, -0.372283935546875, -0.3122711181640625, -0.25225830078125, -0.1922454833984375, -0.132232666015625, -0.0722198486328125, -0.01220703125, 0.0478057861328125, 0.107818603515625, 0.1678314208984375, 0.22784423828125, 0.2878570556640625, 0.347869873046875, 0.4078826904296875, 0.4678955078125, 0.5279083251953125, 0.587921142578125, 0.6479339599609375, 0.70794677734375, 0.7679595947265625, 0.827972412109375, 0.8879852294921875, 0.947998046875, 1.0080108642578125, 1.068023681640625, 1.1280364990234375, 1.18804931640625, 1.2480621337890625, 1.308074951171875, 1.3680877685546875, 1.4281005859375, 1.4881134033203125, 1.548126220703125, 1.6081390380859375, 1.66815185546875, 1.7281646728515625, 1.788177490234375, 1.8481903076171875, 1.908203125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 8.0, 11.0, 12.0, 17.0, 27.0, 40.0, 57.0, 102.0, 150.0, 298.0, 568.0, 1336.0, 3500.0, 11193.0, 41628.0, 195256.0, 1139408.0, 2180451.0, 497951.0, 91327.0, 21573.0, 5898.0, 1920.0, 702.0, 342.0, 148.0, 107.0, 65.0, 45.0, 31.0, 25.0, 21.0, 15.0, 12.0, 5.0, 5.0, 10.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.833984375, -3.688018798828125, -3.54205322265625, -3.396087646484375, -3.2501220703125, -3.104156494140625, -2.95819091796875, -2.812225341796875, -2.666259765625, -2.520294189453125, -2.37432861328125, -2.228363037109375, -2.0823974609375, -1.936431884765625, -1.79046630859375, -1.644500732421875, -1.49853515625, -1.352569580078125, -1.20660400390625, -1.060638427734375, -0.9146728515625, -0.768707275390625, -0.62274169921875, -0.476776123046875, -0.330810546875, -0.184844970703125, -0.03887939453125, 0.107086181640625, 0.2530517578125, 0.399017333984375, 0.54498291015625, 0.690948486328125, 0.8369140625, 0.982879638671875, 1.12884521484375, 1.274810791015625, 1.4207763671875, 1.566741943359375, 1.71270751953125, 1.858673095703125, 2.004638671875, 2.150604248046875, 2.29656982421875, 2.442535400390625, 2.5885009765625, 2.734466552734375, 2.88043212890625, 3.026397705078125, 3.17236328125, 3.318328857421875, 3.46429443359375, 3.610260009765625, 3.7562255859375, 3.902191162109375, 4.04815673828125, 4.194122314453125, 4.340087890625, 4.486053466796875, 4.63201904296875, 4.777984619140625, 4.9239501953125, 5.069915771484375, 5.21588134765625, 5.361846923828125, 5.5078125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 6.0, 10.0, 11.0, 14.0, 17.0, 26.0, 40.0, 44.0, 47.0, 66.0, 85.0, 135.0, 163.0, 204.0, 289.0, 320.0, 341.0, 385.0, 361.0, 292.0, 270.0, 222.0, 143.0, 140.0, 105.0, 78.0, 63.0, 50.0, 38.0, 24.0, 11.0, 10.0, 15.0, 7.0, 10.0, 5.0, 7.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-4.9609375, -4.82501220703125, -4.6890869140625, -4.55316162109375, -4.417236328125, -4.28131103515625, -4.1453857421875, -4.00946044921875, -3.87353515625, -3.73760986328125, -3.6016845703125, -3.46575927734375, -3.329833984375, -3.19390869140625, -3.0579833984375, -2.92205810546875, -2.7861328125, -2.65020751953125, -2.5142822265625, -2.37835693359375, -2.242431640625, -2.10650634765625, -1.9705810546875, -1.83465576171875, -1.69873046875, -1.56280517578125, -1.4268798828125, -1.29095458984375, -1.155029296875, -1.01910400390625, -0.8831787109375, -0.74725341796875, -0.611328125, -0.47540283203125, -0.3394775390625, -0.20355224609375, -0.067626953125, 0.06829833984375, 0.2042236328125, 0.34014892578125, 0.47607421875, 0.61199951171875, 0.7479248046875, 0.88385009765625, 1.019775390625, 1.15570068359375, 1.2916259765625, 1.42755126953125, 1.5634765625, 1.69940185546875, 1.8353271484375, 1.97125244140625, 2.107177734375, 2.24310302734375, 2.3790283203125, 2.51495361328125, 2.65087890625, 2.78680419921875, 2.9227294921875, 3.05865478515625, 3.194580078125, 3.33050537109375, 3.4664306640625, 3.60235595703125, 3.73828125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [4.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 10.0, 13.0, 14.0, 20.0, 24.0, 27.0, 40.0, 78.0, 112.0, 179.0, 289.0, 458.0, 861.0, 1633.0, 4089.0, 10779.0, 34657.0, 119173.0, 437534.0, 1460900.0, 1493204.0, 452605.0, 122990.0, 35565.0, 11014.0, 4083.0, 1759.0, 834.0, 471.0, 264.0, 186.0, 129.0, 89.0, 61.0, 34.0, 24.0, 22.0, 19.0, 6.0, 7.0, 8.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.53277587890625, -4.3585205078125, -4.18426513671875, -4.010009765625, -3.83575439453125, -3.6614990234375, -3.48724365234375, -3.31298828125, -3.13873291015625, -2.9644775390625, -2.79022216796875, -2.615966796875, -2.44171142578125, -2.2674560546875, -2.09320068359375, -1.9189453125, -1.74468994140625, -1.5704345703125, -1.39617919921875, -1.221923828125, -1.04766845703125, -0.8734130859375, -0.69915771484375, -0.52490234375, -0.35064697265625, -0.1763916015625, -0.00213623046875, 0.172119140625, 0.34637451171875, 0.5206298828125, 0.69488525390625, 0.869140625, 1.04339599609375, 1.2176513671875, 1.39190673828125, 1.566162109375, 1.74041748046875, 1.9146728515625, 2.08892822265625, 2.26318359375, 2.43743896484375, 2.6116943359375, 2.78594970703125, 2.960205078125, 3.13446044921875, 3.3087158203125, 3.48297119140625, 3.6572265625, 3.83148193359375, 4.0057373046875, 4.17999267578125, 4.354248046875, 4.52850341796875, 4.7027587890625, 4.87701416015625, 5.05126953125, 5.22552490234375, 5.3997802734375, 5.57403564453125, 5.748291015625, 5.92254638671875, 6.0968017578125, 6.27105712890625, 6.4453125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 7.0, 12.0, 43.0, 66.0, 95.0, 128.0, 139.0, 150.0, 118.0, 101.0, 66.0, 40.0, 20.0, 11.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.083553314208984, -36.93230438232422, -35.78105545043945, -34.62980651855469, -33.47856140136719, -32.32731246948242, -31.176063537597656, -30.02481460571289, -28.873565673828125, -27.72231674194336, -26.571067810058594, -25.41982078552246, -24.268571853637695, -23.11732292175293, -21.966075897216797, -20.81482696533203, -19.663578033447266, -18.5123291015625, -17.361080169677734, -16.2098331451416, -15.058584213256836, -13.90733528137207, -12.756087303161621, -11.604839324951172, -10.453590393066406, -9.30234146118164, -8.151093482971191, -6.999845027923584, -5.848596572875977, -4.697348117828369, -3.5460996627807617, -2.3948516845703125, -1.2436065673828125, -0.09235811233520508, 1.0588903427124023, 2.2101387977600098, 3.361387252807617, 4.512635707855225, 5.663884162902832, 6.815132141113281, 7.966381072998047, 9.117630004882812, 10.268877983093262, 11.420125961303711, 12.571374893188477, 13.722623825073242, 14.873871803283691, 16.02511978149414, 17.176368713378906, 18.327617645263672, 19.478866577148438, 20.63011360168457, 21.781362533569336, 22.9326114654541, 24.083858489990234, 25.235107421875, 26.386356353759766, 27.53760528564453, 28.688854217529297, 29.84010124206543, 30.991350173950195, 32.14259719848633, 33.293846130371094, 34.44509506225586, 35.596343994140625]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 2.0, 5.0, 3.0, 9.0, 6.0, 17.0, 9.0, 12.0, 9.0, 17.0, 24.0, 18.0, 25.0, 22.0, 27.0, 42.0, 34.0, 38.0, 32.0, 48.0, 45.0, 38.0, 36.0, 50.0, 37.0, 29.0, 43.0, 30.0, 28.0, 33.0, 44.0, 25.0, 24.0, 23.0, 18.0, 16.0, 22.0, 13.0, 11.0, 6.0, 10.0, 9.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.05912208557129, -16.521156311035156, -15.983190536499023, -15.445223808288574, -14.907258033752441, -14.369292259216309, -13.83132553100586, -13.293359756469727, -12.755393981933594, -12.217428207397461, -11.679462432861328, -11.141495704650879, -10.603529930114746, -10.065564155578613, -9.527597427368164, -8.989631652832031, -8.451665878295898, -7.913700103759766, -7.375733852386475, -6.837767601013184, -6.299801826477051, -5.761836051940918, -5.223869800567627, -4.685903549194336, -4.147937774658203, -3.609971761703491, -3.0720057487487793, -2.5340397357940674, -1.9960737228393555, -1.4581077098846436, -0.9201416969299316, -0.3821756839752197, 0.155792236328125, 0.6937582492828369, 1.2317242622375488, 1.7696902751922607, 2.3076562881469727, 2.8456223011016846, 3.3835883140563965, 3.9215543270111084, 4.45952033996582, 4.997486114501953, 5.535452365875244, 6.073418617248535, 6.611384391784668, 7.149350166320801, 7.687316417694092, 8.225282669067383, 8.763248443603516, 9.301214218139648, 9.839179992675781, 10.37714672088623, 10.915112495422363, 11.453078269958496, 11.991044998168945, 12.529010772705078, 13.066976547241211, 13.604942321777344, 14.142908096313477, 14.680874824523926, 15.218840599060059, 15.756806373596191, 16.29477310180664, 16.832738876342773, 17.370704650878906]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 1.0, 6.0, 5.0, 4.0, 6.0, 9.0, 9.0, 10.0, 11.0, 20.0, 11.0, 23.0, 21.0, 26.0, 33.0, 35.0, 33.0, 39.0, 36.0, 43.0, 38.0, 30.0, 39.0, 28.0, 39.0, 36.0, 30.0, 40.0, 32.0, 36.0, 34.0, 29.0, 19.0, 20.0, 23.0, 26.0, 25.0, 15.0, 20.0, 13.0, 8.0, 14.0, 3.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8916015625, -1.832244873046875, -1.77288818359375, -1.713531494140625, -1.6541748046875, -1.594818115234375, -1.53546142578125, -1.476104736328125, -1.416748046875, -1.357391357421875, -1.29803466796875, -1.238677978515625, -1.1793212890625, -1.119964599609375, -1.06060791015625, -1.001251220703125, -0.94189453125, -0.882537841796875, -0.82318115234375, -0.763824462890625, -0.7044677734375, -0.645111083984375, -0.58575439453125, -0.526397705078125, -0.467041015625, -0.407684326171875, -0.34832763671875, -0.288970947265625, -0.2296142578125, -0.170257568359375, -0.11090087890625, -0.051544189453125, 0.0078125, 0.067169189453125, 0.12652587890625, 0.185882568359375, 0.2452392578125, 0.304595947265625, 0.36395263671875, 0.423309326171875, 0.482666015625, 0.542022705078125, 0.60137939453125, 0.660736083984375, 0.7200927734375, 0.779449462890625, 0.83880615234375, 0.898162841796875, 0.95751953125, 1.016876220703125, 1.07623291015625, 1.135589599609375, 1.1949462890625, 1.254302978515625, 1.31365966796875, 1.373016357421875, 1.432373046875, 1.491729736328125, 1.55108642578125, 1.610443115234375, 1.6697998046875, 1.729156494140625, 1.78851318359375, 1.847869873046875, 1.9072265625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 11.0, 7.0, 11.0, 22.0, 36.0, 71.0, 107.0, 162.0, 282.0, 388.0, 588.0, 1035.0, 1643.0, 2601.0, 4198.0, 6488.0, 9959.0, 15557.0, 23723.0, 35154.0, 50707.0, 69937.0, 91580.0, 110261.0, 121730.0, 119359.0, 104047.0, 83419.0, 62397.0, 44727.0, 30721.0, 20614.0, 13413.0, 8635.0, 5496.0, 3432.0, 2284.0, 1395.0, 837.0, 589.0, 334.0, 213.0, 147.0, 86.0, 74.0, 30.0, 19.0, 10.0, 12.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5756607055664062, -0.5575714111328125, -0.5394821166992188, -0.521392822265625, -0.5033035278320312, -0.4852142333984375, -0.46712493896484375, -0.44903564453125, -0.43094635009765625, -0.4128570556640625, -0.39476776123046875, -0.376678466796875, -0.35858917236328125, -0.3404998779296875, -0.32241058349609375, -0.3043212890625, -0.28623199462890625, -0.2681427001953125, -0.25005340576171875, -0.231964111328125, -0.21387481689453125, -0.1957855224609375, -0.17769622802734375, -0.15960693359375, -0.14151763916015625, -0.1234283447265625, -0.10533905029296875, -0.087249755859375, -0.06916046142578125, -0.0510711669921875, -0.03298187255859375, -0.014892578125, 0.00319671630859375, 0.0212860107421875, 0.03937530517578125, 0.057464599609375, 0.07555389404296875, 0.0936431884765625, 0.11173248291015625, 0.12982177734375, 0.14791107177734375, 0.1660003662109375, 0.18408966064453125, 0.202178955078125, 0.22026824951171875, 0.2383575439453125, 0.25644683837890625, 0.2745361328125, 0.29262542724609375, 0.3107147216796875, 0.32880401611328125, 0.346893310546875, 0.36498260498046875, 0.3830718994140625, 0.40116119384765625, 0.41925048828125, 0.43733978271484375, 0.4554290771484375, 0.47351837158203125, 0.491607666015625, 0.5096969604492188, 0.5277862548828125, 0.5458755493164062, 0.56396484375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 5.0, 2.0, 6.0, 10.0, 10.0, 8.0, 19.0, 15.0, 21.0, 24.0, 27.0, 28.0, 37.0, 45.0, 30.0, 43.0, 39.0, 44.0, 37.0, 37.0, 1070.0, 31.0, 43.0, 47.0, 44.0, 33.0, 28.0, 41.0, 24.0, 29.0, 26.0, 28.0, 15.0, 16.0, 11.0, 9.0, 13.0, 7.0, 8.0, 2.0, 4.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84765625, -1.79541015625, -1.7431640625, -1.69091796875, -1.638671875, -1.58642578125, -1.5341796875, -1.48193359375, -1.4296875, -1.37744140625, -1.3251953125, -1.27294921875, -1.220703125, -1.16845703125, -1.1162109375, -1.06396484375, -1.01171875, -0.95947265625, -0.9072265625, -0.85498046875, -0.802734375, -0.75048828125, -0.6982421875, -0.64599609375, -0.59375, -0.54150390625, -0.4892578125, -0.43701171875, -0.384765625, -0.33251953125, -0.2802734375, -0.22802734375, -0.17578125, -0.12353515625, -0.0712890625, -0.01904296875, 0.033203125, 0.08544921875, 0.1376953125, 0.18994140625, 0.2421875, 0.29443359375, 0.3466796875, 0.39892578125, 0.451171875, 0.50341796875, 0.5556640625, 0.60791015625, 0.66015625, 0.71240234375, 0.7646484375, 0.81689453125, 0.869140625, 0.92138671875, 0.9736328125, 1.02587890625, 1.078125, 1.13037109375, 1.1826171875, 1.23486328125, 1.287109375, 1.33935546875, 1.3916015625, 1.44384765625, 1.49609375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 5.0, 19.0, 18.0, 29.0, 44.0, 52.0, 97.0, 131.0, 208.0, 303.0, 443.0, 665.0, 1001.0, 1531.0, 2129.0, 3472.0, 4994.0, 7432.0, 11170.0, 17559.0, 31324.0, 1787658.0, 149535.0, 28584.0, 16503.0, 10632.0, 7049.0, 4737.0, 3300.0, 2233.0, 1381.0, 947.0, 652.0, 443.0, 245.0, 185.0, 122.0, 91.0, 73.0, 44.0, 30.0, 22.0, 17.0, 7.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.12890625, -1.0935516357421875, -1.058197021484375, -1.0228424072265625, -0.98748779296875, -0.9521331787109375, -0.916778564453125, -0.8814239501953125, -0.8460693359375, -0.8107147216796875, -0.775360107421875, -0.7400054931640625, -0.70465087890625, -0.6692962646484375, -0.633941650390625, -0.5985870361328125, -0.563232421875, -0.5278778076171875, -0.492523193359375, -0.4571685791015625, -0.42181396484375, -0.3864593505859375, -0.351104736328125, -0.3157501220703125, -0.2803955078125, -0.2450408935546875, -0.209686279296875, -0.1743316650390625, -0.13897705078125, -0.1036224365234375, -0.068267822265625, -0.0329132080078125, 0.00244140625, 0.0377960205078125, 0.073150634765625, 0.1085052490234375, 0.14385986328125, 0.1792144775390625, 0.214569091796875, 0.2499237060546875, 0.2852783203125, 0.3206329345703125, 0.355987548828125, 0.3913421630859375, 0.42669677734375, 0.4620513916015625, 0.497406005859375, 0.5327606201171875, 0.568115234375, 0.6034698486328125, 0.638824462890625, 0.6741790771484375, 0.70953369140625, 0.7448883056640625, 0.780242919921875, 0.8155975341796875, 0.8509521484375, 0.8863067626953125, 0.921661376953125, 0.9570159912109375, 0.99237060546875, 1.0277252197265625, 1.063079833984375, 1.0984344482421875, 1.1337890625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 5.0, 10.0, 15.0, 14.0, 15.0, 12.0, 16.0, 30.0, 24.0, 25.0, 29.0, 25.0, 34.0, 38.0, 32.0, 44.0, 41.0, 42.0, 40.0, 40.0, 38.0, 48.0, 34.0, 33.0, 40.0, 38.0, 24.0, 28.0, 17.0, 17.0, 17.0, 20.0, 12.0, 11.0, 12.0, 9.0, 5.0, 7.0, 4.0, 7.0, 3.0, 2.0, 3.0, 6.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0159912109375, -0.015462875366210938, -0.014934539794921875, -0.014406204223632812, -0.01387786865234375, -0.013349533081054688, -0.012821197509765625, -0.012292861938476562, -0.0117645263671875, -0.011236190795898438, -0.010707855224609375, -0.010179519653320312, -0.00965118408203125, -0.009122848510742188, -0.008594512939453125, -0.008066177368164062, -0.007537841796875, -0.0070095062255859375, -0.006481170654296875, -0.0059528350830078125, -0.00542449951171875, -0.0048961639404296875, -0.004367828369140625, -0.0038394927978515625, -0.0033111572265625, -0.0027828216552734375, -0.002254486083984375, -0.0017261505126953125, -0.00119781494140625, -0.0006694793701171875, -0.000141143798828125, 0.0003871917724609375, 0.00091552734375, 0.0014438629150390625, 0.001972198486328125, 0.0025005340576171875, 0.00302886962890625, 0.0035572052001953125, 0.004085540771484375, 0.0046138763427734375, 0.0051422119140625, 0.0056705474853515625, 0.006198883056640625, 0.0067272186279296875, 0.00725555419921875, 0.0077838897705078125, 0.008312225341796875, 0.008840560913085938, 0.009368896484375, 0.009897232055664062, 0.010425567626953125, 0.010953903198242188, 0.01148223876953125, 0.012010574340820312, 0.012538909912109375, 0.013067245483398438, 0.0135955810546875, 0.014123916625976562, 0.014652252197265625, 0.015180587768554688, 0.01570892333984375, 0.016237258911132812, 0.016765594482421875, 0.017293930053710938, 0.017822265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 9.0, 5.0, 4.0, 7.0, 8.0, 18.0, 26.0, 24.0, 26.0, 45.0, 53.0, 50.0, 68.0, 85.0, 136.0, 146.0, 242.0, 329.0, 956.0, 7625.0, 95424.0, 742613.0, 184057.0, 13579.0, 1539.0, 418.0, 243.0, 181.0, 139.0, 105.0, 70.0, 64.0, 60.0, 34.0, 25.0, 24.0, 20.0, 16.0, 21.0, 10.0, 8.0, 7.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.336669921875, -0.3266563415527344, -0.31664276123046875, -0.3066291809082031, -0.2966156005859375, -0.2866020202636719, -0.27658843994140625, -0.2665748596191406, -0.256561279296875, -0.24654769897460938, -0.23653411865234375, -0.22652053833007812, -0.2165069580078125, -0.20649337768554688, -0.19647979736328125, -0.18646621704101562, -0.17645263671875, -0.16643905639648438, -0.15642547607421875, -0.14641189575195312, -0.1363983154296875, -0.12638473510742188, -0.11637115478515625, -0.10635757446289062, -0.096343994140625, -0.08633041381835938, -0.07631683349609375, -0.06630325317382812, -0.0562896728515625, -0.046276092529296875, -0.03626251220703125, -0.026248931884765625, -0.0162353515625, -0.006221771240234375, 0.00379180908203125, 0.013805389404296875, 0.0238189697265625, 0.033832550048828125, 0.04384613037109375, 0.053859710693359375, 0.063873291015625, 0.07388687133789062, 0.08390045166015625, 0.09391403198242188, 0.1039276123046875, 0.11394119262695312, 0.12395477294921875, 0.13396835327148438, 0.14398193359375, 0.15399551391601562, 0.16400909423828125, 0.17402267456054688, 0.1840362548828125, 0.19404983520507812, 0.20406341552734375, 0.21407699584960938, 0.224090576171875, 0.23410415649414062, 0.24411773681640625, 0.2541313171386719, 0.2641448974609375, 0.2741584777832031, 0.28417205810546875, 0.2941856384277344, 0.30419921875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 29.0, 71.0, 320.0, 431.0, 103.0, 29.0, 13.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9896280169487, -0.9694715142250061, -0.9493150115013123, -0.9291585683822632, -0.9090020656585693, -0.8888455629348755, -0.8686890602111816, -0.8485325574874878, -0.828376054763794, -0.8082195520401001, -0.7880630493164062, -0.7679065465927124, -0.7477501034736633, -0.7275936007499695, -0.7074370980262756, -0.6872805953025818, -0.6671241521835327, -0.6469676494598389, -0.626811146736145, -0.6066546440124512, -0.5864982008934021, -0.5663416981697083, -0.5461851954460144, -0.5260286927223206, -0.5058721899986267, -0.48571568727493286, -0.4655592143535614, -0.44540271162986755, -0.4252462089061737, -0.40508973598480225, -0.3849332332611084, -0.36477673053741455, -0.3446202278137207, -0.32446372509002686, -0.3043072521686554, -0.28415074944496155, -0.2639942467212677, -0.24383775889873505, -0.2236812710762024, -0.20352476835250854, -0.1833682805299759, -0.16321179270744324, -0.1430552899837494, -0.12289880216121674, -0.10274230688810349, -0.08258581161499023, -0.06242932379245758, -0.04227282106876373, -0.02211633324623108, -0.0019598398357629776, 0.018196653574705124, 0.038353145122528076, 0.05850964039564133, 0.07866613566875458, 0.09882262349128723, 0.11897912621498108, 0.13913561403751373, 0.1592921018600464, 0.17944860458374023, 0.1996050924062729, 0.21976158022880554, 0.2399180829524994, 0.26007455587387085, 0.2802310585975647, 0.30038756132125854]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 5.0, 15.0, 15.0, 18.0, 17.0, 25.0, 15.0, 28.0, 35.0, 37.0, 41.0, 53.0, 48.0, 63.0, 53.0, 64.0, 53.0, 60.0, 52.0, 36.0, 39.0, 43.0, 41.0, 31.0, 19.0, 20.0, 26.0, 21.0, 3.0, 7.0, 6.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04804348945617676, -0.046116337180137634, -0.04418918862938881, -0.042262040078639984, -0.04033488780260086, -0.03840773552656174, -0.03648058697581291, -0.03455343842506409, -0.03262628614902496, -0.03069913573563099, -0.028771985322237015, -0.02684483490884304, -0.024917684495449066, -0.022990534082055092, -0.021063383668661118, -0.019136233255267143, -0.01720908284187317, -0.015281932428479195, -0.01335478201508522, -0.011427631601691246, -0.009500481188297272, -0.007573330774903297, -0.005646180361509323, -0.003719029948115349, -0.0017918795347213745, 0.0001352708786725998, 0.002062421292066574, 0.003989571705460548, 0.005916722118854523, 0.007843872532248497, 0.009771022945642471, 0.011698173359036446, 0.01362532377243042, 0.015552474185824394, 0.01747962459921837, 0.019406775012612343, 0.021333925426006317, 0.02326107583940029, 0.025188226252794266, 0.02711537666618824, 0.029042527079582214, 0.03096967749297619, 0.03289682790637016, 0.03482397645711899, 0.03675112873315811, 0.038678281009197235, 0.04060542955994606, 0.042532578110694885, 0.04445973038673401, 0.04638688266277313, 0.04831403121352196, 0.05024117976427078, 0.052168332040309906, 0.05409548431634903, 0.056022632867097855, 0.05794978141784668, 0.0598769336938858, 0.06180408596992493, 0.06373123824596405, 0.06565838307142258, 0.0675855353474617, 0.06951268762350082, 0.07143983244895935, 0.07336698472499847, 0.0752941370010376]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 8.0, 4.0, 9.0, 10.0, 6.0, 16.0, 9.0, 19.0, 21.0, 19.0, 22.0, 26.0, 16.0, 32.0, 43.0, 36.0, 35.0, 30.0, 39.0, 37.0, 37.0, 33.0, 39.0, 26.0, 38.0, 40.0, 26.0, 34.0, 26.0, 25.0, 31.0, 23.0, 27.0, 29.0, 20.0, 13.0, 17.0, 12.0, 12.0, 8.0, 10.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.873046875, -1.8148956298828125, -1.756744384765625, -1.6985931396484375, -1.64044189453125, -1.5822906494140625, -1.524139404296875, -1.4659881591796875, -1.4078369140625, -1.3496856689453125, -1.291534423828125, -1.2333831787109375, -1.17523193359375, -1.1170806884765625, -1.058929443359375, -1.0007781982421875, -0.942626953125, -0.8844757080078125, -0.826324462890625, -0.7681732177734375, -0.71002197265625, -0.6518707275390625, -0.593719482421875, -0.5355682373046875, -0.4774169921875, -0.4192657470703125, -0.361114501953125, -0.3029632568359375, -0.24481201171875, -0.1866607666015625, -0.128509521484375, -0.0703582763671875, -0.01220703125, 0.0459442138671875, 0.104095458984375, 0.1622467041015625, 0.22039794921875, 0.2785491943359375, 0.336700439453125, 0.3948516845703125, 0.4530029296875, 0.5111541748046875, 0.569305419921875, 0.6274566650390625, 0.68560791015625, 0.7437591552734375, 0.801910400390625, 0.8600616455078125, 0.918212890625, 0.9763641357421875, 1.034515380859375, 1.0926666259765625, 1.15081787109375, 1.2089691162109375, 1.267120361328125, 1.3252716064453125, 1.3834228515625, 1.4415740966796875, 1.499725341796875, 1.5578765869140625, 1.61602783203125, 1.6741790771484375, 1.732330322265625, 1.7904815673828125, 1.8486328125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 2.0, 4.0, 10.0, 8.0, 16.0, 16.0, 30.0, 50.0, 87.0, 120.0, 193.0, 327.0, 646.0, 1069.0, 1921.0, 3557.0, 7187.0, 17222.0, 53422.0, 206199.0, 514936.0, 167583.0, 45130.0, 14885.0, 6534.0, 3277.0, 1742.0, 942.0, 616.0, 310.0, 187.0, 106.0, 71.0, 49.0, 22.0, 15.0, 15.0, 14.0, 13.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.625, -3.513214111328125, -3.40142822265625, -3.289642333984375, -3.1778564453125, -3.066070556640625, -2.95428466796875, -2.842498779296875, -2.730712890625, -2.618927001953125, -2.50714111328125, -2.395355224609375, -2.2835693359375, -2.171783447265625, -2.05999755859375, -1.948211669921875, -1.83642578125, -1.724639892578125, -1.61285400390625, -1.501068115234375, -1.3892822265625, -1.277496337890625, -1.16571044921875, -1.053924560546875, -0.942138671875, -0.830352783203125, -0.71856689453125, -0.606781005859375, -0.4949951171875, -0.383209228515625, -0.27142333984375, -0.159637451171875, -0.0478515625, 0.063934326171875, 0.17572021484375, 0.287506103515625, 0.3992919921875, 0.511077880859375, 0.62286376953125, 0.734649658203125, 0.846435546875, 0.958221435546875, 1.07000732421875, 1.181793212890625, 1.2935791015625, 1.405364990234375, 1.51715087890625, 1.628936767578125, 1.74072265625, 1.852508544921875, 1.96429443359375, 2.076080322265625, 2.1878662109375, 2.299652099609375, 2.41143798828125, 2.523223876953125, 2.635009765625, 2.746795654296875, 2.85858154296875, 2.970367431640625, 3.0821533203125, 3.193939208984375, 3.30572509765625, 3.417510986328125, 3.529296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 5.0, 9.0, 7.0, 18.0, 12.0, 18.0, 17.0, 29.0, 24.0, 24.0, 25.0, 28.0, 33.0, 44.0, 45.0, 55.0, 99.0, 197.0, 1419.0, 317.0, 143.0, 75.0, 57.0, 34.0, 44.0, 38.0, 24.0, 29.0, 29.0, 21.0, 20.0, 23.0, 13.0, 15.0, 6.0, 9.0, 5.0, 4.0, 6.0, 9.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.8515625, -6.6143798828125, -6.377197265625, -6.1400146484375, -5.90283203125, -5.6656494140625, -5.428466796875, -5.1912841796875, -4.9541015625, -4.7169189453125, -4.479736328125, -4.2425537109375, -4.00537109375, -3.7681884765625, -3.531005859375, -3.2938232421875, -3.056640625, -2.8194580078125, -2.582275390625, -2.3450927734375, -2.10791015625, -1.8707275390625, -1.633544921875, -1.3963623046875, -1.1591796875, -0.9219970703125, -0.684814453125, -0.4476318359375, -0.21044921875, 0.0267333984375, 0.263916015625, 0.5010986328125, 0.73828125, 0.9754638671875, 1.212646484375, 1.4498291015625, 1.68701171875, 1.9241943359375, 2.161376953125, 2.3985595703125, 2.6357421875, 2.8729248046875, 3.110107421875, 3.3472900390625, 3.58447265625, 3.8216552734375, 4.058837890625, 4.2960205078125, 4.533203125, 4.7703857421875, 5.007568359375, 5.2447509765625, 5.48193359375, 5.7191162109375, 5.956298828125, 6.1934814453125, 6.4306640625, 6.6678466796875, 6.905029296875, 7.1422119140625, 7.37939453125, 7.6165771484375, 7.853759765625, 8.0909423828125, 8.328125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 12.0, 5.0, 13.0, 11.0, 8.0, 11.0, 16.0, 32.0, 20.0, 33.0, 54.0, 67.0, 84.0, 141.0, 213.0, 294.0, 814.0, 3536.0, 26406.0, 1518460.0, 1563075.0, 27059.0, 3516.0, 798.0, 314.0, 193.0, 120.0, 83.0, 55.0, 54.0, 54.0, 29.0, 24.0, 22.0, 17.0, 15.0, 15.0, 11.0, 9.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.0546875, -13.664306640625, -13.27392578125, -12.883544921875, -12.4931640625, -12.102783203125, -11.71240234375, -11.322021484375, -10.931640625, -10.541259765625, -10.15087890625, -9.760498046875, -9.3701171875, -8.979736328125, -8.58935546875, -8.198974609375, -7.80859375, -7.418212890625, -7.02783203125, -6.637451171875, -6.2470703125, -5.856689453125, -5.46630859375, -5.075927734375, -4.685546875, -4.295166015625, -3.90478515625, -3.514404296875, -3.1240234375, -2.733642578125, -2.34326171875, -1.952880859375, -1.5625, -1.172119140625, -0.78173828125, -0.391357421875, -0.0009765625, 0.389404296875, 0.77978515625, 1.170166015625, 1.560546875, 1.950927734375, 2.34130859375, 2.731689453125, 3.1220703125, 3.512451171875, 3.90283203125, 4.293212890625, 4.68359375, 5.073974609375, 5.46435546875, 5.854736328125, 6.2451171875, 6.635498046875, 7.02587890625, 7.416259765625, 7.806640625, 8.197021484375, 8.58740234375, 8.977783203125, 9.3681640625, 9.758544921875, 10.14892578125, 10.539306640625, 10.9296875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 10.0, 606.0, 391.0, 9.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.25605583190918, -11.364521980285645, -7.472987651824951, -3.581453323364258, 0.31008052825927734, 4.2016143798828125, 8.093149185180664, 11.984682083129883, 15.876216888427734, 19.767751693725586, 23.659284591674805, 27.550819396972656, 31.442352294921875, 35.333885192871094, 39.22542190551758, 43.1169548034668, 47.00849151611328, 50.9000244140625, 54.791561126708984, 58.6830940246582, 62.57462692260742, 66.4661636352539, 70.35769653320312, 74.24922943115234, 78.14076232910156, 82.03229522705078, 85.923828125, 89.81536865234375, 93.70690155029297, 97.59843444824219, 101.4899673461914, 105.38150024414062, 109.27303314208984, 113.16456604003906, 117.05609893798828, 120.9476318359375, 124.83917236328125, 128.73069763183594, 132.6222381591797, 136.51376342773438, 140.40530395507812, 144.29684448242188, 148.18836975097656, 152.0799102783203, 155.971435546875, 159.86297607421875, 163.7545166015625, 167.6460418701172, 171.53758239746094, 175.4291229248047, 179.32064819335938, 183.21218872070312, 187.1037139892578, 190.99525451660156, 194.88677978515625, 198.7783203125, 202.6698455810547, 206.56138610839844, 210.45291137695312, 214.34445190429688, 218.23597717285156, 222.1275177001953, 226.01904296875, 229.91058349609375, 233.8021240234375]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 6.0, 8.0, 6.0, 10.0, 9.0, 13.0, 12.0, 21.0, 12.0, 18.0, 29.0, 24.0, 32.0, 25.0, 26.0, 41.0, 34.0, 35.0, 36.0, 49.0, 45.0, 44.0, 33.0, 46.0, 44.0, 42.0, 31.0, 32.0, 19.0, 31.0, 24.0, 24.0, 17.0, 17.0, 19.0, 20.0, 14.0, 7.0, 6.0, 7.0, 3.0, 3.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.850576400756836, -22.15789222717285, -21.4652099609375, -20.772525787353516, -20.07984161376953, -19.38715934753418, -18.694475173950195, -18.001792907714844, -17.30910873413086, -16.616424560546875, -15.923742294311523, -15.231058120727539, -14.538374900817871, -13.845691680908203, -13.153007507324219, -12.46032428741455, -11.767641067504883, -11.074957847595215, -10.382274627685547, -9.689590454101562, -8.996907234191895, -8.304224014282227, -7.6115403175354, -6.918856620788574, -6.226173400878906, -5.533490180969238, -4.840806484222412, -4.148122787475586, -3.455439567565918, -2.762756109237671, -2.070072650909424, -1.3773889541625977, -0.6847057342529297, 0.007977724075317383, 0.7006611824035645, 1.3933446407318115, 2.0860280990600586, 2.7787115573883057, 3.4713950157165527, 4.164078712463379, 4.856761932373047, 5.549445152282715, 6.242128849029541, 6.934812545776367, 7.627495765686035, 8.320178985595703, 9.012863159179688, 9.705546379089355, 10.398229598999023, 11.090912818908691, 11.78359603881836, 12.476280212402344, 13.168963432312012, 13.86164665222168, 14.554330825805664, 15.247014045715332, 15.939697265625, 16.632381439208984, 17.325063705444336, 18.01774787902832, 18.710430145263672, 19.403114318847656, 20.09579849243164, 20.788482666015625, 21.481164932250977]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 6.0, 6.0, 2.0, 6.0, 8.0, 7.0, 13.0, 17.0, 19.0, 14.0, 28.0, 26.0, 29.0, 43.0, 38.0, 36.0, 29.0, 39.0, 38.0, 33.0, 33.0, 40.0, 41.0, 35.0, 38.0, 33.0, 39.0, 32.0, 33.0, 37.0, 21.0, 24.0, 29.0, 17.0, 19.0, 16.0, 14.0, 14.0, 9.0, 8.0, 14.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.12890625, -2.06378173828125, -1.9986572265625, -1.93353271484375, -1.868408203125, -1.80328369140625, -1.7381591796875, -1.67303466796875, -1.60791015625, -1.54278564453125, -1.4776611328125, -1.41253662109375, -1.347412109375, -1.28228759765625, -1.2171630859375, -1.15203857421875, -1.0869140625, -1.02178955078125, -0.9566650390625, -0.89154052734375, -0.826416015625, -0.76129150390625, -0.6961669921875, -0.63104248046875, -0.56591796875, -0.50079345703125, -0.4356689453125, -0.37054443359375, -0.305419921875, -0.24029541015625, -0.1751708984375, -0.11004638671875, -0.044921875, 0.02020263671875, 0.0853271484375, 0.15045166015625, 0.215576171875, 0.28070068359375, 0.3458251953125, 0.41094970703125, 0.47607421875, 0.54119873046875, 0.6063232421875, 0.67144775390625, 0.736572265625, 0.80169677734375, 0.8668212890625, 0.93194580078125, 0.9970703125, 1.06219482421875, 1.1273193359375, 1.19244384765625, 1.257568359375, 1.32269287109375, 1.3878173828125, 1.45294189453125, 1.51806640625, 1.58319091796875, 1.6483154296875, 1.71343994140625, 1.778564453125, 1.84368896484375, 1.9088134765625, 1.97393798828125, 2.0390625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 10.0, 7.0, 20.0, 26.0, 36.0, 42.0, 66.0, 116.0, 177.0, 336.0, 597.0, 1087.0, 2281.0, 5341.0, 13480.0, 38448.0, 122353.0, 440812.0, 1408363.0, 1483326.0, 479339.0, 132300.0, 41247.0, 14337.0, 5475.0, 2314.0, 1073.0, 547.0, 312.0, 144.0, 108.0, 60.0, 44.0, 35.0, 11.0, 11.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.29296875, -3.183319091796875, -3.07366943359375, -2.964019775390625, -2.8543701171875, -2.744720458984375, -2.63507080078125, -2.525421142578125, -2.415771484375, -2.306121826171875, -2.19647216796875, -2.086822509765625, -1.9771728515625, -1.867523193359375, -1.75787353515625, -1.648223876953125, -1.53857421875, -1.428924560546875, -1.31927490234375, -1.209625244140625, -1.0999755859375, -0.990325927734375, -0.88067626953125, -0.771026611328125, -0.661376953125, -0.551727294921875, -0.44207763671875, -0.332427978515625, -0.2227783203125, -0.113128662109375, -0.00347900390625, 0.106170654296875, 0.2158203125, 0.325469970703125, 0.43511962890625, 0.544769287109375, 0.6544189453125, 0.764068603515625, 0.87371826171875, 0.983367919921875, 1.093017578125, 1.202667236328125, 1.31231689453125, 1.421966552734375, 1.5316162109375, 1.641265869140625, 1.75091552734375, 1.860565185546875, 1.97021484375, 2.079864501953125, 2.18951416015625, 2.299163818359375, 2.4088134765625, 2.518463134765625, 2.62811279296875, 2.737762451171875, 2.847412109375, 2.957061767578125, 3.06671142578125, 3.176361083984375, 3.2860107421875, 3.395660400390625, 3.50531005859375, 3.614959716796875, 3.724609375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 7.0, 7.0, 8.0, 20.0, 21.0, 29.0, 48.0, 55.0, 77.0, 64.0, 99.0, 146.0, 195.0, 241.0, 273.0, 331.0, 392.0, 394.0, 364.0, 270.0, 223.0, 177.0, 145.0, 110.0, 84.0, 58.0, 45.0, 39.0, 32.0, 29.0, 21.0, 12.0, 15.0, 10.0, 7.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.12109375, -4.97869873046875, -4.8363037109375, -4.69390869140625, -4.551513671875, -4.40911865234375, -4.2667236328125, -4.12432861328125, -3.98193359375, -3.83953857421875, -3.6971435546875, -3.55474853515625, -3.412353515625, -3.26995849609375, -3.1275634765625, -2.98516845703125, -2.8427734375, -2.70037841796875, -2.5579833984375, -2.41558837890625, -2.273193359375, -2.13079833984375, -1.9884033203125, -1.84600830078125, -1.70361328125, -1.56121826171875, -1.4188232421875, -1.27642822265625, -1.134033203125, -0.99163818359375, -0.8492431640625, -0.70684814453125, -0.564453125, -0.42205810546875, -0.2796630859375, -0.13726806640625, 0.005126953125, 0.14752197265625, 0.2899169921875, 0.43231201171875, 0.57470703125, 0.71710205078125, 0.8594970703125, 1.00189208984375, 1.144287109375, 1.28668212890625, 1.4290771484375, 1.57147216796875, 1.7138671875, 1.85626220703125, 1.9986572265625, 2.14105224609375, 2.283447265625, 2.42584228515625, 2.5682373046875, 2.71063232421875, 2.85302734375, 2.99542236328125, 3.1378173828125, 3.28021240234375, 3.422607421875, 3.56500244140625, 3.7073974609375, 3.84979248046875, 3.9921875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 11.0, 17.0, 23.0, 22.0, 30.0, 33.0, 61.0, 80.0, 117.0, 169.0, 285.0, 482.0, 913.0, 1845.0, 4181.0, 11048.0, 31445.0, 96583.0, 302983.0, 919976.0, 1641604.0, 795905.0, 259528.0, 82506.0, 27138.0, 9777.0, 3837.0, 1626.0, 826.0, 449.0, 257.0, 181.0, 100.0, 55.0, 53.0, 40.0, 25.0, 23.0, 11.0, 10.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.69921875, -4.5447998046875, -4.390380859375, -4.2359619140625, -4.08154296875, -3.9271240234375, -3.772705078125, -3.6182861328125, -3.4638671875, -3.3094482421875, -3.155029296875, -3.0006103515625, -2.84619140625, -2.6917724609375, -2.537353515625, -2.3829345703125, -2.228515625, -2.0740966796875, -1.919677734375, -1.7652587890625, -1.61083984375, -1.4564208984375, -1.302001953125, -1.1475830078125, -0.9931640625, -0.8387451171875, -0.684326171875, -0.5299072265625, -0.37548828125, -0.2210693359375, -0.066650390625, 0.0877685546875, 0.2421875, 0.3966064453125, 0.551025390625, 0.7054443359375, 0.85986328125, 1.0142822265625, 1.168701171875, 1.3231201171875, 1.4775390625, 1.6319580078125, 1.786376953125, 1.9407958984375, 2.09521484375, 2.2496337890625, 2.404052734375, 2.5584716796875, 2.712890625, 2.8673095703125, 3.021728515625, 3.1761474609375, 3.33056640625, 3.4849853515625, 3.639404296875, 3.7938232421875, 3.9482421875, 4.1026611328125, 4.257080078125, 4.4114990234375, 4.56591796875, 4.7203369140625, 4.874755859375, 5.0291748046875, 5.18359375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 10.0, 28.0, 45.0, 67.0, 109.0, 112.0, 146.0, 140.0, 132.0, 89.0, 60.0, 44.0, 16.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.264461517333984, -25.003093719482422, -23.74172592163086, -22.480358123779297, -21.218990325927734, -19.957622528076172, -18.69625473022461, -17.434886932373047, -16.173519134521484, -14.912151336669922, -13.65078353881836, -12.389415740966797, -11.128047943115234, -9.866680145263672, -8.605313301086426, -7.343945503234863, -6.082578659057617, -4.821210861206055, -3.5598433017730713, -2.298475742340088, -1.0371079444885254, 0.2242598533630371, 1.4856271743774414, 2.746994972229004, 4.008362770080566, 5.269730567932129, 6.531098365783691, 7.792465686798096, 9.0538330078125, 10.315200805664062, 11.576568603515625, 12.837936401367188, 14.09930419921875, 15.360671997070312, 16.622039794921875, 17.883407592773438, 19.144775390625, 20.406143188476562, 21.667510986328125, 22.928878784179688, 24.19024658203125, 25.451614379882812, 26.712982177734375, 27.974349975585938, 29.2357177734375, 30.497085571289062, 31.758453369140625, 33.01982116699219, 34.28118896484375, 35.54255676269531, 36.803924560546875, 38.06529235839844, 39.32666015625, 40.58802795410156, 41.849395751953125, 43.11076354980469, 44.372127532958984, 45.63349533081055, 46.89486312866211, 48.15623092651367, 49.417598724365234, 50.6789665222168, 51.94033432006836, 53.20170211791992, 54.463069915771484]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 11.0, 3.0, 9.0, 10.0, 9.0, 15.0, 13.0, 8.0, 21.0, 19.0, 22.0, 23.0, 28.0, 34.0, 38.0, 39.0, 33.0, 34.0, 45.0, 42.0, 44.0, 37.0, 40.0, 36.0, 36.0, 30.0, 24.0, 34.0, 37.0, 35.0, 33.0, 26.0, 24.0, 21.0, 20.0, 15.0, 11.0, 8.0, 8.0, 7.0, 6.0, 5.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.10764503479004, -17.561763763427734, -17.015884399414062, -16.470003128051758, -15.924123764038086, -15.378243446350098, -14.83236312866211, -14.286481857299805, -13.740602493286133, -13.194722175598145, -12.648841857910156, -12.102961540222168, -11.55708122253418, -11.011200904846191, -10.465320587158203, -9.919439315795898, -9.37355899810791, -8.827678680419922, -8.281798362731934, -7.735918045043945, -7.190037727355957, -6.644157409667969, -6.098276615142822, -5.552396297454834, -5.006515979766846, -4.460635662078857, -3.914755344390869, -3.3688747882843018, -2.8229944705963135, -2.277114152908325, -1.7312335968017578, -1.1853532791137695, -0.6394729614257812, -0.0935925841331482, 0.45228779315948486, 0.9981682300567627, 1.544048547744751, 2.0899288654327393, 2.6358094215393066, 3.181689739227295, 3.727570056915283, 4.2734503746032715, 4.81933069229126, 5.365211486816406, 5.9110918045043945, 6.456972122192383, 7.002852439880371, 7.548732757568359, 8.094613075256348, 8.640493392944336, 9.186373710632324, 9.732254028320312, 10.2781343460083, 10.824014663696289, 11.369895935058594, 11.915775299072266, 12.46165657043457, 13.007536888122559, 13.553417205810547, 14.099297523498535, 14.645177841186523, 15.191058158874512, 15.7369384765625, 16.282819747924805, 16.828699111938477]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 8.0, 12.0, 13.0, 13.0, 11.0, 20.0, 20.0, 23.0, 38.0, 32.0, 42.0, 43.0, 40.0, 31.0, 42.0, 39.0, 37.0, 42.0, 41.0, 35.0, 47.0, 36.0, 37.0, 39.0, 29.0, 26.0, 30.0, 27.0, 20.0, 20.0, 13.0, 15.0, 13.0, 13.0, 8.0, 3.0, 11.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.486328125, -2.41412353515625, -2.3419189453125, -2.26971435546875, -2.197509765625, -2.12530517578125, -2.0531005859375, -1.98089599609375, -1.90869140625, -1.83648681640625, -1.7642822265625, -1.69207763671875, -1.619873046875, -1.54766845703125, -1.4754638671875, -1.40325927734375, -1.3310546875, -1.25885009765625, -1.1866455078125, -1.11444091796875, -1.042236328125, -0.97003173828125, -0.8978271484375, -0.82562255859375, -0.75341796875, -0.68121337890625, -0.6090087890625, -0.53680419921875, -0.464599609375, -0.39239501953125, -0.3201904296875, -0.24798583984375, -0.17578125, -0.10357666015625, -0.0313720703125, 0.04083251953125, 0.113037109375, 0.18524169921875, 0.2574462890625, 0.32965087890625, 0.40185546875, 0.47406005859375, 0.5462646484375, 0.61846923828125, 0.690673828125, 0.76287841796875, 0.8350830078125, 0.90728759765625, 0.9794921875, 1.05169677734375, 1.1239013671875, 1.19610595703125, 1.268310546875, 1.34051513671875, 1.4127197265625, 1.48492431640625, 1.55712890625, 1.62933349609375, 1.7015380859375, 1.77374267578125, 1.845947265625, 1.91815185546875, 1.9903564453125, 2.06256103515625, 2.134765625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 10.0, 15.0, 22.0, 43.0, 58.0, 95.0, 138.0, 210.0, 347.0, 533.0, 779.0, 1246.0, 1804.0, 2920.0, 4423.0, 6725.0, 10515.0, 15611.0, 22895.0, 33005.0, 46207.0, 61899.0, 80225.0, 97286.0, 109556.0, 112552.0, 104187.0, 88795.0, 70855.0, 53370.0, 38699.0, 27390.0, 19189.0, 12619.0, 8313.0, 5622.0, 3713.0, 2402.0, 1524.0, 985.0, 632.0, 414.0, 296.0, 160.0, 92.0, 60.0, 45.0, 27.0, 27.0, 7.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5078125, -0.490447998046875, -0.47308349609375, -0.455718994140625, -0.4383544921875, -0.420989990234375, -0.40362548828125, -0.386260986328125, -0.368896484375, -0.351531982421875, -0.33416748046875, -0.316802978515625, -0.2994384765625, -0.282073974609375, -0.26470947265625, -0.247344970703125, -0.22998046875, -0.212615966796875, -0.19525146484375, -0.177886962890625, -0.1605224609375, -0.143157958984375, -0.12579345703125, -0.108428955078125, -0.091064453125, -0.073699951171875, -0.05633544921875, -0.038970947265625, -0.0216064453125, -0.004241943359375, 0.01312255859375, 0.030487060546875, 0.0478515625, 0.065216064453125, 0.08258056640625, 0.099945068359375, 0.1173095703125, 0.134674072265625, 0.15203857421875, 0.169403076171875, 0.186767578125, 0.204132080078125, 0.22149658203125, 0.238861083984375, 0.2562255859375, 0.273590087890625, 0.29095458984375, 0.308319091796875, 0.32568359375, 0.343048095703125, 0.36041259765625, 0.377777099609375, 0.3951416015625, 0.412506103515625, 0.42987060546875, 0.447235107421875, 0.464599609375, 0.481964111328125, 0.49932861328125, 0.516693115234375, 0.5340576171875, 0.551422119140625, 0.56878662109375, 0.586151123046875, 0.603515625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 8.0, 7.0, 5.0, 4.0, 8.0, 7.0, 12.0, 7.0, 11.0, 18.0, 7.0, 23.0, 24.0, 26.0, 35.0, 35.0, 28.0, 36.0, 31.0, 45.0, 31.0, 40.0, 37.0, 1059.0, 39.0, 29.0, 40.0, 25.0, 31.0, 43.0, 32.0, 24.0, 24.0, 34.0, 23.0, 18.0, 21.0, 13.0, 12.0, 9.0, 7.0, 7.0, 9.0, 10.0, 4.0, 6.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0], "bins": [-1.8427734375, -1.7899017333984375, -1.737030029296875, -1.6841583251953125, -1.63128662109375, -1.5784149169921875, -1.525543212890625, -1.4726715087890625, -1.4197998046875, -1.3669281005859375, -1.314056396484375, -1.2611846923828125, -1.20831298828125, -1.1554412841796875, -1.102569580078125, -1.0496978759765625, -0.996826171875, -0.9439544677734375, -0.891082763671875, -0.8382110595703125, -0.78533935546875, -0.7324676513671875, -0.679595947265625, -0.6267242431640625, -0.5738525390625, -0.5209808349609375, -0.468109130859375, -0.4152374267578125, -0.36236572265625, -0.3094940185546875, -0.256622314453125, -0.2037506103515625, -0.15087890625, -0.0980072021484375, -0.045135498046875, 0.0077362060546875, 0.06060791015625, 0.1134796142578125, 0.166351318359375, 0.2192230224609375, 0.2720947265625, 0.3249664306640625, 0.377838134765625, 0.4307098388671875, 0.48358154296875, 0.5364532470703125, 0.589324951171875, 0.6421966552734375, 0.695068359375, 0.7479400634765625, 0.800811767578125, 0.8536834716796875, 0.90655517578125, 0.9594268798828125, 1.012298583984375, 1.0651702880859375, 1.1180419921875, 1.1709136962890625, 1.223785400390625, 1.2766571044921875, 1.32952880859375, 1.3824005126953125, 1.435272216796875, 1.4881439208984375, 1.541015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 9.0, 12.0, 27.0, 29.0, 39.0, 63.0, 96.0, 150.0, 184.0, 258.0, 435.0, 705.0, 986.0, 1566.0, 2348.0, 3532.0, 5454.0, 8265.0, 12362.0, 20093.0, 37582.0, 1878648.0, 56721.0, 24932.0, 14518.0, 9487.0, 6232.0, 4264.0, 2787.0, 1876.0, 1185.0, 755.0, 512.0, 332.0, 233.0, 136.0, 94.0, 48.0, 55.0, 30.0, 23.0, 14.0, 19.0, 12.0, 10.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.25390625, -1.215545654296875, -1.17718505859375, -1.138824462890625, -1.1004638671875, -1.062103271484375, -1.02374267578125, -0.985382080078125, -0.947021484375, -0.908660888671875, -0.87030029296875, -0.831939697265625, -0.7935791015625, -0.755218505859375, -0.71685791015625, -0.678497314453125, -0.64013671875, -0.601776123046875, -0.56341552734375, -0.525054931640625, -0.4866943359375, -0.448333740234375, -0.40997314453125, -0.371612548828125, -0.333251953125, -0.294891357421875, -0.25653076171875, -0.218170166015625, -0.1798095703125, -0.141448974609375, -0.10308837890625, -0.064727783203125, -0.0263671875, 0.011993408203125, 0.05035400390625, 0.088714599609375, 0.1270751953125, 0.165435791015625, 0.20379638671875, 0.242156982421875, 0.280517578125, 0.318878173828125, 0.35723876953125, 0.395599365234375, 0.4339599609375, 0.472320556640625, 0.51068115234375, 0.549041748046875, 0.58740234375, 0.625762939453125, 0.66412353515625, 0.702484130859375, 0.7408447265625, 0.779205322265625, 0.81756591796875, 0.855926513671875, 0.894287109375, 0.932647705078125, 0.97100830078125, 1.009368896484375, 1.0477294921875, 1.086090087890625, 1.12445068359375, 1.162811279296875, 1.201171875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 8.0, 10.0, 16.0, 17.0, 12.0, 13.0, 18.0, 33.0, 24.0, 31.0, 32.0, 35.0, 41.0, 32.0, 36.0, 37.0, 45.0, 43.0, 46.0, 39.0, 35.0, 44.0, 36.0, 37.0, 30.0, 36.0, 29.0, 21.0, 22.0, 20.0, 19.0, 13.0, 15.0, 14.0, 7.0, 9.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0213623046875, -0.020690202713012695, -0.02001810073852539, -0.019345998764038086, -0.01867389678955078, -0.018001794815063477, -0.017329692840576172, -0.016657590866088867, -0.015985488891601562, -0.015313386917114258, -0.014641284942626953, -0.013969182968139648, -0.013297080993652344, -0.012624979019165039, -0.011952877044677734, -0.01128077507019043, -0.010608673095703125, -0.00993657112121582, -0.009264469146728516, -0.008592367172241211, -0.007920265197753906, -0.0072481632232666016, -0.006576061248779297, -0.005903959274291992, -0.0052318572998046875, -0.004559755325317383, -0.003887653350830078, -0.0032155513763427734, -0.0025434494018554688, -0.001871347427368164, -0.0011992454528808594, -0.0005271434783935547, 0.00014495849609375, 0.0008170604705810547, 0.0014891624450683594, 0.002161264419555664, 0.0028333663940429688, 0.0035054683685302734, 0.004177570343017578, 0.004849672317504883, 0.0055217742919921875, 0.006193876266479492, 0.006865978240966797, 0.0075380802154541016, 0.008210182189941406, 0.008882284164428711, 0.009554386138916016, 0.01022648811340332, 0.010898590087890625, 0.01157069206237793, 0.012242794036865234, 0.012914896011352539, 0.013586997985839844, 0.014259099960327148, 0.014931201934814453, 0.015603303909301758, 0.016275405883789062, 0.016947507858276367, 0.017619609832763672, 0.018291711807250977, 0.01896381378173828, 0.019635915756225586, 0.02030801773071289, 0.020980119705200195, 0.0216522216796875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 9.0, 6.0, 16.0, 12.0, 21.0, 17.0, 28.0, 36.0, 46.0, 51.0, 86.0, 97.0, 149.0, 257.0, 368.0, 770.0, 6679.0, 186958.0, 810542.0, 38713.0, 2080.0, 542.0, 323.0, 193.0, 136.0, 104.0, 68.0, 58.0, 38.0, 30.0, 20.0, 23.0, 15.0, 11.0, 8.0, 2.0, 6.0, 5.0, 5.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4147682189941406, -0.40106964111328125, -0.3873710632324219, -0.3736724853515625, -0.3599739074707031, -0.34627532958984375, -0.3325767517089844, -0.318878173828125, -0.3051795959472656, -0.29148101806640625, -0.2777824401855469, -0.2640838623046875, -0.2503852844238281, -0.23668670654296875, -0.22298812866210938, -0.20928955078125, -0.19559097290039062, -0.18189239501953125, -0.16819381713867188, -0.1544952392578125, -0.14079666137695312, -0.12709808349609375, -0.11339950561523438, -0.099700927734375, -0.08600234985351562, -0.07230377197265625, -0.058605194091796875, -0.0449066162109375, -0.031208038330078125, -0.01750946044921875, -0.003810882568359375, 0.0098876953125, 0.023586273193359375, 0.03728485107421875, 0.050983428955078125, 0.0646820068359375, 0.07838058471679688, 0.09207916259765625, 0.10577774047851562, 0.119476318359375, 0.13317489624023438, 0.14687347412109375, 0.16057205200195312, 0.1742706298828125, 0.18796920776367188, 0.20166778564453125, 0.21536636352539062, 0.22906494140625, 0.24276351928710938, 0.25646209716796875, 0.2701606750488281, 0.2838592529296875, 0.2975578308105469, 0.31125640869140625, 0.3249549865722656, 0.338653564453125, 0.3523521423339844, 0.36605072021484375, 0.3797492980957031, 0.3934478759765625, 0.4071464538574219, 0.42084503173828125, 0.4345436096191406, 0.4482421875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 11.0, 11.0, 19.0, 41.0, 57.0, 125.0, 319.0, 207.0, 99.0, 41.0, 39.0, 12.0, 9.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37152349948883057, -0.3614283800125122, -0.35133323073387146, -0.3412380814552307, -0.33114296197891235, -0.321047842502594, -0.31095269322395325, -0.3008575439453125, -0.29076242446899414, -0.2806673049926758, -0.27057215571403503, -0.2604770064353943, -0.2503818869590759, -0.24028675258159637, -0.23019161820411682, -0.22009648382663727, -0.21000134944915771, -0.19990621507167816, -0.1898110806941986, -0.17971594631671906, -0.1696208119392395, -0.15952567756175995, -0.1494305431842804, -0.13933540880680084, -0.1292402744293213, -0.11914514005184174, -0.10905000567436218, -0.09895487129688263, -0.08885973691940308, -0.07876460254192352, -0.06866946816444397, -0.058574333786964417, -0.04847922921180725, -0.0383840948343277, -0.028288960456848145, -0.01819382607936859, -0.008098691701889038, 0.001996442675590515, 0.012091577053070068, 0.02218671143054962, 0.032281845808029175, 0.04237698018550873, 0.05247211456298828, 0.06256724894046783, 0.07266238331794739, 0.08275751769542694, 0.0928526520729065, 0.10294778645038605, 0.1130429208278656, 0.12313805520534515, 0.1332331895828247, 0.14332832396030426, 0.1534234583377838, 0.16351859271526337, 0.17361372709274292, 0.18370886147022247, 0.19380399584770203, 0.20389913022518158, 0.21399426460266113, 0.22408939898014069, 0.23418453335762024, 0.2442796677350998, 0.25437480211257935, 0.2644699215888977, 0.27456507086753845]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 10.0, 10.0, 6.0, 11.0, 17.0, 21.0, 26.0, 16.0, 22.0, 28.0, 44.0, 26.0, 34.0, 32.0, 22.0, 26.0, 39.0, 35.0, 35.0, 38.0, 31.0, 44.0, 42.0, 36.0, 39.0, 37.0, 36.0, 25.0, 23.0, 24.0, 19.0, 25.0, 16.0, 12.0, 15.0, 10.0, 9.0, 14.0, 6.0, 5.0, 8.0, 3.0, 2.0, 6.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.025686264038085938, -0.024836836382746696, -0.023987408727407455, -0.023137981072068214, -0.022288553416728973, -0.021439125761389732, -0.02058969810605049, -0.01974027045071125, -0.01889084279537201, -0.018041415140032768, -0.017191987484693527, -0.016342559829354286, -0.015493132174015045, -0.014643704518675804, -0.013794276863336563, -0.012944849207997322, -0.012095421552658081, -0.01124599389731884, -0.010396566241979599, -0.009547138586640358, -0.008697710931301117, -0.007848283275961876, -0.006998855620622635, -0.006149427965283394, -0.005300000309944153, -0.004450572654604912, -0.0036011449992656708, -0.0027517173439264297, -0.0019022896885871887, -0.0010528620332479477, -0.00020343437790870667, 0.0006459932774305344, 0.0014954209327697754, 0.0023448485881090164, 0.0031942762434482574, 0.0040437038987874985, 0.0048931315541267395, 0.0057425592094659805, 0.0065919868648052216, 0.007441414520144463, 0.008290842175483704, 0.009140269830822945, 0.009989697486162186, 0.010839125141501427, 0.011688552796840668, 0.012537980452179909, 0.01338740810751915, 0.01423683576285839, 0.015086263418197632, 0.015935691073536873, 0.016785118728876114, 0.017634546384215355, 0.018483974039554596, 0.019333401694893837, 0.020182829350233078, 0.02103225700557232, 0.02188168466091156, 0.0227311123162508, 0.023580539971590042, 0.024429967626929283, 0.025279395282268524, 0.026128822937607765, 0.026978250592947006, 0.027827678248286247, 0.02867710590362549]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 11.0, 11.0, 11.0, 14.0, 21.0, 24.0, 21.0, 31.0, 23.0, 40.0, 33.0, 44.0, 35.0, 43.0, 51.0, 36.0, 45.0, 50.0, 45.0, 42.0, 30.0, 33.0, 26.0, 32.0, 34.0, 28.0, 42.0, 22.0, 24.0, 9.0, 16.0, 17.0, 13.0, 10.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.49609375, -2.420989990234375, -2.34588623046875, -2.270782470703125, -2.1956787109375, -2.120574951171875, -2.04547119140625, -1.970367431640625, -1.895263671875, -1.820159912109375, -1.74505615234375, -1.669952392578125, -1.5948486328125, -1.519744873046875, -1.44464111328125, -1.369537353515625, -1.29443359375, -1.219329833984375, -1.14422607421875, -1.069122314453125, -0.9940185546875, -0.918914794921875, -0.84381103515625, -0.768707275390625, -0.693603515625, -0.618499755859375, -0.54339599609375, -0.468292236328125, -0.3931884765625, -0.318084716796875, -0.24298095703125, -0.167877197265625, -0.0927734375, -0.017669677734375, 0.05743408203125, 0.132537841796875, 0.2076416015625, 0.282745361328125, 0.35784912109375, 0.432952880859375, 0.508056640625, 0.583160400390625, 0.65826416015625, 0.733367919921875, 0.8084716796875, 0.883575439453125, 0.95867919921875, 1.033782958984375, 1.10888671875, 1.183990478515625, 1.25909423828125, 1.334197998046875, 1.4093017578125, 1.484405517578125, 1.55950927734375, 1.634613037109375, 1.709716796875, 1.784820556640625, 1.85992431640625, 1.935028076171875, 2.0101318359375, 2.085235595703125, 2.16033935546875, 2.235443115234375, 2.310546875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 15.0, 17.0, 20.0, 34.0, 46.0, 79.0, 125.0, 214.0, 336.0, 581.0, 1016.0, 1813.0, 3080.0, 5453.0, 9703.0, 17714.0, 35684.0, 88546.0, 258393.0, 358937.0, 156990.0, 54497.0, 24976.0, 13088.0, 7324.0, 4245.0, 2346.0, 1390.0, 743.0, 434.0, 260.0, 140.0, 113.0, 48.0, 35.0, 21.0, 20.0, 18.0, 16.0, 7.0, 3.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.822265625, -2.734771728515625, -2.64727783203125, -2.559783935546875, -2.4722900390625, -2.384796142578125, -2.29730224609375, -2.209808349609375, -2.122314453125, -2.034820556640625, -1.94732666015625, -1.859832763671875, -1.7723388671875, -1.684844970703125, -1.59735107421875, -1.509857177734375, -1.42236328125, -1.334869384765625, -1.24737548828125, -1.159881591796875, -1.0723876953125, -0.984893798828125, -0.89739990234375, -0.809906005859375, -0.722412109375, -0.634918212890625, -0.54742431640625, -0.459930419921875, -0.3724365234375, -0.284942626953125, -0.19744873046875, -0.109954833984375, -0.0224609375, 0.065032958984375, 0.15252685546875, 0.240020751953125, 0.3275146484375, 0.415008544921875, 0.50250244140625, 0.589996337890625, 0.677490234375, 0.764984130859375, 0.85247802734375, 0.939971923828125, 1.0274658203125, 1.114959716796875, 1.20245361328125, 1.289947509765625, 1.37744140625, 1.464935302734375, 1.55242919921875, 1.639923095703125, 1.7274169921875, 1.814910888671875, 1.90240478515625, 1.989898681640625, 2.077392578125, 2.164886474609375, 2.25238037109375, 2.339874267578125, 2.4273681640625, 2.514862060546875, 2.60235595703125, 2.689849853515625, 2.77734375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 2.0, 5.0, 11.0, 11.0, 14.0, 20.0, 20.0, 21.0, 16.0, 38.0, 40.0, 45.0, 42.0, 55.0, 55.0, 111.0, 220.0, 1498.0, 277.0, 115.0, 90.0, 47.0, 58.0, 37.0, 35.0, 29.0, 29.0, 22.0, 12.0, 13.0, 6.0, 11.0, 10.0, 9.0, 4.0, 2.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.8359375, -11.5211181640625, -11.206298828125, -10.8914794921875, -10.57666015625, -10.2618408203125, -9.947021484375, -9.6322021484375, -9.3173828125, -9.0025634765625, -8.687744140625, -8.3729248046875, -8.05810546875, -7.7432861328125, -7.428466796875, -7.1136474609375, -6.798828125, -6.4840087890625, -6.169189453125, -5.8543701171875, -5.53955078125, -5.2247314453125, -4.909912109375, -4.5950927734375, -4.2802734375, -3.9654541015625, -3.650634765625, -3.3358154296875, -3.02099609375, -2.7061767578125, -2.391357421875, -2.0765380859375, -1.76171875, -1.4468994140625, -1.132080078125, -0.8172607421875, -0.50244140625, -0.1876220703125, 0.127197265625, 0.4420166015625, 0.7568359375, 1.0716552734375, 1.386474609375, 1.7012939453125, 2.01611328125, 2.3309326171875, 2.645751953125, 2.9605712890625, 3.275390625, 3.5902099609375, 3.905029296875, 4.2198486328125, 4.53466796875, 4.8494873046875, 5.164306640625, 5.4791259765625, 5.7939453125, 6.1087646484375, 6.423583984375, 6.7384033203125, 7.05322265625, 7.3680419921875, 7.682861328125, 7.9976806640625, 8.3125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 3.0, 6.0, 6.0, 7.0, 14.0, 20.0, 23.0, 30.0, 44.0, 46.0, 78.0, 107.0, 171.0, 297.0, 604.0, 2700.0, 63522.0, 3003749.0, 69930.0, 2773.0, 661.0, 303.0, 168.0, 106.0, 87.0, 54.0, 39.0, 32.0, 30.0, 22.0, 20.0, 12.0, 9.0, 8.0, 4.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.96875, -17.35986328125, -16.7509765625, -16.14208984375, -15.533203125, -14.92431640625, -14.3154296875, -13.70654296875, -13.09765625, -12.48876953125, -11.8798828125, -11.27099609375, -10.662109375, -10.05322265625, -9.4443359375, -8.83544921875, -8.2265625, -7.61767578125, -7.0087890625, -6.39990234375, -5.791015625, -5.18212890625, -4.5732421875, -3.96435546875, -3.35546875, -2.74658203125, -2.1376953125, -1.52880859375, -0.919921875, -0.31103515625, 0.2978515625, 0.90673828125, 1.515625, 2.12451171875, 2.7333984375, 3.34228515625, 3.951171875, 4.56005859375, 5.1689453125, 5.77783203125, 6.38671875, 6.99560546875, 7.6044921875, 8.21337890625, 8.822265625, 9.43115234375, 10.0400390625, 10.64892578125, 11.2578125, 11.86669921875, 12.4755859375, 13.08447265625, 13.693359375, 14.30224609375, 14.9111328125, 15.52001953125, 16.12890625, 16.73779296875, 17.3466796875, 17.95556640625, 18.564453125, 19.17333984375, 19.7822265625, 20.39111328125, 21.0]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 32.0, 186.0, 352.0, 309.0, 107.0, 21.0, 4.0], "bins": [-90.21656799316406, -88.70793151855469, -87.19928741455078, -85.6906509399414, -84.1820068359375, -82.67337036132812, -81.16472625732422, -79.65608978271484, -78.14744567871094, -76.63880920410156, -75.13016510009766, -73.62152862548828, -72.11288452148438, -70.604248046875, -69.0956039428711, -67.58696746826172, -66.07833099365234, -64.56969451904297, -63.06105041503906, -61.55241012573242, -60.04376983642578, -58.535133361816406, -57.0264892578125, -55.517852783203125, -54.00920867919922, -52.50056838989258, -50.99192810058594, -49.4832878112793, -47.974647521972656, -46.46601104736328, -44.957366943359375, -43.44873046875, -41.940086364746094, -40.43144607543945, -38.92280578613281, -37.41416549682617, -35.90552520751953, -34.396888732910156, -32.88824462890625, -31.379608154296875, -29.870967864990234, -28.362327575683594, -26.853687286376953, -25.345046997070312, -23.836408615112305, -22.327768325805664, -20.819128036499023, -19.310489654541016, -17.801847457885742, -16.2932071685791, -14.784567832946777, -13.275927543640137, -11.767288208007812, -10.258647918701172, -8.750007629394531, -7.241368293762207, -5.732728481292725, -4.224088668823242, -2.7154486179351807, -1.2068085670471191, 0.3018312454223633, 1.8104710578918457, 3.3191113471984863, 4.8277506828308105, 6.336390972137451]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 8.0, 14.0, 11.0, 15.0, 18.0, 10.0, 16.0, 19.0, 23.0, 27.0, 22.0, 39.0, 31.0, 42.0, 42.0, 33.0, 24.0, 37.0, 49.0, 39.0, 40.0, 37.0, 25.0, 42.0, 42.0, 35.0, 31.0, 29.0, 35.0, 24.0, 24.0, 12.0, 15.0, 18.0, 9.0, 14.0, 12.0, 12.0, 6.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.8539981842041, -21.171533584594727, -20.48906707763672, -19.806602478027344, -19.12413787841797, -18.44167137145996, -17.759206771850586, -17.076740264892578, -16.394275665283203, -15.711810111999512, -15.02934455871582, -14.346879959106445, -13.664414405822754, -12.981948852539062, -12.299484252929688, -11.617018699645996, -10.934553146362305, -10.252087593078613, -9.569622039794922, -8.887157440185547, -8.204691886901855, -7.522226333618164, -6.839761257171631, -6.157296180725098, -5.474830627441406, -4.792365074157715, -4.109899997711182, -3.4274346828460693, -2.744969367980957, -2.0625040531158447, -1.3800387382507324, -0.6975736618041992, -0.015108108520507812, 0.6673572063446045, 1.3498225212097168, 2.032287836074829, 2.7147531509399414, 3.3972184658050537, 4.079683780670166, 4.762148857116699, 5.444614410400391, 6.127079963684082, 6.809545040130615, 7.492010116577148, 8.17447566986084, 8.856941223144531, 9.539405822753906, 10.221871376037598, 10.904336929321289, 11.58680248260498, 12.269268035888672, 12.951732635498047, 13.634198188781738, 14.31666374206543, 14.999128341674805, 15.681593894958496, 16.364059448242188, 17.046524047851562, 17.72899055480957, 18.411455154418945, 19.093921661376953, 19.776386260986328, 20.458850860595703, 21.141315460205078, 21.823781967163086]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 11.0, 9.0, 12.0, 23.0, 16.0, 21.0, 29.0, 37.0, 45.0, 30.0, 31.0, 39.0, 42.0, 30.0, 31.0, 39.0, 40.0, 41.0, 35.0, 34.0, 36.0, 28.0, 32.0, 30.0, 22.0, 37.0, 36.0, 27.0, 25.0, 23.0, 7.0, 10.0, 10.0, 12.0, 9.0, 5.0, 4.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.30859375, -2.235931396484375, -2.16326904296875, -2.090606689453125, -2.0179443359375, -1.945281982421875, -1.87261962890625, -1.799957275390625, -1.727294921875, -1.654632568359375, -1.58197021484375, -1.509307861328125, -1.4366455078125, -1.363983154296875, -1.29132080078125, -1.218658447265625, -1.14599609375, -1.073333740234375, -1.00067138671875, -0.928009033203125, -0.8553466796875, -0.782684326171875, -0.71002197265625, -0.637359619140625, -0.564697265625, -0.492034912109375, -0.41937255859375, -0.346710205078125, -0.2740478515625, -0.201385498046875, -0.12872314453125, -0.056060791015625, 0.0166015625, 0.089263916015625, 0.16192626953125, 0.234588623046875, 0.3072509765625, 0.379913330078125, 0.45257568359375, 0.525238037109375, 0.597900390625, 0.670562744140625, 0.74322509765625, 0.815887451171875, 0.8885498046875, 0.961212158203125, 1.03387451171875, 1.106536865234375, 1.17919921875, 1.251861572265625, 1.32452392578125, 1.397186279296875, 1.4698486328125, 1.542510986328125, 1.61517333984375, 1.687835693359375, 1.760498046875, 1.833160400390625, 1.90582275390625, 1.978485107421875, 2.0511474609375, 2.123809814453125, 2.19647216796875, 2.269134521484375, 2.341796875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 4.0, 3.0, 8.0, 14.0, 18.0, 19.0, 21.0, 22.0, 25.0, 54.0, 48.0, 53.0, 66.0, 116.0, 163.0, 252.0, 695.0, 2380.0, 11857.0, 94440.0, 1147820.0, 2578471.0, 319756.0, 30785.0, 4857.0, 1159.0, 431.0, 194.0, 117.0, 96.0, 63.0, 49.0, 39.0, 30.0, 28.0, 27.0, 22.0, 13.0, 15.0, 12.0, 8.0, 7.0, 4.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.38671875, -7.15765380859375, -6.9285888671875, -6.69952392578125, -6.470458984375, -6.24139404296875, -6.0123291015625, -5.78326416015625, -5.55419921875, -5.32513427734375, -5.0960693359375, -4.86700439453125, -4.637939453125, -4.40887451171875, -4.1798095703125, -3.95074462890625, -3.7216796875, -3.49261474609375, -3.2635498046875, -3.03448486328125, -2.805419921875, -2.57635498046875, -2.3472900390625, -2.11822509765625, -1.88916015625, -1.66009521484375, -1.4310302734375, -1.20196533203125, -0.972900390625, -0.74383544921875, -0.5147705078125, -0.28570556640625, -0.056640625, 0.17242431640625, 0.4014892578125, 0.63055419921875, 0.859619140625, 1.08868408203125, 1.3177490234375, 1.54681396484375, 1.77587890625, 2.00494384765625, 2.2340087890625, 2.46307373046875, 2.692138671875, 2.92120361328125, 3.1502685546875, 3.37933349609375, 3.6083984375, 3.83746337890625, 4.0665283203125, 4.29559326171875, 4.524658203125, 4.75372314453125, 4.9827880859375, 5.21185302734375, 5.44091796875, 5.66998291015625, 5.8990478515625, 6.12811279296875, 6.357177734375, 6.58624267578125, 6.8153076171875, 7.04437255859375, 7.2734375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 13.0, 25.0, 34.0, 63.0, 82.0, 137.0, 207.0, 293.0, 404.0, 511.0, 630.0, 526.0, 379.0, 259.0, 189.0, 106.0, 69.0, 51.0, 32.0, 18.0, 15.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.063232421875, -8.81396484375, -8.564697265625, -8.3154296875, -8.066162109375, -7.81689453125, -7.567626953125, -7.318359375, -7.069091796875, -6.81982421875, -6.570556640625, -6.3212890625, -6.072021484375, -5.82275390625, -5.573486328125, -5.32421875, -5.074951171875, -4.82568359375, -4.576416015625, -4.3271484375, -4.077880859375, -3.82861328125, -3.579345703125, -3.330078125, -3.080810546875, -2.83154296875, -2.582275390625, -2.3330078125, -2.083740234375, -1.83447265625, -1.585205078125, -1.3359375, -1.086669921875, -0.83740234375, -0.588134765625, -0.3388671875, -0.089599609375, 0.15966796875, 0.408935546875, 0.658203125, 0.907470703125, 1.15673828125, 1.406005859375, 1.6552734375, 1.904541015625, 2.15380859375, 2.403076171875, 2.65234375, 2.901611328125, 3.15087890625, 3.400146484375, 3.6494140625, 3.898681640625, 4.14794921875, 4.397216796875, 4.646484375, 4.895751953125, 5.14501953125, 5.394287109375, 5.6435546875, 5.892822265625, 6.14208984375, 6.391357421875, 6.640625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 5.0, 8.0, 5.0, 11.0, 25.0, 31.0, 50.0, 79.0, 152.0, 260.0, 676.0, 3363.0, 103194.0, 3519122.0, 555920.0, 9476.0, 1065.0, 376.0, 185.0, 121.0, 50.0, 45.0, 28.0, 13.0, 8.0, 13.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.640625, -16.01708984375, -15.3935546875, -14.77001953125, -14.146484375, -13.52294921875, -12.8994140625, -12.27587890625, -11.65234375, -11.02880859375, -10.4052734375, -9.78173828125, -9.158203125, -8.53466796875, -7.9111328125, -7.28759765625, -6.6640625, -6.04052734375, -5.4169921875, -4.79345703125, -4.169921875, -3.54638671875, -2.9228515625, -2.29931640625, -1.67578125, -1.05224609375, -0.4287109375, 0.19482421875, 0.818359375, 1.44189453125, 2.0654296875, 2.68896484375, 3.3125, 3.93603515625, 4.5595703125, 5.18310546875, 5.806640625, 6.43017578125, 7.0537109375, 7.67724609375, 8.30078125, 8.92431640625, 9.5478515625, 10.17138671875, 10.794921875, 11.41845703125, 12.0419921875, 12.66552734375, 13.2890625, 13.91259765625, 14.5361328125, 15.15966796875, 15.783203125, 16.40673828125, 17.0302734375, 17.65380859375, 18.27734375, 18.90087890625, 19.5244140625, 20.14794921875, 20.771484375, 21.39501953125, 22.0185546875, 22.64208984375, 23.265625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 10.0, 17.0, 25.0, 49.0, 69.0, 91.0, 95.0, 99.0, 112.0, 89.0, 106.0, 70.0, 63.0, 52.0, 22.0, 10.0, 9.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.17569923400879, -25.17813491821289, -24.180570602416992, -23.183006286621094, -22.185441970825195, -21.187877655029297, -20.1903133392334, -19.1927490234375, -18.1951847076416, -17.197620391845703, -16.200056076049805, -15.202491760253906, -14.204927444458008, -13.20736312866211, -12.209798812866211, -11.212234497070312, -10.214670181274414, -9.217105865478516, -8.219541549682617, -7.221977233886719, -6.22441291809082, -5.226848602294922, -4.229284286499023, -3.231719970703125, -2.2341556549072266, -1.2365913391113281, -0.2390270233154297, 0.7585372924804688, 1.7561016082763672, 2.7536659240722656, 3.751230239868164, 4.7487945556640625, 5.746360778808594, 6.743925094604492, 7.741489410400391, 8.739053726196289, 9.736618041992188, 10.734182357788086, 11.731746673583984, 12.729310989379883, 13.726875305175781, 14.72443962097168, 15.722003936767578, 16.719568252563477, 17.717132568359375, 18.714696884155273, 19.712261199951172, 20.70982551574707, 21.70738983154297, 22.704954147338867, 23.702518463134766, 24.700082778930664, 25.697647094726562, 26.69521141052246, 27.69277572631836, 28.690340042114258, 29.687904357910156, 30.685468673706055, 31.683032989501953, 32.68059539794922, 33.67816162109375, 34.67572784423828, 35.67329025268555, 36.67085266113281, 37.668418884277344]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 3.0, 10.0, 7.0, 14.0, 11.0, 6.0, 8.0, 15.0, 17.0, 25.0, 19.0, 22.0, 30.0, 36.0, 24.0, 36.0, 36.0, 36.0, 41.0, 40.0, 39.0, 35.0, 30.0, 41.0, 45.0, 30.0, 30.0, 43.0, 33.0, 34.0, 26.0, 29.0, 27.0, 21.0, 21.0, 16.0, 12.0, 8.0, 8.0, 6.0, 6.0, 4.0, 6.0, 7.0, 8.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.697078704833984, -16.167081832885742, -15.637084007263184, -15.107086181640625, -14.577089309692383, -14.047091484069824, -13.517093658447266, -12.987096786499023, -12.457099914550781, -11.927102088928223, -11.39710521697998, -10.867107391357422, -10.33711051940918, -9.807112693786621, -9.277114868164062, -8.74711799621582, -8.217120170593262, -7.687122821807861, -7.157125473022461, -6.627127647399902, -6.09713077545166, -5.567132949829102, -5.037135601043701, -4.507138252258301, -3.9771409034729004, -3.4471435546875, -2.9171462059020996, -2.38714861869812, -1.8571512699127197, -1.3271539211273193, -0.7971563339233398, -0.26715898513793945, 0.26283836364746094, 0.7928357720375061, 1.3228331804275513, 1.8528306484222412, 2.3828279972076416, 2.912825345993042, 3.4428229331970215, 3.972820281982422, 4.502817630767822, 5.032814979553223, 5.562812328338623, 6.092809677124023, 6.622807502746582, 7.152804374694824, 7.682802200317383, 8.212799072265625, 8.742796897888184, 9.272794723510742, 9.802791595458984, 10.332789421081543, 10.862786293029785, 11.392784118652344, 11.922780990600586, 12.452778816223145, 12.982776641845703, 13.512774467468262, 14.042771339416504, 14.572769165039062, 15.102766036987305, 15.632763862609863, 16.162761688232422, 16.692758560180664, 17.222755432128906]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 10.0, 10.0, 15.0, 14.0, 19.0, 25.0, 14.0, 15.0, 28.0, 28.0, 24.0, 36.0, 43.0, 35.0, 40.0, 38.0, 41.0, 34.0, 38.0, 45.0, 49.0, 41.0, 34.0, 27.0, 28.0, 39.0, 26.0, 25.0, 21.0, 18.0, 15.0, 19.0, 17.0, 15.0, 24.0, 10.0, 4.0, 6.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.302734375, -2.2266845703125, -2.150634765625, -2.0745849609375, -1.99853515625, -1.9224853515625, -1.846435546875, -1.7703857421875, -1.6943359375, -1.6182861328125, -1.542236328125, -1.4661865234375, -1.39013671875, -1.3140869140625, -1.238037109375, -1.1619873046875, -1.0859375, -1.0098876953125, -0.933837890625, -0.8577880859375, -0.78173828125, -0.7056884765625, -0.629638671875, -0.5535888671875, -0.4775390625, -0.4014892578125, -0.325439453125, -0.2493896484375, -0.17333984375, -0.0972900390625, -0.021240234375, 0.0548095703125, 0.130859375, 0.2069091796875, 0.282958984375, 0.3590087890625, 0.43505859375, 0.5111083984375, 0.587158203125, 0.6632080078125, 0.7392578125, 0.8153076171875, 0.891357421875, 0.9674072265625, 1.04345703125, 1.1195068359375, 1.195556640625, 1.2716064453125, 1.34765625, 1.4237060546875, 1.499755859375, 1.5758056640625, 1.65185546875, 1.7279052734375, 1.803955078125, 1.8800048828125, 1.9560546875, 2.0321044921875, 2.108154296875, 2.1842041015625, 2.26025390625, 2.3363037109375, 2.412353515625, 2.4884033203125, 2.564453125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 21.0, 27.0, 33.0, 46.0, 77.0, 135.0, 188.0, 305.0, 489.0, 815.0, 1219.0, 1904.0, 3003.0, 4755.0, 7412.0, 11218.0, 17137.0, 25591.0, 36606.0, 50933.0, 68089.0, 86390.0, 103049.0, 113310.0, 112608.0, 100595.0, 84531.0, 65149.0, 48401.0, 34599.0, 23955.0, 16079.0, 10624.0, 6958.0, 4420.0, 2865.0, 1889.0, 1134.0, 702.0, 486.0, 292.0, 174.0, 111.0, 83.0, 40.0, 45.0, 26.0, 15.0, 7.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.51019287109375, -0.4925537109375, -0.47491455078125, -0.457275390625, -0.43963623046875, -0.4219970703125, -0.40435791015625, -0.38671875, -0.36907958984375, -0.3514404296875, -0.33380126953125, -0.316162109375, -0.29852294921875, -0.2808837890625, -0.26324462890625, -0.24560546875, -0.22796630859375, -0.2103271484375, -0.19268798828125, -0.175048828125, -0.15740966796875, -0.1397705078125, -0.12213134765625, -0.1044921875, -0.08685302734375, -0.0692138671875, -0.05157470703125, -0.033935546875, -0.01629638671875, 0.0013427734375, 0.01898193359375, 0.03662109375, 0.05426025390625, 0.0718994140625, 0.08953857421875, 0.107177734375, 0.12481689453125, 0.1424560546875, 0.16009521484375, 0.177734375, 0.19537353515625, 0.2130126953125, 0.23065185546875, 0.248291015625, 0.26593017578125, 0.2835693359375, 0.30120849609375, 0.31884765625, 0.33648681640625, 0.3541259765625, 0.37176513671875, 0.389404296875, 0.40704345703125, 0.4246826171875, 0.44232177734375, 0.4599609375, 0.47760009765625, 0.4952392578125, 0.51287841796875, 0.530517578125, 0.54815673828125, 0.5657958984375, 0.58343505859375, 0.60107421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 8.0, 12.0, 7.0, 8.0, 17.0, 15.0, 12.0, 18.0, 24.0, 27.0, 25.0, 21.0, 39.0, 47.0, 30.0, 42.0, 41.0, 56.0, 1076.0, 55.0, 34.0, 43.0, 50.0, 31.0, 43.0, 24.0, 27.0, 30.0, 22.0, 23.0, 19.0, 19.0, 17.0, 12.0, 7.0, 12.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.62890625, -2.555145263671875, -2.48138427734375, -2.407623291015625, -2.3338623046875, -2.260101318359375, -2.18634033203125, -2.112579345703125, -2.038818359375, -1.965057373046875, -1.89129638671875, -1.817535400390625, -1.7437744140625, -1.670013427734375, -1.59625244140625, -1.522491455078125, -1.44873046875, -1.374969482421875, -1.30120849609375, -1.227447509765625, -1.1536865234375, -1.079925537109375, -1.00616455078125, -0.932403564453125, -0.858642578125, -0.784881591796875, -0.71112060546875, -0.637359619140625, -0.5635986328125, -0.489837646484375, -0.41607666015625, -0.342315673828125, -0.2685546875, -0.194793701171875, -0.12103271484375, -0.047271728515625, 0.0264892578125, 0.100250244140625, 0.17401123046875, 0.247772216796875, 0.321533203125, 0.395294189453125, 0.46905517578125, 0.542816162109375, 0.6165771484375, 0.690338134765625, 0.76409912109375, 0.837860107421875, 0.91162109375, 0.985382080078125, 1.05914306640625, 1.132904052734375, 1.2066650390625, 1.280426025390625, 1.35418701171875, 1.427947998046875, 1.501708984375, 1.575469970703125, 1.64923095703125, 1.722991943359375, 1.7967529296875, 1.870513916015625, 1.94427490234375, 2.018035888671875, 2.091796875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 12.0, 5.0, 14.0, 24.0, 28.0, 34.0, 47.0, 84.0, 136.0, 204.0, 263.0, 434.0, 659.0, 943.0, 1505.0, 2265.0, 3337.0, 5159.0, 7752.0, 11973.0, 19362.0, 35111.0, 1872959.0, 63789.0, 26591.0, 15492.0, 9959.0, 6598.0, 4243.0, 2816.0, 1844.0, 1167.0, 734.0, 505.0, 337.0, 259.0, 160.0, 103.0, 52.0, 48.0, 43.0, 25.0, 12.0, 13.0, 7.0, 4.0, 8.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2265625, -1.18670654296875, -1.1468505859375, -1.10699462890625, -1.067138671875, -1.02728271484375, -0.9874267578125, -0.94757080078125, -0.90771484375, -0.86785888671875, -0.8280029296875, -0.78814697265625, -0.748291015625, -0.70843505859375, -0.6685791015625, -0.62872314453125, -0.5888671875, -0.54901123046875, -0.5091552734375, -0.46929931640625, -0.429443359375, -0.38958740234375, -0.3497314453125, -0.30987548828125, -0.27001953125, -0.23016357421875, -0.1903076171875, -0.15045166015625, -0.110595703125, -0.07073974609375, -0.0308837890625, 0.00897216796875, 0.048828125, 0.08868408203125, 0.1285400390625, 0.16839599609375, 0.208251953125, 0.24810791015625, 0.2879638671875, 0.32781982421875, 0.36767578125, 0.40753173828125, 0.4473876953125, 0.48724365234375, 0.527099609375, 0.56695556640625, 0.6068115234375, 0.64666748046875, 0.6865234375, 0.72637939453125, 0.7662353515625, 0.80609130859375, 0.845947265625, 0.88580322265625, 0.9256591796875, 0.96551513671875, 1.00537109375, 1.04522705078125, 1.0850830078125, 1.12493896484375, 1.164794921875, 1.20465087890625, 1.2445068359375, 1.28436279296875, 1.32421875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 3.0, 7.0, 10.0, 9.0, 16.0, 22.0, 19.0, 20.0, 20.0, 36.0, 45.0, 44.0, 62.0, 69.0, 63.0, 67.0, 47.0, 62.0, 63.0, 61.0, 44.0, 35.0, 33.0, 28.0, 27.0, 19.0, 12.0, 15.0, 3.0, 5.0, 7.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.02972412109375, -0.028800249099731445, -0.02787637710571289, -0.026952505111694336, -0.02602863311767578, -0.025104761123657227, -0.024180889129638672, -0.023257017135620117, -0.022333145141601562, -0.021409273147583008, -0.020485401153564453, -0.0195615291595459, -0.018637657165527344, -0.01771378517150879, -0.016789913177490234, -0.01586604118347168, -0.014942169189453125, -0.01401829719543457, -0.013094425201416016, -0.012170553207397461, -0.011246681213378906, -0.010322809219360352, -0.009398937225341797, -0.008475065231323242, -0.0075511932373046875, -0.006627321243286133, -0.005703449249267578, -0.0047795772552490234, -0.0038557052612304688, -0.002931833267211914, -0.0020079612731933594, -0.0010840892791748047, -0.00016021728515625, 0.0007636547088623047, 0.0016875267028808594, 0.002611398696899414, 0.0035352706909179688, 0.0044591426849365234, 0.005383014678955078, 0.006306886672973633, 0.0072307586669921875, 0.008154630661010742, 0.009078502655029297, 0.010002374649047852, 0.010926246643066406, 0.011850118637084961, 0.012773990631103516, 0.01369786262512207, 0.014621734619140625, 0.01554560661315918, 0.016469478607177734, 0.01739335060119629, 0.018317222595214844, 0.0192410945892334, 0.020164966583251953, 0.021088838577270508, 0.022012710571289062, 0.022936582565307617, 0.023860454559326172, 0.024784326553344727, 0.02570819854736328, 0.026632070541381836, 0.02755594253540039, 0.028479814529418945, 0.0294036865234375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 7.0, 2.0, 3.0, 15.0, 12.0, 13.0, 25.0, 28.0, 23.0, 44.0, 55.0, 73.0, 101.0, 176.0, 301.0, 557.0, 4105.0, 146987.0, 861679.0, 31739.0, 1415.0, 427.0, 267.0, 159.0, 95.0, 50.0, 39.0, 27.0, 26.0, 15.0, 17.0, 19.0, 7.0, 10.0, 8.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.55029296875, -0.5337677001953125, -0.517242431640625, -0.5007171630859375, -0.48419189453125, -0.4676666259765625, -0.451141357421875, -0.4346160888671875, -0.4180908203125, -0.4015655517578125, -0.385040283203125, -0.3685150146484375, -0.35198974609375, -0.3354644775390625, -0.318939208984375, -0.3024139404296875, -0.285888671875, -0.2693634033203125, -0.252838134765625, -0.2363128662109375, -0.21978759765625, -0.2032623291015625, -0.186737060546875, -0.1702117919921875, -0.1536865234375, -0.1371612548828125, -0.120635986328125, -0.1041107177734375, -0.08758544921875, -0.0710601806640625, -0.054534912109375, -0.0380096435546875, -0.021484375, -0.0049591064453125, 0.011566162109375, 0.0280914306640625, 0.04461669921875, 0.0611419677734375, 0.077667236328125, 0.0941925048828125, 0.1107177734375, 0.1272430419921875, 0.143768310546875, 0.1602935791015625, 0.17681884765625, 0.1933441162109375, 0.209869384765625, 0.2263946533203125, 0.242919921875, 0.2594451904296875, 0.275970458984375, 0.2924957275390625, 0.30902099609375, 0.3255462646484375, 0.342071533203125, 0.3585968017578125, 0.3751220703125, 0.3916473388671875, 0.408172607421875, 0.4246978759765625, 0.44122314453125, 0.4577484130859375, 0.474273681640625, 0.4907989501953125, 0.50732421875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 10.0, 22.0, 49.0, 177.0, 555.0, 141.0, 43.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0393935441970825, -1.019557237625122, -0.9997209906578064, -0.979884684085846, -0.9600484371185303, -0.9402121305465698, -0.9203758239746094, -0.9005395174026489, -0.8807032704353333, -0.8608669638633728, -0.8410307168960571, -0.8211944103240967, -0.8013581037521362, -0.7815218567848206, -0.7616855502128601, -0.7418493032455444, -0.722012996673584, -0.7021766901016235, -0.6823404431343079, -0.6625041365623474, -0.6426678895950317, -0.6228315830230713, -0.6029952764511108, -0.5831589698791504, -0.5633227229118347, -0.5434864163398743, -0.5236501693725586, -0.5038138628005981, -0.4839775860309601, -0.464141309261322, -0.4443050026893616, -0.4244687259197235, -0.40463244915008545, -0.3847961723804474, -0.3649598956108093, -0.3451235890388489, -0.3252873122692108, -0.30545103549957275, -0.2856147289276123, -0.26577845215797424, -0.24594219028949738, -0.22610589861869812, -0.20626962184906006, -0.186433345079422, -0.16659705340862274, -0.1467607617378235, -0.12692448496818542, -0.10708819329738617, -0.08725191652774811, -0.06741563230752945, -0.04757934808731079, -0.027743063867092133, -0.007906779646873474, 0.011929504573345184, 0.03176578879356384, 0.0516020804643631, 0.07143835723400116, 0.09127464145421982, 0.11111092567443848, 0.13094720244407654, 0.1507834941148758, 0.17061978578567505, 0.1904560625553131, 0.21029235422611237, 0.23012863099575043]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 2.0, 6.0, 6.0, 13.0, 18.0, 15.0, 17.0, 26.0, 22.0, 24.0, 29.0, 50.0, 46.0, 47.0, 33.0, 41.0, 52.0, 40.0, 50.0, 58.0, 42.0, 41.0, 46.0, 44.0, 43.0, 33.0, 29.0, 29.0, 17.0, 17.0, 10.0, 8.0, 10.0, 12.0, 11.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04792982339859009, -0.04630105942487717, -0.04467229172587395, -0.04304352402687073, -0.041414760053157806, -0.039785996079444885, -0.038157228380441666, -0.036528460681438446, -0.034899696707725525, -0.033270932734012604, -0.031642165035009384, -0.030013399198651314, -0.028384633362293243, -0.026755867525935173, -0.025127101689577103, -0.023498335853219032, -0.021869570016860962, -0.02024080418050289, -0.01861203834414482, -0.01698327250778675, -0.01535450667142868, -0.01372574083507061, -0.01209697499871254, -0.01046820916235447, -0.008839443325996399, -0.0072106774896383286, -0.005581911653280258, -0.003953145816922188, -0.0023243799805641174, -0.0006956141442060471, 0.0009331516921520233, 0.0025619175285100937, 0.004190683364868164, 0.0058194492012262344, 0.007448215037584305, 0.009076980873942375, 0.010705746710300446, 0.012334512546658516, 0.013963278383016586, 0.015592044219374657, 0.017220810055732727, 0.018849575892090797, 0.020478341728448868, 0.022107107564806938, 0.02373587340116501, 0.02536463923752308, 0.02699340507388115, 0.02862217091023922, 0.03025093674659729, 0.03187970072031021, 0.03350846841931343, 0.03513723611831665, 0.03676600009202957, 0.03839476406574249, 0.04002353176474571, 0.04165229946374893, 0.04328106343746185, 0.044909827411174774, 0.046538595110177994, 0.04816736280918121, 0.049796126782894135, 0.051424890756607056, 0.053053658455610275, 0.054682426154613495, 0.056311190128326416]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 3.0, 14.0, 8.0, 5.0, 13.0, 14.0, 22.0, 18.0, 18.0, 26.0, 28.0, 33.0, 31.0, 31.0, 41.0, 35.0, 49.0, 46.0, 37.0, 49.0, 33.0, 41.0, 32.0, 47.0, 36.0, 33.0, 25.0, 36.0, 23.0, 27.0, 17.0, 13.0, 17.0, 15.0, 21.0, 15.0, 7.0, 8.0, 13.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.269317626953125, -2.19293212890625, -2.116546630859375, -2.0401611328125, -1.963775634765625, -1.88739013671875, -1.811004638671875, -1.734619140625, -1.658233642578125, -1.58184814453125, -1.505462646484375, -1.4290771484375, -1.352691650390625, -1.27630615234375, -1.199920654296875, -1.12353515625, -1.047149658203125, -0.97076416015625, -0.894378662109375, -0.8179931640625, -0.741607666015625, -0.66522216796875, -0.588836669921875, -0.512451171875, -0.436065673828125, -0.35968017578125, -0.283294677734375, -0.2069091796875, -0.130523681640625, -0.05413818359375, 0.022247314453125, 0.0986328125, 0.175018310546875, 0.25140380859375, 0.327789306640625, 0.4041748046875, 0.480560302734375, 0.55694580078125, 0.633331298828125, 0.709716796875, 0.786102294921875, 0.86248779296875, 0.938873291015625, 1.0152587890625, 1.091644287109375, 1.16802978515625, 1.244415283203125, 1.32080078125, 1.397186279296875, 1.47357177734375, 1.549957275390625, 1.6263427734375, 1.702728271484375, 1.77911376953125, 1.855499267578125, 1.931884765625, 2.008270263671875, 2.08465576171875, 2.161041259765625, 2.2374267578125, 2.313812255859375, 2.39019775390625, 2.466583251953125, 2.54296875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 6.0, 7.0, 11.0, 23.0, 30.0, 39.0, 62.0, 94.0, 141.0, 219.0, 324.0, 568.0, 962.0, 1439.0, 2226.0, 3350.0, 5205.0, 7926.0, 12445.0, 19029.0, 29491.0, 49532.0, 90390.0, 186077.0, 269052.0, 165835.0, 81332.0, 44849.0, 27527.0, 17882.0, 11488.0, 7354.0, 4858.0, 3032.0, 2070.0, 1358.0, 835.0, 546.0, 350.0, 203.0, 137.0, 87.0, 46.0, 43.0, 19.0, 18.0, 6.0, 9.0, 4.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.861328125, -1.8039093017578125, -1.746490478515625, -1.6890716552734375, -1.63165283203125, -1.5742340087890625, -1.516815185546875, -1.4593963623046875, -1.4019775390625, -1.3445587158203125, -1.287139892578125, -1.2297210693359375, -1.17230224609375, -1.1148834228515625, -1.057464599609375, -1.0000457763671875, -0.942626953125, -0.8852081298828125, -0.827789306640625, -0.7703704833984375, -0.71295166015625, -0.6555328369140625, -0.598114013671875, -0.5406951904296875, -0.4832763671875, -0.4258575439453125, -0.368438720703125, -0.3110198974609375, -0.25360107421875, -0.1961822509765625, -0.138763427734375, -0.0813446044921875, -0.02392578125, 0.0334930419921875, 0.090911865234375, 0.1483306884765625, 0.20574951171875, 0.2631683349609375, 0.320587158203125, 0.3780059814453125, 0.4354248046875, 0.4928436279296875, 0.550262451171875, 0.6076812744140625, 0.66510009765625, 0.7225189208984375, 0.779937744140625, 0.8373565673828125, 0.894775390625, 0.9521942138671875, 1.009613037109375, 1.0670318603515625, 1.12445068359375, 1.1818695068359375, 1.239288330078125, 1.2967071533203125, 1.3541259765625, 1.4115447998046875, 1.468963623046875, 1.5263824462890625, 1.58380126953125, 1.6412200927734375, 1.698638916015625, 1.7560577392578125, 1.8134765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 4.0, 7.0, 12.0, 10.0, 13.0, 20.0, 17.0, 18.0, 38.0, 28.0, 28.0, 35.0, 35.0, 39.0, 40.0, 62.0, 103.0, 258.0, 1522.0, 238.0, 101.0, 69.0, 60.0, 42.0, 29.0, 30.0, 27.0, 31.0, 21.0, 15.0, 14.0, 12.0, 18.0, 10.0, 11.0, 12.0, 1.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6875, -9.3692626953125, -9.051025390625, -8.7327880859375, -8.41455078125, -8.0963134765625, -7.778076171875, -7.4598388671875, -7.1416015625, -6.8233642578125, -6.505126953125, -6.1868896484375, -5.86865234375, -5.5504150390625, -5.232177734375, -4.9139404296875, -4.595703125, -4.2774658203125, -3.959228515625, -3.6409912109375, -3.32275390625, -3.0045166015625, -2.686279296875, -2.3680419921875, -2.0498046875, -1.7315673828125, -1.413330078125, -1.0950927734375, -0.77685546875, -0.4586181640625, -0.140380859375, 0.1778564453125, 0.49609375, 0.8143310546875, 1.132568359375, 1.4508056640625, 1.76904296875, 2.0872802734375, 2.405517578125, 2.7237548828125, 3.0419921875, 3.3602294921875, 3.678466796875, 3.9967041015625, 4.31494140625, 4.6331787109375, 4.951416015625, 5.2696533203125, 5.587890625, 5.9061279296875, 6.224365234375, 6.5426025390625, 6.86083984375, 7.1790771484375, 7.497314453125, 7.8155517578125, 8.1337890625, 8.4520263671875, 8.770263671875, 9.0885009765625, 9.40673828125, 9.7249755859375, 10.043212890625, 10.3614501953125, 10.6796875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 7.0, 6.0, 8.0, 6.0, 12.0, 21.0, 35.0, 39.0, 42.0, 57.0, 77.0, 120.0, 172.0, 248.0, 546.0, 2102.0, 68279.0, 3017404.0, 53193.0, 1924.0, 519.0, 263.0, 188.0, 104.0, 82.0, 55.0, 57.0, 37.0, 25.0, 20.0, 17.0, 10.0, 12.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.9375, -23.2626953125, -22.587890625, -21.9130859375, -21.23828125, -20.5634765625, -19.888671875, -19.2138671875, -18.5390625, -17.8642578125, -17.189453125, -16.5146484375, -15.83984375, -15.1650390625, -14.490234375, -13.8154296875, -13.140625, -12.4658203125, -11.791015625, -11.1162109375, -10.44140625, -9.7666015625, -9.091796875, -8.4169921875, -7.7421875, -7.0673828125, -6.392578125, -5.7177734375, -5.04296875, -4.3681640625, -3.693359375, -3.0185546875, -2.34375, -1.6689453125, -0.994140625, -0.3193359375, 0.35546875, 1.0302734375, 1.705078125, 2.3798828125, 3.0546875, 3.7294921875, 4.404296875, 5.0791015625, 5.75390625, 6.4287109375, 7.103515625, 7.7783203125, 8.453125, 9.1279296875, 9.802734375, 10.4775390625, 11.15234375, 11.8271484375, 12.501953125, 13.1767578125, 13.8515625, 14.5263671875, 15.201171875, 15.8759765625, 16.55078125, 17.2255859375, 17.900390625, 18.5751953125, 19.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 13.0, 48.0, 133.0, 234.0, 245.0, 209.0, 91.0, 30.0, 9.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-53.95926284790039, -52.74051284790039, -51.521766662597656, -50.303016662597656, -49.08427047729492, -47.86552047729492, -46.64677429199219, -45.42802429199219, -44.20927810668945, -42.99052810668945, -41.77178192138672, -40.55303192138672, -39.334285736083984, -38.115535736083984, -36.89678955078125, -35.67803955078125, -34.45928955078125, -33.24053955078125, -32.021793365478516, -30.80304527282715, -29.58429718017578, -28.365549087524414, -27.146800994873047, -25.928050994873047, -24.709304809570312, -23.490556716918945, -22.271808624267578, -21.05306053161621, -19.834312438964844, -18.615564346313477, -17.39681625366211, -16.17806625366211, -14.959320068359375, -13.740571975708008, -12.52182388305664, -11.303075790405273, -10.084327697753906, -8.865579605102539, -7.6468305587768555, -6.428082466125488, -5.209334373474121, -3.990586280822754, -2.7718379497528076, -1.5530896186828613, -0.33434152603149414, 0.884406566619873, 2.1031551361083984, 3.3219032287597656, 4.540651321411133, 5.7593994140625, 6.978147506713867, 8.196895599365234, 9.415643692016602, 10.634391784667969, 11.853140830993652, 13.07188892364502, 14.290637016296387, 15.509385108947754, 16.728134155273438, 17.946882247924805, 19.165630340576172, 20.38437843322754, 21.603126525878906, 22.821874618530273, 24.04062271118164]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 13.0, 11.0, 17.0, 11.0, 13.0, 13.0, 26.0, 17.0, 21.0, 9.0, 26.0, 40.0, 28.0, 30.0, 30.0, 40.0, 32.0, 44.0, 42.0, 47.0, 33.0, 39.0, 34.0, 50.0, 23.0, 29.0, 27.0, 32.0, 21.0, 21.0, 19.0, 22.0, 16.0, 19.0, 18.0, 13.0, 12.0, 8.0, 11.0, 11.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-24.479034423828125, -23.72385025024414, -22.968666076660156, -22.213481903076172, -21.458297729492188, -20.703113555908203, -19.94792938232422, -19.192745208740234, -18.43756103515625, -17.682376861572266, -16.92719268798828, -16.172008514404297, -15.416824340820312, -14.661640167236328, -13.90645694732666, -13.151272773742676, -12.396089553833008, -11.640905380249023, -10.885721206665039, -10.130537033081055, -9.37535285949707, -8.620168685913086, -7.864985466003418, -7.109801292419434, -6.354617118835449, -5.599432945251465, -4.8442487716674805, -4.089065074920654, -3.33388090133667, -2.5786967277526855, -1.8235130310058594, -1.068328857421875, -0.3131427764892578, 0.442041277885437, 1.1972253322601318, 1.952409267425537, 2.7075934410095215, 3.462777614593506, 4.217961311340332, 4.973145484924316, 5.728329658508301, 6.483513832092285, 7.2386980056762695, 7.993881702423096, 8.749065399169922, 9.504249572753906, 10.25943374633789, 11.014617919921875, 11.76980209350586, 12.524986267089844, 13.280170440673828, 14.035354614257812, 14.790538787841797, 15.545722961425781, 16.300907135009766, 17.05609130859375, 17.811275482177734, 18.56645965576172, 19.321643829345703, 20.076828002929688, 20.832012176513672, 21.587196350097656, 22.34238052368164, 23.097564697265625, 23.852746963500977]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 7.0, 7.0, 9.0, 15.0, 19.0, 20.0, 13.0, 22.0, 27.0, 21.0, 34.0, 40.0, 35.0, 29.0, 44.0, 51.0, 44.0, 41.0, 50.0, 38.0, 46.0, 45.0, 37.0, 41.0, 32.0, 37.0, 28.0, 22.0, 19.0, 20.0, 13.0, 22.0, 15.0, 16.0, 9.0, 6.0, 5.0, 9.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.041015625, -2.95257568359375, -2.8641357421875, -2.77569580078125, -2.687255859375, -2.59881591796875, -2.5103759765625, -2.42193603515625, -2.33349609375, -2.24505615234375, -2.1566162109375, -2.06817626953125, -1.979736328125, -1.89129638671875, -1.8028564453125, -1.71441650390625, -1.6259765625, -1.53753662109375, -1.4490966796875, -1.36065673828125, -1.272216796875, -1.18377685546875, -1.0953369140625, -1.00689697265625, -0.91845703125, -0.83001708984375, -0.7415771484375, -0.65313720703125, -0.564697265625, -0.47625732421875, -0.3878173828125, -0.29937744140625, -0.2109375, -0.12249755859375, -0.0340576171875, 0.05438232421875, 0.142822265625, 0.23126220703125, 0.3197021484375, 0.40814208984375, 0.49658203125, 0.58502197265625, 0.6734619140625, 0.76190185546875, 0.850341796875, 0.93878173828125, 1.0272216796875, 1.11566162109375, 1.2041015625, 1.29254150390625, 1.3809814453125, 1.46942138671875, 1.557861328125, 1.64630126953125, 1.7347412109375, 1.82318115234375, 1.91162109375, 2.00006103515625, 2.0885009765625, 2.17694091796875, 2.265380859375, 2.35382080078125, 2.4422607421875, 2.53070068359375, 2.619140625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 10.0, 18.0, 24.0, 26.0, 30.0, 48.0, 82.0, 114.0, 191.0, 322.0, 551.0, 1125.0, 2294.0, 4957.0, 11657.0, 29669.0, 82742.0, 241784.0, 673082.0, 1307729.0, 1106480.0, 474369.0, 163596.0, 56568.0, 21134.0, 8265.0, 3634.0, 1718.0, 831.0, 448.0, 277.0, 168.0, 103.0, 77.0, 43.0, 33.0, 19.0, 13.0, 11.0, 9.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.720703125, -2.622894287109375, -2.52508544921875, -2.427276611328125, -2.3294677734375, -2.231658935546875, -2.13385009765625, -2.036041259765625, -1.938232421875, -1.840423583984375, -1.74261474609375, -1.644805908203125, -1.5469970703125, -1.449188232421875, -1.35137939453125, -1.253570556640625, -1.15576171875, -1.057952880859375, -0.96014404296875, -0.862335205078125, -0.7645263671875, -0.666717529296875, -0.56890869140625, -0.471099853515625, -0.373291015625, -0.275482177734375, -0.17767333984375, -0.079864501953125, 0.0179443359375, 0.115753173828125, 0.21356201171875, 0.311370849609375, 0.4091796875, 0.506988525390625, 0.60479736328125, 0.702606201171875, 0.8004150390625, 0.898223876953125, 0.99603271484375, 1.093841552734375, 1.191650390625, 1.289459228515625, 1.38726806640625, 1.485076904296875, 1.5828857421875, 1.680694580078125, 1.77850341796875, 1.876312255859375, 1.97412109375, 2.071929931640625, 2.16973876953125, 2.267547607421875, 2.3653564453125, 2.463165283203125, 2.56097412109375, 2.658782958984375, 2.756591796875, 2.854400634765625, 2.95220947265625, 3.050018310546875, 3.1478271484375, 3.245635986328125, 3.34344482421875, 3.441253662109375, 3.5390625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 9.0, 17.0, 19.0, 26.0, 38.0, 42.0, 66.0, 89.0, 113.0, 176.0, 197.0, 271.0, 350.0, 418.0, 439.0, 427.0, 321.0, 266.0, 210.0, 181.0, 110.0, 69.0, 55.0, 38.0, 35.0, 19.0, 20.0, 17.0, 5.0, 4.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.0777587890625, -4.885986328125, -4.6942138671875, -4.50244140625, -4.3106689453125, -4.118896484375, -3.9271240234375, -3.7353515625, -3.5435791015625, -3.351806640625, -3.1600341796875, -2.96826171875, -2.7764892578125, -2.584716796875, -2.3929443359375, -2.201171875, -2.0093994140625, -1.817626953125, -1.6258544921875, -1.43408203125, -1.2423095703125, -1.050537109375, -0.8587646484375, -0.6669921875, -0.4752197265625, -0.283447265625, -0.0916748046875, 0.10009765625, 0.2918701171875, 0.483642578125, 0.6754150390625, 0.8671875, 1.0589599609375, 1.250732421875, 1.4425048828125, 1.63427734375, 1.8260498046875, 2.017822265625, 2.2095947265625, 2.4013671875, 2.5931396484375, 2.784912109375, 2.9766845703125, 3.16845703125, 3.3602294921875, 3.552001953125, 3.7437744140625, 3.935546875, 4.1273193359375, 4.319091796875, 4.5108642578125, 4.70263671875, 4.8944091796875, 5.086181640625, 5.2779541015625, 5.4697265625, 5.6614990234375, 5.853271484375, 6.0450439453125, 6.23681640625, 6.4285888671875, 6.620361328125, 6.8121337890625, 7.00390625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 10.0, 10.0, 16.0, 18.0, 33.0, 31.0, 66.0, 72.0, 123.0, 207.0, 388.0, 998.0, 4030.0, 32930.0, 384128.0, 2656802.0, 1016724.0, 86139.0, 8798.0, 1490.0, 519.0, 252.0, 156.0, 100.0, 72.0, 49.0, 34.0, 20.0, 19.0, 13.0, 8.0, 8.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.6953125, -11.3582763671875, -11.021240234375, -10.6842041015625, -10.34716796875, -10.0101318359375, -9.673095703125, -9.3360595703125, -8.9990234375, -8.6619873046875, -8.324951171875, -7.9879150390625, -7.65087890625, -7.3138427734375, -6.976806640625, -6.6397705078125, -6.302734375, -5.9656982421875, -5.628662109375, -5.2916259765625, -4.95458984375, -4.6175537109375, -4.280517578125, -3.9434814453125, -3.6064453125, -3.2694091796875, -2.932373046875, -2.5953369140625, -2.25830078125, -1.9212646484375, -1.584228515625, -1.2471923828125, -0.91015625, -0.5731201171875, -0.236083984375, 0.1009521484375, 0.43798828125, 0.7750244140625, 1.112060546875, 1.4490966796875, 1.7861328125, 2.1231689453125, 2.460205078125, 2.7972412109375, 3.13427734375, 3.4713134765625, 3.808349609375, 4.1453857421875, 4.482421875, 4.8194580078125, 5.156494140625, 5.4935302734375, 5.83056640625, 6.1676025390625, 6.504638671875, 6.8416748046875, 7.1787109375, 7.5157470703125, 7.852783203125, 8.1898193359375, 8.52685546875, 8.8638916015625, 9.200927734375, 9.5379638671875, 9.875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 14.0, 23.0, 48.0, 74.0, 106.0, 157.0, 154.0, 145.0, 108.0, 82.0, 43.0, 29.0, 16.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.551761627197266, -28.245996475219727, -26.940231323242188, -25.63446617126465, -24.32870101928711, -23.02293586730957, -21.71717071533203, -20.411405563354492, -19.105640411376953, -17.799875259399414, -16.494110107421875, -15.188344955444336, -13.882579803466797, -12.576814651489258, -11.271049499511719, -9.96528434753418, -8.65951919555664, -7.353754043579102, -6.0479888916015625, -4.742223739624023, -3.4364585876464844, -2.1306934356689453, -0.8249282836914062, 0.4808368682861328, 1.7866020202636719, 3.092367172241211, 4.39813232421875, 5.703897476196289, 7.009662628173828, 8.315427780151367, 9.621192932128906, 10.926958084106445, 12.232719421386719, 13.538484573364258, 14.844249725341797, 16.150014877319336, 17.455780029296875, 18.761545181274414, 20.067310333251953, 21.373075485229492, 22.67884063720703, 23.98460578918457, 25.29037094116211, 26.59613609313965, 27.901901245117188, 29.207666397094727, 30.513431549072266, 31.819196701049805, 33.124961853027344, 34.43072509765625, 35.73649215698242, 37.042259216308594, 38.3480224609375, 39.653785705566406, 40.95955276489258, 42.26531982421875, 43.571083068847656, 44.87684631347656, 46.182613372802734, 47.488380432128906, 48.79414367675781, 50.09990692138672, 51.40567398071289, 52.71144104003906, 54.01720428466797]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 11.0, 4.0, 9.0, 8.0, 8.0, 14.0, 17.0, 25.0, 25.0, 23.0, 31.0, 34.0, 22.0, 35.0, 32.0, 42.0, 42.0, 35.0, 41.0, 36.0, 43.0, 44.0, 30.0, 33.0, 30.0, 38.0, 36.0, 30.0, 24.0, 19.0, 18.0, 18.0, 20.0, 15.0, 15.0, 13.0, 13.0, 16.0, 5.0, 10.0, 4.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-18.016399383544922, -17.46251106262207, -16.90862274169922, -16.354734420776367, -15.800846099853516, -15.246957778930664, -14.693069458007812, -14.139181137084961, -13.58529281616211, -13.031404495239258, -12.477516174316406, -11.923627853393555, -11.369739532470703, -10.815851211547852, -10.261962890625, -9.708074569702148, -9.154186248779297, -8.600297927856445, -8.046409606933594, -7.492521286010742, -6.938632965087891, -6.384744644165039, -5.8308563232421875, -5.276968002319336, -4.723079681396484, -4.169191360473633, -3.6153030395507812, -3.0614147186279297, -2.507526397705078, -1.9536380767822266, -1.399749755859375, -0.8458614349365234, -0.2919731140136719, 0.2619152069091797, 0.8158035278320312, 1.3696918487548828, 1.9235801696777344, 2.477468490600586, 3.0313568115234375, 3.585245132446289, 4.139133453369141, 4.693021774291992, 5.246910095214844, 5.800798416137695, 6.354686737060547, 6.908575057983398, 7.46246337890625, 8.016351699829102, 8.570240020751953, 9.124128341674805, 9.678016662597656, 10.231904983520508, 10.78579330444336, 11.339681625366211, 11.893569946289062, 12.447458267211914, 13.001346588134766, 13.555234909057617, 14.109123229980469, 14.66301155090332, 15.216899871826172, 15.770788192749023, 16.324676513671875, 16.878564834594727, 17.432453155517578]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 2.0, 7.0, 9.0, 9.0, 6.0, 9.0, 11.0, 15.0, 11.0, 13.0, 26.0, 16.0, 30.0, 26.0, 25.0, 32.0, 31.0, 42.0, 36.0, 46.0, 40.0, 39.0, 42.0, 37.0, 28.0, 31.0, 34.0, 38.0, 36.0, 27.0, 31.0, 23.0, 26.0, 21.0, 16.0, 22.0, 17.0, 18.0, 12.0, 15.0, 11.0, 6.0, 13.0, 6.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0], "bins": [-2.634765625, -2.558929443359375, -2.48309326171875, -2.407257080078125, -2.3314208984375, -2.255584716796875, -2.17974853515625, -2.103912353515625, -2.028076171875, -1.952239990234375, -1.87640380859375, -1.800567626953125, -1.7247314453125, -1.648895263671875, -1.57305908203125, -1.497222900390625, -1.42138671875, -1.345550537109375, -1.26971435546875, -1.193878173828125, -1.1180419921875, -1.042205810546875, -0.96636962890625, -0.890533447265625, -0.814697265625, -0.738861083984375, -0.66302490234375, -0.587188720703125, -0.5113525390625, -0.435516357421875, -0.35968017578125, -0.283843994140625, -0.2080078125, -0.132171630859375, -0.05633544921875, 0.019500732421875, 0.0953369140625, 0.171173095703125, 0.24700927734375, 0.322845458984375, 0.398681640625, 0.474517822265625, 0.55035400390625, 0.626190185546875, 0.7020263671875, 0.777862548828125, 0.85369873046875, 0.929534912109375, 1.00537109375, 1.081207275390625, 1.15704345703125, 1.232879638671875, 1.3087158203125, 1.384552001953125, 1.46038818359375, 1.536224365234375, 1.612060546875, 1.687896728515625, 1.76373291015625, 1.839569091796875, 1.9154052734375, 1.991241455078125, 2.06707763671875, 2.142913818359375, 2.21875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 6.0, 4.0, 13.0, 15.0, 24.0, 41.0, 53.0, 85.0, 140.0, 231.0, 359.0, 535.0, 863.0, 1354.0, 2280.0, 3454.0, 5762.0, 9225.0, 14809.0, 22729.0, 34450.0, 50487.0, 71390.0, 93289.0, 114513.0, 126040.0, 122194.0, 105888.0, 83683.0, 61605.0, 43175.0, 28920.0, 18950.0, 12112.0, 7585.0, 4588.0, 2930.0, 1778.0, 1130.0, 708.0, 406.0, 248.0, 185.0, 121.0, 66.0, 42.0, 38.0, 20.0, 12.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.6083984375, -0.5892562866210938, -0.5701141357421875, -0.5509719848632812, -0.531829833984375, -0.5126876831054688, -0.4935455322265625, -0.47440338134765625, -0.45526123046875, -0.43611907958984375, -0.4169769287109375, -0.39783477783203125, -0.378692626953125, -0.35955047607421875, -0.3404083251953125, -0.32126617431640625, -0.3021240234375, -0.28298187255859375, -0.2638397216796875, -0.24469757080078125, -0.225555419921875, -0.20641326904296875, -0.1872711181640625, -0.16812896728515625, -0.14898681640625, -0.12984466552734375, -0.1107025146484375, -0.09156036376953125, -0.072418212890625, -0.05327606201171875, -0.0341339111328125, -0.01499176025390625, 0.004150390625, 0.02329254150390625, 0.0424346923828125, 0.06157684326171875, 0.080718994140625, 0.09986114501953125, 0.1190032958984375, 0.13814544677734375, 0.15728759765625, 0.17642974853515625, 0.1955718994140625, 0.21471405029296875, 0.233856201171875, 0.25299835205078125, 0.2721405029296875, 0.29128265380859375, 0.3104248046875, 0.32956695556640625, 0.3487091064453125, 0.36785125732421875, 0.386993408203125, 0.40613555908203125, 0.4252777099609375, 0.44441986083984375, 0.46356201171875, 0.48270416259765625, 0.5018463134765625, 0.5209884643554688, 0.540130615234375, 0.5592727661132812, 0.5784149169921875, 0.5975570678710938, 0.61669921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 7.0, 6.0, 7.0, 9.0, 12.0, 18.0, 17.0, 18.0, 15.0, 32.0, 28.0, 32.0, 32.0, 36.0, 27.0, 33.0, 44.0, 41.0, 44.0, 39.0, 1062.0, 50.0, 39.0, 29.0, 31.0, 40.0, 28.0, 31.0, 29.0, 25.0, 15.0, 21.0, 25.0, 11.0, 13.0, 9.0, 14.0, 10.0, 9.0, 3.0, 7.0, 5.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.22265625, -2.15216064453125, -2.0816650390625, -2.01116943359375, -1.940673828125, -1.87017822265625, -1.7996826171875, -1.72918701171875, -1.65869140625, -1.58819580078125, -1.5177001953125, -1.44720458984375, -1.376708984375, -1.30621337890625, -1.2357177734375, -1.16522216796875, -1.0947265625, -1.02423095703125, -0.9537353515625, -0.88323974609375, -0.812744140625, -0.74224853515625, -0.6717529296875, -0.60125732421875, -0.53076171875, -0.46026611328125, -0.3897705078125, -0.31927490234375, -0.248779296875, -0.17828369140625, -0.1077880859375, -0.03729248046875, 0.033203125, 0.10369873046875, 0.1741943359375, 0.24468994140625, 0.315185546875, 0.38568115234375, 0.4561767578125, 0.52667236328125, 0.59716796875, 0.66766357421875, 0.7381591796875, 0.80865478515625, 0.879150390625, 0.94964599609375, 1.0201416015625, 1.09063720703125, 1.1611328125, 1.23162841796875, 1.3021240234375, 1.37261962890625, 1.443115234375, 1.51361083984375, 1.5841064453125, 1.65460205078125, 1.72509765625, 1.79559326171875, 1.8660888671875, 1.93658447265625, 2.007080078125, 2.07757568359375, 2.1480712890625, 2.21856689453125, 2.2890625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 10.0, 10.0, 11.0, 29.0, 39.0, 49.0, 75.0, 105.0, 190.0, 275.0, 388.0, 577.0, 943.0, 1442.0, 2237.0, 3428.0, 5527.0, 8376.0, 12945.0, 21488.0, 39635.0, 1884033.0, 49800.0, 24651.0, 14470.0, 9139.0, 6075.0, 3858.0, 2560.0, 1660.0, 991.0, 721.0, 483.0, 310.0, 194.0, 130.0, 94.0, 55.0, 36.0, 27.0, 20.0, 12.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.3740234375, -1.333160400390625, -1.29229736328125, -1.251434326171875, -1.2105712890625, -1.169708251953125, -1.12884521484375, -1.087982177734375, -1.047119140625, -1.006256103515625, -0.96539306640625, -0.924530029296875, -0.8836669921875, -0.842803955078125, -0.80194091796875, -0.761077880859375, -0.72021484375, -0.679351806640625, -0.63848876953125, -0.597625732421875, -0.5567626953125, -0.515899658203125, -0.47503662109375, -0.434173583984375, -0.393310546875, -0.352447509765625, -0.31158447265625, -0.270721435546875, -0.2298583984375, -0.188995361328125, -0.14813232421875, -0.107269287109375, -0.06640625, -0.025543212890625, 0.01531982421875, 0.056182861328125, 0.0970458984375, 0.137908935546875, 0.17877197265625, 0.219635009765625, 0.260498046875, 0.301361083984375, 0.34222412109375, 0.383087158203125, 0.4239501953125, 0.464813232421875, 0.50567626953125, 0.546539306640625, 0.58740234375, 0.628265380859375, 0.66912841796875, 0.709991455078125, 0.7508544921875, 0.791717529296875, 0.83258056640625, 0.873443603515625, 0.914306640625, 0.955169677734375, 0.99603271484375, 1.036895751953125, 1.0777587890625, 1.118621826171875, 1.15948486328125, 1.200347900390625, 1.2412109375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 11.0, 7.0, 10.0, 12.0, 19.0, 22.0, 22.0, 30.0, 36.0, 45.0, 69.0, 54.0, 70.0, 73.0, 72.0, 64.0, 61.0, 43.0, 47.0, 36.0, 40.0, 37.0, 20.0, 17.0, 14.0, 8.0, 14.0, 8.0, 10.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041595458984375, -0.04024982452392578, -0.03890419006347656, -0.037558555603027344, -0.036212921142578125, -0.034867286682128906, -0.03352165222167969, -0.03217601776123047, -0.03083038330078125, -0.02948474884033203, -0.028139114379882812, -0.026793479919433594, -0.025447845458984375, -0.024102210998535156, -0.022756576538085938, -0.02141094207763672, -0.0200653076171875, -0.01871967315673828, -0.017374038696289062, -0.016028404235839844, -0.014682769775390625, -0.013337135314941406, -0.011991500854492188, -0.010645866394042969, -0.00930023193359375, -0.007954597473144531, -0.0066089630126953125, -0.005263328552246094, -0.003917694091796875, -0.0025720596313476562, -0.0012264251708984375, 0.00011920928955078125, 0.00146484375, 0.0028104782104492188, 0.0041561126708984375, 0.005501747131347656, 0.006847381591796875, 0.008193016052246094, 0.009538650512695312, 0.010884284973144531, 0.01222991943359375, 0.013575553894042969, 0.014921188354492188, 0.016266822814941406, 0.017612457275390625, 0.018958091735839844, 0.020303726196289062, 0.02164936065673828, 0.0229949951171875, 0.02434062957763672, 0.025686264038085938, 0.027031898498535156, 0.028377532958984375, 0.029723167419433594, 0.031068801879882812, 0.03241443634033203, 0.03376007080078125, 0.03510570526123047, 0.03645133972167969, 0.037796974182128906, 0.039142608642578125, 0.040488243103027344, 0.04183387756347656, 0.04317951202392578, 0.044525146484375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 8.0, 10.0, 7.0, 14.0, 9.0, 18.0, 21.0, 26.0, 45.0, 41.0, 74.0, 119.0, 185.0, 393.0, 1374.0, 191806.0, 849968.0, 3200.0, 512.0, 284.0, 135.0, 68.0, 59.0, 30.0, 28.0, 26.0, 20.0, 14.0, 8.0, 8.0, 6.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91943359375, -0.8916854858398438, -0.8639373779296875, -0.8361892700195312, -0.808441162109375, -0.7806930541992188, -0.7529449462890625, -0.7251968383789062, -0.69744873046875, -0.6697006225585938, -0.6419525146484375, -0.6142044067382812, -0.586456298828125, -0.5587081909179688, -0.5309600830078125, -0.5032119750976562, -0.4754638671875, -0.44771575927734375, -0.4199676513671875, -0.39221954345703125, -0.364471435546875, -0.33672332763671875, -0.3089752197265625, -0.28122711181640625, -0.25347900390625, -0.22573089599609375, -0.1979827880859375, -0.17023468017578125, -0.142486572265625, -0.11473846435546875, -0.0869903564453125, -0.05924224853515625, -0.031494140625, -0.00374603271484375, 0.0240020751953125, 0.05175018310546875, 0.079498291015625, 0.10724639892578125, 0.1349945068359375, 0.16274261474609375, 0.19049072265625, 0.21823883056640625, 0.2459869384765625, 0.27373504638671875, 0.301483154296875, 0.32923126220703125, 0.3569793701171875, 0.38472747802734375, 0.4124755859375, 0.44022369384765625, 0.4679718017578125, 0.49571990966796875, 0.523468017578125, 0.5512161254882812, 0.5789642333984375, 0.6067123413085938, 0.63446044921875, 0.6622085571289062, 0.6899566650390625, 0.7177047729492188, 0.745452880859375, 0.7732009887695312, 0.8009490966796875, 0.8286972045898438, 0.8564453125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 42.0, 474.0, 462.0, 26.0, 1.0, 1.0, 2.0], "bins": [-2.3894429206848145, -2.3489482402801514, -2.3084535598754883, -2.267958641052246, -2.227463960647583, -2.18696928024292, -2.146474599838257, -2.1059799194335938, -2.0654852390289307, -2.0249905586242676, -1.984495759010315, -1.9440010786056519, -1.9035063982009888, -1.8630115985870361, -1.822516918182373, -1.78202223777771, -1.7415273189544678, -1.7010326385498047, -1.660537838935852, -1.620043158531189, -1.5795484781265259, -1.5390536785125732, -1.4985589981079102, -1.458064317703247, -1.417569637298584, -1.377074956893921, -1.3365801572799683, -1.2960854768753052, -1.255590796470642, -1.2150959968566895, -1.1746013164520264, -1.1341066360473633, -1.0936118364334106, -1.0531171560287476, -1.012622356414795, -0.9721276760101318, -0.931632936000824, -0.8911381959915161, -0.850643515586853, -0.8101487755775452, -0.7696540355682373, -0.7291592955589294, -0.6886646151542664, -0.6481698751449585, -0.6076751351356506, -0.5671803951263428, -0.5266857147216797, -0.4861909747123718, -0.44569626450538635, -0.4052015542984009, -0.364706814289093, -0.32421210408210754, -0.28371739387512207, -0.2432226538658142, -0.20272794365882874, -0.16223320364952087, -0.1217384934425354, -0.08124376833438873, -0.04074905067682266, -0.0002543330192565918, 0.040240392088890076, 0.08073511719703674, 0.12122982740402222, 0.16172456741333008, 0.20221927762031555]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 10.0, 9.0, 8.0, 13.0, 13.0, 23.0, 20.0, 23.0, 21.0, 32.0, 41.0, 32.0, 49.0, 42.0, 65.0, 54.0, 58.0, 49.0, 49.0, 30.0, 35.0, 34.0, 42.0, 38.0, 36.0, 37.0, 28.0, 21.0, 17.0, 8.0, 18.0, 9.0, 4.0, 8.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13235455751419067, -0.1279679536819458, -0.12358136475086212, -0.11919476836919785, -0.11480817198753357, -0.1104215681552887, -0.10603497177362442, -0.10164837539196014, -0.09726177901029587, -0.09287518262863159, -0.08848858624696732, -0.08410198986530304, -0.07971538603305817, -0.07532879710197449, -0.07094219326972961, -0.06655559688806534, -0.06216900050640106, -0.057782404124736786, -0.05339580774307251, -0.049009207636117935, -0.04462261125445366, -0.04023601487278938, -0.03584941476583481, -0.03146281838417053, -0.027076222002506256, -0.02268962562084198, -0.018303027376532555, -0.013916430063545704, -0.009529832750558853, -0.005143236368894577, -0.0007566381245851517, 0.0036299601197242737, 0.00801655650138855, 0.0124031538143754, 0.01678975112736225, 0.021176349371671677, 0.025562945753335953, 0.02994954213500023, 0.0343361422419548, 0.03872273862361908, 0.043109335005283356, 0.04749593138694763, 0.05188252776861191, 0.05626912787556648, 0.06065572425723076, 0.06504231691360474, 0.06942892074584961, 0.07381551712751389, 0.07820211350917816, 0.08258870989084244, 0.08697530627250671, 0.09136190265417099, 0.09574849903583527, 0.10013510286808014, 0.10452169924974442, 0.10890829563140869, 0.11329489201307297, 0.11768148839473724, 0.12206808477640152, 0.1264546811580658, 0.13084128499031067, 0.13522787392139435, 0.13961447775363922, 0.1440010666847229, 0.14838767051696777]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 8.0, 5.0, 9.0, 9.0, 17.0, 11.0, 12.0, 13.0, 22.0, 21.0, 17.0, 29.0, 35.0, 27.0, 41.0, 31.0, 36.0, 43.0, 35.0, 43.0, 38.0, 29.0, 27.0, 34.0, 42.0, 40.0, 33.0, 21.0, 31.0, 20.0, 23.0, 26.0, 14.0, 23.0, 24.0, 10.0, 16.0, 18.0, 10.0, 10.0, 4.0, 4.0, 13.0, 4.0, 6.0, 5.0, 2.0, 0.0, 3.0, 3.0], "bins": [-2.5234375, -2.45135498046875, -2.3792724609375, -2.30718994140625, -2.235107421875, -2.16302490234375, -2.0909423828125, -2.01885986328125, -1.94677734375, -1.87469482421875, -1.8026123046875, -1.73052978515625, -1.658447265625, -1.58636474609375, -1.5142822265625, -1.44219970703125, -1.3701171875, -1.29803466796875, -1.2259521484375, -1.15386962890625, -1.081787109375, -1.00970458984375, -0.9376220703125, -0.86553955078125, -0.79345703125, -0.72137451171875, -0.6492919921875, -0.57720947265625, -0.505126953125, -0.43304443359375, -0.3609619140625, -0.28887939453125, -0.216796875, -0.14471435546875, -0.0726318359375, -0.00054931640625, 0.071533203125, 0.14361572265625, 0.2156982421875, 0.28778076171875, 0.35986328125, 0.43194580078125, 0.5040283203125, 0.57611083984375, 0.648193359375, 0.72027587890625, 0.7923583984375, 0.86444091796875, 0.9365234375, 1.00860595703125, 1.0806884765625, 1.15277099609375, 1.224853515625, 1.29693603515625, 1.3690185546875, 1.44110107421875, 1.51318359375, 1.58526611328125, 1.6573486328125, 1.72943115234375, 1.801513671875, 1.87359619140625, 1.9456787109375, 2.01776123046875, 2.08984375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 8.0, 12.0, 7.0, 14.0, 11.0, 29.0, 41.0, 45.0, 79.0, 116.0, 182.0, 309.0, 553.0, 962.0, 1697.0, 3184.0, 5670.0, 9970.0, 17522.0, 30731.0, 51848.0, 88418.0, 148674.0, 226920.0, 188714.0, 113296.0, 67033.0, 39676.0, 22819.0, 13196.0, 7287.0, 4034.0, 2387.0, 1277.0, 721.0, 404.0, 254.0, 143.0, 94.0, 57.0, 49.0, 30.0, 25.0, 14.0, 14.0, 5.0, 9.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.51171875, -2.43499755859375, -2.3582763671875, -2.28155517578125, -2.204833984375, -2.12811279296875, -2.0513916015625, -1.97467041015625, -1.89794921875, -1.82122802734375, -1.7445068359375, -1.66778564453125, -1.591064453125, -1.51434326171875, -1.4376220703125, -1.36090087890625, -1.2841796875, -1.20745849609375, -1.1307373046875, -1.05401611328125, -0.977294921875, -0.90057373046875, -0.8238525390625, -0.74713134765625, -0.67041015625, -0.59368896484375, -0.5169677734375, -0.44024658203125, -0.363525390625, -0.28680419921875, -0.2100830078125, -0.13336181640625, -0.056640625, 0.02008056640625, 0.0968017578125, 0.17352294921875, 0.250244140625, 0.32696533203125, 0.4036865234375, 0.48040771484375, 0.55712890625, 0.63385009765625, 0.7105712890625, 0.78729248046875, 0.864013671875, 0.94073486328125, 1.0174560546875, 1.09417724609375, 1.1708984375, 1.24761962890625, 1.3243408203125, 1.40106201171875, 1.477783203125, 1.55450439453125, 1.6312255859375, 1.70794677734375, 1.78466796875, 1.86138916015625, 1.9381103515625, 2.01483154296875, 2.091552734375, 2.16827392578125, 2.2449951171875, 2.32171630859375, 2.3984375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 1.0, 6.0, 5.0, 9.0, 8.0, 6.0, 11.0, 17.0, 10.0, 21.0, 30.0, 31.0, 24.0, 32.0, 36.0, 48.0, 62.0, 62.0, 133.0, 216.0, 1354.0, 279.0, 162.0, 102.0, 57.0, 48.0, 36.0, 36.0, 26.0, 29.0, 25.0, 26.0, 12.0, 11.0, 13.0, 13.0, 10.0, 6.0, 5.0, 8.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0], "bins": [-10.2421875, -9.9385986328125, -9.635009765625, -9.3314208984375, -9.02783203125, -8.7242431640625, -8.420654296875, -8.1170654296875, -7.8134765625, -7.5098876953125, -7.206298828125, -6.9027099609375, -6.59912109375, -6.2955322265625, -5.991943359375, -5.6883544921875, -5.384765625, -5.0811767578125, -4.777587890625, -4.4739990234375, -4.17041015625, -3.8668212890625, -3.563232421875, -3.2596435546875, -2.9560546875, -2.6524658203125, -2.348876953125, -2.0452880859375, -1.74169921875, -1.4381103515625, -1.134521484375, -0.8309326171875, -0.52734375, -0.2237548828125, 0.079833984375, 0.3834228515625, 0.68701171875, 0.9906005859375, 1.294189453125, 1.5977783203125, 1.9013671875, 2.2049560546875, 2.508544921875, 2.8121337890625, 3.11572265625, 3.4193115234375, 3.722900390625, 4.0264892578125, 4.330078125, 4.6336669921875, 4.937255859375, 5.2408447265625, 5.54443359375, 5.8480224609375, 6.151611328125, 6.4552001953125, 6.7587890625, 7.0623779296875, 7.365966796875, 7.6695556640625, 7.97314453125, 8.2767333984375, 8.580322265625, 8.8839111328125, 9.1875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 7.0, 11.0, 11.0, 23.0, 26.0, 30.0, 35.0, 40.0, 51.0, 70.0, 106.0, 133.0, 202.0, 312.0, 525.0, 1802.0, 32200.0, 2454345.0, 643957.0, 9421.0, 981.0, 435.0, 248.0, 171.0, 132.0, 109.0, 73.0, 34.0, 40.0, 41.0, 30.0, 24.0, 16.0, 9.0, 13.0, 5.0, 8.0, 2.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.04833984375, -15.4716796875, -14.89501953125, -14.318359375, -13.74169921875, -13.1650390625, -12.58837890625, -12.01171875, -11.43505859375, -10.8583984375, -10.28173828125, -9.705078125, -9.12841796875, -8.5517578125, -7.97509765625, -7.3984375, -6.82177734375, -6.2451171875, -5.66845703125, -5.091796875, -4.51513671875, -3.9384765625, -3.36181640625, -2.78515625, -2.20849609375, -1.6318359375, -1.05517578125, -0.478515625, 0.09814453125, 0.6748046875, 1.25146484375, 1.828125, 2.40478515625, 2.9814453125, 3.55810546875, 4.134765625, 4.71142578125, 5.2880859375, 5.86474609375, 6.44140625, 7.01806640625, 7.5947265625, 8.17138671875, 8.748046875, 9.32470703125, 9.9013671875, 10.47802734375, 11.0546875, 11.63134765625, 12.2080078125, 12.78466796875, 13.361328125, 13.93798828125, 14.5146484375, 15.09130859375, 15.66796875, 16.24462890625, 16.8212890625, 17.39794921875, 17.974609375, 18.55126953125, 19.1279296875, 19.70458984375, 20.28125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 19.0, 168.0, 498.0, 285.0, 39.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.341888427734375, -14.76266860961914, -12.183448791503906, -9.604228973388672, -7.0250091552734375, -4.445789337158203, -1.8665695190429688, 0.7126502990722656, 3.2918701171875, 5.871089935302734, 8.450309753417969, 11.029529571533203, 13.608749389648438, 16.187969207763672, 18.767189025878906, 21.34640884399414, 23.925628662109375, 26.50484848022461, 29.084068298339844, 31.663288116455078, 34.24250793457031, 36.82172775268555, 39.40094757080078, 41.980167388916016, 44.55938720703125, 47.138607025146484, 49.71782684326172, 52.29704666137695, 54.87626647949219, 57.45548629760742, 60.034706115722656, 62.61392593383789, 65.19314575195312, 67.77236938476562, 70.3515853881836, 72.93080139160156, 75.51002502441406, 78.08924865722656, 80.66846466064453, 83.2476806640625, 85.826904296875, 88.4061279296875, 90.98534393310547, 93.56455993652344, 96.14378356933594, 98.72300720214844, 101.3022232055664, 103.88143920898438, 106.46066284179688, 109.03988647460938, 111.61910247802734, 114.19831848144531, 116.77754211425781, 119.35676574707031, 121.93598175048828, 124.51519775390625, 127.09442138671875, 129.67364501953125, 132.25286865234375, 134.8320770263672, 137.4113006591797, 139.9905242919922, 142.56973266601562, 145.14895629882812, 147.72817993164062]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 9.0, 16.0, 6.0, 11.0, 22.0, 32.0, 23.0, 28.0, 29.0, 44.0, 38.0, 38.0, 36.0, 41.0, 52.0, 31.0, 39.0, 43.0, 40.0, 48.0, 40.0, 46.0, 40.0, 41.0, 29.0, 32.0, 23.0, 21.0, 21.0, 11.0, 16.0, 7.0, 11.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.715574264526367, -25.892799377441406, -25.070026397705078, -24.247251510620117, -23.42447853088379, -22.601703643798828, -21.7789306640625, -20.95615577697754, -20.133380889892578, -19.310606002807617, -18.48783302307129, -17.665058135986328, -16.84228515625, -16.01951026916504, -15.196736335754395, -14.37396240234375, -13.551189422607422, -12.728415489196777, -11.905641555786133, -11.082866668701172, -10.260093688964844, -9.437318801879883, -8.614544868469238, -7.791770935058594, -6.968997001647949, -6.146223068237305, -5.32344913482666, -4.500674724578857, -3.677900791168213, -2.8551268577575684, -2.0323524475097656, -1.209578514099121, -0.38680267333984375, 0.43597137928009033, 1.2587454319000244, 2.081519603729248, 2.9042935371398926, 3.727067470550537, 4.54984188079834, 5.372615814208984, 6.195389747619629, 7.018163681030273, 7.840937614440918, 8.663711547851562, 9.486486434936523, 10.309259414672852, 11.132034301757812, 11.954808235168457, 12.777582168579102, 13.600356101989746, 14.42313003540039, 15.245904922485352, 16.06867790222168, 16.89145278930664, 17.71422576904297, 18.53700065612793, 19.35977554321289, 20.18255043029785, 21.00532341003418, 21.82809829711914, 22.65087127685547, 23.47364616394043, 24.29642105102539, 25.11919403076172, 25.941967010498047]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 8.0, 7.0, 4.0, 12.0, 15.0, 14.0, 18.0, 14.0, 15.0, 17.0, 21.0, 35.0, 22.0, 41.0, 27.0, 36.0, 35.0, 24.0, 47.0, 37.0, 38.0, 39.0, 40.0, 40.0, 46.0, 32.0, 23.0, 33.0, 18.0, 19.0, 26.0, 21.0, 22.0, 24.0, 14.0, 18.0, 18.0, 14.0, 11.0, 14.0, 3.0, 8.0, 12.0, 5.0, 2.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.791015625, -2.70928955078125, -2.6275634765625, -2.54583740234375, -2.464111328125, -2.38238525390625, -2.3006591796875, -2.21893310546875, -2.13720703125, -2.05548095703125, -1.9737548828125, -1.89202880859375, -1.810302734375, -1.72857666015625, -1.6468505859375, -1.56512451171875, -1.4833984375, -1.40167236328125, -1.3199462890625, -1.23822021484375, -1.156494140625, -1.07476806640625, -0.9930419921875, -0.91131591796875, -0.82958984375, -0.74786376953125, -0.6661376953125, -0.58441162109375, -0.502685546875, -0.42095947265625, -0.3392333984375, -0.25750732421875, -0.17578125, -0.09405517578125, -0.0123291015625, 0.06939697265625, 0.151123046875, 0.23284912109375, 0.3145751953125, 0.39630126953125, 0.47802734375, 0.55975341796875, 0.6414794921875, 0.72320556640625, 0.804931640625, 0.88665771484375, 0.9683837890625, 1.05010986328125, 1.1318359375, 1.21356201171875, 1.2952880859375, 1.37701416015625, 1.458740234375, 1.54046630859375, 1.6221923828125, 1.70391845703125, 1.78564453125, 1.86737060546875, 1.9490966796875, 2.03082275390625, 2.112548828125, 2.19427490234375, 2.2760009765625, 2.35772705078125, 2.439453125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 12.0, 5.0, 10.0, 18.0, 12.0, 12.0, 25.0, 17.0, 15.0, 25.0, 30.0, 43.0, 90.0, 181.0, 503.0, 1804.0, 8772.0, 68570.0, 665251.0, 2470105.0, 872644.0, 91962.0, 10972.0, 2003.0, 554.0, 228.0, 90.0, 54.0, 40.0, 29.0, 21.0, 25.0, 10.0, 22.0, 20.0, 17.0, 4.0, 14.0, 11.0, 6.0, 12.0, 4.0, 7.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-7.578125, -7.35888671875, -7.1396484375, -6.92041015625, -6.701171875, -6.48193359375, -6.2626953125, -6.04345703125, -5.82421875, -5.60498046875, -5.3857421875, -5.16650390625, -4.947265625, -4.72802734375, -4.5087890625, -4.28955078125, -4.0703125, -3.85107421875, -3.6318359375, -3.41259765625, -3.193359375, -2.97412109375, -2.7548828125, -2.53564453125, -2.31640625, -2.09716796875, -1.8779296875, -1.65869140625, -1.439453125, -1.22021484375, -1.0009765625, -0.78173828125, -0.5625, -0.34326171875, -0.1240234375, 0.09521484375, 0.314453125, 0.53369140625, 0.7529296875, 0.97216796875, 1.19140625, 1.41064453125, 1.6298828125, 1.84912109375, 2.068359375, 2.28759765625, 2.5068359375, 2.72607421875, 2.9453125, 3.16455078125, 3.3837890625, 3.60302734375, 3.822265625, 4.04150390625, 4.2607421875, 4.47998046875, 4.69921875, 4.91845703125, 5.1376953125, 5.35693359375, 5.576171875, 5.79541015625, 6.0146484375, 6.23388671875, 6.453125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 4.0, 9.0, 9.0, 11.0, 23.0, 31.0, 39.0, 42.0, 64.0, 79.0, 102.0, 138.0, 169.0, 221.0, 259.0, 293.0, 360.0, 365.0, 369.0, 309.0, 231.0, 223.0, 159.0, 128.0, 111.0, 64.0, 65.0, 54.0, 31.0, 25.0, 11.0, 16.0, 12.0, 8.0, 7.0, 4.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.480712890625, -4.31689453125, -4.153076171875, -3.9892578125, -3.825439453125, -3.66162109375, -3.497802734375, -3.333984375, -3.170166015625, -3.00634765625, -2.842529296875, -2.6787109375, -2.514892578125, -2.35107421875, -2.187255859375, -2.0234375, -1.859619140625, -1.69580078125, -1.531982421875, -1.3681640625, -1.204345703125, -1.04052734375, -0.876708984375, -0.712890625, -0.549072265625, -0.38525390625, -0.221435546875, -0.0576171875, 0.106201171875, 0.27001953125, 0.433837890625, 0.59765625, 0.761474609375, 0.92529296875, 1.089111328125, 1.2529296875, 1.416748046875, 1.58056640625, 1.744384765625, 1.908203125, 2.072021484375, 2.23583984375, 2.399658203125, 2.5634765625, 2.727294921875, 2.89111328125, 3.054931640625, 3.21875, 3.382568359375, 3.54638671875, 3.710205078125, 3.8740234375, 4.037841796875, 4.20166015625, 4.365478515625, 4.529296875, 4.693115234375, 4.85693359375, 5.020751953125, 5.1845703125, 5.348388671875, 5.51220703125, 5.676025390625, 5.83984375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 6.0, 9.0, 6.0, 11.0, 18.0, 17.0, 25.0, 49.0, 64.0, 107.0, 112.0, 188.0, 274.0, 455.0, 1045.0, 5271.0, 56026.0, 763782.0, 2829167.0, 495519.0, 36273.0, 3759.0, 854.0, 418.0, 255.0, 172.0, 114.0, 59.0, 65.0, 44.0, 31.0, 26.0, 15.0, 7.0, 7.0, 5.0, 7.0, 9.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4375, -12.0863037109375, -11.735107421875, -11.3839111328125, -11.03271484375, -10.6815185546875, -10.330322265625, -9.9791259765625, -9.6279296875, -9.2767333984375, -8.925537109375, -8.5743408203125, -8.22314453125, -7.8719482421875, -7.520751953125, -7.1695556640625, -6.818359375, -6.4671630859375, -6.115966796875, -5.7647705078125, -5.41357421875, -5.0623779296875, -4.711181640625, -4.3599853515625, -4.0087890625, -3.6575927734375, -3.306396484375, -2.9552001953125, -2.60400390625, -2.2528076171875, -1.901611328125, -1.5504150390625, -1.19921875, -0.8480224609375, -0.496826171875, -0.1456298828125, 0.20556640625, 0.5567626953125, 0.907958984375, 1.2591552734375, 1.6103515625, 1.9615478515625, 2.312744140625, 2.6639404296875, 3.01513671875, 3.3663330078125, 3.717529296875, 4.0687255859375, 4.419921875, 4.7711181640625, 5.122314453125, 5.4735107421875, 5.82470703125, 6.1759033203125, 6.527099609375, 6.8782958984375, 7.2294921875, 7.5806884765625, 7.931884765625, 8.2830810546875, 8.63427734375, 8.9854736328125, 9.336669921875, 9.6878662109375, 10.0390625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 14.0, 11.0, 28.0, 39.0, 50.0, 64.0, 82.0, 114.0, 87.0, 102.0, 114.0, 70.0, 68.0, 55.0, 40.0, 29.0, 10.0, 9.0, 7.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.464115142822266, -30.56171989440918, -29.659324645996094, -28.756927490234375, -27.85453224182129, -26.952136993408203, -26.049739837646484, -25.1473445892334, -24.244949340820312, -23.342554092407227, -22.44015884399414, -21.537761688232422, -20.635366439819336, -19.73297119140625, -18.83057403564453, -17.928178787231445, -17.02578353881836, -16.123388290405273, -15.220992088317871, -14.318595886230469, -13.416200637817383, -12.513805389404297, -11.611409187316895, -10.709012985229492, -9.806617736816406, -8.90422248840332, -8.001826286315918, -7.099430561065674, -6.19703483581543, -5.2946391105651855, -4.392243385314941, -3.4898476600646973, -2.5874500274658203, -1.6850543022155762, -0.782658576965332, 0.11973714828491211, 1.0221328735351562, 1.9245285987854004, 2.8269243240356445, 3.7293200492858887, 4.631715774536133, 5.534111499786377, 6.436507225036621, 7.338902950286865, 8.24129867553711, 9.143693923950195, 10.046090126037598, 10.948486328125, 11.850881576538086, 12.753276824951172, 13.655673027038574, 14.558069229125977, 15.460464477539062, 16.36285972595215, 17.265254974365234, 18.167652130126953, 19.07004737854004, 19.972442626953125, 20.874839782714844, 21.77723503112793, 22.679630279541016, 23.5820255279541, 24.484420776367188, 25.386817932128906, 26.289213180541992]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 2.0, 6.0, 7.0, 11.0, 13.0, 14.0, 14.0, 17.0, 12.0, 21.0, 31.0, 31.0, 17.0, 41.0, 25.0, 36.0, 49.0, 43.0, 42.0, 39.0, 39.0, 42.0, 30.0, 32.0, 38.0, 41.0, 43.0, 33.0, 25.0, 21.0, 26.0, 17.0, 19.0, 22.0, 18.0, 13.0, 13.0, 9.0, 11.0, 11.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.457393646240234, -16.8724308013916, -16.287466049194336, -15.702503204345703, -15.117539405822754, -14.532575607299805, -13.947612762451172, -13.362648963928223, -12.777685165405273, -12.192721366882324, -11.607757568359375, -11.022794723510742, -10.437830924987793, -9.852867126464844, -9.267904281616211, -8.682940483093262, -8.097976684570312, -7.513012886047363, -6.928049564361572, -6.343086242675781, -5.758122444152832, -5.173158645629883, -4.588195323944092, -4.003232002258301, -3.4182682037353516, -2.8333046436309814, -2.2483410835266113, -1.6633775234222412, -1.078413963317871, -0.493450403213501, 0.09151315689086914, 0.6764764785766602, 1.2614402770996094, 1.8464038372039795, 2.4313673973083496, 3.0163309574127197, 3.60129451751709, 4.186258316040039, 4.77122163772583, 5.356184959411621, 5.94114875793457, 6.5261125564575195, 7.1110758781433105, 7.696039199829102, 8.28100299835205, 8.865966796875, 9.450929641723633, 10.035893440246582, 10.620857238769531, 11.20582103729248, 11.79078483581543, 12.375747680664062, 12.960711479187012, 13.545675277709961, 14.130638122558594, 14.715601921081543, 15.300565719604492, 15.885529518127441, 16.47049331665039, 17.055456161499023, 17.640419006347656, 18.225383758544922, 18.810346603393555, 19.395309448242188, 19.980274200439453]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 4.0, 8.0, 9.0, 8.0, 17.0, 20.0, 22.0, 20.0, 29.0, 31.0, 21.0, 31.0, 23.0, 51.0, 44.0, 48.0, 31.0, 40.0, 46.0, 43.0, 49.0, 46.0, 38.0, 23.0, 36.0, 25.0, 30.0, 30.0, 26.0, 21.0, 15.0, 22.0, 15.0, 15.0, 12.0, 10.0, 13.0, 7.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.130859375, -3.041412353515625, -2.95196533203125, -2.862518310546875, -2.7730712890625, -2.683624267578125, -2.59417724609375, -2.504730224609375, -2.415283203125, -2.325836181640625, -2.23638916015625, -2.146942138671875, -2.0574951171875, -1.968048095703125, -1.87860107421875, -1.789154052734375, -1.69970703125, -1.610260009765625, -1.52081298828125, -1.431365966796875, -1.3419189453125, -1.252471923828125, -1.16302490234375, -1.073577880859375, -0.984130859375, -0.894683837890625, -0.80523681640625, -0.715789794921875, -0.6263427734375, -0.536895751953125, -0.44744873046875, -0.358001708984375, -0.2685546875, -0.179107666015625, -0.08966064453125, -0.000213623046875, 0.0892333984375, 0.178680419921875, 0.26812744140625, 0.357574462890625, 0.447021484375, 0.536468505859375, 0.62591552734375, 0.715362548828125, 0.8048095703125, 0.894256591796875, 0.98370361328125, 1.073150634765625, 1.16259765625, 1.252044677734375, 1.34149169921875, 1.430938720703125, 1.5203857421875, 1.609832763671875, 1.69927978515625, 1.788726806640625, 1.878173828125, 1.967620849609375, 2.05706787109375, 2.146514892578125, 2.2359619140625, 2.325408935546875, 2.41485595703125, 2.504302978515625, 2.59375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 2.0, 2.0, 5.0, 11.0, 13.0, 13.0, 23.0, 25.0, 54.0, 82.0, 140.0, 173.0, 282.0, 435.0, 708.0, 1143.0, 1801.0, 3015.0, 4646.0, 7036.0, 11036.0, 17110.0, 25468.0, 36948.0, 51636.0, 69693.0, 88383.0, 105374.0, 115811.0, 114296.0, 100684.0, 83046.0, 63948.0, 47270.0, 33252.0, 22721.0, 15253.0, 9615.0, 6360.0, 4066.0, 2532.0, 1647.0, 996.0, 637.0, 409.0, 256.0, 163.0, 108.0, 84.0, 43.0, 33.0, 24.0, 20.0, 13.0, 8.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.5341796875, -0.5168685913085938, -0.4995574951171875, -0.48224639892578125, -0.464935302734375, -0.44762420654296875, -0.4303131103515625, -0.41300201416015625, -0.39569091796875, -0.37837982177734375, -0.3610687255859375, -0.34375762939453125, -0.326446533203125, -0.30913543701171875, -0.2918243408203125, -0.27451324462890625, -0.2572021484375, -0.23989105224609375, -0.2225799560546875, -0.20526885986328125, -0.187957763671875, -0.17064666748046875, -0.1533355712890625, -0.13602447509765625, -0.11871337890625, -0.10140228271484375, -0.0840911865234375, -0.06678009033203125, -0.049468994140625, -0.03215789794921875, -0.0148468017578125, 0.00246429443359375, 0.019775390625, 0.03708648681640625, 0.0543975830078125, 0.07170867919921875, 0.089019775390625, 0.10633087158203125, 0.1236419677734375, 0.14095306396484375, 0.15826416015625, 0.17557525634765625, 0.1928863525390625, 0.21019744873046875, 0.227508544921875, 0.24481964111328125, 0.2621307373046875, 0.27944183349609375, 0.2967529296875, 0.31406402587890625, 0.3313751220703125, 0.34868621826171875, 0.365997314453125, 0.38330841064453125, 0.4006195068359375, 0.41793060302734375, 0.43524169921875, 0.45255279541015625, 0.4698638916015625, 0.48717498779296875, 0.504486083984375, 0.5217971801757812, 0.5391082763671875, 0.5564193725585938, 0.57373046875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 0.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 10.0, 20.0, 10.0, 13.0, 11.0, 19.0, 19.0, 36.0, 28.0, 34.0, 29.0, 30.0, 33.0, 38.0, 36.0, 46.0, 45.0, 1073.0, 51.0, 44.0, 24.0, 41.0, 38.0, 25.0, 30.0, 39.0, 24.0, 32.0, 17.0, 27.0, 17.0, 11.0, 9.0, 13.0, 13.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294921875, -2.213836669921875, -2.13275146484375, -2.051666259765625, -1.9705810546875, -1.889495849609375, -1.80841064453125, -1.727325439453125, -1.646240234375, -1.565155029296875, -1.48406982421875, -1.402984619140625, -1.3218994140625, -1.240814208984375, -1.15972900390625, -1.078643798828125, -0.99755859375, -0.916473388671875, -0.83538818359375, -0.754302978515625, -0.6732177734375, -0.592132568359375, -0.51104736328125, -0.429962158203125, -0.348876953125, -0.267791748046875, -0.18670654296875, -0.105621337890625, -0.0245361328125, 0.056549072265625, 0.13763427734375, 0.218719482421875, 0.2998046875, 0.380889892578125, 0.46197509765625, 0.543060302734375, 0.6241455078125, 0.705230712890625, 0.78631591796875, 0.867401123046875, 0.948486328125, 1.029571533203125, 1.11065673828125, 1.191741943359375, 1.2728271484375, 1.353912353515625, 1.43499755859375, 1.516082763671875, 1.59716796875, 1.678253173828125, 1.75933837890625, 1.840423583984375, 1.9215087890625, 2.002593994140625, 2.08367919921875, 2.164764404296875, 2.245849609375, 2.326934814453125, 2.40802001953125, 2.489105224609375, 2.5701904296875, 2.651275634765625, 2.73236083984375, 2.813446044921875, 2.89453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 3.0, 2.0, 7.0, 8.0, 11.0, 11.0, 26.0, 26.0, 54.0, 63.0, 111.0, 176.0, 264.0, 458.0, 744.0, 1120.0, 1807.0, 2774.0, 4439.0, 6811.0, 10823.0, 17575.0, 32324.0, 1737621.0, 203673.0, 30786.0, 16730.0, 10468.0, 6617.0, 4313.0, 2727.0, 1752.0, 1027.0, 657.0, 458.0, 229.0, 169.0, 114.0, 57.0, 36.0, 38.0, 10.0, 6.0, 4.0, 10.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.6767578125, -1.6325836181640625, -1.588409423828125, -1.5442352294921875, -1.50006103515625, -1.4558868408203125, -1.411712646484375, -1.3675384521484375, -1.3233642578125, -1.2791900634765625, -1.235015869140625, -1.1908416748046875, -1.14666748046875, -1.1024932861328125, -1.058319091796875, -1.0141448974609375, -0.969970703125, -0.9257965087890625, -0.881622314453125, -0.8374481201171875, -0.79327392578125, -0.7490997314453125, -0.704925537109375, -0.6607513427734375, -0.6165771484375, -0.5724029541015625, -0.528228759765625, -0.4840545654296875, -0.43988037109375, -0.3957061767578125, -0.351531982421875, -0.3073577880859375, -0.26318359375, -0.2190093994140625, -0.174835205078125, -0.1306610107421875, -0.08648681640625, -0.0423126220703125, 0.001861572265625, 0.0460357666015625, 0.0902099609375, 0.1343841552734375, 0.178558349609375, 0.2227325439453125, 0.26690673828125, 0.3110809326171875, 0.355255126953125, 0.3994293212890625, 0.443603515625, 0.4877777099609375, 0.531951904296875, 0.5761260986328125, 0.62030029296875, 0.6644744873046875, 0.708648681640625, 0.7528228759765625, 0.7969970703125, 0.8411712646484375, 0.885345458984375, 0.9295196533203125, 0.97369384765625, 1.0178680419921875, 1.062042236328125, 1.1062164306640625, 1.150390625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 5.0, 7.0, 5.0, 9.0, 13.0, 12.0, 17.0, 22.0, 21.0, 31.0, 41.0, 41.0, 70.0, 95.0, 104.0, 105.0, 85.0, 65.0, 40.0, 45.0, 28.0, 22.0, 14.0, 16.0, 10.0, 15.0, 11.0, 11.0, 7.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06341552734375, -0.06164979934692383, -0.059884071350097656, -0.058118343353271484, -0.05635261535644531, -0.05458688735961914, -0.05282115936279297, -0.0510554313659668, -0.049289703369140625, -0.04752397537231445, -0.04575824737548828, -0.04399251937866211, -0.04222679138183594, -0.040461063385009766, -0.038695335388183594, -0.03692960739135742, -0.03516387939453125, -0.03339815139770508, -0.031632423400878906, -0.029866695404052734, -0.028100967407226562, -0.02633523941040039, -0.02456951141357422, -0.022803783416748047, -0.021038055419921875, -0.019272327423095703, -0.01750659942626953, -0.01574087142944336, -0.013975143432617188, -0.012209415435791016, -0.010443687438964844, -0.008677959442138672, -0.0069122314453125, -0.005146503448486328, -0.0033807754516601562, -0.0016150474548339844, 0.0001506805419921875, 0.0019164085388183594, 0.0036821365356445312, 0.005447864532470703, 0.007213592529296875, 0.008979320526123047, 0.010745048522949219, 0.01251077651977539, 0.014276504516601562, 0.016042232513427734, 0.017807960510253906, 0.019573688507080078, 0.02133941650390625, 0.023105144500732422, 0.024870872497558594, 0.026636600494384766, 0.028402328491210938, 0.03016805648803711, 0.03193378448486328, 0.03369951248168945, 0.035465240478515625, 0.0372309684753418, 0.03899669647216797, 0.04076242446899414, 0.04252815246582031, 0.044293880462646484, 0.046059608459472656, 0.04782533645629883, 0.049591064453125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 7.0, 12.0, 7.0, 17.0, 21.0, 15.0, 39.0, 40.0, 76.0, 114.0, 275.0, 856.0, 6461.0, 969615.0, 67599.0, 2437.0, 443.0, 195.0, 97.0, 43.0, 41.0, 27.0, 24.0, 8.0, 15.0, 11.0, 10.0, 3.0, 5.0, 4.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.1357421875, -1.098846435546875, -1.06195068359375, -1.025054931640625, -0.9881591796875, -0.951263427734375, -0.91436767578125, -0.877471923828125, -0.840576171875, -0.803680419921875, -0.76678466796875, -0.729888916015625, -0.6929931640625, -0.656097412109375, -0.61920166015625, -0.582305908203125, -0.54541015625, -0.508514404296875, -0.47161865234375, -0.434722900390625, -0.3978271484375, -0.360931396484375, -0.32403564453125, -0.287139892578125, -0.250244140625, -0.213348388671875, -0.17645263671875, -0.139556884765625, -0.1026611328125, -0.065765380859375, -0.02886962890625, 0.008026123046875, 0.044921875, 0.081817626953125, 0.11871337890625, 0.155609130859375, 0.1925048828125, 0.229400634765625, 0.26629638671875, 0.303192138671875, 0.340087890625, 0.376983642578125, 0.41387939453125, 0.450775146484375, 0.4876708984375, 0.524566650390625, 0.56146240234375, 0.598358154296875, 0.63525390625, 0.672149658203125, 0.70904541015625, 0.745941162109375, 0.7828369140625, 0.819732666015625, 0.85662841796875, 0.893524169921875, 0.930419921875, 0.967315673828125, 1.00421142578125, 1.041107177734375, 1.0780029296875, 1.114898681640625, 1.15179443359375, 1.188690185546875, 1.2255859375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 20.0, 305.0, 646.0, 40.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.823730230331421, -1.791852593421936, -1.7599748373031616, -1.7280972003936768, -1.6962194442749023, -1.6643418073654175, -1.632464051246643, -1.6005864143371582, -1.5687086582183838, -1.536831021308899, -1.5049532651901245, -1.4730756282806396, -1.4411978721618652, -1.4093202352523804, -1.377442479133606, -1.345564842224121, -1.3136870861053467, -1.2818094491958618, -1.2499316930770874, -1.2180540561676025, -1.1861763000488281, -1.1542986631393433, -1.1224209070205688, -1.090543270111084, -1.0586656332015991, -1.0267879962921143, -0.9949102401733398, -0.9630325436592102, -0.9311548471450806, -0.8992771506309509, -0.8673994541168213, -0.8355218172073364, -0.8036440014839172, -0.7717663049697876, -0.739888608455658, -0.7080109119415283, -0.6761332154273987, -0.644255518913269, -0.6123778820037842, -0.5805001258850098, -0.5486224293708801, -0.5167447328567505, -0.48486703634262085, -0.4529893398284912, -0.4211116433143616, -0.38923394680023193, -0.3573562800884247, -0.32547858357429504, -0.2936009168624878, -0.26172322034835815, -0.22984552383422852, -0.19796784222126007, -0.16609014570713043, -0.1342124491930008, -0.10233476758003235, -0.07045707106590271, -0.03857935965061188, -0.006701666861772537, 0.025176025927066803, 0.057053714990615845, 0.08893141150474548, 0.12080910801887512, 0.15268678963184357, 0.1845644861459732, 0.21644218266010284]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 8.0, 6.0, 11.0, 13.0, 17.0, 23.0, 29.0, 23.0, 27.0, 29.0, 35.0, 39.0, 53.0, 47.0, 52.0, 39.0, 50.0, 53.0, 53.0, 45.0, 65.0, 38.0, 42.0, 25.0, 46.0, 25.0, 23.0, 19.0, 16.0, 13.0, 12.0, 6.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11261707544326782, -0.10884792357683182, -0.10507877916097641, -0.1013096272945404, -0.097540482878685, -0.09377133101224899, -0.09000217914581299, -0.08623303472995758, -0.08246388286352158, -0.07869473099708557, -0.07492558658123016, -0.07115643471479416, -0.06738728284835815, -0.06361813843250275, -0.05984898656606674, -0.056079838424921036, -0.05231069028377533, -0.04854154214262962, -0.04477239400148392, -0.04100324213504791, -0.037234093993902206, -0.0334649458527565, -0.029695795848965645, -0.02592664584517479, -0.022157497704029083, -0.018388349562883377, -0.014619199559092522, -0.010850050486624241, -0.00708090141415596, -0.003311753273010254, 0.0004573967307806015, 0.004226546734571457, 0.007995694875717163, 0.011764843948185444, 0.015533993020653725, 0.01930314302444458, 0.023072291165590286, 0.026841439306735992, 0.030610589310526848, 0.0343797393143177, 0.03814888745546341, 0.041918035596609116, 0.04568718373775482, 0.049456335604190826, 0.05322548374533653, 0.05699463188648224, 0.06076378375291824, 0.06453293561935425, 0.06830208003520966, 0.07207123190164566, 0.07584037631750107, 0.07960952818393707, 0.08337867259979248, 0.08714782446622849, 0.09091697633266449, 0.0946861207485199, 0.0984552726149559, 0.1022244244813919, 0.10599356889724731, 0.10976272076368332, 0.11353187263011932, 0.11730101704597473, 0.12107016891241074, 0.12483932077884674, 0.12860846519470215]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 14.0, 15.0, 12.0, 22.0, 24.0, 20.0, 27.0, 31.0, 23.0, 35.0, 41.0, 34.0, 41.0, 44.0, 42.0, 38.0, 31.0, 54.0, 41.0, 50.0, 31.0, 32.0, 34.0, 38.0, 18.0, 26.0, 24.0, 19.0, 20.0, 19.0, 12.0, 8.0, 15.0, 16.0, 11.0, 3.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.04296875, -2.95489501953125, -2.8668212890625, -2.77874755859375, -2.690673828125, -2.60260009765625, -2.5145263671875, -2.42645263671875, -2.33837890625, -2.25030517578125, -2.1622314453125, -2.07415771484375, -1.986083984375, -1.89801025390625, -1.8099365234375, -1.72186279296875, -1.6337890625, -1.54571533203125, -1.4576416015625, -1.36956787109375, -1.281494140625, -1.19342041015625, -1.1053466796875, -1.01727294921875, -0.92919921875, -0.84112548828125, -0.7530517578125, -0.66497802734375, -0.576904296875, -0.48883056640625, -0.4007568359375, -0.31268310546875, -0.224609375, -0.13653564453125, -0.0484619140625, 0.03961181640625, 0.127685546875, 0.21575927734375, 0.3038330078125, 0.39190673828125, 0.47998046875, 0.56805419921875, 0.6561279296875, 0.74420166015625, 0.832275390625, 0.92034912109375, 1.0084228515625, 1.09649658203125, 1.1845703125, 1.27264404296875, 1.3607177734375, 1.44879150390625, 1.536865234375, 1.62493896484375, 1.7130126953125, 1.80108642578125, 1.88916015625, 1.97723388671875, 2.0653076171875, 2.15338134765625, 2.241455078125, 2.32952880859375, 2.4176025390625, 2.50567626953125, 2.59375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 3.0, 10.0, 9.0, 15.0, 14.0, 28.0, 42.0, 79.0, 116.0, 218.0, 290.0, 529.0, 883.0, 1471.0, 2385.0, 4034.0, 6998.0, 11915.0, 20519.0, 36230.0, 66193.0, 122255.0, 224232.0, 243189.0, 137769.0, 73484.0, 40864.0, 22620.0, 13276.0, 7729.0, 4458.0, 2603.0, 1646.0, 933.0, 575.0, 355.0, 234.0, 132.0, 73.0, 44.0, 27.0, 20.0, 17.0, 8.0, 9.0, 3.0, 4.0, 2.0, 2.0, 8.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.3671875, -2.28582763671875, -2.2044677734375, -2.12310791015625, -2.041748046875, -1.96038818359375, -1.8790283203125, -1.79766845703125, -1.71630859375, -1.63494873046875, -1.5535888671875, -1.47222900390625, -1.390869140625, -1.30950927734375, -1.2281494140625, -1.14678955078125, -1.0654296875, -0.98406982421875, -0.9027099609375, -0.82135009765625, -0.739990234375, -0.65863037109375, -0.5772705078125, -0.49591064453125, -0.41455078125, -0.33319091796875, -0.2518310546875, -0.17047119140625, -0.089111328125, -0.00775146484375, 0.0736083984375, 0.15496826171875, 0.236328125, 0.31768798828125, 0.3990478515625, 0.48040771484375, 0.561767578125, 0.64312744140625, 0.7244873046875, 0.80584716796875, 0.88720703125, 0.96856689453125, 1.0499267578125, 1.13128662109375, 1.212646484375, 1.29400634765625, 1.3753662109375, 1.45672607421875, 1.5380859375, 1.61944580078125, 1.7008056640625, 1.78216552734375, 1.863525390625, 1.94488525390625, 2.0262451171875, 2.10760498046875, 2.18896484375, 2.27032470703125, 2.3516845703125, 2.43304443359375, 2.514404296875, 2.59576416015625, 2.6771240234375, 2.75848388671875, 2.83984375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 5.0, 7.0, 6.0, 16.0, 20.0, 9.0, 14.0, 25.0, 21.0, 29.0, 30.0, 37.0, 44.0, 57.0, 73.0, 93.0, 181.0, 329.0, 1365.0, 168.0, 89.0, 57.0, 54.0, 34.0, 36.0, 34.0, 40.0, 26.0, 15.0, 24.0, 25.0, 15.0, 13.0, 7.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -10.047607421875, -9.74365234375, -9.439697265625, -9.1357421875, -8.831787109375, -8.52783203125, -8.223876953125, -7.919921875, -7.615966796875, -7.31201171875, -7.008056640625, -6.7041015625, -6.400146484375, -6.09619140625, -5.792236328125, -5.48828125, -5.184326171875, -4.88037109375, -4.576416015625, -4.2724609375, -3.968505859375, -3.66455078125, -3.360595703125, -3.056640625, -2.752685546875, -2.44873046875, -2.144775390625, -1.8408203125, -1.536865234375, -1.23291015625, -0.928955078125, -0.625, -0.321044921875, -0.01708984375, 0.286865234375, 0.5908203125, 0.894775390625, 1.19873046875, 1.502685546875, 1.806640625, 2.110595703125, 2.41455078125, 2.718505859375, 3.0224609375, 3.326416015625, 3.63037109375, 3.934326171875, 4.23828125, 4.542236328125, 4.84619140625, 5.150146484375, 5.4541015625, 5.758056640625, 6.06201171875, 6.365966796875, 6.669921875, 6.973876953125, 7.27783203125, 7.581787109375, 7.8857421875, 8.189697265625, 8.49365234375, 8.797607421875, 9.1015625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 5.0, 12.0, 11.0, 13.0, 23.0, 22.0, 35.0, 34.0, 49.0, 61.0, 107.0, 145.0, 184.0, 245.0, 479.0, 1280.0, 21219.0, 2789208.0, 326441.0, 4194.0, 798.0, 348.0, 215.0, 163.0, 99.0, 70.0, 53.0, 49.0, 32.0, 20.0, 25.0, 16.0, 8.0, 9.0, 6.0, 11.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.859375, -22.161865234375, -21.46435546875, -20.766845703125, -20.0693359375, -19.371826171875, -18.67431640625, -17.976806640625, -17.279296875, -16.581787109375, -15.88427734375, -15.186767578125, -14.4892578125, -13.791748046875, -13.09423828125, -12.396728515625, -11.69921875, -11.001708984375, -10.30419921875, -9.606689453125, -8.9091796875, -8.211669921875, -7.51416015625, -6.816650390625, -6.119140625, -5.421630859375, -4.72412109375, -4.026611328125, -3.3291015625, -2.631591796875, -1.93408203125, -1.236572265625, -0.5390625, 0.158447265625, 0.85595703125, 1.553466796875, 2.2509765625, 2.948486328125, 3.64599609375, 4.343505859375, 5.041015625, 5.738525390625, 6.43603515625, 7.133544921875, 7.8310546875, 8.528564453125, 9.22607421875, 9.923583984375, 10.62109375, 11.318603515625, 12.01611328125, 12.713623046875, 13.4111328125, 14.108642578125, 14.80615234375, 15.503662109375, 16.201171875, 16.898681640625, 17.59619140625, 18.293701171875, 18.9912109375, 19.688720703125, 20.38623046875, 21.083740234375, 21.78125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 18.0, 76.0, 258.0, 360.0, 239.0, 52.0, 13.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.02573013305664, -29.247669219970703, -27.469608306884766, -25.691547393798828, -23.91348648071289, -22.135425567626953, -20.357362747192383, -18.579301834106445, -16.801240921020508, -15.02318000793457, -13.245119094848633, -11.467057228088379, -9.688996315002441, -7.910935401916504, -6.13287353515625, -4.3548126220703125, -2.576751708984375, -0.7986905574798584, 0.9793705940246582, 2.757431983947754, 4.535492897033691, 6.313553810119629, 8.091615676879883, 9.86967658996582, 11.647737503051758, 13.425798416137695, 15.203859329223633, 16.981922149658203, 18.75998306274414, 20.538043975830078, 22.316104888916016, 24.094165802001953, 25.872230529785156, 27.650291442871094, 29.42835235595703, 31.20641326904297, 32.984474182128906, 34.762535095214844, 36.54059600830078, 38.31865692138672, 40.096717834472656, 41.874778747558594, 43.65283966064453, 45.43090057373047, 47.208961486816406, 48.987022399902344, 50.76508331298828, 52.54314422607422, 54.32120895385742, 56.09926986694336, 57.8773307800293, 59.655391693115234, 61.43345260620117, 63.21151351928711, 64.98957824707031, 66.76763916015625, 68.54570007324219, 70.32376098632812, 72.10182189941406, 73.8798828125, 75.65794372558594, 77.43600463867188, 79.21406555175781, 80.99212646484375, 82.77018737792969]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 1.0, 3.0, 7.0, 6.0, 3.0, 10.0, 14.0, 15.0, 15.0, 18.0, 20.0, 22.0, 22.0, 33.0, 37.0, 38.0, 32.0, 55.0, 41.0, 33.0, 43.0, 45.0, 40.0, 51.0, 45.0, 37.0, 27.0, 33.0, 36.0, 29.0, 32.0, 31.0, 18.0, 26.0, 14.0, 11.0, 6.0, 8.0, 11.0, 7.0, 9.0, 4.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-31.3690242767334, -30.482471466064453, -29.595916748046875, -28.70936393737793, -27.822811126708984, -26.936256408691406, -26.04970359802246, -25.163150787353516, -24.276596069335938, -23.390043258666992, -22.503488540649414, -21.61693572998047, -20.73038101196289, -19.843828201293945, -18.957275390625, -18.070720672607422, -17.184167861938477, -16.29761505126953, -15.411060333251953, -14.524507522583008, -13.637953758239746, -12.751399993896484, -11.864847183227539, -10.978293418884277, -10.091739654541016, -9.205185890197754, -8.318632125854492, -7.432079315185547, -6.545525550842285, -5.658971786499023, -4.77241849899292, -3.8858652114868164, -2.9993133544921875, -2.112759828567505, -1.2262063026428223, -0.33965277671813965, 0.546900749206543, 1.4334545135498047, 2.320007801055908, 3.2065610885620117, 4.093114852905273, 4.979668617248535, 5.866221904754639, 6.752775192260742, 7.639328956604004, 8.525882720947266, 9.412435531616211, 10.298989295959473, 11.185543060302734, 12.072096824645996, 12.958650588989258, 13.845203399658203, 14.731757164001465, 15.618310928344727, 16.504863739013672, 17.39141845703125, 18.277971267700195, 19.16452407836914, 20.05107879638672, 20.937631607055664, 21.82418441772461, 22.710739135742188, 23.597291946411133, 24.483844757080078, 25.370399475097656]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 13.0, 8.0, 14.0, 22.0, 21.0, 21.0, 32.0, 33.0, 25.0, 27.0, 41.0, 39.0, 38.0, 50.0, 50.0, 39.0, 51.0, 29.0, 41.0, 32.0, 35.0, 27.0, 40.0, 35.0, 26.0, 31.0, 32.0, 23.0, 16.0, 19.0, 6.0, 12.0, 7.0, 11.0, 15.0, 5.0, 7.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0], "bins": [-3.615234375, -3.51593017578125, -3.4166259765625, -3.31732177734375, -3.218017578125, -3.11871337890625, -3.0194091796875, -2.92010498046875, -2.82080078125, -2.72149658203125, -2.6221923828125, -2.52288818359375, -2.423583984375, -2.32427978515625, -2.2249755859375, -2.12567138671875, -2.0263671875, -1.92706298828125, -1.8277587890625, -1.72845458984375, -1.629150390625, -1.52984619140625, -1.4305419921875, -1.33123779296875, -1.23193359375, -1.13262939453125, -1.0333251953125, -0.93402099609375, -0.834716796875, -0.73541259765625, -0.6361083984375, -0.53680419921875, -0.4375, -0.33819580078125, -0.2388916015625, -0.13958740234375, -0.040283203125, 0.05902099609375, 0.1583251953125, 0.25762939453125, 0.35693359375, 0.45623779296875, 0.5555419921875, 0.65484619140625, 0.754150390625, 0.85345458984375, 0.9527587890625, 1.05206298828125, 1.1513671875, 1.25067138671875, 1.3499755859375, 1.44927978515625, 1.548583984375, 1.64788818359375, 1.7471923828125, 1.84649658203125, 1.94580078125, 2.04510498046875, 2.1444091796875, 2.24371337890625, 2.343017578125, 2.44232177734375, 2.5416259765625, 2.64093017578125, 2.740234375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 11.0, 16.0, 16.0, 11.0, 23.0, 32.0, 35.0, 36.0, 58.0, 76.0, 167.0, 321.0, 1090.0, 6675.0, 79726.0, 1215415.0, 2564065.0, 303638.0, 19442.0, 2335.0, 502.0, 200.0, 100.0, 55.0, 43.0, 33.0, 27.0, 20.0, 20.0, 10.0, 18.0, 15.0, 11.0, 7.0, 6.0, 5.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.609375, -10.324462890625, -10.03955078125, -9.754638671875, -9.4697265625, -9.184814453125, -8.89990234375, -8.614990234375, -8.330078125, -8.045166015625, -7.76025390625, -7.475341796875, -7.1904296875, -6.905517578125, -6.62060546875, -6.335693359375, -6.05078125, -5.765869140625, -5.48095703125, -5.196044921875, -4.9111328125, -4.626220703125, -4.34130859375, -4.056396484375, -3.771484375, -3.486572265625, -3.20166015625, -2.916748046875, -2.6318359375, -2.346923828125, -2.06201171875, -1.777099609375, -1.4921875, -1.207275390625, -0.92236328125, -0.637451171875, -0.3525390625, -0.067626953125, 0.21728515625, 0.502197265625, 0.787109375, 1.072021484375, 1.35693359375, 1.641845703125, 1.9267578125, 2.211669921875, 2.49658203125, 2.781494140625, 3.06640625, 3.351318359375, 3.63623046875, 3.921142578125, 4.2060546875, 4.490966796875, 4.77587890625, 5.060791015625, 5.345703125, 5.630615234375, 5.91552734375, 6.200439453125, 6.4853515625, 6.770263671875, 7.05517578125, 7.340087890625, 7.625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 7.0, 5.0, 12.0, 14.0, 7.0, 16.0, 23.0, 36.0, 25.0, 50.0, 63.0, 66.0, 99.0, 134.0, 147.0, 187.0, 222.0, 297.0, 331.0, 319.0, 339.0, 316.0, 276.0, 254.0, 158.0, 155.0, 104.0, 83.0, 72.0, 63.0, 45.0, 37.0, 24.0, 16.0, 20.0, 7.0, 14.0, 5.0, 10.0, 7.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.109375, -4.9498291015625, -4.790283203125, -4.6307373046875, -4.47119140625, -4.3116455078125, -4.152099609375, -3.9925537109375, -3.8330078125, -3.6734619140625, -3.513916015625, -3.3543701171875, -3.19482421875, -3.0352783203125, -2.875732421875, -2.7161865234375, -2.556640625, -2.3970947265625, -2.237548828125, -2.0780029296875, -1.91845703125, -1.7589111328125, -1.599365234375, -1.4398193359375, -1.2802734375, -1.1207275390625, -0.961181640625, -0.8016357421875, -0.64208984375, -0.4825439453125, -0.322998046875, -0.1634521484375, -0.00390625, 0.1556396484375, 0.315185546875, 0.4747314453125, 0.63427734375, 0.7938232421875, 0.953369140625, 1.1129150390625, 1.2724609375, 1.4320068359375, 1.591552734375, 1.7510986328125, 1.91064453125, 2.0701904296875, 2.229736328125, 2.3892822265625, 2.548828125, 2.7083740234375, 2.867919921875, 3.0274658203125, 3.18701171875, 3.3465576171875, 3.506103515625, 3.6656494140625, 3.8251953125, 3.9847412109375, 4.144287109375, 4.3038330078125, 4.46337890625, 4.6229248046875, 4.782470703125, 4.9420166015625, 5.1015625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 8.0, 11.0, 5.0, 14.0, 16.0, 19.0, 22.0, 39.0, 47.0, 60.0, 72.0, 94.0, 123.0, 175.0, 261.0, 482.0, 1839.0, 30898.0, 1405143.0, 2672279.0, 77919.0, 2982.0, 641.0, 296.0, 217.0, 147.0, 106.0, 79.0, 65.0, 51.0, 36.0, 33.0, 25.0, 18.0, 6.0, 7.0, 10.0, 13.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.609375, -16.07568359375, -15.5419921875, -15.00830078125, -14.474609375, -13.94091796875, -13.4072265625, -12.87353515625, -12.33984375, -11.80615234375, -11.2724609375, -10.73876953125, -10.205078125, -9.67138671875, -9.1376953125, -8.60400390625, -8.0703125, -7.53662109375, -7.0029296875, -6.46923828125, -5.935546875, -5.40185546875, -4.8681640625, -4.33447265625, -3.80078125, -3.26708984375, -2.7333984375, -2.19970703125, -1.666015625, -1.13232421875, -0.5986328125, -0.06494140625, 0.46875, 1.00244140625, 1.5361328125, 2.06982421875, 2.603515625, 3.13720703125, 3.6708984375, 4.20458984375, 4.73828125, 5.27197265625, 5.8056640625, 6.33935546875, 6.873046875, 7.40673828125, 7.9404296875, 8.47412109375, 9.0078125, 9.54150390625, 10.0751953125, 10.60888671875, 11.142578125, 11.67626953125, 12.2099609375, 12.74365234375, 13.27734375, 13.81103515625, 14.3447265625, 14.87841796875, 15.412109375, 15.94580078125, 16.4794921875, 17.01318359375, 17.546875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 18.0, 25.0, 41.0, 60.0, 80.0, 96.0, 110.0, 99.0, 108.0, 104.0, 80.0, 70.0, 45.0, 23.0, 19.0, 9.0, 4.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.75283432006836, -24.719707489013672, -23.686580657958984, -22.653453826904297, -21.62032699584961, -20.587200164794922, -19.554075241088867, -18.52094841003418, -17.487821578979492, -16.454694747924805, -15.421567916870117, -14.388442039489746, -13.355315208435059, -12.322188377380371, -11.2890625, -10.255935668945312, -9.222808837890625, -8.189682006835938, -7.156555652618408, -6.123429298400879, -5.090302467346191, -4.057175636291504, -3.0240492820739746, -1.9909229278564453, -0.9577960968017578, 0.07533049583435059, 1.108457088470459, 2.1415836811065674, 3.174710273742676, 4.207837104797363, 5.240963459014893, 6.274089813232422, 7.307212829589844, 8.340339660644531, 9.373466491699219, 10.40659236907959, 11.439719200134277, 12.472846031188965, 13.505971908569336, 14.539098739624023, 15.572225570678711, 16.6053524017334, 17.638479232788086, 18.671606063842773, 19.704730987548828, 20.737857818603516, 21.770984649658203, 22.80411148071289, 23.837238311767578, 24.870365142822266, 25.903491973876953, 26.93661880493164, 27.969745635986328, 29.002872467041016, 30.03599739074707, 31.069124221801758, 32.10224914550781, 33.1353759765625, 34.16850280761719, 35.201629638671875, 36.23475646972656, 37.26788330078125, 38.30101013183594, 39.334136962890625, 40.36726379394531]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 10.0, 14.0, 9.0, 12.0, 14.0, 22.0, 19.0, 28.0, 16.0, 24.0, 27.0, 37.0, 42.0, 52.0, 40.0, 51.0, 37.0, 37.0, 43.0, 45.0, 37.0, 33.0, 52.0, 33.0, 35.0, 35.0, 27.0, 30.0, 25.0, 13.0, 20.0, 16.0, 17.0, 11.0, 15.0, 3.0, 10.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.301591873168945, -20.57067108154297, -19.839752197265625, -19.10883140563965, -18.377910614013672, -17.646991729736328, -16.91607093811035, -16.185150146484375, -15.454231262207031, -14.723311424255371, -13.992391586303711, -13.261470794677734, -12.530550956726074, -11.799631118774414, -11.068710327148438, -10.337790489196777, -9.606870651245117, -8.875950813293457, -8.145030975341797, -7.41411018371582, -6.68319034576416, -5.9522705078125, -5.221350193023682, -4.490429878234863, -3.759510040283203, -3.028589963912964, -2.2976698875427246, -1.5667498111724854, -0.8358297348022461, -0.10490965843200684, 0.6260104179382324, 1.3569307327270508, 2.0878524780273438, 2.818772554397583, 3.5496926307678223, 4.280612945556641, 5.011532783508301, 5.742452621459961, 6.473372936248779, 7.204293251037598, 7.935213088989258, 8.666132926940918, 9.397052764892578, 10.127973556518555, 10.858893394470215, 11.589813232421875, 12.320734024047852, 13.051653861999512, 13.782573699951172, 14.513493537902832, 15.244413375854492, 15.975334167480469, 16.706253051757812, 17.43717384338379, 18.168094635009766, 18.89901351928711, 19.629934310913086, 20.360855102539062, 21.091773986816406, 21.822694778442383, 22.55361557006836, 23.284534454345703, 24.01545524597168, 24.746376037597656, 25.477294921875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 8.0, 7.0, 11.0, 13.0, 20.0, 22.0, 30.0, 24.0, 34.0, 47.0, 37.0, 29.0, 27.0, 35.0, 30.0, 37.0, 34.0, 48.0, 42.0, 35.0, 52.0, 32.0, 30.0, 37.0, 27.0, 26.0, 23.0, 33.0, 27.0, 18.0, 17.0, 12.0, 11.0, 21.0, 7.0, 11.0, 12.0, 5.0, 1.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.723419189453125, -2.63238525390625, -2.541351318359375, -2.4503173828125, -2.359283447265625, -2.26824951171875, -2.177215576171875, -2.086181640625, -1.995147705078125, -1.90411376953125, -1.813079833984375, -1.7220458984375, -1.631011962890625, -1.53997802734375, -1.448944091796875, -1.35791015625, -1.266876220703125, -1.17584228515625, -1.084808349609375, -0.9937744140625, -0.902740478515625, -0.81170654296875, -0.720672607421875, -0.629638671875, -0.538604736328125, -0.44757080078125, -0.356536865234375, -0.2655029296875, -0.174468994140625, -0.08343505859375, 0.007598876953125, 0.0986328125, 0.189666748046875, 0.28070068359375, 0.371734619140625, 0.4627685546875, 0.553802490234375, 0.64483642578125, 0.735870361328125, 0.826904296875, 0.917938232421875, 1.00897216796875, 1.100006103515625, 1.1910400390625, 1.282073974609375, 1.37310791015625, 1.464141845703125, 1.55517578125, 1.646209716796875, 1.73724365234375, 1.828277587890625, 1.9193115234375, 2.010345458984375, 2.10137939453125, 2.192413330078125, 2.283447265625, 2.374481201171875, 2.46551513671875, 2.556549072265625, 2.6475830078125, 2.738616943359375, 2.82965087890625, 2.920684814453125, 3.01171875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 10.0, 6.0, 9.0, 15.0, 26.0, 40.0, 52.0, 80.0, 146.0, 186.0, 388.0, 581.0, 1039.0, 1734.0, 2815.0, 4772.0, 7722.0, 12707.0, 20155.0, 31519.0, 47205.0, 67946.0, 91740.0, 114599.0, 129338.0, 128169.0, 111138.0, 88090.0, 64599.0, 44179.0, 29362.0, 18799.0, 11423.0, 7192.0, 4204.0, 2632.0, 1556.0, 916.0, 588.0, 334.0, 208.0, 120.0, 76.0, 50.0, 51.0, 10.0, 16.0, 5.0, 6.0, 3.0, 7.0, 4.0, 3.0], "bins": [-0.80810546875, -0.7856063842773438, -0.7631072998046875, -0.7406082153320312, -0.718109130859375, -0.6956100463867188, -0.6731109619140625, -0.6506118774414062, -0.62811279296875, -0.6056137084960938, -0.5831146240234375, -0.5606155395507812, -0.538116455078125, -0.5156173706054688, -0.4931182861328125, -0.47061920166015625, -0.4481201171875, -0.42562103271484375, -0.4031219482421875, -0.38062286376953125, -0.358123779296875, -0.33562469482421875, -0.3131256103515625, -0.29062652587890625, -0.26812744140625, -0.24562835693359375, -0.2231292724609375, -0.20063018798828125, -0.178131103515625, -0.15563201904296875, -0.1331329345703125, -0.11063385009765625, -0.088134765625, -0.06563568115234375, -0.0431365966796875, -0.02063751220703125, 0.001861572265625, 0.02436065673828125, 0.0468597412109375, 0.06935882568359375, 0.09185791015625, 0.11435699462890625, 0.1368560791015625, 0.15935516357421875, 0.181854248046875, 0.20435333251953125, 0.2268524169921875, 0.24935150146484375, 0.2718505859375, 0.29434967041015625, 0.3168487548828125, 0.33934783935546875, 0.361846923828125, 0.38434600830078125, 0.4068450927734375, 0.42934417724609375, 0.45184326171875, 0.47434234619140625, 0.4968414306640625, 0.5193405151367188, 0.541839599609375, 0.5643386840820312, 0.5868377685546875, 0.6093368530273438, 0.6318359375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 1.0, 8.0, 9.0, 4.0, 10.0, 11.0, 9.0, 13.0, 21.0, 11.0, 28.0, 14.0, 29.0, 18.0, 24.0, 31.0, 43.0, 38.0, 37.0, 42.0, 41.0, 61.0, 1064.0, 35.0, 35.0, 35.0, 28.0, 38.0, 47.0, 36.0, 30.0, 19.0, 17.0, 19.0, 15.0, 11.0, 15.0, 18.0, 12.0, 9.0, 7.0, 3.0, 8.0, 8.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.654296875, -2.576690673828125, -2.49908447265625, -2.421478271484375, -2.3438720703125, -2.266265869140625, -2.18865966796875, -2.111053466796875, -2.033447265625, -1.955841064453125, -1.87823486328125, -1.800628662109375, -1.7230224609375, -1.645416259765625, -1.56781005859375, -1.490203857421875, -1.41259765625, -1.334991455078125, -1.25738525390625, -1.179779052734375, -1.1021728515625, -1.024566650390625, -0.94696044921875, -0.869354248046875, -0.791748046875, -0.714141845703125, -0.63653564453125, -0.558929443359375, -0.4813232421875, -0.403717041015625, -0.32611083984375, -0.248504638671875, -0.1708984375, -0.093292236328125, -0.01568603515625, 0.061920166015625, 0.1395263671875, 0.217132568359375, 0.29473876953125, 0.372344970703125, 0.449951171875, 0.527557373046875, 0.60516357421875, 0.682769775390625, 0.7603759765625, 0.837982177734375, 0.91558837890625, 0.993194580078125, 1.07080078125, 1.148406982421875, 1.22601318359375, 1.303619384765625, 1.3812255859375, 1.458831787109375, 1.53643798828125, 1.614044189453125, 1.691650390625, 1.769256591796875, 1.84686279296875, 1.924468994140625, 2.0020751953125, 2.079681396484375, 2.15728759765625, 2.234893798828125, 2.3125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 3.0, 5.0, 9.0, 7.0, 14.0, 25.0, 31.0, 51.0, 59.0, 110.0, 170.0, 251.0, 415.0, 567.0, 869.0, 1376.0, 2159.0, 3339.0, 5120.0, 7829.0, 12231.0, 19926.0, 36460.0, 1880831.0, 56796.0, 25935.0, 15243.0, 9616.0, 6239.0, 4063.0, 2633.0, 1699.0, 1024.0, 710.0, 440.0, 299.0, 222.0, 121.0, 76.0, 43.0, 43.0, 23.0, 22.0, 11.0, 8.0, 8.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.4738616943359375, -1.424285888671875, -1.3747100830078125, -1.32513427734375, -1.2755584716796875, -1.225982666015625, -1.1764068603515625, -1.1268310546875, -1.0772552490234375, -1.027679443359375, -0.9781036376953125, -0.92852783203125, -0.8789520263671875, -0.829376220703125, -0.7798004150390625, -0.730224609375, -0.6806488037109375, -0.631072998046875, -0.5814971923828125, -0.53192138671875, -0.4823455810546875, -0.432769775390625, -0.3831939697265625, -0.3336181640625, -0.2840423583984375, -0.234466552734375, -0.1848907470703125, -0.13531494140625, -0.0857391357421875, -0.036163330078125, 0.0134124755859375, 0.06298828125, 0.1125640869140625, 0.162139892578125, 0.2117156982421875, 0.26129150390625, 0.3108673095703125, 0.360443115234375, 0.4100189208984375, 0.4595947265625, 0.5091705322265625, 0.558746337890625, 0.6083221435546875, 0.65789794921875, 0.7074737548828125, 0.757049560546875, 0.8066253662109375, 0.856201171875, 0.9057769775390625, 0.955352783203125, 1.0049285888671875, 1.05450439453125, 1.1040802001953125, 1.153656005859375, 1.2032318115234375, 1.2528076171875, 1.3023834228515625, 1.351959228515625, 1.4015350341796875, 1.45111083984375, 1.5006866455078125, 1.550262451171875, 1.5998382568359375, 1.6494140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 5.0, 11.0, 14.0, 9.0, 18.0, 12.0, 22.0, 19.0, 29.0, 26.0, 38.0, 38.0, 43.0, 45.0, 63.0, 65.0, 62.0, 68.0, 59.0, 57.0, 56.0, 31.0, 37.0, 30.0, 27.0, 20.0, 16.0, 19.0, 12.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039581298828125, -0.038125038146972656, -0.03666877746582031, -0.03521251678466797, -0.033756256103515625, -0.03229999542236328, -0.030843734741210938, -0.029387474060058594, -0.02793121337890625, -0.026474952697753906, -0.025018692016601562, -0.02356243133544922, -0.022106170654296875, -0.02064990997314453, -0.019193649291992188, -0.017737388610839844, -0.0162811279296875, -0.014824867248535156, -0.013368606567382812, -0.011912345886230469, -0.010456085205078125, -0.008999824523925781, -0.0075435638427734375, -0.006087303161621094, -0.00463104248046875, -0.0031747817993164062, -0.0017185211181640625, -0.00026226043701171875, 0.001194000244140625, 0.0026502609252929688, 0.0041065216064453125, 0.005562782287597656, 0.00701904296875, 0.008475303649902344, 0.009931564331054688, 0.011387825012207031, 0.012844085693359375, 0.014300346374511719, 0.015756607055664062, 0.017212867736816406, 0.01866912841796875, 0.020125389099121094, 0.021581649780273438, 0.02303791046142578, 0.024494171142578125, 0.02595043182373047, 0.027406692504882812, 0.028862953186035156, 0.0303192138671875, 0.031775474548339844, 0.03323173522949219, 0.03468799591064453, 0.036144256591796875, 0.03760051727294922, 0.03905677795410156, 0.040513038635253906, 0.04196929931640625, 0.043425559997558594, 0.04488182067871094, 0.04633808135986328, 0.047794342041015625, 0.04925060272216797, 0.05070686340332031, 0.052163124084472656, 0.053619384765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 10.0, 12.0, 11.0, 18.0, 21.0, 19.0, 32.0, 38.0, 44.0, 63.0, 110.0, 267.0, 717.0, 37383.0, 1006601.0, 2272.0, 423.0, 155.0, 74.0, 43.0, 45.0, 31.0, 24.0, 19.0, 21.0, 14.0, 14.0, 11.0, 13.0, 7.0, 4.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.2734375, -1.2392730712890625, -1.205108642578125, -1.1709442138671875, -1.13677978515625, -1.1026153564453125, -1.068450927734375, -1.0342864990234375, -1.0001220703125, -0.9659576416015625, -0.931793212890625, -0.8976287841796875, -0.86346435546875, -0.8292999267578125, -0.795135498046875, -0.7609710693359375, -0.726806640625, -0.6926422119140625, -0.658477783203125, -0.6243133544921875, -0.59014892578125, -0.5559844970703125, -0.521820068359375, -0.4876556396484375, -0.4534912109375, -0.4193267822265625, -0.385162353515625, -0.3509979248046875, -0.31683349609375, -0.2826690673828125, -0.248504638671875, -0.2143402099609375, -0.18017578125, -0.1460113525390625, -0.111846923828125, -0.0776824951171875, -0.04351806640625, -0.0093536376953125, 0.024810791015625, 0.0589752197265625, 0.0931396484375, 0.1273040771484375, 0.161468505859375, 0.1956329345703125, 0.22979736328125, 0.2639617919921875, 0.298126220703125, 0.3322906494140625, 0.366455078125, 0.4006195068359375, 0.434783935546875, 0.4689483642578125, 0.50311279296875, 0.5372772216796875, 0.571441650390625, 0.6056060791015625, 0.6397705078125, 0.6739349365234375, 0.708099365234375, 0.7422637939453125, 0.77642822265625, 0.8105926513671875, 0.844757080078125, 0.8789215087890625, 0.9130859375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 14.0, 356.0, 635.0, 11.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.209282636642456, -3.1530399322509766, -3.096797466278076, -3.0405547618865967, -2.984312057495117, -2.928069591522217, -2.8718268871307373, -2.815584421157837, -2.7593417167663574, -2.703099012374878, -2.6468565464019775, -2.590613842010498, -2.5343713760375977, -2.478128671646118, -2.4218859672546387, -2.3656435012817383, -2.309400796890259, -2.2531580924987793, -2.196915626525879, -2.1406729221343994, -2.08443021774292, -2.0281877517700195, -1.97194504737854, -1.91570246219635, -1.8594598770141602, -1.8032172918319702, -1.7469747066497803, -1.6907320022583008, -1.6344894170761108, -1.578246831893921, -1.5220041275024414, -1.4657615423202515, -1.4095189571380615, -1.3532763719558716, -1.2970337867736816, -1.2407910823822021, -1.1845484972000122, -1.1283059120178223, -1.0720632076263428, -1.0158206224441528, -0.9595779776573181, -0.9033353328704834, -0.8470927476882935, -0.7908501625061035, -0.7346075177192688, -0.6783648729324341, -0.6221222877502441, -0.5658797025680542, -0.5096370577812195, -0.45339444279670715, -0.3971518278121948, -0.3409092128276825, -0.28466659784317017, -0.22842398285865784, -0.1721813678741455, -0.11593875288963318, -0.05969613790512085, -0.0034535229206085205, 0.05278909206390381, 0.10903170704841614, 0.16527432203292847, 0.2215169370174408, 0.2777595520019531, 0.33400216698646545, 0.3902447819709778]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 10.0, 6.0, 6.0, 11.0, 17.0, 16.0, 13.0, 23.0, 30.0, 41.0, 39.0, 43.0, 41.0, 47.0, 45.0, 60.0, 34.0, 48.0, 53.0, 46.0, 49.0, 47.0, 46.0, 34.0, 34.0, 26.0, 34.0, 15.0, 20.0, 13.0, 9.0, 15.0, 14.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19973856210708618, -0.19249895215034485, -0.1852593570947647, -0.17801974713802338, -0.17078015208244324, -0.1635405421257019, -0.15630093216896057, -0.14906133711338043, -0.1418217420578003, -0.13458213210105896, -0.12734253704547882, -0.12010292708873749, -0.11286333203315735, -0.10562372207641602, -0.09838411957025528, -0.09114451706409454, -0.08390490710735321, -0.07666530460119247, -0.06942570209503174, -0.062186095863580704, -0.05494649335741997, -0.04770689085125923, -0.0404672846198082, -0.03322768211364746, -0.025988079607486725, -0.01874847710132599, -0.011508872732520103, -0.004269268363714218, 0.002970334142446518, 0.010209936648607254, 0.01744954288005829, 0.024689145386219025, 0.03192874789237976, 0.0391683503985405, 0.04640795290470123, 0.05364755913615227, 0.060887161642313004, 0.06812676787376404, 0.07536637037992477, 0.08260597288608551, 0.08984557539224625, 0.09708517789840698, 0.10432478040456772, 0.11156438291072845, 0.11880399286746979, 0.12604358792304993, 0.13328319787979126, 0.1405228078365326, 0.14776240289211273, 0.15500201284885406, 0.1622416079044342, 0.16948121786117554, 0.17672081291675568, 0.183960422873497, 0.19120001792907715, 0.19843962788581848, 0.20567923784255981, 0.21291884779930115, 0.2201584428548813, 0.22739805281162262, 0.23463764786720276, 0.2418772578239441, 0.24911686778068542, 0.25635647773742676, 0.2635960578918457]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 9.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 9.0, 5.0, 7.0, 14.0, 11.0, 15.0, 22.0, 39.0, 23.0, 35.0, 31.0, 29.0, 36.0, 22.0, 52.0, 36.0, 31.0, 39.0, 42.0, 35.0, 38.0, 33.0, 41.0, 31.0, 40.0, 41.0, 27.0, 22.0, 18.0, 21.0, 20.0, 18.0, 14.0, 20.0, 10.0, 11.0, 10.0, 9.0, 10.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.796875, -2.7091064453125, -2.621337890625, -2.5335693359375, -2.44580078125, -2.3580322265625, -2.270263671875, -2.1824951171875, -2.0947265625, -2.0069580078125, -1.919189453125, -1.8314208984375, -1.74365234375, -1.6558837890625, -1.568115234375, -1.4803466796875, -1.392578125, -1.3048095703125, -1.217041015625, -1.1292724609375, -1.04150390625, -0.9537353515625, -0.865966796875, -0.7781982421875, -0.6904296875, -0.6026611328125, -0.514892578125, -0.4271240234375, -0.33935546875, -0.2515869140625, -0.163818359375, -0.0760498046875, 0.01171875, 0.0994873046875, 0.187255859375, 0.2750244140625, 0.36279296875, 0.4505615234375, 0.538330078125, 0.6260986328125, 0.7138671875, 0.8016357421875, 0.889404296875, 0.9771728515625, 1.06494140625, 1.1527099609375, 1.240478515625, 1.3282470703125, 1.416015625, 1.5037841796875, 1.591552734375, 1.6793212890625, 1.76708984375, 1.8548583984375, 1.942626953125, 2.0303955078125, 2.1181640625, 2.2059326171875, 2.293701171875, 2.3814697265625, 2.46923828125, 2.5570068359375, 2.644775390625, 2.7325439453125, 2.8203125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 7.0, 15.0, 19.0, 20.0, 41.0, 77.0, 123.0, 180.0, 268.0, 505.0, 846.0, 1459.0, 2431.0, 4447.0, 8517.0, 16083.0, 32057.0, 64217.0, 131475.0, 273624.0, 261485.0, 125129.0, 60916.0, 30538.0, 15676.0, 8206.0, 4429.0, 2413.0, 1378.0, 782.0, 519.0, 241.0, 154.0, 89.0, 57.0, 46.0, 22.0, 15.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.009765625, -2.909332275390625, -2.80889892578125, -2.708465576171875, -2.6080322265625, -2.507598876953125, -2.40716552734375, -2.306732177734375, -2.206298828125, -2.105865478515625, -2.00543212890625, -1.904998779296875, -1.8045654296875, -1.704132080078125, -1.60369873046875, -1.503265380859375, -1.40283203125, -1.302398681640625, -1.20196533203125, -1.101531982421875, -1.0010986328125, -0.900665283203125, -0.80023193359375, -0.699798583984375, -0.599365234375, -0.498931884765625, -0.39849853515625, -0.298065185546875, -0.1976318359375, -0.097198486328125, 0.00323486328125, 0.103668212890625, 0.2041015625, 0.304534912109375, 0.40496826171875, 0.505401611328125, 0.6058349609375, 0.706268310546875, 0.80670166015625, 0.907135009765625, 1.007568359375, 1.108001708984375, 1.20843505859375, 1.308868408203125, 1.4093017578125, 1.509735107421875, 1.61016845703125, 1.710601806640625, 1.81103515625, 1.911468505859375, 2.01190185546875, 2.112335205078125, 2.2127685546875, 2.313201904296875, 2.41363525390625, 2.514068603515625, 2.614501953125, 2.714935302734375, 2.81536865234375, 2.915802001953125, 3.0162353515625, 3.116668701171875, 3.21710205078125, 3.317535400390625, 3.41796875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 4.0, 6.0, 5.0, 11.0, 7.0, 18.0, 16.0, 16.0, 25.0, 36.0, 26.0, 46.0, 29.0, 32.0, 60.0, 73.0, 106.0, 187.0, 1385.0, 301.0, 139.0, 111.0, 53.0, 48.0, 46.0, 41.0, 40.0, 22.0, 23.0, 31.0, 20.0, 15.0, 19.0, 9.0, 9.0, 2.0, 9.0, 2.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.921875, -9.6004638671875, -9.279052734375, -8.9576416015625, -8.63623046875, -8.3148193359375, -7.993408203125, -7.6719970703125, -7.3505859375, -7.0291748046875, -6.707763671875, -6.3863525390625, -6.06494140625, -5.7435302734375, -5.422119140625, -5.1007080078125, -4.779296875, -4.4578857421875, -4.136474609375, -3.8150634765625, -3.49365234375, -3.1722412109375, -2.850830078125, -2.5294189453125, -2.2080078125, -1.8865966796875, -1.565185546875, -1.2437744140625, -0.92236328125, -0.6009521484375, -0.279541015625, 0.0418701171875, 0.36328125, 0.6846923828125, 1.006103515625, 1.3275146484375, 1.64892578125, 1.9703369140625, 2.291748046875, 2.6131591796875, 2.9345703125, 3.2559814453125, 3.577392578125, 3.8988037109375, 4.22021484375, 4.5416259765625, 4.863037109375, 5.1844482421875, 5.505859375, 5.8272705078125, 6.148681640625, 6.4700927734375, 6.79150390625, 7.1129150390625, 7.434326171875, 7.7557373046875, 8.0771484375, 8.3985595703125, 8.719970703125, 9.0413818359375, 9.36279296875, 9.6842041015625, 10.005615234375, 10.3270263671875, 10.6484375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 8.0, 9.0, 6.0, 22.0, 15.0, 25.0, 20.0, 47.0, 68.0, 90.0, 121.0, 182.0, 279.0, 430.0, 881.0, 13583.0, 2959422.0, 166794.0, 2081.0, 566.0, 325.0, 214.0, 146.0, 95.0, 77.0, 48.0, 34.0, 22.0, 21.0, 17.0, 15.0, 7.0, 7.0, 5.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-33.0625, -32.162353515625, -31.26220703125, -30.362060546875, -29.4619140625, -28.561767578125, -27.66162109375, -26.761474609375, -25.861328125, -24.961181640625, -24.06103515625, -23.160888671875, -22.2607421875, -21.360595703125, -20.46044921875, -19.560302734375, -18.66015625, -17.760009765625, -16.85986328125, -15.959716796875, -15.0595703125, -14.159423828125, -13.25927734375, -12.359130859375, -11.458984375, -10.558837890625, -9.65869140625, -8.758544921875, -7.8583984375, -6.958251953125, -6.05810546875, -5.157958984375, -4.2578125, -3.357666015625, -2.45751953125, -1.557373046875, -0.6572265625, 0.242919921875, 1.14306640625, 2.043212890625, 2.943359375, 3.843505859375, 4.74365234375, 5.643798828125, 6.5439453125, 7.444091796875, 8.34423828125, 9.244384765625, 10.14453125, 11.044677734375, 11.94482421875, 12.844970703125, 13.7451171875, 14.645263671875, 15.54541015625, 16.445556640625, 17.345703125, 18.245849609375, 19.14599609375, 20.046142578125, 20.9462890625, 21.846435546875, 22.74658203125, 23.646728515625, 24.546875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [4.0, 71.0, 413.0, 424.0, 100.0, 9.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.29199504852295, -5.648717880249023, -3.005441188812256, -0.3621644973754883, 2.2811126708984375, 4.924389839172363, 7.567666053771973, 10.210944175720215, 12.854220390319824, 15.49749755859375, 18.14077377319336, 20.78404998779297, 23.42732810974121, 26.070606231689453, 28.713882446289062, 31.357158660888672, 34.00043487548828, 36.64371109008789, 39.2869873046875, 41.930267333984375, 44.573543548583984, 47.216819763183594, 49.8600959777832, 52.50337219238281, 55.14665222167969, 57.7899284362793, 60.433204650878906, 63.07648468017578, 65.71975708007812, 68.363037109375, 71.00631713867188, 73.64958953857422, 76.2928695678711, 78.93614959716797, 81.57942199707031, 84.22270202636719, 86.86597442626953, 89.5092544555664, 92.15252685546875, 94.79580688476562, 97.4390869140625, 100.08236694335938, 102.72563934326172, 105.3689193725586, 108.01219177246094, 110.65547180175781, 113.29875183105469, 115.94202423095703, 118.58529663085938, 121.22857666015625, 123.8718490600586, 126.51512908935547, 129.1584014892578, 131.8016815185547, 134.44496154785156, 137.08824157714844, 139.7315216064453, 142.3748016357422, 145.01808166503906, 147.66134643554688, 150.30462646484375, 152.94790649414062, 155.5911865234375, 158.23446655273438, 160.8777313232422]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 8.0, 8.0, 12.0, 11.0, 19.0, 11.0, 16.0, 19.0, 20.0, 19.0, 46.0, 25.0, 27.0, 40.0, 41.0, 36.0, 48.0, 47.0, 40.0, 26.0, 42.0, 45.0, 29.0, 30.0, 31.0, 33.0, 29.0, 26.0, 27.0, 26.0, 15.0, 26.0, 17.0, 11.0, 17.0, 15.0, 12.0, 5.0, 6.0, 4.0, 8.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-27.389083862304688, -26.59893035888672, -25.80877685546875, -25.01862335205078, -24.228469848632812, -23.438316345214844, -22.648162841796875, -21.858009338378906, -21.067855834960938, -20.27770233154297, -19.487548828125, -18.69739532470703, -17.907241821289062, -17.117088317871094, -16.326934814453125, -15.536782264709473, -14.74662971496582, -13.956476211547852, -13.166322708129883, -12.376169204711914, -11.586015701293945, -10.795862197875977, -10.005709648132324, -9.215556144714355, -8.425402641296387, -7.635249137878418, -6.845095634460449, -6.054942607879639, -5.26478910446167, -4.474635601043701, -3.6844825744628906, -2.894329071044922, -2.1041736602783203, -1.3140202760696411, -0.5238668918609619, 0.26628637313842773, 1.0564398765563965, 1.8465933799743652, 2.636746406555176, 3.4268999099731445, 4.217053413391113, 5.007206916809082, 5.797360420227051, 6.587513446807861, 7.37766695022583, 8.16781997680664, 8.95797348022461, 9.748126983642578, 10.538280487060547, 11.328433990478516, 12.118587493896484, 12.908740997314453, 13.698894500732422, 14.48904800415039, 15.279200553894043, 16.069355010986328, 16.859508514404297, 17.649662017822266, 18.439815521240234, 19.229969024658203, 20.020122528076172, 20.81027603149414, 21.60042953491211, 22.390583038330078, 23.180734634399414]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 5.0, 5.0, 7.0, 8.0, 16.0, 20.0, 31.0, 23.0, 33.0, 28.0, 40.0, 40.0, 37.0, 41.0, 35.0, 42.0, 45.0, 48.0, 34.0, 39.0, 44.0, 38.0, 35.0, 42.0, 38.0, 35.0, 18.0, 24.0, 17.0, 20.0, 14.0, 18.0, 14.0, 16.0, 8.0, 11.0, 9.0, 10.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.916046142578125, -2.80865478515625, -2.701263427734375, -2.5938720703125, -2.486480712890625, -2.37908935546875, -2.271697998046875, -2.164306640625, -2.056915283203125, -1.94952392578125, -1.842132568359375, -1.7347412109375, -1.627349853515625, -1.51995849609375, -1.412567138671875, -1.30517578125, -1.197784423828125, -1.09039306640625, -0.983001708984375, -0.8756103515625, -0.768218994140625, -0.66082763671875, -0.553436279296875, -0.446044921875, -0.338653564453125, -0.23126220703125, -0.123870849609375, -0.0164794921875, 0.090911865234375, 0.19830322265625, 0.305694580078125, 0.4130859375, 0.520477294921875, 0.62786865234375, 0.735260009765625, 0.8426513671875, 0.950042724609375, 1.05743408203125, 1.164825439453125, 1.272216796875, 1.379608154296875, 1.48699951171875, 1.594390869140625, 1.7017822265625, 1.809173583984375, 1.91656494140625, 2.023956298828125, 2.13134765625, 2.238739013671875, 2.34613037109375, 2.453521728515625, 2.5609130859375, 2.668304443359375, 2.77569580078125, 2.883087158203125, 2.990478515625, 3.097869873046875, 3.20526123046875, 3.312652587890625, 3.4200439453125, 3.527435302734375, 3.63482666015625, 3.742218017578125, 3.849609375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 5.0, 6.0, 4.0, 6.0, 16.0, 28.0, 31.0, 47.0, 47.0, 84.0, 128.0, 248.0, 503.0, 1213.0, 3938.0, 17454.0, 85056.0, 437127.0, 1539177.0, 1564478.0, 436182.0, 84632.0, 17449.0, 4070.0, 1286.0, 465.0, 197.0, 125.0, 75.0, 47.0, 33.0, 30.0, 22.0, 12.0, 10.0, 7.0, 14.0, 6.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.58984375, -5.42047119140625, -5.2510986328125, -5.08172607421875, -4.912353515625, -4.74298095703125, -4.5736083984375, -4.40423583984375, -4.23486328125, -4.06549072265625, -3.8961181640625, -3.72674560546875, -3.557373046875, -3.38800048828125, -3.2186279296875, -3.04925537109375, -2.8798828125, -2.71051025390625, -2.5411376953125, -2.37176513671875, -2.202392578125, -2.03302001953125, -1.8636474609375, -1.69427490234375, -1.52490234375, -1.35552978515625, -1.1861572265625, -1.01678466796875, -0.847412109375, -0.67803955078125, -0.5086669921875, -0.33929443359375, -0.169921875, -0.00054931640625, 0.1688232421875, 0.33819580078125, 0.507568359375, 0.67694091796875, 0.8463134765625, 1.01568603515625, 1.18505859375, 1.35443115234375, 1.5238037109375, 1.69317626953125, 1.862548828125, 2.03192138671875, 2.2012939453125, 2.37066650390625, 2.5400390625, 2.70941162109375, 2.8787841796875, 3.04815673828125, 3.217529296875, 3.38690185546875, 3.5562744140625, 3.72564697265625, 3.89501953125, 4.06439208984375, 4.2337646484375, 4.40313720703125, 4.572509765625, 4.74188232421875, 4.9112548828125, 5.08062744140625, 5.25]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 12.0, 8.0, 10.0, 22.0, 34.0, 72.0, 104.0, 155.0, 225.0, 340.0, 496.0, 626.0, 573.0, 436.0, 324.0, 241.0, 142.0, 100.0, 56.0, 36.0, 26.0, 21.0, 9.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62109375, -5.33697509765625, -5.0528564453125, -4.76873779296875, -4.484619140625, -4.20050048828125, -3.9163818359375, -3.63226318359375, -3.34814453125, -3.06402587890625, -2.7799072265625, -2.49578857421875, -2.211669921875, -1.92755126953125, -1.6434326171875, -1.35931396484375, -1.0751953125, -0.79107666015625, -0.5069580078125, -0.22283935546875, 0.061279296875, 0.34539794921875, 0.6295166015625, 0.91363525390625, 1.19775390625, 1.48187255859375, 1.7659912109375, 2.05010986328125, 2.334228515625, 2.61834716796875, 2.9024658203125, 3.18658447265625, 3.470703125, 3.75482177734375, 4.0389404296875, 4.32305908203125, 4.607177734375, 4.89129638671875, 5.1754150390625, 5.45953369140625, 5.74365234375, 6.02777099609375, 6.3118896484375, 6.59600830078125, 6.880126953125, 7.16424560546875, 7.4483642578125, 7.73248291015625, 8.0166015625, 8.30072021484375, 8.5848388671875, 8.86895751953125, 9.153076171875, 9.43719482421875, 9.7213134765625, 10.00543212890625, 10.28955078125, 10.57366943359375, 10.8577880859375, 11.14190673828125, 11.426025390625, 11.71014404296875, 11.9942626953125, 12.27838134765625, 12.5625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 12.0, 12.0, 22.0, 36.0, 39.0, 78.0, 131.0, 216.0, 332.0, 653.0, 8577.0, 2941902.0, 1237532.0, 3517.0, 527.0, 283.0, 164.0, 115.0, 51.0, 31.0, 18.0, 11.0, 13.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.71875, -38.79296875, -37.8671875, -36.94140625, -36.015625, -35.08984375, -34.1640625, -33.23828125, -32.3125, -31.38671875, -30.4609375, -29.53515625, -28.609375, -27.68359375, -26.7578125, -25.83203125, -24.90625, -23.98046875, -23.0546875, -22.12890625, -21.203125, -20.27734375, -19.3515625, -18.42578125, -17.5, -16.57421875, -15.6484375, -14.72265625, -13.796875, -12.87109375, -11.9453125, -11.01953125, -10.09375, -9.16796875, -8.2421875, -7.31640625, -6.390625, -5.46484375, -4.5390625, -3.61328125, -2.6875, -1.76171875, -0.8359375, 0.08984375, 1.015625, 1.94140625, 2.8671875, 3.79296875, 4.71875, 5.64453125, 6.5703125, 7.49609375, 8.421875, 9.34765625, 10.2734375, 11.19921875, 12.125, 13.05078125, 13.9765625, 14.90234375, 15.828125, 16.75390625, 17.6796875, 18.60546875, 19.53125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 12.0, 32.0, 66.0, 131.0, 162.0, 189.0, 183.0, 122.0, 71.0, 39.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.60527801513672, -73.86095428466797, -72.11663818359375, -70.372314453125, -68.62799835205078, -66.88367462158203, -65.13935852050781, -63.39503479003906, -61.65071487426758, -59.906394958496094, -58.16207504272461, -56.417755126953125, -54.673431396484375, -52.92911148071289, -51.184791564941406, -49.44047164916992, -47.69615173339844, -45.95183181762695, -44.20751190185547, -42.46318817138672, -40.718868255615234, -38.97454833984375, -37.230228424072266, -35.48590850830078, -33.74158477783203, -31.997264862060547, -30.25294303894043, -28.508623123168945, -26.76430320739746, -25.019981384277344, -23.27566146850586, -21.531341552734375, -19.78702163696289, -18.042701721191406, -16.29837989807129, -14.554059982299805, -12.80974006652832, -11.06541919708252, -9.321098327636719, -7.576778411865234, -5.832457542419434, -4.088137149810791, -2.3438165187835693, -0.5994958877563477, 1.144824504852295, 2.8891448974609375, 4.633465766906738, 6.377785682678223, 8.122106552124023, 9.866427421569824, 11.610747337341309, 13.35506820678711, 15.099388122558594, 16.843708038330078, 18.588029861450195, 20.33234977722168, 22.076671600341797, 23.82099151611328, 25.5653133392334, 27.309633255004883, 29.053953170776367, 30.798274993896484, 32.54259490966797, 34.28691482543945, 36.03123474121094]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 7.0, 12.0, 9.0, 14.0, 14.0, 18.0, 19.0, 24.0, 29.0, 26.0, 24.0, 30.0, 37.0, 34.0, 45.0, 35.0, 36.0, 32.0, 42.0, 40.0, 43.0, 36.0, 35.0, 39.0, 31.0, 29.0, 25.0, 21.0, 27.0, 27.0, 23.0, 21.0, 25.0, 16.0, 20.0, 8.0, 6.0, 9.0, 2.0, 11.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-20.096216201782227, -19.49370765686035, -18.89120101928711, -18.288692474365234, -17.68618392944336, -17.083675384521484, -16.481168746948242, -15.878660202026367, -15.276152610778809, -14.67364501953125, -14.071136474609375, -13.468628883361816, -12.866121292114258, -12.263612747192383, -11.661105155944824, -11.058597564697266, -10.45608901977539, -9.853581428527832, -9.251072883605957, -8.648565292358398, -8.046056747436523, -7.443549156188965, -6.841041564941406, -6.2385334968566895, -5.636025428771973, -5.033517360687256, -4.431009292602539, -3.8285017013549805, -3.2259936332702637, -2.623485565185547, -2.020977735519409, -1.4184699058532715, -0.8159599304199219, -0.21345198154449463, 0.3890559673309326, 0.9915639162063599, 1.594071865081787, 2.196579933166504, 2.7990877628326416, 3.4015955924987793, 4.004103660583496, 4.606611728668213, 5.20911979675293, 5.811627388000488, 6.414135456085205, 7.016643524169922, 7.6191511154174805, 8.221658706665039, 8.824167251586914, 9.426674842834473, 10.029183387756348, 10.631690979003906, 11.234199523925781, 11.83670711517334, 12.439214706420898, 13.041723251342773, 13.644230842590332, 14.24673843383789, 14.849246978759766, 15.451754570007324, 16.054262161254883, 16.656770706176758, 17.259279251098633, 17.861785888671875, 18.46429443359375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 8.0, 14.0, 15.0, 12.0, 26.0, 22.0, 30.0, 27.0, 26.0, 35.0, 43.0, 35.0, 35.0, 28.0, 45.0, 41.0, 34.0, 44.0, 36.0, 44.0, 49.0, 27.0, 29.0, 37.0, 30.0, 25.0, 19.0, 24.0, 20.0, 16.0, 19.0, 15.0, 7.0, 16.0, 10.0, 14.0, 6.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.177734375, -3.08209228515625, -2.9864501953125, -2.89080810546875, -2.795166015625, -2.69952392578125, -2.6038818359375, -2.50823974609375, -2.41259765625, -2.31695556640625, -2.2213134765625, -2.12567138671875, -2.030029296875, -1.93438720703125, -1.8387451171875, -1.74310302734375, -1.6474609375, -1.55181884765625, -1.4561767578125, -1.36053466796875, -1.264892578125, -1.16925048828125, -1.0736083984375, -0.97796630859375, -0.88232421875, -0.78668212890625, -0.6910400390625, -0.59539794921875, -0.499755859375, -0.40411376953125, -0.3084716796875, -0.21282958984375, -0.1171875, -0.02154541015625, 0.0740966796875, 0.16973876953125, 0.265380859375, 0.36102294921875, 0.4566650390625, 0.55230712890625, 0.64794921875, 0.74359130859375, 0.8392333984375, 0.93487548828125, 1.030517578125, 1.12615966796875, 1.2218017578125, 1.31744384765625, 1.4130859375, 1.50872802734375, 1.6043701171875, 1.70001220703125, 1.795654296875, 1.89129638671875, 1.9869384765625, 2.08258056640625, 2.17822265625, 2.27386474609375, 2.3695068359375, 2.46514892578125, 2.560791015625, 2.65643310546875, 2.7520751953125, 2.84771728515625, 2.943359375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 21.0, 22.0, 48.0, 61.0, 116.0, 196.0, 301.0, 484.0, 809.0, 1336.0, 2148.0, 3503.0, 5340.0, 8254.0, 12546.0, 18525.0, 26622.0, 37705.0, 51501.0, 68283.0, 84608.0, 99644.0, 108477.0, 107804.0, 98340.0, 82428.0, 66054.0, 50194.0, 36242.0, 25757.0, 17838.0, 11950.0, 7856.0, 4955.0, 3186.0, 2069.0, 1349.0, 777.0, 504.0, 278.0, 171.0, 88.0, 71.0, 47.0, 18.0, 17.0, 11.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5690994262695312, -0.5512847900390625, -0.5334701538085938, -0.515655517578125, -0.49784088134765625, -0.4800262451171875, -0.46221160888671875, -0.44439697265625, -0.42658233642578125, -0.4087677001953125, -0.39095306396484375, -0.373138427734375, -0.35532379150390625, -0.3375091552734375, -0.31969451904296875, -0.3018798828125, -0.28406524658203125, -0.2662506103515625, -0.24843597412109375, -0.230621337890625, -0.21280670166015625, -0.1949920654296875, -0.17717742919921875, -0.15936279296875, -0.14154815673828125, -0.1237335205078125, -0.10591888427734375, -0.088104248046875, -0.07028961181640625, -0.0524749755859375, -0.03466033935546875, -0.016845703125, 0.00096893310546875, 0.0187835693359375, 0.03659820556640625, 0.054412841796875, 0.07222747802734375, 0.0900421142578125, 0.10785675048828125, 0.12567138671875, 0.14348602294921875, 0.1613006591796875, 0.17911529541015625, 0.196929931640625, 0.21474456787109375, 0.2325592041015625, 0.25037384033203125, 0.2681884765625, 0.28600311279296875, 0.3038177490234375, 0.32163238525390625, 0.339447021484375, 0.35726165771484375, 0.3750762939453125, 0.39289093017578125, 0.41070556640625, 0.42852020263671875, 0.4463348388671875, 0.46414947509765625, 0.481964111328125, 0.49977874755859375, 0.5175933837890625, 0.5354080200195312, 0.55322265625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 8.0, 11.0, 5.0, 7.0, 16.0, 10.0, 16.0, 13.0, 13.0, 20.0, 24.0, 29.0, 20.0, 30.0, 26.0, 29.0, 40.0, 40.0, 43.0, 40.0, 36.0, 1057.0, 39.0, 36.0, 39.0, 33.0, 33.0, 18.0, 23.0, 41.0, 34.0, 26.0, 22.0, 20.0, 22.0, 19.0, 15.0, 8.0, 14.0, 16.0, 4.0, 6.0, 9.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.671875, -2.592742919921875, -2.51361083984375, -2.434478759765625, -2.3553466796875, -2.276214599609375, -2.19708251953125, -2.117950439453125, -2.038818359375, -1.959686279296875, -1.88055419921875, -1.801422119140625, -1.7222900390625, -1.643157958984375, -1.56402587890625, -1.484893798828125, -1.40576171875, -1.326629638671875, -1.24749755859375, -1.168365478515625, -1.0892333984375, -1.010101318359375, -0.93096923828125, -0.851837158203125, -0.772705078125, -0.693572998046875, -0.61444091796875, -0.535308837890625, -0.4561767578125, -0.377044677734375, -0.29791259765625, -0.218780517578125, -0.1396484375, -0.060516357421875, 0.01861572265625, 0.097747802734375, 0.1768798828125, 0.256011962890625, 0.33514404296875, 0.414276123046875, 0.493408203125, 0.572540283203125, 0.65167236328125, 0.730804443359375, 0.8099365234375, 0.889068603515625, 0.96820068359375, 1.047332763671875, 1.12646484375, 1.205596923828125, 1.28472900390625, 1.363861083984375, 1.4429931640625, 1.522125244140625, 1.60125732421875, 1.680389404296875, 1.759521484375, 1.838653564453125, 1.91778564453125, 1.996917724609375, 2.0760498046875, 2.155181884765625, 2.23431396484375, 2.313446044921875, 2.392578125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [6.0, 2.0, 4.0, 4.0, 4.0, 10.0, 19.0, 20.0, 22.0, 25.0, 56.0, 70.0, 133.0, 162.0, 222.0, 295.0, 494.0, 652.0, 1093.0, 1488.0, 2025.0, 3202.0, 4407.0, 6327.0, 8802.0, 13036.0, 20626.0, 34819.0, 1866085.0, 55811.0, 25916.0, 16205.0, 10806.0, 7455.0, 5157.0, 3490.0, 2481.0, 1772.0, 1302.0, 830.0, 612.0, 418.0, 244.0, 173.0, 118.0, 69.0, 52.0, 45.0, 31.0, 18.0, 9.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1376953125, -1.0980987548828125, -1.058502197265625, -1.0189056396484375, -0.97930908203125, -0.9397125244140625, -0.900115966796875, -0.8605194091796875, -0.8209228515625, -0.7813262939453125, -0.741729736328125, -0.7021331787109375, -0.66253662109375, -0.6229400634765625, -0.583343505859375, -0.5437469482421875, -0.504150390625, -0.4645538330078125, -0.424957275390625, -0.3853607177734375, -0.34576416015625, -0.3061676025390625, -0.266571044921875, -0.2269744873046875, -0.1873779296875, -0.1477813720703125, -0.108184814453125, -0.0685882568359375, -0.02899169921875, 0.0106048583984375, 0.050201416015625, 0.0897979736328125, 0.12939453125, 0.1689910888671875, 0.208587646484375, 0.2481842041015625, 0.28778076171875, 0.3273773193359375, 0.366973876953125, 0.4065704345703125, 0.4461669921875, 0.4857635498046875, 0.525360107421875, 0.5649566650390625, 0.60455322265625, 0.6441497802734375, 0.683746337890625, 0.7233428955078125, 0.762939453125, 0.8025360107421875, 0.842132568359375, 0.8817291259765625, 0.92132568359375, 0.9609222412109375, 1.000518798828125, 1.0401153564453125, 1.0797119140625, 1.1193084716796875, 1.158905029296875, 1.1985015869140625, 1.23809814453125, 1.2776947021484375, 1.317291259765625, 1.3568878173828125, 1.396484375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 5.0, 6.0, 12.0, 17.0, 17.0, 27.0, 26.0, 53.0, 60.0, 65.0, 105.0, 127.0, 107.0, 99.0, 71.0, 39.0, 29.0, 24.0, 26.0, 17.0, 10.0, 8.0, 10.0, 3.0, 3.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.043975830078125, -0.04259347915649414, -0.04121112823486328, -0.03982877731323242, -0.03844642639160156, -0.0370640754699707, -0.035681724548339844, -0.034299373626708984, -0.032917022705078125, -0.031534671783447266, -0.030152320861816406, -0.028769969940185547, -0.027387619018554688, -0.026005268096923828, -0.02462291717529297, -0.02324056625366211, -0.02185821533203125, -0.02047586441040039, -0.01909351348876953, -0.017711162567138672, -0.016328811645507812, -0.014946460723876953, -0.013564109802246094, -0.012181758880615234, -0.010799407958984375, -0.009417057037353516, -0.008034706115722656, -0.006652355194091797, -0.0052700042724609375, -0.003887653350830078, -0.0025053024291992188, -0.0011229515075683594, 0.0002593994140625, 0.0016417503356933594, 0.0030241012573242188, 0.004406452178955078, 0.0057888031005859375, 0.007171154022216797, 0.008553504943847656, 0.009935855865478516, 0.011318206787109375, 0.012700557708740234, 0.014082908630371094, 0.015465259552001953, 0.016847610473632812, 0.018229961395263672, 0.01961231231689453, 0.02099466323852539, 0.02237701416015625, 0.02375936508178711, 0.02514171600341797, 0.026524066925048828, 0.027906417846679688, 0.029288768768310547, 0.030671119689941406, 0.032053470611572266, 0.033435821533203125, 0.034818172454833984, 0.036200523376464844, 0.0375828742980957, 0.03896522521972656, 0.04034757614135742, 0.04172992706298828, 0.04311227798461914, 0.04449462890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 14.0, 12.0, 19.0, 27.0, 47.0, 62.0, 117.0, 183.0, 655.0, 72980.0, 971783.0, 1928.0, 280.0, 147.0, 83.0, 48.0, 40.0, 25.0, 22.0, 14.0, 13.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9833984375, -0.9528579711914062, -0.9223175048828125, -0.8917770385742188, -0.861236572265625, -0.8306961059570312, -0.8001556396484375, -0.7696151733398438, -0.73907470703125, -0.7085342407226562, -0.6779937744140625, -0.6474533081054688, -0.616912841796875, -0.5863723754882812, -0.5558319091796875, -0.5252914428710938, -0.4947509765625, -0.46421051025390625, -0.4336700439453125, -0.40312957763671875, -0.372589111328125, -0.34204864501953125, -0.3115081787109375, -0.28096771240234375, -0.25042724609375, -0.21988677978515625, -0.1893463134765625, -0.15880584716796875, -0.128265380859375, -0.09772491455078125, -0.0671844482421875, -0.03664398193359375, -0.006103515625, 0.02443695068359375, 0.0549774169921875, 0.08551788330078125, 0.116058349609375, 0.14659881591796875, 0.1771392822265625, 0.20767974853515625, 0.23822021484375, 0.26876068115234375, 0.2993011474609375, 0.32984161376953125, 0.360382080078125, 0.39092254638671875, 0.4214630126953125, 0.45200347900390625, 0.4825439453125, 0.5130844116210938, 0.5436248779296875, 0.5741653442382812, 0.604705810546875, 0.6352462768554688, 0.6657867431640625, 0.6963272094726562, 0.72686767578125, 0.7574081420898438, 0.7879486083984375, 0.8184890747070312, 0.849029541015625, 0.8795700073242188, 0.9101104736328125, 0.9406509399414062, 0.97119140625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 8.0, 19.0, 108.0, 615.0, 233.0, 22.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1631232500076294, -1.1422538757324219, -1.1213845014572144, -1.1005152463912964, -1.0796458721160889, -1.0587764978408813, -1.0379071235656738, -1.0170377492904663, -0.9961684346199036, -0.975299060344696, -0.9544297456741333, -0.9335603713989258, -0.912691056728363, -0.8918216824531555, -0.8709523677825928, -0.8500829935073853, -0.8292136192321777, -0.8083442449569702, -0.7874749302864075, -0.7666055560112, -0.7457362413406372, -0.7248668670654297, -0.7039974927902222, -0.6831281781196594, -0.6622588634490967, -0.6413894891738892, -0.6205201745033264, -0.5996508002281189, -0.5787814855575562, -0.5579121112823486, -0.5370427370071411, -0.5161734223365784, -0.49530404806137085, -0.4744347035884857, -0.4535653591156006, -0.43269598484039307, -0.41182664036750793, -0.3909572958946228, -0.37008795142173767, -0.34921860694885254, -0.328349232673645, -0.3074798882007599, -0.28661054372787476, -0.26574116945266724, -0.2448718249797821, -0.22400248050689697, -0.20313313603401184, -0.18226377665996552, -0.16139444708824158, -0.14052510261535645, -0.11965574324131012, -0.09878639876842499, -0.07791704684495926, -0.05704769492149353, -0.0361783504486084, -0.015308991074562073, 0.005560353398323059, 0.02642970345914364, 0.04729905351996422, 0.06816840171813965, 0.08903775364160538, 0.1099071055650711, 0.13077645003795624, 0.15164580941200256, 0.1725151538848877]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 9.0, 6.0, 15.0, 22.0, 12.0, 25.0, 15.0, 25.0, 24.0, 39.0, 42.0, 43.0, 38.0, 50.0, 48.0, 33.0, 48.0, 44.0, 53.0, 39.0, 49.0, 37.0, 45.0, 46.0, 35.0, 31.0, 13.0, 23.0, 12.0, 14.0, 11.0, 12.0, 8.0, 8.0, 7.0, 9.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08309537172317505, -0.08034725487232208, -0.07759914547204971, -0.07485102862119675, -0.07210291922092438, -0.06935480237007141, -0.06660668551921844, -0.06385856866836548, -0.06111045926809311, -0.05836234614253044, -0.05561423301696777, -0.05286611616611481, -0.05011800304055214, -0.04736988991498947, -0.044621773064136505, -0.04187365993857384, -0.03912554681301117, -0.0363774336874485, -0.033629320561885834, -0.030881203711032867, -0.0281330905854702, -0.025384977459907532, -0.022636862471699715, -0.019888747483491898, -0.01714063435792923, -0.014392520301043987, -0.011644406244158745, -0.008896292187273502, -0.00614817813038826, -0.0034000640735030174, -0.000651950016617775, 0.002096164971590042, 0.00484427809715271, 0.007592392154037952, 0.010340506210923195, 0.013088620267808437, 0.01583673432469368, 0.018584847450256348, 0.021332962438464165, 0.024081077426671982, 0.02682919055223465, 0.029577303677797318, 0.032325416803359985, 0.03507353365421295, 0.03782164677977562, 0.04056975990533829, 0.043317876756191254, 0.04606598988175392, 0.04881410300731659, 0.05156221613287926, 0.054310329258441925, 0.05705844610929489, 0.05980655923485756, 0.06255467236042023, 0.0653027892112732, 0.06805090606212616, 0.07079901546239853, 0.0735471323132515, 0.07629524171352386, 0.07904335856437683, 0.0817914754152298, 0.08453958481550217, 0.08728770166635513, 0.0900358110666275, 0.09278392791748047]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 12.0, 14.0, 17.0, 16.0, 16.0, 34.0, 22.0, 26.0, 25.0, 31.0, 41.0, 35.0, 27.0, 32.0, 35.0, 38.0, 46.0, 28.0, 32.0, 35.0, 37.0, 24.0, 33.0, 39.0, 34.0, 30.0, 26.0, 23.0, 19.0, 22.0, 18.0, 17.0, 16.0, 16.0, 12.0, 10.0, 6.0, 3.0, 9.0, 10.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-2.87890625, -2.791290283203125, -2.70367431640625, -2.616058349609375, -2.5284423828125, -2.440826416015625, -2.35321044921875, -2.265594482421875, -2.177978515625, -2.090362548828125, -2.00274658203125, -1.915130615234375, -1.8275146484375, -1.739898681640625, -1.65228271484375, -1.564666748046875, -1.47705078125, -1.389434814453125, -1.30181884765625, -1.214202880859375, -1.1265869140625, -1.038970947265625, -0.95135498046875, -0.863739013671875, -0.776123046875, -0.688507080078125, -0.60089111328125, -0.513275146484375, -0.4256591796875, -0.338043212890625, -0.25042724609375, -0.162811279296875, -0.0751953125, 0.012420654296875, 0.10003662109375, 0.187652587890625, 0.2752685546875, 0.362884521484375, 0.45050048828125, 0.538116455078125, 0.625732421875, 0.713348388671875, 0.80096435546875, 0.888580322265625, 0.9761962890625, 1.063812255859375, 1.15142822265625, 1.239044189453125, 1.32666015625, 1.414276123046875, 1.50189208984375, 1.589508056640625, 1.6771240234375, 1.764739990234375, 1.85235595703125, 1.939971923828125, 2.027587890625, 2.115203857421875, 2.20281982421875, 2.290435791015625, 2.3780517578125, 2.465667724609375, 2.55328369140625, 2.640899658203125, 2.728515625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 8.0, 9.0, 11.0, 12.0, 17.0, 25.0, 38.0, 43.0, 76.0, 100.0, 148.0, 221.0, 360.0, 560.0, 839.0, 1410.0, 2450.0, 4283.0, 7895.0, 15570.0, 30966.0, 61084.0, 111462.0, 204568.0, 294058.0, 142978.0, 81127.0, 42561.0, 21033.0, 11030.0, 5660.0, 3156.0, 1775.0, 1111.0, 667.0, 412.0, 237.0, 179.0, 142.0, 76.0, 53.0, 48.0, 22.0, 13.0, 10.0, 20.0, 8.0, 10.0, 4.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0], "bins": [-3.171875, -3.076416015625, -2.98095703125, -2.885498046875, -2.7900390625, -2.694580078125, -2.59912109375, -2.503662109375, -2.408203125, -2.312744140625, -2.21728515625, -2.121826171875, -2.0263671875, -1.930908203125, -1.83544921875, -1.739990234375, -1.64453125, -1.549072265625, -1.45361328125, -1.358154296875, -1.2626953125, -1.167236328125, -1.07177734375, -0.976318359375, -0.880859375, -0.785400390625, -0.68994140625, -0.594482421875, -0.4990234375, -0.403564453125, -0.30810546875, -0.212646484375, -0.1171875, -0.021728515625, 0.07373046875, 0.169189453125, 0.2646484375, 0.360107421875, 0.45556640625, 0.551025390625, 0.646484375, 0.741943359375, 0.83740234375, 0.932861328125, 1.0283203125, 1.123779296875, 1.21923828125, 1.314697265625, 1.41015625, 1.505615234375, 1.60107421875, 1.696533203125, 1.7919921875, 1.887451171875, 1.98291015625, 2.078369140625, 2.173828125, 2.269287109375, 2.36474609375, 2.460205078125, 2.5556640625, 2.651123046875, 2.74658203125, 2.842041015625, 2.9375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 4.0, 6.0, 14.0, 12.0, 5.0, 9.0, 11.0, 14.0, 25.0, 20.0, 18.0, 20.0, 24.0, 36.0, 24.0, 26.0, 39.0, 51.0, 80.0, 120.0, 231.0, 1414.0, 222.0, 123.0, 86.0, 49.0, 49.0, 40.0, 27.0, 21.0, 41.0, 22.0, 29.0, 24.0, 16.0, 14.0, 14.0, 13.0, 10.0, 5.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5234375, -8.22412109375, -7.9248046875, -7.62548828125, -7.326171875, -7.02685546875, -6.7275390625, -6.42822265625, -6.12890625, -5.82958984375, -5.5302734375, -5.23095703125, -4.931640625, -4.63232421875, -4.3330078125, -4.03369140625, -3.734375, -3.43505859375, -3.1357421875, -2.83642578125, -2.537109375, -2.23779296875, -1.9384765625, -1.63916015625, -1.33984375, -1.04052734375, -0.7412109375, -0.44189453125, -0.142578125, 0.15673828125, 0.4560546875, 0.75537109375, 1.0546875, 1.35400390625, 1.6533203125, 1.95263671875, 2.251953125, 2.55126953125, 2.8505859375, 3.14990234375, 3.44921875, 3.74853515625, 4.0478515625, 4.34716796875, 4.646484375, 4.94580078125, 5.2451171875, 5.54443359375, 5.84375, 6.14306640625, 6.4423828125, 6.74169921875, 7.041015625, 7.34033203125, 7.6396484375, 7.93896484375, 8.23828125, 8.53759765625, 8.8369140625, 9.13623046875, 9.435546875, 9.73486328125, 10.0341796875, 10.33349609375, 10.6328125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 4.0, 5.0, 4.0, 8.0, 18.0, 12.0, 21.0, 40.0, 36.0, 53.0, 86.0, 107.0, 171.0, 268.0, 415.0, 972.0, 4126.0, 453248.0, 2674432.0, 8888.0, 1343.0, 568.0, 246.0, 201.0, 108.0, 80.0, 63.0, 39.0, 35.0, 34.0, 13.0, 21.0, 9.0, 10.0, 6.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.59375, -28.67333984375, -27.7529296875, -26.83251953125, -25.912109375, -24.99169921875, -24.0712890625, -23.15087890625, -22.23046875, -21.31005859375, -20.3896484375, -19.46923828125, -18.548828125, -17.62841796875, -16.7080078125, -15.78759765625, -14.8671875, -13.94677734375, -13.0263671875, -12.10595703125, -11.185546875, -10.26513671875, -9.3447265625, -8.42431640625, -7.50390625, -6.58349609375, -5.6630859375, -4.74267578125, -3.822265625, -2.90185546875, -1.9814453125, -1.06103515625, -0.140625, 0.77978515625, 1.7001953125, 2.62060546875, 3.541015625, 4.46142578125, 5.3818359375, 6.30224609375, 7.22265625, 8.14306640625, 9.0634765625, 9.98388671875, 10.904296875, 11.82470703125, 12.7451171875, 13.66552734375, 14.5859375, 15.50634765625, 16.4267578125, 17.34716796875, 18.267578125, 19.18798828125, 20.1083984375, 21.02880859375, 21.94921875, 22.86962890625, 23.7900390625, 24.71044921875, 25.630859375, 26.55126953125, 27.4716796875, 28.39208984375, 29.3125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 172.0, 495.0, 313.0, 31.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.747785568237305, -12.157312393188477, -9.566839218139648, -6.97636604309082, -4.385892868041992, -1.795419692993164, 0.7950534820556641, 3.385526657104492, 5.97599983215332, 8.566473007202148, 11.156946182250977, 13.747419357299805, 16.337892532348633, 18.92836570739746, 21.51883888244629, 24.109312057495117, 26.699785232543945, 29.290258407592773, 31.8807315826416, 34.47120666503906, 37.061676025390625, 39.65215301513672, 42.24262237548828, 44.833099365234375, 47.42356872558594, 50.014041900634766, 52.604515075683594, 55.19498825073242, 57.78546142578125, 60.37593460083008, 62.966407775878906, 65.556884765625, 68.14735412597656, 70.73782348632812, 73.32830047607422, 75.91877746582031, 78.50924682617188, 81.09971618652344, 83.69019317626953, 86.28067016601562, 88.87113952636719, 91.46160888671875, 94.05208587646484, 96.64256286621094, 99.2330322265625, 101.82350158691406, 104.41397857666016, 107.00445556640625, 109.59492492675781, 112.18539428710938, 114.77587127685547, 117.36634826660156, 119.95681762695312, 122.54728698730469, 125.13776397705078, 127.72824096679688, 130.31871032714844, 132.9091796875, 135.49966430664062, 138.0901336669922, 140.68060302734375, 143.2710723876953, 145.86154174804688, 148.4520263671875, 151.04249572753906]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 5.0, 1.0, 6.0, 5.0, 7.0, 4.0, 10.0, 7.0, 13.0, 16.0, 18.0, 17.0, 22.0, 21.0, 17.0, 36.0, 24.0, 28.0, 25.0, 28.0, 35.0, 29.0, 42.0, 43.0, 45.0, 50.0, 41.0, 39.0, 37.0, 46.0, 30.0, 30.0, 25.0, 33.0, 24.0, 24.0, 19.0, 18.0, 11.0, 16.0, 13.0, 14.0, 10.0, 6.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-28.80816078186035, -28.03438949584961, -27.260618209838867, -26.486846923828125, -25.713075637817383, -24.93930435180664, -24.16553497314453, -23.391761779785156, -22.617992401123047, -21.844221115112305, -21.070449829101562, -20.29667854309082, -19.522907257080078, -18.749135971069336, -17.975364685058594, -17.201595306396484, -16.42782211303711, -15.654050827026367, -14.880279541015625, -14.106508255004883, -13.33273696899414, -12.558965682983398, -11.785195350646973, -11.01142406463623, -10.237652778625488, -9.463881492614746, -8.690110206604004, -7.91633939743042, -7.142568111419678, -6.3687968254089355, -5.595026016235352, -4.821254730224609, -4.0474853515625, -3.273714065551758, -2.4999430179595947, -1.7261719703674316, -0.9524006843566895, -0.17862939834594727, 0.5951414108276367, 1.368912696838379, 2.142683982849121, 2.9164552688598633, 3.6902263164520264, 4.4639973640441895, 5.237768650054932, 6.011539936065674, 6.785310745239258, 7.55908203125, 8.332853317260742, 9.106624603271484, 9.880395889282227, 10.654167175292969, 11.427938461303711, 12.201709747314453, 12.975480079650879, 13.749251365661621, 14.523022651672363, 15.296793937683105, 16.07056427001953, 16.844335556030273, 17.618106842041016, 18.391878128051758, 19.1656494140625, 19.939420700073242, 20.713191986083984]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 9.0, 6.0, 12.0, 4.0, 14.0, 16.0, 14.0, 23.0, 29.0, 27.0, 28.0, 28.0, 26.0, 25.0, 33.0, 35.0, 39.0, 56.0, 31.0, 37.0, 45.0, 37.0, 42.0, 35.0, 31.0, 39.0, 38.0, 22.0, 22.0, 20.0, 25.0, 22.0, 18.0, 20.0, 18.0, 11.0, 12.0, 7.0, 8.0, 12.0, 4.0, 4.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919921875, -2.819610595703125, -2.71929931640625, -2.618988037109375, -2.5186767578125, -2.418365478515625, -2.31805419921875, -2.217742919921875, -2.117431640625, -2.017120361328125, -1.91680908203125, -1.816497802734375, -1.7161865234375, -1.615875244140625, -1.51556396484375, -1.415252685546875, -1.31494140625, -1.214630126953125, -1.11431884765625, -1.014007568359375, -0.9136962890625, -0.813385009765625, -0.71307373046875, -0.612762451171875, -0.512451171875, -0.412139892578125, -0.31182861328125, -0.211517333984375, -0.1112060546875, -0.010894775390625, 0.08941650390625, 0.189727783203125, 0.2900390625, 0.390350341796875, 0.49066162109375, 0.590972900390625, 0.6912841796875, 0.791595458984375, 0.89190673828125, 0.992218017578125, 1.092529296875, 1.192840576171875, 1.29315185546875, 1.393463134765625, 1.4937744140625, 1.594085693359375, 1.69439697265625, 1.794708251953125, 1.89501953125, 1.995330810546875, 2.09564208984375, 2.195953369140625, 2.2962646484375, 2.396575927734375, 2.49688720703125, 2.597198486328125, 2.697509765625, 2.797821044921875, 2.89813232421875, 2.998443603515625, 3.0987548828125, 3.199066162109375, 3.29937744140625, 3.399688720703125, 3.5]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 2.0, 6.0, 8.0, 7.0, 8.0, 14.0, 16.0, 14.0, 14.0, 27.0, 37.0, 36.0, 36.0, 56.0, 68.0, 121.0, 150.0, 244.0, 586.0, 1550.0, 5309.0, 22239.0, 105786.0, 496594.0, 1566239.0, 1458128.0, 422886.0, 87885.0, 18860.0, 4583.0, 1368.0, 560.0, 248.0, 124.0, 96.0, 72.0, 55.0, 34.0, 39.0, 29.0, 19.0, 18.0, 23.0, 19.0, 18.0, 11.0, 12.0, 12.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.1640625, -4.9971923828125, -4.830322265625, -4.6634521484375, -4.49658203125, -4.3297119140625, -4.162841796875, -3.9959716796875, -3.8291015625, -3.6622314453125, -3.495361328125, -3.3284912109375, -3.16162109375, -2.9947509765625, -2.827880859375, -2.6610107421875, -2.494140625, -2.3272705078125, -2.160400390625, -1.9935302734375, -1.82666015625, -1.6597900390625, -1.492919921875, -1.3260498046875, -1.1591796875, -0.9923095703125, -0.825439453125, -0.6585693359375, -0.49169921875, -0.3248291015625, -0.157958984375, 0.0089111328125, 0.17578125, 0.3426513671875, 0.509521484375, 0.6763916015625, 0.84326171875, 1.0101318359375, 1.177001953125, 1.3438720703125, 1.5107421875, 1.6776123046875, 1.844482421875, 2.0113525390625, 2.17822265625, 2.3450927734375, 2.511962890625, 2.6788330078125, 2.845703125, 3.0125732421875, 3.179443359375, 3.3463134765625, 3.51318359375, 3.6800537109375, 3.846923828125, 4.0137939453125, 4.1806640625, 4.3475341796875, 4.514404296875, 4.6812744140625, 4.84814453125, 5.0150146484375, 5.181884765625, 5.3487548828125, 5.515625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 13.0, 11.0, 15.0, 20.0, 22.0, 47.0, 49.0, 52.0, 74.0, 102.0, 136.0, 217.0, 233.0, 346.0, 388.0, 414.0, 390.0, 364.0, 279.0, 210.0, 181.0, 124.0, 90.0, 66.0, 57.0, 45.0, 31.0, 20.0, 18.0, 11.0, 9.0, 7.0, 7.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.88226318359375, -4.6903076171875, -4.49835205078125, -4.306396484375, -4.11444091796875, -3.9224853515625, -3.73052978515625, -3.53857421875, -3.34661865234375, -3.1546630859375, -2.96270751953125, -2.770751953125, -2.57879638671875, -2.3868408203125, -2.19488525390625, -2.0029296875, -1.81097412109375, -1.6190185546875, -1.42706298828125, -1.235107421875, -1.04315185546875, -0.8511962890625, -0.65924072265625, -0.46728515625, -0.27532958984375, -0.0833740234375, 0.10858154296875, 0.300537109375, 0.49249267578125, 0.6844482421875, 0.87640380859375, 1.068359375, 1.26031494140625, 1.4522705078125, 1.64422607421875, 1.836181640625, 2.02813720703125, 2.2200927734375, 2.41204833984375, 2.60400390625, 2.79595947265625, 2.9879150390625, 3.17987060546875, 3.371826171875, 3.56378173828125, 3.7557373046875, 3.94769287109375, 4.1396484375, 4.33160400390625, 4.5235595703125, 4.71551513671875, 4.907470703125, 5.09942626953125, 5.2913818359375, 5.48333740234375, 5.67529296875, 5.86724853515625, 6.0592041015625, 6.25115966796875, 6.443115234375, 6.63507080078125, 6.8270263671875, 7.01898193359375, 7.2109375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 8.0, 7.0, 17.0, 15.0, 21.0, 31.0, 51.0, 46.0, 63.0, 95.0, 128.0, 185.0, 274.0, 435.0, 1229.0, 81662.0, 3933964.0, 173199.0, 1588.0, 412.0, 262.0, 153.0, 99.0, 71.0, 50.0, 58.0, 36.0, 29.0, 23.0, 14.0, 11.0, 11.0, 8.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.421875, -30.5625, -29.703125, -28.84375, -27.984375, -27.125, -26.265625, -25.40625, -24.546875, -23.6875, -22.828125, -21.96875, -21.109375, -20.25, -19.390625, -18.53125, -17.671875, -16.8125, -15.953125, -15.09375, -14.234375, -13.375, -12.515625, -11.65625, -10.796875, -9.9375, -9.078125, -8.21875, -7.359375, -6.5, -5.640625, -4.78125, -3.921875, -3.0625, -2.203125, -1.34375, -0.484375, 0.375, 1.234375, 2.09375, 2.953125, 3.8125, 4.671875, 5.53125, 6.390625, 7.25, 8.109375, 8.96875, 9.828125, 10.6875, 11.546875, 12.40625, 13.265625, 14.125, 14.984375, 15.84375, 16.703125, 17.5625, 18.421875, 19.28125, 20.140625, 21.0, 21.859375, 22.71875, 23.578125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 10.0, 26.0, 92.0, 190.0, 248.0, 230.0, 140.0, 53.0, 24.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-107.445068359375, -105.27725982666016, -103.10945129394531, -100.94164276123047, -98.77383422851562, -96.60602569580078, -94.43821716308594, -92.2704086303711, -90.10260009765625, -87.9347915649414, -85.76698303222656, -83.59917449951172, -81.43136596679688, -79.26355743408203, -77.09574890136719, -74.92794036865234, -72.7601318359375, -70.59232330322266, -68.42451477050781, -66.25670623779297, -64.08889770507812, -61.92108917236328, -59.75328063964844, -57.585472106933594, -55.41766357421875, -53.249855041503906, -51.08204650878906, -48.91423797607422, -46.746429443359375, -44.57862091064453, -42.41081237792969, -40.243003845214844, -38.075199127197266, -35.90739059448242, -33.73958206176758, -31.571773529052734, -29.40396499633789, -27.236156463623047, -25.068347930908203, -22.90053939819336, -20.732730865478516, -18.564922332763672, -16.397113800048828, -14.229305267333984, -12.06149673461914, -9.893688201904297, -7.725879669189453, -5.558071136474609, -3.3902626037597656, -1.2224540710449219, 0.9453544616699219, 3.1131629943847656, 5.280971527099609, 7.448780059814453, 9.616588592529297, 11.78439712524414, 13.952205657958984, 16.120014190673828, 18.287822723388672, 20.455631256103516, 22.62343978881836, 24.791248321533203, 26.959056854248047, 29.12686538696289, 31.294673919677734]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 6.0, 10.0, 8.0, 13.0, 13.0, 8.0, 9.0, 21.0, 16.0, 20.0, 35.0, 28.0, 35.0, 29.0, 32.0, 29.0, 31.0, 46.0, 44.0, 33.0, 39.0, 49.0, 32.0, 40.0, 39.0, 32.0, 32.0, 36.0, 27.0, 32.0, 26.0, 19.0, 19.0, 18.0, 15.0, 19.0, 17.0, 5.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.44076156616211, -20.78228187561035, -20.123804092407227, -19.46532440185547, -18.80684471130371, -18.148365020751953, -17.489887237548828, -16.83140754699707, -16.172927856445312, -15.514449119567871, -14.855969429016113, -14.197490692138672, -13.539011001586914, -12.880532264709473, -12.222053527832031, -11.563573837280273, -10.905096054077148, -10.246617317199707, -9.58813762664795, -8.929658889770508, -8.27117919921875, -7.612700462341309, -6.954221725463867, -6.295742511749268, -5.637263298034668, -4.978784084320068, -4.320304870605469, -3.6618261337280273, -3.0033469200134277, -2.344867706298828, -1.6863887310028076, -1.027909755706787, -0.3694324493408203, 0.28904664516448975, 0.9475257396697998, 1.6060048341751099, 2.26448392868042, 2.9229631423950195, 3.58144211769104, 4.2399210929870605, 4.89840030670166, 5.55687952041626, 6.215358734130859, 6.873837471008301, 7.5323166847229, 8.1907958984375, 8.849274635314941, 9.507753372192383, 10.16623306274414, 10.824711799621582, 11.48319149017334, 12.141670227050781, 12.800149917602539, 13.45862865447998, 14.117107391357422, 14.77558708190918, 15.434065818786621, 16.092544555664062, 16.75102424621582, 17.409503936767578, 18.067981719970703, 18.72646141052246, 19.38494110107422, 20.043418884277344, 20.7018985748291]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 10.0, 20.0, 9.0, 12.0, 23.0, 17.0, 22.0, 28.0, 26.0, 23.0, 23.0, 43.0, 42.0, 33.0, 34.0, 21.0, 35.0, 40.0, 33.0, 37.0, 49.0, 28.0, 42.0, 31.0, 27.0, 35.0, 30.0, 29.0, 27.0, 11.0, 18.0, 25.0, 12.0, 13.0, 9.0, 16.0, 4.0, 9.0, 7.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.7265625, -2.635162353515625, -2.54376220703125, -2.452362060546875, -2.3609619140625, -2.269561767578125, -2.17816162109375, -2.086761474609375, -1.995361328125, -1.903961181640625, -1.81256103515625, -1.721160888671875, -1.6297607421875, -1.538360595703125, -1.44696044921875, -1.355560302734375, -1.26416015625, -1.172760009765625, -1.08135986328125, -0.989959716796875, -0.8985595703125, -0.807159423828125, -0.71575927734375, -0.624359130859375, -0.532958984375, -0.441558837890625, -0.35015869140625, -0.258758544921875, -0.1673583984375, -0.075958251953125, 0.01544189453125, 0.106842041015625, 0.1982421875, 0.289642333984375, 0.38104248046875, 0.472442626953125, 0.5638427734375, 0.655242919921875, 0.74664306640625, 0.838043212890625, 0.929443359375, 1.020843505859375, 1.11224365234375, 1.203643798828125, 1.2950439453125, 1.386444091796875, 1.47784423828125, 1.569244384765625, 1.66064453125, 1.752044677734375, 1.84344482421875, 1.934844970703125, 2.0262451171875, 2.117645263671875, 2.20904541015625, 2.300445556640625, 2.391845703125, 2.483245849609375, 2.57464599609375, 2.666046142578125, 2.7574462890625, 2.848846435546875, 2.94024658203125, 3.031646728515625, 3.123046875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 11.0, 7.0, 14.0, 19.0, 35.0, 59.0, 89.0, 158.0, 250.0, 398.0, 594.0, 1057.0, 1647.0, 2499.0, 4002.0, 6150.0, 9534.0, 13778.0, 20714.0, 29910.0, 42583.0, 57096.0, 74062.0, 91467.0, 105568.0, 111283.0, 106288.0, 93672.0, 76754.0, 59497.0, 43744.0, 31333.0, 21739.0, 14588.0, 10027.0, 6521.0, 4171.0, 2756.0, 1626.0, 1080.0, 707.0, 436.0, 250.0, 145.0, 103.0, 49.0, 37.0, 21.0, 14.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5498046875, -0.5329208374023438, -0.5160369873046875, -0.49915313720703125, -0.482269287109375, -0.46538543701171875, -0.4485015869140625, -0.43161773681640625, -0.41473388671875, -0.39785003662109375, -0.3809661865234375, -0.36408233642578125, -0.347198486328125, -0.33031463623046875, -0.3134307861328125, -0.29654693603515625, -0.2796630859375, -0.26277923583984375, -0.2458953857421875, -0.22901153564453125, -0.212127685546875, -0.19524383544921875, -0.1783599853515625, -0.16147613525390625, -0.14459228515625, -0.12770843505859375, -0.1108245849609375, -0.09394073486328125, -0.077056884765625, -0.06017303466796875, -0.0432891845703125, -0.02640533447265625, -0.009521484375, 0.00736236572265625, 0.0242462158203125, 0.04113006591796875, 0.058013916015625, 0.07489776611328125, 0.0917816162109375, 0.10866546630859375, 0.12554931640625, 0.14243316650390625, 0.1593170166015625, 0.17620086669921875, 0.193084716796875, 0.20996856689453125, 0.2268524169921875, 0.24373626708984375, 0.2606201171875, 0.27750396728515625, 0.2943878173828125, 0.31127166748046875, 0.328155517578125, 0.34503936767578125, 0.3619232177734375, 0.37880706787109375, 0.39569091796875, 0.41257476806640625, 0.4294586181640625, 0.44634246826171875, 0.463226318359375, 0.48011016845703125, 0.4969940185546875, 0.5138778686523438, 0.53076171875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 7.0, 11.0, 10.0, 12.0, 16.0, 16.0, 15.0, 32.0, 23.0, 27.0, 21.0, 36.0, 27.0, 44.0, 32.0, 47.0, 40.0, 42.0, 1066.0, 38.0, 37.0, 36.0, 40.0, 37.0, 40.0, 33.0, 35.0, 34.0, 26.0, 17.0, 23.0, 12.0, 16.0, 18.0, 13.0, 10.0, 9.0, 2.0, 4.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.462890625, -2.380401611328125, -2.29791259765625, -2.215423583984375, -2.1329345703125, -2.050445556640625, -1.96795654296875, -1.885467529296875, -1.802978515625, -1.720489501953125, -1.63800048828125, -1.555511474609375, -1.4730224609375, -1.390533447265625, -1.30804443359375, -1.225555419921875, -1.14306640625, -1.060577392578125, -0.97808837890625, -0.895599365234375, -0.8131103515625, -0.730621337890625, -0.64813232421875, -0.565643310546875, -0.483154296875, -0.400665283203125, -0.31817626953125, -0.235687255859375, -0.1531982421875, -0.070709228515625, 0.01177978515625, 0.094268798828125, 0.1767578125, 0.259246826171875, 0.34173583984375, 0.424224853515625, 0.5067138671875, 0.589202880859375, 0.67169189453125, 0.754180908203125, 0.836669921875, 0.919158935546875, 1.00164794921875, 1.084136962890625, 1.1666259765625, 1.249114990234375, 1.33160400390625, 1.414093017578125, 1.49658203125, 1.579071044921875, 1.66156005859375, 1.744049072265625, 1.8265380859375, 1.909027099609375, 1.99151611328125, 2.074005126953125, 2.156494140625, 2.238983154296875, 2.32147216796875, 2.403961181640625, 2.4864501953125, 2.568939208984375, 2.65142822265625, 2.733917236328125, 2.81640625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 18.0, 20.0, 32.0, 55.0, 67.0, 100.0, 146.0, 245.0, 326.0, 501.0, 811.0, 1202.0, 1825.0, 2572.0, 3842.0, 5528.0, 8255.0, 12447.0, 19236.0, 33360.0, 1835268.0, 91788.0, 28486.0, 17139.0, 11008.0, 7511.0, 5018.0, 3446.0, 2287.0, 1513.0, 1018.0, 731.0, 422.0, 293.0, 222.0, 127.0, 71.0, 62.0, 36.0, 28.0, 14.0, 14.0, 9.0, 9.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.400390625, -1.3613433837890625, -1.322296142578125, -1.2832489013671875, -1.24420166015625, -1.2051544189453125, -1.166107177734375, -1.1270599365234375, -1.0880126953125, -1.0489654541015625, -1.009918212890625, -0.9708709716796875, -0.93182373046875, -0.8927764892578125, -0.853729248046875, -0.8146820068359375, -0.775634765625, -0.7365875244140625, -0.697540283203125, -0.6584930419921875, -0.61944580078125, -0.5803985595703125, -0.541351318359375, -0.5023040771484375, -0.4632568359375, -0.4242095947265625, -0.385162353515625, -0.3461151123046875, -0.30706787109375, -0.2680206298828125, -0.228973388671875, -0.1899261474609375, -0.15087890625, -0.1118316650390625, -0.072784423828125, -0.0337371826171875, 0.00531005859375, 0.0443572998046875, 0.083404541015625, 0.1224517822265625, 0.1614990234375, 0.2005462646484375, 0.239593505859375, 0.2786407470703125, 0.31768798828125, 0.3567352294921875, 0.395782470703125, 0.4348297119140625, 0.473876953125, 0.5129241943359375, 0.551971435546875, 0.5910186767578125, 0.63006591796875, 0.6691131591796875, 0.708160400390625, 0.7472076416015625, 0.7862548828125, 0.8253021240234375, 0.864349365234375, 0.9033966064453125, 0.94244384765625, 0.9814910888671875, 1.020538330078125, 1.0595855712890625, 1.0986328125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 5.0, 10.0, 13.0, 12.0, 13.0, 16.0, 16.0, 10.0, 21.0, 22.0, 28.0, 39.0, 46.0, 66.0, 75.0, 91.0, 83.0, 91.0, 63.0, 48.0, 40.0, 27.0, 26.0, 26.0, 15.0, 18.0, 14.0, 12.0, 7.0, 6.0, 7.0, 3.0, 7.0, 2.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0364990234375, -0.03524160385131836, -0.03398418426513672, -0.03272676467895508, -0.03146934509277344, -0.030211925506591797, -0.028954505920410156, -0.027697086334228516, -0.026439666748046875, -0.025182247161865234, -0.023924827575683594, -0.022667407989501953, -0.021409988403320312, -0.020152568817138672, -0.01889514923095703, -0.01763772964477539, -0.01638031005859375, -0.01512289047241211, -0.013865470886230469, -0.012608051300048828, -0.011350631713867188, -0.010093212127685547, -0.008835792541503906, -0.007578372955322266, -0.006320953369140625, -0.005063533782958984, -0.0038061141967773438, -0.002548694610595703, -0.0012912750244140625, -3.3855438232421875e-05, 0.0012235641479492188, 0.0024809837341308594, 0.0037384033203125, 0.004995822906494141, 0.006253242492675781, 0.007510662078857422, 0.008768081665039062, 0.010025501251220703, 0.011282920837402344, 0.012540340423583984, 0.013797760009765625, 0.015055179595947266, 0.016312599182128906, 0.017570018768310547, 0.018827438354492188, 0.020084857940673828, 0.02134227752685547, 0.02259969711303711, 0.02385711669921875, 0.02511453628540039, 0.02637195587158203, 0.027629375457763672, 0.028886795043945312, 0.030144214630126953, 0.031401634216308594, 0.032659053802490234, 0.033916473388671875, 0.035173892974853516, 0.036431312561035156, 0.0376887321472168, 0.03894615173339844, 0.04020357131958008, 0.04146099090576172, 0.04271841049194336, 0.043975830078125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 4.0, 1.0, 6.0, 8.0, 6.0, 10.0, 7.0, 15.0, 15.0, 23.0, 25.0, 29.0, 37.0, 63.0, 101.0, 214.0, 585.0, 15281.0, 1028079.0, 3077.0, 462.0, 149.0, 95.0, 54.0, 39.0, 25.0, 22.0, 14.0, 14.0, 16.0, 19.0, 13.0, 8.0, 6.0, 8.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.998046875, -0.9681320190429688, -0.9382171630859375, -0.9083023071289062, -0.878387451171875, -0.8484725952148438, -0.8185577392578125, -0.7886428833007812, -0.75872802734375, -0.7288131713867188, -0.6988983154296875, -0.6689834594726562, -0.639068603515625, -0.6091537475585938, -0.5792388916015625, -0.5493240356445312, -0.5194091796875, -0.48949432373046875, -0.4595794677734375, -0.42966461181640625, -0.399749755859375, -0.36983489990234375, -0.3399200439453125, -0.31000518798828125, -0.28009033203125, -0.25017547607421875, -0.2202606201171875, -0.19034576416015625, -0.160430908203125, -0.13051605224609375, -0.1006011962890625, -0.07068634033203125, -0.040771484375, -0.01085662841796875, 0.0190582275390625, 0.04897308349609375, 0.078887939453125, 0.10880279541015625, 0.1387176513671875, 0.16863250732421875, 0.19854736328125, 0.22846221923828125, 0.2583770751953125, 0.28829193115234375, 0.318206787109375, 0.34812164306640625, 0.3780364990234375, 0.40795135498046875, 0.4378662109375, 0.46778106689453125, 0.4976959228515625, 0.5276107788085938, 0.557525634765625, 0.5874404907226562, 0.6173553466796875, 0.6472702026367188, 0.67718505859375, 0.7070999145507812, 0.7370147705078125, 0.7669296264648438, 0.796844482421875, 0.8267593383789062, 0.8566741943359375, 0.8865890502929688, 0.91650390625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 15.0, 357.0, 639.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1608104705810547, -2.1222779750823975, -2.083745241165161, -2.045212745666504, -2.0066800117492676, -1.9681475162506104, -1.929614782333374, -1.8910822868347168, -1.85254967212677, -1.8140170574188232, -1.7754844427108765, -1.7369518280029297, -1.698419213294983, -1.6598865985870361, -1.621354103088379, -1.5828214883804321, -1.5442888736724854, -1.5057562589645386, -1.4672236442565918, -1.428691029548645, -1.3901584148406982, -1.351625919342041, -1.3130931854248047, -1.2745606899261475, -1.2360279560089111, -1.1974953413009644, -1.1589627265930176, -1.1204301118850708, -1.081897497177124, -1.0433650016784668, -1.0048322677612305, -0.9662997722625732, -0.9277672171592712, -0.8892346024513245, -0.8507019877433777, -0.8121694326400757, -0.7736368179321289, -0.7351042032241821, -0.6965715885162354, -0.6580389738082886, -0.6195063591003418, -0.580973744392395, -0.5424411296844482, -0.5039085149765015, -0.46537595987319946, -0.4268433451652527, -0.3883107304573059, -0.3497781455516815, -0.31124556064605713, -0.27271294593811035, -0.23418036103248596, -0.19564774632453918, -0.1571151465177536, -0.11858254671096802, -0.08004993200302124, -0.04151734709739685, -0.0029847323894500732, 0.03554787114262581, 0.07408047467470169, 0.11261308193206787, 0.15114568173885345, 0.18967828154563904, 0.22821089625358582, 0.2667434811592102, 0.305276095867157]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 8.0, 11.0, 13.0, 16.0, 14.0, 26.0, 27.0, 23.0, 28.0, 25.0, 51.0, 47.0, 38.0, 43.0, 45.0, 47.0, 41.0, 47.0, 46.0, 51.0, 51.0, 37.0, 44.0, 38.0, 33.0, 24.0, 21.0, 21.0, 15.0, 19.0, 14.0, 6.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1417033076286316, -0.13710077106952667, -0.13249821960926056, -0.12789568305015564, -0.12329313904047012, -0.1186905950307846, -0.11408805847167969, -0.10948551446199417, -0.10488297045230865, -0.10028042644262314, -0.09567788243293762, -0.0910753458738327, -0.08647280186414719, -0.08187025785446167, -0.07726772129535675, -0.07266517728567123, -0.06806263327598572, -0.0634600892663002, -0.058857548981904984, -0.054255008697509766, -0.04965246468782425, -0.04504992067813873, -0.040447380393743515, -0.0358448401093483, -0.03124229609966278, -0.026639753952622414, -0.022037211805582047, -0.01743466965854168, -0.012832127511501312, -0.008229585364460945, -0.003627043217420578, 0.0009754970669746399, 0.005578041076660156, 0.010180583223700523, 0.01478312537074089, 0.019385667517781258, 0.023988209664821625, 0.028590751811861992, 0.03319329395890236, 0.03779583424329758, 0.04239837825298309, 0.04700092226266861, 0.05160346254706383, 0.056206002831459045, 0.06080854684114456, 0.06541109085083008, 0.070013627409935, 0.07461617141962051, 0.07921871542930603, 0.08382125943899155, 0.08842380344867706, 0.09302634000778198, 0.0976288840174675, 0.10223142802715302, 0.10683396458625793, 0.11143650859594345, 0.11603905260562897, 0.12064159661531448, 0.125244140625, 0.12984667718410492, 0.13444921374320984, 0.13905176520347595, 0.14365430176258087, 0.1482568383216858, 0.1528593897819519]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 12.0, 3.0, 6.0, 15.0, 12.0, 14.0, 23.0, 13.0, 22.0, 20.0, 19.0, 28.0, 30.0, 27.0, 30.0, 25.0, 25.0, 39.0, 36.0, 31.0, 45.0, 41.0, 32.0, 24.0, 40.0, 30.0, 37.0, 23.0, 32.0, 23.0, 35.0, 21.0, 21.0, 22.0, 18.0, 16.0, 11.0, 9.0, 11.0, 12.0, 10.0, 12.0, 13.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 4.0, 2.0], "bins": [-2.8359375, -2.751556396484375, -2.66717529296875, -2.582794189453125, -2.4984130859375, -2.414031982421875, -2.32965087890625, -2.245269775390625, -2.160888671875, -2.076507568359375, -1.99212646484375, -1.907745361328125, -1.8233642578125, -1.738983154296875, -1.65460205078125, -1.570220947265625, -1.48583984375, -1.401458740234375, -1.31707763671875, -1.232696533203125, -1.1483154296875, -1.063934326171875, -0.97955322265625, -0.895172119140625, -0.810791015625, -0.726409912109375, -0.64202880859375, -0.557647705078125, -0.4732666015625, -0.388885498046875, -0.30450439453125, -0.220123291015625, -0.1357421875, -0.051361083984375, 0.03302001953125, 0.117401123046875, 0.2017822265625, 0.286163330078125, 0.37054443359375, 0.454925537109375, 0.539306640625, 0.623687744140625, 0.70806884765625, 0.792449951171875, 0.8768310546875, 0.961212158203125, 1.04559326171875, 1.129974365234375, 1.21435546875, 1.298736572265625, 1.38311767578125, 1.467498779296875, 1.5518798828125, 1.636260986328125, 1.72064208984375, 1.805023193359375, 1.889404296875, 1.973785400390625, 2.05816650390625, 2.142547607421875, 2.2269287109375, 2.311309814453125, 2.39569091796875, 2.480072021484375, 2.564453125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 8.0, 13.0, 12.0, 17.0, 25.0, 34.0, 49.0, 103.0, 129.0, 250.0, 428.0, 699.0, 1369.0, 2374.0, 4274.0, 7126.0, 12526.0, 22770.0, 45020.0, 92355.0, 198629.0, 342116.0, 159047.0, 76836.0, 37390.0, 19516.0, 10777.0, 6319.0, 3540.0, 2041.0, 1160.0, 650.0, 381.0, 203.0, 129.0, 72.0, 52.0, 34.0, 22.0, 13.0, 12.0, 8.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-3.49609375, -3.391326904296875, -3.28656005859375, -3.181793212890625, -3.0770263671875, -2.972259521484375, -2.86749267578125, -2.762725830078125, -2.657958984375, -2.553192138671875, -2.44842529296875, -2.343658447265625, -2.2388916015625, -2.134124755859375, -2.02935791015625, -1.924591064453125, -1.81982421875, -1.715057373046875, -1.61029052734375, -1.505523681640625, -1.4007568359375, -1.295989990234375, -1.19122314453125, -1.086456298828125, -0.981689453125, -0.876922607421875, -0.77215576171875, -0.667388916015625, -0.5626220703125, -0.457855224609375, -0.35308837890625, -0.248321533203125, -0.1435546875, -0.038787841796875, 0.06597900390625, 0.170745849609375, 0.2755126953125, 0.380279541015625, 0.48504638671875, 0.589813232421875, 0.694580078125, 0.799346923828125, 0.90411376953125, 1.008880615234375, 1.1136474609375, 1.218414306640625, 1.32318115234375, 1.427947998046875, 1.53271484375, 1.637481689453125, 1.74224853515625, 1.847015380859375, 1.9517822265625, 2.056549072265625, 2.16131591796875, 2.266082763671875, 2.370849609375, 2.475616455078125, 2.58038330078125, 2.685150146484375, 2.7899169921875, 2.894683837890625, 2.99945068359375, 3.104217529296875, 3.208984375]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 5.0, 0.0, 2.0, 6.0, 6.0, 7.0, 11.0, 17.0, 11.0, 19.0, 18.0, 33.0, 27.0, 30.0, 38.0, 38.0, 38.0, 32.0, 50.0, 61.0, 105.0, 213.0, 1468.0, 253.0, 111.0, 77.0, 50.0, 44.0, 32.0, 30.0, 32.0, 30.0, 20.0, 18.0, 19.0, 16.0, 10.0, 14.0, 14.0, 15.0, 3.0, 9.0, 3.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.2109375, -9.8890380859375, -9.567138671875, -9.2452392578125, -8.92333984375, -8.6014404296875, -8.279541015625, -7.9576416015625, -7.6357421875, -7.3138427734375, -6.991943359375, -6.6700439453125, -6.34814453125, -6.0262451171875, -5.704345703125, -5.3824462890625, -5.060546875, -4.7386474609375, -4.416748046875, -4.0948486328125, -3.77294921875, -3.4510498046875, -3.129150390625, -2.8072509765625, -2.4853515625, -2.1634521484375, -1.841552734375, -1.5196533203125, -1.19775390625, -0.8758544921875, -0.553955078125, -0.2320556640625, 0.08984375, 0.4117431640625, 0.733642578125, 1.0555419921875, 1.37744140625, 1.6993408203125, 2.021240234375, 2.3431396484375, 2.6650390625, 2.9869384765625, 3.308837890625, 3.6307373046875, 3.95263671875, 4.2745361328125, 4.596435546875, 4.9183349609375, 5.240234375, 5.5621337890625, 5.884033203125, 6.2059326171875, 6.52783203125, 6.8497314453125, 7.171630859375, 7.4935302734375, 7.8154296875, 8.1373291015625, 8.459228515625, 8.7811279296875, 9.10302734375, 9.4249267578125, 9.746826171875, 10.0687255859375, 10.390625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 7.0, 9.0, 13.0, 9.0, 14.0, 16.0, 12.0, 27.0, 33.0, 32.0, 43.0, 52.0, 75.0, 108.0, 127.0, 158.0, 237.0, 485.0, 1263.0, 14588.0, 1684039.0, 1428197.0, 13337.0, 1240.0, 479.0, 285.0, 199.0, 134.0, 95.0, 73.0, 54.0, 53.0, 50.0, 41.0, 23.0, 21.0, 16.0, 11.0, 10.0, 5.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-22.109375, -21.418212890625, -20.72705078125, -20.035888671875, -19.3447265625, -18.653564453125, -17.96240234375, -17.271240234375, -16.580078125, -15.888916015625, -15.19775390625, -14.506591796875, -13.8154296875, -13.124267578125, -12.43310546875, -11.741943359375, -11.05078125, -10.359619140625, -9.66845703125, -8.977294921875, -8.2861328125, -7.594970703125, -6.90380859375, -6.212646484375, -5.521484375, -4.830322265625, -4.13916015625, -3.447998046875, -2.7568359375, -2.065673828125, -1.37451171875, -0.683349609375, 0.0078125, 0.698974609375, 1.39013671875, 2.081298828125, 2.7724609375, 3.463623046875, 4.15478515625, 4.845947265625, 5.537109375, 6.228271484375, 6.91943359375, 7.610595703125, 8.3017578125, 8.992919921875, 9.68408203125, 10.375244140625, 11.06640625, 11.757568359375, 12.44873046875, 13.139892578125, 13.8310546875, 14.522216796875, 15.21337890625, 15.904541015625, 16.595703125, 17.286865234375, 17.97802734375, 18.669189453125, 19.3603515625, 20.051513671875, 20.74267578125, 21.433837890625, 22.125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 44.0, 269.0, 467.0, 201.0, 33.0], "bins": [-140.93577575683594, -138.6426544189453, -136.34951782226562, -134.056396484375, -131.76327514648438, -129.47015380859375, -127.1770248413086, -124.88389587402344, -122.59077453613281, -120.29765319824219, -118.00452423095703, -115.71139526367188, -113.41827392578125, -111.12515258789062, -108.83202362060547, -106.53889465332031, -104.24577331542969, -101.95265197753906, -99.6595230102539, -97.36639404296875, -95.07327270507812, -92.7801513671875, -90.48702239990234, -88.19389343261719, -85.90077209472656, -83.60765075683594, -81.31452178955078, -79.02139282226562, -76.728271484375, -74.43515014648438, -72.14202117919922, -69.84889221191406, -67.55577087402344, -65.26264953613281, -62.969520568847656, -60.676395416259766, -58.383270263671875, -56.090145111083984, -53.797019958496094, -51.5038948059082, -49.21076965332031, -46.91764450073242, -44.62451934814453, -42.33139419555664, -40.03826904296875, -37.74514389038086, -35.45201873779297, -33.15889358520508, -30.865768432617188, -28.572643280029297, -26.279518127441406, -23.986392974853516, -21.693267822265625, -19.400142669677734, -17.107017517089844, -14.813892364501953, -12.520766258239746, -10.227641105651855, -7.934515953063965, -5.641390800476074, -3.3482656478881836, -1.055140495300293, 1.2379846572875977, 3.5311098098754883, 5.824234962463379]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 6.0, 5.0, 6.0, 8.0, 6.0, 5.0, 11.0, 15.0, 27.0, 16.0, 19.0, 14.0, 19.0, 25.0, 34.0, 29.0, 30.0, 28.0, 34.0, 38.0, 50.0, 47.0, 46.0, 30.0, 36.0, 36.0, 38.0, 39.0, 30.0, 41.0, 23.0, 30.0, 23.0, 17.0, 24.0, 21.0, 15.0, 8.0, 15.0, 14.0, 8.0, 6.0, 6.0, 6.0, 5.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-26.228559494018555, -25.412853240966797, -24.59714698791504, -23.78144073486328, -22.965734481811523, -22.150028228759766, -21.334320068359375, -20.51861572265625, -19.70290756225586, -18.8872013092041, -18.071495056152344, -17.255788803100586, -16.440082550048828, -15.62437629699707, -14.808669090270996, -13.992962837219238, -13.177257537841797, -12.361551284790039, -11.545845031738281, -10.730138778686523, -9.914432525634766, -9.098726272583008, -8.283019065856934, -7.467312812805176, -6.651606559753418, -5.83590030670166, -5.020194053649902, -4.204487323760986, -3.3887810707092285, -2.5730748176574707, -1.7573680877685547, -0.9416618347167969, -0.12595367431640625, 0.6897526979446411, 1.5054590702056885, 2.3211655616760254, 3.136871814727783, 3.952578067779541, 4.768284797668457, 5.583991050720215, 6.399697303771973, 7.2154035568237305, 8.031109809875488, 8.846817016601562, 9.66252326965332, 10.478229522705078, 11.293935775756836, 12.109642028808594, 12.925348281860352, 13.74105453491211, 14.556760787963867, 15.372467041015625, 16.188173294067383, 17.00387954711914, 17.81958770751953, 18.635292053222656, 19.451000213623047, 20.266706466674805, 21.082412719726562, 21.89811897277832, 22.713825225830078, 23.529531478881836, 24.345237731933594, 25.160945892333984, 25.97665023803711]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 6.0, 9.0, 7.0, 6.0, 13.0, 7.0, 14.0, 16.0, 15.0, 19.0, 17.0, 12.0, 20.0, 17.0, 25.0, 44.0, 34.0, 45.0, 42.0, 36.0, 36.0, 28.0, 43.0, 31.0, 32.0, 38.0, 37.0, 35.0, 33.0, 26.0, 26.0, 20.0, 29.0, 19.0, 25.0, 22.0, 20.0, 13.0, 13.0, 10.0, 22.0, 7.0, 13.0, 6.0, 7.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.177734375, -3.081146240234375, -2.98455810546875, -2.887969970703125, -2.7913818359375, -2.694793701171875, -2.59820556640625, -2.501617431640625, -2.405029296875, -2.308441162109375, -2.21185302734375, -2.115264892578125, -2.0186767578125, -1.922088623046875, -1.82550048828125, -1.728912353515625, -1.63232421875, -1.535736083984375, -1.43914794921875, -1.342559814453125, -1.2459716796875, -1.149383544921875, -1.05279541015625, -0.956207275390625, -0.859619140625, -0.763031005859375, -0.66644287109375, -0.569854736328125, -0.4732666015625, -0.376678466796875, -0.28009033203125, -0.183502197265625, -0.0869140625, 0.009674072265625, 0.10626220703125, 0.202850341796875, 0.2994384765625, 0.396026611328125, 0.49261474609375, 0.589202880859375, 0.685791015625, 0.782379150390625, 0.87896728515625, 0.975555419921875, 1.0721435546875, 1.168731689453125, 1.26531982421875, 1.361907958984375, 1.45849609375, 1.555084228515625, 1.65167236328125, 1.748260498046875, 1.8448486328125, 1.941436767578125, 2.03802490234375, 2.134613037109375, 2.231201171875, 2.327789306640625, 2.42437744140625, 2.520965576171875, 2.6175537109375, 2.714141845703125, 2.81072998046875, 2.907318115234375, 3.00390625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 2.0, 3.0, 7.0, 7.0, 13.0, 11.0, 13.0, 20.0, 18.0, 29.0, 27.0, 55.0, 58.0, 91.0, 149.0, 254.0, 642.0, 2232.0, 9631.0, 55602.0, 359723.0, 1675247.0, 1664066.0, 357664.0, 55475.0, 9555.0, 2214.0, 624.0, 290.0, 144.0, 98.0, 62.0, 49.0, 32.0, 30.0, 22.0, 15.0, 19.0, 12.0, 14.0, 9.0, 12.0, 8.0, 3.0, 8.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-6.97265625, -6.7613525390625, -6.550048828125, -6.3387451171875, -6.12744140625, -5.9161376953125, -5.704833984375, -5.4935302734375, -5.2822265625, -5.0709228515625, -4.859619140625, -4.6483154296875, -4.43701171875, -4.2257080078125, -4.014404296875, -3.8031005859375, -3.591796875, -3.3804931640625, -3.169189453125, -2.9578857421875, -2.74658203125, -2.5352783203125, -2.323974609375, -2.1126708984375, -1.9013671875, -1.6900634765625, -1.478759765625, -1.2674560546875, -1.05615234375, -0.8448486328125, -0.633544921875, -0.4222412109375, -0.2109375, 0.0003662109375, 0.211669921875, 0.4229736328125, 0.63427734375, 0.8455810546875, 1.056884765625, 1.2681884765625, 1.4794921875, 1.6907958984375, 1.902099609375, 2.1134033203125, 2.32470703125, 2.5360107421875, 2.747314453125, 2.9586181640625, 3.169921875, 3.3812255859375, 3.592529296875, 3.8038330078125, 4.01513671875, 4.2264404296875, 4.437744140625, 4.6490478515625, 4.8603515625, 5.0716552734375, 5.282958984375, 5.4942626953125, 5.70556640625, 5.9168701171875, 6.128173828125, 6.3394775390625, 6.55078125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 6.0, 7.0, 4.0, 6.0, 15.0, 13.0, 18.0, 23.0, 33.0, 31.0, 40.0, 57.0, 72.0, 75.0, 96.0, 122.0, 152.0, 158.0, 168.0, 233.0, 266.0, 290.0, 292.0, 305.0, 242.0, 238.0, 209.0, 183.0, 122.0, 124.0, 83.0, 74.0, 60.0, 56.0, 38.0, 30.0, 26.0, 28.0, 15.0, 13.0, 11.0, 10.0, 3.0, 8.0, 2.0, 4.0, 3.0, 7.0, 1.0, 4.0, 2.0], "bins": [-4.9609375, -4.820556640625, -4.68017578125, -4.539794921875, -4.3994140625, -4.259033203125, -4.11865234375, -3.978271484375, -3.837890625, -3.697509765625, -3.55712890625, -3.416748046875, -3.2763671875, -3.135986328125, -2.99560546875, -2.855224609375, -2.71484375, -2.574462890625, -2.43408203125, -2.293701171875, -2.1533203125, -2.012939453125, -1.87255859375, -1.732177734375, -1.591796875, -1.451416015625, -1.31103515625, -1.170654296875, -1.0302734375, -0.889892578125, -0.74951171875, -0.609130859375, -0.46875, -0.328369140625, -0.18798828125, -0.047607421875, 0.0927734375, 0.233154296875, 0.37353515625, 0.513916015625, 0.654296875, 0.794677734375, 0.93505859375, 1.075439453125, 1.2158203125, 1.356201171875, 1.49658203125, 1.636962890625, 1.77734375, 1.917724609375, 2.05810546875, 2.198486328125, 2.3388671875, 2.479248046875, 2.61962890625, 2.760009765625, 2.900390625, 3.040771484375, 3.18115234375, 3.321533203125, 3.4619140625, 3.602294921875, 3.74267578125, 3.883056640625, 4.0234375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 5.0, 3.0, 5.0, 10.0, 7.0, 11.0, 16.0, 15.0, 33.0, 22.0, 38.0, 47.0, 58.0, 63.0, 98.0, 113.0, 159.0, 213.0, 265.0, 416.0, 1517.0, 49584.0, 2715799.0, 1402766.0, 20614.0, 1024.0, 320.0, 213.0, 174.0, 143.0, 98.0, 98.0, 74.0, 52.0, 35.0, 42.0, 31.0, 26.0, 15.0, 10.0, 10.0, 11.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.671875, -18.025634765625, -17.37939453125, -16.733154296875, -16.0869140625, -15.440673828125, -14.79443359375, -14.148193359375, -13.501953125, -12.855712890625, -12.20947265625, -11.563232421875, -10.9169921875, -10.270751953125, -9.62451171875, -8.978271484375, -8.33203125, -7.685791015625, -7.03955078125, -6.393310546875, -5.7470703125, -5.100830078125, -4.45458984375, -3.808349609375, -3.162109375, -2.515869140625, -1.86962890625, -1.223388671875, -0.5771484375, 0.069091796875, 0.71533203125, 1.361572265625, 2.0078125, 2.654052734375, 3.30029296875, 3.946533203125, 4.5927734375, 5.239013671875, 5.88525390625, 6.531494140625, 7.177734375, 7.823974609375, 8.47021484375, 9.116455078125, 9.7626953125, 10.408935546875, 11.05517578125, 11.701416015625, 12.34765625, 12.993896484375, 13.64013671875, 14.286376953125, 14.9326171875, 15.578857421875, 16.22509765625, 16.871337890625, 17.517578125, 18.163818359375, 18.81005859375, 19.456298828125, 20.1025390625, 20.748779296875, 21.39501953125, 22.041259765625, 22.6875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 13.0, 23.0, 32.0, 89.0, 129.0, 150.0, 162.0, 162.0, 104.0, 76.0, 44.0, 13.0, 8.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.65401840209961, -55.25193786621094, -53.849853515625, -52.44777297973633, -51.045692443847656, -49.64360809326172, -48.24152755737305, -46.839447021484375, -45.43736267089844, -44.035282135009766, -42.63319778442383, -41.231117248535156, -39.82903289794922, -38.42695236206055, -37.024871826171875, -35.62278747558594, -34.220706939697266, -32.818626403808594, -31.416542053222656, -30.014461517333984, -28.61237907409668, -27.210296630859375, -25.808216094970703, -24.4061336517334, -23.004051208496094, -21.60196876525879, -20.199886322021484, -18.797805786132812, -17.395723342895508, -15.993640899658203, -14.591559410095215, -13.189477920532227, -11.787391662597656, -10.385309219360352, -8.983227729797363, -7.581145763397217, -6.17906379699707, -4.776981830596924, -3.3748998641967773, -1.972818374633789, -0.5707359313964844, 0.8313460350036621, 2.2334280014038086, 3.635509967803955, 5.037591934204102, 6.439673900604248, 7.8417558670043945, 9.243837356567383, 10.645919799804688, 12.048002243041992, 13.45008373260498, 14.852165222167969, 16.254247665405273, 17.656330108642578, 19.05841064453125, 20.460493087768555, 21.86257553100586, 23.264657974243164, 24.66674041748047, 26.06882095336914, 27.470903396606445, 28.87298583984375, 30.275066375732422, 31.677148818969727, 33.07923126220703]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 5.0, 7.0, 2.0, 8.0, 13.0, 10.0, 17.0, 12.0, 16.0, 22.0, 24.0, 23.0, 33.0, 37.0, 28.0, 42.0, 35.0, 33.0, 39.0, 50.0, 34.0, 33.0, 44.0, 42.0, 43.0, 31.0, 40.0, 27.0, 28.0, 35.0, 29.0, 18.0, 20.0, 16.0, 12.0, 24.0, 12.0, 9.0, 9.0, 14.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.699249267578125, -19.066652297973633, -18.434053421020508, -17.801456451416016, -17.168859481811523, -16.5362606048584, -15.903663635253906, -15.271065711975098, -14.638467788696289, -14.00586986541748, -13.373272895812988, -12.74067497253418, -12.108077049255371, -11.475479125976562, -10.84288215637207, -10.210284233093262, -9.57768726348877, -8.945089340209961, -8.312492370605469, -7.67989444732666, -7.047296524047852, -6.414699077606201, -5.782101631164551, -5.149503707885742, -4.516906261444092, -3.8843085765838623, -3.251710891723633, -2.6191134452819824, -1.986515760421753, -1.3539180755615234, -0.721320629119873, -0.08872270584106445, 0.5438747406005859, 1.1764724254608154, 1.8090699911117554, 2.4416675567626953, 3.074265241622925, 3.7068629264831543, 4.339460372924805, 4.972058296203613, 5.604655742645264, 6.237253189086914, 6.869851112365723, 7.502448558807373, 8.135046005249023, 8.767643928527832, 9.40024185180664, 10.032838821411133, 10.665436744689941, 11.29803466796875, 11.930631637573242, 12.56322956085205, 13.19582748413086, 13.828424453735352, 14.46102237701416, 15.093620300292969, 15.726217269897461, 16.358814239501953, 16.991413116455078, 17.62401008605957, 18.256607055664062, 18.889205932617188, 19.52180290222168, 20.154399871826172, 20.786998748779297]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 2.0, 6.0, 6.0, 9.0, 10.0, 4.0, 16.0, 9.0, 16.0, 24.0, 18.0, 23.0, 16.0, 32.0, 27.0, 48.0, 29.0, 45.0, 46.0, 34.0, 35.0, 44.0, 39.0, 47.0, 45.0, 41.0, 37.0, 36.0, 21.0, 27.0, 29.0, 26.0, 23.0, 18.0, 24.0, 11.0, 16.0, 17.0, 9.0, 8.0, 10.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.2598876953125, -3.160400390625, -3.0609130859375, -2.96142578125, -2.8619384765625, -2.762451171875, -2.6629638671875, -2.5634765625, -2.4639892578125, -2.364501953125, -2.2650146484375, -2.16552734375, -2.0660400390625, -1.966552734375, -1.8670654296875, -1.767578125, -1.6680908203125, -1.568603515625, -1.4691162109375, -1.36962890625, -1.2701416015625, -1.170654296875, -1.0711669921875, -0.9716796875, -0.8721923828125, -0.772705078125, -0.6732177734375, -0.57373046875, -0.4742431640625, -0.374755859375, -0.2752685546875, -0.17578125, -0.0762939453125, 0.023193359375, 0.1226806640625, 0.22216796875, 0.3216552734375, 0.421142578125, 0.5206298828125, 0.6201171875, 0.7196044921875, 0.819091796875, 0.9185791015625, 1.01806640625, 1.1175537109375, 1.217041015625, 1.3165283203125, 1.416015625, 1.5155029296875, 1.614990234375, 1.7144775390625, 1.81396484375, 1.9134521484375, 2.012939453125, 2.1124267578125, 2.2119140625, 2.3114013671875, 2.410888671875, 2.5103759765625, 2.60986328125, 2.7093505859375, 2.808837890625, 2.9083251953125, 3.0078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 8.0, 6.0, 17.0, 39.0, 33.0, 67.0, 116.0, 155.0, 272.0, 407.0, 656.0, 994.0, 1444.0, 2274.0, 3234.0, 4807.0, 6949.0, 10185.0, 14491.0, 20083.0, 28088.0, 37170.0, 48698.0, 61097.0, 74854.0, 86169.0, 95003.0, 97653.0, 91571.0, 81165.0, 68572.0, 55606.0, 43383.0, 32790.0, 24133.0, 17407.0, 12339.0, 8616.0, 5961.0, 4053.0, 2768.0, 1789.0, 1182.0, 804.0, 536.0, 334.0, 213.0, 143.0, 93.0, 56.0, 45.0, 17.0, 13.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420654296875, -0.4062843322753906, -0.39191436767578125, -0.3775444030761719, -0.3631744384765625, -0.3488044738769531, -0.33443450927734375, -0.3200645446777344, -0.305694580078125, -0.2913246154785156, -0.27695465087890625, -0.2625846862792969, -0.2482147216796875, -0.23384475708007812, -0.21947479248046875, -0.20510482788085938, -0.19073486328125, -0.17636489868164062, -0.16199493408203125, -0.14762496948242188, -0.1332550048828125, -0.11888504028320312, -0.10451507568359375, -0.09014511108398438, -0.075775146484375, -0.061405181884765625, -0.04703521728515625, -0.032665252685546875, -0.0182952880859375, -0.003925323486328125, 0.01044464111328125, 0.024814605712890625, 0.0391845703125, 0.053554534912109375, 0.06792449951171875, 0.08229446411132812, 0.0966644287109375, 0.11103439331054688, 0.12540435791015625, 0.13977432250976562, 0.154144287109375, 0.16851425170898438, 0.18288421630859375, 0.19725418090820312, 0.2116241455078125, 0.22599411010742188, 0.24036407470703125, 0.2547340393066406, 0.26910400390625, 0.2834739685058594, 0.29784393310546875, 0.3122138977050781, 0.3265838623046875, 0.3409538269042969, 0.35532379150390625, 0.3696937561035156, 0.384063720703125, 0.3984336853027344, 0.41280364990234375, 0.4271736145019531, 0.4415435791015625, 0.4559135437011719, 0.47028350830078125, 0.4846534729003906, 0.4990234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 7.0, 9.0, 11.0, 8.0, 9.0, 11.0, 12.0, 18.0, 28.0, 26.0, 27.0, 22.0, 21.0, 33.0, 39.0, 41.0, 35.0, 42.0, 44.0, 36.0, 1054.0, 28.0, 35.0, 40.0, 28.0, 49.0, 27.0, 27.0, 29.0, 21.0, 30.0, 23.0, 19.0, 22.0, 15.0, 15.0, 8.0, 6.0, 17.0, 8.0, 8.0, 4.0, 9.0, 2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.369140625, -2.2940673828125, -2.218994140625, -2.1439208984375, -2.06884765625, -1.9937744140625, -1.918701171875, -1.8436279296875, -1.7685546875, -1.6934814453125, -1.618408203125, -1.5433349609375, -1.46826171875, -1.3931884765625, -1.318115234375, -1.2430419921875, -1.16796875, -1.0928955078125, -1.017822265625, -0.9427490234375, -0.86767578125, -0.7926025390625, -0.717529296875, -0.6424560546875, -0.5673828125, -0.4923095703125, -0.417236328125, -0.3421630859375, -0.26708984375, -0.1920166015625, -0.116943359375, -0.0418701171875, 0.033203125, 0.1082763671875, 0.183349609375, 0.2584228515625, 0.33349609375, 0.4085693359375, 0.483642578125, 0.5587158203125, 0.6337890625, 0.7088623046875, 0.783935546875, 0.8590087890625, 0.93408203125, 1.0091552734375, 1.084228515625, 1.1593017578125, 1.234375, 1.3094482421875, 1.384521484375, 1.4595947265625, 1.53466796875, 1.6097412109375, 1.684814453125, 1.7598876953125, 1.8349609375, 1.9100341796875, 1.985107421875, 2.0601806640625, 2.13525390625, 2.2103271484375, 2.285400390625, 2.3604736328125, 2.435546875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 5.0, 6.0, 18.0, 26.0, 43.0, 55.0, 84.0, 112.0, 156.0, 246.0, 320.0, 481.0, 695.0, 1059.0, 1520.0, 2234.0, 3290.0, 4698.0, 6654.0, 9619.0, 14328.0, 22295.0, 38576.0, 1871235.0, 45710.0, 24285.0, 15644.0, 10440.0, 7134.0, 4972.0, 3507.0, 2432.0, 1639.0, 1152.0, 738.0, 515.0, 410.0, 240.0, 162.0, 117.0, 86.0, 53.0, 43.0, 28.0, 22.0, 14.0, 7.0, 12.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.1787109375, -1.1436309814453125, -1.108551025390625, -1.0734710693359375, -1.03839111328125, -1.0033111572265625, -0.968231201171875, -0.9331512451171875, -0.8980712890625, -0.8629913330078125, -0.827911376953125, -0.7928314208984375, -0.75775146484375, -0.7226715087890625, -0.687591552734375, -0.6525115966796875, -0.617431640625, -0.5823516845703125, -0.547271728515625, -0.5121917724609375, -0.47711181640625, -0.4420318603515625, -0.406951904296875, -0.3718719482421875, -0.3367919921875, -0.3017120361328125, -0.266632080078125, -0.2315521240234375, -0.19647216796875, -0.1613922119140625, -0.126312255859375, -0.0912322998046875, -0.05615234375, -0.0210723876953125, 0.014007568359375, 0.0490875244140625, 0.08416748046875, 0.1192474365234375, 0.154327392578125, 0.1894073486328125, 0.2244873046875, 0.2595672607421875, 0.294647216796875, 0.3297271728515625, 0.36480712890625, 0.3998870849609375, 0.434967041015625, 0.4700469970703125, 0.505126953125, 0.5402069091796875, 0.575286865234375, 0.6103668212890625, 0.64544677734375, 0.6805267333984375, 0.715606689453125, 0.7506866455078125, 0.7857666015625, 0.8208465576171875, 0.855926513671875, 0.8910064697265625, 0.92608642578125, 0.9611663818359375, 0.996246337890625, 1.0313262939453125, 1.06640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 3.0, 5.0, 7.0, 7.0, 6.0, 4.0, 12.0, 10.0, 20.0, 15.0, 19.0, 23.0, 30.0, 28.0, 39.0, 58.0, 65.0, 78.0, 80.0, 63.0, 77.0, 55.0, 43.0, 39.0, 24.0, 31.0, 21.0, 24.0, 12.0, 10.0, 12.0, 11.0, 5.0, 8.0, 8.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.035247802734375, -0.034137725830078125, -0.03302764892578125, -0.031917572021484375, -0.0308074951171875, -0.029697418212890625, -0.02858734130859375, -0.027477264404296875, -0.0263671875, -0.025257110595703125, -0.02414703369140625, -0.023036956787109375, -0.0219268798828125, -0.020816802978515625, -0.01970672607421875, -0.018596649169921875, -0.017486572265625, -0.016376495361328125, -0.01526641845703125, -0.014156341552734375, -0.0130462646484375, -0.011936187744140625, -0.01082611083984375, -0.009716033935546875, -0.00860595703125, -0.007495880126953125, -0.00638580322265625, -0.005275726318359375, -0.0041656494140625, -0.003055572509765625, -0.00194549560546875, -0.000835418701171875, 0.000274658203125, 0.001384735107421875, 0.00249481201171875, 0.003604888916015625, 0.0047149658203125, 0.005825042724609375, 0.00693511962890625, 0.008045196533203125, 0.0091552734375, 0.010265350341796875, 0.01137542724609375, 0.012485504150390625, 0.0135955810546875, 0.014705657958984375, 0.01581573486328125, 0.016925811767578125, 0.018035888671875, 0.019145965576171875, 0.02025604248046875, 0.021366119384765625, 0.0224761962890625, 0.023586273193359375, 0.02469635009765625, 0.025806427001953125, 0.02691650390625, 0.028026580810546875, 0.02913665771484375, 0.030246734619140625, 0.0313568115234375, 0.032466888427734375, 0.03357696533203125, 0.034687042236328125, 0.035797119140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 1.0, 7.0, 10.0, 10.0, 6.0, 7.0, 12.0, 9.0, 13.0, 10.0, 20.0, 26.0, 42.0, 56.0, 78.0, 138.0, 371.0, 1214.0, 895902.0, 148973.0, 940.0, 272.0, 144.0, 62.0, 37.0, 34.0, 25.0, 20.0, 19.0, 16.0, 9.0, 8.0, 5.0, 4.0, 8.0, 7.0, 3.0, 8.0, 5.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.8263626098632812, -0.7987213134765625, -0.7710800170898438, -0.743438720703125, -0.7157974243164062, -0.6881561279296875, -0.6605148315429688, -0.63287353515625, -0.6052322387695312, -0.5775909423828125, -0.5499496459960938, -0.522308349609375, -0.49466705322265625, -0.4670257568359375, -0.43938446044921875, -0.4117431640625, -0.38410186767578125, -0.3564605712890625, -0.32881927490234375, -0.301177978515625, -0.27353668212890625, -0.2458953857421875, -0.21825408935546875, -0.19061279296875, -0.16297149658203125, -0.1353302001953125, -0.10768890380859375, -0.080047607421875, -0.05240631103515625, -0.0247650146484375, 0.00287628173828125, 0.030517578125, 0.05815887451171875, 0.0858001708984375, 0.11344146728515625, 0.141082763671875, 0.16872406005859375, 0.1963653564453125, 0.22400665283203125, 0.25164794921875, 0.27928924560546875, 0.3069305419921875, 0.33457183837890625, 0.362213134765625, 0.38985443115234375, 0.4174957275390625, 0.44513702392578125, 0.4727783203125, 0.5004196166992188, 0.5280609130859375, 0.5557022094726562, 0.583343505859375, 0.6109848022460938, 0.6386260986328125, 0.6662673950195312, 0.69390869140625, 0.7215499877929688, 0.7491912841796875, 0.7768325805664062, 0.804473876953125, 0.8321151733398438, 0.8597564697265625, 0.8873977661132812, 0.9150390625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 28.0, 828.0, 150.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7356514930725098, -1.7045257091522217, -1.6734000444412231, -1.642274260520935, -1.611148476600647, -1.5800228118896484, -1.5488970279693604, -1.5177712440490723, -1.4866454601287842, -1.455519676208496, -1.4243940114974976, -1.3932682275772095, -1.3621424436569214, -1.3310167789459229, -1.2998909950256348, -1.2687652111053467, -1.2376395463943481, -1.20651376247406, -1.1753880977630615, -1.1442623138427734, -1.1131365299224854, -1.0820107460021973, -1.0508850812911987, -1.0197592973709106, -0.9886335730552673, -0.957507848739624, -0.9263820648193359, -0.8952563405036926, -0.8641306161880493, -0.8330048322677612, -0.8018791079521179, -0.7707533836364746, -0.7396275997161865, -0.7085018754005432, -0.6773760914802551, -0.6462503671646118, -0.6151245832443237, -0.5839988589286804, -0.5528731346130371, -0.521747350692749, -0.4906216561794281, -0.4594959020614624, -0.4283701777458191, -0.3972444236278534, -0.3661186695098877, -0.334992915391922, -0.3038671612739563, -0.272741436958313, -0.2416156828403473, -0.2104899287223816, -0.1793641895055771, -0.14823845028877258, -0.11711269617080688, -0.08598694205284119, -0.05486120283603668, -0.023735463619232178, 0.0073902904987335205, 0.03851603716611862, 0.06964178383350372, 0.10076753050088882, 0.13189327716827393, 0.16301903128623962, 0.19414477050304413, 0.22527050971984863, 0.25639626383781433]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 6.0, 7.0, 8.0, 11.0, 16.0, 17.0, 23.0, 23.0, 22.0, 41.0, 40.0, 29.0, 43.0, 43.0, 43.0, 56.0, 61.0, 48.0, 46.0, 63.0, 45.0, 44.0, 42.0, 46.0, 31.0, 20.0, 24.0, 26.0, 15.0, 13.0, 11.0, 7.0, 13.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14281076192855835, -0.13836973905563354, -0.13392873108386993, -0.12948770821094513, -0.12504668533802032, -0.12060566991567612, -0.11616465449333191, -0.1117236316204071, -0.1072826161980629, -0.10284160077571869, -0.09840057790279388, -0.09395956248044968, -0.08951854705810547, -0.08507752418518066, -0.08063650876283646, -0.07619549334049225, -0.07175447046756744, -0.06731345504522324, -0.06287243217229843, -0.058431416749954224, -0.05399039760231972, -0.04954937845468521, -0.045108363032341, -0.0406673438847065, -0.03622632473707199, -0.031785305589437485, -0.027344288304448128, -0.02290327101945877, -0.018462251871824265, -0.014021232724189758, -0.009580215439200401, -0.005139198154211044, -0.0006981790065765381, 0.0037428392097353935, 0.008183857426047325, 0.012624875642359257, 0.01706589385867119, 0.021506913006305695, 0.02594793029129505, 0.03038894757628441, 0.034829966723918915, 0.03927098587155342, 0.04371200501918793, 0.048153020441532135, 0.05259403958916664, 0.05703505873680115, 0.061476074159145355, 0.06591708958148956, 0.07035811245441437, 0.07479912787675858, 0.07924015074968338, 0.08368116617202759, 0.08812218904495239, 0.0925632044672966, 0.09700421988964081, 0.10144524276256561, 0.10588625818490982, 0.11032727360725403, 0.11476829648017883, 0.11920931190252304, 0.12365032732486725, 0.12809135019779205, 0.13253237307071686, 0.13697338104248047, 0.14141440391540527]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 8.0, 9.0, 5.0, 10.0, 14.0, 11.0, 14.0, 18.0, 20.0, 19.0, 19.0, 24.0, 27.0, 34.0, 34.0, 42.0, 37.0, 41.0, 39.0, 39.0, 45.0, 48.0, 44.0, 38.0, 42.0, 34.0, 41.0, 26.0, 23.0, 21.0, 23.0, 17.0, 18.0, 26.0, 20.0, 14.0, 14.0, 7.0, 11.0, 5.0, 2.0, 7.0, 3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.086029052734375, -2.98846435546875, -2.890899658203125, -2.7933349609375, -2.695770263671875, -2.59820556640625, -2.500640869140625, -2.403076171875, -2.305511474609375, -2.20794677734375, -2.110382080078125, -2.0128173828125, -1.915252685546875, -1.81768798828125, -1.720123291015625, -1.62255859375, -1.524993896484375, -1.42742919921875, -1.329864501953125, -1.2322998046875, -1.134735107421875, -1.03717041015625, -0.939605712890625, -0.842041015625, -0.744476318359375, -0.64691162109375, -0.549346923828125, -0.4517822265625, -0.354217529296875, -0.25665283203125, -0.159088134765625, -0.0615234375, 0.036041259765625, 0.13360595703125, 0.231170654296875, 0.3287353515625, 0.426300048828125, 0.52386474609375, 0.621429443359375, 0.718994140625, 0.816558837890625, 0.91412353515625, 1.011688232421875, 1.1092529296875, 1.206817626953125, 1.30438232421875, 1.401947021484375, 1.49951171875, 1.597076416015625, 1.69464111328125, 1.792205810546875, 1.8897705078125, 1.987335205078125, 2.08489990234375, 2.182464599609375, 2.280029296875, 2.377593994140625, 2.47515869140625, 2.572723388671875, 2.6702880859375, 2.767852783203125, 2.86541748046875, 2.962982177734375, 3.060546875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 15.0, 12.0, 16.0, 24.0, 29.0, 32.0, 71.0, 98.0, 173.0, 224.0, 405.0, 682.0, 1081.0, 1840.0, 3209.0, 5308.0, 9085.0, 15368.0, 26962.0, 47261.0, 87637.0, 166098.0, 270552.0, 187318.0, 99850.0, 53110.0, 29834.0, 17397.0, 9911.0, 6024.0, 3503.0, 2160.0, 1263.0, 732.0, 461.0, 260.0, 167.0, 93.0, 78.0, 67.0, 38.0, 28.0, 21.0, 11.0, 10.0, 8.0, 9.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0], "bins": [-2.921875, -2.832244873046875, -2.74261474609375, -2.652984619140625, -2.5633544921875, -2.473724365234375, -2.38409423828125, -2.294464111328125, -2.204833984375, -2.115203857421875, -2.02557373046875, -1.935943603515625, -1.8463134765625, -1.756683349609375, -1.66705322265625, -1.577423095703125, -1.48779296875, -1.398162841796875, -1.30853271484375, -1.218902587890625, -1.1292724609375, -1.039642333984375, -0.95001220703125, -0.860382080078125, -0.770751953125, -0.681121826171875, -0.59149169921875, -0.501861572265625, -0.4122314453125, -0.322601318359375, -0.23297119140625, -0.143341064453125, -0.0537109375, 0.035919189453125, 0.12554931640625, 0.215179443359375, 0.3048095703125, 0.394439697265625, 0.48406982421875, 0.573699951171875, 0.663330078125, 0.752960205078125, 0.84259033203125, 0.932220458984375, 1.0218505859375, 1.111480712890625, 1.20111083984375, 1.290740966796875, 1.38037109375, 1.470001220703125, 1.55963134765625, 1.649261474609375, 1.7388916015625, 1.828521728515625, 1.91815185546875, 2.007781982421875, 2.097412109375, 2.187042236328125, 2.27667236328125, 2.366302490234375, 2.4559326171875, 2.545562744140625, 2.63519287109375, 2.724822998046875, 2.814453125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 10.0, 5.0, 11.0, 10.0, 9.0, 16.0, 18.0, 9.0, 28.0, 21.0, 25.0, 41.0, 36.0, 36.0, 40.0, 28.0, 54.0, 89.0, 158.0, 349.0, 1352.0, 181.0, 90.0, 65.0, 50.0, 47.0, 27.0, 28.0, 26.0, 29.0, 22.0, 21.0, 12.0, 31.0, 12.0, 8.0, 12.0, 7.0, 2.0, 7.0, 9.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.40625, -9.129638671875, -8.85302734375, -8.576416015625, -8.2998046875, -8.023193359375, -7.74658203125, -7.469970703125, -7.193359375, -6.916748046875, -6.64013671875, -6.363525390625, -6.0869140625, -5.810302734375, -5.53369140625, -5.257080078125, -4.98046875, -4.703857421875, -4.42724609375, -4.150634765625, -3.8740234375, -3.597412109375, -3.32080078125, -3.044189453125, -2.767578125, -2.490966796875, -2.21435546875, -1.937744140625, -1.6611328125, -1.384521484375, -1.10791015625, -0.831298828125, -0.5546875, -0.278076171875, -0.00146484375, 0.275146484375, 0.5517578125, 0.828369140625, 1.10498046875, 1.381591796875, 1.658203125, 1.934814453125, 2.21142578125, 2.488037109375, 2.7646484375, 3.041259765625, 3.31787109375, 3.594482421875, 3.87109375, 4.147705078125, 4.42431640625, 4.700927734375, 4.9775390625, 5.254150390625, 5.53076171875, 5.807373046875, 6.083984375, 6.360595703125, 6.63720703125, 6.913818359375, 7.1904296875, 7.467041015625, 7.74365234375, 8.020263671875, 8.296875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 7.0, 2.0, 2.0, 5.0, 8.0, 14.0, 15.0, 15.0, 21.0, 22.0, 31.0, 30.0, 56.0, 86.0, 113.0, 135.0, 214.0, 324.0, 739.0, 3558.0, 260927.0, 2860430.0, 16311.0, 1272.0, 435.0, 279.0, 183.0, 119.0, 80.0, 56.0, 54.0, 40.0, 31.0, 27.0, 19.0, 17.0, 7.0, 8.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.8125, -24.95849609375, -24.1044921875, -23.25048828125, -22.396484375, -21.54248046875, -20.6884765625, -19.83447265625, -18.98046875, -18.12646484375, -17.2724609375, -16.41845703125, -15.564453125, -14.71044921875, -13.8564453125, -13.00244140625, -12.1484375, -11.29443359375, -10.4404296875, -9.58642578125, -8.732421875, -7.87841796875, -7.0244140625, -6.17041015625, -5.31640625, -4.46240234375, -3.6083984375, -2.75439453125, -1.900390625, -1.04638671875, -0.1923828125, 0.66162109375, 1.515625, 2.36962890625, 3.2236328125, 4.07763671875, 4.931640625, 5.78564453125, 6.6396484375, 7.49365234375, 8.34765625, 9.20166015625, 10.0556640625, 10.90966796875, 11.763671875, 12.61767578125, 13.4716796875, 14.32568359375, 15.1796875, 16.03369140625, 16.8876953125, 17.74169921875, 18.595703125, 19.44970703125, 20.3037109375, 21.15771484375, 22.01171875, 22.86572265625, 23.7197265625, 24.57373046875, 25.427734375, 26.28173828125, 27.1357421875, 27.98974609375, 28.84375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 36.0, 904.0, 76.0], "bins": [-360.9143371582031, -355.144775390625, -349.3752136230469, -343.60565185546875, -337.8360595703125, -332.0664978027344, -326.29693603515625, -320.5273742675781, -314.7578125, -308.9882507324219, -303.21868896484375, -297.4490966796875, -291.6795349121094, -285.90997314453125, -280.1404113769531, -274.370849609375, -268.60125732421875, -262.8316955566406, -257.0621337890625, -251.2925567626953, -245.5229949951172, -239.75341796875, -233.98385620117188, -228.21429443359375, -222.44473266601562, -216.6751708984375, -210.9055938720703, -205.1360321044922, -199.36647033691406, -193.59689331054688, -187.82733154296875, -182.05776977539062, -176.28819274902344, -170.5186309814453, -164.74905395507812, -158.9794921875, -153.20993041992188, -147.4403533935547, -141.67079162597656, -135.90121459960938, -130.13165283203125, -124.3620834350586, -118.59252166748047, -112.82295227050781, -107.05338287353516, -101.2838134765625, -95.51425170898438, -89.74468231201172, -83.97512817382812, -78.20555877685547, -72.43599700927734, -66.66642761230469, -60.89685821533203, -55.12729263305664, -49.35772705078125, -43.588157653808594, -37.81858825683594, -32.04902267456055, -26.27945327758789, -20.5098876953125, -14.740320205688477, -8.970752716064453, -3.2011871337890625, 2.5683822631835938, 8.337947845458984]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 5.0, 4.0, 4.0, 7.0, 6.0, 10.0, 7.0, 6.0, 10.0, 13.0, 9.0, 17.0, 20.0, 28.0, 25.0, 18.0, 41.0, 34.0, 33.0, 34.0, 35.0, 40.0, 34.0, 35.0, 39.0, 33.0, 40.0, 41.0, 38.0, 30.0, 44.0, 20.0, 36.0, 27.0, 26.0, 17.0, 21.0, 17.0, 10.0, 17.0, 14.0, 11.0, 12.0, 10.0, 7.0, 6.0, 9.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.156494140625, -21.372087478637695, -20.587678909301758, -19.803272247314453, -19.018863677978516, -18.23445701599121, -17.450050354003906, -16.66564178466797, -15.881234169006348, -15.096826553344727, -14.312418937683105, -13.528011322021484, -12.74360466003418, -11.959196090698242, -11.174789428710938, -10.390381813049316, -9.605974197387695, -8.821566581726074, -8.037158966064453, -7.25275182723999, -6.468344211578369, -5.683936595916748, -4.899529457092285, -4.115121841430664, -3.330714225769043, -2.546306610107422, -1.7618992328643799, -0.9774918556213379, -0.1930842399597168, 0.5913233757019043, 1.3757305145263672, 2.1601381301879883, 2.9445457458496094, 3.7289533615112305, 4.513360977172852, 5.2977681159973145, 6.0821757316589355, 6.866583347320557, 7.6509904861450195, 8.43539810180664, 9.219805717468262, 10.004213333129883, 10.788620948791504, 11.573028564453125, 12.35743522644043, 13.141843795776367, 13.926250457763672, 14.710658073425293, 15.495065689086914, 16.27947235107422, 17.063880920410156, 17.84828758239746, 18.6326961517334, 19.417102813720703, 20.20151138305664, 20.985918045043945, 21.77032470703125, 22.554731369018555, 23.339139938354492, 24.123546600341797, 24.907955169677734, 25.69236183166504, 26.476768493652344, 27.26117706298828, 28.04558563232422]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 6.0, 5.0, 7.0, 14.0, 17.0, 14.0, 23.0, 26.0, 21.0, 29.0, 38.0, 40.0, 36.0, 28.0, 44.0, 55.0, 40.0, 51.0, 39.0, 51.0, 44.0, 49.0, 52.0, 42.0, 34.0, 25.0, 31.0, 16.0, 19.0, 15.0, 17.0, 12.0, 12.0, 11.0, 10.0, 9.0, 1.0, 3.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2421875, -4.120819091796875, -3.99945068359375, -3.878082275390625, -3.7567138671875, -3.635345458984375, -3.51397705078125, -3.392608642578125, -3.271240234375, -3.149871826171875, -3.02850341796875, -2.907135009765625, -2.7857666015625, -2.664398193359375, -2.54302978515625, -2.421661376953125, -2.30029296875, -2.178924560546875, -2.05755615234375, -1.936187744140625, -1.8148193359375, -1.693450927734375, -1.57208251953125, -1.450714111328125, -1.329345703125, -1.207977294921875, -1.08660888671875, -0.965240478515625, -0.8438720703125, -0.722503662109375, -0.60113525390625, -0.479766845703125, -0.3583984375, -0.237030029296875, -0.11566162109375, 0.005706787109375, 0.1270751953125, 0.248443603515625, 0.36981201171875, 0.491180419921875, 0.612548828125, 0.733917236328125, 0.85528564453125, 0.976654052734375, 1.0980224609375, 1.219390869140625, 1.34075927734375, 1.462127685546875, 1.58349609375, 1.704864501953125, 1.82623291015625, 1.947601318359375, 2.0689697265625, 2.190338134765625, 2.31170654296875, 2.433074951171875, 2.554443359375, 2.675811767578125, 2.79718017578125, 2.918548583984375, 3.0399169921875, 3.161285400390625, 3.28265380859375, 3.404022216796875, 3.525390625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 2.0, 13.0, 15.0, 12.0, 14.0, 15.0, 21.0, 21.0, 28.0, 41.0, 64.0, 71.0, 163.0, 525.0, 2018.0, 13744.0, 123715.0, 1144607.0, 2421046.0, 437160.0, 43972.0, 5434.0, 912.0, 267.0, 115.0, 62.0, 36.0, 33.0, 33.0, 16.0, 16.0, 8.0, 11.0, 17.0, 7.0, 7.0, 10.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.6796875, -8.4188232421875, -8.157958984375, -7.8970947265625, -7.63623046875, -7.3753662109375, -7.114501953125, -6.8536376953125, -6.5927734375, -6.3319091796875, -6.071044921875, -5.8101806640625, -5.54931640625, -5.2884521484375, -5.027587890625, -4.7667236328125, -4.505859375, -4.2449951171875, -3.984130859375, -3.7232666015625, -3.46240234375, -3.2015380859375, -2.940673828125, -2.6798095703125, -2.4189453125, -2.1580810546875, -1.897216796875, -1.6363525390625, -1.37548828125, -1.1146240234375, -0.853759765625, -0.5928955078125, -0.33203125, -0.0711669921875, 0.189697265625, 0.4505615234375, 0.71142578125, 0.9722900390625, 1.233154296875, 1.4940185546875, 1.7548828125, 2.0157470703125, 2.276611328125, 2.5374755859375, 2.79833984375, 3.0592041015625, 3.320068359375, 3.5809326171875, 3.841796875, 4.1026611328125, 4.363525390625, 4.6243896484375, 4.88525390625, 5.1461181640625, 5.406982421875, 5.6678466796875, 5.9287109375, 6.1895751953125, 6.450439453125, 6.7113037109375, 6.97216796875, 7.2330322265625, 7.493896484375, 7.7547607421875, 8.015625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 9.0, 17.0, 23.0, 40.0, 50.0, 60.0, 87.0, 132.0, 176.0, 235.0, 320.0, 385.0, 493.0, 448.0, 425.0, 339.0, 260.0, 157.0, 120.0, 78.0, 62.0, 41.0, 30.0, 21.0, 20.0, 7.0, 6.0, 12.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0859375, -6.87139892578125, -6.6568603515625, -6.44232177734375, -6.227783203125, -6.01324462890625, -5.7987060546875, -5.58416748046875, -5.36962890625, -5.15509033203125, -4.9405517578125, -4.72601318359375, -4.511474609375, -4.29693603515625, -4.0823974609375, -3.86785888671875, -3.6533203125, -3.43878173828125, -3.2242431640625, -3.00970458984375, -2.795166015625, -2.58062744140625, -2.3660888671875, -2.15155029296875, -1.93701171875, -1.72247314453125, -1.5079345703125, -1.29339599609375, -1.078857421875, -0.86431884765625, -0.6497802734375, -0.43524169921875, -0.220703125, -0.00616455078125, 0.2083740234375, 0.42291259765625, 0.637451171875, 0.85198974609375, 1.0665283203125, 1.28106689453125, 1.49560546875, 1.71014404296875, 1.9246826171875, 2.13922119140625, 2.353759765625, 2.56829833984375, 2.7828369140625, 2.99737548828125, 3.2119140625, 3.42645263671875, 3.6409912109375, 3.85552978515625, 4.070068359375, 4.28460693359375, 4.4991455078125, 4.71368408203125, 4.92822265625, 5.14276123046875, 5.3572998046875, 5.57183837890625, 5.786376953125, 6.00091552734375, 6.2154541015625, 6.42999267578125, 6.64453125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 1.0, 2.0, 5.0, 11.0, 9.0, 14.0, 23.0, 26.0, 31.0, 57.0, 63.0, 116.0, 149.0, 239.0, 421.0, 1117.0, 130571.0, 4034451.0, 25167.0, 740.0, 350.0, 219.0, 144.0, 106.0, 72.0, 59.0, 38.0, 27.0, 22.0, 11.0, 8.0, 9.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.65625, -34.52001953125, -33.3837890625, -32.24755859375, -31.111328125, -29.97509765625, -28.8388671875, -27.70263671875, -26.56640625, -25.43017578125, -24.2939453125, -23.15771484375, -22.021484375, -20.88525390625, -19.7490234375, -18.61279296875, -17.4765625, -16.34033203125, -15.2041015625, -14.06787109375, -12.931640625, -11.79541015625, -10.6591796875, -9.52294921875, -8.38671875, -7.25048828125, -6.1142578125, -4.97802734375, -3.841796875, -2.70556640625, -1.5693359375, -0.43310546875, 0.703125, 1.83935546875, 2.9755859375, 4.11181640625, 5.248046875, 6.38427734375, 7.5205078125, 8.65673828125, 9.79296875, 10.92919921875, 12.0654296875, 13.20166015625, 14.337890625, 15.47412109375, 16.6103515625, 17.74658203125, 18.8828125, 20.01904296875, 21.1552734375, 22.29150390625, 23.427734375, 24.56396484375, 25.7001953125, 26.83642578125, 27.97265625, 29.10888671875, 30.2451171875, 31.38134765625, 32.517578125, 33.65380859375, 34.7900390625, 35.92626953125, 37.0625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 10.0, 40.0, 91.0, 170.0, 222.0, 251.0, 118.0, 74.0, 32.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.64910888671875, -69.758544921875, -67.86798095703125, -65.9774169921875, -64.08685302734375, -62.1962890625, -60.305721282958984, -58.415157318115234, -56.524593353271484, -54.634029388427734, -52.743465423583984, -50.852901458740234, -48.96233367919922, -47.07176971435547, -45.18120574951172, -43.29064178466797, -41.40007781982422, -39.50951385498047, -37.61894989013672, -35.72838592529297, -33.83782196044922, -31.947256088256836, -30.056690216064453, -28.166126251220703, -26.275562286376953, -24.384998321533203, -22.494434356689453, -20.60386848449707, -18.71330451965332, -16.82274055480957, -14.932175636291504, -13.041610717773438, -11.151050567626953, -9.260486602783203, -7.369921684265137, -5.4793572425842285, -3.5887928009033203, -1.6982288360595703, 0.1923360824584961, 2.0829010009765625, 3.9734649658203125, 5.864029407501221, 7.754593849182129, 9.645158767700195, 11.535722732543945, 13.426286697387695, 15.316851615905762, 17.207416534423828, 19.097980499267578, 20.988544464111328, 22.879108428955078, 24.76967430114746, 26.66023826599121, 28.55080223083496, 30.441368103027344, 32.331932067871094, 34.222496032714844, 36.113059997558594, 38.003623962402344, 39.894187927246094, 41.784751892089844, 43.675315856933594, 45.56588363647461, 47.45644760131836, 49.34701156616211]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 5.0, 9.0, 9.0, 7.0, 14.0, 21.0, 21.0, 14.0, 24.0, 29.0, 39.0, 34.0, 40.0, 48.0, 42.0, 45.0, 41.0, 49.0, 48.0, 48.0, 37.0, 48.0, 42.0, 32.0, 26.0, 29.0, 25.0, 36.0, 18.0, 23.0, 8.0, 17.0, 10.0, 14.0, 8.0, 11.0, 8.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.294269561767578, -19.610004425048828, -18.925737380981445, -18.241470336914062, -17.557205200195312, -16.872940063476562, -16.18867301940918, -15.504406929016113, -14.820140838623047, -14.13587474822998, -13.451608657836914, -12.767342567443848, -12.083076477050781, -11.398810386657715, -10.714544296264648, -10.030278205871582, -9.346012115478516, -8.66174602508545, -7.977479934692383, -7.293213844299316, -6.60894775390625, -5.924681663513184, -5.240415573120117, -4.556149482727051, -3.8718833923339844, -3.187617301940918, -2.5033512115478516, -1.8190851211547852, -1.1348190307617188, -0.45055294036865234, 0.23371315002441406, 0.9179792404174805, 1.6022453308105469, 2.2865114212036133, 2.9707775115966797, 3.655043601989746, 4.3393096923828125, 5.023575782775879, 5.707841873168945, 6.392107963562012, 7.076374053955078, 7.7606401443481445, 8.444906234741211, 9.129172325134277, 9.813438415527344, 10.49770450592041, 11.181970596313477, 11.866236686706543, 12.55050277709961, 13.234768867492676, 13.919034957885742, 14.603301048278809, 15.287567138671875, 15.971833229064941, 16.656099319458008, 17.34036636352539, 18.02463150024414, 18.70889663696289, 19.393163681030273, 20.077430725097656, 20.761695861816406, 21.445960998535156, 22.13022804260254, 22.814495086669922, 23.498760223388672]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 6.0, 6.0, 8.0, 9.0, 12.0, 14.0, 14.0, 20.0, 24.0, 24.0, 24.0, 29.0, 34.0, 39.0, 23.0, 37.0, 39.0, 40.0, 47.0, 39.0, 27.0, 25.0, 36.0, 37.0, 27.0, 43.0, 48.0, 21.0, 29.0, 22.0, 30.0, 24.0, 25.0, 15.0, 13.0, 17.0, 6.0, 10.0, 2.0, 6.0, 13.0, 4.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.041015625, -2.941436767578125, -2.84185791015625, -2.742279052734375, -2.6427001953125, -2.543121337890625, -2.44354248046875, -2.343963623046875, -2.244384765625, -2.144805908203125, -2.04522705078125, -1.945648193359375, -1.8460693359375, -1.746490478515625, -1.64691162109375, -1.547332763671875, -1.44775390625, -1.348175048828125, -1.24859619140625, -1.149017333984375, -1.0494384765625, -0.949859619140625, -0.85028076171875, -0.750701904296875, -0.651123046875, -0.551544189453125, -0.45196533203125, -0.352386474609375, -0.2528076171875, -0.153228759765625, -0.05364990234375, 0.045928955078125, 0.1455078125, 0.245086669921875, 0.34466552734375, 0.444244384765625, 0.5438232421875, 0.643402099609375, 0.74298095703125, 0.842559814453125, 0.942138671875, 1.041717529296875, 1.14129638671875, 1.240875244140625, 1.3404541015625, 1.440032958984375, 1.53961181640625, 1.639190673828125, 1.73876953125, 1.838348388671875, 1.93792724609375, 2.037506103515625, 2.1370849609375, 2.236663818359375, 2.33624267578125, 2.435821533203125, 2.535400390625, 2.634979248046875, 2.73455810546875, 2.834136962890625, 2.9337158203125, 3.033294677734375, 3.13287353515625, 3.232452392578125, 3.33203125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 12.0, 9.0, 30.0, 45.0, 57.0, 106.0, 115.0, 208.0, 342.0, 531.0, 872.0, 1332.0, 2044.0, 3173.0, 4874.0, 7481.0, 11474.0, 17117.0, 24714.0, 34827.0, 48987.0, 65442.0, 83921.0, 101194.0, 113178.0, 113584.0, 101474.0, 84208.0, 66474.0, 49607.0, 35773.0, 24773.0, 17330.0, 11607.0, 7692.0, 4944.0, 3267.0, 2026.0, 1375.0, 871.0, 504.0, 353.0, 221.0, 143.0, 100.0, 59.0, 23.0, 22.0, 16.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.53759765625, -0.5213165283203125, -0.505035400390625, -0.4887542724609375, -0.47247314453125, -0.4561920166015625, -0.439910888671875, -0.4236297607421875, -0.4073486328125, -0.3910675048828125, -0.374786376953125, -0.3585052490234375, -0.34222412109375, -0.3259429931640625, -0.309661865234375, -0.2933807373046875, -0.277099609375, -0.2608184814453125, -0.244537353515625, -0.2282562255859375, -0.21197509765625, -0.1956939697265625, -0.179412841796875, -0.1631317138671875, -0.1468505859375, -0.1305694580078125, -0.114288330078125, -0.0980072021484375, -0.08172607421875, -0.0654449462890625, -0.049163818359375, -0.0328826904296875, -0.0166015625, -0.0003204345703125, 0.015960693359375, 0.0322418212890625, 0.04852294921875, 0.0648040771484375, 0.081085205078125, 0.0973663330078125, 0.1136474609375, 0.1299285888671875, 0.146209716796875, 0.1624908447265625, 0.17877197265625, 0.1950531005859375, 0.211334228515625, 0.2276153564453125, 0.243896484375, 0.2601776123046875, 0.276458740234375, 0.2927398681640625, 0.30902099609375, 0.3253021240234375, 0.341583251953125, 0.3578643798828125, 0.3741455078125, 0.3904266357421875, 0.406707763671875, 0.4229888916015625, 0.43927001953125, 0.4555511474609375, 0.471832275390625, 0.4881134033203125, 0.50439453125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 7.0, 13.0, 15.0, 20.0, 21.0, 22.0, 26.0, 15.0, 20.0, 30.0, 24.0, 32.0, 26.0, 36.0, 35.0, 28.0, 38.0, 49.0, 1064.0, 33.0, 36.0, 39.0, 48.0, 33.0, 31.0, 38.0, 30.0, 21.0, 27.0, 16.0, 23.0, 24.0, 14.0, 12.0, 18.0, 6.0, 10.0, 10.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.525390625, -2.444244384765625, -2.36309814453125, -2.281951904296875, -2.2008056640625, -2.119659423828125, -2.03851318359375, -1.957366943359375, -1.876220703125, -1.795074462890625, -1.71392822265625, -1.632781982421875, -1.5516357421875, -1.470489501953125, -1.38934326171875, -1.308197021484375, -1.22705078125, -1.145904541015625, -1.06475830078125, -0.983612060546875, -0.9024658203125, -0.821319580078125, -0.74017333984375, -0.659027099609375, -0.577880859375, -0.496734619140625, -0.41558837890625, -0.334442138671875, -0.2532958984375, -0.172149658203125, -0.09100341796875, -0.009857177734375, 0.0712890625, 0.152435302734375, 0.23358154296875, 0.314727783203125, 0.3958740234375, 0.477020263671875, 0.55816650390625, 0.639312744140625, 0.720458984375, 0.801605224609375, 0.88275146484375, 0.963897705078125, 1.0450439453125, 1.126190185546875, 1.20733642578125, 1.288482666015625, 1.36962890625, 1.450775146484375, 1.53192138671875, 1.613067626953125, 1.6942138671875, 1.775360107421875, 1.85650634765625, 1.937652587890625, 2.018798828125, 2.099945068359375, 2.18109130859375, 2.262237548828125, 2.3433837890625, 2.424530029296875, 2.50567626953125, 2.586822509765625, 2.66796875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 7.0, 11.0, 16.0, 18.0, 34.0, 38.0, 63.0, 99.0, 138.0, 209.0, 350.0, 483.0, 730.0, 1103.0, 1650.0, 2318.0, 3402.0, 4838.0, 7294.0, 10791.0, 16030.0, 25641.0, 51407.0, 1870957.0, 36125.0, 21204.0, 13538.0, 9169.0, 6347.0, 4205.0, 2935.0, 1974.0, 1358.0, 864.0, 605.0, 414.0, 261.0, 170.0, 116.0, 70.0, 42.0, 32.0, 36.0, 8.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.138671875, -1.102294921875, -1.06591796875, -1.029541015625, -0.9931640625, -0.956787109375, -0.92041015625, -0.884033203125, -0.84765625, -0.811279296875, -0.77490234375, -0.738525390625, -0.7021484375, -0.665771484375, -0.62939453125, -0.593017578125, -0.556640625, -0.520263671875, -0.48388671875, -0.447509765625, -0.4111328125, -0.374755859375, -0.33837890625, -0.302001953125, -0.265625, -0.229248046875, -0.19287109375, -0.156494140625, -0.1201171875, -0.083740234375, -0.04736328125, -0.010986328125, 0.025390625, 0.061767578125, 0.09814453125, 0.134521484375, 0.1708984375, 0.207275390625, 0.24365234375, 0.280029296875, 0.31640625, 0.352783203125, 0.38916015625, 0.425537109375, 0.4619140625, 0.498291015625, 0.53466796875, 0.571044921875, 0.607421875, 0.643798828125, 0.68017578125, 0.716552734375, 0.7529296875, 0.789306640625, 0.82568359375, 0.862060546875, 0.8984375, 0.934814453125, 0.97119140625, 1.007568359375, 1.0439453125, 1.080322265625, 1.11669921875, 1.153076171875, 1.189453125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 10.0, 9.0, 8.0, 9.0, 8.0, 28.0, 22.0, 40.0, 44.0, 58.0, 70.0, 91.0, 103.0, 106.0, 80.0, 73.0, 52.0, 40.0, 48.0, 24.0, 22.0, 11.0, 7.0, 9.0, 3.0, 4.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031341552734375, -0.03029346466064453, -0.029245376586914062, -0.028197288513183594, -0.027149200439453125, -0.026101112365722656, -0.025053024291992188, -0.02400493621826172, -0.02295684814453125, -0.02190876007080078, -0.020860671997070312, -0.019812583923339844, -0.018764495849609375, -0.017716407775878906, -0.016668319702148438, -0.015620231628417969, -0.0145721435546875, -0.013524055480957031, -0.012475967407226562, -0.011427879333496094, -0.010379791259765625, -0.009331703186035156, -0.008283615112304688, -0.007235527038574219, -0.00618743896484375, -0.005139350891113281, -0.0040912628173828125, -0.0030431747436523438, -0.001995086669921875, -0.0009469985961914062, 0.0001010894775390625, 0.0011491775512695312, 0.002197265625, 0.0032453536987304688, 0.0042934417724609375, 0.005341529846191406, 0.006389617919921875, 0.007437705993652344, 0.008485794067382812, 0.009533882141113281, 0.01058197021484375, 0.011630058288574219, 0.012678146362304688, 0.013726234436035156, 0.014774322509765625, 0.015822410583496094, 0.016870498657226562, 0.01791858673095703, 0.0189666748046875, 0.02001476287841797, 0.021062850952148438, 0.022110939025878906, 0.023159027099609375, 0.024207115173339844, 0.025255203247070312, 0.02630329132080078, 0.02735137939453125, 0.02839946746826172, 0.029447555541992188, 0.030495643615722656, 0.031543731689453125, 0.032591819763183594, 0.03363990783691406, 0.03468799591064453, 0.035736083984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 5.0, 5.0, 6.0, 17.0, 23.0, 31.0, 49.0, 75.0, 112.0, 214.0, 621.0, 56377.0, 989041.0, 1247.0, 325.0, 145.0, 88.0, 51.0, 30.0, 25.0, 12.0, 8.0, 12.0, 10.0, 1.0, 4.0, 1.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.87060546875, -0.8451385498046875, -0.819671630859375, -0.7942047119140625, -0.76873779296875, -0.7432708740234375, -0.717803955078125, -0.6923370361328125, -0.6668701171875, -0.6414031982421875, -0.615936279296875, -0.5904693603515625, -0.56500244140625, -0.5395355224609375, -0.514068603515625, -0.4886016845703125, -0.463134765625, -0.4376678466796875, -0.412200927734375, -0.3867340087890625, -0.36126708984375, -0.3358001708984375, -0.310333251953125, -0.2848663330078125, -0.2593994140625, -0.2339324951171875, -0.208465576171875, -0.1829986572265625, -0.15753173828125, -0.1320648193359375, -0.106597900390625, -0.0811309814453125, -0.0556640625, -0.0301971435546875, -0.004730224609375, 0.0207366943359375, 0.04620361328125, 0.0716705322265625, 0.097137451171875, 0.1226043701171875, 0.1480712890625, 0.1735382080078125, 0.199005126953125, 0.2244720458984375, 0.24993896484375, 0.2754058837890625, 0.300872802734375, 0.3263397216796875, 0.351806640625, 0.3772735595703125, 0.402740478515625, 0.4282073974609375, 0.45367431640625, 0.4791412353515625, 0.504608154296875, 0.5300750732421875, 0.5555419921875, 0.5810089111328125, 0.606475830078125, 0.6319427490234375, 0.65740966796875, 0.6828765869140625, 0.708343505859375, 0.7338104248046875, 0.75927734375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 30.0, 171.0, 691.0, 101.0, 14.0], "bins": [-0.637591540813446, -0.6272244453430176, -0.6168573498725891, -0.6064902544021606, -0.5961231589317322, -0.5857560634613037, -0.5753889679908752, -0.5650218725204468, -0.5546547770500183, -0.5442876815795898, -0.5339205861091614, -0.5235534906387329, -0.5131863951683044, -0.502819299697876, -0.4924522042274475, -0.48208510875701904, -0.4717179834842682, -0.4613508880138397, -0.45098379254341125, -0.4406166970729828, -0.4302496016025543, -0.41988250613212585, -0.4095154106616974, -0.39914828538894653, -0.38878118991851807, -0.3784140944480896, -0.36804699897766113, -0.35767990350723267, -0.3473128080368042, -0.33694571256637573, -0.32657861709594727, -0.3162115216255188, -0.30584439635276794, -0.2954773008823395, -0.285110205411911, -0.27474310994148254, -0.2643760144710541, -0.2540089190006256, -0.24364180862903595, -0.23327471315860748, -0.22290761768817902, -0.21254052221775055, -0.20217342674732208, -0.19180633127689362, -0.18143922090530396, -0.1710721254348755, -0.16070502996444702, -0.15033793449401855, -0.1399708390235901, -0.12960374355316162, -0.11923664808273315, -0.10886954516172409, -0.09850244969129562, -0.08813535422086716, -0.0777682512998581, -0.06740115582942963, -0.05703406408429146, -0.04666696488857269, -0.036299869418144226, -0.02593277208507061, -0.015565674751996994, -0.005198579281568527, 0.005168519914150238, 0.015535619109869003, 0.02590271458029747]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 6.0, 9.0, 10.0, 7.0, 19.0, 18.0, 23.0, 30.0, 25.0, 30.0, 33.0, 35.0, 29.0, 54.0, 43.0, 37.0, 51.0, 41.0, 47.0, 46.0, 50.0, 56.0, 32.0, 55.0, 31.0, 30.0, 21.0, 24.0, 16.0, 20.0, 10.0, 13.0, 11.0, 6.0, 9.0, 4.0, 7.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03299599885940552, -0.03204496204853058, -0.03109392151236534, -0.030142882838845253, -0.029191844165325165, -0.028240805491805077, -0.02728976681828499, -0.0263387281447649, -0.025387689471244812, -0.024436650797724724, -0.023485612124204636, -0.022534573450684547, -0.02158353477716446, -0.02063249610364437, -0.019681457430124283, -0.018730418756604195, -0.017779380083084106, -0.016828341409564018, -0.01587730273604393, -0.014926264062523842, -0.013975225389003754, -0.013024186715483665, -0.012073148041963577, -0.011122109368443489, -0.010171070694923401, -0.009220032021403313, -0.008268993347883224, -0.007317954674363136, -0.006366916000843048, -0.00541587732732296, -0.004464838653802872, -0.0035137999802827835, -0.0025627613067626953, -0.0016117226332426071, -0.0006606839597225189, 0.0002903547137975693, 0.0012413933873176575, 0.0021924320608377457, 0.003143470734357834, 0.004094509407877922, 0.00504554808139801, 0.0059965867549180984, 0.006947625428438187, 0.007898664101958275, 0.008849702775478363, 0.009800741448998451, 0.01075178012251854, 0.011702818796038628, 0.012653857469558716, 0.013604896143078804, 0.014555934816598892, 0.01550697349011898, 0.01645801216363907, 0.017409050837159157, 0.018360089510679245, 0.019311128184199333, 0.02026216685771942, 0.02121320553123951, 0.022164244204759598, 0.023115282878279686, 0.024066321551799774, 0.025017360225319862, 0.02596839889883995, 0.02691943757236004, 0.027870476245880127]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 3.0, 9.0, 10.0, 14.0, 15.0, 14.0, 18.0, 21.0, 25.0, 26.0, 30.0, 45.0, 25.0, 32.0, 43.0, 30.0, 41.0, 55.0, 42.0, 38.0, 38.0, 40.0, 45.0, 37.0, 35.0, 25.0, 34.0, 27.0, 28.0, 22.0, 19.0, 17.0, 17.0, 15.0, 8.0, 11.0, 7.0, 9.0, 4.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.125, -3.017059326171875, -2.90911865234375, -2.801177978515625, -2.6932373046875, -2.585296630859375, -2.47735595703125, -2.369415283203125, -2.261474609375, -2.153533935546875, -2.04559326171875, -1.937652587890625, -1.8297119140625, -1.721771240234375, -1.61383056640625, -1.505889892578125, -1.39794921875, -1.290008544921875, -1.18206787109375, -1.074127197265625, -0.9661865234375, -0.858245849609375, -0.75030517578125, -0.642364501953125, -0.534423828125, -0.426483154296875, -0.31854248046875, -0.210601806640625, -0.1026611328125, 0.005279541015625, 0.11322021484375, 0.221160888671875, 0.3291015625, 0.437042236328125, 0.54498291015625, 0.652923583984375, 0.7608642578125, 0.868804931640625, 0.97674560546875, 1.084686279296875, 1.192626953125, 1.300567626953125, 1.40850830078125, 1.516448974609375, 1.6243896484375, 1.732330322265625, 1.84027099609375, 1.948211669921875, 2.05615234375, 2.164093017578125, 2.27203369140625, 2.379974365234375, 2.4879150390625, 2.595855712890625, 2.70379638671875, 2.811737060546875, 2.919677734375, 3.027618408203125, 3.13555908203125, 3.243499755859375, 3.3514404296875, 3.459381103515625, 3.56732177734375, 3.675262451171875, 3.783203125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 6.0, 3.0, 3.0, 2.0, 8.0, 8.0, 10.0, 11.0, 21.0, 20.0, 26.0, 38.0, 39.0, 53.0, 83.0, 121.0, 201.0, 370.0, 846.0, 1846.0, 4238.0, 10201.0, 23707.0, 55425.0, 155160.0, 460484.0, 213571.0, 70211.0, 29363.0, 12535.0, 5328.0, 2405.0, 1064.0, 437.0, 243.0, 143.0, 71.0, 57.0, 40.0, 23.0, 28.0, 16.0, 27.0, 13.0, 10.0, 7.0, 12.0, 8.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0], "bins": [-4.46875, -4.331787109375, -4.19482421875, -4.057861328125, -3.9208984375, -3.783935546875, -3.64697265625, -3.510009765625, -3.373046875, -3.236083984375, -3.09912109375, -2.962158203125, -2.8251953125, -2.688232421875, -2.55126953125, -2.414306640625, -2.27734375, -2.140380859375, -2.00341796875, -1.866455078125, -1.7294921875, -1.592529296875, -1.45556640625, -1.318603515625, -1.181640625, -1.044677734375, -0.90771484375, -0.770751953125, -0.6337890625, -0.496826171875, -0.35986328125, -0.222900390625, -0.0859375, 0.051025390625, 0.18798828125, 0.324951171875, 0.4619140625, 0.598876953125, 0.73583984375, 0.872802734375, 1.009765625, 1.146728515625, 1.28369140625, 1.420654296875, 1.5576171875, 1.694580078125, 1.83154296875, 1.968505859375, 2.10546875, 2.242431640625, 2.37939453125, 2.516357421875, 2.6533203125, 2.790283203125, 2.92724609375, 3.064208984375, 3.201171875, 3.338134765625, 3.47509765625, 3.612060546875, 3.7490234375, 3.885986328125, 4.02294921875, 4.159912109375, 4.296875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 1.0, 6.0, 12.0, 9.0, 12.0, 12.0, 21.0, 20.0, 23.0, 27.0, 25.0, 39.0, 37.0, 39.0, 35.0, 51.0, 75.0, 103.0, 243.0, 1525.0, 200.0, 98.0, 56.0, 47.0, 50.0, 33.0, 40.0, 28.0, 35.0, 23.0, 25.0, 16.0, 15.0, 15.0, 8.0, 9.0, 10.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.1015625, -11.7396240234375, -11.377685546875, -11.0157470703125, -10.65380859375, -10.2918701171875, -9.929931640625, -9.5679931640625, -9.2060546875, -8.8441162109375, -8.482177734375, -8.1202392578125, -7.75830078125, -7.3963623046875, -7.034423828125, -6.6724853515625, -6.310546875, -5.9486083984375, -5.586669921875, -5.2247314453125, -4.86279296875, -4.5008544921875, -4.138916015625, -3.7769775390625, -3.4150390625, -3.0531005859375, -2.691162109375, -2.3292236328125, -1.96728515625, -1.6053466796875, -1.243408203125, -0.8814697265625, -0.51953125, -0.1575927734375, 0.204345703125, 0.5662841796875, 0.92822265625, 1.2901611328125, 1.652099609375, 2.0140380859375, 2.3759765625, 2.7379150390625, 3.099853515625, 3.4617919921875, 3.82373046875, 4.1856689453125, 4.547607421875, 4.9095458984375, 5.271484375, 5.6334228515625, 5.995361328125, 6.3572998046875, 6.71923828125, 7.0811767578125, 7.443115234375, 7.8050537109375, 8.1669921875, 8.5289306640625, 8.890869140625, 9.2528076171875, 9.61474609375, 9.9766845703125, 10.338623046875, 10.7005615234375, 11.0625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 12.0, 17.0, 14.0, 12.0, 16.0, 30.0, 25.0, 30.0, 41.0, 45.0, 79.0, 103.0, 124.0, 214.0, 383.0, 1123.0, 9311.0, 2336273.0, 789980.0, 5849.0, 908.0, 391.0, 186.0, 114.0, 77.0, 87.0, 46.0, 47.0, 38.0, 28.0, 26.0, 14.0, 13.0, 12.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.078125, -25.206787109375, -24.33544921875, -23.464111328125, -22.5927734375, -21.721435546875, -20.85009765625, -19.978759765625, -19.107421875, -18.236083984375, -17.36474609375, -16.493408203125, -15.6220703125, -14.750732421875, -13.87939453125, -13.008056640625, -12.13671875, -11.265380859375, -10.39404296875, -9.522705078125, -8.6513671875, -7.780029296875, -6.90869140625, -6.037353515625, -5.166015625, -4.294677734375, -3.42333984375, -2.552001953125, -1.6806640625, -0.809326171875, 0.06201171875, 0.933349609375, 1.8046875, 2.676025390625, 3.54736328125, 4.418701171875, 5.2900390625, 6.161376953125, 7.03271484375, 7.904052734375, 8.775390625, 9.646728515625, 10.51806640625, 11.389404296875, 12.2607421875, 13.132080078125, 14.00341796875, 14.874755859375, 15.74609375, 16.617431640625, 17.48876953125, 18.360107421875, 19.2314453125, 20.102783203125, 20.97412109375, 21.845458984375, 22.716796875, 23.588134765625, 24.45947265625, 25.330810546875, 26.2021484375, 27.073486328125, 27.94482421875, 28.816162109375, 29.6875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 18.0, 66.0, 149.0, 220.0, 203.0, 182.0, 102.0, 53.0, 14.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.131953239440918, -9.146566390991211, -8.16118049621582, -7.175793647766113, -6.190407752990723, -5.205020904541016, -4.219634532928467, -3.234248161315918, -2.248861789703369, -1.2634754180908203, -0.27808892726898193, 0.7072975635528564, 1.6926839351654053, 2.678070545196533, 3.663456916809082, 4.648843288421631, 5.63422966003418, 6.6196160316467285, 7.605002403259277, 8.590389251708984, 9.575775146484375, 10.561161994934082, 11.546548843383789, 12.53193473815918, 13.51732063293457, 14.502707481384277, 15.488093376159668, 16.473480224609375, 17.458866119384766, 18.444252014160156, 19.42963981628418, 20.41502571105957, 21.40041160583496, 22.38579750061035, 23.371185302734375, 24.356571197509766, 25.341957092285156, 26.327342987060547, 27.31273078918457, 28.29811668395996, 29.28350257873535, 30.268888473510742, 31.254276275634766, 32.239662170410156, 33.22504806518555, 34.21043395996094, 35.19581985473633, 36.18120574951172, 37.166595458984375, 38.151981353759766, 39.137367248535156, 40.12275314331055, 41.1081428527832, 42.093528747558594, 43.078914642333984, 44.064300537109375, 45.049686431884766, 46.035072326660156, 47.02045822143555, 48.00584411621094, 48.991233825683594, 49.976619720458984, 50.962005615234375, 51.947391510009766, 52.932777404785156]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 4.0, 10.0, 3.0, 15.0, 15.0, 16.0, 17.0, 30.0, 27.0, 22.0, 25.0, 33.0, 50.0, 31.0, 35.0, 45.0, 49.0, 41.0, 54.0, 52.0, 45.0, 53.0, 27.0, 37.0, 23.0, 44.0, 38.0, 28.0, 26.0, 15.0, 12.0, 17.0, 13.0, 10.0, 6.0, 9.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.916046142578125, -31.875858306884766, -30.83567237854004, -29.795486450195312, -28.755298614501953, -27.715110778808594, -26.674924850463867, -25.63473892211914, -24.59455108642578, -23.554363250732422, -22.514177322387695, -21.47399139404297, -20.43380355834961, -19.39361572265625, -18.353429794311523, -17.313243865966797, -16.273056030273438, -15.232869148254395, -14.192682266235352, -13.152495384216309, -12.112308502197266, -11.072121620178223, -10.03193473815918, -8.991747856140137, -7.951560974121094, -6.911374092102051, -5.871187210083008, -4.831000328063965, -3.790813446044922, -2.750626564025879, -1.710439682006836, -0.670252799987793, 0.3699378967285156, 1.4101247787475586, 2.4503116607666016, 3.4904985427856445, 4.5306854248046875, 5.5708723068237305, 6.611059188842773, 7.651246070861816, 8.69143295288086, 9.731619834899902, 10.771806716918945, 11.811993598937988, 12.852180480957031, 13.892367362976074, 14.932554244995117, 15.97274112701416, 17.012928009033203, 18.053115844726562, 19.09330177307129, 20.133487701416016, 21.173675537109375, 22.213863372802734, 23.25404930114746, 24.294235229492188, 25.334423065185547, 26.374610900878906, 27.414796829223633, 28.45498275756836, 29.49517059326172, 30.535358428955078, 31.575544357299805, 32.61573028564453, 33.65591812133789]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 7.0, 7.0, 8.0, 10.0, 13.0, 12.0, 16.0, 19.0, 14.0, 25.0, 33.0, 26.0, 30.0, 32.0, 38.0, 36.0, 37.0, 33.0, 35.0, 38.0, 38.0, 33.0, 40.0, 37.0, 36.0, 41.0, 39.0, 26.0, 33.0, 27.0, 24.0, 27.0, 19.0, 17.0, 17.0, 13.0, 5.0, 13.0, 7.0, 8.0, 6.0, 2.0, 4.0, 1.0, 1.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.291015625, -3.1793212890625, -3.067626953125, -2.9559326171875, -2.84423828125, -2.7325439453125, -2.620849609375, -2.5091552734375, -2.3974609375, -2.2857666015625, -2.174072265625, -2.0623779296875, -1.95068359375, -1.8389892578125, -1.727294921875, -1.6156005859375, -1.50390625, -1.3922119140625, -1.280517578125, -1.1688232421875, -1.05712890625, -0.9454345703125, -0.833740234375, -0.7220458984375, -0.6103515625, -0.4986572265625, -0.386962890625, -0.2752685546875, -0.16357421875, -0.0518798828125, 0.059814453125, 0.1715087890625, 0.283203125, 0.3948974609375, 0.506591796875, 0.6182861328125, 0.72998046875, 0.8416748046875, 0.953369140625, 1.0650634765625, 1.1767578125, 1.2884521484375, 1.400146484375, 1.5118408203125, 1.62353515625, 1.7352294921875, 1.846923828125, 1.9586181640625, 2.0703125, 2.1820068359375, 2.293701171875, 2.4053955078125, 2.51708984375, 2.6287841796875, 2.740478515625, 2.8521728515625, 2.9638671875, 3.0755615234375, 3.187255859375, 3.2989501953125, 3.41064453125, 3.5223388671875, 3.634033203125, 3.7457275390625, 3.857421875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 6.0, 13.0, 10.0, 16.0, 19.0, 32.0, 47.0, 77.0, 130.0, 159.0, 285.0, 492.0, 924.0, 1867.0, 4077.0, 9561.0, 23197.0, 58075.0, 145250.0, 347579.0, 726774.0, 1112073.0, 920096.0, 488798.0, 212084.0, 85192.0, 33385.0, 13378.0, 5676.0, 2424.0, 1128.0, 609.0, 290.0, 179.0, 104.0, 78.0, 41.0, 37.0, 23.0, 21.0, 15.0, 11.0, 11.0, 10.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.263671875, -3.15380859375, -3.0439453125, -2.93408203125, -2.82421875, -2.71435546875, -2.6044921875, -2.49462890625, -2.384765625, -2.27490234375, -2.1650390625, -2.05517578125, -1.9453125, -1.83544921875, -1.7255859375, -1.61572265625, -1.505859375, -1.39599609375, -1.2861328125, -1.17626953125, -1.06640625, -0.95654296875, -0.8466796875, -0.73681640625, -0.626953125, -0.51708984375, -0.4072265625, -0.29736328125, -0.1875, -0.07763671875, 0.0322265625, 0.14208984375, 0.251953125, 0.36181640625, 0.4716796875, 0.58154296875, 0.69140625, 0.80126953125, 0.9111328125, 1.02099609375, 1.130859375, 1.24072265625, 1.3505859375, 1.46044921875, 1.5703125, 1.68017578125, 1.7900390625, 1.89990234375, 2.009765625, 2.11962890625, 2.2294921875, 2.33935546875, 2.44921875, 2.55908203125, 2.6689453125, 2.77880859375, 2.888671875, 2.99853515625, 3.1083984375, 3.21826171875, 3.328125, 3.43798828125, 3.5478515625, 3.65771484375, 3.767578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 16.0, 15.0, 23.0, 26.0, 38.0, 42.0, 60.0, 77.0, 103.0, 127.0, 200.0, 216.0, 252.0, 337.0, 408.0, 409.0, 331.0, 320.0, 244.0, 201.0, 146.0, 120.0, 91.0, 57.0, 43.0, 32.0, 31.0, 28.0, 19.0, 16.0, 8.0, 8.0, 2.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.01953125, -5.82708740234375, -5.6346435546875, -5.44219970703125, -5.249755859375, -5.05731201171875, -4.8648681640625, -4.67242431640625, -4.47998046875, -4.28753662109375, -4.0950927734375, -3.90264892578125, -3.710205078125, -3.51776123046875, -3.3253173828125, -3.13287353515625, -2.9404296875, -2.74798583984375, -2.5555419921875, -2.36309814453125, -2.170654296875, -1.97821044921875, -1.7857666015625, -1.59332275390625, -1.40087890625, -1.20843505859375, -1.0159912109375, -0.82354736328125, -0.631103515625, -0.43865966796875, -0.2462158203125, -0.05377197265625, 0.138671875, 0.33111572265625, 0.5235595703125, 0.71600341796875, 0.908447265625, 1.10089111328125, 1.2933349609375, 1.48577880859375, 1.67822265625, 1.87066650390625, 2.0631103515625, 2.25555419921875, 2.447998046875, 2.64044189453125, 2.8328857421875, 3.02532958984375, 3.2177734375, 3.41021728515625, 3.6026611328125, 3.79510498046875, 3.987548828125, 4.17999267578125, 4.3724365234375, 4.56488037109375, 4.75732421875, 4.94976806640625, 5.1422119140625, 5.33465576171875, 5.527099609375, 5.71954345703125, 5.9119873046875, 6.10443115234375, 6.296875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 16.0, 11.0, 28.0, 29.0, 41.0, 40.0, 67.0, 108.0, 161.0, 246.0, 417.0, 803.0, 2327.0, 45551.0, 3170591.0, 959074.0, 11629.0, 1480.0, 594.0, 383.0, 179.0, 134.0, 89.0, 66.0, 54.0, 32.0, 38.0, 16.0, 24.0, 8.0, 10.0, 6.0, 3.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.9375, -23.208251953125, -22.47900390625, -21.749755859375, -21.0205078125, -20.291259765625, -19.56201171875, -18.832763671875, -18.103515625, -17.374267578125, -16.64501953125, -15.915771484375, -15.1865234375, -14.457275390625, -13.72802734375, -12.998779296875, -12.26953125, -11.540283203125, -10.81103515625, -10.081787109375, -9.3525390625, -8.623291015625, -7.89404296875, -7.164794921875, -6.435546875, -5.706298828125, -4.97705078125, -4.247802734375, -3.5185546875, -2.789306640625, -2.06005859375, -1.330810546875, -0.6015625, 0.127685546875, 0.85693359375, 1.586181640625, 2.3154296875, 3.044677734375, 3.77392578125, 4.503173828125, 5.232421875, 5.961669921875, 6.69091796875, 7.420166015625, 8.1494140625, 8.878662109375, 9.60791015625, 10.337158203125, 11.06640625, 11.795654296875, 12.52490234375, 13.254150390625, 13.9833984375, 14.712646484375, 15.44189453125, 16.171142578125, 16.900390625, 17.629638671875, 18.35888671875, 19.088134765625, 19.8173828125, 20.546630859375, 21.27587890625, 22.005126953125, 22.734375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 23.0, 43.0, 110.0, 168.0, 202.0, 218.0, 147.0, 54.0, 26.0, 14.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.11661529541016, -70.34900665283203, -68.5813980102539, -66.81378936767578, -65.04618072509766, -63.2785758972168, -61.51096725463867, -59.74335861206055, -57.97575378417969, -56.20814514160156, -54.44053649902344, -52.67292785644531, -50.90532302856445, -49.13771438598633, -47.3701057434082, -45.60249710083008, -43.83488845825195, -42.06727981567383, -40.2996711730957, -38.532066345214844, -36.76445770263672, -34.996849060058594, -33.22924041748047, -31.461631774902344, -29.69402503967285, -27.926416397094727, -26.158809661865234, -24.39120101928711, -22.623592376708984, -20.855985641479492, -19.088376998901367, -17.320770263671875, -15.553157806396484, -13.785550117492676, -12.017942428588867, -10.250333786010742, -8.482726097106934, -6.715118408203125, -4.947509765625, -3.1799020767211914, -1.4122943878173828, 0.3553135395050049, 2.1229214668273926, 3.8905296325683594, 5.658137321472168, 7.425745010375977, 9.193353652954102, 10.96096134185791, 12.728569030761719, 14.496176719665527, 16.263784408569336, 18.03139305114746, 19.798999786376953, 21.566608428955078, 23.334217071533203, 25.101825714111328, 26.86943244934082, 28.637041091918945, 30.404647827148438, 32.17225646972656, 33.93986511230469, 35.70747375488281, 37.47508239746094, 39.2426872253418, 41.01029586791992]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 10.0, 3.0, 11.0, 9.0, 3.0, 7.0, 10.0, 14.0, 17.0, 24.0, 24.0, 27.0, 26.0, 28.0, 42.0, 37.0, 34.0, 41.0, 42.0, 31.0, 43.0, 44.0, 41.0, 22.0, 48.0, 28.0, 45.0, 31.0, 38.0, 29.0, 19.0, 31.0, 18.0, 24.0, 17.0, 14.0, 9.0, 8.0, 10.0, 10.0, 8.0, 13.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.34364891052246, -23.641258239746094, -22.93886947631836, -22.236478805541992, -21.534088134765625, -20.83169937133789, -20.129308700561523, -19.426918029785156, -18.724529266357422, -18.022138595581055, -17.31974983215332, -16.617359161376953, -15.914968490600586, -15.212578773498535, -14.510189056396484, -13.807798385620117, -13.10540771484375, -12.4030179977417, -11.700627326965332, -10.998237609863281, -10.295846939086914, -9.593457221984863, -8.891067504882812, -8.188676834106445, -7.4862871170043945, -6.7838969230651855, -6.081506729125977, -5.379117012023926, -4.676726818084717, -3.974336624145508, -3.271946907043457, -2.569556713104248, -1.867166519165039, -1.1647764444351196, -0.4623863697052002, 0.2400035858154297, 0.9423937797546387, 1.6447839736938477, 2.3471736907958984, 3.0495638847351074, 3.7519540786743164, 4.454344272613525, 5.156734466552734, 5.859124183654785, 6.561514377593994, 7.263904571533203, 7.966294288635254, 8.668684005737305, 9.371074676513672, 10.073464393615723, 10.77585506439209, 11.47824478149414, 12.180635452270508, 12.883025169372559, 13.58541488647461, 14.287805557250977, 14.990195274353027, 15.692584991455078, 16.394975662231445, 17.097366333007812, 17.799755096435547, 18.502145767211914, 19.20453643798828, 19.906925201416016, 20.609315872192383]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 4.0, 4.0, 4.0, 12.0, 11.0, 11.0, 12.0, 20.0, 19.0, 14.0, 15.0, 27.0, 33.0, 31.0, 31.0, 47.0, 39.0, 27.0, 35.0, 47.0, 41.0, 25.0, 52.0, 42.0, 32.0, 30.0, 31.0, 32.0, 39.0, 21.0, 27.0, 24.0, 31.0, 19.0, 16.0, 13.0, 14.0, 8.0, 5.0, 10.0, 4.0, 3.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.126953125, -3.023590087890625, -2.92022705078125, -2.816864013671875, -2.7135009765625, -2.610137939453125, -2.50677490234375, -2.403411865234375, -2.300048828125, -2.196685791015625, -2.09332275390625, -1.989959716796875, -1.8865966796875, -1.783233642578125, -1.67987060546875, -1.576507568359375, -1.47314453125, -1.369781494140625, -1.26641845703125, -1.163055419921875, -1.0596923828125, -0.956329345703125, -0.85296630859375, -0.749603271484375, -0.646240234375, -0.542877197265625, -0.43951416015625, -0.336151123046875, -0.2327880859375, -0.129425048828125, -0.02606201171875, 0.077301025390625, 0.1806640625, 0.284027099609375, 0.38739013671875, 0.490753173828125, 0.5941162109375, 0.697479248046875, 0.80084228515625, 0.904205322265625, 1.007568359375, 1.110931396484375, 1.21429443359375, 1.317657470703125, 1.4210205078125, 1.524383544921875, 1.62774658203125, 1.731109619140625, 1.83447265625, 1.937835693359375, 2.04119873046875, 2.144561767578125, 2.2479248046875, 2.351287841796875, 2.45465087890625, 2.558013916015625, 2.661376953125, 2.764739990234375, 2.86810302734375, 2.971466064453125, 3.0748291015625, 3.178192138671875, 3.28155517578125, 3.384918212890625, 3.48828125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 15.0, 12.0, 16.0, 45.0, 59.0, 86.0, 138.0, 224.0, 297.0, 489.0, 733.0, 1107.0, 1617.0, 2431.0, 3747.0, 5443.0, 7991.0, 11646.0, 16974.0, 24496.0, 34217.0, 46138.0, 61493.0, 77289.0, 91848.0, 103067.0, 107014.0, 99667.0, 86554.0, 70883.0, 54868.0, 41386.0, 29568.0, 21304.0, 14739.0, 10113.0, 6825.0, 4732.0, 3119.0, 2051.0, 1436.0, 902.0, 635.0, 370.0, 272.0, 187.0, 104.0, 83.0, 44.0, 27.0, 29.0, 11.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.484130859375, -0.4691429138183594, -0.45415496826171875, -0.4391670227050781, -0.4241790771484375, -0.4091911315917969, -0.39420318603515625, -0.3792152404785156, -0.364227294921875, -0.3492393493652344, -0.33425140380859375, -0.3192634582519531, -0.3042755126953125, -0.2892875671386719, -0.27429962158203125, -0.2593116760253906, -0.24432373046875, -0.22933578491210938, -0.21434783935546875, -0.19935989379882812, -0.1843719482421875, -0.16938400268554688, -0.15439605712890625, -0.13940811157226562, -0.124420166015625, -0.10943222045898438, -0.09444427490234375, -0.07945632934570312, -0.0644683837890625, -0.049480438232421875, -0.03449249267578125, -0.019504547119140625, -0.0045166015625, 0.010471343994140625, 0.02545928955078125, 0.040447235107421875, 0.0554351806640625, 0.07042312622070312, 0.08541107177734375, 0.10039901733398438, 0.115386962890625, 0.13037490844726562, 0.14536285400390625, 0.16035079956054688, 0.1753387451171875, 0.19032669067382812, 0.20531463623046875, 0.22030258178710938, 0.23529052734375, 0.2502784729003906, 0.26526641845703125, 0.2802543640136719, 0.2952423095703125, 0.3102302551269531, 0.32521820068359375, 0.3402061462402344, 0.355194091796875, 0.3701820373535156, 0.38516998291015625, 0.4001579284667969, 0.4151458740234375, 0.4301338195800781, 0.44512176513671875, 0.4601097106933594, 0.47509765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 6.0, 5.0, 6.0, 9.0, 1.0, 11.0, 10.0, 8.0, 10.0, 14.0, 12.0, 18.0, 17.0, 19.0, 26.0, 22.0, 33.0, 33.0, 30.0, 34.0, 36.0, 39.0, 40.0, 40.0, 1063.0, 30.0, 38.0, 36.0, 30.0, 31.0, 39.0, 30.0, 33.0, 27.0, 23.0, 30.0, 27.0, 15.0, 17.0, 18.0, 9.0, 18.0, 6.0, 7.0, 5.0, 6.0, 5.0, 2.0, 7.0, 2.0, 1.0, 5.0, 1.0, 1.0], "bins": [-2.703125, -2.6256103515625, -2.548095703125, -2.4705810546875, -2.39306640625, -2.3155517578125, -2.238037109375, -2.1605224609375, -2.0830078125, -2.0054931640625, -1.927978515625, -1.8504638671875, -1.77294921875, -1.6954345703125, -1.617919921875, -1.5404052734375, -1.462890625, -1.3853759765625, -1.307861328125, -1.2303466796875, -1.15283203125, -1.0753173828125, -0.997802734375, -0.9202880859375, -0.8427734375, -0.7652587890625, -0.687744140625, -0.6102294921875, -0.53271484375, -0.4552001953125, -0.377685546875, -0.3001708984375, -0.22265625, -0.1451416015625, -0.067626953125, 0.0098876953125, 0.08740234375, 0.1649169921875, 0.242431640625, 0.3199462890625, 0.3974609375, 0.4749755859375, 0.552490234375, 0.6300048828125, 0.70751953125, 0.7850341796875, 0.862548828125, 0.9400634765625, 1.017578125, 1.0950927734375, 1.172607421875, 1.2501220703125, 1.32763671875, 1.4051513671875, 1.482666015625, 1.5601806640625, 1.6376953125, 1.7152099609375, 1.792724609375, 1.8702392578125, 1.94775390625, 2.0252685546875, 2.102783203125, 2.1802978515625, 2.2578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 11.0, 16.0, 15.0, 26.0, 27.0, 34.0, 63.0, 72.0, 123.0, 179.0, 275.0, 376.0, 549.0, 784.0, 1124.0, 1566.0, 2320.0, 3340.0, 4814.0, 6767.0, 9510.0, 13870.0, 21429.0, 35003.0, 1865540.0, 50273.0, 25661.0, 16428.0, 11148.0, 7789.0, 5448.0, 3758.0, 2687.0, 1927.0, 1282.0, 902.0, 620.0, 440.0, 308.0, 192.0, 136.0, 99.0, 69.0, 45.0, 35.0, 11.0, 17.0, 7.0, 10.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0517578125, -1.0175018310546875, -0.983245849609375, -0.9489898681640625, -0.91473388671875, -0.8804779052734375, -0.846221923828125, -0.8119659423828125, -0.7777099609375, -0.7434539794921875, -0.709197998046875, -0.6749420166015625, -0.64068603515625, -0.6064300537109375, -0.572174072265625, -0.5379180908203125, -0.503662109375, -0.4694061279296875, -0.435150146484375, -0.4008941650390625, -0.36663818359375, -0.3323822021484375, -0.298126220703125, -0.2638702392578125, -0.2296142578125, -0.1953582763671875, -0.161102294921875, -0.1268463134765625, -0.09259033203125, -0.0583343505859375, -0.024078369140625, 0.0101776123046875, 0.04443359375, 0.0786895751953125, 0.112945556640625, 0.1472015380859375, 0.18145751953125, 0.2157135009765625, 0.249969482421875, 0.2842254638671875, 0.3184814453125, 0.3527374267578125, 0.386993408203125, 0.4212493896484375, 0.45550537109375, 0.4897613525390625, 0.524017333984375, 0.5582733154296875, 0.592529296875, 0.6267852783203125, 0.661041259765625, 0.6952972412109375, 0.72955322265625, 0.7638092041015625, 0.798065185546875, 0.8323211669921875, 0.8665771484375, 0.9008331298828125, 0.935089111328125, 0.9693450927734375, 1.00360107421875, 1.0378570556640625, 1.072113037109375, 1.1063690185546875, 1.140625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 2.0, 4.0, 5.0, 4.0, 3.0, 7.0, 7.0, 6.0, 8.0, 6.0, 11.0, 12.0, 10.0, 16.0, 18.0, 26.0, 35.0, 27.0, 44.0, 56.0, 66.0, 76.0, 77.0, 72.0, 60.0, 56.0, 46.0, 39.0, 36.0, 33.0, 26.0, 15.0, 14.0, 11.0, 7.0, 10.0, 9.0, 10.0, 6.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02294921875, -0.022269725799560547, -0.021590232849121094, -0.02091073989868164, -0.020231246948242188, -0.019551753997802734, -0.01887226104736328, -0.018192768096923828, -0.017513275146484375, -0.016833782196044922, -0.01615428924560547, -0.015474796295166016, -0.014795303344726562, -0.01411581039428711, -0.013436317443847656, -0.012756824493408203, -0.01207733154296875, -0.011397838592529297, -0.010718345642089844, -0.01003885269165039, -0.009359359741210938, -0.008679866790771484, -0.008000373840332031, -0.007320880889892578, -0.006641387939453125, -0.005961894989013672, -0.005282402038574219, -0.004602909088134766, -0.0039234161376953125, -0.0032439231872558594, -0.0025644302368164062, -0.0018849372863769531, -0.0012054443359375, -0.0005259513854980469, 0.00015354156494140625, 0.0008330345153808594, 0.0015125274658203125, 0.0021920204162597656, 0.0028715133666992188, 0.003551006317138672, 0.004230499267578125, 0.004909992218017578, 0.005589485168457031, 0.006268978118896484, 0.0069484710693359375, 0.007627964019775391, 0.008307456970214844, 0.008986949920654297, 0.00966644287109375, 0.010345935821533203, 0.011025428771972656, 0.01170492172241211, 0.012384414672851562, 0.013063907623291016, 0.013743400573730469, 0.014422893524169922, 0.015102386474609375, 0.015781879425048828, 0.01646137237548828, 0.017140865325927734, 0.017820358276367188, 0.01849985122680664, 0.019179344177246094, 0.019858837127685547, 0.020538330078125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 10.0, 1.0, 4.0, 5.0, 7.0, 11.0, 11.0, 6.0, 17.0, 22.0, 32.0, 47.0, 53.0, 86.0, 137.0, 257.0, 660.0, 10825.0, 1019387.0, 15457.0, 723.0, 298.0, 152.0, 76.0, 53.0, 51.0, 38.0, 21.0, 21.0, 14.0, 9.0, 12.0, 8.0, 3.0, 8.0, 6.0, 5.0, 2.0, 3.0, 5.0, 0.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50341796875, -0.48693084716796875, -0.4704437255859375, -0.45395660400390625, -0.437469482421875, -0.42098236083984375, -0.4044952392578125, -0.38800811767578125, -0.37152099609375, -0.35503387451171875, -0.3385467529296875, -0.32205963134765625, -0.305572509765625, -0.28908538818359375, -0.2725982666015625, -0.25611114501953125, -0.2396240234375, -0.22313690185546875, -0.2066497802734375, -0.19016265869140625, -0.173675537109375, -0.15718841552734375, -0.1407012939453125, -0.12421417236328125, -0.10772705078125, -0.09123992919921875, -0.0747528076171875, -0.05826568603515625, -0.041778564453125, -0.02529144287109375, -0.0088043212890625, 0.00768280029296875, 0.024169921875, 0.04065704345703125, 0.0571441650390625, 0.07363128662109375, 0.090118408203125, 0.10660552978515625, 0.1230926513671875, 0.13957977294921875, 0.15606689453125, 0.17255401611328125, 0.1890411376953125, 0.20552825927734375, 0.222015380859375, 0.23850250244140625, 0.2549896240234375, 0.27147674560546875, 0.2879638671875, 0.30445098876953125, 0.3209381103515625, 0.33742523193359375, 0.353912353515625, 0.37039947509765625, 0.3868865966796875, 0.40337371826171875, 0.41986083984375, 0.43634796142578125, 0.4528350830078125, 0.46932220458984375, 0.485809326171875, 0.5022964477539062, 0.5187835693359375, 0.5352706909179688, 0.5517578125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 17.0, 35.0, 66.0, 176.0, 382.0, 260.0, 52.0, 13.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.22546342015266418, -0.22148779034614563, -0.21751216053962708, -0.21353653073310852, -0.20956090092658997, -0.2055852711200714, -0.20160964131355286, -0.1976340115070343, -0.19365838170051575, -0.1896827518939972, -0.18570712208747864, -0.18173149228096008, -0.17775586247444153, -0.17378023266792297, -0.16980460286140442, -0.16582897305488586, -0.1618533432483673, -0.15787771344184875, -0.1539020836353302, -0.14992645382881165, -0.1459508240222931, -0.14197519421577454, -0.13799956440925598, -0.13402393460273743, -0.13004828989505768, -0.12607266008853912, -0.12209703028202057, -0.11812140047550201, -0.11414577066898346, -0.1101701408624649, -0.10619451105594635, -0.1022188812494278, -0.09824325144290924, -0.09426762163639069, -0.09029199182987213, -0.08631636202335358, -0.08234073221683502, -0.07836510241031647, -0.07438947260379791, -0.07041384279727936, -0.0664382129907608, -0.06246258318424225, -0.058486953377723694, -0.05451132357120514, -0.050535693764686584, -0.04656006395816803, -0.04258443042635918, -0.03860880061984062, -0.03463316708803177, -0.030657537281513214, -0.02668190747499466, -0.022706275805830956, -0.0187306459993124, -0.014755016192793846, -0.010779384523630142, -0.0068037547171115875, -0.002828126773238182, 0.00114750349894166, 0.005123133771121502, 0.009098764508962631, 0.013074394315481186, 0.01705002412199974, 0.021025655791163445, 0.025001285597682, 0.028976915404200554]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 9.0, 5.0, 3.0, 8.0, 7.0, 3.0, 8.0, 7.0, 14.0, 15.0, 16.0, 14.0, 17.0, 24.0, 12.0, 34.0, 27.0, 31.0, 43.0, 31.0, 31.0, 40.0, 35.0, 40.0, 35.0, 41.0, 39.0, 50.0, 28.0, 35.0, 24.0, 24.0, 35.0, 26.0, 21.0, 22.0, 24.0, 24.0, 17.0, 19.0, 11.0, 7.0, 8.0, 10.0, 5.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0], "bins": [-0.01739645004272461, -0.01683700829744339, -0.01627756468951702, -0.015718121081590652, -0.015158679336309433, -0.014599236659705639, -0.014039793983101845, -0.01348035130649805, -0.012920908629894257, -0.012361465953290462, -0.011802023276686668, -0.011242580600082874, -0.01068313792347908, -0.010123695246875286, -0.009564252570271492, -0.009004809893667698, -0.008445367217063904, -0.00788592454046011, -0.007326481863856316, -0.0067670391872525215, -0.006207596510648727, -0.005648153834044933, -0.005088711157441139, -0.004529268480837345, -0.003969825804233551, -0.003410383127629757, -0.002850940451025963, -0.0022914977744221687, -0.0017320550978183746, -0.0011726124212145805, -0.0006131697446107864, -5.372706800699234e-05, 0.0005057156085968018, 0.0010651582852005959, 0.00162460096180439, 0.002184043638408184, 0.002743486315011978, 0.0033029289916157722, 0.0038623716682195663, 0.0044218143448233604, 0.0049812570214271545, 0.005540699698030949, 0.006100142374634743, 0.006659585051238537, 0.007219027727842331, 0.007778470404446125, 0.008337913081049919, 0.008897355757653713, 0.009456798434257507, 0.010016241110861301, 0.010575683787465096, 0.01113512646406889, 0.011694569140672684, 0.012254011817276478, 0.012813454493880272, 0.013372897170484066, 0.01393233984708786, 0.014491782523691654, 0.015051225200295448, 0.015610667876899242, 0.016170110553503036, 0.016729552298784256, 0.017288995906710625, 0.017848439514636993, 0.018407881259918213]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 1.0, 5.0, 9.0, 5.0, 11.0, 18.0, 16.0, 23.0, 26.0, 13.0, 25.0, 34.0, 31.0, 33.0, 39.0, 37.0, 38.0, 45.0, 39.0, 32.0, 48.0, 46.0, 48.0, 33.0, 34.0, 39.0, 29.0, 30.0, 34.0, 24.0, 25.0, 26.0, 18.0, 11.0, 14.0, 10.0, 14.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.037109375, -2.925689697265625, -2.81427001953125, -2.702850341796875, -2.5914306640625, -2.480010986328125, -2.36859130859375, -2.257171630859375, -2.145751953125, -2.034332275390625, -1.92291259765625, -1.811492919921875, -1.7000732421875, -1.588653564453125, -1.47723388671875, -1.365814208984375, -1.25439453125, -1.142974853515625, -1.03155517578125, -0.920135498046875, -0.8087158203125, -0.697296142578125, -0.58587646484375, -0.474456787109375, -0.363037109375, -0.251617431640625, -0.14019775390625, -0.028778076171875, 0.0826416015625, 0.194061279296875, 0.30548095703125, 0.416900634765625, 0.5283203125, 0.639739990234375, 0.75115966796875, 0.862579345703125, 0.9739990234375, 1.085418701171875, 1.19683837890625, 1.308258056640625, 1.419677734375, 1.531097412109375, 1.64251708984375, 1.753936767578125, 1.8653564453125, 1.976776123046875, 2.08819580078125, 2.199615478515625, 2.31103515625, 2.422454833984375, 2.53387451171875, 2.645294189453125, 2.7567138671875, 2.868133544921875, 2.97955322265625, 3.090972900390625, 3.202392578125, 3.313812255859375, 3.42523193359375, 3.536651611328125, 3.6480712890625, 3.759490966796875, 3.87091064453125, 3.982330322265625, 4.09375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 3.0, 6.0, 10.0, 11.0, 23.0, 23.0, 43.0, 53.0, 84.0, 143.0, 203.0, 361.0, 611.0, 972.0, 1753.0, 2890.0, 5093.0, 8314.0, 14348.0, 24260.0, 42237.0, 76097.0, 152579.0, 256561.0, 214247.0, 110706.0, 57387.0, 32891.0, 19255.0, 11274.0, 6688.0, 3882.0, 2286.0, 1307.0, 758.0, 422.0, 292.0, 177.0, 109.0, 55.0, 39.0, 39.0, 26.0, 10.0, 12.0, 7.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.66796875, -2.5718994140625, -2.475830078125, -2.3797607421875, -2.28369140625, -2.1876220703125, -2.091552734375, -1.9954833984375, -1.8994140625, -1.8033447265625, -1.707275390625, -1.6112060546875, -1.51513671875, -1.4190673828125, -1.322998046875, -1.2269287109375, -1.130859375, -1.0347900390625, -0.938720703125, -0.8426513671875, -0.74658203125, -0.6505126953125, -0.554443359375, -0.4583740234375, -0.3623046875, -0.2662353515625, -0.170166015625, -0.0740966796875, 0.02197265625, 0.1180419921875, 0.214111328125, 0.3101806640625, 0.40625, 0.5023193359375, 0.598388671875, 0.6944580078125, 0.79052734375, 0.8865966796875, 0.982666015625, 1.0787353515625, 1.1748046875, 1.2708740234375, 1.366943359375, 1.4630126953125, 1.55908203125, 1.6551513671875, 1.751220703125, 1.8472900390625, 1.943359375, 2.0394287109375, 2.135498046875, 2.2315673828125, 2.32763671875, 2.4237060546875, 2.519775390625, 2.6158447265625, 2.7119140625, 2.8079833984375, 2.904052734375, 3.0001220703125, 3.09619140625, 3.1922607421875, 3.288330078125, 3.3843994140625, 3.48046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 2.0, 4.0, 10.0, 8.0, 18.0, 13.0, 30.0, 25.0, 33.0, 32.0, 32.0, 42.0, 48.0, 50.0, 85.0, 155.0, 1431.0, 413.0, 153.0, 91.0, 52.0, 44.0, 29.0, 48.0, 40.0, 20.0, 24.0, 18.0, 16.0, 19.0, 19.0, 8.0, 5.0, 6.0, 7.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.203125, -12.7904052734375, -12.377685546875, -11.9649658203125, -11.55224609375, -11.1395263671875, -10.726806640625, -10.3140869140625, -9.9013671875, -9.4886474609375, -9.075927734375, -8.6632080078125, -8.25048828125, -7.8377685546875, -7.425048828125, -7.0123291015625, -6.599609375, -6.1868896484375, -5.774169921875, -5.3614501953125, -4.94873046875, -4.5360107421875, -4.123291015625, -3.7105712890625, -3.2978515625, -2.8851318359375, -2.472412109375, -2.0596923828125, -1.64697265625, -1.2342529296875, -0.821533203125, -0.4088134765625, 0.00390625, 0.4166259765625, 0.829345703125, 1.2420654296875, 1.65478515625, 2.0675048828125, 2.480224609375, 2.8929443359375, 3.3056640625, 3.7183837890625, 4.131103515625, 4.5438232421875, 4.95654296875, 5.3692626953125, 5.781982421875, 6.1947021484375, 6.607421875, 7.0201416015625, 7.432861328125, 7.8455810546875, 8.25830078125, 8.6710205078125, 9.083740234375, 9.4964599609375, 9.9091796875, 10.3218994140625, 10.734619140625, 11.1473388671875, 11.56005859375, 11.9727783203125, 12.385498046875, 12.7982177734375, 13.2109375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 3.0, 6.0, 4.0, 7.0, 9.0, 10.0, 12.0, 23.0, 23.0, 32.0, 40.0, 47.0, 89.0, 109.0, 132.0, 185.0, 300.0, 517.0, 1486.0, 15080.0, 554270.0, 2521921.0, 46609.0, 2918.0, 700.0, 338.0, 229.0, 134.0, 101.0, 85.0, 59.0, 47.0, 47.0, 33.0, 15.0, 18.0, 17.0, 12.0, 8.0, 5.0, 9.0, 2.0, 1.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.609375, -18.048583984375, -17.48779296875, -16.927001953125, -16.3662109375, -15.805419921875, -15.24462890625, -14.683837890625, -14.123046875, -13.562255859375, -13.00146484375, -12.440673828125, -11.8798828125, -11.319091796875, -10.75830078125, -10.197509765625, -9.63671875, -9.075927734375, -8.51513671875, -7.954345703125, -7.3935546875, -6.832763671875, -6.27197265625, -5.711181640625, -5.150390625, -4.589599609375, -4.02880859375, -3.468017578125, -2.9072265625, -2.346435546875, -1.78564453125, -1.224853515625, -0.6640625, -0.103271484375, 0.45751953125, 1.018310546875, 1.5791015625, 2.139892578125, 2.70068359375, 3.261474609375, 3.822265625, 4.383056640625, 4.94384765625, 5.504638671875, 6.0654296875, 6.626220703125, 7.18701171875, 7.747802734375, 8.30859375, 8.869384765625, 9.43017578125, 9.990966796875, 10.5517578125, 11.112548828125, 11.67333984375, 12.234130859375, 12.794921875, 13.355712890625, 13.91650390625, 14.477294921875, 15.0380859375, 15.598876953125, 16.15966796875, 16.720458984375, 17.28125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 20.0, 46.0, 83.0, 119.0, 131.0, 170.0, 139.0, 122.0, 92.0, 51.0, 20.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.703411102294922, -21.90923309326172, -21.11505699157715, -20.320878982543945, -19.526700973510742, -18.732524871826172, -17.93834686279297, -17.144168853759766, -16.349992752075195, -15.555815696716309, -14.761637687683105, -13.967460632324219, -13.173283576965332, -12.379106521606445, -11.584928512573242, -10.790751457214355, -9.996573448181152, -9.202396392822266, -8.408218383789062, -7.614041328430176, -6.819864273071289, -6.025686740875244, -5.231509208679199, -4.4373321533203125, -3.6431546211242676, -2.8489773273468018, -2.054800033569336, -1.260622501373291, -0.4664452075958252, 0.3277320861816406, 1.1219096183776855, 1.9160866737365723, 2.710264205932617, 3.504441499710083, 4.298618793487549, 5.092796325683594, 5.8869733810424805, 6.681150913238525, 7.47532844543457, 8.269505500793457, 9.063682556152344, 9.85785961151123, 10.652037620544434, 11.44621467590332, 12.240391731262207, 13.034568786621094, 13.828746795654297, 14.622923851013184, 15.417101860046387, 16.211278915405273, 17.005456924438477, 17.799633026123047, 18.59381103515625, 19.387989044189453, 20.182167053222656, 20.976343154907227, 21.77052116394043, 22.564699172973633, 23.358875274658203, 24.153053283691406, 24.94723129272461, 25.74140739440918, 26.535585403442383, 27.329761505126953, 28.123939514160156]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 13.0, 9.0, 10.0, 7.0, 11.0, 22.0, 19.0, 25.0, 27.0, 26.0, 27.0, 37.0, 46.0, 37.0, 43.0, 46.0, 61.0, 54.0, 46.0, 34.0, 40.0, 53.0, 51.0, 34.0, 36.0, 22.0, 24.0, 25.0, 26.0, 18.0, 18.0, 16.0, 12.0, 5.0, 6.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.133480072021484, -31.12346839904785, -30.11345672607422, -29.103445053100586, -28.093433380126953, -27.08342170715332, -26.073410034179688, -25.063398361206055, -24.053386688232422, -23.04337501525879, -22.033363342285156, -21.023351669311523, -20.01333999633789, -19.003328323364258, -17.993316650390625, -16.983304977416992, -15.97329330444336, -14.963281631469727, -13.953269958496094, -12.943258285522461, -11.933246612548828, -10.923234939575195, -9.913223266601562, -8.90321159362793, -7.893199920654297, -6.883188247680664, -5.873176574707031, -4.863164901733398, -3.8531532287597656, -2.843141555786133, -1.8331298828125, -0.8231182098388672, 0.18689727783203125, 1.196908950805664, 2.206920623779297, 3.2169322967529297, 4.2269439697265625, 5.236955642700195, 6.246967315673828, 7.256978988647461, 8.266990661621094, 9.277002334594727, 10.28701400756836, 11.297025680541992, 12.307037353515625, 13.317049026489258, 14.32706069946289, 15.337072372436523, 16.347084045410156, 17.35709571838379, 18.367107391357422, 19.377119064331055, 20.387130737304688, 21.39714241027832, 22.407154083251953, 23.417165756225586, 24.42717742919922, 25.43718910217285, 26.447200775146484, 27.457212448120117, 28.46722412109375, 29.477235794067383, 30.487247467041016, 31.49725914001465, 32.50727081298828]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 4.0, 4.0, 13.0, 13.0, 8.0, 10.0, 16.0, 18.0, 22.0, 23.0, 20.0, 26.0, 44.0, 24.0, 33.0, 38.0, 45.0, 47.0, 50.0, 48.0, 43.0, 39.0, 38.0, 42.0, 28.0, 33.0, 38.0, 24.0, 28.0, 28.0, 19.0, 19.0, 20.0, 19.0, 8.0, 13.0, 11.0, 8.0, 5.0, 7.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380859375, -3.263092041015625, -3.14532470703125, -3.027557373046875, -2.9097900390625, -2.792022705078125, -2.67425537109375, -2.556488037109375, -2.438720703125, -2.320953369140625, -2.20318603515625, -2.085418701171875, -1.9676513671875, -1.849884033203125, -1.73211669921875, -1.614349365234375, -1.49658203125, -1.378814697265625, -1.26104736328125, -1.143280029296875, -1.0255126953125, -0.907745361328125, -0.78997802734375, -0.672210693359375, -0.554443359375, -0.436676025390625, -0.31890869140625, -0.201141357421875, -0.0833740234375, 0.034393310546875, 0.15216064453125, 0.269927978515625, 0.3876953125, 0.505462646484375, 0.62322998046875, 0.740997314453125, 0.8587646484375, 0.976531982421875, 1.09429931640625, 1.212066650390625, 1.329833984375, 1.447601318359375, 1.56536865234375, 1.683135986328125, 1.8009033203125, 1.918670654296875, 2.03643798828125, 2.154205322265625, 2.27197265625, 2.389739990234375, 2.50750732421875, 2.625274658203125, 2.7430419921875, 2.860809326171875, 2.97857666015625, 3.096343994140625, 3.214111328125, 3.331878662109375, 3.44964599609375, 3.567413330078125, 3.6851806640625, 3.802947998046875, 3.92071533203125, 4.038482666015625, 4.15625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 5.0, 4.0, 2.0, 8.0, 17.0, 9.0, 8.0, 20.0, 21.0, 28.0, 23.0, 31.0, 54.0, 63.0, 135.0, 421.0, 1932.0, 14300.0, 164794.0, 1868257.0, 1949884.0, 176142.0, 15105.0, 2079.0, 467.0, 148.0, 72.0, 61.0, 38.0, 30.0, 17.0, 23.0, 18.0, 14.0, 6.0, 10.0, 11.0, 5.0, 3.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.296875, -9.9849853515625, -9.673095703125, -9.3612060546875, -9.04931640625, -8.7374267578125, -8.425537109375, -8.1136474609375, -7.8017578125, -7.4898681640625, -7.177978515625, -6.8660888671875, -6.55419921875, -6.2423095703125, -5.930419921875, -5.6185302734375, -5.306640625, -4.9947509765625, -4.682861328125, -4.3709716796875, -4.05908203125, -3.7471923828125, -3.435302734375, -3.1234130859375, -2.8115234375, -2.4996337890625, -2.187744140625, -1.8758544921875, -1.56396484375, -1.2520751953125, -0.940185546875, -0.6282958984375, -0.31640625, -0.0045166015625, 0.307373046875, 0.6192626953125, 0.93115234375, 1.2430419921875, 1.554931640625, 1.8668212890625, 2.1787109375, 2.4906005859375, 2.802490234375, 3.1143798828125, 3.42626953125, 3.7381591796875, 4.050048828125, 4.3619384765625, 4.673828125, 4.9857177734375, 5.297607421875, 5.6094970703125, 5.92138671875, 6.2332763671875, 6.545166015625, 6.8570556640625, 7.1689453125, 7.4808349609375, 7.792724609375, 8.1046142578125, 8.41650390625, 8.7283935546875, 9.040283203125, 9.3521728515625, 9.6640625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 12.0, 14.0, 6.0, 30.0, 26.0, 32.0, 51.0, 75.0, 84.0, 154.0, 187.0, 267.0, 373.0, 444.0, 502.0, 426.0, 367.0, 276.0, 213.0, 129.0, 102.0, 75.0, 58.0, 33.0, 36.0, 36.0, 18.0, 14.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.39178466796875, -4.1781005859375, -3.96441650390625, -3.750732421875, -3.53704833984375, -3.3233642578125, -3.10968017578125, -2.89599609375, -2.68231201171875, -2.4686279296875, -2.25494384765625, -2.041259765625, -1.82757568359375, -1.6138916015625, -1.40020751953125, -1.1865234375, -0.97283935546875, -0.7591552734375, -0.54547119140625, -0.331787109375, -0.11810302734375, 0.0955810546875, 0.30926513671875, 0.52294921875, 0.73663330078125, 0.9503173828125, 1.16400146484375, 1.377685546875, 1.59136962890625, 1.8050537109375, 2.01873779296875, 2.232421875, 2.44610595703125, 2.6597900390625, 2.87347412109375, 3.087158203125, 3.30084228515625, 3.5145263671875, 3.72821044921875, 3.94189453125, 4.15557861328125, 4.3692626953125, 4.58294677734375, 4.796630859375, 5.01031494140625, 5.2239990234375, 5.43768310546875, 5.6513671875, 5.86505126953125, 6.0787353515625, 6.29241943359375, 6.506103515625, 6.71978759765625, 6.9334716796875, 7.14715576171875, 7.36083984375, 7.57452392578125, 7.7882080078125, 8.00189208984375, 8.215576171875, 8.42926025390625, 8.6429443359375, 8.85662841796875, 9.0703125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 6.0, 9.0, 13.0, 16.0, 21.0, 31.0, 46.0, 45.0, 69.0, 105.0, 174.0, 257.0, 441.0, 808.0, 2116.0, 16530.0, 635377.0, 3407059.0, 122504.0, 5780.0, 1222.0, 608.0, 357.0, 202.0, 152.0, 106.0, 64.0, 34.0, 32.0, 29.0, 15.0, 9.0, 11.0, 12.0, 8.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-24.953125, -24.301513671875, -23.64990234375, -22.998291015625, -22.3466796875, -21.695068359375, -21.04345703125, -20.391845703125, -19.740234375, -19.088623046875, -18.43701171875, -17.785400390625, -17.1337890625, -16.482177734375, -15.83056640625, -15.178955078125, -14.52734375, -13.875732421875, -13.22412109375, -12.572509765625, -11.9208984375, -11.269287109375, -10.61767578125, -9.966064453125, -9.314453125, -8.662841796875, -8.01123046875, -7.359619140625, -6.7080078125, -6.056396484375, -5.40478515625, -4.753173828125, -4.1015625, -3.449951171875, -2.79833984375, -2.146728515625, -1.4951171875, -0.843505859375, -0.19189453125, 0.459716796875, 1.111328125, 1.762939453125, 2.41455078125, 3.066162109375, 3.7177734375, 4.369384765625, 5.02099609375, 5.672607421875, 6.32421875, 6.975830078125, 7.62744140625, 8.279052734375, 8.9306640625, 9.582275390625, 10.23388671875, 10.885498046875, 11.537109375, 12.188720703125, 12.84033203125, 13.491943359375, 14.1435546875, 14.795166015625, 15.44677734375, 16.098388671875, 16.75]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 22.0, 58.0, 103.0, 155.0, 200.0, 189.0, 157.0, 73.0, 35.0, 11.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.93562316894531, -35.31706237792969, -33.69850540161133, -32.0799446105957, -30.46138572692871, -28.84282684326172, -27.224267959594727, -25.605709075927734, -23.98714828491211, -22.368589401245117, -20.750030517578125, -19.1314697265625, -17.512910842895508, -15.894351959228516, -14.275793075561523, -12.657233238220215, -11.038675308227539, -9.420116424560547, -7.801556587219238, -6.182997703552246, -4.564438343048096, -2.9458789825439453, -1.3273200988769531, 0.29123973846435547, 1.9097986221313477, 3.528357982635498, 5.146917343139648, 6.765476226806641, 8.384035110473633, 10.002594947814941, 11.621153831481934, 13.239713668823242, 14.858272552490234, 16.476831436157227, 18.09539031982422, 19.713951110839844, 21.332509994506836, 22.951068878173828, 24.56962776184082, 26.188186645507812, 27.806747436523438, 29.42530632019043, 31.043865203857422, 32.66242599487305, 34.280982971191406, 35.89954376220703, 37.518104553222656, 39.136661529541016, 40.755218505859375, 42.373779296875, 43.99233627319336, 45.610897064208984, 47.229454040527344, 48.84801483154297, 50.466575622558594, 52.08513259887695, 53.70369338989258, 55.3222541809082, 56.94081115722656, 58.55937194824219, 60.17792892456055, 61.79648971557617, 63.41504669189453, 65.03360748291016, 66.65216827392578]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 10.0, 10.0, 15.0, 17.0, 12.0, 25.0, 27.0, 22.0, 36.0, 29.0, 39.0, 39.0, 36.0, 47.0, 32.0, 36.0, 32.0, 38.0, 40.0, 40.0, 44.0, 42.0, 34.0, 31.0, 33.0, 27.0, 24.0, 16.0, 21.0, 22.0, 16.0, 18.0, 12.0, 7.0, 7.0, 11.0, 10.0, 2.0, 4.0, 6.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-20.990854263305664, -20.358154296875, -19.725452423095703, -19.09275245666504, -18.460052490234375, -17.82735252380371, -17.194652557373047, -16.56195068359375, -15.929250717163086, -15.296550750732422, -14.663849830627441, -14.031148910522461, -13.398448944091797, -12.765748977661133, -12.133048057556152, -11.500347137451172, -10.867647171020508, -10.234947204589844, -9.602246284484863, -8.969545364379883, -8.336845397949219, -7.7041449546813965, -7.071444511413574, -6.438744068145752, -5.80604362487793, -5.173343181610107, -4.540642738342285, -3.907942295074463, -3.2752418518066406, -2.6425414085388184, -2.009840965270996, -1.3771405220031738, -0.7444400787353516, -0.1117396354675293, 0.520960807800293, 1.1536612510681152, 1.7863616943359375, 2.4190621376037598, 3.051762580871582, 3.6844630241394043, 4.317163467407227, 4.949863910675049, 5.582564353942871, 6.215264797210693, 6.847965240478516, 7.480665683746338, 8.11336612701416, 8.74606704711914, 9.378767013549805, 10.011466979980469, 10.64416790008545, 11.27686882019043, 11.909568786621094, 12.542268753051758, 13.174969673156738, 13.807670593261719, 14.440370559692383, 15.073070526123047, 15.705771446228027, 16.338472366333008, 16.971172332763672, 17.603872299194336, 18.236572265625, 18.869274139404297, 19.50197410583496]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 10.0, 6.0, 11.0, 14.0, 20.0, 20.0, 21.0, 27.0, 13.0, 33.0, 24.0, 36.0, 41.0, 38.0, 38.0, 33.0, 51.0, 34.0, 40.0, 45.0, 25.0, 39.0, 45.0, 40.0, 42.0, 29.0, 27.0, 22.0, 16.0, 21.0, 16.0, 17.0, 21.0, 15.0, 8.0, 8.0, 5.0, 6.0, 8.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.517578125, -3.405029296875, -3.29248046875, -3.179931640625, -3.0673828125, -2.954833984375, -2.84228515625, -2.729736328125, -2.6171875, -2.504638671875, -2.39208984375, -2.279541015625, -2.1669921875, -2.054443359375, -1.94189453125, -1.829345703125, -1.716796875, -1.604248046875, -1.49169921875, -1.379150390625, -1.2666015625, -1.154052734375, -1.04150390625, -0.928955078125, -0.81640625, -0.703857421875, -0.59130859375, -0.478759765625, -0.3662109375, -0.253662109375, -0.14111328125, -0.028564453125, 0.083984375, 0.196533203125, 0.30908203125, 0.421630859375, 0.5341796875, 0.646728515625, 0.75927734375, 0.871826171875, 0.984375, 1.096923828125, 1.20947265625, 1.322021484375, 1.4345703125, 1.547119140625, 1.65966796875, 1.772216796875, 1.884765625, 1.997314453125, 2.10986328125, 2.222412109375, 2.3349609375, 2.447509765625, 2.56005859375, 2.672607421875, 2.78515625, 2.897705078125, 3.01025390625, 3.122802734375, 3.2353515625, 3.347900390625, 3.46044921875, 3.572998046875, 3.685546875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 14.0, 10.0, 20.0, 29.0, 48.0, 55.0, 93.0, 150.0, 221.0, 351.0, 510.0, 754.0, 1189.0, 1825.0, 2855.0, 4408.0, 6719.0, 10331.0, 15579.0, 22969.0, 33695.0, 48038.0, 65979.0, 86969.0, 106320.0, 119195.0, 118269.0, 105249.0, 84841.0, 64879.0, 47345.0, 33085.0, 22653.0, 15036.0, 10122.0, 6498.0, 4296.0, 2802.0, 1804.0, 1173.0, 761.0, 478.0, 302.0, 227.0, 123.0, 114.0, 61.0, 46.0, 27.0, 20.0, 12.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.505859375, -0.48952484130859375, -0.4731903076171875, -0.45685577392578125, -0.440521240234375, -0.42418670654296875, -0.4078521728515625, -0.39151763916015625, -0.37518310546875, -0.35884857177734375, -0.3425140380859375, -0.32617950439453125, -0.309844970703125, -0.29351043701171875, -0.2771759033203125, -0.26084136962890625, -0.2445068359375, -0.22817230224609375, -0.2118377685546875, -0.19550323486328125, -0.179168701171875, -0.16283416748046875, -0.1464996337890625, -0.13016510009765625, -0.11383056640625, -0.09749603271484375, -0.0811614990234375, -0.06482696533203125, -0.048492431640625, -0.03215789794921875, -0.0158233642578125, 0.00051116943359375, 0.016845703125, 0.03318023681640625, 0.0495147705078125, 0.06584930419921875, 0.082183837890625, 0.09851837158203125, 0.1148529052734375, 0.13118743896484375, 0.14752197265625, 0.16385650634765625, 0.1801910400390625, 0.19652557373046875, 0.212860107421875, 0.22919464111328125, 0.2455291748046875, 0.26186370849609375, 0.2781982421875, 0.29453277587890625, 0.3108673095703125, 0.32720184326171875, 0.343536376953125, 0.35987091064453125, 0.3762054443359375, 0.39253997802734375, 0.40887451171875, 0.42520904541015625, 0.4415435791015625, 0.45787811279296875, 0.474212646484375, 0.49054718017578125, 0.5068817138671875, 0.5232162475585938, 0.53955078125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 7.0, 11.0, 6.0, 20.0, 17.0, 19.0, 18.0, 27.0, 37.0, 40.0, 28.0, 50.0, 27.0, 42.0, 46.0, 54.0, 50.0, 1060.0, 48.0, 44.0, 48.0, 44.0, 37.0, 34.0, 36.0, 33.0, 20.0, 25.0, 14.0, 22.0, 8.0, 14.0, 10.0, 3.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.287109375, -3.181915283203125, -3.07672119140625, -2.971527099609375, -2.8663330078125, -2.761138916015625, -2.65594482421875, -2.550750732421875, -2.445556640625, -2.340362548828125, -2.23516845703125, -2.129974365234375, -2.0247802734375, -1.919586181640625, -1.81439208984375, -1.709197998046875, -1.60400390625, -1.498809814453125, -1.39361572265625, -1.288421630859375, -1.1832275390625, -1.078033447265625, -0.97283935546875, -0.867645263671875, -0.762451171875, -0.657257080078125, -0.55206298828125, -0.446868896484375, -0.3416748046875, -0.236480712890625, -0.13128662109375, -0.026092529296875, 0.0791015625, 0.184295654296875, 0.28948974609375, 0.394683837890625, 0.4998779296875, 0.605072021484375, 0.71026611328125, 0.815460205078125, 0.920654296875, 1.025848388671875, 1.13104248046875, 1.236236572265625, 1.3414306640625, 1.446624755859375, 1.55181884765625, 1.657012939453125, 1.76220703125, 1.867401123046875, 1.97259521484375, 2.077789306640625, 2.1829833984375, 2.288177490234375, 2.39337158203125, 2.498565673828125, 2.603759765625, 2.708953857421875, 2.81414794921875, 2.919342041015625, 3.0245361328125, 3.129730224609375, 3.23492431640625, 3.340118408203125, 3.4453125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 10.0, 14.0, 12.0, 15.0, 18.0, 34.0, 52.0, 71.0, 85.0, 160.0, 182.0, 277.0, 403.0, 600.0, 800.0, 1214.0, 1710.0, 2507.0, 3511.0, 4941.0, 7261.0, 10585.0, 15990.0, 25149.0, 45352.0, 1871149.0, 37132.0, 22202.0, 14347.0, 9659.0, 6613.0, 4627.0, 3194.0, 2160.0, 1568.0, 1049.0, 742.0, 550.0, 337.0, 247.0, 166.0, 125.0, 94.0, 62.0, 52.0, 35.0, 28.0, 10.0, 11.0, 10.0, 4.0, 7.0, 0.0, 1.0, 4.0, 1.0, 2.0], "bins": [-1.173828125, -1.1375732421875, -1.101318359375, -1.0650634765625, -1.02880859375, -0.9925537109375, -0.956298828125, -0.9200439453125, -0.8837890625, -0.8475341796875, -0.811279296875, -0.7750244140625, -0.73876953125, -0.7025146484375, -0.666259765625, -0.6300048828125, -0.59375, -0.5574951171875, -0.521240234375, -0.4849853515625, -0.44873046875, -0.4124755859375, -0.376220703125, -0.3399658203125, -0.3037109375, -0.2674560546875, -0.231201171875, -0.1949462890625, -0.15869140625, -0.1224365234375, -0.086181640625, -0.0499267578125, -0.013671875, 0.0225830078125, 0.058837890625, 0.0950927734375, 0.13134765625, 0.1676025390625, 0.203857421875, 0.2401123046875, 0.2763671875, 0.3126220703125, 0.348876953125, 0.3851318359375, 0.42138671875, 0.4576416015625, 0.493896484375, 0.5301513671875, 0.56640625, 0.6026611328125, 0.638916015625, 0.6751708984375, 0.71142578125, 0.7476806640625, 0.783935546875, 0.8201904296875, 0.8564453125, 0.8927001953125, 0.928955078125, 0.9652099609375, 1.00146484375, 1.0377197265625, 1.073974609375, 1.1102294921875, 1.146484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 4.0, 2.0, 4.0, 7.0, 7.0, 18.0, 15.0, 17.0, 19.0, 28.0, 35.0, 53.0, 52.0, 47.0, 57.0, 68.0, 91.0, 84.0, 47.0, 59.0, 45.0, 35.0, 44.0, 29.0, 18.0, 22.0, 18.0, 12.0, 9.0, 13.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0229339599609375, -0.022204160690307617, -0.021474361419677734, -0.02074456214904785, -0.02001476287841797, -0.019284963607788086, -0.018555164337158203, -0.01782536506652832, -0.017095565795898438, -0.016365766525268555, -0.015635967254638672, -0.014906167984008789, -0.014176368713378906, -0.013446569442749023, -0.01271677017211914, -0.011986970901489258, -0.011257171630859375, -0.010527372360229492, -0.00979757308959961, -0.009067773818969727, -0.008337974548339844, -0.007608175277709961, -0.006878376007080078, -0.006148576736450195, -0.0054187774658203125, -0.00468897819519043, -0.003959178924560547, -0.003229379653930664, -0.0024995803833007812, -0.0017697811126708984, -0.0010399818420410156, -0.0003101825714111328, 0.00041961669921875, 0.0011494159698486328, 0.0018792152404785156, 0.0026090145111083984, 0.0033388137817382812, 0.004068613052368164, 0.004798412322998047, 0.00552821159362793, 0.0062580108642578125, 0.006987810134887695, 0.007717609405517578, 0.008447408676147461, 0.009177207946777344, 0.009907007217407227, 0.01063680648803711, 0.011366605758666992, 0.012096405029296875, 0.012826204299926758, 0.01355600357055664, 0.014285802841186523, 0.015015602111816406, 0.01574540138244629, 0.016475200653076172, 0.017204999923706055, 0.017934799194335938, 0.01866459846496582, 0.019394397735595703, 0.020124197006225586, 0.02085399627685547, 0.02158379554748535, 0.022313594818115234, 0.023043394088745117, 0.023773193359375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 17.0, 13.0, 18.0, 31.0, 50.0, 59.0, 84.0, 124.0, 197.0, 387.0, 983.0, 186525.0, 857560.0, 1350.0, 455.0, 263.0, 118.0, 89.0, 58.0, 26.0, 39.0, 19.0, 16.0, 10.0, 8.0, 6.0, 1.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53759765625, -0.5208511352539062, -0.5041046142578125, -0.48735809326171875, -0.470611572265625, -0.45386505126953125, -0.4371185302734375, -0.42037200927734375, -0.40362548828125, -0.38687896728515625, -0.3701324462890625, -0.35338592529296875, -0.336639404296875, -0.31989288330078125, -0.3031463623046875, -0.28639984130859375, -0.2696533203125, -0.25290679931640625, -0.2361602783203125, -0.21941375732421875, -0.202667236328125, -0.18592071533203125, -0.1691741943359375, -0.15242767333984375, -0.13568115234375, -0.11893463134765625, -0.1021881103515625, -0.08544158935546875, -0.068695068359375, -0.05194854736328125, -0.0352020263671875, -0.01845550537109375, -0.001708984375, 0.01503753662109375, 0.0317840576171875, 0.04853057861328125, 0.065277099609375, 0.08202362060546875, 0.0987701416015625, 0.11551666259765625, 0.13226318359375, 0.14900970458984375, 0.1657562255859375, 0.18250274658203125, 0.199249267578125, 0.21599578857421875, 0.2327423095703125, 0.24948883056640625, 0.2662353515625, 0.28298187255859375, 0.2997283935546875, 0.31647491455078125, 0.333221435546875, 0.34996795654296875, 0.3667144775390625, 0.38346099853515625, 0.40020751953125, 0.41695404052734375, 0.4337005615234375, 0.45044708251953125, 0.467193603515625, 0.48394012451171875, 0.5006866455078125, 0.5174331665039062, 0.5341796875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 22.0, 448.0, 539.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3671473562717438, -0.354936808347702, -0.3427262604236603, -0.33051571249961853, -0.3183051645755768, -0.30609461665153503, -0.2938840389251709, -0.28167349100112915, -0.2694629430770874, -0.25725239515304565, -0.2450418472290039, -0.23283129930496216, -0.2206207513809204, -0.20841020345687866, -0.19619964063167572, -0.18398909270763397, -0.17177855968475342, -0.15956801176071167, -0.14735746383666992, -0.13514691591262817, -0.12293636053800583, -0.11072581261396408, -0.09851525723934174, -0.08630470931529999, -0.07409416139125824, -0.06188361346721649, -0.049673061817884445, -0.0374625101685524, -0.02525196224451065, -0.013041414320468903, -0.0008308589458465576, 0.01137968897819519, 0.023590266704559326, 0.035800814628601074, 0.04801136627793312, 0.06022191792726517, 0.07243246585130692, 0.08464301377534866, 0.09685356914997101, 0.10906411707401276, 0.1212746649980545, 0.13348521292209625, 0.145695760846138, 0.15790632367134094, 0.1701168715953827, 0.18232741951942444, 0.1945379674434662, 0.20674851536750793, 0.21895906329154968, 0.23116961121559143, 0.24338015913963318, 0.2555907070636749, 0.2678012549877167, 0.2800118029117584, 0.29222238063812256, 0.3044329285621643, 0.31664347648620605, 0.3288540244102478, 0.34106457233428955, 0.3532751202583313, 0.36548566818237305, 0.3776962161064148, 0.38990676403045654, 0.4021173119544983, 0.41432785987854004]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 9.0, 14.0, 9.0, 13.0, 14.0, 20.0, 18.0, 28.0, 21.0, 30.0, 34.0, 32.0, 34.0, 38.0, 35.0, 44.0, 43.0, 39.0, 49.0, 49.0, 43.0, 45.0, 42.0, 33.0, 31.0, 22.0, 32.0, 24.0, 27.0, 15.0, 16.0, 15.0, 21.0, 8.0, 7.0, 9.0, 10.0, 4.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.036565184593200684, -0.035267576575279236, -0.03396996483206749, -0.03267235308885574, -0.031374745070934296, -0.0300771351903677, -0.0287795253098011, -0.027481915429234505, -0.026184305548667908, -0.02488669566810131, -0.023589085787534714, -0.022291475906968117, -0.02099386602640152, -0.019696256145834923, -0.018398646265268326, -0.01710103638470173, -0.015803426504135132, -0.014505816623568535, -0.013208206743001938, -0.011910596862435341, -0.010612986981868744, -0.009315377101302147, -0.00801776722073555, -0.006720157340168953, -0.005422547459602356, -0.004124937579035759, -0.002827327698469162, -0.001529717817902565, -0.00023210793733596802, 0.001065501943230629, 0.002363111823797226, 0.003660721704363823, 0.00495833158493042, 0.006255941465497017, 0.007553551346063614, 0.008851161226630211, 0.010148771107196808, 0.011446380987763405, 0.012743990868330002, 0.014041600748896599, 0.015339210629463196, 0.016636820510029793, 0.01793443039059639, 0.019232040271162987, 0.020529650151729584, 0.02182726003229618, 0.023124869912862778, 0.024422479793429375, 0.02572008967399597, 0.02701769955456257, 0.028315309435129166, 0.029612919315695763, 0.03091052919626236, 0.03220813721418381, 0.033505748957395554, 0.0348033607006073, 0.03610096871852875, 0.037398576736450195, 0.03869618847966194, 0.03999380022287369, 0.041291408240795135, 0.04258901625871658, 0.04388662800192833, 0.045184239745140076, 0.04648184776306152]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 8.0, 6.0, 7.0, 5.0, 9.0, 10.0, 6.0, 8.0, 10.0, 16.0, 11.0, 24.0, 25.0, 27.0, 33.0, 27.0, 38.0, 39.0, 31.0, 31.0, 40.0, 39.0, 47.0, 41.0, 49.0, 33.0, 33.0, 47.0, 32.0, 40.0, 26.0, 27.0, 30.0, 15.0, 19.0, 16.0, 15.0, 14.0, 12.0, 18.0, 6.0, 5.0, 8.0, 6.0, 6.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.38671875, -3.273590087890625, -3.16046142578125, -3.047332763671875, -2.9342041015625, -2.821075439453125, -2.70794677734375, -2.594818115234375, -2.481689453125, -2.368560791015625, -2.25543212890625, -2.142303466796875, -2.0291748046875, -1.916046142578125, -1.80291748046875, -1.689788818359375, -1.57666015625, -1.463531494140625, -1.35040283203125, -1.237274169921875, -1.1241455078125, -1.011016845703125, -0.89788818359375, -0.784759521484375, -0.671630859375, -0.558502197265625, -0.44537353515625, -0.332244873046875, -0.2191162109375, -0.105987548828125, 0.00714111328125, 0.120269775390625, 0.2333984375, 0.346527099609375, 0.45965576171875, 0.572784423828125, 0.6859130859375, 0.799041748046875, 0.91217041015625, 1.025299072265625, 1.138427734375, 1.251556396484375, 1.36468505859375, 1.477813720703125, 1.5909423828125, 1.704071044921875, 1.81719970703125, 1.930328369140625, 2.04345703125, 2.156585693359375, 2.26971435546875, 2.382843017578125, 2.4959716796875, 2.609100341796875, 2.72222900390625, 2.835357666015625, 2.948486328125, 3.061614990234375, 3.17474365234375, 3.287872314453125, 3.4010009765625, 3.514129638671875, 3.62725830078125, 3.740386962890625, 3.853515625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 8.0, 10.0, 12.0, 12.0, 11.0, 13.0, 19.0, 18.0, 22.0, 34.0, 43.0, 54.0, 79.0, 104.0, 213.0, 451.0, 914.0, 2163.0, 5027.0, 11674.0, 27205.0, 81387.0, 318950.0, 416613.0, 121464.0, 35636.0, 14621.0, 6566.0, 2742.0, 1195.0, 543.0, 240.0, 147.0, 100.0, 68.0, 45.0, 36.0, 16.0, 25.0, 11.0, 17.0, 13.0, 14.0, 7.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.13671875, -4.96630859375, -4.7958984375, -4.62548828125, -4.455078125, -4.28466796875, -4.1142578125, -3.94384765625, -3.7734375, -3.60302734375, -3.4326171875, -3.26220703125, -3.091796875, -2.92138671875, -2.7509765625, -2.58056640625, -2.41015625, -2.23974609375, -2.0693359375, -1.89892578125, -1.728515625, -1.55810546875, -1.3876953125, -1.21728515625, -1.046875, -0.87646484375, -0.7060546875, -0.53564453125, -0.365234375, -0.19482421875, -0.0244140625, 0.14599609375, 0.31640625, 0.48681640625, 0.6572265625, 0.82763671875, 0.998046875, 1.16845703125, 1.3388671875, 1.50927734375, 1.6796875, 1.85009765625, 2.0205078125, 2.19091796875, 2.361328125, 2.53173828125, 2.7021484375, 2.87255859375, 3.04296875, 3.21337890625, 3.3837890625, 3.55419921875, 3.724609375, 3.89501953125, 4.0654296875, 4.23583984375, 4.40625, 4.57666015625, 4.7470703125, 4.91748046875, 5.087890625, 5.25830078125, 5.4287109375, 5.59912109375, 5.76953125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 9.0, 3.0, 10.0, 15.0, 15.0, 19.0, 12.0, 21.0, 24.0, 28.0, 31.0, 35.0, 41.0, 42.0, 51.0, 60.0, 91.0, 161.0, 1374.0, 376.0, 139.0, 81.0, 59.0, 47.0, 53.0, 29.0, 47.0, 25.0, 26.0, 18.0, 21.0, 16.0, 9.0, 10.0, 7.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.7384033203125, -10.367431640625, -9.9964599609375, -9.62548828125, -9.2545166015625, -8.883544921875, -8.5125732421875, -8.1416015625, -7.7706298828125, -7.399658203125, -7.0286865234375, -6.65771484375, -6.2867431640625, -5.915771484375, -5.5447998046875, -5.173828125, -4.8028564453125, -4.431884765625, -4.0609130859375, -3.68994140625, -3.3189697265625, -2.947998046875, -2.5770263671875, -2.2060546875, -1.8350830078125, -1.464111328125, -1.0931396484375, -0.72216796875, -0.3511962890625, 0.019775390625, 0.3907470703125, 0.76171875, 1.1326904296875, 1.503662109375, 1.8746337890625, 2.24560546875, 2.6165771484375, 2.987548828125, 3.3585205078125, 3.7294921875, 4.1004638671875, 4.471435546875, 4.8424072265625, 5.21337890625, 5.5843505859375, 5.955322265625, 6.3262939453125, 6.697265625, 7.0682373046875, 7.439208984375, 7.8101806640625, 8.18115234375, 8.5521240234375, 8.923095703125, 9.2940673828125, 9.6650390625, 10.0360107421875, 10.406982421875, 10.7779541015625, 11.14892578125, 11.5198974609375, 11.890869140625, 12.2618408203125, 12.6328125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 10.0, 3.0, 9.0, 17.0, 11.0, 19.0, 20.0, 41.0, 43.0, 56.0, 82.0, 124.0, 181.0, 240.0, 505.0, 1493.0, 12170.0, 528748.0, 2564538.0, 33075.0, 2533.0, 700.0, 334.0, 185.0, 131.0, 88.0, 75.0, 56.0, 50.0, 27.0, 23.0, 23.0, 19.0, 15.0, 10.0, 8.0, 8.0, 6.0, 7.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.921875, -21.260986328125, -20.60009765625, -19.939208984375, -19.2783203125, -18.617431640625, -17.95654296875, -17.295654296875, -16.634765625, -15.973876953125, -15.31298828125, -14.652099609375, -13.9912109375, -13.330322265625, -12.66943359375, -12.008544921875, -11.34765625, -10.686767578125, -10.02587890625, -9.364990234375, -8.7041015625, -8.043212890625, -7.38232421875, -6.721435546875, -6.060546875, -5.399658203125, -4.73876953125, -4.077880859375, -3.4169921875, -2.756103515625, -2.09521484375, -1.434326171875, -0.7734375, -0.112548828125, 0.54833984375, 1.209228515625, 1.8701171875, 2.531005859375, 3.19189453125, 3.852783203125, 4.513671875, 5.174560546875, 5.83544921875, 6.496337890625, 7.1572265625, 7.818115234375, 8.47900390625, 9.139892578125, 9.80078125, 10.461669921875, 11.12255859375, 11.783447265625, 12.4443359375, 13.105224609375, 13.76611328125, 14.427001953125, 15.087890625, 15.748779296875, 16.40966796875, 17.070556640625, 17.7314453125, 18.392333984375, 19.05322265625, 19.714111328125, 20.375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 44.0, 139.0, 296.0, 331.0, 155.0, 36.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.0960807800293, -48.53443145751953, -46.972782135009766, -45.4111328125, -43.849483489990234, -42.28783416748047, -40.7261848449707, -39.16453552246094, -37.60288619995117, -36.041236877441406, -34.47958755493164, -32.917938232421875, -31.35628890991211, -29.794639587402344, -28.232990264892578, -26.671340942382812, -25.10969352722168, -23.548044204711914, -21.98639488220215, -20.424745559692383, -18.863096237182617, -17.30144691467285, -15.739798545837402, -14.178149223327637, -12.616499900817871, -11.054850578308105, -9.49320125579834, -7.931552410125732, -6.369903087615967, -4.808253765106201, -3.2466049194335938, -1.6849555969238281, -0.1233062744140625, 1.4383429288864136, 2.9999921321868896, 4.561641216278076, 6.123290538787842, 7.684939861297607, 9.246588706970215, 10.80823802947998, 12.369887351989746, 13.931536674499512, 15.493185997009277, 17.054834365844727, 18.616483688354492, 20.178133010864258, 21.739782333374023, 23.30143165588379, 24.863080978393555, 26.42473030090332, 27.986379623413086, 29.54802894592285, 31.109678268432617, 32.67132568359375, 34.232975006103516, 35.79462432861328, 37.35627365112305, 38.91792297363281, 40.47957229614258, 42.041221618652344, 43.60287094116211, 45.164520263671875, 46.72616958618164, 48.287818908691406, 49.84946823120117]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 10.0, 5.0, 11.0, 5.0, 13.0, 9.0, 16.0, 18.0, 16.0, 12.0, 22.0, 28.0, 28.0, 27.0, 29.0, 29.0, 34.0, 42.0, 32.0, 32.0, 35.0, 36.0, 40.0, 30.0, 31.0, 40.0, 35.0, 34.0, 29.0, 23.0, 22.0, 26.0, 22.0, 27.0, 28.0, 23.0, 13.0, 18.0, 11.0, 10.0, 13.0, 8.0, 2.0, 2.0, 7.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-26.464702606201172, -25.6445369720459, -24.824371337890625, -24.00420570373535, -23.184040069580078, -22.363872528076172, -21.5437068939209, -20.723541259765625, -19.90337562561035, -19.083209991455078, -18.263044357299805, -17.44287872314453, -16.622711181640625, -15.802546501159668, -14.982379913330078, -14.162214279174805, -13.342048645019531, -12.521883010864258, -11.701717376708984, -10.881550788879395, -10.061385154724121, -9.241219520568848, -8.421052932739258, -7.600887298583984, -6.780721664428711, -5.9605560302734375, -5.140389919281006, -4.320223808288574, -3.500058174133301, -2.6798925399780273, -1.8597264289855957, -1.039560317993164, -0.21939468383789062, 0.6007711887359619, 1.4209370613098145, 2.241102933883667, 3.0612688064575195, 3.881434440612793, 4.701600551605225, 5.521766662597656, 6.34193229675293, 7.162097930908203, 7.982264041900635, 8.802430152893066, 9.62259578704834, 10.442761421203613, 11.262928009033203, 12.083093643188477, 12.90325927734375, 13.723424911499023, 14.543590545654297, 15.363757133483887, 16.183921813964844, 17.00408935546875, 17.824254989624023, 18.644420623779297, 19.46458625793457, 20.284751892089844, 21.104917526245117, 21.92508316040039, 22.745250701904297, 23.565414428710938, 24.385581970214844, 25.205747604370117, 26.02591323852539]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 8.0, 6.0, 3.0, 8.0, 8.0, 8.0, 14.0, 9.0, 12.0, 15.0, 12.0, 31.0, 23.0, 20.0, 20.0, 38.0, 29.0, 36.0, 27.0, 42.0, 38.0, 33.0, 40.0, 53.0, 36.0, 46.0, 50.0, 38.0, 32.0, 31.0, 29.0, 26.0, 28.0, 20.0, 17.0, 18.0, 9.0, 18.0, 14.0, 12.0, 10.0, 8.0, 5.0, 9.0, 9.0, 1.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.6953125, -3.577850341796875, -3.46038818359375, -3.342926025390625, -3.2254638671875, -3.108001708984375, -2.99053955078125, -2.873077392578125, -2.755615234375, -2.638153076171875, -2.52069091796875, -2.403228759765625, -2.2857666015625, -2.168304443359375, -2.05084228515625, -1.933380126953125, -1.81591796875, -1.698455810546875, -1.58099365234375, -1.463531494140625, -1.3460693359375, -1.228607177734375, -1.11114501953125, -0.993682861328125, -0.876220703125, -0.758758544921875, -0.64129638671875, -0.523834228515625, -0.4063720703125, -0.288909912109375, -0.17144775390625, -0.053985595703125, 0.0634765625, 0.180938720703125, 0.29840087890625, 0.415863037109375, 0.5333251953125, 0.650787353515625, 0.76824951171875, 0.885711669921875, 1.003173828125, 1.120635986328125, 1.23809814453125, 1.355560302734375, 1.4730224609375, 1.590484619140625, 1.70794677734375, 1.825408935546875, 1.94287109375, 2.060333251953125, 2.17779541015625, 2.295257568359375, 2.4127197265625, 2.530181884765625, 2.64764404296875, 2.765106201171875, 2.882568359375, 3.000030517578125, 3.11749267578125, 3.234954833984375, 3.3524169921875, 3.469879150390625, 3.58734130859375, 3.704803466796875, 3.822265625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 5.0, 5.0, 8.0, 11.0, 14.0, 16.0, 21.0, 30.0, 27.0, 38.0, 49.0, 79.0, 138.0, 241.0, 418.0, 867.0, 2123.0, 6625.0, 26351.0, 128318.0, 653369.0, 1942140.0, 1129545.0, 240423.0, 46459.0, 10918.0, 3317.0, 1341.0, 598.0, 267.0, 167.0, 104.0, 53.0, 43.0, 35.0, 20.0, 17.0, 11.0, 10.0, 8.0, 7.0, 7.0, 6.0, 6.0, 4.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.1322021484375, -5.932373046875, -5.7325439453125, -5.53271484375, -5.3328857421875, -5.133056640625, -4.9332275390625, -4.7333984375, -4.5335693359375, -4.333740234375, -4.1339111328125, -3.93408203125, -3.7342529296875, -3.534423828125, -3.3345947265625, -3.134765625, -2.9349365234375, -2.735107421875, -2.5352783203125, -2.33544921875, -2.1356201171875, -1.935791015625, -1.7359619140625, -1.5361328125, -1.3363037109375, -1.136474609375, -0.9366455078125, -0.73681640625, -0.5369873046875, -0.337158203125, -0.1373291015625, 0.0625, 0.2623291015625, 0.462158203125, 0.6619873046875, 0.86181640625, 1.0616455078125, 1.261474609375, 1.4613037109375, 1.6611328125, 1.8609619140625, 2.060791015625, 2.2606201171875, 2.46044921875, 2.6602783203125, 2.860107421875, 3.0599365234375, 3.259765625, 3.4595947265625, 3.659423828125, 3.8592529296875, 4.05908203125, 4.2589111328125, 4.458740234375, 4.6585693359375, 4.8583984375, 5.0582275390625, 5.258056640625, 5.4578857421875, 5.65771484375, 5.8575439453125, 6.057373046875, 6.2572021484375, 6.45703125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 5.0, 7.0, 12.0, 13.0, 15.0, 33.0, 45.0, 56.0, 82.0, 89.0, 143.0, 146.0, 242.0, 283.0, 403.0, 382.0, 413.0, 357.0, 333.0, 263.0, 188.0, 135.0, 102.0, 71.0, 61.0, 46.0, 27.0, 24.0, 23.0, 18.0, 10.0, 11.0, 8.0, 3.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.92578125, -4.7374267578125, -4.549072265625, -4.3607177734375, -4.17236328125, -3.9840087890625, -3.795654296875, -3.6072998046875, -3.4189453125, -3.2305908203125, -3.042236328125, -2.8538818359375, -2.66552734375, -2.4771728515625, -2.288818359375, -2.1004638671875, -1.912109375, -1.7237548828125, -1.535400390625, -1.3470458984375, -1.15869140625, -0.9703369140625, -0.781982421875, -0.5936279296875, -0.4052734375, -0.2169189453125, -0.028564453125, 0.1597900390625, 0.34814453125, 0.5364990234375, 0.724853515625, 0.9132080078125, 1.1015625, 1.2899169921875, 1.478271484375, 1.6666259765625, 1.85498046875, 2.0433349609375, 2.231689453125, 2.4200439453125, 2.6083984375, 2.7967529296875, 2.985107421875, 3.1734619140625, 3.36181640625, 3.5501708984375, 3.738525390625, 3.9268798828125, 4.115234375, 4.3035888671875, 4.491943359375, 4.6802978515625, 4.86865234375, 5.0570068359375, 5.245361328125, 5.4337158203125, 5.6220703125, 5.8104248046875, 5.998779296875, 6.1871337890625, 6.37548828125, 6.5638427734375, 6.752197265625, 6.9405517578125, 7.12890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 9.0, 10.0, 12.0, 19.0, 31.0, 31.0, 40.0, 73.0, 91.0, 124.0, 212.0, 315.0, 563.0, 1079.0, 3414.0, 19040.0, 255896.0, 3102231.0, 759041.0, 43203.0, 5565.0, 1525.0, 619.0, 384.0, 254.0, 142.0, 107.0, 64.0, 67.0, 28.0, 23.0, 12.0, 15.0, 9.0, 4.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.953125, -16.4779052734375, -16.002685546875, -15.5274658203125, -15.05224609375, -14.5770263671875, -14.101806640625, -13.6265869140625, -13.1513671875, -12.6761474609375, -12.200927734375, -11.7257080078125, -11.25048828125, -10.7752685546875, -10.300048828125, -9.8248291015625, -9.349609375, -8.8743896484375, -8.399169921875, -7.9239501953125, -7.44873046875, -6.9735107421875, -6.498291015625, -6.0230712890625, -5.5478515625, -5.0726318359375, -4.597412109375, -4.1221923828125, -3.64697265625, -3.1717529296875, -2.696533203125, -2.2213134765625, -1.74609375, -1.2708740234375, -0.795654296875, -0.3204345703125, 0.15478515625, 0.6300048828125, 1.105224609375, 1.5804443359375, 2.0556640625, 2.5308837890625, 3.006103515625, 3.4813232421875, 3.95654296875, 4.4317626953125, 4.906982421875, 5.3822021484375, 5.857421875, 6.3326416015625, 6.807861328125, 7.2830810546875, 7.75830078125, 8.2335205078125, 8.708740234375, 9.1839599609375, 9.6591796875, 10.1343994140625, 10.609619140625, 11.0848388671875, 11.56005859375, 12.0352783203125, 12.510498046875, 12.9857177734375, 13.4609375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 14.0, 38.0, 50.0, 98.0, 116.0, 143.0, 182.0, 130.0, 103.0, 65.0, 37.0, 14.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.697566986083984, -48.42951965332031, -47.16147232055664, -45.89342498779297, -44.62538146972656, -43.35733413696289, -42.08928680419922, -40.82123947143555, -39.553192138671875, -38.2851448059082, -37.01709747314453, -35.74905014038086, -34.48100280761719, -33.21295928955078, -31.94491195678711, -30.676864624023438, -29.408817291259766, -28.140769958496094, -26.872722625732422, -25.604677200317383, -24.33662986755371, -23.06858253479004, -21.800537109375, -20.532489776611328, -19.264442443847656, -17.996395111083984, -16.728347778320312, -15.460302352905273, -14.192255020141602, -12.92420768737793, -11.656161308288574, -10.388114929199219, -9.120067596435547, -7.852020740509033, -6.5839738845825195, -5.315927028656006, -4.047880172729492, -2.7798333168029785, -1.5117864608764648, -0.24374008178710938, 1.0243072509765625, 2.292354106903076, 3.56040096282959, 4.8284478187561035, 6.096494674682617, 7.364541530609131, 8.632588386535645, 9.900634765625, 11.168682098388672, 12.436729431152344, 13.7047758102417, 14.972822189331055, 16.240869522094727, 17.5089168548584, 18.776962280273438, 20.04500961303711, 21.31305694580078, 22.581104278564453, 23.849151611328125, 25.117197036743164, 26.385244369506836, 27.653291702270508, 28.921337127685547, 30.18938446044922, 31.45743179321289]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 8.0, 11.0, 15.0, 9.0, 13.0, 9.0, 17.0, 15.0, 26.0, 29.0, 27.0, 29.0, 43.0, 49.0, 36.0, 41.0, 51.0, 37.0, 48.0, 51.0, 37.0, 57.0, 47.0, 40.0, 43.0, 23.0, 35.0, 24.0, 18.0, 15.0, 22.0, 17.0, 17.0, 5.0, 8.0, 9.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.754226684570312, -21.04230499267578, -20.330385208129883, -19.61846351623535, -18.90654182434082, -18.194622039794922, -17.48270034790039, -16.77077865600586, -16.058856964111328, -15.346936225891113, -14.635014533996582, -13.923093795776367, -13.211172103881836, -12.499251365661621, -11.787330627441406, -11.075408935546875, -10.363489151000977, -9.651568412780762, -8.93964672088623, -8.227725982666016, -7.515804767608643, -6.8038835525512695, -6.091962814331055, -5.380041599273682, -4.668120384216309, -3.9561991691589355, -3.2442781925201416, -2.5323572158813477, -1.8204360008239746, -1.1085147857666016, -0.3965940475463867, 0.31532716751098633, 1.0272464752197266, 1.73916757106781, 2.4510886669158936, 3.1630096435546875, 3.8749308586120605, 4.586852073669434, 5.298772811889648, 6.0106940269470215, 6.7226152420043945, 7.434536457061768, 8.14645767211914, 8.858378410339355, 9.57029914855957, 10.282220840454102, 10.994141578674316, 11.706062316894531, 12.417984008789062, 13.129904747009277, 13.841826438903809, 14.553747177124023, 15.265668869018555, 15.97758960723877, 16.689510345458984, 17.401432037353516, 18.113353729248047, 18.825275421142578, 19.537195205688477, 20.249116897583008, 20.96103858947754, 21.672958374023438, 22.38488006591797, 23.0968017578125, 23.8087215423584]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 9.0, 6.0, 7.0, 13.0, 14.0, 11.0, 17.0, 20.0, 16.0, 20.0, 28.0, 24.0, 36.0, 32.0, 34.0, 42.0, 40.0, 35.0, 46.0, 34.0, 55.0, 45.0, 41.0, 41.0, 44.0, 36.0, 34.0, 33.0, 41.0, 28.0, 21.0, 18.0, 17.0, 13.0, 8.0, 17.0, 11.0, 5.0, 2.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.9693603515625, -3.837158203125, -3.7049560546875, -3.57275390625, -3.4405517578125, -3.308349609375, -3.1761474609375, -3.0439453125, -2.9117431640625, -2.779541015625, -2.6473388671875, -2.51513671875, -2.3829345703125, -2.250732421875, -2.1185302734375, -1.986328125, -1.8541259765625, -1.721923828125, -1.5897216796875, -1.45751953125, -1.3253173828125, -1.193115234375, -1.0609130859375, -0.9287109375, -0.7965087890625, -0.664306640625, -0.5321044921875, -0.39990234375, -0.2677001953125, -0.135498046875, -0.0032958984375, 0.12890625, 0.2611083984375, 0.393310546875, 0.5255126953125, 0.65771484375, 0.7899169921875, 0.922119140625, 1.0543212890625, 1.1865234375, 1.3187255859375, 1.450927734375, 1.5831298828125, 1.71533203125, 1.8475341796875, 1.979736328125, 2.1119384765625, 2.244140625, 2.3763427734375, 2.508544921875, 2.6407470703125, 2.77294921875, 2.9051513671875, 3.037353515625, 3.1695556640625, 3.3017578125, 3.4339599609375, 3.566162109375, 3.6983642578125, 3.83056640625, 3.9627685546875, 4.094970703125, 4.2271728515625, 4.359375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 5.0, 4.0, 9.0, 11.0, 24.0, 28.0, 54.0, 78.0, 134.0, 214.0, 296.0, 403.0, 679.0, 991.0, 1514.0, 2259.0, 3221.0, 4822.0, 7117.0, 10306.0, 14718.0, 21127.0, 30245.0, 41724.0, 56488.0, 74097.0, 91282.0, 106032.0, 111224.0, 105800.0, 91603.0, 74591.0, 56954.0, 41876.0, 30112.0, 21512.0, 14994.0, 10185.0, 7154.0, 4907.0, 3338.0, 2148.0, 1473.0, 927.0, 640.0, 443.0, 281.0, 193.0, 131.0, 74.0, 52.0, 27.0, 16.0, 12.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.468505859375, -0.45363616943359375, -0.4387664794921875, -0.42389678955078125, -0.409027099609375, -0.39415740966796875, -0.3792877197265625, -0.36441802978515625, -0.34954833984375, -0.33467864990234375, -0.3198089599609375, -0.30493927001953125, -0.290069580078125, -0.27519989013671875, -0.2603302001953125, -0.24546051025390625, -0.2305908203125, -0.21572113037109375, -0.2008514404296875, -0.18598175048828125, -0.171112060546875, -0.15624237060546875, -0.1413726806640625, -0.12650299072265625, -0.11163330078125, -0.09676361083984375, -0.0818939208984375, -0.06702423095703125, -0.052154541015625, -0.03728485107421875, -0.0224151611328125, -0.00754547119140625, 0.00732421875, 0.02219390869140625, 0.0370635986328125, 0.05193328857421875, 0.066802978515625, 0.08167266845703125, 0.0965423583984375, 0.11141204833984375, 0.12628173828125, 0.14115142822265625, 0.1560211181640625, 0.17089080810546875, 0.185760498046875, 0.20063018798828125, 0.2154998779296875, 0.23036956787109375, 0.2452392578125, 0.26010894775390625, 0.2749786376953125, 0.28984832763671875, 0.304718017578125, 0.31958770751953125, 0.3344573974609375, 0.34932708740234375, 0.36419677734375, 0.37906646728515625, 0.3939361572265625, 0.40880584716796875, 0.423675537109375, 0.43854522705078125, 0.4534149169921875, 0.46828460693359375, 0.483154296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 5.0, 11.0, 13.0, 6.0, 12.0, 15.0, 8.0, 11.0, 22.0, 18.0, 31.0, 18.0, 34.0, 32.0, 27.0, 41.0, 46.0, 39.0, 57.0, 41.0, 1055.0, 37.0, 46.0, 36.0, 44.0, 33.0, 41.0, 32.0, 22.0, 28.0, 21.0, 20.0, 14.0, 16.0, 17.0, 12.0, 16.0, 12.0, 8.0, 3.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-3.021484375, -2.9332275390625, -2.844970703125, -2.7567138671875, -2.66845703125, -2.5802001953125, -2.491943359375, -2.4036865234375, -2.3154296875, -2.2271728515625, -2.138916015625, -2.0506591796875, -1.96240234375, -1.8741455078125, -1.785888671875, -1.6976318359375, -1.609375, -1.5211181640625, -1.432861328125, -1.3446044921875, -1.25634765625, -1.1680908203125, -1.079833984375, -0.9915771484375, -0.9033203125, -0.8150634765625, -0.726806640625, -0.6385498046875, -0.55029296875, -0.4620361328125, -0.373779296875, -0.2855224609375, -0.197265625, -0.1090087890625, -0.020751953125, 0.0675048828125, 0.15576171875, 0.2440185546875, 0.332275390625, 0.4205322265625, 0.5087890625, 0.5970458984375, 0.685302734375, 0.7735595703125, 0.86181640625, 0.9500732421875, 1.038330078125, 1.1265869140625, 1.21484375, 1.3031005859375, 1.391357421875, 1.4796142578125, 1.56787109375, 1.6561279296875, 1.744384765625, 1.8326416015625, 1.9208984375, 2.0091552734375, 2.097412109375, 2.1856689453125, 2.27392578125, 2.3621826171875, 2.450439453125, 2.5386962890625, 2.626953125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 9.0, 14.0, 14.0, 17.0, 30.0, 37.0, 64.0, 69.0, 95.0, 154.0, 211.0, 312.0, 452.0, 618.0, 853.0, 1259.0, 1811.0, 2570.0, 3737.0, 5446.0, 7751.0, 11568.0, 17855.0, 28100.0, 78681.0, 1840284.0, 32838.0, 20387.0, 13230.0, 8773.0, 6022.0, 4186.0, 2956.0, 2080.0, 1373.0, 914.0, 682.0, 447.0, 348.0, 261.0, 199.0, 123.0, 83.0, 70.0, 40.0, 37.0, 25.0, 26.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-1.107421875, -1.0729827880859375, -1.038543701171875, -1.0041046142578125, -0.96966552734375, -0.9352264404296875, -0.900787353515625, -0.8663482666015625, -0.8319091796875, -0.7974700927734375, -0.763031005859375, -0.7285919189453125, -0.69415283203125, -0.6597137451171875, -0.625274658203125, -0.5908355712890625, -0.556396484375, -0.5219573974609375, -0.487518310546875, -0.4530792236328125, -0.41864013671875, -0.3842010498046875, -0.349761962890625, -0.3153228759765625, -0.2808837890625, -0.2464447021484375, -0.212005615234375, -0.1775665283203125, -0.14312744140625, -0.1086883544921875, -0.074249267578125, -0.0398101806640625, -0.00537109375, 0.0290679931640625, 0.063507080078125, 0.0979461669921875, 0.13238525390625, 0.1668243408203125, 0.201263427734375, 0.2357025146484375, 0.2701416015625, 0.3045806884765625, 0.339019775390625, 0.3734588623046875, 0.40789794921875, 0.4423370361328125, 0.476776123046875, 0.5112152099609375, 0.545654296875, 0.5800933837890625, 0.614532470703125, 0.6489715576171875, 0.68341064453125, 0.7178497314453125, 0.752288818359375, 0.7867279052734375, 0.8211669921875, 0.8556060791015625, 0.890045166015625, 0.9244842529296875, 0.95892333984375, 0.9933624267578125, 1.027801513671875, 1.0622406005859375, 1.0966796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 4.0, 9.0, 14.0, 13.0, 15.0, 23.0, 21.0, 43.0, 33.0, 50.0, 61.0, 80.0, 84.0, 68.0, 76.0, 60.0, 60.0, 61.0, 39.0, 36.0, 22.0, 25.0, 21.0, 15.0, 10.0, 11.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01861572265625, -0.01795029640197754, -0.017284870147705078, -0.016619443893432617, -0.015954017639160156, -0.015288591384887695, -0.014623165130615234, -0.013957738876342773, -0.013292312622070312, -0.012626886367797852, -0.01196146011352539, -0.01129603385925293, -0.010630607604980469, -0.009965181350708008, -0.009299755096435547, -0.008634328842163086, -0.007968902587890625, -0.007303476333618164, -0.006638050079345703, -0.005972623825073242, -0.005307197570800781, -0.00464177131652832, -0.003976345062255859, -0.0033109188079833984, -0.0026454925537109375, -0.0019800662994384766, -0.0013146400451660156, -0.0006492137908935547, 1.621246337890625e-05, 0.0006816387176513672, 0.0013470649719238281, 0.002012491226196289, 0.00267791748046875, 0.003343343734741211, 0.004008769989013672, 0.004674196243286133, 0.005339622497558594, 0.006005048751831055, 0.006670475006103516, 0.0073359012603759766, 0.008001327514648438, 0.008666753768920898, 0.00933218002319336, 0.00999760627746582, 0.010663032531738281, 0.011328458786010742, 0.011993885040283203, 0.012659311294555664, 0.013324737548828125, 0.013990163803100586, 0.014655590057373047, 0.015321016311645508, 0.01598644256591797, 0.01665186882019043, 0.01731729507446289, 0.01798272132873535, 0.018648147583007812, 0.019313573837280273, 0.019979000091552734, 0.020644426345825195, 0.021309852600097656, 0.021975278854370117, 0.022640705108642578, 0.02330613136291504, 0.0239715576171875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 7.0, 6.0, 21.0, 19.0, 18.0, 15.0, 47.0, 55.0, 73.0, 82.0, 182.0, 307.0, 690.0, 15136.0, 1024885.0, 5572.0, 612.0, 248.0, 178.0, 104.0, 82.0, 46.0, 30.0, 26.0, 26.0, 14.0, 10.0, 14.0, 12.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.46484375, -0.4513359069824219, -0.43782806396484375, -0.4243202209472656, -0.4108123779296875, -0.3973045349121094, -0.38379669189453125, -0.3702888488769531, -0.356781005859375, -0.3432731628417969, -0.32976531982421875, -0.3162574768066406, -0.3027496337890625, -0.2892417907714844, -0.27573394775390625, -0.2622261047363281, -0.24871826171875, -0.23521041870117188, -0.22170257568359375, -0.20819473266601562, -0.1946868896484375, -0.18117904663085938, -0.16767120361328125, -0.15416336059570312, -0.140655517578125, -0.12714767456054688, -0.11363983154296875, -0.10013198852539062, -0.0866241455078125, -0.07311630249023438, -0.05960845947265625, -0.046100616455078125, -0.0325927734375, -0.019084930419921875, -0.00557708740234375, 0.007930755615234375, 0.0214385986328125, 0.034946441650390625, 0.04845428466796875, 0.061962127685546875, 0.075469970703125, 0.08897781372070312, 0.10248565673828125, 0.11599349975585938, 0.1295013427734375, 0.14300918579101562, 0.15651702880859375, 0.17002487182617188, 0.18353271484375, 0.19704055786132812, 0.21054840087890625, 0.22405624389648438, 0.2375640869140625, 0.2510719299316406, 0.26457977294921875, 0.2780876159667969, 0.291595458984375, 0.3051033020019531, 0.31861114501953125, 0.3321189880371094, 0.3456268310546875, 0.3591346740722656, 0.37264251708984375, 0.3861503601074219, 0.399658203125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 88.0, 637.0, 262.0, 21.0, 4.0], "bins": [-0.3025161623954773, -0.2975352108478546, -0.29255425930023193, -0.28757330775260925, -0.2825923562049866, -0.2776114046573639, -0.2726304531097412, -0.2676495313644409, -0.26266857981681824, -0.25768762826919556, -0.2527066767215729, -0.2477257251739502, -0.2427447885274887, -0.23776383697986603, -0.23278288543224335, -0.22780193388462067, -0.2228209674358368, -0.2178400158882141, -0.21285906434059143, -0.20787811279296875, -0.20289717614650726, -0.19791622459888458, -0.1929352730512619, -0.18795432150363922, -0.18297338485717773, -0.17799243330955505, -0.17301148176193237, -0.1680305302143097, -0.1630495935678482, -0.15806864202022552, -0.15308769047260284, -0.14810673892498016, -0.14312578737735748, -0.1381448358297348, -0.13316388428211212, -0.12818294763565063, -0.12320198863744736, -0.11822104454040527, -0.11324009299278259, -0.10825914144515991, -0.10327819734811783, -0.09829724580049515, -0.09331630170345306, -0.08833535015583038, -0.0833543986082077, -0.07837344706058502, -0.07339250296354294, -0.06841155141592026, -0.06343059986829758, -0.058449652045965195, -0.053468700498342514, -0.04848775267601013, -0.04350680112838745, -0.03852585330605507, -0.03354490548372269, -0.028563953936100006, -0.023583007976412773, -0.01860205829143524, -0.013621109537780285, -0.008640160784125328, -0.0036592110991477966, 0.0013217385858297348, 0.006302686408162117, 0.011283637955784798, 0.01626458577811718]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 5.0, 5.0, 9.0, 12.0, 12.0, 17.0, 19.0, 17.0, 14.0, 13.0, 21.0, 22.0, 30.0, 38.0, 31.0, 28.0, 31.0, 28.0, 48.0, 35.0, 33.0, 44.0, 50.0, 28.0, 36.0, 44.0, 30.0, 37.0, 35.0, 25.0, 24.0, 21.0, 20.0, 19.0, 16.0, 10.0, 11.0, 7.0, 11.0, 10.0, 10.0, 11.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.01986372470855713, -0.019267667084932327, -0.018671607598662376, -0.018075548112392426, -0.017479490488767624, -0.016883432865142822, -0.01628737337887287, -0.01569131389260292, -0.015095256268978119, -0.014499197714030743, -0.013903139159083366, -0.01330708060413599, -0.012711022049188614, -0.012114963494241238, -0.011518904939293861, -0.010922846384346485, -0.010326787829399109, -0.009730729274451733, -0.009134670719504356, -0.00853861216455698, -0.007942553609609604, -0.007346495054662228, -0.006750436499714851, -0.006154377944767475, -0.005558319389820099, -0.004962260834872723, -0.004366202279925346, -0.00377014372497797, -0.003174085170030594, -0.0025780266150832176, -0.0019819680601358414, -0.0013859095051884651, -0.0007898509502410889, -0.00019379239529371262, 0.00040226615965366364, 0.0009983247146010399, 0.0015943832695484161, 0.0021904418244957924, 0.0027865003794431686, 0.003382558934390545, 0.003978617489337921, 0.004574676044285297, 0.005170734599232674, 0.00576679315418005, 0.006362851709127426, 0.006958910264074802, 0.007554968819022179, 0.008151027373969555, 0.008747085928916931, 0.009343144483864307, 0.009939203038811684, 0.01053526159375906, 0.011131320148706436, 0.011727378703653812, 0.012323437258601189, 0.012919495813548565, 0.013515554368495941, 0.014111612923443317, 0.014707671478390694, 0.01530373003333807, 0.015899788588285446, 0.016495846211910248, 0.0170919056981802, 0.01768796518445015, 0.01828402280807495]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 12.0, 16.0, 16.0, 18.0, 15.0, 19.0, 22.0, 21.0, 30.0, 32.0, 38.0, 33.0, 39.0, 39.0, 54.0, 32.0, 47.0, 38.0, 50.0, 38.0, 54.0, 35.0, 37.0, 25.0, 26.0, 29.0, 25.0, 22.0, 28.0, 14.0, 16.0, 11.0, 10.0, 5.0, 5.0, 5.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.2421875, -4.11578369140625, -3.9893798828125, -3.86297607421875, -3.736572265625, -3.61016845703125, -3.4837646484375, -3.35736083984375, -3.23095703125, -3.10455322265625, -2.9781494140625, -2.85174560546875, -2.725341796875, -2.59893798828125, -2.4725341796875, -2.34613037109375, -2.2197265625, -2.09332275390625, -1.9669189453125, -1.84051513671875, -1.714111328125, -1.58770751953125, -1.4613037109375, -1.33489990234375, -1.20849609375, -1.08209228515625, -0.9556884765625, -0.82928466796875, -0.702880859375, -0.57647705078125, -0.4500732421875, -0.32366943359375, -0.197265625, -0.07086181640625, 0.0555419921875, 0.18194580078125, 0.308349609375, 0.43475341796875, 0.5611572265625, 0.68756103515625, 0.81396484375, 0.94036865234375, 1.0667724609375, 1.19317626953125, 1.319580078125, 1.44598388671875, 1.5723876953125, 1.69879150390625, 1.8251953125, 1.95159912109375, 2.0780029296875, 2.20440673828125, 2.330810546875, 2.45721435546875, 2.5836181640625, 2.71002197265625, 2.83642578125, 2.96282958984375, 3.0892333984375, 3.21563720703125, 3.342041015625, 3.46844482421875, 3.5948486328125, 3.72125244140625, 3.84765625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 8.0, 15.0, 16.0, 31.0, 36.0, 39.0, 42.0, 66.0, 93.0, 109.0, 188.0, 281.0, 459.0, 932.0, 1740.0, 3732.0, 8295.0, 19460.0, 53161.0, 262866.0, 549208.0, 95259.0, 29809.0, 12015.0, 5223.0, 2424.0, 1229.0, 662.0, 395.0, 214.0, 122.0, 110.0, 65.0, 53.0, 43.0, 25.0, 25.0, 23.0, 18.0, 9.0, 13.0, 8.0, 3.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.04693603515625, -6.8282470703125, -6.60955810546875, -6.390869140625, -6.17218017578125, -5.9534912109375, -5.73480224609375, -5.51611328125, -5.29742431640625, -5.0787353515625, -4.86004638671875, -4.641357421875, -4.42266845703125, -4.2039794921875, -3.98529052734375, -3.7666015625, -3.54791259765625, -3.3292236328125, -3.11053466796875, -2.891845703125, -2.67315673828125, -2.4544677734375, -2.23577880859375, -2.01708984375, -1.79840087890625, -1.5797119140625, -1.36102294921875, -1.142333984375, -0.92364501953125, -0.7049560546875, -0.48626708984375, -0.267578125, -0.04888916015625, 0.1697998046875, 0.38848876953125, 0.607177734375, 0.82586669921875, 1.0445556640625, 1.26324462890625, 1.48193359375, 1.70062255859375, 1.9193115234375, 2.13800048828125, 2.356689453125, 2.57537841796875, 2.7940673828125, 3.01275634765625, 3.2314453125, 3.45013427734375, 3.6688232421875, 3.88751220703125, 4.106201171875, 4.32489013671875, 4.5435791015625, 4.76226806640625, 4.98095703125, 5.19964599609375, 5.4183349609375, 5.63702392578125, 5.855712890625, 6.07440185546875, 6.2930908203125, 6.51177978515625, 6.73046875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 5.0, 4.0, 12.0, 12.0, 19.0, 7.0, 17.0, 11.0, 20.0, 29.0, 21.0, 27.0, 36.0, 32.0, 50.0, 47.0, 61.0, 79.0, 144.0, 316.0, 1432.0, 168.0, 79.0, 43.0, 47.0, 48.0, 28.0, 34.0, 29.0, 31.0, 23.0, 28.0, 17.0, 18.0, 16.0, 14.0, 9.0, 4.0, 9.0, 4.0, 3.0, 5.0, 5.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-12.1875, -11.8409423828125, -11.494384765625, -11.1478271484375, -10.80126953125, -10.4547119140625, -10.108154296875, -9.7615966796875, -9.4150390625, -9.0684814453125, -8.721923828125, -8.3753662109375, -8.02880859375, -7.6822509765625, -7.335693359375, -6.9891357421875, -6.642578125, -6.2960205078125, -5.949462890625, -5.6029052734375, -5.25634765625, -4.9097900390625, -4.563232421875, -4.2166748046875, -3.8701171875, -3.5235595703125, -3.177001953125, -2.8304443359375, -2.48388671875, -2.1373291015625, -1.790771484375, -1.4442138671875, -1.09765625, -0.7510986328125, -0.404541015625, -0.0579833984375, 0.28857421875, 0.6351318359375, 0.981689453125, 1.3282470703125, 1.6748046875, 2.0213623046875, 2.367919921875, 2.7144775390625, 3.06103515625, 3.4075927734375, 3.754150390625, 4.1007080078125, 4.447265625, 4.7938232421875, 5.140380859375, 5.4869384765625, 5.83349609375, 6.1800537109375, 6.526611328125, 6.8731689453125, 7.2197265625, 7.5662841796875, 7.912841796875, 8.2593994140625, 8.60595703125, 8.9525146484375, 9.299072265625, 9.6456298828125, 9.9921875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 12.0, 10.0, 9.0, 15.0, 23.0, 28.0, 41.0, 34.0, 49.0, 83.0, 110.0, 135.0, 212.0, 331.0, 700.0, 2344.0, 17082.0, 588120.0, 2498053.0, 32501.0, 3705.0, 871.0, 385.0, 234.0, 160.0, 114.0, 62.0, 63.0, 36.0, 32.0, 24.0, 27.0, 22.0, 17.0, 12.0, 6.0, 7.0, 8.0, 5.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.46142578125, -19.7822265625, -19.10302734375, -18.423828125, -17.74462890625, -17.0654296875, -16.38623046875, -15.70703125, -15.02783203125, -14.3486328125, -13.66943359375, -12.990234375, -12.31103515625, -11.6318359375, -10.95263671875, -10.2734375, -9.59423828125, -8.9150390625, -8.23583984375, -7.556640625, -6.87744140625, -6.1982421875, -5.51904296875, -4.83984375, -4.16064453125, -3.4814453125, -2.80224609375, -2.123046875, -1.44384765625, -0.7646484375, -0.08544921875, 0.59375, 1.27294921875, 1.9521484375, 2.63134765625, 3.310546875, 3.98974609375, 4.6689453125, 5.34814453125, 6.02734375, 6.70654296875, 7.3857421875, 8.06494140625, 8.744140625, 9.42333984375, 10.1025390625, 10.78173828125, 11.4609375, 12.14013671875, 12.8193359375, 13.49853515625, 14.177734375, 14.85693359375, 15.5361328125, 16.21533203125, 16.89453125, 17.57373046875, 18.2529296875, 18.93212890625, 19.611328125, 20.29052734375, 20.9697265625, 21.64892578125, 22.328125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 138.0, 584.0, 263.0, 24.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.37747192382812, -166.3881072998047, -163.39874267578125, -160.40939331054688, -157.42002868652344, -154.4306640625, -151.44129943847656, -148.45193481445312, -145.4625701904297, -142.47320556640625, -139.4838409423828, -136.49447631835938, -133.505126953125, -130.51576232910156, -127.52639770507812, -124.53703308105469, -121.54768371582031, -118.55831909179688, -115.56896209716797, -112.57959747314453, -109.5902328491211, -106.60087585449219, -103.61151123046875, -100.62214660644531, -97.63278198242188, -94.64341735839844, -91.65406036376953, -88.6646957397461, -85.67533111572266, -82.68597412109375, -79.69660949707031, -76.70724487304688, -73.71788787841797, -70.72852325439453, -67.73916625976562, -64.74980163574219, -61.760440826416016, -58.771080017089844, -55.781715393066406, -52.792354583740234, -49.80299377441406, -46.81363296508789, -43.82426834106445, -40.83490753173828, -37.84554672241211, -34.85618591308594, -31.8668212890625, -28.877460479736328, -25.88809585571289, -22.898733139038086, -19.909372329711914, -16.92000961303711, -13.930647850036621, -10.941286087036133, -7.951923370361328, -4.962562561035156, -1.9731998443603516, 1.0161621570587158, 4.005524158477783, 6.99488639831543, 9.984248161315918, 12.973609924316406, 15.962972640991211, 18.952333450317383, 21.941696166992188]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 4.0, 12.0, 10.0, 8.0, 16.0, 16.0, 19.0, 18.0, 28.0, 30.0, 39.0, 33.0, 33.0, 46.0, 61.0, 46.0, 41.0, 59.0, 54.0, 35.0, 46.0, 48.0, 39.0, 35.0, 38.0, 26.0, 28.0, 19.0, 23.0, 15.0, 18.0, 12.0, 7.0, 7.0, 8.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.750354766845703, -27.65522003173828, -26.56008529663086, -25.464950561523438, -24.369815826416016, -23.274681091308594, -22.179548263549805, -21.084413528442383, -19.98927879333496, -18.89414405822754, -17.799009323120117, -16.703874588012695, -15.60874080657959, -14.513606071472168, -13.418472290039062, -12.32333755493164, -11.228202819824219, -10.133068084716797, -9.037933349609375, -7.9427995681762695, -6.847664833068848, -5.752530097961426, -4.657395839691162, -3.5622615814208984, -2.4671268463134766, -1.3719923496246338, -0.276857852935791, 0.8182766437530518, 1.9134111404418945, 3.0085458755493164, 4.10368013381958, 5.198814392089844, 6.293952941894531, 7.389087677001953, 8.484222412109375, 9.57935619354248, 10.674490928649902, 11.769625663757324, 12.86475944519043, 13.959894180297852, 15.055028915405273, 16.150163650512695, 17.245298385620117, 18.34043312072754, 19.435565948486328, 20.53070068359375, 21.625835418701172, 22.720970153808594, 23.816104888916016, 24.911239624023438, 26.00637435913086, 27.10150909423828, 28.196643829345703, 29.291778564453125, 30.386911392211914, 31.482046127319336, 32.577178955078125, 33.67231369018555, 34.76744842529297, 35.86258316040039, 36.95771789550781, 38.052852630615234, 39.147987365722656, 40.24311828613281, 41.3382568359375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 6.0, 9.0, 13.0, 15.0, 9.0, 16.0, 21.0, 17.0, 20.0, 32.0, 25.0, 20.0, 30.0, 37.0, 33.0, 37.0, 40.0, 41.0, 49.0, 52.0, 41.0, 37.0, 40.0, 35.0, 45.0, 32.0, 40.0, 28.0, 21.0, 26.0, 25.0, 19.0, 21.0, 21.0, 9.0, 8.0, 11.0, 4.0, 11.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.796875, -4.661773681640625, -4.52667236328125, -4.391571044921875, -4.2564697265625, -4.121368408203125, -3.98626708984375, -3.851165771484375, -3.716064453125, -3.580963134765625, -3.44586181640625, -3.310760498046875, -3.1756591796875, -3.040557861328125, -2.90545654296875, -2.770355224609375, -2.63525390625, -2.500152587890625, -2.36505126953125, -2.229949951171875, -2.0948486328125, -1.959747314453125, -1.82464599609375, -1.689544677734375, -1.554443359375, -1.419342041015625, -1.28424072265625, -1.149139404296875, -1.0140380859375, -0.878936767578125, -0.74383544921875, -0.608734130859375, -0.4736328125, -0.338531494140625, -0.20343017578125, -0.068328857421875, 0.0667724609375, 0.201873779296875, 0.33697509765625, 0.472076416015625, 0.607177734375, 0.742279052734375, 0.87738037109375, 1.012481689453125, 1.1475830078125, 1.282684326171875, 1.41778564453125, 1.552886962890625, 1.68798828125, 1.823089599609375, 1.95819091796875, 2.093292236328125, 2.2283935546875, 2.363494873046875, 2.49859619140625, 2.633697509765625, 2.768798828125, 2.903900146484375, 3.03900146484375, 3.174102783203125, 3.3092041015625, 3.444305419921875, 3.57940673828125, 3.714508056640625, 3.849609375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 9.0, 9.0, 8.0, 16.0, 14.0, 29.0, 47.0, 56.0, 91.0, 117.0, 190.0, 279.0, 477.0, 848.0, 1762.0, 4151.0, 11198.0, 38110.0, 152053.0, 620257.0, 1659175.0, 1231276.0, 354028.0, 84573.0, 22279.0, 7217.0, 2785.0, 1346.0, 731.0, 404.0, 245.0, 154.0, 111.0, 55.0, 41.0, 33.0, 23.0, 17.0, 14.0, 10.0, 10.0, 7.0, 5.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0], "bins": [-6.390625, -6.21209716796875, -6.0335693359375, -5.85504150390625, -5.676513671875, -5.49798583984375, -5.3194580078125, -5.14093017578125, -4.96240234375, -4.78387451171875, -4.6053466796875, -4.42681884765625, -4.248291015625, -4.06976318359375, -3.8912353515625, -3.71270751953125, -3.5341796875, -3.35565185546875, -3.1771240234375, -2.99859619140625, -2.820068359375, -2.64154052734375, -2.4630126953125, -2.28448486328125, -2.10595703125, -1.92742919921875, -1.7489013671875, -1.57037353515625, -1.391845703125, -1.21331787109375, -1.0347900390625, -0.85626220703125, -0.677734375, -0.49920654296875, -0.3206787109375, -0.14215087890625, 0.036376953125, 0.21490478515625, 0.3934326171875, 0.57196044921875, 0.75048828125, 0.92901611328125, 1.1075439453125, 1.28607177734375, 1.464599609375, 1.64312744140625, 1.8216552734375, 2.00018310546875, 2.1787109375, 2.35723876953125, 2.5357666015625, 2.71429443359375, 2.892822265625, 3.07135009765625, 3.2498779296875, 3.42840576171875, 3.60693359375, 3.78546142578125, 3.9639892578125, 4.14251708984375, 4.321044921875, 4.49957275390625, 4.6781005859375, 4.85662841796875, 5.03515625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 9.0, 12.0, 19.0, 21.0, 32.0, 44.0, 78.0, 103.0, 154.0, 233.0, 348.0, 478.0, 550.0, 544.0, 404.0, 327.0, 221.0, 171.0, 105.0, 68.0, 44.0, 30.0, 20.0, 16.0, 14.0, 8.0, 7.0, 8.0, 0.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-10.6328125, -10.37921142578125, -10.1256103515625, -9.87200927734375, -9.618408203125, -9.36480712890625, -9.1112060546875, -8.85760498046875, -8.60400390625, -8.35040283203125, -8.0968017578125, -7.84320068359375, -7.589599609375, -7.33599853515625, -7.0823974609375, -6.82879638671875, -6.5751953125, -6.32159423828125, -6.0679931640625, -5.81439208984375, -5.560791015625, -5.30718994140625, -5.0535888671875, -4.79998779296875, -4.54638671875, -4.29278564453125, -4.0391845703125, -3.78558349609375, -3.531982421875, -3.27838134765625, -3.0247802734375, -2.77117919921875, -2.517578125, -2.26397705078125, -2.0103759765625, -1.75677490234375, -1.503173828125, -1.24957275390625, -0.9959716796875, -0.74237060546875, -0.48876953125, -0.23516845703125, 0.0184326171875, 0.27203369140625, 0.525634765625, 0.77923583984375, 1.0328369140625, 1.28643798828125, 1.5400390625, 1.79364013671875, 2.0472412109375, 2.30084228515625, 2.554443359375, 2.80804443359375, 3.0616455078125, 3.31524658203125, 3.56884765625, 3.82244873046875, 4.0760498046875, 4.32965087890625, 4.583251953125, 4.83685302734375, 5.0904541015625, 5.34405517578125, 5.59765625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 10.0, 8.0, 24.0, 35.0, 39.0, 65.0, 100.0, 195.0, 353.0, 750.0, 2142.0, 20121.0, 1578051.0, 2557598.0, 30500.0, 2654.0, 755.0, 359.0, 205.0, 139.0, 55.0, 46.0, 34.0, 18.0, 15.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.859375, -26.07080078125, -25.2822265625, -24.49365234375, -23.705078125, -22.91650390625, -22.1279296875, -21.33935546875, -20.55078125, -19.76220703125, -18.9736328125, -18.18505859375, -17.396484375, -16.60791015625, -15.8193359375, -15.03076171875, -14.2421875, -13.45361328125, -12.6650390625, -11.87646484375, -11.087890625, -10.29931640625, -9.5107421875, -8.72216796875, -7.93359375, -7.14501953125, -6.3564453125, -5.56787109375, -4.779296875, -3.99072265625, -3.2021484375, -2.41357421875, -1.625, -0.83642578125, -0.0478515625, 0.74072265625, 1.529296875, 2.31787109375, 3.1064453125, 3.89501953125, 4.68359375, 5.47216796875, 6.2607421875, 7.04931640625, 7.837890625, 8.62646484375, 9.4150390625, 10.20361328125, 10.9921875, 11.78076171875, 12.5693359375, 13.35791015625, 14.146484375, 14.93505859375, 15.7236328125, 16.51220703125, 17.30078125, 18.08935546875, 18.8779296875, 19.66650390625, 20.455078125, 21.24365234375, 22.0322265625, 22.82080078125, 23.609375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 62.0, 216.0, 322.0, 292.0, 95.0, 21.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.23301696777344, -113.22795867919922, -110.222900390625, -107.21783447265625, -104.21277618408203, -101.20771789550781, -98.2026596069336, -95.19760131835938, -92.19253540039062, -89.1874771118164, -86.18241882324219, -83.17735290527344, -80.17229461669922, -77.167236328125, -74.16217803955078, -71.15711975097656, -68.15206146240234, -65.14700317382812, -62.14194107055664, -59.13688278198242, -56.13182067871094, -53.12676239013672, -50.1217041015625, -47.11664581298828, -44.1115837097168, -41.10652542114258, -38.101463317871094, -35.096405029296875, -32.091346740722656, -29.086284637451172, -26.081226348876953, -23.0761661529541, -20.07109832763672, -17.066038131713867, -14.060978889465332, -11.055919647216797, -8.050859451293945, -5.045799255371094, -2.040740966796875, 0.9643192291259766, 3.969379425048828, 6.9744391441345215, 9.979498863220215, 12.98455810546875, 15.989618301391602, 18.994678497314453, 21.999736785888672, 25.004796981811523, 28.009857177734375, 31.014917373657227, 34.01997756958008, 37.0250358581543, 40.03009796142578, 43.03515625, 46.04021453857422, 49.04527282714844, 52.05033493041992, 55.05539321899414, 58.060455322265625, 61.065513610839844, 64.07057189941406, 67.07563781738281, 70.0806884765625, 73.08575439453125, 76.09081268310547]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 6.0, 9.0, 13.0, 18.0, 13.0, 24.0, 23.0, 24.0, 18.0, 36.0, 33.0, 38.0, 34.0, 40.0, 35.0, 41.0, 37.0, 41.0, 51.0, 43.0, 49.0, 26.0, 34.0, 31.0, 36.0, 26.0, 34.0, 29.0, 22.0, 16.0, 13.0, 13.0, 10.0, 17.0, 17.0, 16.0, 5.0, 2.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-23.045528411865234, -22.340007781982422, -21.634489059448242, -20.92896842956543, -20.223447799682617, -19.517929077148438, -18.812408447265625, -18.106887817382812, -17.401369094848633, -16.69584846496582, -15.990328788757324, -15.284809112548828, -14.579289436340332, -13.873769760131836, -13.168249130249023, -12.462729454040527, -11.757208824157715, -11.051689147949219, -10.346168518066406, -9.64064884185791, -8.935129165649414, -8.229608535766602, -7.5240888595581055, -6.818569183349609, -6.113049030303955, -5.407528877258301, -4.702009201049805, -3.9964890480041504, -3.290969133377075, -2.58544921875, -1.8799290657043457, -1.1744093894958496, -0.4688892364501953, 0.23663073778152466, 0.9421507120132446, 1.6476707458496094, 2.3531906604766846, 3.0587105751037598, 3.764230728149414, 4.46975040435791, 5.1752705574035645, 5.880790710449219, 6.586310386657715, 7.291830539703369, 7.997350692749023, 8.70287036895752, 9.408390045166016, 10.113910675048828, 10.819430351257324, 11.52495002746582, 12.230470657348633, 12.935990333557129, 13.641510009765625, 14.347030639648438, 15.052550315856934, 15.75806999206543, 16.463590621948242, 17.169111251831055, 17.874629974365234, 18.580150604248047, 19.28567123413086, 19.99118995666504, 20.69671058654785, 21.40222930908203, 22.107749938964844]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 8.0, 7.0, 12.0, 17.0, 14.0, 11.0, 24.0, 20.0, 36.0, 32.0, 28.0, 29.0, 35.0, 43.0, 45.0, 42.0, 40.0, 41.0, 56.0, 48.0, 48.0, 40.0, 39.0, 41.0, 37.0, 21.0, 29.0, 21.0, 28.0, 17.0, 18.0, 8.0, 15.0, 9.0, 10.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.54296875, -4.40203857421875, -4.2611083984375, -4.12017822265625, -3.979248046875, -3.83831787109375, -3.6973876953125, -3.55645751953125, -3.41552734375, -3.27459716796875, -3.1336669921875, -2.99273681640625, -2.851806640625, -2.71087646484375, -2.5699462890625, -2.42901611328125, -2.2880859375, -2.14715576171875, -2.0062255859375, -1.86529541015625, -1.724365234375, -1.58343505859375, -1.4425048828125, -1.30157470703125, -1.16064453125, -1.01971435546875, -0.8787841796875, -0.73785400390625, -0.596923828125, -0.45599365234375, -0.3150634765625, -0.17413330078125, -0.033203125, 0.10772705078125, 0.2486572265625, 0.38958740234375, 0.530517578125, 0.67144775390625, 0.8123779296875, 0.95330810546875, 1.09423828125, 1.23516845703125, 1.3760986328125, 1.51702880859375, 1.657958984375, 1.79888916015625, 1.9398193359375, 2.08074951171875, 2.2216796875, 2.36260986328125, 2.5035400390625, 2.64447021484375, 2.785400390625, 2.92633056640625, 3.0672607421875, 3.20819091796875, 3.34912109375, 3.49005126953125, 3.6309814453125, 3.77191162109375, 3.912841796875, 4.05377197265625, 4.1947021484375, 4.33563232421875, 4.4765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 6.0, 5.0, 6.0, 5.0, 17.0, 28.0, 50.0, 61.0, 114.0, 190.0, 286.0, 468.0, 647.0, 1044.0, 1571.0, 2462.0, 3791.0, 5580.0, 8599.0, 12609.0, 18508.0, 27761.0, 39273.0, 55150.0, 73987.0, 95019.0, 113194.0, 120089.0, 112960.0, 95958.0, 75868.0, 56791.0, 40421.0, 28146.0, 19407.0, 13131.0, 8770.0, 5669.0, 3682.0, 2534.0, 1616.0, 1075.0, 672.0, 495.0, 302.0, 197.0, 121.0, 89.0, 53.0, 41.0, 23.0, 11.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5124359130859375, -0.495086669921875, -0.4777374267578125, -0.46038818359375, -0.4430389404296875, -0.425689697265625, -0.4083404541015625, -0.3909912109375, -0.3736419677734375, -0.356292724609375, -0.3389434814453125, -0.32159423828125, -0.3042449951171875, -0.286895751953125, -0.2695465087890625, -0.252197265625, -0.2348480224609375, -0.217498779296875, -0.2001495361328125, -0.18280029296875, -0.1654510498046875, -0.148101806640625, -0.1307525634765625, -0.1134033203125, -0.0960540771484375, -0.078704833984375, -0.0613555908203125, -0.04400634765625, -0.0266571044921875, -0.009307861328125, 0.0080413818359375, 0.025390625, 0.0427398681640625, 0.060089111328125, 0.0774383544921875, 0.09478759765625, 0.1121368408203125, 0.129486083984375, 0.1468353271484375, 0.1641845703125, 0.1815338134765625, 0.198883056640625, 0.2162322998046875, 0.23358154296875, 0.2509307861328125, 0.268280029296875, 0.2856292724609375, 0.302978515625, 0.3203277587890625, 0.337677001953125, 0.3550262451171875, 0.37237548828125, 0.3897247314453125, 0.407073974609375, 0.4244232177734375, 0.4417724609375, 0.4591217041015625, 0.476470947265625, 0.4938201904296875, 0.51116943359375, 0.5285186767578125, 0.545867919921875, 0.5632171630859375, 0.58056640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 6.0, 8.0, 6.0, 9.0, 16.0, 21.0, 19.0, 7.0, 15.0, 27.0, 30.0, 32.0, 37.0, 34.0, 28.0, 36.0, 36.0, 33.0, 33.0, 46.0, 1055.0, 42.0, 40.0, 39.0, 34.0, 37.0, 40.0, 37.0, 31.0, 16.0, 17.0, 37.0, 16.0, 23.0, 8.0, 5.0, 10.0, 8.0, 7.0, 10.0, 5.0, 5.0, 4.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.767578125, -2.67645263671875, -2.5853271484375, -2.49420166015625, -2.403076171875, -2.31195068359375, -2.2208251953125, -2.12969970703125, -2.03857421875, -1.94744873046875, -1.8563232421875, -1.76519775390625, -1.674072265625, -1.58294677734375, -1.4918212890625, -1.40069580078125, -1.3095703125, -1.21844482421875, -1.1273193359375, -1.03619384765625, -0.945068359375, -0.85394287109375, -0.7628173828125, -0.67169189453125, -0.58056640625, -0.48944091796875, -0.3983154296875, -0.30718994140625, -0.216064453125, -0.12493896484375, -0.0338134765625, 0.05731201171875, 0.1484375, 0.23956298828125, 0.3306884765625, 0.42181396484375, 0.512939453125, 0.60406494140625, 0.6951904296875, 0.78631591796875, 0.87744140625, 0.96856689453125, 1.0596923828125, 1.15081787109375, 1.241943359375, 1.33306884765625, 1.4241943359375, 1.51531982421875, 1.6064453125, 1.69757080078125, 1.7886962890625, 1.87982177734375, 1.970947265625, 2.06207275390625, 2.1531982421875, 2.24432373046875, 2.33544921875, 2.42657470703125, 2.5177001953125, 2.60882568359375, 2.699951171875, 2.79107666015625, 2.8822021484375, 2.97332763671875, 3.064453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 2.0, 9.0, 11.0, 16.0, 30.0, 38.0, 64.0, 88.0, 111.0, 172.0, 244.0, 358.0, 474.0, 702.0, 1049.0, 1556.0, 2214.0, 3228.0, 4599.0, 6836.0, 10048.0, 15393.0, 24561.0, 43254.0, 1875776.0, 39101.0, 22767.0, 14472.0, 9480.0, 6351.0, 4396.0, 3071.0, 2073.0, 1380.0, 1035.0, 701.0, 437.0, 293.0, 227.0, 169.0, 104.0, 75.0, 53.0, 32.0, 26.0, 25.0, 15.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0], "bins": [-1.400390625, -1.3608551025390625, -1.321319580078125, -1.2817840576171875, -1.24224853515625, -1.2027130126953125, -1.163177490234375, -1.1236419677734375, -1.0841064453125, -1.0445709228515625, -1.005035400390625, -0.9654998779296875, -0.92596435546875, -0.8864288330078125, -0.846893310546875, -0.8073577880859375, -0.767822265625, -0.7282867431640625, -0.688751220703125, -0.6492156982421875, -0.60968017578125, -0.5701446533203125, -0.530609130859375, -0.4910736083984375, -0.4515380859375, -0.4120025634765625, -0.372467041015625, -0.3329315185546875, -0.29339599609375, -0.2538604736328125, -0.214324951171875, -0.1747894287109375, -0.13525390625, -0.0957183837890625, -0.056182861328125, -0.0166473388671875, 0.02288818359375, 0.0624237060546875, 0.101959228515625, 0.1414947509765625, 0.1810302734375, 0.2205657958984375, 0.260101318359375, 0.2996368408203125, 0.33917236328125, 0.3787078857421875, 0.418243408203125, 0.4577789306640625, 0.497314453125, 0.5368499755859375, 0.576385498046875, 0.6159210205078125, 0.65545654296875, 0.6949920654296875, 0.734527587890625, 0.7740631103515625, 0.8135986328125, 0.8531341552734375, 0.892669677734375, 0.9322052001953125, 0.97174072265625, 1.0112762451171875, 1.050811767578125, 1.0903472900390625, 1.1298828125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 8.0, 8.0, 12.0, 10.0, 13.0, 13.0, 19.0, 16.0, 31.0, 29.0, 29.0, 44.0, 45.0, 32.0, 42.0, 49.0, 49.0, 47.0, 46.0, 66.0, 36.0, 43.0, 33.0, 30.0, 34.0, 33.0, 18.0, 26.0, 32.0, 19.0, 9.0, 12.0, 12.0, 5.0, 3.0, 3.0, 7.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01306915283203125, -0.012616991996765137, -0.012164831161499023, -0.01171267032623291, -0.011260509490966797, -0.010808348655700684, -0.01035618782043457, -0.009904026985168457, -0.009451866149902344, -0.00899970531463623, -0.008547544479370117, -0.008095383644104004, -0.007643222808837891, -0.007191061973571777, -0.006738901138305664, -0.006286740303039551, -0.0058345794677734375, -0.005382418632507324, -0.004930257797241211, -0.004478096961975098, -0.004025936126708984, -0.003573775291442871, -0.003121614456176758, -0.0026694536209106445, -0.0022172927856445312, -0.001765131950378418, -0.0013129711151123047, -0.0008608102798461914, -0.0004086494445800781, 4.3511390686035156e-05, 0.0004956722259521484, 0.0009478330612182617, 0.001399993896484375, 0.0018521547317504883, 0.0023043155670166016, 0.002756476402282715, 0.003208637237548828, 0.0036607980728149414, 0.004112958908081055, 0.004565119743347168, 0.005017280578613281, 0.0054694414138793945, 0.005921602249145508, 0.006373763084411621, 0.006825923919677734, 0.007278084754943848, 0.007730245590209961, 0.008182406425476074, 0.008634567260742188, 0.0090867280960083, 0.009538888931274414, 0.009991049766540527, 0.01044321060180664, 0.010895371437072754, 0.011347532272338867, 0.01179969310760498, 0.012251853942871094, 0.012704014778137207, 0.01315617561340332, 0.013608336448669434, 0.014060497283935547, 0.01451265811920166, 0.014964818954467773, 0.015416979789733887, 0.015869140625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 5.0, 9.0, 2.0, 10.0, 5.0, 10.0, 18.0, 26.0, 26.0, 41.0, 39.0, 52.0, 70.0, 76.0, 104.0, 166.0, 245.0, 384.0, 865.0, 11956.0, 983432.0, 48467.0, 1170.0, 436.0, 267.0, 173.0, 124.0, 79.0, 55.0, 43.0, 31.0, 34.0, 30.0, 22.0, 12.0, 12.0, 8.0, 10.0, 9.0, 6.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.326171875, -0.3167533874511719, -0.30733489990234375, -0.2979164123535156, -0.2884979248046875, -0.2790794372558594, -0.26966094970703125, -0.2602424621582031, -0.250823974609375, -0.24140548706054688, -0.23198699951171875, -0.22256851196289062, -0.2131500244140625, -0.20373153686523438, -0.19431304931640625, -0.18489456176757812, -0.17547607421875, -0.16605758666992188, -0.15663909912109375, -0.14722061157226562, -0.1378021240234375, -0.12838363647460938, -0.11896514892578125, -0.10954666137695312, -0.100128173828125, -0.09070968627929688, -0.08129119873046875, -0.07187271118164062, -0.0624542236328125, -0.053035736083984375, -0.04361724853515625, -0.034198760986328125, -0.0247802734375, -0.015361785888671875, -0.00594329833984375, 0.003475189208984375, 0.0128936767578125, 0.022312164306640625, 0.03173065185546875, 0.041149139404296875, 0.050567626953125, 0.059986114501953125, 0.06940460205078125, 0.07882308959960938, 0.0882415771484375, 0.09766006469726562, 0.10707855224609375, 0.11649703979492188, 0.12591552734375, 0.13533401489257812, 0.14475250244140625, 0.15417098999023438, 0.1635894775390625, 0.17300796508789062, 0.18242645263671875, 0.19184494018554688, 0.201263427734375, 0.21068191528320312, 0.22010040283203125, 0.22951889038085938, 0.2389373779296875, 0.24835586547851562, 0.25777435302734375, 0.2671928405761719, 0.276611328125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 65.0, 425.0, 439.0, 65.0, 8.0, 2.0], "bins": [-0.21408145129680634, -0.2105138897895813, -0.20694634318351746, -0.20337878167629242, -0.19981123507022858, -0.19624367356300354, -0.1926761269569397, -0.18910856544971466, -0.18554101884365082, -0.18197345733642578, -0.17840591073036194, -0.1748383492231369, -0.17127080261707306, -0.16770324110984802, -0.16413569450378418, -0.16056813299655914, -0.1570005863904953, -0.15343302488327026, -0.14986547827720642, -0.14629791676998138, -0.14273037016391754, -0.1391628086566925, -0.13559526205062866, -0.13202770054340363, -0.12846015393733978, -0.12489259988069534, -0.1213250458240509, -0.11775749176740646, -0.11418993771076202, -0.11062238365411758, -0.10705482959747314, -0.1034872755408287, -0.09991972148418427, -0.09635216742753983, -0.09278461337089539, -0.08921705931425095, -0.0856495052576065, -0.08208195120096207, -0.07851439714431763, -0.07494684308767319, -0.07137928158044815, -0.06781172752380371, -0.06424417346715927, -0.06067661941051483, -0.05710906535387039, -0.05354151129722595, -0.04997395724058151, -0.04640640318393707, -0.04283884912729263, -0.03927129507064819, -0.035703741014003754, -0.032136186957359314, -0.028568632900714874, -0.025001076981425285, -0.021433522924780846, -0.017865968868136406, -0.014298414811491966, -0.010730860754847527, -0.0071633062325417995, -0.0035957517102360725, -2.8197653591632843e-05, 0.0035393573343753815, 0.007106911391019821, 0.01067446544766426, 0.0142420195043087]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 8.0, 8.0, 14.0, 15.0, 21.0, 28.0, 12.0, 37.0, 27.0, 23.0, 29.0, 26.0, 43.0, 40.0, 43.0, 52.0, 46.0, 48.0, 43.0, 44.0, 46.0, 37.0, 48.0, 28.0, 28.0, 26.0, 20.0, 23.0, 24.0, 21.0, 18.0, 14.0, 18.0, 8.0, 9.0, 8.0, 7.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01807636022567749, -0.017522327601909637, -0.016968296840786934, -0.01641426607966423, -0.015860233455896378, -0.0153062017634511, -0.014752170071005821, -0.014198138378560543, -0.013644106686115265, -0.013090074993669987, -0.012536043301224709, -0.01198201160877943, -0.011427979916334152, -0.010873948223888874, -0.010319916531443596, -0.009765884838998318, -0.00921185314655304, -0.008657821454107761, -0.008103789761662483, -0.007549758069217205, -0.006995726376771927, -0.006441694684326649, -0.0058876629918813705, -0.005333631299436092, -0.004779599606990814, -0.004225567914545536, -0.003671536222100258, -0.0031175045296549797, -0.0025634728372097015, -0.0020094411447644234, -0.0014554094523191452, -0.000901377759873867, -0.00034734606742858887, 0.0002066856250166893, 0.0007607173174619675, 0.0013147490099072456, 0.0018687807023525238, 0.002422812394797802, 0.00297684408724308, 0.0035308757796883583, 0.0040849074721336365, 0.004638939164578915, 0.005192970857024193, 0.005747002549469471, 0.006301034241914749, 0.006855065934360027, 0.0074090976268053055, 0.007963129319250584, 0.008517161011695862, 0.00907119270414114, 0.009625224396586418, 0.010179256089031696, 0.010733287781476974, 0.011287319473922253, 0.01184135116636753, 0.012395382858812809, 0.012949414551258087, 0.013503446243703365, 0.014057477936148643, 0.014611509628593922, 0.0151655413210392, 0.015719573944807053, 0.016273604705929756, 0.01682763546705246, 0.017381668090820312]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 8.0, 12.0, 6.0, 12.0, 13.0, 16.0, 23.0, 20.0, 26.0, 27.0, 35.0, 28.0, 27.0, 31.0, 31.0, 40.0, 40.0, 43.0, 55.0, 44.0, 51.0, 32.0, 39.0, 39.0, 42.0, 29.0, 30.0, 28.0, 19.0, 25.0, 22.0, 23.0, 18.0, 5.0, 11.0, 8.0, 7.0, 12.0, 8.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3203125, -4.186279296875, -4.05224609375, -3.918212890625, -3.7841796875, -3.650146484375, -3.51611328125, -3.382080078125, -3.248046875, -3.114013671875, -2.97998046875, -2.845947265625, -2.7119140625, -2.577880859375, -2.44384765625, -2.309814453125, -2.17578125, -2.041748046875, -1.90771484375, -1.773681640625, -1.6396484375, -1.505615234375, -1.37158203125, -1.237548828125, -1.103515625, -0.969482421875, -0.83544921875, -0.701416015625, -0.5673828125, -0.433349609375, -0.29931640625, -0.165283203125, -0.03125, 0.102783203125, 0.23681640625, 0.370849609375, 0.5048828125, 0.638916015625, 0.77294921875, 0.906982421875, 1.041015625, 1.175048828125, 1.30908203125, 1.443115234375, 1.5771484375, 1.711181640625, 1.84521484375, 1.979248046875, 2.11328125, 2.247314453125, 2.38134765625, 2.515380859375, 2.6494140625, 2.783447265625, 2.91748046875, 3.051513671875, 3.185546875, 3.319580078125, 3.45361328125, 3.587646484375, 3.7216796875, 3.855712890625, 3.98974609375, 4.123779296875, 4.2578125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 8.0, 11.0, 12.0, 18.0, 27.0, 35.0, 55.0, 74.0, 102.0, 132.0, 191.0, 285.0, 396.0, 633.0, 802.0, 1279.0, 1919.0, 2995.0, 4591.0, 7153.0, 11316.0, 17815.0, 28643.0, 47070.0, 81529.0, 153821.0, 245113.0, 191709.0, 101325.0, 56464.0, 34030.0, 21397.0, 13352.0, 8484.0, 5341.0, 3498.0, 2267.0, 1469.0, 970.0, 680.0, 460.0, 328.0, 216.0, 166.0, 104.0, 96.0, 53.0, 33.0, 32.0, 16.0, 16.0, 11.0, 10.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.859375, -3.73358154296875, -3.6077880859375, -3.48199462890625, -3.356201171875, -3.23040771484375, -3.1046142578125, -2.97882080078125, -2.85302734375, -2.72723388671875, -2.6014404296875, -2.47564697265625, -2.349853515625, -2.22406005859375, -2.0982666015625, -1.97247314453125, -1.8466796875, -1.72088623046875, -1.5950927734375, -1.46929931640625, -1.343505859375, -1.21771240234375, -1.0919189453125, -0.96612548828125, -0.84033203125, -0.71453857421875, -0.5887451171875, -0.46295166015625, -0.337158203125, -0.21136474609375, -0.0855712890625, 0.04022216796875, 0.166015625, 0.29180908203125, 0.4176025390625, 0.54339599609375, 0.669189453125, 0.79498291015625, 0.9207763671875, 1.04656982421875, 1.17236328125, 1.29815673828125, 1.4239501953125, 1.54974365234375, 1.675537109375, 1.80133056640625, 1.9271240234375, 2.05291748046875, 2.1787109375, 2.30450439453125, 2.4302978515625, 2.55609130859375, 2.681884765625, 2.80767822265625, 2.9334716796875, 3.05926513671875, 3.18505859375, 3.31085205078125, 3.4366455078125, 3.56243896484375, 3.688232421875, 3.81402587890625, 3.9398193359375, 4.06561279296875, 4.19140625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 11.0, 8.0, 7.0, 11.0, 18.0, 12.0, 19.0, 19.0, 30.0, 24.0, 31.0, 31.0, 38.0, 55.0, 64.0, 55.0, 94.0, 147.0, 212.0, 1280.0, 221.0, 115.0, 91.0, 68.0, 49.0, 43.0, 40.0, 28.0, 33.0, 33.0, 22.0, 24.0, 15.0, 15.0, 14.0, 15.0, 10.0, 8.0, 11.0, 6.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.421875, -11.06005859375, -10.6982421875, -10.33642578125, -9.974609375, -9.61279296875, -9.2509765625, -8.88916015625, -8.52734375, -8.16552734375, -7.8037109375, -7.44189453125, -7.080078125, -6.71826171875, -6.3564453125, -5.99462890625, -5.6328125, -5.27099609375, -4.9091796875, -4.54736328125, -4.185546875, -3.82373046875, -3.4619140625, -3.10009765625, -2.73828125, -2.37646484375, -2.0146484375, -1.65283203125, -1.291015625, -0.92919921875, -0.5673828125, -0.20556640625, 0.15625, 0.51806640625, 0.8798828125, 1.24169921875, 1.603515625, 1.96533203125, 2.3271484375, 2.68896484375, 3.05078125, 3.41259765625, 3.7744140625, 4.13623046875, 4.498046875, 4.85986328125, 5.2216796875, 5.58349609375, 5.9453125, 6.30712890625, 6.6689453125, 7.03076171875, 7.392578125, 7.75439453125, 8.1162109375, 8.47802734375, 8.83984375, 9.20166015625, 9.5634765625, 9.92529296875, 10.287109375, 10.64892578125, 11.0107421875, 11.37255859375, 11.734375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 10.0, 7.0, 16.0, 15.0, 26.0, 28.0, 52.0, 69.0, 107.0, 155.0, 195.0, 346.0, 544.0, 1308.0, 6331.0, 50504.0, 882370.0, 2101215.0, 88603.0, 10133.0, 1867.0, 627.0, 371.0, 233.0, 156.0, 121.0, 81.0, 63.0, 38.0, 35.0, 14.0, 17.0, 8.0, 7.0, 4.0, 2.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-21.40625, -20.82958984375, -20.2529296875, -19.67626953125, -19.099609375, -18.52294921875, -17.9462890625, -17.36962890625, -16.79296875, -16.21630859375, -15.6396484375, -15.06298828125, -14.486328125, -13.90966796875, -13.3330078125, -12.75634765625, -12.1796875, -11.60302734375, -11.0263671875, -10.44970703125, -9.873046875, -9.29638671875, -8.7197265625, -8.14306640625, -7.56640625, -6.98974609375, -6.4130859375, -5.83642578125, -5.259765625, -4.68310546875, -4.1064453125, -3.52978515625, -2.953125, -2.37646484375, -1.7998046875, -1.22314453125, -0.646484375, -0.06982421875, 0.5068359375, 1.08349609375, 1.66015625, 2.23681640625, 2.8134765625, 3.39013671875, 3.966796875, 4.54345703125, 5.1201171875, 5.69677734375, 6.2734375, 6.85009765625, 7.4267578125, 8.00341796875, 8.580078125, 9.15673828125, 9.7333984375, 10.31005859375, 10.88671875, 11.46337890625, 12.0400390625, 12.61669921875, 13.193359375, 13.77001953125, 14.3466796875, 14.92333984375, 15.5]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 9.0, 29.0, 83.0, 140.0, 201.0, 236.0, 169.0, 92.0, 35.0, 8.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.09010696411133, -30.336448669433594, -28.58279037475586, -26.829130172729492, -25.075471878051758, -23.321813583374023, -21.568153381347656, -19.814495086669922, -18.060836791992188, -16.307178497314453, -14.553519248962402, -12.799860000610352, -11.046201705932617, -9.292543411254883, -7.538884162902832, -5.785224914550781, -4.031566619873047, -2.2779078483581543, -0.5242490768432617, 1.2294096946716309, 2.9830684661865234, 4.736726760864258, 6.490386009216309, 8.24404525756836, 9.997703552246094, 11.751361846923828, 13.505021095275879, 15.25868034362793, 17.012338638305664, 18.7659969329834, 20.519657135009766, 22.2733154296875, 24.0269775390625, 25.780635833740234, 27.53429412841797, 29.287954330444336, 31.04161262512207, 32.79527282714844, 34.54893112182617, 36.302589416503906, 38.05624771118164, 39.809906005859375, 41.56356430053711, 43.317222595214844, 45.070884704589844, 46.82453918457031, 48.57820129394531, 50.33185958862305, 52.08551788330078, 53.839176177978516, 55.59283447265625, 57.346492767333984, 59.10015106201172, 60.85381317138672, 62.60747146606445, 64.36112976074219, 66.11479187011719, 67.86845397949219, 69.62210845947266, 71.37577056884766, 73.12942504882812, 74.88308715820312, 76.6367416381836, 78.3904037475586, 80.14405822753906]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 11.0, 14.0, 18.0, 17.0, 20.0, 20.0, 23.0, 28.0, 29.0, 29.0, 43.0, 26.0, 36.0, 36.0, 43.0, 38.0, 39.0, 45.0, 43.0, 46.0, 38.0, 27.0, 37.0, 37.0, 32.0, 25.0, 31.0, 26.0, 22.0, 17.0, 13.0, 15.0, 9.0, 11.0, 11.0, 6.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.1141357421875, -29.184574127197266, -28.25501251220703, -27.325450897216797, -26.395889282226562, -25.466327667236328, -24.536766052246094, -23.60720443725586, -22.677642822265625, -21.74808120727539, -20.818519592285156, -19.888957977294922, -18.959396362304688, -18.029834747314453, -17.10027313232422, -16.170711517333984, -15.241151809692383, -14.311590194702148, -13.382028579711914, -12.45246696472168, -11.522905349731445, -10.593343734741211, -9.663783073425293, -8.734221458435059, -7.804659843444824, -6.87509822845459, -5.9455366134643555, -5.015975475311279, -4.086413860321045, -3.1568522453308105, -2.2272911071777344, -1.2977294921875, -0.3681678771972656, 0.5613936185836792, 1.490955114364624, 2.4205164909362793, 3.3500781059265137, 4.279639720916748, 5.209200859069824, 6.138762474060059, 7.068324089050293, 7.997885704040527, 8.927447319030762, 9.85700798034668, 10.786569595336914, 11.716131210327148, 12.645692825317383, 13.575254440307617, 14.504816055297852, 15.434377670288086, 16.36393928527832, 17.293500900268555, 18.22306251525879, 19.152624130249023, 20.082183837890625, 21.01174545288086, 21.941307067871094, 22.870868682861328, 23.800430297851562, 24.729991912841797, 25.65955352783203, 26.589115142822266, 27.5186767578125, 28.448238372802734, 29.37779998779297]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 13.0, 13.0, 13.0, 14.0, 18.0, 19.0, 17.0, 31.0, 27.0, 21.0, 36.0, 28.0, 42.0, 35.0, 43.0, 59.0, 49.0, 41.0, 43.0, 48.0, 39.0, 36.0, 33.0, 31.0, 34.0, 36.0, 23.0, 13.0, 22.0, 16.0, 13.0, 13.0, 18.0, 13.0, 10.0, 11.0, 5.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.05859375, -4.9163818359375, -4.774169921875, -4.6319580078125, -4.48974609375, -4.3475341796875, -4.205322265625, -4.0631103515625, -3.9208984375, -3.7786865234375, -3.636474609375, -3.4942626953125, -3.35205078125, -3.2098388671875, -3.067626953125, -2.9254150390625, -2.783203125, -2.6409912109375, -2.498779296875, -2.3565673828125, -2.21435546875, -2.0721435546875, -1.929931640625, -1.7877197265625, -1.6455078125, -1.5032958984375, -1.361083984375, -1.2188720703125, -1.07666015625, -0.9344482421875, -0.792236328125, -0.6500244140625, -0.5078125, -0.3656005859375, -0.223388671875, -0.0811767578125, 0.06103515625, 0.2032470703125, 0.345458984375, 0.4876708984375, 0.6298828125, 0.7720947265625, 0.914306640625, 1.0565185546875, 1.19873046875, 1.3409423828125, 1.483154296875, 1.6253662109375, 1.767578125, 1.9097900390625, 2.052001953125, 2.1942138671875, 2.33642578125, 2.4786376953125, 2.620849609375, 2.7630615234375, 2.9052734375, 3.0474853515625, 3.189697265625, 3.3319091796875, 3.47412109375, 3.6163330078125, 3.758544921875, 3.9007568359375, 4.04296875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 14.0, 11.0, 28.0, 46.0, 64.0, 112.0, 152.0, 237.0, 424.0, 761.0, 1338.0, 2953.0, 6410.0, 17739.0, 58429.0, 219236.0, 832630.0, 1784777.0, 926028.0, 245405.0, 64824.0, 19483.0, 6876.0, 3006.0, 1376.0, 769.0, 427.0, 257.0, 178.0, 106.0, 69.0, 35.0, 36.0, 15.0, 6.0, 9.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.3690185546875, -5.187255859375, -5.0054931640625, -4.82373046875, -4.6419677734375, -4.460205078125, -4.2784423828125, -4.0966796875, -3.9149169921875, -3.733154296875, -3.5513916015625, -3.36962890625, -3.1878662109375, -3.006103515625, -2.8243408203125, -2.642578125, -2.4608154296875, -2.279052734375, -2.0972900390625, -1.91552734375, -1.7337646484375, -1.552001953125, -1.3702392578125, -1.1884765625, -1.0067138671875, -0.824951171875, -0.6431884765625, -0.46142578125, -0.2796630859375, -0.097900390625, 0.0838623046875, 0.265625, 0.4473876953125, 0.629150390625, 0.8109130859375, 0.99267578125, 1.1744384765625, 1.356201171875, 1.5379638671875, 1.7197265625, 1.9014892578125, 2.083251953125, 2.2650146484375, 2.44677734375, 2.6285400390625, 2.810302734375, 2.9920654296875, 3.173828125, 3.3555908203125, 3.537353515625, 3.7191162109375, 3.90087890625, 4.0826416015625, 4.264404296875, 4.4461669921875, 4.6279296875, 4.8096923828125, 4.991455078125, 5.1732177734375, 5.35498046875, 5.5367431640625, 5.718505859375, 5.9002685546875, 6.08203125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 9.0, 17.0, 15.0, 16.0, 18.0, 37.0, 32.0, 55.0, 81.0, 94.0, 121.0, 159.0, 228.0, 287.0, 327.0, 394.0, 430.0, 379.0, 325.0, 249.0, 193.0, 135.0, 99.0, 92.0, 55.0, 51.0, 33.0, 25.0, 16.0, 24.0, 15.0, 8.0, 8.0, 6.0, 2.0, 11.0, 3.0, 10.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5, -5.3175048828125, -5.135009765625, -4.9525146484375, -4.77001953125, -4.5875244140625, -4.405029296875, -4.2225341796875, -4.0400390625, -3.8575439453125, -3.675048828125, -3.4925537109375, -3.31005859375, -3.1275634765625, -2.945068359375, -2.7625732421875, -2.580078125, -2.3975830078125, -2.215087890625, -2.0325927734375, -1.85009765625, -1.6676025390625, -1.485107421875, -1.3026123046875, -1.1201171875, -0.9376220703125, -0.755126953125, -0.5726318359375, -0.39013671875, -0.2076416015625, -0.025146484375, 0.1573486328125, 0.33984375, 0.5223388671875, 0.704833984375, 0.8873291015625, 1.06982421875, 1.2523193359375, 1.434814453125, 1.6173095703125, 1.7998046875, 1.9822998046875, 2.164794921875, 2.3472900390625, 2.52978515625, 2.7122802734375, 2.894775390625, 3.0772705078125, 3.259765625, 3.4422607421875, 3.624755859375, 3.8072509765625, 3.98974609375, 4.1722412109375, 4.354736328125, 4.5372314453125, 4.7197265625, 4.9022216796875, 5.084716796875, 5.2672119140625, 5.44970703125, 5.6322021484375, 5.814697265625, 5.9971923828125, 6.1796875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 1.0, 5.0, 5.0, 7.0, 10.0, 21.0, 16.0, 27.0, 29.0, 55.0, 77.0, 101.0, 139.0, 199.0, 382.0, 735.0, 1564.0, 3678.0, 10727.0, 37816.0, 171783.0, 1094943.0, 2325163.0, 434275.0, 80608.0, 20316.0, 6651.0, 2519.0, 1075.0, 562.0, 276.0, 156.0, 109.0, 61.0, 47.0, 28.0, 20.0, 23.0, 20.0, 10.0, 8.0, 5.0, 7.0, 3.0, 4.0, 10.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.25, -8.9541015625, -8.658203125, -8.3623046875, -8.06640625, -7.7705078125, -7.474609375, -7.1787109375, -6.8828125, -6.5869140625, -6.291015625, -5.9951171875, -5.69921875, -5.4033203125, -5.107421875, -4.8115234375, -4.515625, -4.2197265625, -3.923828125, -3.6279296875, -3.33203125, -3.0361328125, -2.740234375, -2.4443359375, -2.1484375, -1.8525390625, -1.556640625, -1.2607421875, -0.96484375, -0.6689453125, -0.373046875, -0.0771484375, 0.21875, 0.5146484375, 0.810546875, 1.1064453125, 1.40234375, 1.6982421875, 1.994140625, 2.2900390625, 2.5859375, 2.8818359375, 3.177734375, 3.4736328125, 3.76953125, 4.0654296875, 4.361328125, 4.6572265625, 4.953125, 5.2490234375, 5.544921875, 5.8408203125, 6.13671875, 6.4326171875, 6.728515625, 7.0244140625, 7.3203125, 7.6162109375, 7.912109375, 8.2080078125, 8.50390625, 8.7998046875, 9.095703125, 9.3916015625, 9.6875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 720.0, 286.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-539.936767578125, -530.590087890625, -521.2434692382812, -511.89678955078125, -502.5501403808594, -493.2034606933594, -483.8568115234375, -474.5101318359375, -465.1634826660156, -455.81683349609375, -446.47015380859375, -437.1235046386719, -427.77685546875, -418.43017578125, -409.0835266113281, -399.73687744140625, -390.39019775390625, -381.0435485839844, -371.6968688964844, -362.3502197265625, -353.0035705566406, -343.6568908691406, -334.31024169921875, -324.96356201171875, -315.616943359375, -306.2702941894531, -296.9236145019531, -287.57696533203125, -278.2303161621094, -268.8836364746094, -259.5369873046875, -250.19032287597656, -240.84364318847656, -231.49697875976562, -222.15032958984375, -212.8036651611328, -203.45700073242188, -194.1103515625, -184.76368713378906, -175.41702270507812, -166.07037353515625, -156.7237091064453, -147.37705993652344, -138.0303955078125, -128.68373107910156, -119.33707427978516, -109.99041748046875, -100.64375305175781, -91.29708862304688, -81.95043182373047, -72.60376739501953, -63.257110595703125, -53.91044998168945, -44.56378936767578, -35.217132568359375, -25.870468139648438, -16.52381134033203, -7.177151679992676, 2.1695079803466797, 11.516166687011719, 20.86282730102539, 30.209487915039062, 39.55614471435547, 48.902809143066406, 58.24946594238281]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 7.0, 12.0, 8.0, 17.0, 18.0, 10.0, 19.0, 16.0, 19.0, 24.0, 25.0, 30.0, 35.0, 37.0, 34.0, 34.0, 34.0, 40.0, 34.0, 41.0, 46.0, 34.0, 42.0, 42.0, 33.0, 30.0, 29.0, 33.0, 17.0, 25.0, 28.0, 28.0, 21.0, 13.0, 12.0, 13.0, 11.0, 4.0, 8.0, 3.0, 7.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.00763511657715, -18.332157135009766, -17.65667724609375, -16.981199264526367, -16.305721282958984, -15.630242347717285, -14.954763412475586, -14.279285430908203, -13.603806495666504, -12.928327560424805, -12.252849578857422, -11.577370643615723, -10.901891708374023, -10.22641372680664, -9.550934791564941, -8.875455856323242, -8.19997787475586, -7.524499416351318, -6.849020957946777, -6.173542022705078, -5.498063564300537, -4.822585105895996, -4.147106170654297, -3.471627712249756, -2.796149253845215, -2.120670795440674, -1.4451920986175537, -0.7697134017944336, -0.09423494338989258, 0.5812435150146484, 1.2567224502563477, 1.9322009086608887, 2.6076812744140625, 3.2831597328186035, 3.9586384296417236, 4.634117126464844, 5.309595584869385, 5.985074043273926, 6.660552978515625, 7.336031436920166, 8.011509895324707, 8.686988830566406, 9.362466812133789, 10.037945747375488, 10.713424682617188, 11.38890266418457, 12.06438159942627, 12.739860534667969, 13.415338516235352, 14.09081745147705, 14.766295433044434, 15.441774368286133, 16.117252349853516, 16.79273223876953, 17.468210220336914, 18.143688201904297, 18.819168090820312, 19.494646072387695, 20.17012596130371, 20.845603942871094, 21.521081924438477, 22.19655990600586, 22.872039794921875, 23.547517776489258, 24.22299575805664]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 13.0, 10.0, 11.0, 6.0, 16.0, 15.0, 15.0, 12.0, 33.0, 26.0, 42.0, 36.0, 34.0, 49.0, 29.0, 43.0, 30.0, 43.0, 50.0, 37.0, 33.0, 37.0, 48.0, 36.0, 36.0, 35.0, 31.0, 32.0, 29.0, 22.0, 20.0, 13.0, 17.0, 16.0, 10.0, 9.0, 6.0, 3.0, 8.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-5.15625, -5.00335693359375, -4.8504638671875, -4.69757080078125, -4.544677734375, -4.39178466796875, -4.2388916015625, -4.08599853515625, -3.93310546875, -3.78021240234375, -3.6273193359375, -3.47442626953125, -3.321533203125, -3.16864013671875, -3.0157470703125, -2.86285400390625, -2.7099609375, -2.55706787109375, -2.4041748046875, -2.25128173828125, -2.098388671875, -1.94549560546875, -1.7926025390625, -1.63970947265625, -1.48681640625, -1.33392333984375, -1.1810302734375, -1.02813720703125, -0.875244140625, -0.72235107421875, -0.5694580078125, -0.41656494140625, -0.263671875, -0.11077880859375, 0.0421142578125, 0.19500732421875, 0.347900390625, 0.50079345703125, 0.6536865234375, 0.80657958984375, 0.95947265625, 1.11236572265625, 1.2652587890625, 1.41815185546875, 1.571044921875, 1.72393798828125, 1.8768310546875, 2.02972412109375, 2.1826171875, 2.33551025390625, 2.4884033203125, 2.64129638671875, 2.794189453125, 2.94708251953125, 3.0999755859375, 3.25286865234375, 3.40576171875, 3.55865478515625, 3.7115478515625, 3.86444091796875, 4.017333984375, 4.17022705078125, 4.3231201171875, 4.47601318359375, 4.62890625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 7.0, 9.0, 8.0, 22.0, 25.0, 53.0, 73.0, 120.0, 162.0, 291.0, 463.0, 741.0, 1175.0, 1941.0, 3092.0, 4766.0, 7485.0, 11860.0, 18298.0, 27425.0, 40498.0, 58413.0, 80935.0, 104606.0, 123197.0, 128815.0, 116267.0, 95391.0, 71513.0, 50889.0, 34551.0, 23485.0, 15215.0, 9911.0, 6134.0, 4027.0, 2444.0, 1582.0, 1002.0, 606.0, 386.0, 233.0, 187.0, 96.0, 74.0, 30.0, 13.0, 16.0, 15.0, 6.0, 8.0, 2.0, 2.0, 3.0], "bins": [-0.69775390625, -0.6779861450195312, -0.6582183837890625, -0.6384506225585938, -0.618682861328125, -0.5989151000976562, -0.5791473388671875, -0.5593795776367188, -0.53961181640625, -0.5198440551757812, -0.5000762939453125, -0.48030853271484375, -0.460540771484375, -0.44077301025390625, -0.4210052490234375, -0.40123748779296875, -0.3814697265625, -0.36170196533203125, -0.3419342041015625, -0.32216644287109375, -0.302398681640625, -0.28263092041015625, -0.2628631591796875, -0.24309539794921875, -0.22332763671875, -0.20355987548828125, -0.1837921142578125, -0.16402435302734375, -0.144256591796875, -0.12448883056640625, -0.1047210693359375, -0.08495330810546875, -0.065185546875, -0.04541778564453125, -0.0256500244140625, -0.00588226318359375, 0.013885498046875, 0.03365325927734375, 0.0534210205078125, 0.07318878173828125, 0.09295654296875, 0.11272430419921875, 0.1324920654296875, 0.15225982666015625, 0.172027587890625, 0.19179534912109375, 0.2115631103515625, 0.23133087158203125, 0.2510986328125, 0.27086639404296875, 0.2906341552734375, 0.31040191650390625, 0.330169677734375, 0.34993743896484375, 0.3697052001953125, 0.38947296142578125, 0.40924072265625, 0.42900848388671875, 0.4487762451171875, 0.46854400634765625, 0.488311767578125, 0.5080795288085938, 0.5278472900390625, 0.5476150512695312, 0.5673828125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 6.0, 5.0, 7.0, 8.0, 11.0, 17.0, 18.0, 17.0, 22.0, 31.0, 39.0, 32.0, 26.0, 43.0, 42.0, 54.0, 34.0, 44.0, 34.0, 1067.0, 43.0, 48.0, 57.0, 40.0, 38.0, 25.0, 25.0, 26.0, 23.0, 17.0, 19.0, 27.0, 17.0, 12.0, 12.0, 9.0, 5.0, 7.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.66015625, -3.543670654296875, -3.42718505859375, -3.310699462890625, -3.1942138671875, -3.077728271484375, -2.96124267578125, -2.844757080078125, -2.728271484375, -2.611785888671875, -2.49530029296875, -2.378814697265625, -2.2623291015625, -2.145843505859375, -2.02935791015625, -1.912872314453125, -1.79638671875, -1.679901123046875, -1.56341552734375, -1.446929931640625, -1.3304443359375, -1.213958740234375, -1.09747314453125, -0.980987548828125, -0.864501953125, -0.748016357421875, -0.63153076171875, -0.515045166015625, -0.3985595703125, -0.282073974609375, -0.16558837890625, -0.049102783203125, 0.0673828125, 0.183868408203125, 0.30035400390625, 0.416839599609375, 0.5333251953125, 0.649810791015625, 0.76629638671875, 0.882781982421875, 0.999267578125, 1.115753173828125, 1.23223876953125, 1.348724365234375, 1.4652099609375, 1.581695556640625, 1.69818115234375, 1.814666748046875, 1.93115234375, 2.047637939453125, 2.16412353515625, 2.280609130859375, 2.3970947265625, 2.513580322265625, 2.63006591796875, 2.746551513671875, 2.863037109375, 2.979522705078125, 3.09600830078125, 3.212493896484375, 3.3289794921875, 3.445465087890625, 3.56195068359375, 3.678436279296875, 3.794921875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 12.0, 10.0, 12.0, 19.0, 20.0, 30.0, 56.0, 51.0, 104.0, 98.0, 137.0, 241.0, 351.0, 482.0, 719.0, 1014.0, 1491.0, 2210.0, 3362.0, 4929.0, 6997.0, 10764.0, 16046.0, 25669.0, 48125.0, 1872180.0, 37309.0, 21837.0, 14035.0, 9245.0, 6182.0, 4266.0, 2845.0, 1985.0, 1381.0, 921.0, 592.0, 413.0, 289.0, 196.0, 158.0, 101.0, 68.0, 59.0, 40.0, 23.0, 22.0, 16.0, 8.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2138671875, -1.1710357666015625, -1.128204345703125, -1.0853729248046875, -1.04254150390625, -0.9997100830078125, -0.956878662109375, -0.9140472412109375, -0.8712158203125, -0.8283843994140625, -0.785552978515625, -0.7427215576171875, -0.69989013671875, -0.6570587158203125, -0.614227294921875, -0.5713958740234375, -0.528564453125, -0.4857330322265625, -0.442901611328125, -0.4000701904296875, -0.35723876953125, -0.3144073486328125, -0.271575927734375, -0.2287445068359375, -0.1859130859375, -0.1430816650390625, -0.100250244140625, -0.0574188232421875, -0.01458740234375, 0.0282440185546875, 0.071075439453125, 0.1139068603515625, 0.15673828125, 0.1995697021484375, 0.242401123046875, 0.2852325439453125, 0.32806396484375, 0.3708953857421875, 0.413726806640625, 0.4565582275390625, 0.4993896484375, 0.5422210693359375, 0.585052490234375, 0.6278839111328125, 0.67071533203125, 0.7135467529296875, 0.756378173828125, 0.7992095947265625, 0.842041015625, 0.8848724365234375, 0.927703857421875, 0.9705352783203125, 1.01336669921875, 1.0561981201171875, 1.099029541015625, 1.1418609619140625, 1.1846923828125, 1.2275238037109375, 1.270355224609375, 1.3131866455078125, 1.35601806640625, 1.3988494873046875, 1.441680908203125, 1.4845123291015625, 1.52734375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 7.0, 10.0, 9.0, 11.0, 10.0, 12.0, 13.0, 21.0, 23.0, 25.0, 26.0, 41.0, 46.0, 33.0, 73.0, 58.0, 55.0, 84.0, 53.0, 52.0, 46.0, 44.0, 42.0, 31.0, 28.0, 26.0, 26.0, 17.0, 10.0, 15.0, 10.0, 13.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.022857666015625, -0.022185325622558594, -0.021512985229492188, -0.02084064483642578, -0.020168304443359375, -0.01949596405029297, -0.018823623657226562, -0.018151283264160156, -0.01747894287109375, -0.016806602478027344, -0.016134262084960938, -0.015461921691894531, -0.014789581298828125, -0.014117240905761719, -0.013444900512695312, -0.012772560119628906, -0.0121002197265625, -0.011427879333496094, -0.010755538940429688, -0.010083198547363281, -0.009410858154296875, -0.008738517761230469, -0.008066177368164062, -0.007393836975097656, -0.00672149658203125, -0.006049156188964844, -0.0053768157958984375, -0.004704475402832031, -0.004032135009765625, -0.0033597946166992188, -0.0026874542236328125, -0.0020151138305664062, -0.0013427734375, -0.0006704330444335938, 1.9073486328125e-06, 0.0006742477416992188, 0.001346588134765625, 0.0020189285278320312, 0.0026912689208984375, 0.0033636093139648438, 0.00403594970703125, 0.004708290100097656, 0.0053806304931640625, 0.006052970886230469, 0.006725311279296875, 0.007397651672363281, 0.008069992065429688, 0.008742332458496094, 0.0094146728515625, 0.010087013244628906, 0.010759353637695312, 0.011431694030761719, 0.012104034423828125, 0.012776374816894531, 0.013448715209960938, 0.014121055603027344, 0.01479339599609375, 0.015465736389160156, 0.016138076782226562, 0.01681041717529297, 0.017482757568359375, 0.01815509796142578, 0.018827438354492188, 0.019499778747558594, 0.020172119140625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 14.0, 10.0, 18.0, 11.0, 19.0, 21.0, 49.0, 37.0, 62.0, 73.0, 108.0, 145.0, 249.0, 390.0, 867.0, 19520.0, 1021542.0, 3670.0, 660.0, 367.0, 178.0, 137.0, 104.0, 65.0, 36.0, 45.0, 39.0, 16.0, 16.0, 15.0, 15.0, 10.0, 14.0, 9.0, 4.0, 2.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.41796875, -0.4042015075683594, -0.39043426513671875, -0.3766670227050781, -0.3628997802734375, -0.3491325378417969, -0.33536529541015625, -0.3215980529785156, -0.307830810546875, -0.2940635681152344, -0.28029632568359375, -0.2665290832519531, -0.2527618408203125, -0.23899459838867188, -0.22522735595703125, -0.21146011352539062, -0.19769287109375, -0.18392562866210938, -0.17015838623046875, -0.15639114379882812, -0.1426239013671875, -0.12885665893554688, -0.11508941650390625, -0.10132217407226562, -0.087554931640625, -0.07378768920898438, -0.06002044677734375, -0.046253204345703125, -0.0324859619140625, -0.018718719482421875, -0.00495147705078125, 0.008815765380859375, 0.0225830078125, 0.036350250244140625, 0.05011749267578125, 0.06388473510742188, 0.0776519775390625, 0.09141921997070312, 0.10518646240234375, 0.11895370483398438, 0.132720947265625, 0.14648818969726562, 0.16025543212890625, 0.17402267456054688, 0.1877899169921875, 0.20155715942382812, 0.21532440185546875, 0.22909164428710938, 0.24285888671875, 0.2566261291503906, 0.27039337158203125, 0.2841606140136719, 0.2979278564453125, 0.3116950988769531, 0.32546234130859375, 0.3392295837402344, 0.352996826171875, 0.3667640686035156, 0.38053131103515625, 0.3942985534667969, 0.4080657958984375, 0.4218330383300781, 0.43560028076171875, 0.4493675231933594, 0.463134765625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 17.0, 933.0, 65.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5359982252120972, -0.5242775082588196, -0.5125568509101868, -0.5008361339569092, -0.489115446805954, -0.4773947596549988, -0.4656740725040436, -0.4539533853530884, -0.4422326683998108, -0.4305119812488556, -0.4187912940979004, -0.4070705771446228, -0.3953498899936676, -0.3836292028427124, -0.3719085156917572, -0.360187828540802, -0.3484671115875244, -0.3367464244365692, -0.325025737285614, -0.3133050203323364, -0.3015843331813812, -0.289863646030426, -0.2781429588794708, -0.2664222717285156, -0.2547015845775604, -0.24298089742660522, -0.23126019537448883, -0.21953950822353363, -0.20781880617141724, -0.19609811902046204, -0.18437743186950684, -0.17265672981739044, -0.16093601286411285, -0.14921532571315765, -0.13749462366104126, -0.12577393651008606, -0.11405323445796967, -0.10233254730701447, -0.09061185270547867, -0.07889115810394287, -0.06717046350240707, -0.05544976890087128, -0.04372907429933548, -0.03200838342308998, -0.020287688821554184, -0.008566994220018387, 0.003153696656227112, 0.014874391257762909, 0.026595085859298706, 0.0383157804608345, 0.0500364750623703, 0.0617571659386158, 0.0734778642654419, 0.0851985514163971, 0.09691924601793289, 0.10863994061946869, 0.12036063522100449, 0.13208132982254028, 0.14380201697349548, 0.15552271902561188, 0.16724340617656708, 0.17896410822868347, 0.19068479537963867, 0.20240548253059387, 0.21412618458271027]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 7.0, 13.0, 18.0, 22.0, 15.0, 16.0, 26.0, 37.0, 29.0, 29.0, 33.0, 35.0, 32.0, 41.0, 53.0, 45.0, 50.0, 53.0, 56.0, 44.0, 44.0, 45.0, 46.0, 35.0, 28.0, 28.0, 24.0, 29.0, 22.0, 9.0, 10.0, 8.0, 9.0, 2.0, 3.0, 1.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032464563846588135, -0.03133701905608177, -0.03020947240293026, -0.029081925749778748, -0.027954380959272385, -0.02682683616876602, -0.02569928951561451, -0.024571742862462997, -0.023444198071956635, -0.02231665328145027, -0.02118910662829876, -0.020061559975147247, -0.018934015184640884, -0.01780647039413452, -0.01667892374098301, -0.015551378019154072, -0.014423832297325134, -0.013296286575496197, -0.01216874085366726, -0.011041195131838322, -0.009913649410009384, -0.008786103688180447, -0.007658557966351509, -0.0065310122445225716, -0.005403466522693634, -0.0042759208008646965, -0.003148375079035759, -0.0020208293572068214, -0.0008932836353778839, 0.00023426208645105362, 0.0013618078082799911, 0.0024893535301089287, 0.003616899251937866, 0.004744444973766804, 0.005871990695595741, 0.006999536417424679, 0.008127082139253616, 0.009254627861082554, 0.010382173582911491, 0.011509719304740429, 0.012637265026569366, 0.013764810748398304, 0.014892356470227242, 0.016019903123378754, 0.017147447913885117, 0.01827499270439148, 0.01940253935754299, 0.020530086010694504, 0.021657630801200867, 0.02278517559170723, 0.023912722244858742, 0.025040268898010254, 0.026167813688516617, 0.02729535847902298, 0.028422905132174492, 0.029550451785326004, 0.030677996575832367, 0.03180554136633873, 0.03293308615684509, 0.034060634672641754, 0.03518817946314812, 0.03631572425365448, 0.03744327276945114, 0.038570817559957504, 0.03969836235046387]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 8.0, 19.0, 11.0, 12.0, 11.0, 14.0, 23.0, 18.0, 31.0, 41.0, 31.0, 36.0, 38.0, 43.0, 50.0, 55.0, 50.0, 41.0, 53.0, 37.0, 45.0, 39.0, 43.0, 34.0, 39.0, 24.0, 22.0, 28.0, 22.0, 10.0, 16.0, 11.0, 14.0, 7.0, 6.0, 2.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.58001708984375, -5.4178466796875, -5.25567626953125, -5.093505859375, -4.93133544921875, -4.7691650390625, -4.60699462890625, -4.44482421875, -4.28265380859375, -4.1204833984375, -3.95831298828125, -3.796142578125, -3.63397216796875, -3.4718017578125, -3.30963134765625, -3.1474609375, -2.98529052734375, -2.8231201171875, -2.66094970703125, -2.498779296875, -2.33660888671875, -2.1744384765625, -2.01226806640625, -1.85009765625, -1.68792724609375, -1.5257568359375, -1.36358642578125, -1.201416015625, -1.03924560546875, -0.8770751953125, -0.71490478515625, -0.552734375, -0.39056396484375, -0.2283935546875, -0.06622314453125, 0.095947265625, 0.25811767578125, 0.4202880859375, 0.58245849609375, 0.74462890625, 0.90679931640625, 1.0689697265625, 1.23114013671875, 1.393310546875, 1.55548095703125, 1.7176513671875, 1.87982177734375, 2.0419921875, 2.20416259765625, 2.3663330078125, 2.52850341796875, 2.690673828125, 2.85284423828125, 3.0150146484375, 3.17718505859375, 3.33935546875, 3.50152587890625, 3.6636962890625, 3.82586669921875, 3.988037109375, 4.15020751953125, 4.3123779296875, 4.47454833984375, 4.63671875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 10.0, 15.0, 21.0, 40.0, 33.0, 65.0, 104.0, 166.0, 237.0, 404.0, 621.0, 1202.0, 2340.0, 4807.0, 10563.0, 23933.0, 54522.0, 132071.0, 332502.0, 288275.0, 111853.0, 46381.0, 20201.0, 9180.0, 4243.0, 2079.0, 1111.0, 606.0, 365.0, 193.0, 140.0, 101.0, 55.0, 29.0, 31.0, 20.0, 8.0, 9.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6953125, -6.4854736328125, -6.275634765625, -6.0657958984375, -5.85595703125, -5.6461181640625, -5.436279296875, -5.2264404296875, -5.0166015625, -4.8067626953125, -4.596923828125, -4.3870849609375, -4.17724609375, -3.9674072265625, -3.757568359375, -3.5477294921875, -3.337890625, -3.1280517578125, -2.918212890625, -2.7083740234375, -2.49853515625, -2.2886962890625, -2.078857421875, -1.8690185546875, -1.6591796875, -1.4493408203125, -1.239501953125, -1.0296630859375, -0.81982421875, -0.6099853515625, -0.400146484375, -0.1903076171875, 0.01953125, 0.2293701171875, 0.439208984375, 0.6490478515625, 0.85888671875, 1.0687255859375, 1.278564453125, 1.4884033203125, 1.6982421875, 1.9080810546875, 2.117919921875, 2.3277587890625, 2.53759765625, 2.7474365234375, 2.957275390625, 3.1671142578125, 3.376953125, 3.5867919921875, 3.796630859375, 4.0064697265625, 4.21630859375, 4.4261474609375, 4.635986328125, 4.8458251953125, 5.0556640625, 5.2655029296875, 5.475341796875, 5.6851806640625, 5.89501953125, 6.1048583984375, 6.314697265625, 6.5245361328125, 6.734375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 10.0, 6.0, 16.0, 12.0, 17.0, 10.0, 13.0, 32.0, 33.0, 43.0, 38.0, 37.0, 49.0, 70.0, 82.0, 143.0, 223.0, 1314.0, 257.0, 161.0, 92.0, 47.0, 59.0, 53.0, 37.0, 28.0, 29.0, 9.0, 20.0, 18.0, 24.0, 12.0, 7.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2109375, -10.804931640625, -10.39892578125, -9.992919921875, -9.5869140625, -9.180908203125, -8.77490234375, -8.368896484375, -7.962890625, -7.556884765625, -7.15087890625, -6.744873046875, -6.3388671875, -5.932861328125, -5.52685546875, -5.120849609375, -4.71484375, -4.308837890625, -3.90283203125, -3.496826171875, -3.0908203125, -2.684814453125, -2.27880859375, -1.872802734375, -1.466796875, -1.060791015625, -0.65478515625, -0.248779296875, 0.1572265625, 0.563232421875, 0.96923828125, 1.375244140625, 1.78125, 2.187255859375, 2.59326171875, 2.999267578125, 3.4052734375, 3.811279296875, 4.21728515625, 4.623291015625, 5.029296875, 5.435302734375, 5.84130859375, 6.247314453125, 6.6533203125, 7.059326171875, 7.46533203125, 7.871337890625, 8.27734375, 8.683349609375, 9.08935546875, 9.495361328125, 9.9013671875, 10.307373046875, 10.71337890625, 11.119384765625, 11.525390625, 11.931396484375, 12.33740234375, 12.743408203125, 13.1494140625, 13.555419921875, 13.96142578125, 14.367431640625, 14.7734375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 10.0, 14.0, 17.0, 31.0, 31.0, 60.0, 74.0, 71.0, 121.0, 197.0, 308.0, 565.0, 1181.0, 4440.0, 53954.0, 2554755.0, 508481.0, 16931.0, 2337.0, 864.0, 422.0, 275.0, 178.0, 99.0, 90.0, 47.0, 46.0, 33.0, 19.0, 15.0, 10.0, 9.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.015625, -21.3232421875, -20.630859375, -19.9384765625, -19.24609375, -18.5537109375, -17.861328125, -17.1689453125, -16.4765625, -15.7841796875, -15.091796875, -14.3994140625, -13.70703125, -13.0146484375, -12.322265625, -11.6298828125, -10.9375, -10.2451171875, -9.552734375, -8.8603515625, -8.16796875, -7.4755859375, -6.783203125, -6.0908203125, -5.3984375, -4.7060546875, -4.013671875, -3.3212890625, -2.62890625, -1.9365234375, -1.244140625, -0.5517578125, 0.140625, 0.8330078125, 1.525390625, 2.2177734375, 2.91015625, 3.6025390625, 4.294921875, 4.9873046875, 5.6796875, 6.3720703125, 7.064453125, 7.7568359375, 8.44921875, 9.1416015625, 9.833984375, 10.5263671875, 11.21875, 11.9111328125, 12.603515625, 13.2958984375, 13.98828125, 14.6806640625, 15.373046875, 16.0654296875, 16.7578125, 17.4501953125, 18.142578125, 18.8349609375, 19.52734375, 20.2197265625, 20.912109375, 21.6044921875, 22.296875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 39.0, 179.0, 365.0, 312.0, 98.0, 18.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.22732543945312, -65.78202819824219, -63.336727142333984, -60.89142608642578, -58.446128845214844, -56.000831604003906, -53.5555305480957, -51.1102294921875, -48.66493225097656, -46.219635009765625, -43.77433395385742, -41.32903289794922, -38.88373565673828, -36.438438415527344, -33.99313735961914, -31.54783821105957, -29.1025390625, -26.65723991394043, -24.21194076538086, -21.76664161682129, -19.32134246826172, -16.87604331970215, -14.430744171142578, -11.985445022583008, -9.540145874023438, -7.094846725463867, -4.649547576904297, -2.2042484283447266, 0.24105072021484375, 2.686349868774414, 5.131649017333984, 7.576948165893555, 10.022239685058594, 12.467538833618164, 14.912837982177734, 17.358137130737305, 19.803436279296875, 22.248735427856445, 24.694034576416016, 27.139333724975586, 29.584632873535156, 32.029930114746094, 34.4752311706543, 36.9205322265625, 39.36582946777344, 41.811126708984375, 44.25642776489258, 46.70172882080078, 49.14702606201172, 51.592323303222656, 54.03762435913086, 56.48292541503906, 58.92822265625, 61.37351989746094, 63.81882095336914, 66.26412200927734, 68.70941925048828, 71.15471649169922, 73.60002136230469, 76.04531860351562, 78.49061584472656, 80.9359130859375, 83.38121032714844, 85.8265151977539, 88.27181243896484]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 5.0, 5.0, 6.0, 6.0, 9.0, 15.0, 13.0, 9.0, 13.0, 21.0, 27.0, 38.0, 25.0, 39.0, 22.0, 32.0, 36.0, 33.0, 42.0, 39.0, 37.0, 28.0, 44.0, 33.0, 38.0, 46.0, 38.0, 50.0, 26.0, 26.0, 29.0, 22.0, 23.0, 28.0, 16.0, 18.0, 12.0, 17.0, 8.0, 6.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.076942443847656, -27.23221206665039, -26.387481689453125, -25.54275131225586, -24.698020935058594, -23.853290557861328, -23.008560180664062, -22.163829803466797, -21.31909942626953, -20.474369049072266, -19.629638671875, -18.784908294677734, -17.94017791748047, -17.095447540283203, -16.250717163085938, -15.405986785888672, -14.561257362365723, -13.716526985168457, -12.871796607971191, -12.027066230773926, -11.18233585357666, -10.337606430053711, -9.492876052856445, -8.64814567565918, -7.803414821624756, -6.95868444442749, -6.113954067230225, -5.269224166870117, -4.424493789672852, -3.579763412475586, -2.7350330352783203, -1.8903026580810547, -1.045572280883789, -0.2008419632911682, 0.6438883543014526, 1.4886186122894287, 2.3333489894866943, 3.178079128265381, 4.0228095054626465, 4.867539882659912, 5.712270259857178, 6.557000637054443, 7.401731014251709, 8.246460914611816, 9.091191291809082, 9.935921669006348, 10.780652046203613, 11.625382423400879, 12.470112800598145, 13.31484317779541, 14.159573554992676, 15.004303932189941, 15.849034309387207, 16.693763732910156, 17.538494110107422, 18.383224487304688, 19.227954864501953, 20.07268524169922, 20.917415618896484, 21.76214599609375, 22.606876373291016, 23.45160675048828, 24.296337127685547, 25.141067504882812, 25.985797882080078]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 8.0, 7.0, 3.0, 10.0, 12.0, 11.0, 12.0, 18.0, 17.0, 20.0, 25.0, 27.0, 24.0, 27.0, 37.0, 42.0, 38.0, 50.0, 27.0, 34.0, 44.0, 40.0, 35.0, 36.0, 39.0, 41.0, 40.0, 40.0, 37.0, 24.0, 16.0, 28.0, 25.0, 17.0, 17.0, 20.0, 13.0, 9.0, 11.0, 6.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.06640625, -4.9140625, -4.76171875, -4.609375, -4.45703125, -4.3046875, -4.15234375, -4.0, -3.84765625, -3.6953125, -3.54296875, -3.390625, -3.23828125, -3.0859375, -2.93359375, -2.78125, -2.62890625, -2.4765625, -2.32421875, -2.171875, -2.01953125, -1.8671875, -1.71484375, -1.5625, -1.41015625, -1.2578125, -1.10546875, -0.953125, -0.80078125, -0.6484375, -0.49609375, -0.34375, -0.19140625, -0.0390625, 0.11328125, 0.265625, 0.41796875, 0.5703125, 0.72265625, 0.875, 1.02734375, 1.1796875, 1.33203125, 1.484375, 1.63671875, 1.7890625, 1.94140625, 2.09375, 2.24609375, 2.3984375, 2.55078125, 2.703125, 2.85546875, 3.0078125, 3.16015625, 3.3125, 3.46484375, 3.6171875, 3.76953125, 3.921875, 4.07421875, 4.2265625, 4.37890625, 4.53125, 4.68359375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 12.0, 15.0, 18.0, 15.0, 29.0, 26.0, 36.0, 41.0, 60.0, 86.0, 101.0, 132.0, 210.0, 298.0, 416.0, 1246.0, 24893.0, 3798301.0, 362895.0, 3588.0, 566.0, 358.0, 221.0, 146.0, 140.0, 111.0, 49.0, 43.0, 44.0, 32.0, 31.0, 24.0, 15.0, 10.0, 5.0, 13.0, 8.0, 7.0, 6.0, 5.0, 2.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.625, -35.570556640625, -34.51611328125, -33.461669921875, -32.4072265625, -31.352783203125, -30.29833984375, -29.243896484375, -28.189453125, -27.135009765625, -26.08056640625, -25.026123046875, -23.9716796875, -22.917236328125, -21.86279296875, -20.808349609375, -19.75390625, -18.699462890625, -17.64501953125, -16.590576171875, -15.5361328125, -14.481689453125, -13.42724609375, -12.372802734375, -11.318359375, -10.263916015625, -9.20947265625, -8.155029296875, -7.1005859375, -6.046142578125, -4.99169921875, -3.937255859375, -2.8828125, -1.828369140625, -0.77392578125, 0.280517578125, 1.3349609375, 2.389404296875, 3.44384765625, 4.498291015625, 5.552734375, 6.607177734375, 7.66162109375, 8.716064453125, 9.7705078125, 10.824951171875, 11.87939453125, 12.933837890625, 13.98828125, 15.042724609375, 16.09716796875, 17.151611328125, 18.2060546875, 19.260498046875, 20.31494140625, 21.369384765625, 22.423828125, 23.478271484375, 24.53271484375, 25.587158203125, 26.6416015625, 27.696044921875, 28.75048828125, 29.804931640625, 30.859375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 7.0, 12.0, 14.0, 21.0, 18.0, 26.0, 41.0, 46.0, 60.0, 107.0, 131.0, 187.0, 262.0, 311.0, 455.0, 512.0, 465.0, 363.0, 250.0, 192.0, 124.0, 105.0, 79.0, 63.0, 45.0, 30.0, 27.0, 16.0, 18.0, 14.0, 16.0, 10.0, 8.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.73828125, -6.52490234375, -6.3115234375, -6.09814453125, -5.884765625, -5.67138671875, -5.4580078125, -5.24462890625, -5.03125, -4.81787109375, -4.6044921875, -4.39111328125, -4.177734375, -3.96435546875, -3.7509765625, -3.53759765625, -3.32421875, -3.11083984375, -2.8974609375, -2.68408203125, -2.470703125, -2.25732421875, -2.0439453125, -1.83056640625, -1.6171875, -1.40380859375, -1.1904296875, -0.97705078125, -0.763671875, -0.55029296875, -0.3369140625, -0.12353515625, 0.08984375, 0.30322265625, 0.5166015625, 0.72998046875, 0.943359375, 1.15673828125, 1.3701171875, 1.58349609375, 1.796875, 2.01025390625, 2.2236328125, 2.43701171875, 2.650390625, 2.86376953125, 3.0771484375, 3.29052734375, 3.50390625, 3.71728515625, 3.9306640625, 4.14404296875, 4.357421875, 4.57080078125, 4.7841796875, 4.99755859375, 5.2109375, 5.42431640625, 5.6376953125, 5.85107421875, 6.064453125, 6.27783203125, 6.4912109375, 6.70458984375, 6.91796875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 11.0, 22.0, 19.0, 20.0, 38.0, 27.0, 52.0, 66.0, 105.0, 182.0, 304.0, 637.0, 2093.0, 12221.0, 139593.0, 3019515.0, 960304.0, 50748.0, 5877.0, 1239.0, 502.0, 220.0, 134.0, 78.0, 57.0, 57.0, 33.0, 28.0, 13.0, 15.0, 15.0, 7.0, 8.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.625, -19.04443359375, -18.4638671875, -17.88330078125, -17.302734375, -16.72216796875, -16.1416015625, -15.56103515625, -14.98046875, -14.39990234375, -13.8193359375, -13.23876953125, -12.658203125, -12.07763671875, -11.4970703125, -10.91650390625, -10.3359375, -9.75537109375, -9.1748046875, -8.59423828125, -8.013671875, -7.43310546875, -6.8525390625, -6.27197265625, -5.69140625, -5.11083984375, -4.5302734375, -3.94970703125, -3.369140625, -2.78857421875, -2.2080078125, -1.62744140625, -1.046875, -0.46630859375, 0.1142578125, 0.69482421875, 1.275390625, 1.85595703125, 2.4365234375, 3.01708984375, 3.59765625, 4.17822265625, 4.7587890625, 5.33935546875, 5.919921875, 6.50048828125, 7.0810546875, 7.66162109375, 8.2421875, 8.82275390625, 9.4033203125, 9.98388671875, 10.564453125, 11.14501953125, 11.7255859375, 12.30615234375, 12.88671875, 13.46728515625, 14.0478515625, 14.62841796875, 15.208984375, 15.78955078125, 16.3701171875, 16.95068359375, 17.53125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 9.0, 136.0, 546.0, 302.0, 25.0, 0.0, 1.0], "bins": [-292.4849548339844, -287.58587646484375, -282.686767578125, -277.7876892089844, -272.8885803222656, -267.989501953125, -263.0904235839844, -258.1913146972656, -253.292236328125, -248.3931427001953, -243.49404907226562, -238.594970703125, -233.6958770751953, -228.79678344726562, -223.89768981933594, -218.99859619140625, -214.09950256347656, -209.20040893554688, -204.3013153076172, -199.40223693847656, -194.50314331054688, -189.6040496826172, -184.7049560546875, -179.8058624267578, -174.90676879882812, -170.00767517089844, -165.10858154296875, -160.20950317382812, -155.31040954589844, -150.41131591796875, -145.51222229003906, -140.61312866210938, -135.7140350341797, -130.81494140625, -125.91585540771484, -121.01676177978516, -116.11767578125, -111.21858215332031, -106.31948852539062, -101.42039489746094, -96.52131652832031, -91.62222290039062, -86.72313690185547, -81.82404327392578, -76.92495727539062, -72.02586364746094, -67.12677001953125, -62.22768020629883, -57.32858657836914, -52.42949676513672, -47.53040313720703, -42.63131332397461, -37.73222351074219, -32.833133697509766, -27.93404197692871, -23.034950256347656, -18.135860443115234, -13.236769676208496, -8.337678909301758, -3.4385881423950195, 1.4605026245117188, 6.359592437744141, 11.258684158325195, 16.15777587890625, 21.056865692138672]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 0.0, 5.0, 2.0, 8.0, 9.0, 8.0, 8.0, 7.0, 19.0, 9.0, 19.0, 22.0, 22.0, 28.0, 25.0, 19.0, 39.0, 47.0, 23.0, 34.0, 42.0, 49.0, 40.0, 27.0, 47.0, 34.0, 47.0, 41.0, 37.0, 38.0, 23.0, 23.0, 27.0, 26.0, 27.0, 15.0, 25.0, 23.0, 10.0, 8.0, 10.0, 11.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.606096267700195, -21.865806579589844, -21.125516891479492, -20.38522720336914, -19.644939422607422, -18.90464973449707, -18.16436004638672, -17.424070358276367, -16.683780670166016, -15.943490982055664, -15.203202247619629, -14.462912559509277, -13.722623825073242, -12.98233413696289, -12.242044448852539, -11.501754760742188, -10.761466979980469, -10.021177291870117, -9.280888557434082, -8.54059886932373, -7.800309658050537, -7.060020446777344, -6.319730758666992, -5.579441547393799, -4.8391523361206055, -4.098863124847412, -3.3585736751556396, -2.618284225463867, -1.8779950141906738, -1.1377058029174805, -0.3974161148071289, 0.34287309646606445, 1.0831642150878906, 1.8234535455703735, 2.5637428760528564, 3.304032325744629, 4.044321537017822, 4.784610748291016, 5.524900436401367, 6.2651896476745605, 7.005478858947754, 7.745768070220947, 8.48605728149414, 9.226346969604492, 9.966636657714844, 10.706925392150879, 11.44721508026123, 12.187503814697266, 12.927793502807617, 13.668083190917969, 14.408371925354004, 15.148661613464355, 15.88895034790039, 16.629240036010742, 17.369529724121094, 18.109819412231445, 18.850109100341797, 19.59039878845215, 20.3306884765625, 21.07097625732422, 21.81126594543457, 22.551555633544922, 23.291845321655273, 24.032135009765625, 24.772422790527344]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 5.0, 16.0, 7.0, 14.0, 15.0, 17.0, 16.0, 15.0, 33.0, 33.0, 35.0, 34.0, 27.0, 35.0, 34.0, 45.0, 45.0, 36.0, 34.0, 41.0, 37.0, 22.0, 37.0, 36.0, 31.0, 30.0, 21.0, 38.0, 23.0, 26.0, 27.0, 17.0, 15.0, 14.0, 14.0, 7.0, 7.0, 6.0, 5.0, 3.0, 3.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.26953125, -4.12945556640625, -3.9893798828125, -3.84930419921875, -3.709228515625, -3.56915283203125, -3.4290771484375, -3.28900146484375, -3.14892578125, -3.00885009765625, -2.8687744140625, -2.72869873046875, -2.588623046875, -2.44854736328125, -2.3084716796875, -2.16839599609375, -2.0283203125, -1.88824462890625, -1.7481689453125, -1.60809326171875, -1.468017578125, -1.32794189453125, -1.1878662109375, -1.04779052734375, -0.90771484375, -0.76763916015625, -0.6275634765625, -0.48748779296875, -0.347412109375, -0.20733642578125, -0.0672607421875, 0.07281494140625, 0.212890625, 0.35296630859375, 0.4930419921875, 0.63311767578125, 0.773193359375, 0.91326904296875, 1.0533447265625, 1.19342041015625, 1.33349609375, 1.47357177734375, 1.6136474609375, 1.75372314453125, 1.893798828125, 2.03387451171875, 2.1739501953125, 2.31402587890625, 2.4541015625, 2.59417724609375, 2.7342529296875, 2.87432861328125, 3.014404296875, 3.15447998046875, 3.2945556640625, 3.43463134765625, 3.57470703125, 3.71478271484375, 3.8548583984375, 3.99493408203125, 4.135009765625, 4.27508544921875, 4.4151611328125, 4.55523681640625, 4.6953125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 5.0, 8.0, 16.0, 26.0, 20.0, 38.0, 66.0, 92.0, 140.0, 197.0, 307.0, 421.0, 617.0, 902.0, 1317.0, 1864.0, 2712.0, 4011.0, 5550.0, 8092.0, 11516.0, 16656.0, 23824.0, 33247.0, 46347.0, 61921.0, 79722.0, 97688.0, 110535.0, 112253.0, 101374.0, 85682.0, 66915.0, 50370.0, 36881.0, 26220.0, 18588.0, 13230.0, 9063.0, 6304.0, 4234.0, 3026.0, 2042.0, 1359.0, 1009.0, 687.0, 464.0, 359.0, 216.0, 155.0, 96.0, 49.0, 40.0, 25.0, 20.0, 17.0, 12.0, 8.0, 5.0, 4.0, 4.0], "bins": [-0.54736328125, -0.53033447265625, -0.5133056640625, -0.49627685546875, -0.479248046875, -0.46221923828125, -0.4451904296875, -0.42816162109375, -0.4111328125, -0.39410400390625, -0.3770751953125, -0.36004638671875, -0.343017578125, -0.32598876953125, -0.3089599609375, -0.29193115234375, -0.27490234375, -0.25787353515625, -0.2408447265625, -0.22381591796875, -0.206787109375, -0.18975830078125, -0.1727294921875, -0.15570068359375, -0.138671875, -0.12164306640625, -0.1046142578125, -0.08758544921875, -0.070556640625, -0.05352783203125, -0.0364990234375, -0.01947021484375, -0.00244140625, 0.01458740234375, 0.0316162109375, 0.04864501953125, 0.065673828125, 0.08270263671875, 0.0997314453125, 0.11676025390625, 0.1337890625, 0.15081787109375, 0.1678466796875, 0.18487548828125, 0.201904296875, 0.21893310546875, 0.2359619140625, 0.25299072265625, 0.27001953125, 0.28704833984375, 0.3040771484375, 0.32110595703125, 0.338134765625, 0.35516357421875, 0.3721923828125, 0.38922119140625, 0.40625, 0.42327880859375, 0.4403076171875, 0.45733642578125, 0.474365234375, 0.49139404296875, 0.5084228515625, 0.52545166015625, 0.54248046875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 3.0, 8.0, 6.0, 7.0, 8.0, 10.0, 12.0, 13.0, 15.0, 13.0, 23.0, 29.0, 17.0, 23.0, 34.0, 44.0, 32.0, 29.0, 38.0, 32.0, 48.0, 47.0, 1073.0, 50.0, 34.0, 41.0, 40.0, 41.0, 28.0, 30.0, 27.0, 27.0, 21.0, 20.0, 22.0, 11.0, 16.0, 14.0, 15.0, 9.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-4.18359375, -4.062103271484375, -3.94061279296875, -3.819122314453125, -3.6976318359375, -3.576141357421875, -3.45465087890625, -3.333160400390625, -3.211669921875, -3.090179443359375, -2.96868896484375, -2.847198486328125, -2.7257080078125, -2.604217529296875, -2.48272705078125, -2.361236572265625, -2.23974609375, -2.118255615234375, -1.99676513671875, -1.875274658203125, -1.7537841796875, -1.632293701171875, -1.51080322265625, -1.389312744140625, -1.267822265625, -1.146331787109375, -1.02484130859375, -0.903350830078125, -0.7818603515625, -0.660369873046875, -0.53887939453125, -0.417388916015625, -0.2958984375, -0.174407958984375, -0.05291748046875, 0.068572998046875, 0.1900634765625, 0.311553955078125, 0.43304443359375, 0.554534912109375, 0.676025390625, 0.797515869140625, 0.91900634765625, 1.040496826171875, 1.1619873046875, 1.283477783203125, 1.40496826171875, 1.526458740234375, 1.64794921875, 1.769439697265625, 1.89093017578125, 2.012420654296875, 2.1339111328125, 2.255401611328125, 2.37689208984375, 2.498382568359375, 2.619873046875, 2.741363525390625, 2.86285400390625, 2.984344482421875, 3.1058349609375, 3.227325439453125, 3.34881591796875, 3.470306396484375, 3.591796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 11.0, 6.0, 11.0, 8.0, 31.0, 16.0, 37.0, 43.0, 62.0, 98.0, 123.0, 189.0, 220.0, 357.0, 535.0, 732.0, 1093.0, 1595.0, 2306.0, 3395.0, 5245.0, 7563.0, 11277.0, 18262.0, 29362.0, 124701.0, 1800683.0, 32631.0, 19207.0, 12346.0, 8048.0, 5394.0, 3577.0, 2557.0, 1700.0, 1117.0, 808.0, 516.0, 353.0, 292.0, 192.0, 114.0, 86.0, 68.0, 50.0, 36.0, 30.0, 17.0, 12.0, 6.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3145294189453125, -1.267730712890625, -1.2209320068359375, -1.17413330078125, -1.1273345947265625, -1.080535888671875, -1.0337371826171875, -0.9869384765625, -0.9401397705078125, -0.893341064453125, -0.8465423583984375, -0.79974365234375, -0.7529449462890625, -0.706146240234375, -0.6593475341796875, -0.612548828125, -0.5657501220703125, -0.518951416015625, -0.4721527099609375, -0.42535400390625, -0.3785552978515625, -0.331756591796875, -0.2849578857421875, -0.2381591796875, -0.1913604736328125, -0.144561767578125, -0.0977630615234375, -0.05096435546875, -0.0041656494140625, 0.042633056640625, 0.0894317626953125, 0.13623046875, 0.1830291748046875, 0.229827880859375, 0.2766265869140625, 0.32342529296875, 0.3702239990234375, 0.417022705078125, 0.4638214111328125, 0.5106201171875, 0.5574188232421875, 0.604217529296875, 0.6510162353515625, 0.69781494140625, 0.7446136474609375, 0.791412353515625, 0.8382110595703125, 0.885009765625, 0.9318084716796875, 0.978607177734375, 1.0254058837890625, 1.07220458984375, 1.1190032958984375, 1.165802001953125, 1.2126007080078125, 1.2593994140625, 1.3061981201171875, 1.352996826171875, 1.3997955322265625, 1.44659423828125, 1.4933929443359375, 1.540191650390625, 1.5869903564453125, 1.6337890625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 3.0, 6.0, 6.0, 9.0, 15.0, 10.0, 15.0, 14.0, 17.0, 28.0, 28.0, 39.0, 52.0, 44.0, 61.0, 54.0, 78.0, 65.0, 61.0, 63.0, 60.0, 58.0, 36.0, 33.0, 27.0, 26.0, 9.0, 12.0, 17.0, 10.0, 5.0, 14.0, 4.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021728515625, -0.021075963973999023, -0.020423412322998047, -0.01977086067199707, -0.019118309020996094, -0.018465757369995117, -0.01781320571899414, -0.017160654067993164, -0.016508102416992188, -0.01585555076599121, -0.015202999114990234, -0.014550447463989258, -0.013897895812988281, -0.013245344161987305, -0.012592792510986328, -0.011940240859985352, -0.011287689208984375, -0.010635137557983398, -0.009982585906982422, -0.009330034255981445, -0.008677482604980469, -0.008024930953979492, -0.007372379302978516, -0.006719827651977539, -0.0060672760009765625, -0.005414724349975586, -0.004762172698974609, -0.004109621047973633, -0.0034570693969726562, -0.0028045177459716797, -0.002151966094970703, -0.0014994144439697266, -0.00084686279296875, -0.00019431114196777344, 0.0004582405090332031, 0.0011107921600341797, 0.0017633438110351562, 0.002415895462036133, 0.0030684471130371094, 0.003720998764038086, 0.0043735504150390625, 0.005026102066040039, 0.005678653717041016, 0.006331205368041992, 0.006983757019042969, 0.007636308670043945, 0.008288860321044922, 0.008941411972045898, 0.009593963623046875, 0.010246515274047852, 0.010899066925048828, 0.011551618576049805, 0.012204170227050781, 0.012856721878051758, 0.013509273529052734, 0.014161825180053711, 0.014814376831054688, 0.015466928482055664, 0.01611948013305664, 0.016772031784057617, 0.017424583435058594, 0.01807713508605957, 0.018729686737060547, 0.019382238388061523, 0.0200347900390625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 12.0, 10.0, 18.0, 13.0, 26.0, 26.0, 37.0, 44.0, 61.0, 77.0, 120.0, 172.0, 303.0, 472.0, 1025.0, 26904.0, 1010268.0, 6773.0, 831.0, 463.0, 234.0, 189.0, 122.0, 71.0, 60.0, 48.0, 36.0, 22.0, 20.0, 24.0, 12.0, 13.0, 8.0, 4.0, 4.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.356201171875, -0.3444786071777344, -0.33275604248046875, -0.3210334777832031, -0.3093109130859375, -0.2975883483886719, -0.28586578369140625, -0.2741432189941406, -0.262420654296875, -0.2506980895996094, -0.23897552490234375, -0.22725296020507812, -0.2155303955078125, -0.20380783081054688, -0.19208526611328125, -0.18036270141601562, -0.16864013671875, -0.15691757202148438, -0.14519500732421875, -0.13347244262695312, -0.1217498779296875, -0.11002731323242188, -0.09830474853515625, -0.08658218383789062, -0.074859619140625, -0.06313705444335938, -0.05141448974609375, -0.039691925048828125, -0.0279693603515625, -0.016246795654296875, -0.00452423095703125, 0.007198333740234375, 0.0189208984375, 0.030643463134765625, 0.04236602783203125, 0.054088592529296875, 0.0658111572265625, 0.07753372192382812, 0.08925628662109375, 0.10097885131835938, 0.112701416015625, 0.12442398071289062, 0.13614654541015625, 0.14786911010742188, 0.1595916748046875, 0.17131423950195312, 0.18303680419921875, 0.19475936889648438, 0.20648193359375, 0.21820449829101562, 0.22992706298828125, 0.24164962768554688, 0.2533721923828125, 0.2650947570800781, 0.27681732177734375, 0.2885398864746094, 0.300262451171875, 0.3119850158691406, 0.32370758056640625, 0.3354301452636719, 0.3471527099609375, 0.3588752746582031, 0.37059783935546875, 0.3823204040527344, 0.39404296875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 42.0, 221.0, 568.0, 162.0, 13.0, 2.0], "bins": [-0.1934494823217392, -0.19024796783924103, -0.18704643845558167, -0.1838449239730835, -0.18064340949058533, -0.17744189500808716, -0.1742403656244278, -0.17103885114192963, -0.16783733665943146, -0.1646358221769333, -0.16143429279327393, -0.15823277831077576, -0.1550312638282776, -0.15182974934577942, -0.14862821996212006, -0.1454267054796219, -0.14222517609596252, -0.13902366161346436, -0.135822132229805, -0.13262061774730682, -0.12941910326480865, -0.12621758878231049, -0.12301605939865112, -0.11981454491615295, -0.11661303043365479, -0.11341150850057602, -0.11020999401807785, -0.10700847208499908, -0.10380695760250092, -0.10060543566942215, -0.09740391373634338, -0.09420239925384521, -0.09100089222192764, -0.08779937028884888, -0.08459785580635071, -0.08139633387327194, -0.07819481939077377, -0.07499329745769501, -0.07179178297519684, -0.06859026104211807, -0.0653887391090393, -0.06218722090125084, -0.05898570269346237, -0.055784180760383606, -0.05258266627788544, -0.04938114434480667, -0.046179626137018204, -0.042978107929229736, -0.03977659344673157, -0.0365750752389431, -0.03337355703115463, -0.030172036960721016, -0.02697051875293255, -0.02376900054514408, -0.020567480474710464, -0.017365962266921997, -0.014164443127810955, -0.010962923988699913, -0.007761405780911446, -0.004559886641800404, -0.0013583684340119362, 0.0018431497737765312, 0.005044669844210148, 0.008246188051998615, 0.011447706259787083]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 10.0, 20.0, 17.0, 6.0, 16.0, 19.0, 18.0, 14.0, 25.0, 36.0, 31.0, 21.0, 33.0, 38.0, 30.0, 42.0, 30.0, 37.0, 39.0, 55.0, 48.0, 40.0, 38.0, 34.0, 34.0, 40.0, 21.0, 25.0, 17.0, 24.0, 23.0, 22.0, 13.0, 15.0, 13.0, 3.0, 10.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0181770920753479, -0.017644768580794334, -0.01711244508624077, -0.016580121591687202, -0.016047798097133636, -0.01551547460258007, -0.014983151108026505, -0.014450827613472939, -0.013918504118919373, -0.013386180624365807, -0.01285385712981224, -0.012321533635258675, -0.011789210140705109, -0.011256886646151543, -0.010724563151597977, -0.01019223965704441, -0.009659916162490845, -0.009127592667937279, -0.008595269173383713, -0.008062945678830147, -0.007530622184276581, -0.006998298689723015, -0.006465975195169449, -0.005933651700615883, -0.005401328206062317, -0.004869004711508751, -0.004336681216955185, -0.003804357722401619, -0.003272034227848053, -0.002739710733294487, -0.002207387238740921, -0.001675063744187355, -0.001142740249633789, -0.0006104167550802231, -7.80932605266571e-05, 0.0004542302340269089, 0.0009865537285804749, 0.0015188772231340408, 0.002051200717687607, 0.002583524212241173, 0.0031158477067947388, 0.0036481712013483047, 0.004180494695901871, 0.004712818190455437, 0.005245141685009003, 0.005777465179562569, 0.006309788674116135, 0.006842112168669701, 0.007374435663223267, 0.007906759157776833, 0.008439082652330399, 0.008971406146883965, 0.00950372964143753, 0.010036053135991096, 0.010568376630544662, 0.011100700125098228, 0.011633023619651794, 0.01216534711420536, 0.012697670608758926, 0.013229994103312492, 0.013762317597866058, 0.014294641092419624, 0.01482696458697319, 0.015359288081526756, 0.015891611576080322]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 6.0, 4.0, 3.0, 5.0, 6.0, 6.0, 6.0, 13.0, 19.0, 15.0, 18.0, 20.0, 15.0, 24.0, 18.0, 23.0, 27.0, 35.0, 36.0, 40.0, 42.0, 41.0, 46.0, 42.0, 45.0, 35.0, 39.0, 36.0, 35.0, 38.0, 36.0, 27.0, 22.0, 17.0, 25.0, 23.0, 21.0, 18.0, 21.0, 12.0, 8.0, 6.0, 4.0, 3.0, 4.0, 6.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.32354736328125, -4.1783447265625, -4.03314208984375, -3.887939453125, -3.74273681640625, -3.5975341796875, -3.45233154296875, -3.30712890625, -3.16192626953125, -3.0167236328125, -2.87152099609375, -2.726318359375, -2.58111572265625, -2.4359130859375, -2.29071044921875, -2.1455078125, -2.00030517578125, -1.8551025390625, -1.70989990234375, -1.564697265625, -1.41949462890625, -1.2742919921875, -1.12908935546875, -0.98388671875, -0.83868408203125, -0.6934814453125, -0.54827880859375, -0.403076171875, -0.25787353515625, -0.1126708984375, 0.03253173828125, 0.177734375, 0.32293701171875, 0.4681396484375, 0.61334228515625, 0.758544921875, 0.90374755859375, 1.0489501953125, 1.19415283203125, 1.33935546875, 1.48455810546875, 1.6297607421875, 1.77496337890625, 1.920166015625, 2.06536865234375, 2.2105712890625, 2.35577392578125, 2.5009765625, 2.64617919921875, 2.7913818359375, 2.93658447265625, 3.081787109375, 3.22698974609375, 3.3721923828125, 3.51739501953125, 3.66259765625, 3.80780029296875, 3.9530029296875, 4.09820556640625, 4.243408203125, 4.38861083984375, 4.5338134765625, 4.67901611328125, 4.82421875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 7.0, 10.0, 10.0, 18.0, 26.0, 26.0, 37.0, 47.0, 62.0, 93.0, 154.0, 176.0, 257.0, 357.0, 512.0, 715.0, 1271.0, 2124.0, 3937.0, 7591.0, 15059.0, 31538.0, 68090.0, 154194.0, 310693.0, 247088.0, 108150.0, 48843.0, 22914.0, 11120.0, 5568.0, 2953.0, 1681.0, 1043.0, 649.0, 448.0, 312.0, 200.0, 147.0, 101.0, 97.0, 69.0, 36.0, 43.0, 23.0, 15.0, 16.0, 13.0, 7.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.23065185546875, -5.0550537109375, -4.87945556640625, -4.703857421875, -4.52825927734375, -4.3526611328125, -4.17706298828125, -4.00146484375, -3.82586669921875, -3.6502685546875, -3.47467041015625, -3.299072265625, -3.12347412109375, -2.9478759765625, -2.77227783203125, -2.5966796875, -2.42108154296875, -2.2454833984375, -2.06988525390625, -1.894287109375, -1.71868896484375, -1.5430908203125, -1.36749267578125, -1.19189453125, -1.01629638671875, -0.8406982421875, -0.66510009765625, -0.489501953125, -0.31390380859375, -0.1383056640625, 0.03729248046875, 0.212890625, 0.38848876953125, 0.5640869140625, 0.73968505859375, 0.915283203125, 1.09088134765625, 1.2664794921875, 1.44207763671875, 1.61767578125, 1.79327392578125, 1.9688720703125, 2.14447021484375, 2.320068359375, 2.49566650390625, 2.6712646484375, 2.84686279296875, 3.0224609375, 3.19805908203125, 3.3736572265625, 3.54925537109375, 3.724853515625, 3.90045166015625, 4.0760498046875, 4.25164794921875, 4.42724609375, 4.60284423828125, 4.7784423828125, 4.95404052734375, 5.129638671875, 5.30523681640625, 5.4808349609375, 5.65643310546875, 5.83203125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 11.0, 14.0, 12.0, 18.0, 26.0, 24.0, 28.0, 23.0, 35.0, 44.0, 59.0, 60.0, 75.0, 138.0, 256.0, 1384.0, 247.0, 132.0, 70.0, 53.0, 34.0, 46.0, 42.0, 25.0, 34.0, 20.0, 28.0, 18.0, 12.0, 11.0, 19.0, 9.0, 2.0, 12.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.03125, -10.6302490234375, -10.229248046875, -9.8282470703125, -9.42724609375, -9.0262451171875, -8.625244140625, -8.2242431640625, -7.8232421875, -7.4222412109375, -7.021240234375, -6.6202392578125, -6.21923828125, -5.8182373046875, -5.417236328125, -5.0162353515625, -4.615234375, -4.2142333984375, -3.813232421875, -3.4122314453125, -3.01123046875, -2.6102294921875, -2.209228515625, -1.8082275390625, -1.4072265625, -1.0062255859375, -0.605224609375, -0.2042236328125, 0.19677734375, 0.5977783203125, 0.998779296875, 1.3997802734375, 1.80078125, 2.2017822265625, 2.602783203125, 3.0037841796875, 3.40478515625, 3.8057861328125, 4.206787109375, 4.6077880859375, 5.0087890625, 5.4097900390625, 5.810791015625, 6.2117919921875, 6.61279296875, 7.0137939453125, 7.414794921875, 7.8157958984375, 8.216796875, 8.6177978515625, 9.018798828125, 9.4197998046875, 9.82080078125, 10.2218017578125, 10.622802734375, 11.0238037109375, 11.4248046875, 11.8258056640625, 12.226806640625, 12.6278076171875, 13.02880859375, 13.4298095703125, 13.830810546875, 14.2318115234375, 14.6328125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 6.0, 11.0, 11.0, 10.0, 18.0, 17.0, 24.0, 39.0, 54.0, 75.0, 99.0, 125.0, 197.0, 298.0, 449.0, 842.0, 2019.0, 146485.0, 2987445.0, 4694.0, 1072.0, 561.0, 351.0, 220.0, 171.0, 110.0, 70.0, 57.0, 40.0, 34.0, 23.0, 8.0, 11.0, 17.0, 10.0, 7.0, 8.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.21875, -42.845703125, -41.47265625, -40.099609375, -38.7265625, -37.353515625, -35.98046875, -34.607421875, -33.234375, -31.861328125, -30.48828125, -29.115234375, -27.7421875, -26.369140625, -24.99609375, -23.623046875, -22.25, -20.876953125, -19.50390625, -18.130859375, -16.7578125, -15.384765625, -14.01171875, -12.638671875, -11.265625, -9.892578125, -8.51953125, -7.146484375, -5.7734375, -4.400390625, -3.02734375, -1.654296875, -0.28125, 1.091796875, 2.46484375, 3.837890625, 5.2109375, 6.583984375, 7.95703125, 9.330078125, 10.703125, 12.076171875, 13.44921875, 14.822265625, 16.1953125, 17.568359375, 18.94140625, 20.314453125, 21.6875, 23.060546875, 24.43359375, 25.806640625, 27.1796875, 28.552734375, 29.92578125, 31.298828125, 32.671875, 34.044921875, 35.41796875, 36.791015625, 38.1640625, 39.537109375, 40.91015625, 42.283203125, 43.65625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 53.0, 604.0, 341.0, 13.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.81536865234375, -245.48989868164062, -239.16441345214844, -232.8389434814453, -226.51345825195312, -220.18798828125, -213.86251831054688, -207.53704833984375, -201.21156311035156, -194.88609313964844, -188.56060791015625, -182.23513793945312, -175.90966796875, -169.5841827392578, -163.2587127685547, -156.9332275390625, -150.60775756835938, -144.28228759765625, -137.95680236816406, -131.63133239746094, -125.30585479736328, -118.98037719726562, -112.6549072265625, -106.32942962646484, -100.00395202636719, -93.67847442626953, -87.35299682617188, -81.02752685546875, -74.7020492553711, -68.37657165527344, -62.05109786987305, -55.725624084472656, -49.400146484375, -43.074668884277344, -36.74919509887695, -30.42371940612793, -24.098243713378906, -17.772768020629883, -11.44729232788086, -5.121818542480469, 1.2036590576171875, 7.529134750366211, 13.854610443115234, 20.180086135864258, 26.50556182861328, 32.83103942871094, 39.15651321411133, 45.48198699951172, 51.807464599609375, 58.13294219970703, 64.45841979980469, 70.78388977050781, 77.10936737060547, 83.43484497070312, 89.76031494140625, 96.0857925415039, 102.41127014160156, 108.73674774169922, 115.06222534179688, 121.3876953125, 127.71317291259766, 134.0386505126953, 140.36412048339844, 146.68960571289062, 153.01507568359375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 6.0, 5.0, 4.0, 5.0, 8.0, 11.0, 11.0, 10.0, 22.0, 10.0, 16.0, 29.0, 27.0, 23.0, 38.0, 32.0, 41.0, 43.0, 41.0, 41.0, 38.0, 44.0, 44.0, 44.0, 47.0, 40.0, 28.0, 34.0, 33.0, 38.0, 34.0, 29.0, 33.0, 15.0, 16.0, 13.0, 12.0, 9.0, 10.0, 6.0, 3.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.42636489868164, -34.30540466308594, -33.184444427490234, -32.06348419189453, -30.942523956298828, -29.821563720703125, -28.700603485107422, -27.57964324951172, -26.458683013916016, -25.337722778320312, -24.21676254272461, -23.095802307128906, -21.974842071533203, -20.8538818359375, -19.732921600341797, -18.611961364746094, -17.490999221801758, -16.370038986206055, -15.249078750610352, -14.128118515014648, -13.007158279418945, -11.886198043823242, -10.765236854553223, -9.64427661895752, -8.523316383361816, -7.402356147766113, -6.28139591217041, -5.160435199737549, -4.039474964141846, -2.9185147285461426, -1.7975540161132812, -0.6765937805175781, 0.444366455078125, 1.5653268098831177, 2.6862871646881104, 3.8072476387023926, 4.928207874298096, 6.049168109893799, 7.17012882232666, 8.291089057922363, 9.412049293518066, 10.53300952911377, 11.653969764709473, 12.774930953979492, 13.895891189575195, 15.016851425170898, 16.1378116607666, 17.258771896362305, 18.379732131958008, 19.50069236755371, 20.621652603149414, 21.742612838745117, 22.86357307434082, 23.984533309936523, 25.10549545288086, 26.226455688476562, 27.347415924072266, 28.46837615966797, 29.589336395263672, 30.710296630859375, 31.831256866455078, 32.95221710205078, 34.073177337646484, 35.19413757324219, 36.31509780883789]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 10.0, 8.0, 12.0, 12.0, 11.0, 21.0, 25.0, 13.0, 26.0, 27.0, 19.0, 23.0, 35.0, 34.0, 43.0, 38.0, 34.0, 36.0, 42.0, 35.0, 32.0, 44.0, 46.0, 45.0, 41.0, 36.0, 36.0, 30.0, 20.0, 24.0, 20.0, 15.0, 18.0, 12.0, 12.0, 17.0, 9.0, 7.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.95703125, -4.80474853515625, -4.6524658203125, -4.50018310546875, -4.347900390625, -4.19561767578125, -4.0433349609375, -3.89105224609375, -3.73876953125, -3.58648681640625, -3.4342041015625, -3.28192138671875, -3.129638671875, -2.97735595703125, -2.8250732421875, -2.67279052734375, -2.5205078125, -2.36822509765625, -2.2159423828125, -2.06365966796875, -1.911376953125, -1.75909423828125, -1.6068115234375, -1.45452880859375, -1.30224609375, -1.14996337890625, -0.9976806640625, -0.84539794921875, -0.693115234375, -0.54083251953125, -0.3885498046875, -0.23626708984375, -0.083984375, 0.06829833984375, 0.2205810546875, 0.37286376953125, 0.525146484375, 0.67742919921875, 0.8297119140625, 0.98199462890625, 1.13427734375, 1.28656005859375, 1.4388427734375, 1.59112548828125, 1.743408203125, 1.89569091796875, 2.0479736328125, 2.20025634765625, 2.3525390625, 2.50482177734375, 2.6571044921875, 2.80938720703125, 2.961669921875, 3.11395263671875, 3.2662353515625, 3.41851806640625, 3.57080078125, 3.72308349609375, 3.8753662109375, 4.02764892578125, 4.179931640625, 4.33221435546875, 4.4844970703125, 4.63677978515625, 4.7890625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 30.0, 42.0, 179.0, 1028.0, 29923.0, 4007564.0, 153346.0, 1877.0, 206.0, 56.0, 21.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.875, -57.664306640625, -56.45361328125, -55.242919921875, -54.0322265625, -52.821533203125, -51.61083984375, -50.400146484375, -49.189453125, -47.978759765625, -46.76806640625, -45.557373046875, -44.3466796875, -43.135986328125, -41.92529296875, -40.714599609375, -39.50390625, -38.293212890625, -37.08251953125, -35.871826171875, -34.6611328125, -33.450439453125, -32.23974609375, -31.029052734375, -29.818359375, -28.607666015625, -27.39697265625, -26.186279296875, -24.9755859375, -23.764892578125, -22.55419921875, -21.343505859375, -20.1328125, -18.922119140625, -17.71142578125, -16.500732421875, -15.2900390625, -14.079345703125, -12.86865234375, -11.657958984375, -10.447265625, -9.236572265625, -8.02587890625, -6.815185546875, -5.6044921875, -4.393798828125, -3.18310546875, -1.972412109375, -0.76171875, 0.448974609375, 1.65966796875, 2.870361328125, 4.0810546875, 5.291748046875, 6.50244140625, 7.713134765625, 8.923828125, 10.134521484375, 11.34521484375, 12.555908203125, 13.7666015625, 14.977294921875, 16.18798828125, 17.398681640625, 18.609375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 6.0, 18.0, 20.0, 32.0, 48.0, 64.0, 91.0, 155.0, 208.0, 246.0, 391.0, 536.0, 611.0, 512.0, 320.0, 236.0, 152.0, 130.0, 87.0, 65.0, 35.0, 33.0, 17.0, 21.0, 16.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -12.0660400390625, -11.733642578125, -11.4012451171875, -11.06884765625, -10.7364501953125, -10.404052734375, -10.0716552734375, -9.7392578125, -9.4068603515625, -9.074462890625, -8.7420654296875, -8.40966796875, -8.0772705078125, -7.744873046875, -7.4124755859375, -7.080078125, -6.7476806640625, -6.415283203125, -6.0828857421875, -5.75048828125, -5.4180908203125, -5.085693359375, -4.7532958984375, -4.4208984375, -4.0885009765625, -3.756103515625, -3.4237060546875, -3.09130859375, -2.7589111328125, -2.426513671875, -2.0941162109375, -1.76171875, -1.4293212890625, -1.096923828125, -0.7645263671875, -0.43212890625, -0.0997314453125, 0.232666015625, 0.5650634765625, 0.8974609375, 1.2298583984375, 1.562255859375, 1.8946533203125, 2.22705078125, 2.5594482421875, 2.891845703125, 3.2242431640625, 3.556640625, 3.8890380859375, 4.221435546875, 4.5538330078125, 4.88623046875, 5.2186279296875, 5.551025390625, 5.8834228515625, 6.2158203125, 6.5482177734375, 6.880615234375, 7.2130126953125, 7.54541015625, 7.8778076171875, 8.210205078125, 8.5426025390625, 8.875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 12.0, 22.0, 24.0, 64.0, 93.0, 160.0, 384.0, 798.0, 2518.0, 17871.0, 924991.0, 3186079.0, 55088.0, 4114.0, 1144.0, 442.0, 227.0, 119.0, 70.0, 24.0, 22.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.671875, -28.89453125, -28.1171875, -27.33984375, -26.5625, -25.78515625, -25.0078125, -24.23046875, -23.453125, -22.67578125, -21.8984375, -21.12109375, -20.34375, -19.56640625, -18.7890625, -18.01171875, -17.234375, -16.45703125, -15.6796875, -14.90234375, -14.125, -13.34765625, -12.5703125, -11.79296875, -11.015625, -10.23828125, -9.4609375, -8.68359375, -7.90625, -7.12890625, -6.3515625, -5.57421875, -4.796875, -4.01953125, -3.2421875, -2.46484375, -1.6875, -0.91015625, -0.1328125, 0.64453125, 1.421875, 2.19921875, 2.9765625, 3.75390625, 4.53125, 5.30859375, 6.0859375, 6.86328125, 7.640625, 8.41796875, 9.1953125, 9.97265625, 10.75, 11.52734375, 12.3046875, 13.08203125, 13.859375, 14.63671875, 15.4140625, 16.19140625, 16.96875, 17.74609375, 18.5234375, 19.30078125, 20.078125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 227.0, 688.0, 93.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-468.1849670410156, -460.0144958496094, -451.8440246582031, -443.673583984375, -435.50311279296875, -427.3326416015625, -419.16217041015625, -410.99169921875, -402.82122802734375, -394.6507568359375, -386.48028564453125, -378.3098449707031, -370.1393737792969, -361.9689025878906, -353.7984313964844, -345.6279602050781, -337.45751953125, -329.28704833984375, -321.1165771484375, -312.9461364746094, -304.7756652832031, -296.6051940917969, -288.4347229003906, -280.2642517089844, -272.09381103515625, -263.92333984375, -255.7528839111328, -247.58241271972656, -239.41195678710938, -231.24148559570312, -223.07101440429688, -214.90054321289062, -206.73007202148438, -198.55960083007812, -190.38914489746094, -182.2186737060547, -174.0482177734375, -165.87774658203125, -157.707275390625, -149.53680419921875, -141.36634826660156, -133.1958770751953, -125.02542114257812, -116.85494995117188, -108.68448638916016, -100.51402282714844, -92.34355163574219, -84.17308807373047, -76.00262451171875, -67.83216094970703, -59.66169357299805, -51.49122619628906, -43.320762634277344, -35.150299072265625, -26.97983169555664, -18.809364318847656, -10.638896942138672, -2.4684314727783203, 5.702033996582031, 13.872499465942383, 22.042964935302734, 30.213428497314453, 38.38389587402344, 46.55436325073242, 54.72482681274414]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 5.0, 3.0, 7.0, 3.0, 6.0, 3.0, 2.0, 3.0, 6.0, 9.0, 11.0, 14.0, 10.0, 23.0, 17.0, 10.0, 17.0, 20.0, 31.0, 23.0, 30.0, 35.0, 36.0, 26.0, 30.0, 35.0, 45.0, 41.0, 44.0, 35.0, 40.0, 34.0, 32.0, 31.0, 37.0, 30.0, 26.0, 24.0, 12.0, 22.0, 22.0, 13.0, 11.0, 14.0, 13.0, 13.0, 11.0, 8.0, 9.0, 9.0, 4.0, 2.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-26.915952682495117, -26.088600158691406, -25.261245727539062, -24.43389320373535, -23.60654067993164, -22.779186248779297, -21.951833724975586, -21.124481201171875, -20.29712677001953, -19.46977424621582, -18.642419815063477, -17.815067291259766, -16.987712860107422, -16.16036033630371, -15.3330078125, -14.505654335021973, -13.678300857543945, -12.850947380065918, -12.02359390258789, -11.19624137878418, -10.368887901306152, -9.541534423828125, -8.714181900024414, -7.886828422546387, -7.059474945068359, -6.232121467590332, -5.404768466949463, -4.577415466308594, -3.7500619888305664, -2.922708511352539, -2.09535551071167, -1.2680025100708008, -0.4406471252441406, 0.3867061138153076, 1.2140593528747559, 2.041412591934204, 2.8687658309936523, 3.6961193084716797, 4.523472309112549, 5.350825309753418, 6.178178787231445, 7.005532264709473, 7.832885265350342, 8.660238265991211, 9.487591743469238, 10.314945220947266, 11.142297744750977, 11.969651222229004, 12.797004699707031, 13.624358177185059, 14.451711654663086, 15.279064178466797, 16.10641860961914, 16.93377113342285, 17.761123657226562, 18.588478088378906, 19.415830612182617, 20.243183135986328, 21.070537567138672, 21.897890090942383, 22.725242614746094, 23.552597045898438, 24.37994956970215, 25.20730209350586, 26.034656524658203]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 5.0, 10.0, 8.0, 10.0, 12.0, 17.0, 13.0, 20.0, 28.0, 34.0, 31.0, 22.0, 26.0, 39.0, 44.0, 36.0, 30.0, 46.0, 36.0, 31.0, 41.0, 50.0, 37.0, 38.0, 35.0, 32.0, 31.0, 30.0, 29.0, 33.0, 24.0, 20.0, 14.0, 14.0, 9.0, 7.0, 10.0, 9.0, 3.0, 5.0, 1.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.046875, -3.9036865234375, -3.760498046875, -3.6173095703125, -3.47412109375, -3.3309326171875, -3.187744140625, -3.0445556640625, -2.9013671875, -2.7581787109375, -2.614990234375, -2.4718017578125, -2.32861328125, -2.1854248046875, -2.042236328125, -1.8990478515625, -1.755859375, -1.6126708984375, -1.469482421875, -1.3262939453125, -1.18310546875, -1.0399169921875, -0.896728515625, -0.7535400390625, -0.6103515625, -0.4671630859375, -0.323974609375, -0.1807861328125, -0.03759765625, 0.1055908203125, 0.248779296875, 0.3919677734375, 0.53515625, 0.6783447265625, 0.821533203125, 0.9647216796875, 1.10791015625, 1.2510986328125, 1.394287109375, 1.5374755859375, 1.6806640625, 1.8238525390625, 1.967041015625, 2.1102294921875, 2.25341796875, 2.3966064453125, 2.539794921875, 2.6829833984375, 2.826171875, 2.9693603515625, 3.112548828125, 3.2557373046875, 3.39892578125, 3.5421142578125, 3.685302734375, 3.8284912109375, 3.9716796875, 4.1148681640625, 4.258056640625, 4.4012451171875, 4.54443359375, 4.6876220703125, 4.830810546875, 4.9739990234375, 5.1171875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 9.0, 17.0, 25.0, 26.0, 44.0, 55.0, 90.0, 146.0, 251.0, 339.0, 524.0, 824.0, 1356.0, 2219.0, 3523.0, 5652.0, 8893.0, 14602.0, 23445.0, 38085.0, 59744.0, 90554.0, 126003.0, 155021.0, 153864.0, 123329.0, 87293.0, 57350.0, 36256.0, 22438.0, 13799.0, 8591.0, 5190.0, 3308.0, 2075.0, 1300.0, 807.0, 532.0, 326.0, 202.0, 153.0, 95.0, 61.0, 51.0, 24.0, 22.0, 13.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.669921875, -0.6482772827148438, -0.6266326904296875, -0.6049880981445312, -0.583343505859375, -0.5616989135742188, -0.5400543212890625, -0.5184097290039062, -0.49676513671875, -0.47512054443359375, -0.4534759521484375, -0.43183135986328125, -0.410186767578125, -0.38854217529296875, -0.3668975830078125, -0.34525299072265625, -0.3236083984375, -0.30196380615234375, -0.2803192138671875, -0.25867462158203125, -0.237030029296875, -0.21538543701171875, -0.1937408447265625, -0.17209625244140625, -0.15045166015625, -0.12880706787109375, -0.1071624755859375, -0.08551788330078125, -0.063873291015625, -0.04222869873046875, -0.0205841064453125, 0.00106048583984375, 0.022705078125, 0.04434967041015625, 0.0659942626953125, 0.08763885498046875, 0.109283447265625, 0.13092803955078125, 0.1525726318359375, 0.17421722412109375, 0.19586181640625, 0.21750640869140625, 0.2391510009765625, 0.26079559326171875, 0.282440185546875, 0.30408477783203125, 0.3257293701171875, 0.34737396240234375, 0.3690185546875, 0.39066314697265625, 0.4123077392578125, 0.43395233154296875, 0.455596923828125, 0.47724151611328125, 0.4988861083984375, 0.5205307006835938, 0.54217529296875, 0.5638198852539062, 0.5854644775390625, 0.6071090698242188, 0.628753662109375, 0.6503982543945312, 0.6720428466796875, 0.6936874389648438, 0.71533203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 6.0, 5.0, 10.0, 10.0, 13.0, 16.0, 20.0, 17.0, 22.0, 21.0, 29.0, 22.0, 25.0, 26.0, 35.0, 32.0, 30.0, 33.0, 40.0, 37.0, 1061.0, 42.0, 40.0, 45.0, 37.0, 41.0, 37.0, 34.0, 26.0, 26.0, 23.0, 22.0, 33.0, 8.0, 17.0, 14.0, 12.0, 12.0, 6.0, 0.0, 6.0, 5.0, 13.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.51171875, -3.407440185546875, -3.30316162109375, -3.198883056640625, -3.0946044921875, -2.990325927734375, -2.88604736328125, -2.781768798828125, -2.677490234375, -2.573211669921875, -2.46893310546875, -2.364654541015625, -2.2603759765625, -2.156097412109375, -2.05181884765625, -1.947540283203125, -1.84326171875, -1.738983154296875, -1.63470458984375, -1.530426025390625, -1.4261474609375, -1.321868896484375, -1.21759033203125, -1.113311767578125, -1.009033203125, -0.904754638671875, -0.80047607421875, -0.696197509765625, -0.5919189453125, -0.487640380859375, -0.38336181640625, -0.279083251953125, -0.1748046875, -0.070526123046875, 0.03375244140625, 0.138031005859375, 0.2423095703125, 0.346588134765625, 0.45086669921875, 0.555145263671875, 0.659423828125, 0.763702392578125, 0.86798095703125, 0.972259521484375, 1.0765380859375, 1.180816650390625, 1.28509521484375, 1.389373779296875, 1.49365234375, 1.597930908203125, 1.70220947265625, 1.806488037109375, 1.9107666015625, 2.015045166015625, 2.11932373046875, 2.223602294921875, 2.327880859375, 2.432159423828125, 2.53643798828125, 2.640716552734375, 2.7449951171875, 2.849273681640625, 2.95355224609375, 3.057830810546875, 3.162109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 3.0, 9.0, 34.0, 23.0, 43.0, 63.0, 95.0, 139.0, 181.0, 231.0, 340.0, 444.0, 688.0, 969.0, 1416.0, 2032.0, 2959.0, 4186.0, 5919.0, 8953.0, 13293.0, 20274.0, 33241.0, 1832381.0, 85959.0, 28248.0, 17514.0, 11743.0, 7881.0, 5344.0, 3753.0, 2673.0, 1796.0, 1295.0, 884.0, 646.0, 441.0, 288.0, 229.0, 152.0, 106.0, 89.0, 59.0, 43.0, 25.0, 13.0, 13.0, 6.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.2375030517578125, -1.198638916015625, -1.1597747802734375, -1.12091064453125, -1.0820465087890625, -1.043182373046875, -1.0043182373046875, -0.9654541015625, -0.9265899658203125, -0.887725830078125, -0.8488616943359375, -0.80999755859375, -0.7711334228515625, -0.732269287109375, -0.6934051513671875, -0.654541015625, -0.6156768798828125, -0.576812744140625, -0.5379486083984375, -0.49908447265625, -0.4602203369140625, -0.421356201171875, -0.3824920654296875, -0.3436279296875, -0.3047637939453125, -0.265899658203125, -0.2270355224609375, -0.18817138671875, -0.1493072509765625, -0.110443115234375, -0.0715789794921875, -0.03271484375, 0.0061492919921875, 0.045013427734375, 0.0838775634765625, 0.12274169921875, 0.1616058349609375, 0.200469970703125, 0.2393341064453125, 0.2781982421875, 0.3170623779296875, 0.355926513671875, 0.3947906494140625, 0.43365478515625, 0.4725189208984375, 0.511383056640625, 0.5502471923828125, 0.589111328125, 0.6279754638671875, 0.666839599609375, 0.7057037353515625, 0.74456787109375, 0.7834320068359375, 0.822296142578125, 0.8611602783203125, 0.9000244140625, 0.9388885498046875, 0.977752685546875, 1.0166168212890625, 1.05548095703125, 1.0943450927734375, 1.133209228515625, 1.1720733642578125, 1.2109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 3.0, 9.0, 6.0, 7.0, 9.0, 8.0, 15.0, 21.0, 17.0, 24.0, 26.0, 26.0, 38.0, 45.0, 54.0, 57.0, 53.0, 72.0, 64.0, 67.0, 67.0, 50.0, 40.0, 25.0, 37.0, 26.0, 21.0, 22.0, 16.0, 11.0, 8.0, 5.0, 11.0, 6.0, 11.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0194549560546875, -0.018844127655029297, -0.018233299255371094, -0.01762247085571289, -0.017011642456054688, -0.016400814056396484, -0.01578998565673828, -0.015179157257080078, -0.014568328857421875, -0.013957500457763672, -0.013346672058105469, -0.012735843658447266, -0.012125015258789062, -0.01151418685913086, -0.010903358459472656, -0.010292530059814453, -0.00968170166015625, -0.009070873260498047, -0.008460044860839844, -0.00784921646118164, -0.0072383880615234375, -0.006627559661865234, -0.006016731262207031, -0.005405902862548828, -0.004795074462890625, -0.004184246063232422, -0.0035734176635742188, -0.0029625892639160156, -0.0023517608642578125, -0.0017409324645996094, -0.0011301040649414062, -0.0005192756652832031, 9.1552734375e-05, 0.0007023811340332031, 0.0013132095336914062, 0.0019240379333496094, 0.0025348663330078125, 0.0031456947326660156, 0.0037565231323242188, 0.004367351531982422, 0.004978179931640625, 0.005589008331298828, 0.006199836730957031, 0.006810665130615234, 0.0074214935302734375, 0.00803232192993164, 0.008643150329589844, 0.009253978729248047, 0.00986480712890625, 0.010475635528564453, 0.011086463928222656, 0.01169729232788086, 0.012308120727539062, 0.012918949127197266, 0.013529777526855469, 0.014140605926513672, 0.014751434326171875, 0.015362262725830078, 0.01597309112548828, 0.016583919525146484, 0.017194747924804688, 0.01780557632446289, 0.018416404724121094, 0.019027233123779297, 0.0196380615234375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 14.0, 11.0, 16.0, 22.0, 24.0, 21.0, 29.0, 54.0, 60.0, 74.0, 120.0, 152.0, 183.0, 384.0, 732.0, 2321.0, 929582.0, 111830.0, 1273.0, 581.0, 314.0, 194.0, 134.0, 99.0, 68.0, 47.0, 49.0, 33.0, 26.0, 25.0, 17.0, 14.0, 9.0, 8.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.384033203125, -0.37233734130859375, -0.3606414794921875, -0.34894561767578125, -0.337249755859375, -0.32555389404296875, -0.3138580322265625, -0.30216217041015625, -0.29046630859375, -0.27877044677734375, -0.2670745849609375, -0.25537872314453125, -0.243682861328125, -0.23198699951171875, -0.2202911376953125, -0.20859527587890625, -0.1968994140625, -0.18520355224609375, -0.1735076904296875, -0.16181182861328125, -0.150115966796875, -0.13842010498046875, -0.1267242431640625, -0.11502838134765625, -0.10333251953125, -0.09163665771484375, -0.0799407958984375, -0.06824493408203125, -0.056549072265625, -0.04485321044921875, -0.0331573486328125, -0.02146148681640625, -0.009765625, 0.00193023681640625, 0.0136260986328125, 0.02532196044921875, 0.037017822265625, 0.04871368408203125, 0.0604095458984375, 0.07210540771484375, 0.08380126953125, 0.09549713134765625, 0.1071929931640625, 0.11888885498046875, 0.130584716796875, 0.14228057861328125, 0.1539764404296875, 0.16567230224609375, 0.1773681640625, 0.18906402587890625, 0.2007598876953125, 0.21245574951171875, 0.224151611328125, 0.23584747314453125, 0.2475433349609375, 0.25923919677734375, 0.27093505859375, 0.28263092041015625, 0.2943267822265625, 0.30602264404296875, 0.317718505859375, 0.32941436767578125, 0.3411102294921875, 0.35280609130859375, 0.364501953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 400.0, 611.0, 2.0], "bins": [-0.49828213453292847, -0.4902520179748535, -0.48222190141677856, -0.4741917848587036, -0.4661616384983063, -0.4581315219402313, -0.45010140538215637, -0.4420712888240814, -0.43404117226600647, -0.4260110557079315, -0.41798093914985657, -0.40995079278945923, -0.4019206762313843, -0.3938905596733093, -0.3858604431152344, -0.3778303265571594, -0.3698002099990845, -0.3617700934410095, -0.35373997688293457, -0.3457098603248596, -0.3376797139644623, -0.32964959740638733, -0.3216194808483124, -0.3135893642902374, -0.3055592179298401, -0.29752910137176514, -0.2894989848136902, -0.28146886825561523, -0.2734387218952179, -0.26540860533714294, -0.257378488779068, -0.24934837222099304, -0.24131827056407928, -0.23328815400600433, -0.2252580225467682, -0.21722790598869324, -0.2091977894306183, -0.20116767287254333, -0.1931375414133072, -0.18510742485523224, -0.1770772933959961, -0.16904717683792114, -0.161017045378685, -0.15298692882061005, -0.1449568122625351, -0.13692668080329895, -0.128896564245224, -0.12086644768714905, -0.1128363236784935, -0.10480619966983795, -0.096776083111763, -0.08874595910310745, -0.0807158350944519, -0.07268571853637695, -0.0646555945277214, -0.056625474244356155, -0.048595353960990906, -0.040565233677625656, -0.032535113394260406, -0.02450498938560486, -0.01647486910223961, -0.008444748818874359, -0.00041462481021881104, 0.007615495473146439, 0.01564561389386654]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 16.0, 12.0, 21.0, 21.0, 25.0, 28.0, 28.0, 33.0, 44.0, 47.0, 60.0, 57.0, 57.0, 61.0, 66.0, 59.0, 50.0, 51.0, 51.0, 30.0, 30.0, 24.0, 31.0, 10.0, 22.0, 20.0, 8.0, 15.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.028846025466918945, -0.027915380895137787, -0.02698473632335663, -0.02605409175157547, -0.02512344717979431, -0.024192802608013153, -0.023262158036231995, -0.022331513464450836, -0.021400868892669678, -0.02047022432088852, -0.01953957974910736, -0.018608935177326202, -0.017678290605545044, -0.016747646033763885, -0.015817001461982727, -0.014886356890201569, -0.01395571231842041, -0.013025067746639252, -0.012094423174858093, -0.011163778603076935, -0.010233134031295776, -0.009302489459514618, -0.00837184488773346, -0.007441200315952301, -0.006510555744171143, -0.005579911172389984, -0.004649266600608826, -0.0037186220288276672, -0.002787977457046509, -0.0018573328852653503, -0.0009266883134841919, 3.956258296966553e-06, 0.000934600830078125, 0.0018652454018592834, 0.002795889973640442, 0.0037265345454216003, 0.004657179117202759, 0.005587823688983917, 0.006518468260765076, 0.007449112832546234, 0.008379757404327393, 0.009310401976108551, 0.01024104654788971, 0.011171691119670868, 0.012102335691452026, 0.013032980263233185, 0.013963624835014343, 0.014894269406795502, 0.01582491397857666, 0.01675555855035782, 0.017686203122138977, 0.018616847693920135, 0.019547492265701294, 0.020478136837482452, 0.02140878140926361, 0.02233942598104477, 0.023270070552825928, 0.024200715124607086, 0.025131359696388245, 0.026062004268169403, 0.02699264883995056, 0.02792329341173172, 0.02885393798351288, 0.029784582555294037, 0.030715227127075195]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 6.0, 7.0, 4.0, 4.0, 7.0, 10.0, 13.0, 10.0, 21.0, 13.0, 23.0, 33.0, 24.0, 28.0, 24.0, 33.0, 36.0, 34.0, 36.0, 43.0, 39.0, 39.0, 49.0, 52.0, 35.0, 31.0, 30.0, 22.0, 35.0, 39.0, 33.0, 23.0, 24.0, 27.0, 19.0, 14.0, 11.0, 10.0, 12.0, 10.0, 4.0, 8.0, 4.0, 9.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.92999267578125, -3.7857666015625, -3.64154052734375, -3.497314453125, -3.35308837890625, -3.2088623046875, -3.06463623046875, -2.92041015625, -2.77618408203125, -2.6319580078125, -2.48773193359375, -2.343505859375, -2.19927978515625, -2.0550537109375, -1.91082763671875, -1.7666015625, -1.62237548828125, -1.4781494140625, -1.33392333984375, -1.189697265625, -1.04547119140625, -0.9012451171875, -0.75701904296875, -0.61279296875, -0.46856689453125, -0.3243408203125, -0.18011474609375, -0.035888671875, 0.10833740234375, 0.2525634765625, 0.39678955078125, 0.541015625, 0.68524169921875, 0.8294677734375, 0.97369384765625, 1.117919921875, 1.26214599609375, 1.4063720703125, 1.55059814453125, 1.69482421875, 1.83905029296875, 1.9832763671875, 2.12750244140625, 2.271728515625, 2.41595458984375, 2.5601806640625, 2.70440673828125, 2.8486328125, 2.99285888671875, 3.1370849609375, 3.28131103515625, 3.425537109375, 3.56976318359375, 3.7139892578125, 3.85821533203125, 4.00244140625, 4.14666748046875, 4.2908935546875, 4.43511962890625, 4.579345703125, 4.72357177734375, 4.8677978515625, 5.01202392578125, 5.15625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 19.0, 22.0, 21.0, 34.0, 47.0, 76.0, 132.0, 173.0, 232.0, 314.0, 476.0, 814.0, 1282.0, 2513.0, 6090.0, 18630.0, 78681.0, 411467.0, 416774.0, 79562.0, 18885.0, 5991.0, 2584.0, 1306.0, 767.0, 551.0, 349.0, 218.0, 152.0, 103.0, 76.0, 65.0, 57.0, 24.0, 12.0, 12.0, 12.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.96875, -9.6839599609375, -9.399169921875, -9.1143798828125, -8.82958984375, -8.5447998046875, -8.260009765625, -7.9752197265625, -7.6904296875, -7.4056396484375, -7.120849609375, -6.8360595703125, -6.55126953125, -6.2664794921875, -5.981689453125, -5.6968994140625, -5.412109375, -5.1273193359375, -4.842529296875, -4.5577392578125, -4.27294921875, -3.9881591796875, -3.703369140625, -3.4185791015625, -3.1337890625, -2.8489990234375, -2.564208984375, -2.2794189453125, -1.99462890625, -1.7098388671875, -1.425048828125, -1.1402587890625, -0.85546875, -0.5706787109375, -0.285888671875, -0.0010986328125, 0.28369140625, 0.5684814453125, 0.853271484375, 1.1380615234375, 1.4228515625, 1.7076416015625, 1.992431640625, 2.2772216796875, 2.56201171875, 2.8468017578125, 3.131591796875, 3.4163818359375, 3.701171875, 3.9859619140625, 4.270751953125, 4.5555419921875, 4.84033203125, 5.1251220703125, 5.409912109375, 5.6947021484375, 5.9794921875, 6.2642822265625, 6.549072265625, 6.8338623046875, 7.11865234375, 7.4034423828125, 7.688232421875, 7.9730224609375, 8.2578125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 6.0, 6.0, 8.0, 18.0, 12.0, 23.0, 19.0, 25.0, 39.0, 32.0, 43.0, 51.0, 51.0, 70.0, 136.0, 246.0, 1442.0, 223.0, 143.0, 78.0, 67.0, 42.0, 38.0, 40.0, 22.0, 33.0, 19.0, 16.0, 15.0, 14.0, 11.0, 10.0, 11.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.5859375, -12.2095947265625, -11.833251953125, -11.4569091796875, -11.08056640625, -10.7042236328125, -10.327880859375, -9.9515380859375, -9.5751953125, -9.1988525390625, -8.822509765625, -8.4461669921875, -8.06982421875, -7.6934814453125, -7.317138671875, -6.9407958984375, -6.564453125, -6.1881103515625, -5.811767578125, -5.4354248046875, -5.05908203125, -4.6827392578125, -4.306396484375, -3.9300537109375, -3.5537109375, -3.1773681640625, -2.801025390625, -2.4246826171875, -2.04833984375, -1.6719970703125, -1.295654296875, -0.9193115234375, -0.54296875, -0.1666259765625, 0.209716796875, 0.5860595703125, 0.96240234375, 1.3387451171875, 1.715087890625, 2.0914306640625, 2.4677734375, 2.8441162109375, 3.220458984375, 3.5968017578125, 3.97314453125, 4.3494873046875, 4.725830078125, 5.1021728515625, 5.478515625, 5.8548583984375, 6.231201171875, 6.6075439453125, 6.98388671875, 7.3602294921875, 7.736572265625, 8.1129150390625, 8.4892578125, 8.8656005859375, 9.241943359375, 9.6182861328125, 9.99462890625, 10.3709716796875, 10.747314453125, 11.1236572265625, 11.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 9.0, 13.0, 11.0, 17.0, 15.0, 38.0, 40.0, 42.0, 57.0, 90.0, 99.0, 134.0, 228.0, 306.0, 533.0, 1177.0, 4650.0, 2885150.0, 247730.0, 2940.0, 909.0, 437.0, 286.0, 196.0, 141.0, 117.0, 64.0, 70.0, 41.0, 39.0, 26.0, 18.0, 18.0, 10.0, 10.0, 7.0, 4.0, 4.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-36.65625, -35.50634765625, -34.3564453125, -33.20654296875, -32.056640625, -30.90673828125, -29.7568359375, -28.60693359375, -27.45703125, -26.30712890625, -25.1572265625, -24.00732421875, -22.857421875, -21.70751953125, -20.5576171875, -19.40771484375, -18.2578125, -17.10791015625, -15.9580078125, -14.80810546875, -13.658203125, -12.50830078125, -11.3583984375, -10.20849609375, -9.05859375, -7.90869140625, -6.7587890625, -5.60888671875, -4.458984375, -3.30908203125, -2.1591796875, -1.00927734375, 0.140625, 1.29052734375, 2.4404296875, 3.59033203125, 4.740234375, 5.89013671875, 7.0400390625, 8.18994140625, 9.33984375, 10.48974609375, 11.6396484375, 12.78955078125, 13.939453125, 15.08935546875, 16.2392578125, 17.38916015625, 18.5390625, 19.68896484375, 20.8388671875, 21.98876953125, 23.138671875, 24.28857421875, 25.4384765625, 26.58837890625, 27.73828125, 28.88818359375, 30.0380859375, 31.18798828125, 32.337890625, 33.48779296875, 34.6376953125, 35.78759765625, 36.9375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 19.0, 93.0, 309.0, 396.0, 160.0, 34.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.127653121948242, -22.910930633544922, -19.694210052490234, -16.477489471435547, -13.260766983032227, -10.044046401977539, -6.827323913574219, -3.6106014251708984, -0.39388084411621094, 2.822840690612793, 6.039562225341797, 9.2562837600708, 12.473005294799805, 15.689725875854492, 18.906448364257812, 22.123170852661133, 25.33989143371582, 28.55661392211914, 31.773334503173828, 34.990055084228516, 38.20677947998047, 41.423500061035156, 44.640220642089844, 47.85694122314453, 51.07366180419922, 54.290382385253906, 57.507102966308594, 60.72382736206055, 63.940547943115234, 67.15727233886719, 70.37399291992188, 73.59071350097656, 76.80743408203125, 80.02415466308594, 83.24087524414062, 86.45759582519531, 89.67431640625, 92.89103698730469, 96.1077651977539, 99.3244857788086, 102.54120635986328, 105.75792694091797, 108.97464752197266, 112.19136810302734, 115.40809631347656, 118.62481689453125, 121.84153747558594, 125.05825805664062, 128.2749786376953, 131.49169921875, 134.7084197998047, 137.92514038085938, 141.14186096191406, 144.35858154296875, 147.57530212402344, 150.79202270507812, 154.00875854492188, 157.22547912597656, 160.44219970703125, 163.65892028808594, 166.87564086914062, 170.0923614501953, 173.30908203125, 176.52581787109375, 179.74252319335938]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 4.0, 6.0, 10.0, 9.0, 5.0, 12.0, 25.0, 15.0, 22.0, 28.0, 30.0, 23.0, 24.0, 33.0, 33.0, 31.0, 37.0, 41.0, 37.0, 46.0, 42.0, 39.0, 36.0, 37.0, 40.0, 39.0, 21.0, 26.0, 29.0, 20.0, 30.0, 24.0, 22.0, 19.0, 18.0, 14.0, 14.0, 3.0, 6.0, 7.0, 8.0, 2.0, 5.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.641427993774414, -24.764957427978516, -23.888484954833984, -23.012014389038086, -22.135543823242188, -21.259071350097656, -20.382600784301758, -19.50613021850586, -18.629657745361328, -17.75318717956543, -16.8767147064209, -16.000244140625, -15.123773574829102, -14.247302055358887, -13.370830535888672, -12.494359970092773, -11.617889404296875, -10.74141788482666, -9.864947319030762, -8.988475799560547, -8.112005233764648, -7.235533714294434, -6.359062194824219, -5.482591152191162, -4.6061201095581055, -3.729649066925049, -2.853177785873413, -1.9767065048217773, -1.1002354621887207, -0.22376441955566406, 0.6527070999145508, 1.5291781425476074, 2.405649185180664, 3.2821202278137207, 4.158591270446777, 5.035062789916992, 5.911533832550049, 6.7880048751831055, 7.66447639465332, 8.540946960449219, 9.417418479919434, 10.293889999389648, 11.170360565185547, 12.046832084655762, 12.923303604125977, 13.799774169921875, 14.67624568939209, 15.552717208862305, 16.429187774658203, 17.3056583404541, 18.182130813598633, 19.05860137939453, 19.93507194519043, 20.811542510986328, 21.68801498413086, 22.564485549926758, 23.440956115722656, 24.317426681518555, 25.193899154663086, 26.070369720458984, 26.946840286254883, 27.82331085205078, 28.699783325195312, 29.57625389099121, 30.452726364135742]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 8.0, 5.0, 5.0, 4.0, 7.0, 11.0, 19.0, 15.0, 16.0, 14.0, 19.0, 15.0, 31.0, 30.0, 27.0, 27.0, 35.0, 33.0, 30.0, 38.0, 42.0, 44.0, 34.0, 36.0, 30.0, 31.0, 40.0, 30.0, 22.0, 30.0, 25.0, 30.0, 31.0, 22.0, 23.0, 16.0, 22.0, 15.0, 10.0, 14.0, 15.0, 9.0, 12.0, 5.0, 3.0, 4.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.09765625, -3.96112060546875, -3.8245849609375, -3.68804931640625, -3.551513671875, -3.41497802734375, -3.2784423828125, -3.14190673828125, -3.00537109375, -2.86883544921875, -2.7322998046875, -2.59576416015625, -2.459228515625, -2.32269287109375, -2.1861572265625, -2.04962158203125, -1.9130859375, -1.77655029296875, -1.6400146484375, -1.50347900390625, -1.366943359375, -1.23040771484375, -1.0938720703125, -0.95733642578125, -0.82080078125, -0.68426513671875, -0.5477294921875, -0.41119384765625, -0.274658203125, -0.13812255859375, -0.0015869140625, 0.13494873046875, 0.271484375, 0.40802001953125, 0.5445556640625, 0.68109130859375, 0.817626953125, 0.95416259765625, 1.0906982421875, 1.22723388671875, 1.36376953125, 1.50030517578125, 1.6368408203125, 1.77337646484375, 1.909912109375, 2.04644775390625, 2.1829833984375, 2.31951904296875, 2.4560546875, 2.59259033203125, 2.7291259765625, 2.86566162109375, 3.002197265625, 3.13873291015625, 3.2752685546875, 3.41180419921875, 3.54833984375, 3.68487548828125, 3.8214111328125, 3.95794677734375, 4.094482421875, 4.23101806640625, 4.3675537109375, 4.50408935546875, 4.640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 8.0, 22.0, 16.0, 37.0, 59.0, 122.0, 200.0, 420.0, 1032.0, 2202.0, 5661.0, 17524.0, 75465.0, 565127.0, 2360479.0, 996309.0, 132312.0, 25083.0, 7404.0, 2727.0, 1062.0, 490.0, 236.0, 120.0, 57.0, 27.0, 36.0, 15.0, 6.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.9765625, -11.6497802734375, -11.322998046875, -10.9962158203125, -10.66943359375, -10.3426513671875, -10.015869140625, -9.6890869140625, -9.3623046875, -9.0355224609375, -8.708740234375, -8.3819580078125, -8.05517578125, -7.7283935546875, -7.401611328125, -7.0748291015625, -6.748046875, -6.4212646484375, -6.094482421875, -5.7677001953125, -5.44091796875, -5.1141357421875, -4.787353515625, -4.4605712890625, -4.1337890625, -3.8070068359375, -3.480224609375, -3.1534423828125, -2.82666015625, -2.4998779296875, -2.173095703125, -1.8463134765625, -1.51953125, -1.1927490234375, -0.865966796875, -0.5391845703125, -0.21240234375, 0.1143798828125, 0.441162109375, 0.7679443359375, 1.0947265625, 1.4215087890625, 1.748291015625, 2.0750732421875, 2.40185546875, 2.7286376953125, 3.055419921875, 3.3822021484375, 3.708984375, 4.0357666015625, 4.362548828125, 4.6893310546875, 5.01611328125, 5.3428955078125, 5.669677734375, 5.9964599609375, 6.3232421875, 6.6500244140625, 6.976806640625, 7.3035888671875, 7.63037109375, 7.9571533203125, 8.283935546875, 8.6107177734375, 8.9375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 11.0, 16.0, 22.0, 23.0, 41.0, 53.0, 66.0, 68.0, 137.0, 143.0, 219.0, 307.0, 382.0, 501.0, 507.0, 446.0, 312.0, 226.0, 178.0, 121.0, 92.0, 53.0, 38.0, 31.0, 22.0, 9.0, 17.0, 13.0, 8.0, 3.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.978271484375, -8.70654296875, -8.434814453125, -8.1630859375, -7.891357421875, -7.61962890625, -7.347900390625, -7.076171875, -6.804443359375, -6.53271484375, -6.260986328125, -5.9892578125, -5.717529296875, -5.44580078125, -5.174072265625, -4.90234375, -4.630615234375, -4.35888671875, -4.087158203125, -3.8154296875, -3.543701171875, -3.27197265625, -3.000244140625, -2.728515625, -2.456787109375, -2.18505859375, -1.913330078125, -1.6416015625, -1.369873046875, -1.09814453125, -0.826416015625, -0.5546875, -0.282958984375, -0.01123046875, 0.260498046875, 0.5322265625, 0.803955078125, 1.07568359375, 1.347412109375, 1.619140625, 1.890869140625, 2.16259765625, 2.434326171875, 2.7060546875, 2.977783203125, 3.24951171875, 3.521240234375, 3.79296875, 4.064697265625, 4.33642578125, 4.608154296875, 4.8798828125, 5.151611328125, 5.42333984375, 5.695068359375, 5.966796875, 6.238525390625, 6.51025390625, 6.781982421875, 7.0537109375, 7.325439453125, 7.59716796875, 7.868896484375, 8.140625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 13.0, 14.0, 19.0, 23.0, 51.0, 69.0, 96.0, 174.0, 323.0, 735.0, 1661.0, 5872.0, 37058.0, 872890.0, 3134841.0, 123759.0, 11699.0, 2885.0, 996.0, 446.0, 240.0, 139.0, 90.0, 48.0, 35.0, 36.0, 26.0, 14.0, 6.0, 5.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.171875, -17.60791015625, -17.0439453125, -16.47998046875, -15.916015625, -15.35205078125, -14.7880859375, -14.22412109375, -13.66015625, -13.09619140625, -12.5322265625, -11.96826171875, -11.404296875, -10.84033203125, -10.2763671875, -9.71240234375, -9.1484375, -8.58447265625, -8.0205078125, -7.45654296875, -6.892578125, -6.32861328125, -5.7646484375, -5.20068359375, -4.63671875, -4.07275390625, -3.5087890625, -2.94482421875, -2.380859375, -1.81689453125, -1.2529296875, -0.68896484375, -0.125, 0.43896484375, 1.0029296875, 1.56689453125, 2.130859375, 2.69482421875, 3.2587890625, 3.82275390625, 4.38671875, 4.95068359375, 5.5146484375, 6.07861328125, 6.642578125, 7.20654296875, 7.7705078125, 8.33447265625, 8.8984375, 9.46240234375, 10.0263671875, 10.59033203125, 11.154296875, 11.71826171875, 12.2822265625, 12.84619140625, 13.41015625, 13.97412109375, 14.5380859375, 15.10205078125, 15.666015625, 16.22998046875, 16.7939453125, 17.35791015625, 17.921875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 31.0, 470.0, 476.0, 37.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-464.6063232421875, -456.1550598144531, -447.70379638671875, -439.2525634765625, -430.8013000488281, -422.35003662109375, -413.8987731933594, -405.447509765625, -396.99627685546875, -388.5450134277344, -380.09375, -371.64251708984375, -363.1912536621094, -354.739990234375, -346.2887268066406, -337.83746337890625, -329.38623046875, -320.9349670410156, -312.48370361328125, -304.032470703125, -295.5812072753906, -287.12994384765625, -278.6786804199219, -270.2274169921875, -261.7761535644531, -253.32489013671875, -244.87364196777344, -236.42237854003906, -227.97113037109375, -219.51986694335938, -211.068603515625, -202.6173553466797, -194.16612243652344, -185.71485900878906, -177.26361083984375, -168.81234741210938, -160.36109924316406, -151.9098358154297, -143.45858764648438, -135.00732421875, -126.55606842041016, -118.10481262207031, -109.65355682373047, -101.20230102539062, -92.75103759765625, -84.29978942871094, -75.84852600097656, -67.39727020263672, -58.946014404296875, -50.49475860595703, -42.04350280761719, -33.59224319458008, -25.140987396240234, -16.68973159790039, -8.238471984863281, 0.2127838134765625, 8.664039611816406, 17.11529541015625, 25.566553115844727, 34.0178108215332, 42.46906661987305, 50.92032241821289, 59.37158203125, 67.82283782958984, 76.27409362792969]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 5.0, 10.0, 13.0, 10.0, 13.0, 20.0, 15.0, 30.0, 21.0, 35.0, 27.0, 37.0, 38.0, 40.0, 45.0, 33.0, 67.0, 44.0, 48.0, 54.0, 44.0, 38.0, 44.0, 36.0, 30.0, 33.0, 24.0, 25.0, 23.0, 18.0, 14.0, 9.0, 10.0, 13.0, 6.0, 6.0, 5.0, 3.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.745880126953125, -29.71100425720215, -28.676128387451172, -27.641252517700195, -26.60637664794922, -25.571500778198242, -24.536624908447266, -23.50174903869629, -22.466873168945312, -21.431997299194336, -20.39712142944336, -19.362245559692383, -18.327369689941406, -17.29249382019043, -16.257617950439453, -15.222742080688477, -14.1878662109375, -13.152990341186523, -12.118114471435547, -11.08323860168457, -10.048362731933594, -9.013486862182617, -7.978610992431641, -6.943735122680664, -5.9088592529296875, -4.873983383178711, -3.8391075134277344, -2.804231643676758, -1.7693557739257812, -0.7344799041748047, 0.3003959655761719, 1.3352718353271484, 2.370147705078125, 3.4050235748291016, 4.439899444580078, 5.474775314331055, 6.509651184082031, 7.544527053833008, 8.579402923583984, 9.614278793334961, 10.649154663085938, 11.684030532836914, 12.71890640258789, 13.753782272338867, 14.788658142089844, 15.82353401184082, 16.858409881591797, 17.893285751342773, 18.92816162109375, 19.963037490844727, 20.997913360595703, 22.03278923034668, 23.067665100097656, 24.102540969848633, 25.13741683959961, 26.172292709350586, 27.207168579101562, 28.24204444885254, 29.276920318603516, 30.311796188354492, 31.34667205810547, 32.38154602050781, 33.41642379760742, 34.45130157470703, 35.486175537109375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 9.0, 13.0, 10.0, 15.0, 15.0, 18.0, 19.0, 28.0, 25.0, 28.0, 32.0, 31.0, 37.0, 41.0, 35.0, 33.0, 39.0, 44.0, 37.0, 45.0, 35.0, 40.0, 42.0, 46.0, 46.0, 26.0, 29.0, 29.0, 24.0, 22.0, 20.0, 11.0, 16.0, 8.0, 13.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6953125, -4.548095703125, -4.40087890625, -4.253662109375, -4.1064453125, -3.959228515625, -3.81201171875, -3.664794921875, -3.517578125, -3.370361328125, -3.22314453125, -3.075927734375, -2.9287109375, -2.781494140625, -2.63427734375, -2.487060546875, -2.33984375, -2.192626953125, -2.04541015625, -1.898193359375, -1.7509765625, -1.603759765625, -1.45654296875, -1.309326171875, -1.162109375, -1.014892578125, -0.86767578125, -0.720458984375, -0.5732421875, -0.426025390625, -0.27880859375, -0.131591796875, 0.015625, 0.162841796875, 0.31005859375, 0.457275390625, 0.6044921875, 0.751708984375, 0.89892578125, 1.046142578125, 1.193359375, 1.340576171875, 1.48779296875, 1.635009765625, 1.7822265625, 1.929443359375, 2.07666015625, 2.223876953125, 2.37109375, 2.518310546875, 2.66552734375, 2.812744140625, 2.9599609375, 3.107177734375, 3.25439453125, 3.401611328125, 3.548828125, 3.696044921875, 3.84326171875, 3.990478515625, 4.1376953125, 4.284912109375, 4.43212890625, 4.579345703125, 4.7265625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 5.0, 10.0, 14.0, 20.0, 25.0, 48.0, 69.0, 117.0, 166.0, 244.0, 395.0, 607.0, 974.0, 1511.0, 2405.0, 3727.0, 5969.0, 9750.0, 16440.0, 26443.0, 43765.0, 70190.0, 106973.0, 149628.0, 170430.0, 149149.0, 107147.0, 69943.0, 43630.0, 26692.0, 16045.0, 9804.0, 5978.0, 3692.0, 2303.0, 1443.0, 994.0, 616.0, 408.0, 264.0, 185.0, 126.0, 70.0, 50.0, 35.0, 20.0, 13.0, 9.0, 5.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.7353515625, -0.7127227783203125, -0.690093994140625, -0.6674652099609375, -0.64483642578125, -0.6222076416015625, -0.599578857421875, -0.5769500732421875, -0.5543212890625, -0.5316925048828125, -0.509063720703125, -0.4864349365234375, -0.46380615234375, -0.4411773681640625, -0.418548583984375, -0.3959197998046875, -0.373291015625, -0.3506622314453125, -0.328033447265625, -0.3054046630859375, -0.28277587890625, -0.2601470947265625, -0.237518310546875, -0.2148895263671875, -0.1922607421875, -0.1696319580078125, -0.147003173828125, -0.1243743896484375, -0.10174560546875, -0.0791168212890625, -0.056488037109375, -0.0338592529296875, -0.01123046875, 0.0113983154296875, 0.034027099609375, 0.0566558837890625, 0.07928466796875, 0.1019134521484375, 0.124542236328125, 0.1471710205078125, 0.1697998046875, 0.1924285888671875, 0.215057373046875, 0.2376861572265625, 0.26031494140625, 0.2829437255859375, 0.305572509765625, 0.3282012939453125, 0.350830078125, 0.3734588623046875, 0.396087646484375, 0.4187164306640625, 0.44134521484375, 0.4639739990234375, 0.486602783203125, 0.5092315673828125, 0.5318603515625, 0.5544891357421875, 0.577117919921875, 0.5997467041015625, 0.62237548828125, 0.6450042724609375, 0.667633056640625, 0.6902618408203125, 0.712890625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 4.0, 14.0, 13.0, 6.0, 7.0, 14.0, 20.0, 27.0, 27.0, 36.0, 39.0, 32.0, 40.0, 27.0, 27.0, 32.0, 37.0, 34.0, 33.0, 1067.0, 43.0, 24.0, 41.0, 41.0, 39.0, 40.0, 35.0, 39.0, 29.0, 21.0, 17.0, 28.0, 15.0, 16.0, 7.0, 6.0, 14.0, 4.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.40234375, -3.300872802734375, -3.19940185546875, -3.097930908203125, -2.9964599609375, -2.894989013671875, -2.79351806640625, -2.692047119140625, -2.590576171875, -2.489105224609375, -2.38763427734375, -2.286163330078125, -2.1846923828125, -2.083221435546875, -1.98175048828125, -1.880279541015625, -1.77880859375, -1.677337646484375, -1.57586669921875, -1.474395751953125, -1.3729248046875, -1.271453857421875, -1.16998291015625, -1.068511962890625, -0.967041015625, -0.865570068359375, -0.76409912109375, -0.662628173828125, -0.5611572265625, -0.459686279296875, -0.35821533203125, -0.256744384765625, -0.1552734375, -0.053802490234375, 0.04766845703125, 0.149139404296875, 0.2506103515625, 0.352081298828125, 0.45355224609375, 0.555023193359375, 0.656494140625, 0.757965087890625, 0.85943603515625, 0.960906982421875, 1.0623779296875, 1.163848876953125, 1.26531982421875, 1.366790771484375, 1.46826171875, 1.569732666015625, 1.67120361328125, 1.772674560546875, 1.8741455078125, 1.975616455078125, 2.07708740234375, 2.178558349609375, 2.280029296875, 2.381500244140625, 2.48297119140625, 2.584442138671875, 2.6859130859375, 2.787384033203125, 2.88885498046875, 2.990325927734375, 3.091796875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 5.0, 5.0, 14.0, 10.0, 17.0, 24.0, 32.0, 69.0, 102.0, 119.0, 194.0, 317.0, 471.0, 672.0, 1076.0, 1571.0, 2431.0, 3590.0, 5561.0, 8699.0, 13987.0, 23711.0, 43946.0, 1885280.0, 42724.0, 23504.0, 14191.0, 8663.0, 5543.0, 3623.0, 2376.0, 1515.0, 1068.0, 646.0, 441.0, 308.0, 216.0, 137.0, 102.0, 55.0, 40.0, 22.0, 23.0, 10.0, 5.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.609375, -1.562713623046875, -1.51605224609375, -1.469390869140625, -1.4227294921875, -1.376068115234375, -1.32940673828125, -1.282745361328125, -1.236083984375, -1.189422607421875, -1.14276123046875, -1.096099853515625, -1.0494384765625, -1.002777099609375, -0.95611572265625, -0.909454345703125, -0.86279296875, -0.816131591796875, -0.76947021484375, -0.722808837890625, -0.6761474609375, -0.629486083984375, -0.58282470703125, -0.536163330078125, -0.489501953125, -0.442840576171875, -0.39617919921875, -0.349517822265625, -0.3028564453125, -0.256195068359375, -0.20953369140625, -0.162872314453125, -0.1162109375, -0.069549560546875, -0.02288818359375, 0.023773193359375, 0.0704345703125, 0.117095947265625, 0.16375732421875, 0.210418701171875, 0.257080078125, 0.303741455078125, 0.35040283203125, 0.397064208984375, 0.4437255859375, 0.490386962890625, 0.53704833984375, 0.583709716796875, 0.63037109375, 0.677032470703125, 0.72369384765625, 0.770355224609375, 0.8170166015625, 0.863677978515625, 0.91033935546875, 0.957000732421875, 1.003662109375, 1.050323486328125, 1.09698486328125, 1.143646240234375, 1.1903076171875, 1.236968994140625, 1.28363037109375, 1.330291748046875, 1.376953125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 6.0, 5.0, 3.0, 4.0, 4.0, 8.0, 10.0, 19.0, 21.0, 12.0, 18.0, 31.0, 22.0, 31.0, 36.0, 36.0, 31.0, 48.0, 38.0, 44.0, 51.0, 49.0, 49.0, 48.0, 47.0, 44.0, 29.0, 42.0, 35.0, 30.0, 15.0, 19.0, 23.0, 19.0, 14.0, 13.0, 13.0, 9.0, 4.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01270294189453125, -0.012321233749389648, -0.011939525604248047, -0.011557817459106445, -0.011176109313964844, -0.010794401168823242, -0.01041269302368164, -0.010030984878540039, -0.009649276733398438, -0.009267568588256836, -0.008885860443115234, -0.008504152297973633, -0.008122444152832031, -0.00774073600769043, -0.007359027862548828, -0.0069773197174072266, -0.006595611572265625, -0.0062139034271240234, -0.005832195281982422, -0.00545048713684082, -0.005068778991699219, -0.004687070846557617, -0.004305362701416016, -0.003923654556274414, -0.0035419464111328125, -0.003160238265991211, -0.0027785301208496094, -0.002396821975708008, -0.0020151138305664062, -0.0016334056854248047, -0.0012516975402832031, -0.0008699893951416016, -0.00048828125, -0.00010657310485839844, 0.0002751350402832031, 0.0006568431854248047, 0.0010385513305664062, 0.0014202594757080078, 0.0018019676208496094, 0.002183675765991211, 0.0025653839111328125, 0.002947092056274414, 0.0033288002014160156, 0.003710508346557617, 0.004092216491699219, 0.00447392463684082, 0.004855632781982422, 0.0052373409271240234, 0.005619049072265625, 0.0060007572174072266, 0.006382465362548828, 0.00676417350769043, 0.007145881652832031, 0.007527589797973633, 0.007909297943115234, 0.008291006088256836, 0.008672714233398438, 0.009054422378540039, 0.00943613052368164, 0.009817838668823242, 0.010199546813964844, 0.010581254959106445, 0.010962963104248047, 0.011344671249389648, 0.01172637939453125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 6.0, 3.0, 4.0, 10.0, 8.0, 16.0, 19.0, 16.0, 26.0, 34.0, 44.0, 49.0, 56.0, 73.0, 112.0, 119.0, 196.0, 264.0, 407.0, 719.0, 2005.0, 147980.0, 887608.0, 6138.0, 919.0, 485.0, 348.0, 220.0, 154.0, 114.0, 74.0, 60.0, 50.0, 42.0, 37.0, 30.0, 21.0, 20.0, 9.0, 8.0, 13.0, 9.0, 8.0, 6.0, 5.0, 6.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.209228515625, -0.202301025390625, -0.19537353515625, -0.188446044921875, -0.1815185546875, -0.174591064453125, -0.16766357421875, -0.160736083984375, -0.15380859375, -0.146881103515625, -0.13995361328125, -0.133026123046875, -0.1260986328125, -0.119171142578125, -0.11224365234375, -0.105316162109375, -0.098388671875, -0.091461181640625, -0.08453369140625, -0.077606201171875, -0.0706787109375, -0.063751220703125, -0.05682373046875, -0.049896240234375, -0.04296875, -0.036041259765625, -0.02911376953125, -0.022186279296875, -0.0152587890625, -0.008331298828125, -0.00140380859375, 0.005523681640625, 0.012451171875, 0.019378662109375, 0.02630615234375, 0.033233642578125, 0.0401611328125, 0.047088623046875, 0.05401611328125, 0.060943603515625, 0.06787109375, 0.074798583984375, 0.08172607421875, 0.088653564453125, 0.0955810546875, 0.102508544921875, 0.10943603515625, 0.116363525390625, 0.123291015625, 0.130218505859375, 0.13714599609375, 0.144073486328125, 0.1510009765625, 0.157928466796875, 0.16485595703125, 0.171783447265625, 0.1787109375, 0.185638427734375, 0.19256591796875, 0.199493408203125, 0.2064208984375, 0.213348388671875, 0.22027587890625, 0.227203369140625, 0.234130859375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 522.0, 493.0, 1.0, 1.0], "bins": [-0.42400431632995605, -0.417055606842041, -0.410106897354126, -0.4031582176685333, -0.3962095081806183, -0.38926079869270325, -0.3823120892047882, -0.37536337971687317, -0.3684147000312805, -0.3614659905433655, -0.35451728105545044, -0.3475686013698578, -0.34061989188194275, -0.3336711823940277, -0.32672247290611267, -0.31977376341819763, -0.3128250539302826, -0.30587634444236755, -0.2989276349544525, -0.29197895526885986, -0.2850302457809448, -0.2780815362930298, -0.27113282680511475, -0.2641841173171997, -0.25723543763160706, -0.250286728143692, -0.24333803355693817, -0.23638932406902313, -0.2294406294822693, -0.22249191999435425, -0.2155432105064392, -0.20859451591968536, -0.20164580643177032, -0.19469709694385529, -0.18774840235710144, -0.1807996928691864, -0.17385099828243256, -0.16690228879451752, -0.15995359420776367, -0.15300488471984863, -0.1460561752319336, -0.13910746574401855, -0.1321587711572647, -0.12521006166934967, -0.11826135963201523, -0.11131265759468079, -0.10436395555734634, -0.0974152535200119, -0.09046654403209686, -0.08351784199476242, -0.07656913995742798, -0.06962043046951294, -0.0626717284321785, -0.055723026394844055, -0.04877432435750961, -0.04182561859488487, -0.03487692028284073, -0.027928216382861137, -0.020979512482881546, -0.014030810445547104, -0.0070821065455675125, -0.00013340264558792114, 0.006815299391746521, 0.013764005154371262, 0.020712707191705704]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 6.0, 8.0, 18.0, 14.0, 23.0, 23.0, 26.0, 30.0, 37.0, 50.0, 53.0, 50.0, 71.0, 60.0, 59.0, 51.0, 54.0, 60.0, 50.0, 57.0, 25.0, 41.0, 40.0, 21.0, 29.0, 14.0, 14.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015443086624145508, -0.014838527888059616, -0.014233969151973724, -0.013629410415887833, -0.013024851679801941, -0.01242029294371605, -0.011815734207630157, -0.011211175471544266, -0.010606616735458374, -0.010002057999372482, -0.00939749926328659, -0.008792940527200699, -0.008188381791114807, -0.007583823055028915, -0.006979264318943024, -0.006374705582857132, -0.00577014684677124, -0.0051655881106853485, -0.004561029374599457, -0.003956470638513565, -0.0033519119024276733, -0.0027473531663417816, -0.00214279443025589, -0.0015382356941699982, -0.0009336769580841064, -0.0003291182219982147, 0.000275440514087677, 0.0008799992501735687, 0.0014845579862594604, 0.002089116722345352, 0.002693675458431244, 0.0032982341945171356, 0.0039027929306030273, 0.004507351666688919, 0.005111910402774811, 0.0057164691388607025, 0.006321027874946594, 0.006925586611032486, 0.007530145347118378, 0.00813470408320427, 0.008739262819290161, 0.009343821555376053, 0.009948380291461945, 0.010552939027547836, 0.011157497763633728, 0.01176205649971962, 0.012366615235805511, 0.012971173971891403, 0.013575732707977295, 0.014180291444063187, 0.014784850180149078, 0.01538940891623497, 0.015993967652320862, 0.016598526388406754, 0.017203085124492645, 0.017807643860578537, 0.01841220259666443, 0.01901676133275032, 0.019621320068836212, 0.020225878804922104, 0.020830437541007996, 0.021434996277093887, 0.02203955501317978, 0.02264411374926567, 0.023248672485351562]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 3.0, 3.0, 0.0, 7.0, 6.0, 9.0, 4.0, 11.0, 19.0, 18.0, 20.0, 27.0, 32.0, 30.0, 31.0, 32.0, 36.0, 44.0, 38.0, 48.0, 44.0, 34.0, 40.0, 44.0, 52.0, 49.0, 40.0, 30.0, 24.0, 34.0, 33.0, 31.0, 26.0, 22.0, 16.0, 20.0, 8.0, 4.0, 11.0, 4.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.01953125, -4.8662109375, -4.712890625, -4.5595703125, -4.40625, -4.2529296875, -4.099609375, -3.9462890625, -3.79296875, -3.6396484375, -3.486328125, -3.3330078125, -3.1796875, -3.0263671875, -2.873046875, -2.7197265625, -2.56640625, -2.4130859375, -2.259765625, -2.1064453125, -1.953125, -1.7998046875, -1.646484375, -1.4931640625, -1.33984375, -1.1865234375, -1.033203125, -0.8798828125, -0.7265625, -0.5732421875, -0.419921875, -0.2666015625, -0.11328125, 0.0400390625, 0.193359375, 0.3466796875, 0.5, 0.6533203125, 0.806640625, 0.9599609375, 1.11328125, 1.2666015625, 1.419921875, 1.5732421875, 1.7265625, 1.8798828125, 2.033203125, 2.1865234375, 2.33984375, 2.4931640625, 2.646484375, 2.7998046875, 2.953125, 3.1064453125, 3.259765625, 3.4130859375, 3.56640625, 3.7197265625, 3.873046875, 4.0263671875, 4.1796875, 4.3330078125, 4.486328125, 4.6396484375, 4.79296875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 10.0, 9.0, 13.0, 18.0, 25.0, 33.0, 48.0, 57.0, 88.0, 104.0, 137.0, 204.0, 296.0, 397.0, 560.0, 827.0, 1292.0, 2227.0, 4410.0, 10106.0, 29223.0, 105053.0, 375932.0, 366882.0, 101571.0, 28319.0, 9996.0, 4416.0, 2196.0, 1257.0, 843.0, 594.0, 377.0, 272.0, 208.0, 143.0, 118.0, 78.0, 53.0, 38.0, 30.0, 29.0, 11.0, 16.0, 8.0, 4.0, 5.0, 5.0, 3.0, 2.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8515625, -5.65643310546875, -5.4613037109375, -5.26617431640625, -5.071044921875, -4.87591552734375, -4.6807861328125, -4.48565673828125, -4.29052734375, -4.09539794921875, -3.9002685546875, -3.70513916015625, -3.510009765625, -3.31488037109375, -3.1197509765625, -2.92462158203125, -2.7294921875, -2.53436279296875, -2.3392333984375, -2.14410400390625, -1.948974609375, -1.75384521484375, -1.5587158203125, -1.36358642578125, -1.16845703125, -0.97332763671875, -0.7781982421875, -0.58306884765625, -0.387939453125, -0.19281005859375, 0.0023193359375, 0.19744873046875, 0.392578125, 0.58770751953125, 0.7828369140625, 0.97796630859375, 1.173095703125, 1.36822509765625, 1.5633544921875, 1.75848388671875, 1.95361328125, 2.14874267578125, 2.3438720703125, 2.53900146484375, 2.734130859375, 2.92926025390625, 3.1243896484375, 3.31951904296875, 3.5146484375, 3.70977783203125, 3.9049072265625, 4.10003662109375, 4.295166015625, 4.49029541015625, 4.6854248046875, 4.88055419921875, 5.07568359375, 5.27081298828125, 5.4659423828125, 5.66107177734375, 5.856201171875, 6.05133056640625, 6.2464599609375, 6.44158935546875, 6.63671875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 6.0, 5.0, 9.0, 15.0, 10.0, 21.0, 24.0, 30.0, 24.0, 41.0, 44.0, 54.0, 57.0, 80.0, 133.0, 296.0, 1462.0, 230.0, 118.0, 63.0, 50.0, 42.0, 37.0, 33.0, 27.0, 25.0, 26.0, 10.0, 17.0, 10.0, 9.0, 8.0, 5.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-15.3046875, -14.8951416015625, -14.485595703125, -14.0760498046875, -13.66650390625, -13.2569580078125, -12.847412109375, -12.4378662109375, -12.0283203125, -11.6187744140625, -11.209228515625, -10.7996826171875, -10.39013671875, -9.9805908203125, -9.571044921875, -9.1614990234375, -8.751953125, -8.3424072265625, -7.932861328125, -7.5233154296875, -7.11376953125, -6.7042236328125, -6.294677734375, -5.8851318359375, -5.4755859375, -5.0660400390625, -4.656494140625, -4.2469482421875, -3.83740234375, -3.4278564453125, -3.018310546875, -2.6087646484375, -2.19921875, -1.7896728515625, -1.380126953125, -0.9705810546875, -0.56103515625, -0.1514892578125, 0.258056640625, 0.6676025390625, 1.0771484375, 1.4866943359375, 1.896240234375, 2.3057861328125, 2.71533203125, 3.1248779296875, 3.534423828125, 3.9439697265625, 4.353515625, 4.7630615234375, 5.172607421875, 5.5821533203125, 5.99169921875, 6.4012451171875, 6.810791015625, 7.2203369140625, 7.6298828125, 8.0394287109375, 8.448974609375, 8.8585205078125, 9.26806640625, 9.6776123046875, 10.087158203125, 10.4967041015625, 10.90625]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 6.0, 4.0, 13.0, 20.0, 23.0, 31.0, 48.0, 50.0, 67.0, 90.0, 164.0, 204.0, 322.0, 706.0, 2756.0, 1279455.0, 1856691.0, 3116.0, 762.0, 395.0, 227.0, 123.0, 105.0, 87.0, 56.0, 38.0, 26.0, 31.0, 19.0, 12.0, 14.0, 13.0, 7.0, 4.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.359375, -21.5888671875, -20.818359375, -20.0478515625, -19.27734375, -18.5068359375, -17.736328125, -16.9658203125, -16.1953125, -15.4248046875, -14.654296875, -13.8837890625, -13.11328125, -12.3427734375, -11.572265625, -10.8017578125, -10.03125, -9.2607421875, -8.490234375, -7.7197265625, -6.94921875, -6.1787109375, -5.408203125, -4.6376953125, -3.8671875, -3.0966796875, -2.326171875, -1.5556640625, -0.78515625, -0.0146484375, 0.755859375, 1.5263671875, 2.296875, 3.0673828125, 3.837890625, 4.6083984375, 5.37890625, 6.1494140625, 6.919921875, 7.6904296875, 8.4609375, 9.2314453125, 10.001953125, 10.7724609375, 11.54296875, 12.3134765625, 13.083984375, 13.8544921875, 14.625, 15.3955078125, 16.166015625, 16.9365234375, 17.70703125, 18.4775390625, 19.248046875, 20.0185546875, 20.7890625, 21.5595703125, 22.330078125, 23.1005859375, 23.87109375, 24.6416015625, 25.412109375, 26.1826171875, 26.953125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 15.0, 78.0, 221.0, 311.0, 248.0, 102.0, 21.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.46453285217285, -24.660200119018555, -22.85586929321289, -21.051536560058594, -19.247203826904297, -17.44287109375, -15.63853931427002, -13.834207534790039, -12.029874801635742, -10.225542068481445, -8.421210289001465, -6.616878032684326, -4.8125457763671875, -3.0082130432128906, -1.2038812637329102, 0.6004505157470703, 2.404783248901367, 4.209115505218506, 6.0134477615356445, 7.817780017852783, 9.622112274169922, 11.426445007324219, 13.2307767868042, 15.03510856628418, 16.839441299438477, 18.643774032592773, 20.448104858398438, 22.252437591552734, 24.05677032470703, 25.861103057861328, 27.665435791015625, 29.46976661682129, 31.27410125732422, 33.078433990478516, 34.88276672363281, 36.68709945678711, 38.491432189941406, 40.29576110839844, 42.100093841552734, 43.90442657470703, 45.70875930786133, 47.513092041015625, 49.31742477416992, 51.12175750732422, 52.92608642578125, 54.73042297363281, 56.534751892089844, 58.33908462524414, 60.14341735839844, 61.947750091552734, 63.75208282470703, 65.55641174316406, 67.36074829101562, 69.16507720947266, 70.96941375732422, 72.77374267578125, 74.57807922363281, 76.38240814208984, 78.1867446899414, 79.99107360839844, 81.79541015625, 83.59973907470703, 85.4040756225586, 87.20840454101562, 89.01273345947266]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 8.0, 4.0, 6.0, 11.0, 8.0, 10.0, 12.0, 30.0, 19.0, 35.0, 24.0, 42.0, 32.0, 41.0, 44.0, 41.0, 58.0, 45.0, 45.0, 45.0, 43.0, 45.0, 38.0, 45.0, 30.0, 33.0, 28.0, 30.0, 30.0, 25.0, 18.0, 14.0, 20.0, 9.0, 10.0, 6.0, 6.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-34.691532135009766, -33.714481353759766, -32.7374267578125, -31.7603759765625, -30.7833251953125, -29.8062744140625, -28.829221725463867, -27.852169036865234, -26.875118255615234, -25.898067474365234, -24.9210147857666, -23.94396209716797, -22.96691131591797, -21.98986053466797, -21.012807846069336, -20.035755157470703, -19.058704376220703, -18.081653594970703, -17.10460090637207, -16.127548217773438, -15.150497436523438, -14.173445701599121, -13.196393966674805, -12.219342231750488, -11.242290496826172, -10.265238761901855, -9.288187026977539, -8.311135292053223, -7.334083557128906, -6.35703182220459, -5.379980087280273, -4.402928352355957, -3.425874710083008, -2.4488229751586914, -1.471771240234375, -0.4947195053100586, 0.4823322296142578, 1.4593839645385742, 2.4364356994628906, 3.413487434387207, 4.390539169311523, 5.36759090423584, 6.344642639160156, 7.321694374084473, 8.298746109008789, 9.275797843933105, 10.252849578857422, 11.229901313781738, 12.206953048706055, 13.184004783630371, 14.161056518554688, 15.138108253479004, 16.11515998840332, 17.092212677001953, 18.069263458251953, 19.046314239501953, 20.023366928100586, 21.00041961669922, 21.97747039794922, 22.95452117919922, 23.93157386779785, 24.908626556396484, 25.885677337646484, 26.862728118896484, 27.839780807495117]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 2.0, 8.0, 8.0, 13.0, 19.0, 14.0, 20.0, 19.0, 27.0, 31.0, 27.0, 38.0, 34.0, 59.0, 43.0, 46.0, 42.0, 67.0, 47.0, 51.0, 46.0, 35.0, 33.0, 37.0, 41.0, 29.0, 24.0, 25.0, 9.0, 18.0, 20.0, 18.0, 10.0, 11.0, 7.0, 7.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.49609375, -5.31561279296875, -5.1351318359375, -4.95465087890625, -4.774169921875, -4.59368896484375, -4.4132080078125, -4.23272705078125, -4.05224609375, -3.87176513671875, -3.6912841796875, -3.51080322265625, -3.330322265625, -3.14984130859375, -2.9693603515625, -2.78887939453125, -2.6083984375, -2.42791748046875, -2.2474365234375, -2.06695556640625, -1.886474609375, -1.70599365234375, -1.5255126953125, -1.34503173828125, -1.16455078125, -0.98406982421875, -0.8035888671875, -0.62310791015625, -0.442626953125, -0.26214599609375, -0.0816650390625, 0.09881591796875, 0.279296875, 0.45977783203125, 0.6402587890625, 0.82073974609375, 1.001220703125, 1.18170166015625, 1.3621826171875, 1.54266357421875, 1.72314453125, 1.90362548828125, 2.0841064453125, 2.26458740234375, 2.445068359375, 2.62554931640625, 2.8060302734375, 2.98651123046875, 3.1669921875, 3.34747314453125, 3.5279541015625, 3.70843505859375, 3.888916015625, 4.06939697265625, 4.2498779296875, 4.43035888671875, 4.61083984375, 4.79132080078125, 4.9718017578125, 5.15228271484375, 5.332763671875, 5.51324462890625, 5.6937255859375, 5.87420654296875, 6.0546875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 10.0, 19.0, 15.0, 25.0, 32.0, 40.0, 51.0, 88.0, 127.0, 195.0, 272.0, 462.0, 792.0, 1754.0, 4861.0, 22804.0, 313091.0, 3266779.0, 538795.0, 32714.0, 6661.0, 2118.0, 1001.0, 533.0, 356.0, 205.0, 157.0, 99.0, 57.0, 51.0, 34.0, 16.0, 17.0, 11.0, 15.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.3125, -18.6123046875, -17.912109375, -17.2119140625, -16.51171875, -15.8115234375, -15.111328125, -14.4111328125, -13.7109375, -13.0107421875, -12.310546875, -11.6103515625, -10.91015625, -10.2099609375, -9.509765625, -8.8095703125, -8.109375, -7.4091796875, -6.708984375, -6.0087890625, -5.30859375, -4.6083984375, -3.908203125, -3.2080078125, -2.5078125, -1.8076171875, -1.107421875, -0.4072265625, 0.29296875, 0.9931640625, 1.693359375, 2.3935546875, 3.09375, 3.7939453125, 4.494140625, 5.1943359375, 5.89453125, 6.5947265625, 7.294921875, 7.9951171875, 8.6953125, 9.3955078125, 10.095703125, 10.7958984375, 11.49609375, 12.1962890625, 12.896484375, 13.5966796875, 14.296875, 14.9970703125, 15.697265625, 16.3974609375, 17.09765625, 17.7978515625, 18.498046875, 19.1982421875, 19.8984375, 20.5986328125, 21.298828125, 21.9990234375, 22.69921875, 23.3994140625, 24.099609375, 24.7998046875, 25.5]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 2.0, 11.0, 8.0, 31.0, 29.0, 64.0, 108.0, 156.0, 292.0, 498.0, 727.0, 761.0, 559.0, 333.0, 212.0, 113.0, 74.0, 38.0, 30.0, 10.0, 6.0, 9.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.296875, -18.7620849609375, -18.227294921875, -17.6925048828125, -17.15771484375, -16.6229248046875, -16.088134765625, -15.5533447265625, -15.0185546875, -14.4837646484375, -13.948974609375, -13.4141845703125, -12.87939453125, -12.3446044921875, -11.809814453125, -11.2750244140625, -10.740234375, -10.2054443359375, -9.670654296875, -9.1358642578125, -8.60107421875, -8.0662841796875, -7.531494140625, -6.9967041015625, -6.4619140625, -5.9271240234375, -5.392333984375, -4.8575439453125, -4.32275390625, -3.7879638671875, -3.253173828125, -2.7183837890625, -2.18359375, -1.6488037109375, -1.114013671875, -0.5792236328125, -0.04443359375, 0.4903564453125, 1.025146484375, 1.5599365234375, 2.0947265625, 2.6295166015625, 3.164306640625, 3.6990966796875, 4.23388671875, 4.7686767578125, 5.303466796875, 5.8382568359375, 6.373046875, 6.9078369140625, 7.442626953125, 7.9774169921875, 8.51220703125, 9.0469970703125, 9.581787109375, 10.1165771484375, 10.6513671875, 11.1861572265625, 11.720947265625, 12.2557373046875, 12.79052734375, 13.3253173828125, 13.860107421875, 14.3948974609375, 14.9296875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 1.0, 6.0, 9.0, 11.0, 19.0, 23.0, 87.0, 194.0, 472.0, 1478.0, 6970.0, 256197.0, 3892979.0, 31026.0, 3347.0, 900.0, 306.0, 137.0, 53.0, 22.0, 16.0, 8.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.8125, -43.57763671875, -42.3427734375, -41.10791015625, -39.873046875, -38.63818359375, -37.4033203125, -36.16845703125, -34.93359375, -33.69873046875, -32.4638671875, -31.22900390625, -29.994140625, -28.75927734375, -27.5244140625, -26.28955078125, -25.0546875, -23.81982421875, -22.5849609375, -21.35009765625, -20.115234375, -18.88037109375, -17.6455078125, -16.41064453125, -15.17578125, -13.94091796875, -12.7060546875, -11.47119140625, -10.236328125, -9.00146484375, -7.7666015625, -6.53173828125, -5.296875, -4.06201171875, -2.8271484375, -1.59228515625, -0.357421875, 0.87744140625, 2.1123046875, 3.34716796875, 4.58203125, 5.81689453125, 7.0517578125, 8.28662109375, 9.521484375, 10.75634765625, 11.9912109375, 13.22607421875, 14.4609375, 15.69580078125, 16.9306640625, 18.16552734375, 19.400390625, 20.63525390625, 21.8701171875, 23.10498046875, 24.33984375, 25.57470703125, 26.8095703125, 28.04443359375, 29.279296875, 30.51416015625, 31.7490234375, 32.98388671875, 34.21875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 19.0, 24.0, 39.0, 52.0, 89.0, 122.0, 141.0, 160.0, 142.0, 84.0, 45.0, 35.0, 15.0, 11.0, 6.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.17864227294922, -89.7169189453125, -86.25518798828125, -82.79346466064453, -79.33174133300781, -75.8700180053711, -72.40829467773438, -68.94656372070312, -65.4848403930664, -62.02311706542969, -58.5613899230957, -55.09966278076172, -51.637939453125, -48.17621612548828, -44.7144889831543, -41.25276184082031, -37.791038513183594, -34.329315185546875, -30.86758804321289, -27.40586280822754, -23.944137573242188, -20.482412338256836, -17.020687103271484, -13.558961868286133, -10.097236633300781, -6.63551139831543, -3.173786163330078, 0.28793907165527344, 3.749664306640625, 7.211389541625977, 10.673114776611328, 14.13484001159668, 17.5965576171875, 21.05828285217285, 24.520008087158203, 27.981733322143555, 31.443458557128906, 34.905181884765625, 38.36690902709961, 41.828636169433594, 45.29035949707031, 48.75208282470703, 52.213809967041016, 55.675537109375, 59.13726043701172, 62.59898376464844, 66.06071472167969, 69.5224380493164, 72.98416137695312, 76.44588470458984, 79.90760803222656, 83.36933898925781, 86.83106231689453, 90.29278564453125, 93.7545166015625, 97.21623992919922, 100.67796325683594, 104.13968658447266, 107.60140991210938, 111.06314086914062, 114.52486419677734, 117.98658752441406, 121.44831848144531, 124.91004180908203, 128.37176513671875]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 7.0, 14.0, 19.0, 17.0, 17.0, 24.0, 13.0, 25.0, 18.0, 25.0, 30.0, 38.0, 35.0, 40.0, 30.0, 36.0, 43.0, 31.0, 25.0, 36.0, 42.0, 32.0, 33.0, 34.0, 46.0, 37.0, 19.0, 23.0, 15.0, 15.0, 25.0, 18.0, 18.0, 22.0, 18.0, 12.0, 12.0, 13.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-39.833343505859375, -38.589176177978516, -37.345008850097656, -36.1008415222168, -34.85667419433594, -33.61250305175781, -32.36833572387695, -31.124168395996094, -29.880001068115234, -28.635833740234375, -27.391666412353516, -26.147497177124023, -24.903329849243164, -23.659162521362305, -22.414993286132812, -21.170825958251953, -19.926658630371094, -18.682491302490234, -17.438323974609375, -16.194154739379883, -14.949987411499023, -13.705820083618164, -12.461651802062988, -11.217483520507812, -9.973316192626953, -8.729148864746094, -7.484980583190918, -6.2408127784729, -4.996644973754883, -3.7524771690368652, -2.5083093643188477, -1.2641410827636719, -0.0199737548828125, 1.224194049835205, 2.4683618545532227, 3.7125296592712402, 4.956697463989258, 6.200865268707275, 7.445033073425293, 8.689201354980469, 9.933368682861328, 11.177536010742188, 12.421704292297363, 13.665872573852539, 14.910039901733398, 16.154207229614258, 17.39837646484375, 18.64254379272461, 19.88671112060547, 21.130878448486328, 22.375045776367188, 23.61921501159668, 24.86338233947754, 26.1075496673584, 27.35171890258789, 28.59588623046875, 29.84005355834961, 31.08422088623047, 32.32838821411133, 33.57255554199219, 34.81672668457031, 36.06089401245117, 37.30506134033203, 38.54922866821289, 39.79339599609375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 9.0, 8.0, 18.0, 16.0, 19.0, 13.0, 17.0, 28.0, 29.0, 31.0, 29.0, 37.0, 25.0, 40.0, 34.0, 33.0, 33.0, 41.0, 30.0, 39.0, 38.0, 30.0, 42.0, 37.0, 35.0, 34.0, 32.0, 17.0, 19.0, 26.0, 14.0, 20.0, 17.0, 17.0, 11.0, 16.0, 8.0, 8.0, 7.0, 5.0, 9.0, 7.0, 1.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-48.3125, -46.74462890625, -45.1767578125, -43.60888671875, -42.041015625, -40.47314453125, -38.9052734375, -37.33740234375, -35.76953125, -34.20166015625, -32.6337890625, -31.06591796875, -29.498046875, -27.93017578125, -26.3623046875, -24.79443359375, -23.2265625, -21.65869140625, -20.0908203125, -18.52294921875, -16.955078125, -15.38720703125, -13.8193359375, -12.25146484375, -10.68359375, -9.11572265625, -7.5478515625, -5.97998046875, -4.412109375, -2.84423828125, -1.2763671875, 0.29150390625, 1.859375, 3.42724609375, 4.9951171875, 6.56298828125, 8.130859375, 9.69873046875, 11.2666015625, 12.83447265625, 14.40234375, 15.97021484375, 17.5380859375, 19.10595703125, 20.673828125, 22.24169921875, 23.8095703125, 25.37744140625, 26.9453125, 28.51318359375, 30.0810546875, 31.64892578125, 33.216796875, 34.78466796875, 36.3525390625, 37.92041015625, 39.48828125, 41.05615234375, 42.6240234375, 44.19189453125, 45.759765625, 47.32763671875, 48.8955078125, 50.46337890625, 52.03125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 16.0, 13.0, 36.0, 44.0, 80.0, 124.0, 193.0, 291.0, 476.0, 688.0, 1054.0, 1481.0, 2280.0, 3477.0, 5107.0, 7575.0, 11162.0, 16227.0, 23204.0, 32871.0, 46211.0, 62453.0, 80963.0, 100004.0, 113183.0, 114962.0, 104267.0, 86311.0, 66578.0, 50125.0, 36297.0, 25526.0, 17935.0, 12131.0, 8296.0, 5703.0, 3729.0, 2512.0, 1686.0, 1100.0, 767.0, 497.0, 316.0, 209.0, 136.0, 97.0, 57.0, 32.0, 22.0, 19.0, 13.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.865234375, -3.741058349609375, -3.61688232421875, -3.492706298828125, -3.3685302734375, -3.244354248046875, -3.12017822265625, -2.996002197265625, -2.871826171875, -2.747650146484375, -2.62347412109375, -2.499298095703125, -2.3751220703125, -2.250946044921875, -2.12677001953125, -2.002593994140625, -1.87841796875, -1.754241943359375, -1.63006591796875, -1.505889892578125, -1.3817138671875, -1.257537841796875, -1.13336181640625, -1.009185791015625, -0.885009765625, -0.760833740234375, -0.63665771484375, -0.512481689453125, -0.3883056640625, -0.264129638671875, -0.13995361328125, -0.015777587890625, 0.1083984375, 0.232574462890625, 0.35675048828125, 0.480926513671875, 0.6051025390625, 0.729278564453125, 0.85345458984375, 0.977630615234375, 1.101806640625, 1.225982666015625, 1.35015869140625, 1.474334716796875, 1.5985107421875, 1.722686767578125, 1.84686279296875, 1.971038818359375, 2.09521484375, 2.219390869140625, 2.34356689453125, 2.467742919921875, 2.5919189453125, 2.716094970703125, 2.84027099609375, 2.964447021484375, 3.088623046875, 3.212799072265625, 3.33697509765625, 3.461151123046875, 3.5853271484375, 3.709503173828125, 3.83367919921875, 3.957855224609375, 4.08203125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 1.0, 5.0, 8.0, 8.0, 3.0, 9.0, 14.0, 10.0, 22.0, 18.0, 26.0, 18.0, 12.0, 22.0, 18.0, 36.0, 32.0, 24.0, 27.0, 40.0, 40.0, 40.0, 38.0, 1065.0, 41.0, 37.0, 29.0, 49.0, 26.0, 36.0, 40.0, 27.0, 22.0, 25.0, 14.0, 15.0, 23.0, 13.0, 13.0, 19.0, 14.0, 8.0, 10.0, 13.0, 2.0, 6.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.31884765625, -31.2939453125, -30.26904296875, -29.244140625, -28.21923828125, -27.1943359375, -26.16943359375, -25.14453125, -24.11962890625, -23.0947265625, -22.06982421875, -21.044921875, -20.02001953125, -18.9951171875, -17.97021484375, -16.9453125, -15.92041015625, -14.8955078125, -13.87060546875, -12.845703125, -11.82080078125, -10.7958984375, -9.77099609375, -8.74609375, -7.72119140625, -6.6962890625, -5.67138671875, -4.646484375, -3.62158203125, -2.5966796875, -1.57177734375, -0.546875, 0.47802734375, 1.5029296875, 2.52783203125, 3.552734375, 4.57763671875, 5.6025390625, 6.62744140625, 7.65234375, 8.67724609375, 9.7021484375, 10.72705078125, 11.751953125, 12.77685546875, 13.8017578125, 14.82666015625, 15.8515625, 16.87646484375, 17.9013671875, 18.92626953125, 19.951171875, 20.97607421875, 22.0009765625, 23.02587890625, 24.05078125, 25.07568359375, 26.1005859375, 27.12548828125, 28.150390625, 29.17529296875, 30.2001953125, 31.22509765625, 32.25]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 9.0, 17.0, 22.0, 33.0, 39.0, 69.0, 74.0, 94.0, 133.0, 231.0, 251.0, 376.0, 514.0, 754.0, 1062.0, 1416.0, 2178.0, 2998.0, 4343.0, 6170.0, 8816.0, 12621.0, 17948.0, 26638.0, 62648.0, 1841346.0, 33524.0, 21854.0, 15041.0, 10525.0, 7608.0, 5242.0, 3705.0, 2551.0, 1828.0, 1300.0, 860.0, 635.0, 481.0, 318.0, 240.0, 156.0, 134.0, 97.0, 71.0, 39.0, 44.0, 25.0, 21.0, 18.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0], "bins": [-10.7734375, -10.449462890625, -10.12548828125, -9.801513671875, -9.4775390625, -9.153564453125, -8.82958984375, -8.505615234375, -8.181640625, -7.857666015625, -7.53369140625, -7.209716796875, -6.8857421875, -6.561767578125, -6.23779296875, -5.913818359375, -5.58984375, -5.265869140625, -4.94189453125, -4.617919921875, -4.2939453125, -3.969970703125, -3.64599609375, -3.322021484375, -2.998046875, -2.674072265625, -2.35009765625, -2.026123046875, -1.7021484375, -1.378173828125, -1.05419921875, -0.730224609375, -0.40625, -0.082275390625, 0.24169921875, 0.565673828125, 0.8896484375, 1.213623046875, 1.53759765625, 1.861572265625, 2.185546875, 2.509521484375, 2.83349609375, 3.157470703125, 3.4814453125, 3.805419921875, 4.12939453125, 4.453369140625, 4.77734375, 5.101318359375, 5.42529296875, 5.749267578125, 6.0732421875, 6.397216796875, 6.72119140625, 7.045166015625, 7.369140625, 7.693115234375, 8.01708984375, 8.341064453125, 8.6650390625, 8.989013671875, 9.31298828125, 9.636962890625, 9.9609375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 4.0, 3.0, 8.0, 6.0, 5.0, 13.0, 10.0, 14.0, 15.0, 23.0, 21.0, 30.0, 54.0, 48.0, 51.0, 56.0, 58.0, 68.0, 64.0, 65.0, 50.0, 61.0, 42.0, 46.0, 29.0, 31.0, 21.0, 24.0, 9.0, 11.0, 10.0, 12.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.11834716796875, -0.1145315170288086, -0.11071586608886719, -0.10690021514892578, -0.10308456420898438, -0.09926891326904297, -0.09545326232910156, -0.09163761138916016, -0.08782196044921875, -0.08400630950927734, -0.08019065856933594, -0.07637500762939453, -0.07255935668945312, -0.06874370574951172, -0.06492805480957031, -0.061112403869628906, -0.0572967529296875, -0.053481101989746094, -0.04966545104980469, -0.04584980010986328, -0.042034149169921875, -0.03821849822998047, -0.03440284729003906, -0.030587196350097656, -0.02677154541015625, -0.022955894470214844, -0.019140243530273438, -0.015324592590332031, -0.011508941650390625, -0.007693290710449219, -0.0038776397705078125, -6.198883056640625e-05, 0.003753662109375, 0.007569313049316406, 0.011384963989257812, 0.015200614929199219, 0.019016265869140625, 0.02283191680908203, 0.026647567749023438, 0.030463218688964844, 0.03427886962890625, 0.038094520568847656, 0.04191017150878906, 0.04572582244873047, 0.049541473388671875, 0.05335712432861328, 0.05717277526855469, 0.060988426208496094, 0.0648040771484375, 0.0686197280883789, 0.07243537902832031, 0.07625102996826172, 0.08006668090820312, 0.08388233184814453, 0.08769798278808594, 0.09151363372802734, 0.09532928466796875, 0.09914493560791016, 0.10296058654785156, 0.10677623748779297, 0.11059188842773438, 0.11440753936767578, 0.11822319030761719, 0.1220388412475586, 0.1258544921875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 14.0, 21.0, 22.0, 23.0, 23.0, 46.0, 56.0, 87.0, 119.0, 204.0, 271.0, 475.0, 719.0, 1217.0, 2067.0, 4388.0, 10872.0, 33071.0, 116042.0, 328457.0, 354685.0, 134138.0, 38489.0, 12314.0, 4962.0, 2289.0, 1286.0, 723.0, 453.0, 311.0, 217.0, 151.0, 87.0, 57.0, 55.0, 35.0, 17.0, 19.0, 14.0, 14.0, 4.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6298828125, -0.6096038818359375, -0.589324951171875, -0.5690460205078125, -0.54876708984375, -0.5284881591796875, -0.508209228515625, -0.4879302978515625, -0.4676513671875, -0.4473724365234375, -0.427093505859375, -0.4068145751953125, -0.38653564453125, -0.3662567138671875, -0.345977783203125, -0.3256988525390625, -0.305419921875, -0.2851409912109375, -0.264862060546875, -0.2445831298828125, -0.22430419921875, -0.2040252685546875, -0.183746337890625, -0.1634674072265625, -0.1431884765625, -0.1229095458984375, -0.102630615234375, -0.0823516845703125, -0.06207275390625, -0.0417938232421875, -0.021514892578125, -0.0012359619140625, 0.01904296875, 0.0393218994140625, 0.059600830078125, 0.0798797607421875, 0.10015869140625, 0.1204376220703125, 0.140716552734375, 0.1609954833984375, 0.1812744140625, 0.2015533447265625, 0.221832275390625, 0.2421112060546875, 0.26239013671875, 0.2826690673828125, 0.302947998046875, 0.3232269287109375, 0.343505859375, 0.3637847900390625, 0.384063720703125, 0.4043426513671875, 0.42462158203125, 0.4449005126953125, 0.465179443359375, 0.4854583740234375, 0.5057373046875, 0.5260162353515625, 0.546295166015625, 0.5665740966796875, 0.58685302734375, 0.6071319580078125, 0.627410888671875, 0.6476898193359375, 0.66796875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 11.0, 14.0, 16.0, 18.0, 17.0, 32.0, 37.0, 46.0, 73.0, 75.0, 81.0, 89.0, 85.0, 82.0, 90.0, 53.0, 48.0, 35.0, 32.0, 19.0, 12.0, 10.0, 3.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.15420223772525787, -0.14940379559993744, -0.1446053683757782, -0.13980692625045776, -0.13500849902629852, -0.1302100569009781, -0.12541162967681885, -0.12061318755149841, -0.11581476032733917, -0.11101632565259933, -0.1062178909778595, -0.10141945630311966, -0.09662102162837982, -0.09182258695363998, -0.08702415227890015, -0.08222571015357971, -0.07742727547883987, -0.07262884080410004, -0.0678304061293602, -0.06303197145462036, -0.058233536779880524, -0.053435102105140686, -0.04863666370511055, -0.04383822903037071, -0.039039794355630875, -0.03424135968089104, -0.0294429250061512, -0.024644488468766212, -0.019846053794026375, -0.015047619119286537, -0.01024918258190155, -0.005450747907161713, -0.000652313232421875, 0.00414612190797925, 0.008944557048380375, 0.013742992654442787, 0.018541427329182625, 0.023339862003922462, 0.02813829854130745, 0.03293673321604729, 0.037735167890787125, 0.04253360256552696, 0.0473320372402668, 0.052130475640296936, 0.056928910315036774, 0.06172734498977661, 0.06652577966451645, 0.07132421433925629, 0.07612264901399612, 0.08092108368873596, 0.0857195183634758, 0.09051795303821564, 0.09531638771295547, 0.10011482238769531, 0.10491326451301575, 0.10971169173717499, 0.11451013386249542, 0.11930856853723526, 0.1241070032119751, 0.12890544533729553, 0.13370387256145477, 0.1385023146867752, 0.14330074191093445, 0.14809918403625488, 0.15289761126041412]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 11.0, 8.0, 12.0, 25.0, 17.0, 15.0, 18.0, 19.0, 28.0, 27.0, 35.0, 32.0, 40.0, 30.0, 42.0, 51.0, 40.0, 48.0, 43.0, 51.0, 46.0, 50.0, 31.0, 34.0, 32.0, 31.0, 28.0, 33.0, 25.0, 20.0, 17.0, 12.0, 10.0, 7.0, 5.0, 6.0, 5.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.11548370122909546, -0.11232256889343262, -0.10916143655776978, -0.10600029677152634, -0.1028391644358635, -0.09967803210020065, -0.09651689231395721, -0.09335575997829437, -0.09019462764263153, -0.08703349530696869, -0.08387236297130585, -0.08071122318506241, -0.07755009084939957, -0.07438895851373672, -0.07122781872749329, -0.06806668639183044, -0.0649055540561676, -0.06174442172050476, -0.05858328565955162, -0.05542214959859848, -0.05226101726293564, -0.0490998849272728, -0.045938748866319656, -0.042777612805366516, -0.039616480469703674, -0.03645534813404083, -0.03329421207308769, -0.0301330778747797, -0.02697194367647171, -0.02381080947816372, -0.020649675279855728, -0.017488541081547737, -0.014327406883239746, -0.011166272684931755, -0.008005138486623764, -0.004844004288315773, -0.001682870090007782, 0.001478264108300209, 0.0046393983066082, 0.007800532504916191, 0.010961666703224182, 0.014122800901532173, 0.017283935099840164, 0.020445069298148155, 0.023606203496456146, 0.026767337694764137, 0.02992847189307213, 0.03308960795402527, 0.03625074028968811, 0.03941187262535095, 0.04257300868630409, 0.04573414474725723, 0.048895277082920074, 0.052056409418582916, 0.055217545479536057, 0.0583786815404892, 0.06153981387615204, 0.06470094621181488, 0.06786207854747772, 0.07102321833372116, 0.074184350669384, 0.07734548300504684, 0.08050662279129028, 0.08366775512695312, 0.08682888746261597]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 7.0, 1.0, 4.0, 5.0, 5.0, 8.0, 11.0, 10.0, 17.0, 20.0, 23.0, 21.0, 24.0, 29.0, 31.0, 36.0, 34.0, 28.0, 22.0, 37.0, 39.0, 30.0, 35.0, 30.0, 41.0, 44.0, 36.0, 29.0, 41.0, 34.0, 31.0, 26.0, 33.0, 20.0, 25.0, 16.0, 15.0, 15.0, 12.0, 11.0, 11.0, 6.0, 9.0, 15.0, 10.0, 4.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-47.96875, -46.4248046875, -44.880859375, -43.3369140625, -41.79296875, -40.2490234375, -38.705078125, -37.1611328125, -35.6171875, -34.0732421875, -32.529296875, -30.9853515625, -29.44140625, -27.8974609375, -26.353515625, -24.8095703125, -23.265625, -21.7216796875, -20.177734375, -18.6337890625, -17.08984375, -15.5458984375, -14.001953125, -12.4580078125, -10.9140625, -9.3701171875, -7.826171875, -6.2822265625, -4.73828125, -3.1943359375, -1.650390625, -0.1064453125, 1.4375, 2.9814453125, 4.525390625, 6.0693359375, 7.61328125, 9.1572265625, 10.701171875, 12.2451171875, 13.7890625, 15.3330078125, 16.876953125, 18.4208984375, 19.96484375, 21.5087890625, 23.052734375, 24.5966796875, 26.140625, 27.6845703125, 29.228515625, 30.7724609375, 32.31640625, 33.8603515625, 35.404296875, 36.9482421875, 38.4921875, 40.0361328125, 41.580078125, 43.1240234375, 44.66796875, 46.2119140625, 47.755859375, 49.2998046875, 50.84375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 4.0, 3.0, 3.0, 9.0, 8.0, 4.0, 18.0, 27.0, 30.0, 35.0, 32.0, 36.0, 66.0, 76.0, 103.0, 141.0, 227.0, 433.0, 1080.0, 3713.0, 16468.0, 88349.0, 384859.0, 421093.0, 105851.0, 19113.0, 4288.0, 1187.0, 434.0, 251.0, 144.0, 97.0, 83.0, 59.0, 47.0, 38.0, 25.0, 16.0, 21.0, 13.0, 11.0, 16.0, 9.0, 4.0, 11.0, 3.0, 5.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0], "bins": [-9.78125, -9.47607421875, -9.1708984375, -8.86572265625, -8.560546875, -8.25537109375, -7.9501953125, -7.64501953125, -7.33984375, -7.03466796875, -6.7294921875, -6.42431640625, -6.119140625, -5.81396484375, -5.5087890625, -5.20361328125, -4.8984375, -4.59326171875, -4.2880859375, -3.98291015625, -3.677734375, -3.37255859375, -3.0673828125, -2.76220703125, -2.45703125, -2.15185546875, -1.8466796875, -1.54150390625, -1.236328125, -0.93115234375, -0.6259765625, -0.32080078125, -0.015625, 0.28955078125, 0.5947265625, 0.89990234375, 1.205078125, 1.51025390625, 1.8154296875, 2.12060546875, 2.42578125, 2.73095703125, 3.0361328125, 3.34130859375, 3.646484375, 3.95166015625, 4.2568359375, 4.56201171875, 4.8671875, 5.17236328125, 5.4775390625, 5.78271484375, 6.087890625, 6.39306640625, 6.6982421875, 7.00341796875, 7.30859375, 7.61376953125, 7.9189453125, 8.22412109375, 8.529296875, 8.83447265625, 9.1396484375, 9.44482421875, 9.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 8.0, 10.0, 7.0, 14.0, 12.0, 9.0, 16.0, 15.0, 22.0, 30.0, 34.0, 36.0, 38.0, 49.0, 70.0, 56.0, 61.0, 2090.0, 56.0, 44.0, 44.0, 34.0, 53.0, 39.0, 31.0, 39.0, 29.0, 25.0, 17.0, 14.0, 9.0, 10.0, 6.0, 8.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.1875, -84.421875, -81.65625, -78.890625, -76.125, -73.359375, -70.59375, -67.828125, -65.0625, -62.296875, -59.53125, -56.765625, -54.0, -51.234375, -48.46875, -45.703125, -42.9375, -40.171875, -37.40625, -34.640625, -31.875, -29.109375, -26.34375, -23.578125, -20.8125, -18.046875, -15.28125, -12.515625, -9.75, -6.984375, -4.21875, -1.453125, 1.3125, 4.078125, 6.84375, 9.609375, 12.375, 15.140625, 17.90625, 20.671875, 23.4375, 26.203125, 28.96875, 31.734375, 34.5, 37.265625, 40.03125, 42.796875, 45.5625, 48.328125, 51.09375, 53.859375, 56.625, 59.390625, 62.15625, 64.921875, 67.6875, 70.453125, 73.21875, 75.984375, 78.75, 81.515625, 84.28125, 87.046875, 89.8125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 11.0, 18.0, 23.0, 32.0, 39.0, 59.0, 99.0, 176.0, 292.0, 477.0, 862.0, 1737.0, 4339.0, 25209.0, 369088.0, 2678216.0, 53904.0, 6559.0, 2179.0, 1018.0, 547.0, 309.0, 186.0, 113.0, 66.0, 49.0, 21.0, 12.0, 13.0, 16.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.1484375, -12.7393798828125, -12.330322265625, -11.9212646484375, -11.51220703125, -11.1031494140625, -10.694091796875, -10.2850341796875, -9.8759765625, -9.4669189453125, -9.057861328125, -8.6488037109375, -8.23974609375, -7.8306884765625, -7.421630859375, -7.0125732421875, -6.603515625, -6.1944580078125, -5.785400390625, -5.3763427734375, -4.96728515625, -4.5582275390625, -4.149169921875, -3.7401123046875, -3.3310546875, -2.9219970703125, -2.512939453125, -2.1038818359375, -1.69482421875, -1.2857666015625, -0.876708984375, -0.4676513671875, -0.05859375, 0.3504638671875, 0.759521484375, 1.1685791015625, 1.57763671875, 1.9866943359375, 2.395751953125, 2.8048095703125, 3.2138671875, 3.6229248046875, 4.031982421875, 4.4410400390625, 4.85009765625, 5.2591552734375, 5.668212890625, 6.0772705078125, 6.486328125, 6.8953857421875, 7.304443359375, 7.7135009765625, 8.12255859375, 8.5316162109375, 8.940673828125, 9.3497314453125, 9.7587890625, 10.1678466796875, 10.576904296875, 10.9859619140625, 11.39501953125, 11.8040771484375, 12.213134765625, 12.6221923828125, 13.03125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 16.0, 20.0, 41.0, 49.0, 96.0, 125.0, 161.0, 158.0, 101.0, 84.0, 40.0, 23.0, 21.0, 9.0, 7.0, 6.0, 2.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.42304992675781, -112.64338684082031, -108.86373138427734, -105.08406829833984, -101.30440521240234, -97.52474975585938, -93.74508666992188, -89.96542358398438, -86.18576049804688, -82.40609741210938, -78.6264419555664, -74.8467788696289, -71.0671157836914, -67.28746032714844, -63.50779724121094, -59.72813415527344, -55.94847869873047, -52.168819427490234, -48.389156341552734, -44.6094970703125, -40.829833984375, -37.050174713134766, -33.27051544189453, -29.490854263305664, -25.711193084716797, -21.93153190612793, -18.151870727539062, -14.372211456298828, -10.592550277709961, -6.812889099121094, -3.0332298278808594, 0.7464313507080078, 4.526100158691406, 8.305761337280273, 12.085421562194824, 15.865081787109375, 19.644742965698242, 23.42440414428711, 27.204063415527344, 30.98372459411621, 34.76338577270508, 38.54304504394531, 42.32270812988281, 46.10236740112305, 49.88202667236328, 53.66168975830078, 57.441349029541016, 61.22100830078125, 65.00067138671875, 68.78033447265625, 72.55998992919922, 76.33965301513672, 80.11931610107422, 83.89897155761719, 87.67863464355469, 91.45829772949219, 95.23796081542969, 99.01762390136719, 102.79727935791016, 106.57694244384766, 110.35660552978516, 114.13626098632812, 117.91592407226562, 121.69558715820312, 125.4752426147461]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 4.0, 9.0, 12.0, 12.0, 9.0, 13.0, 14.0, 22.0, 21.0, 36.0, 38.0, 37.0, 29.0, 34.0, 30.0, 39.0, 42.0, 41.0, 44.0, 45.0, 39.0, 56.0, 31.0, 52.0, 43.0, 32.0, 23.0, 22.0, 25.0, 21.0, 22.0, 16.0, 15.0, 14.0, 6.0, 10.0, 7.0, 5.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.03158569335938, -89.88787841796875, -86.74417877197266, -83.60047149658203, -80.45677185058594, -77.31306457519531, -74.16935729980469, -71.0256576538086, -67.8819580078125, -64.73825073242188, -61.59455108642578, -58.450843811035156, -55.30714416503906, -52.16343688964844, -49.01973342895508, -45.87602996826172, -42.732322692871094, -39.588619232177734, -36.444915771484375, -33.30120849609375, -30.157506942749023, -27.013803482055664, -23.870098114013672, -20.726394653320312, -17.582691192626953, -14.438987731933594, -11.295283317565918, -8.151578903198242, -5.007875442504883, -1.8641719818115234, 1.2795333862304688, 4.423236846923828, 7.566932678222656, 10.710636138916016, 13.854340553283691, 16.998044967651367, 20.141748428344727, 23.285451889038086, 26.429157257080078, 29.572860717773438, 32.7165641784668, 35.860267639160156, 39.003971099853516, 42.147674560546875, 45.2913818359375, 48.435081481933594, 51.57878875732422, 54.72249221801758, 57.86619567871094, 61.0098991394043, 64.15360260009766, 67.29730987548828, 70.44100952148438, 73.584716796875, 76.72842407226562, 79.87212371826172, 83.01582336425781, 86.15953063964844, 89.30323028564453, 92.44693756103516, 95.59063720703125, 98.73434448242188, 101.8780517578125, 105.0217514038086, 108.16545867919922]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 14.0, 9.0, 18.0, 37.0, 54.0, 64.0, 82.0, 122.0, 165.0, 274.0, 326.0, 523.0, 762.0, 1072.0, 1645.0, 2557.0, 3957.0, 5873.0, 1009512.0, 7454.0, 4688.0, 3178.0, 2057.0, 1276.0, 875.0, 552.0, 404.0, 305.0, 203.0, 136.0, 105.0, 61.0, 57.0, 32.0, 27.0, 19.0, 16.0, 11.0, 3.0, 7.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.038135528564453, -18.375150680541992, -17.712167739868164, -17.049182891845703, -16.386199951171875, -15.723215103149414, -15.060230255126953, -14.397246360778809, -13.734262466430664, -13.07127857208252, -12.408294677734375, -11.745309829711914, -11.08232593536377, -10.419342041015625, -9.756357192993164, -9.09337329864502, -8.430389404296875, -7.7674055099487305, -7.104421138763428, -6.441436767578125, -5.7784528732299805, -5.115468978881836, -4.452484607696533, -3.7895002365112305, -3.126516342163086, -2.4635322093963623, -1.8005480766296387, -1.137563943862915, -0.4745798110961914, 0.18840432167053223, 0.8513884544372559, 1.5143728256225586, 2.177358627319336, 2.8403427600860596, 3.503326892852783, 4.166311264038086, 4.8292951583862305, 5.492279052734375, 6.155263423919678, 6.8182477951049805, 7.481231689453125, 8.14421558380127, 8.807199478149414, 9.470184326171875, 10.13316822052002, 10.796152114868164, 11.459136962890625, 12.12212085723877, 12.785104751586914, 13.448088645935059, 14.111072540283203, 14.774057388305664, 15.437041282653809, 16.100025177001953, 16.763010025024414, 17.425994873046875, 18.088977813720703, 18.751962661743164, 19.414945602416992, 20.077930450439453, 20.74091339111328, 21.403898239135742, 22.066883087158203, 22.72986602783203, 23.392850875854492]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 5.0, 9.0, 11.0, 17.0, 29.0, 39.0, 47.0, 73.0, 191.0, 1435.0, 51460328.0, 684.0, 122.0, 45.0, 17.0, 21.0, 11.0, 12.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-964.5, -930.5382690429688, -896.5765380859375, -862.6148071289062, -828.653076171875, -794.6912841796875, -760.7295532226562, -726.767822265625, -692.8060913085938, -658.8443603515625, -624.8826293945312, -590.9208984375, -556.9591064453125, -522.9974365234375, -489.03564453125, -455.07391357421875, -421.1121826171875, -387.15045166015625, -353.188720703125, -319.2269592285156, -285.2652282714844, -251.30349731445312, -217.3417510986328, -183.3800048828125, -149.41827392578125, -115.45653533935547, -81.49479675292969, -47.533058166503906, -13.571319580078125, 20.390411376953125, 54.35215759277344, 88.31390380859375, 122.275634765625, 156.23736572265625, 190.19911193847656, 224.16085815429688, 258.1225891113281, 292.0843200683594, 326.04608154296875, 360.0078125, 393.96954345703125, 427.9312744140625, 461.89300537109375, 495.8547668457031, 529.8165283203125, 563.7781982421875, 597.739990234375, 631.7017211914062, 665.6634521484375, 699.6251831054688, 733.5869140625, 767.5486450195312, 801.5103759765625, 835.47216796875, 869.4338989257812, 903.3956298828125, 937.3573608398438, 971.319091796875, 1005.2808227539062, 1039.2425537109375, 1073.204345703125, 1107.166015625, 1141.1278076171875, 1175.089599609375, 1209.05126953125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 22.0, 33.0, 70.0, 180.0, 346.0, 194.0, 72.0, 37.0, 18.0, 10.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-113.5955810546875, -110.7294921875, -107.86339569091797, -104.99730682373047, -102.13121795654297, -99.26512145996094, -96.39903259277344, -93.53294372558594, -90.6668472290039, -87.8007583618164, -84.93466186523438, -82.06857299804688, -79.20248413085938, -76.33638763427734, -73.47029876708984, -70.60420227050781, -67.73811340332031, -64.87202453613281, -62.00593185424805, -59.13983917236328, -56.273746490478516, -53.40765380859375, -50.54156494140625, -47.675472259521484, -44.80938720703125, -41.943294525146484, -39.077205657958984, -36.21111297607422, -33.34502029418945, -30.47892951965332, -27.612838745117188, -24.746746063232422, -21.880653381347656, -19.014562606811523, -16.148469924926758, -13.282379150390625, -10.416287422180176, -7.550195693969727, -4.684104919433594, -1.8180122375488281, 1.0480785369873047, 3.914170026779175, 6.780261516571045, 9.646352767944336, 12.512444496154785, 15.378536224365234, 18.244626998901367, 21.110719680786133, 23.976810455322266, 26.8429012298584, 29.708993911743164, 32.5750846862793, 35.44117736816406, 38.30726623535156, 41.17335891723633, 44.039451599121094, 46.905540466308594, 49.77163314819336, 52.63772201538086, 55.503814697265625, 58.36990737915039, 61.236000061035156, 64.10208892822266, 66.96818542480469, 69.83427429199219]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 9.0, 11.0, 10.0, 11.0, 26.0, 25.0, 26.0, 32.0, 46.0, 48.0, 51.0, 69.0, 53.0, 71.0, 72.0, 54.0, 44.0, 52.0, 45.0, 51.0, 29.0, 33.0, 18.0, 17.0, 15.0, 8.0, 8.0, 7.0, 9.0, 3.0, 4.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-57.838279724121094, -56.089500427246094, -54.340721130371094, -52.591941833496094, -50.843162536621094, -49.094383239746094, -47.345603942871094, -45.596824645996094, -43.848045349121094, -42.099266052246094, -40.350486755371094, -38.601707458496094, -36.852928161621094, -35.104148864746094, -33.355369567871094, -31.60658836364746, -29.857807159423828, -28.109027862548828, -26.360248565673828, -24.611469268798828, -22.862689971923828, -21.113910675048828, -19.365129470825195, -17.616350173950195, -15.867570877075195, -14.118791580200195, -12.370012283325195, -10.621232032775879, -8.872452735900879, -7.123673439025879, -5.3748931884765625, -3.6261138916015625, -1.8773345947265625, -0.1285550594329834, 1.6202244758605957, 3.369004249572754, 5.117783546447754, 6.866562843322754, 8.61534309387207, 10.36412239074707, 12.11290168762207, 13.86168098449707, 15.61046028137207, 17.359241485595703, 19.108020782470703, 20.856800079345703, 22.605579376220703, 24.354358673095703, 26.103137969970703, 27.851917266845703, 29.600696563720703, 31.349475860595703, 33.0982551574707, 34.8470344543457, 36.59581756591797, 38.34459686279297, 40.09337615966797, 41.84215545654297, 43.59093475341797, 45.33971405029297, 47.08849334716797, 48.83727264404297, 50.58605194091797, 52.33483123779297, 54.08361053466797]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 13.0, 6.0, 11.0, 5.0, 14.0, 10.0, 10.0, 16.0, 24.0, 32.0, 55.0, 59.0, 91.0, 127.0, 171.0, 208.0, 366.0, 540.0, 788.0, 1255.0, 2063.0, 3639.0, 7512.0, 18352.0, 66167.0, 3952202.0, 89889.0, 24273.0, 11202.0, 6029.0, 3481.0, 2129.0, 1317.0, 772.0, 503.0, 336.0, 189.0, 149.0, 97.0, 54.0, 44.0, 19.0, 25.0, 11.0, 12.0, 12.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.37890625, -2.308074951171875, -2.23724365234375, -2.166412353515625, -2.0955810546875, -2.024749755859375, -1.95391845703125, -1.883087158203125, -1.812255859375, -1.741424560546875, -1.67059326171875, -1.599761962890625, -1.5289306640625, -1.458099365234375, -1.38726806640625, -1.316436767578125, -1.24560546875, -1.174774169921875, -1.10394287109375, -1.033111572265625, -0.9622802734375, -0.891448974609375, -0.82061767578125, -0.749786376953125, -0.678955078125, -0.608123779296875, -0.53729248046875, -0.466461181640625, -0.3956298828125, -0.324798583984375, -0.25396728515625, -0.183135986328125, -0.1123046875, -0.041473388671875, 0.02935791015625, 0.100189208984375, 0.1710205078125, 0.241851806640625, 0.31268310546875, 0.383514404296875, 0.454345703125, 0.525177001953125, 0.59600830078125, 0.666839599609375, 0.7376708984375, 0.808502197265625, 0.87933349609375, 0.950164794921875, 1.02099609375, 1.091827392578125, 1.16265869140625, 1.233489990234375, 1.3043212890625, 1.375152587890625, 1.44598388671875, 1.516815185546875, 1.587646484375, 1.658477783203125, 1.72930908203125, 1.800140380859375, 1.8709716796875, 1.941802978515625, 2.01263427734375, 2.083465576171875, 2.154296875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 2.0, 7.0, 3.0, 8.0, 9.0, 10.0, 12.0, 17.0, 15.0, 34.0, 747.0, 24.0, 8.0, 14.0, 10.0, 6.0, 7.0, 7.0, 5.0, 7.0, 6.0, 5.0, 2.0, 7.0, 5.0, 3.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.42234039306640625, -0.4101104736328125, -0.39788055419921875, -0.385650634765625, -0.37342071533203125, -0.3611907958984375, -0.34896087646484375, -0.33673095703125, -0.32450103759765625, -0.3122711181640625, -0.30004119873046875, -0.287811279296875, -0.27558135986328125, -0.2633514404296875, -0.25112152099609375, -0.2388916015625, -0.22666168212890625, -0.2144317626953125, -0.20220184326171875, -0.189971923828125, -0.17774200439453125, -0.1655120849609375, -0.15328216552734375, -0.14105224609375, -0.12882232666015625, -0.1165924072265625, -0.10436248779296875, -0.092132568359375, -0.07990264892578125, -0.0676727294921875, -0.05544281005859375, -0.043212890625, -0.03098297119140625, -0.0187530517578125, -0.00652313232421875, 0.005706787109375, 0.01793670654296875, 0.0301666259765625, 0.04239654541015625, 0.05462646484375, 0.06685638427734375, 0.0790863037109375, 0.09131622314453125, 0.103546142578125, 0.11577606201171875, 0.1280059814453125, 0.14023590087890625, 0.1524658203125, 0.16469573974609375, 0.1769256591796875, 0.18915557861328125, 0.201385498046875, 0.21361541748046875, 0.2258453369140625, 0.23807525634765625, 0.25030517578125, 0.26253509521484375, 0.2747650146484375, 0.28699493408203125, 0.299224853515625, 0.31145477294921875, 0.3236846923828125, 0.33591461181640625, 0.34814453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 14.0, 19.0, 23.0, 31.0, 34.0, 59.0, 98.0, 127.0, 202.0, 336.0, 515.0, 921.0, 1567.0, 3068.0, 6583.0, 15242.0, 41908.0, 151267.0, 1692714.0, 2048697.0, 158677.0, 42979.0, 15521.0, 6609.0, 3134.0, 1640.0, 876.0, 505.0, 312.0, 200.0, 135.0, 79.0, 57.0, 45.0, 29.0, 19.0, 9.0, 5.0, 3.0, 4.0, 6.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93115234375, -0.8990554809570312, -0.8669586181640625, -0.8348617553710938, -0.802764892578125, -0.7706680297851562, -0.7385711669921875, -0.7064743041992188, -0.67437744140625, -0.6422805786132812, -0.6101837158203125, -0.5780868530273438, -0.545989990234375, -0.5138931274414062, -0.4817962646484375, -0.44969940185546875, -0.4176025390625, -0.38550567626953125, -0.3534088134765625, -0.32131195068359375, -0.289215087890625, -0.25711822509765625, -0.2250213623046875, -0.19292449951171875, -0.16082763671875, -0.12873077392578125, -0.0966339111328125, -0.06453704833984375, -0.032440185546875, -0.00034332275390625, 0.0317535400390625, 0.06385040283203125, 0.095947265625, 0.12804412841796875, 0.1601409912109375, 0.19223785400390625, 0.224334716796875, 0.25643157958984375, 0.2885284423828125, 0.32062530517578125, 0.35272216796875, 0.38481903076171875, 0.4169158935546875, 0.44901275634765625, 0.481109619140625, 0.5132064819335938, 0.5453033447265625, 0.5774002075195312, 0.6094970703125, 0.6415939331054688, 0.6736907958984375, 0.7057876586914062, 0.737884521484375, 0.7699813842773438, 0.8020782470703125, 0.8341751098632812, 0.86627197265625, 0.8983688354492188, 0.9304656982421875, 0.9625625610351562, 0.994659423828125, 1.0267562866210938, 1.0588531494140625, 1.0909500122070312, 1.123046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 12.0, 12.0, 27.0, 33.0, 31.0, 46.0, 84.0, 113.0, 195.0, 316.0, 823.0, 1334.0, 400.0, 187.0, 140.0, 86.0, 60.0, 52.0, 38.0, 18.0, 17.0, 18.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55810546875, -0.5426559448242188, -0.5272064208984375, -0.5117568969726562, -0.496307373046875, -0.48085784912109375, -0.4654083251953125, -0.44995880126953125, -0.43450927734375, -0.41905975341796875, -0.4036102294921875, -0.38816070556640625, -0.372711181640625, -0.35726165771484375, -0.3418121337890625, -0.32636260986328125, -0.3109130859375, -0.29546356201171875, -0.2800140380859375, -0.26456451416015625, -0.249114990234375, -0.23366546630859375, -0.2182159423828125, -0.20276641845703125, -0.18731689453125, -0.17186737060546875, -0.1564178466796875, -0.14096832275390625, -0.125518798828125, -0.11006927490234375, -0.0946197509765625, -0.07917022705078125, -0.063720703125, -0.04827117919921875, -0.0328216552734375, -0.01737213134765625, -0.001922607421875, 0.01352691650390625, 0.0289764404296875, 0.04442596435546875, 0.05987548828125, 0.07532501220703125, 0.0907745361328125, 0.10622406005859375, 0.121673583984375, 0.13712310791015625, 0.1525726318359375, 0.16802215576171875, 0.1834716796875, 0.19892120361328125, 0.2143707275390625, 0.22982025146484375, 0.245269775390625, 0.26071929931640625, 0.2761688232421875, 0.29161834716796875, 0.30706787109375, 0.32251739501953125, 0.3379669189453125, 0.35341644287109375, 0.368865966796875, 0.38431549072265625, 0.3997650146484375, 0.41521453857421875, 0.4306640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 8.0, 15.0, 20.0, 67.0, 108.0, 193.0, 215.0, 182.0, 93.0, 41.0, 23.0, 17.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.889422416687012, -4.779504299163818, -4.669586181640625, -4.559668064117432, -4.449749946594238, -4.339831829071045, -4.229913711547852, -4.119996070861816, -4.010077953338623, -3.9001598358154297, -3.7902417182922363, -3.680323600769043, -3.5704057216644287, -3.4604876041412354, -3.350569486618042, -3.2406513690948486, -3.130733013153076, -3.020814895629883, -2.9108967781066895, -2.800978660583496, -2.691060781478882, -2.5811426639556885, -2.471224546432495, -2.3613064289093018, -2.2513885498046875, -2.141470432281494, -2.031552314758301, -1.921634316444397, -1.8117161989212036, -1.7017982006072998, -1.5918800830841064, -1.481961965560913, -1.3720438480377197, -1.2621257305145264, -1.1522077322006226, -1.0422896146774292, -0.9323714971542358, -0.8224534392356873, -0.7125353813171387, -0.6026172637939453, -0.49269920587539673, -0.38278111815452576, -0.2728630304336548, -0.1629449725151062, -0.05302688479423523, 0.05689120292663574, 0.16680926084518433, 0.2767273783683777, 0.38664543628692627, 0.49656352400779724, 0.6064816117286682, 0.7163996696472168, 0.8263177871704102, 0.9362358450889587, 1.0461539030075073, 1.1560720205307007, 1.2659900188446045, 1.3759081363677979, 1.4858261346817017, 1.595744252204895, 1.7056623697280884, 1.8155803680419922, 1.9254984855651855, 2.035416603088379, 2.1453347206115723]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 6.0, 7.0, 9.0, 13.0, 15.0, 14.0, 13.0, 21.0, 27.0, 26.0, 32.0, 39.0, 41.0, 39.0, 56.0, 50.0, 56.0, 56.0, 61.0, 48.0, 51.0, 40.0, 40.0, 29.0, 39.0, 30.0, 21.0, 26.0, 23.0, 19.0, 10.0, 15.0, 7.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.381485939025879, -1.3311620950698853, -1.2808382511138916, -1.230514407157898, -1.1801905632019043, -1.1298668384552002, -1.079542875289917, -1.029219150543213, -0.9788953065872192, -0.9285714626312256, -0.8782476186752319, -0.8279237747192383, -0.7775999903678894, -0.7272761464118958, -0.6769523024559021, -0.6266285181045532, -0.5763046145439148, -0.5259807705879211, -0.4756569564342499, -0.4253331124782562, -0.37500929832458496, -0.3246854543685913, -0.27436161041259766, -0.2240377962589264, -0.17371395230293274, -0.12339012324810028, -0.07306628674268723, -0.02274245023727417, 0.02758137881755829, 0.07790520787239075, 0.1282290518283844, 0.17855286598205566, 0.22887670993804932, 0.27920055389404297, 0.32952436804771423, 0.3798482120037079, 0.43017202615737915, 0.4804958701133728, 0.5308197140693665, 0.5811434984207153, 0.631467342376709, 0.6817911863327026, 0.7321150302886963, 0.7824388742446899, 0.8327626585960388, 0.8830865025520325, 0.9334103465080261, 0.983734130859375, 1.0340580940246582, 1.0843819379806519, 1.1347057819366455, 1.1850296258926392, 1.2353534698486328, 1.285677194595337, 1.3360011577606201, 1.3863248825073242, 1.4366487264633179, 1.4869725704193115, 1.5372964143753052, 1.5876202583312988, 1.6379441022872925, 1.6882679462432861, 1.7385916709899902, 1.7889155149459839, 1.8392393589019775]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 16.0, 22.0, 34.0, 40.0, 54.0, 85.0, 131.0, 199.0, 280.0, 427.0, 629.0, 972.0, 1506.0, 2514.0, 3843.0, 6644.0, 11538.0, 20841.0, 44517.0, 795794.0, 97715.0, 25745.0, 13955.0, 8271.0, 4821.0, 2914.0, 1787.0, 1083.0, 737.0, 496.0, 327.0, 183.0, 135.0, 91.0, 55.0, 40.0, 41.0, 15.0, 16.0, 15.0, 6.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5, -1.4526519775390625, -1.405303955078125, -1.3579559326171875, -1.31060791015625, -1.2632598876953125, -1.215911865234375, -1.1685638427734375, -1.1212158203125, -1.0738677978515625, -1.026519775390625, -0.9791717529296875, -0.93182373046875, -0.8844757080078125, -0.837127685546875, -0.7897796630859375, -0.742431640625, -0.6950836181640625, -0.647735595703125, -0.6003875732421875, -0.55303955078125, -0.5056915283203125, -0.458343505859375, -0.4109954833984375, -0.3636474609375, -0.3162994384765625, -0.268951416015625, -0.2216033935546875, -0.17425537109375, -0.1269073486328125, -0.079559326171875, -0.0322113037109375, 0.01513671875, 0.0624847412109375, 0.109832763671875, 0.1571807861328125, 0.20452880859375, 0.2518768310546875, 0.299224853515625, 0.3465728759765625, 0.3939208984375, 0.4412689208984375, 0.488616943359375, 0.5359649658203125, 0.58331298828125, 0.6306610107421875, 0.678009033203125, 0.7253570556640625, 0.772705078125, 0.8200531005859375, 0.867401123046875, 0.9147491455078125, 0.96209716796875, 1.0094451904296875, 1.056793212890625, 1.1041412353515625, 1.1514892578125, 1.1988372802734375, 1.246185302734375, 1.2935333251953125, 1.34088134765625, 1.3882293701171875, 1.435577392578125, 1.4829254150390625, 1.5302734375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 6.0, 13.0, 10.0, 15.0, 14.0, 39.0, 331.0, 400.0, 43.0, 16.0, 10.0, 7.0, 6.0, 5.0, 9.0, 3.0, 7.0, 3.0, 4.0, 8.0, 3.0, 6.0, 5.0, 0.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.43994140625, -0.4277763366699219, -0.41561126708984375, -0.4034461975097656, -0.3912811279296875, -0.3791160583496094, -0.36695098876953125, -0.3547859191894531, -0.342620849609375, -0.3304557800292969, -0.31829071044921875, -0.3061256408691406, -0.2939605712890625, -0.2817955017089844, -0.26963043212890625, -0.2574653625488281, -0.24530029296875, -0.23313522338867188, -0.22097015380859375, -0.20880508422851562, -0.1966400146484375, -0.18447494506835938, -0.17230987548828125, -0.16014480590820312, -0.147979736328125, -0.13581466674804688, -0.12364959716796875, -0.11148452758789062, -0.0993194580078125, -0.08715438842773438, -0.07498931884765625, -0.06282424926757812, -0.0506591796875, -0.038494110107421875, -0.02632904052734375, -0.014163970947265625, -0.0019989013671875, 0.010166168212890625, 0.02233123779296875, 0.034496307373046875, 0.046661376953125, 0.058826446533203125, 0.07099151611328125, 0.08315658569335938, 0.0953216552734375, 0.10748672485351562, 0.11965179443359375, 0.13181686401367188, 0.14398193359375, 0.15614700317382812, 0.16831207275390625, 0.18047714233398438, 0.1926422119140625, 0.20480728149414062, 0.21697235107421875, 0.22913742065429688, 0.241302490234375, 0.2534675598144531, 0.26563262939453125, 0.2777976989746094, 0.2899627685546875, 0.3021278381347656, 0.31429290771484375, 0.3264579772949219, 0.338623046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 11.0, 9.0, 21.0, 19.0, 30.0, 26.0, 63.0, 80.0, 130.0, 180.0, 276.0, 433.0, 717.0, 1436.0, 2926.0, 6638.0, 16232.0, 48034.0, 199312.0, 517057.0, 182182.0, 44825.0, 15336.0, 6300.0, 2814.0, 1473.0, 768.0, 428.0, 259.0, 182.0, 116.0, 73.0, 56.0, 33.0, 18.0, 20.0, 9.0, 8.0, 9.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-1.6953125, -1.6512451171875, -1.607177734375, -1.5631103515625, -1.51904296875, -1.4749755859375, -1.430908203125, -1.3868408203125, -1.3427734375, -1.2987060546875, -1.254638671875, -1.2105712890625, -1.16650390625, -1.1224365234375, -1.078369140625, -1.0343017578125, -0.990234375, -0.9461669921875, -0.902099609375, -0.8580322265625, -0.81396484375, -0.7698974609375, -0.725830078125, -0.6817626953125, -0.6376953125, -0.5936279296875, -0.549560546875, -0.5054931640625, -0.46142578125, -0.4173583984375, -0.373291015625, -0.3292236328125, -0.28515625, -0.2410888671875, -0.197021484375, -0.1529541015625, -0.10888671875, -0.0648193359375, -0.020751953125, 0.0233154296875, 0.0673828125, 0.1114501953125, 0.155517578125, 0.1995849609375, 0.24365234375, 0.2877197265625, 0.331787109375, 0.3758544921875, 0.419921875, 0.4639892578125, 0.508056640625, 0.5521240234375, 0.59619140625, 0.6402587890625, 0.684326171875, 0.7283935546875, 0.7724609375, 0.8165283203125, 0.860595703125, 0.9046630859375, 0.94873046875, 0.9927978515625, 1.036865234375, 1.0809326171875, 1.125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 0.0, 6.0, 3.0, 4.0, 2.0, 2.0, 9.0, 2.0, 14.0, 11.0, 15.0, 12.0, 15.0, 16.0, 20.0, 26.0, 27.0, 35.0, 25.0, 25.0, 40.0, 36.0, 46.0, 27.0, 40.0, 40.0, 36.0, 41.0, 42.0, 28.0, 37.0, 31.0, 37.0, 23.0, 26.0, 23.0, 26.0, 21.0, 19.0, 20.0, 11.0, 13.0, 11.0, 15.0, 12.0, 8.0, 10.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.3271484375, -1.285430908203125, -1.24371337890625, -1.201995849609375, -1.1602783203125, -1.118560791015625, -1.07684326171875, -1.035125732421875, -0.993408203125, -0.951690673828125, -0.90997314453125, -0.868255615234375, -0.8265380859375, -0.784820556640625, -0.74310302734375, -0.701385498046875, -0.65966796875, -0.617950439453125, -0.57623291015625, -0.534515380859375, -0.4927978515625, -0.451080322265625, -0.40936279296875, -0.367645263671875, -0.325927734375, -0.284210205078125, -0.24249267578125, -0.200775146484375, -0.1590576171875, -0.117340087890625, -0.07562255859375, -0.033905029296875, 0.0078125, 0.049530029296875, 0.09124755859375, 0.132965087890625, 0.1746826171875, 0.216400146484375, 0.25811767578125, 0.299835205078125, 0.341552734375, 0.383270263671875, 0.42498779296875, 0.466705322265625, 0.5084228515625, 0.550140380859375, 0.59185791015625, 0.633575439453125, 0.67529296875, 0.717010498046875, 0.75872802734375, 0.800445556640625, 0.8421630859375, 0.883880615234375, 0.92559814453125, 0.967315673828125, 1.009033203125, 1.050750732421875, 1.09246826171875, 1.134185791015625, 1.1759033203125, 1.217620849609375, 1.25933837890625, 1.301055908203125, 1.3427734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 8.0, 25.0, 21.0, 26.0, 47.0, 49.0, 90.0, 168.0, 341.0, 838.0, 2576.0, 11220.0, 350163.0, 665388.0, 12869.0, 2841.0, 964.0, 415.0, 182.0, 98.0, 76.0, 39.0, 37.0, 20.0, 6.0, 16.0, 3.0, 1.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.171875, -9.864013671875, -9.55615234375, -9.248291015625, -8.9404296875, -8.632568359375, -8.32470703125, -8.016845703125, -7.708984375, -7.401123046875, -7.09326171875, -6.785400390625, -6.4775390625, -6.169677734375, -5.86181640625, -5.553955078125, -5.24609375, -4.938232421875, -4.63037109375, -4.322509765625, -4.0146484375, -3.706787109375, -3.39892578125, -3.091064453125, -2.783203125, -2.475341796875, -2.16748046875, -1.859619140625, -1.5517578125, -1.243896484375, -0.93603515625, -0.628173828125, -0.3203125, -0.012451171875, 0.29541015625, 0.603271484375, 0.9111328125, 1.218994140625, 1.52685546875, 1.834716796875, 2.142578125, 2.450439453125, 2.75830078125, 3.066162109375, 3.3740234375, 3.681884765625, 3.98974609375, 4.297607421875, 4.60546875, 4.913330078125, 5.22119140625, 5.529052734375, 5.8369140625, 6.144775390625, 6.45263671875, 6.760498046875, 7.068359375, 7.376220703125, 7.68408203125, 7.991943359375, 8.2998046875, 8.607666015625, 8.91552734375, 9.223388671875, 9.53125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 3.0, 10.0, 14.0, 26.0, 40.0, 53.0, 97.0, 157.0, 197.0, 160.0, 80.0, 51.0, 34.0, 20.0, 13.0, 12.0, 14.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002732276916503906, -0.00026153773069381714, -0.00024984776973724365, -0.00023815780878067017, -0.00022646784782409668, -0.0002147778868675232, -0.0002030879259109497, -0.00019139796495437622, -0.00017970800399780273, -0.00016801804304122925, -0.00015632808208465576, -0.00014463812112808228, -0.0001329481601715088, -0.0001212581992149353, -0.00010956823825836182, -9.787827730178833e-05, -8.618831634521484e-05, -7.449835538864136e-05, -6.280839443206787e-05, -5.1118433475494385e-05, -3.94284725189209e-05, -2.7738511562347412e-05, -1.6048550605773926e-05, -4.3585896492004395e-06, 7.331371307373047e-06, 1.9021332263946533e-05, 3.071129322052002e-05, 4.2401254177093506e-05, 5.409121513366699e-05, 6.578117609024048e-05, 7.747113704681396e-05, 8.916109800338745e-05, 0.00010085105895996094, 0.00011254101991653442, 0.0001242309808731079, 0.0001359209418296814, 0.00014761090278625488, 0.00015930086374282837, 0.00017099082469940186, 0.00018268078565597534, 0.00019437074661254883, 0.00020606070756912231, 0.0002177506685256958, 0.0002294406294822693, 0.00024113059043884277, 0.00025282055139541626, 0.00026451051235198975, 0.00027620047330856323, 0.0002878904342651367, 0.0002995803952217102, 0.0003112703561782837, 0.0003229603171348572, 0.00033465027809143066, 0.00034634023904800415, 0.00035803020000457764, 0.0003697201609611511, 0.0003814101219177246, 0.0003931000828742981, 0.0004047900438308716, 0.00041648000478744507, 0.00042816996574401855, 0.00043985992670059204, 0.00045154988765716553, 0.000463239848613739, 0.0004749298095703125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 5.0, 8.0, 9.0, 20.0, 30.0, 59.0, 77.0, 121.0, 197.0, 368.0, 792.0, 1848.0, 4884.0, 17520.0, 131284.0, 805969.0, 67050.0, 11739.0, 3644.0, 1409.0, 662.0, 354.0, 196.0, 114.0, 63.0, 36.0, 26.0, 16.0, 13.0, 9.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.3984375, -4.27044677734375, -4.1424560546875, -4.01446533203125, -3.886474609375, -3.75848388671875, -3.6304931640625, -3.50250244140625, -3.37451171875, -3.24652099609375, -3.1185302734375, -2.99053955078125, -2.862548828125, -2.73455810546875, -2.6065673828125, -2.47857666015625, -2.3505859375, -2.22259521484375, -2.0946044921875, -1.96661376953125, -1.838623046875, -1.71063232421875, -1.5826416015625, -1.45465087890625, -1.32666015625, -1.19866943359375, -1.0706787109375, -0.94268798828125, -0.814697265625, -0.68670654296875, -0.5587158203125, -0.43072509765625, -0.302734375, -0.17474365234375, -0.0467529296875, 0.08123779296875, 0.209228515625, 0.33721923828125, 0.4652099609375, 0.59320068359375, 0.72119140625, 0.84918212890625, 0.9771728515625, 1.10516357421875, 1.233154296875, 1.36114501953125, 1.4891357421875, 1.61712646484375, 1.7451171875, 1.87310791015625, 2.0010986328125, 2.12908935546875, 2.257080078125, 2.38507080078125, 2.5130615234375, 2.64105224609375, 2.76904296875, 2.89703369140625, 3.0250244140625, 3.15301513671875, 3.281005859375, 3.40899658203125, 3.5369873046875, 3.66497802734375, 3.79296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 7.0, 12.0, 7.0, 10.0, 10.0, 18.0, 24.0, 21.0, 34.0, 44.0, 87.0, 83.0, 128.0, 104.0, 102.0, 81.0, 52.0, 45.0, 30.0, 22.0, 13.0, 12.0, 14.0, 7.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.748046875, -2.662872314453125, -2.57769775390625, -2.492523193359375, -2.4073486328125, -2.322174072265625, -2.23699951171875, -2.151824951171875, -2.066650390625, -1.981475830078125, -1.89630126953125, -1.811126708984375, -1.7259521484375, -1.640777587890625, -1.55560302734375, -1.470428466796875, -1.38525390625, -1.300079345703125, -1.21490478515625, -1.129730224609375, -1.0445556640625, -0.959381103515625, -0.87420654296875, -0.789031982421875, -0.703857421875, -0.618682861328125, -0.53350830078125, -0.448333740234375, -0.3631591796875, -0.277984619140625, -0.19281005859375, -0.107635498046875, -0.0224609375, 0.062713623046875, 0.14788818359375, 0.233062744140625, 0.3182373046875, 0.403411865234375, 0.48858642578125, 0.573760986328125, 0.658935546875, 0.744110107421875, 0.82928466796875, 0.914459228515625, 0.9996337890625, 1.084808349609375, 1.16998291015625, 1.255157470703125, 1.34033203125, 1.425506591796875, 1.51068115234375, 1.595855712890625, 1.6810302734375, 1.766204833984375, 1.85137939453125, 1.936553955078125, 2.021728515625, 2.106903076171875, 2.19207763671875, 2.277252197265625, 2.3624267578125, 2.447601318359375, 2.53277587890625, 2.617950439453125, 2.703125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 5.0, 7.0, 14.0, 20.0, 31.0, 87.0, 176.0, 252.0, 225.0, 92.0, 43.0, 12.0, 12.0, 9.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.25713348388672, -36.31671142578125, -35.376285552978516, -34.43586349487305, -33.49544143676758, -32.555015563964844, -31.614593505859375, -30.674171447753906, -29.733747482299805, -28.793323516845703, -27.852901458740234, -26.912477493286133, -25.97205352783203, -25.031631469726562, -24.09120750427246, -23.15078353881836, -22.21036148071289, -21.26993751525879, -20.32951545715332, -19.38909149169922, -18.44866943359375, -17.50824546813965, -16.567821502685547, -15.627398490905762, -14.686975479125977, -13.746552467346191, -12.806129455566406, -11.865705490112305, -10.92528247833252, -9.984859466552734, -9.044435501098633, -8.104012489318848, -7.1635894775390625, -6.223166465759277, -5.282742977142334, -4.342319488525391, -3.4018964767456055, -2.4614734649658203, -1.521049976348877, -0.5806264877319336, 0.35979652404785156, 1.3002197742462158, 2.24064302444458, 3.1810662746429443, 4.121489524841309, 5.061912536621094, 6.002336025238037, 6.9427595138549805, 7.883182525634766, 8.82360553741455, 9.764028549194336, 10.704452514648438, 11.644875526428223, 12.585298538208008, 13.52572250366211, 14.466145515441895, 15.40656852722168, 16.34699249267578, 17.28741455078125, 18.22783851623535, 19.168262481689453, 20.108684539794922, 21.049108505249023, 21.989532470703125, 22.929954528808594]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 11.0, 8.0, 15.0, 16.0, 33.0, 41.0, 84.0, 101.0, 125.0, 130.0, 135.0, 97.0, 62.0, 32.0, 24.0, 11.0, 12.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.282602310180664, -26.354427337646484, -25.426254272460938, -24.498079299926758, -23.569904327392578, -22.6417293548584, -21.71355438232422, -20.785381317138672, -19.857206344604492, -18.929031372070312, -18.000858306884766, -17.072683334350586, -16.144508361816406, -15.216333389282227, -14.288159370422363, -13.3599853515625, -12.43181037902832, -11.50363540649414, -10.575461387634277, -9.647287368774414, -8.719112396240234, -7.790937900543213, -6.862763404846191, -5.93458890914917, -5.006414413452148, -4.078239917755127, -3.1500654220581055, -2.221890926361084, -1.2937164306640625, -0.365541934967041, 0.5626325607299805, 1.490807056427002, 2.4189834594726562, 3.3471579551696777, 4.275332450866699, 5.203506946563721, 6.131681442260742, 7.059855937957764, 7.988030433654785, 8.916204452514648, 9.844379425048828, 10.772554397583008, 11.700728416442871, 12.628902435302734, 13.557077407836914, 14.485252380371094, 15.413426399230957, 16.34160041809082, 17.269775390625, 18.19795036315918, 19.12612533569336, 20.054298400878906, 20.982473373413086, 21.910648345947266, 22.838821411132812, 23.766996383666992, 24.695171356201172, 25.62334632873535, 26.55152130126953, 27.479694366455078, 28.407869338989258, 29.336044311523438, 30.264217376708984, 31.192392349243164, 32.120567321777344]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 10.0, 16.0, 17.0, 28.0, 43.0, 60.0, 105.0, 141.0, 238.0, 424.0, 731.0, 1533.0, 3355.0, 9848.0, 48544.0, 3906869.0, 189997.0, 20418.0, 6110.0, 2568.0, 1216.0, 669.0, 440.0, 287.0, 180.0, 129.0, 77.0, 58.0, 40.0, 29.0, 22.0, 14.0, 13.0, 7.0, 5.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.70703125, -4.5587158203125, -4.410400390625, -4.2620849609375, -4.11376953125, -3.9654541015625, -3.817138671875, -3.6688232421875, -3.5205078125, -3.3721923828125, -3.223876953125, -3.0755615234375, -2.92724609375, -2.7789306640625, -2.630615234375, -2.4822998046875, -2.333984375, -2.1856689453125, -2.037353515625, -1.8890380859375, -1.74072265625, -1.5924072265625, -1.444091796875, -1.2957763671875, -1.1474609375, -0.9991455078125, -0.850830078125, -0.7025146484375, -0.55419921875, -0.4058837890625, -0.257568359375, -0.1092529296875, 0.0390625, 0.1873779296875, 0.335693359375, 0.4840087890625, 0.63232421875, 0.7806396484375, 0.928955078125, 1.0772705078125, 1.2255859375, 1.3739013671875, 1.522216796875, 1.6705322265625, 1.81884765625, 1.9671630859375, 2.115478515625, 2.2637939453125, 2.412109375, 2.5604248046875, 2.708740234375, 2.8570556640625, 3.00537109375, 3.1536865234375, 3.302001953125, 3.4503173828125, 3.5986328125, 3.7469482421875, 3.895263671875, 4.0435791015625, 4.19189453125, 4.3402099609375, 4.488525390625, 4.6368408203125, 4.78515625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 12.0, 5.0, 9.0, 14.0, 18.0, 50.0, 149.0, 297.0, 233.0, 98.0, 25.0, 12.0, 8.0, 5.0, 9.0, 13.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406982421875, -0.3929023742675781, -0.37882232666015625, -0.3647422790527344, -0.3506622314453125, -0.3365821838378906, -0.32250213623046875, -0.3084220886230469, -0.294342041015625, -0.2802619934082031, -0.26618194580078125, -0.2521018981933594, -0.2380218505859375, -0.22394180297851562, -0.20986175537109375, -0.19578170776367188, -0.18170166015625, -0.16762161254882812, -0.15354156494140625, -0.13946151733398438, -0.1253814697265625, -0.11130142211914062, -0.09722137451171875, -0.08314132690429688, -0.069061279296875, -0.054981231689453125, -0.04090118408203125, -0.026821136474609375, -0.0127410888671875, 0.001338958740234375, 0.01541900634765625, 0.029499053955078125, 0.0435791015625, 0.057659149169921875, 0.07173919677734375, 0.08581924438476562, 0.0998992919921875, 0.11397933959960938, 0.12805938720703125, 0.14213943481445312, 0.156219482421875, 0.17029953002929688, 0.18437957763671875, 0.19845962524414062, 0.2125396728515625, 0.22661972045898438, 0.24069976806640625, 0.2547798156738281, 0.26885986328125, 0.2829399108886719, 0.29701995849609375, 0.3111000061035156, 0.3251800537109375, 0.3392601013183594, 0.35334014892578125, 0.3674201965332031, 0.381500244140625, 0.3955802917480469, 0.40966033935546875, 0.4237403869628906, 0.4378204345703125, 0.4519004821777344, 0.46598052978515625, 0.4800605773925781, 0.494140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 7.0, 3.0, 6.0, 9.0, 9.0, 25.0, 28.0, 37.0, 59.0, 76.0, 155.0, 259.0, 519.0, 1171.0, 2747.0, 8121.0, 29808.0, 194198.0, 3644880.0, 261563.0, 35124.0, 9516.0, 3232.0, 1361.0, 573.0, 336.0, 171.0, 93.0, 68.0, 41.0, 27.0, 12.0, 13.0, 10.0, 4.0, 4.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.986328125, -2.904632568359375, -2.82293701171875, -2.741241455078125, -2.6595458984375, -2.577850341796875, -2.49615478515625, -2.414459228515625, -2.332763671875, -2.251068115234375, -2.16937255859375, -2.087677001953125, -2.0059814453125, -1.924285888671875, -1.84259033203125, -1.760894775390625, -1.67919921875, -1.597503662109375, -1.51580810546875, -1.434112548828125, -1.3524169921875, -1.270721435546875, -1.18902587890625, -1.107330322265625, -1.025634765625, -0.943939208984375, -0.86224365234375, -0.780548095703125, -0.6988525390625, -0.617156982421875, -0.53546142578125, -0.453765869140625, -0.3720703125, -0.290374755859375, -0.20867919921875, -0.126983642578125, -0.0452880859375, 0.036407470703125, 0.11810302734375, 0.199798583984375, 0.281494140625, 0.363189697265625, 0.44488525390625, 0.526580810546875, 0.6082763671875, 0.689971923828125, 0.77166748046875, 0.853363037109375, 0.93505859375, 1.016754150390625, 1.09844970703125, 1.180145263671875, 1.2618408203125, 1.343536376953125, 1.42523193359375, 1.506927490234375, 1.588623046875, 1.670318603515625, 1.75201416015625, 1.833709716796875, 1.9154052734375, 1.997100830078125, 2.07879638671875, 2.160491943359375, 2.2421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 9.0, 13.0, 23.0, 20.0, 39.0, 60.0, 120.0, 291.0, 922.0, 1793.0, 391.0, 159.0, 82.0, 49.0, 25.0, 19.0, 16.0, 7.0, 9.0, 10.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.67236328125, -0.6542510986328125, -0.636138916015625, -0.6180267333984375, -0.59991455078125, -0.5818023681640625, -0.563690185546875, -0.5455780029296875, -0.5274658203125, -0.5093536376953125, -0.491241455078125, -0.4731292724609375, -0.45501708984375, -0.4369049072265625, -0.418792724609375, -0.4006805419921875, -0.382568359375, -0.3644561767578125, -0.346343994140625, -0.3282318115234375, -0.31011962890625, -0.2920074462890625, -0.273895263671875, -0.2557830810546875, -0.2376708984375, -0.2195587158203125, -0.201446533203125, -0.1833343505859375, -0.16522216796875, -0.1471099853515625, -0.128997802734375, -0.1108856201171875, -0.0927734375, -0.0746612548828125, -0.056549072265625, -0.0384368896484375, -0.02032470703125, -0.0022125244140625, 0.015899658203125, 0.0340118408203125, 0.0521240234375, 0.0702362060546875, 0.088348388671875, 0.1064605712890625, 0.12457275390625, 0.1426849365234375, 0.160797119140625, 0.1789093017578125, 0.197021484375, 0.2151336669921875, 0.233245849609375, 0.2513580322265625, 0.26947021484375, 0.2875823974609375, 0.305694580078125, 0.3238067626953125, 0.3419189453125, 0.3600311279296875, 0.378143310546875, 0.3962554931640625, 0.41436767578125, 0.4324798583984375, 0.450592041015625, 0.4687042236328125, 0.48681640625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 22.0, 76.0, 385.0, 400.0, 86.0, 23.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.294368267059326, -5.098230838775635, -4.902093410491943, -4.70595645904541, -4.509819030761719, -4.313681602478027, -4.117544174194336, -3.9214069843292236, -3.7252697944641113, -3.52913236618042, -3.3329951763153076, -3.136857748031616, -2.940720558166504, -2.7445831298828125, -2.548445701599121, -2.352308511734009, -2.1561710834503174, -1.9600337743759155, -1.7638964653015137, -1.5677590370178223, -1.37162184715271, -1.1754844188690186, -0.9793471097946167, -0.7832098007202148, -0.587072491645813, -0.39093518257141113, -0.1947978436946869, 0.0013394951820373535, 0.1974768042564392, 0.39361411333084106, 0.5897514820098877, 0.7858887910842896, 0.9820261001586914, 1.1781634092330933, 1.3743007183074951, 1.5704381465911865, 1.7665753364562988, 1.9627127647399902, 2.1588501930236816, 2.354987382888794, 2.5511245727539062, 2.7472620010375977, 2.94339919090271, 3.1395366191864014, 3.3356738090515137, 3.531811237335205, 3.7279486656188965, 3.924085855484009, 4.120223045349121, 4.3163604736328125, 4.512497901916504, 4.708634853363037, 4.9047722816467285, 5.10090970993042, 5.297047138214111, 5.4931840896606445, 5.689321994781494, 5.8854594230651855, 6.081596851348877, 6.27773380279541, 6.473871231079102, 6.670008659362793, 6.866146087646484, 7.062283515930176, 7.258420467376709]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 10.0, 10.0, 14.0, 20.0, 34.0, 42.0, 58.0, 98.0, 112.0, 114.0, 93.0, 75.0, 86.0, 68.0, 42.0, 31.0, 23.0, 12.0, 13.0, 7.0, 5.0, 7.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.57211971282959, -2.493805170059204, -2.4154906272888184, -2.3371763229370117, -2.258861780166626, -2.1805472373962402, -2.1022326946258545, -2.0239181518554688, -1.9456037282943726, -1.8672891855239868, -1.7889747619628906, -1.7106602191925049, -1.6323456764221191, -1.554031252861023, -1.4757167100906372, -1.397402286529541, -1.3190877437591553, -1.2407732009887695, -1.1624587774276733, -1.0841442346572876, -1.0058298110961914, -0.9275152683258057, -0.8492007255554199, -0.770886242389679, -0.692571759223938, -0.614257276058197, -0.535942792892456, -0.4576282501220703, -0.37931376695632935, -0.3009992837905884, -0.22268477082252502, -0.14437025785446167, -0.0660555362701416, 0.012258961796760559, 0.09057345986366272, 0.16888795793056488, 0.24720245599746704, 0.325516939163208, 0.40383145213127136, 0.4821459650993347, 0.5604604482650757, 0.6387749314308167, 0.7170894145965576, 0.7954039573669434, 0.8737184405326843, 0.9520329236984253, 1.030347466468811, 1.1086618900299072, 1.186976432800293, 1.2652909755706787, 1.343605399131775, 1.4219199419021606, 1.5002343654632568, 1.5785489082336426, 1.6568634510040283, 1.735177993774414, 1.8134924173355103, 1.891806960105896, 1.9701213836669922, 2.048435926437378, 2.1267504692077637, 2.2050647735595703, 2.283379316329956, 2.361693859100342, 2.4400084018707275]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 4.0, 5.0, 13.0, 14.0, 25.0, 28.0, 46.0, 57.0, 72.0, 119.0, 180.0, 279.0, 389.0, 616.0, 882.0, 1481.0, 2437.0, 4294.0, 7889.0, 15913.0, 39820.0, 279346.0, 587013.0, 63819.0, 20816.0, 9875.0, 5179.0, 2965.0, 1764.0, 1031.0, 710.0, 487.0, 283.0, 233.0, 134.0, 97.0, 74.0, 46.0, 32.0, 16.0, 24.0, 11.0, 7.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.01171875, -1.949188232421875, -1.88665771484375, -1.824127197265625, -1.7615966796875, -1.699066162109375, -1.63653564453125, -1.574005126953125, -1.511474609375, -1.448944091796875, -1.38641357421875, -1.323883056640625, -1.2613525390625, -1.198822021484375, -1.13629150390625, -1.073760986328125, -1.01123046875, -0.948699951171875, -0.88616943359375, -0.823638916015625, -0.7611083984375, -0.698577880859375, -0.63604736328125, -0.573516845703125, -0.510986328125, -0.448455810546875, -0.38592529296875, -0.323394775390625, -0.2608642578125, -0.198333740234375, -0.13580322265625, -0.073272705078125, -0.0107421875, 0.051788330078125, 0.11431884765625, 0.176849365234375, 0.2393798828125, 0.301910400390625, 0.36444091796875, 0.426971435546875, 0.489501953125, 0.552032470703125, 0.61456298828125, 0.677093505859375, 0.7396240234375, 0.802154541015625, 0.86468505859375, 0.927215576171875, 0.98974609375, 1.052276611328125, 1.11480712890625, 1.177337646484375, 1.2398681640625, 1.302398681640625, 1.36492919921875, 1.427459716796875, 1.489990234375, 1.552520751953125, 1.61505126953125, 1.677581787109375, 1.7401123046875, 1.802642822265625, 1.86517333984375, 1.927703857421875, 1.990234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 13.0, 9.0, 6.0, 9.0, 18.0, 40.0, 105.0, 219.0, 261.0, 153.0, 69.0, 18.0, 16.0, 3.0, 8.0, 1.0, 5.0, 11.0, 2.0, 7.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34912109375, -0.33725738525390625, -0.3253936767578125, -0.31352996826171875, -0.301666259765625, -0.28980255126953125, -0.2779388427734375, -0.26607513427734375, -0.25421142578125, -0.24234771728515625, -0.2304840087890625, -0.21862030029296875, -0.206756591796875, -0.19489288330078125, -0.1830291748046875, -0.17116546630859375, -0.1593017578125, -0.14743804931640625, -0.1355743408203125, -0.12371063232421875, -0.111846923828125, -0.09998321533203125, -0.0881195068359375, -0.07625579833984375, -0.06439208984375, -0.05252838134765625, -0.0406646728515625, -0.02880096435546875, -0.016937255859375, -0.00507354736328125, 0.0067901611328125, 0.01865386962890625, 0.030517578125, 0.04238128662109375, 0.0542449951171875, 0.06610870361328125, 0.077972412109375, 0.08983612060546875, 0.1016998291015625, 0.11356353759765625, 0.12542724609375, 0.13729095458984375, 0.1491546630859375, 0.16101837158203125, 0.172882080078125, 0.18474578857421875, 0.1966094970703125, 0.20847320556640625, 0.2203369140625, 0.23220062255859375, 0.2440643310546875, 0.25592803955078125, 0.267791748046875, 0.27965545654296875, 0.2915191650390625, 0.30338287353515625, 0.31524658203125, 0.32711029052734375, 0.3389739990234375, 0.35083770751953125, 0.362701416015625, 0.37456512451171875, 0.3864288330078125, 0.39829254150390625, 0.41015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 11.0, 6.0, 7.0, 11.0, 25.0, 29.0, 46.0, 72.0, 103.0, 157.0, 289.0, 536.0, 970.0, 2167.0, 5381.0, 16035.0, 57350.0, 251193.0, 490243.0, 165882.0, 38865.0, 11500.0, 4152.0, 1675.0, 770.0, 404.0, 225.0, 147.0, 105.0, 64.0, 35.0, 28.0, 13.0, 11.0, 8.0, 8.0, 7.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5791015625, -1.53314208984375, -1.4871826171875, -1.44122314453125, -1.395263671875, -1.34930419921875, -1.3033447265625, -1.25738525390625, -1.21142578125, -1.16546630859375, -1.1195068359375, -1.07354736328125, -1.027587890625, -0.98162841796875, -0.9356689453125, -0.88970947265625, -0.84375, -0.79779052734375, -0.7518310546875, -0.70587158203125, -0.659912109375, -0.61395263671875, -0.5679931640625, -0.52203369140625, -0.47607421875, -0.43011474609375, -0.3841552734375, -0.33819580078125, -0.292236328125, -0.24627685546875, -0.2003173828125, -0.15435791015625, -0.1083984375, -0.06243896484375, -0.0164794921875, 0.02947998046875, 0.075439453125, 0.12139892578125, 0.1673583984375, 0.21331787109375, 0.25927734375, 0.30523681640625, 0.3511962890625, 0.39715576171875, 0.443115234375, 0.48907470703125, 0.5350341796875, 0.58099365234375, 0.626953125, 0.67291259765625, 0.7188720703125, 0.76483154296875, 0.810791015625, 0.85675048828125, 0.9027099609375, 0.94866943359375, 0.99462890625, 1.04058837890625, 1.0865478515625, 1.13250732421875, 1.178466796875, 1.22442626953125, 1.2703857421875, 1.31634521484375, 1.3623046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 4.0, 8.0, 15.0, 6.0, 17.0, 8.0, 17.0, 16.0, 24.0, 22.0, 30.0, 35.0, 35.0, 30.0, 39.0, 37.0, 42.0, 52.0, 45.0, 51.0, 33.0, 54.0, 43.0, 34.0, 36.0, 36.0, 30.0, 25.0, 27.0, 22.0, 19.0, 19.0, 17.0, 11.0, 9.0, 7.0, 6.0, 8.0, 5.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.177734375, -1.144287109375, -1.11083984375, -1.077392578125, -1.0439453125, -1.010498046875, -0.97705078125, -0.943603515625, -0.91015625, -0.876708984375, -0.84326171875, -0.809814453125, -0.7763671875, -0.742919921875, -0.70947265625, -0.676025390625, -0.642578125, -0.609130859375, -0.57568359375, -0.542236328125, -0.5087890625, -0.475341796875, -0.44189453125, -0.408447265625, -0.375, -0.341552734375, -0.30810546875, -0.274658203125, -0.2412109375, -0.207763671875, -0.17431640625, -0.140869140625, -0.107421875, -0.073974609375, -0.04052734375, -0.007080078125, 0.0263671875, 0.059814453125, 0.09326171875, 0.126708984375, 0.16015625, 0.193603515625, 0.22705078125, 0.260498046875, 0.2939453125, 0.327392578125, 0.36083984375, 0.394287109375, 0.427734375, 0.461181640625, 0.49462890625, 0.528076171875, 0.5615234375, 0.594970703125, 0.62841796875, 0.661865234375, 0.6953125, 0.728759765625, 0.76220703125, 0.795654296875, 0.8291015625, 0.862548828125, 0.89599609375, 0.929443359375, 0.962890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 12.0, 11.0, 24.0, 24.0, 68.0, 106.0, 271.0, 667.0, 2453.0, 24268.0, 979736.0, 36520.0, 3044.0, 755.0, 293.0, 127.0, 77.0, 38.0, 20.0, 13.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6875, -9.3704833984375, -9.053466796875, -8.7364501953125, -8.41943359375, -8.1024169921875, -7.785400390625, -7.4683837890625, -7.1513671875, -6.8343505859375, -6.517333984375, -6.2003173828125, -5.88330078125, -5.5662841796875, -5.249267578125, -4.9322509765625, -4.615234375, -4.2982177734375, -3.981201171875, -3.6641845703125, -3.34716796875, -3.0301513671875, -2.713134765625, -2.3961181640625, -2.0791015625, -1.7620849609375, -1.445068359375, -1.1280517578125, -0.81103515625, -0.4940185546875, -0.177001953125, 0.1400146484375, 0.45703125, 0.7740478515625, 1.091064453125, 1.4080810546875, 1.72509765625, 2.0421142578125, 2.359130859375, 2.6761474609375, 2.9931640625, 3.3101806640625, 3.627197265625, 3.9442138671875, 4.26123046875, 4.5782470703125, 4.895263671875, 5.2122802734375, 5.529296875, 5.8463134765625, 6.163330078125, 6.4803466796875, 6.79736328125, 7.1143798828125, 7.431396484375, 7.7484130859375, 8.0654296875, 8.3824462890625, 8.699462890625, 9.0164794921875, 9.33349609375, 9.6505126953125, 9.967529296875, 10.2845458984375, 10.6015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 16.0, 14.0, 27.0, 23.0, 55.0, 81.0, 116.0, 175.0, 167.0, 112.0, 86.0, 56.0, 26.0, 18.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002315044403076172, -0.0002234838902950287, -0.00021546334028244019, -0.00020744279026985168, -0.00019942224025726318, -0.00019140169024467468, -0.00018338114023208618, -0.00017536059021949768, -0.00016734004020690918, -0.00015931949019432068, -0.00015129894018173218, -0.00014327839016914368, -0.00013525784015655518, -0.00012723729014396667, -0.00011921674013137817, -0.00011119619011878967, -0.00010317564010620117, -9.515509009361267e-05, -8.713454008102417e-05, -7.911399006843567e-05, -7.109344005584717e-05, -6.307289004325867e-05, -5.5052340030670166e-05, -4.7031790018081665e-05, -3.9011240005493164e-05, -3.099068999290466e-05, -2.2970139980316162e-05, -1.4949589967727661e-05, -6.92903995513916e-06, 1.0915100574493408e-06, 9.112060070037842e-06, 1.7132610082626343e-05, 2.5153160095214844e-05, 3.3173710107803345e-05, 4.1194260120391846e-05, 4.921481013298035e-05, 5.723536014556885e-05, 6.525591015815735e-05, 7.327646017074585e-05, 8.129701018333435e-05, 8.931756019592285e-05, 9.733811020851135e-05, 0.00010535866022109985, 0.00011337921023368835, 0.00012139976024627686, 0.00012942031025886536, 0.00013744086027145386, 0.00014546141028404236, 0.00015348196029663086, 0.00016150251030921936, 0.00016952306032180786, 0.00017754361033439636, 0.00018556416034698486, 0.00019358471035957336, 0.00020160526037216187, 0.00020962581038475037, 0.00021764636039733887, 0.00022566691040992737, 0.00023368746042251587, 0.00024170801043510437, 0.00024972856044769287, 0.00025774911046028137, 0.0002657696604728699, 0.0002737902104854584, 0.0002818107604980469]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 6.0, 10.0, 14.0, 31.0, 48.0, 63.0, 122.0, 198.0, 374.0, 916.0, 3653.0, 26867.0, 897129.0, 108933.0, 7460.0, 1601.0, 605.0, 216.0, 102.0, 87.0, 49.0, 26.0, 14.0, 6.0, 7.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.48828125, -7.28436279296875, -7.0804443359375, -6.87652587890625, -6.672607421875, -6.46868896484375, -6.2647705078125, -6.06085205078125, -5.85693359375, -5.65301513671875, -5.4490966796875, -5.24517822265625, -5.041259765625, -4.83734130859375, -4.6334228515625, -4.42950439453125, -4.2255859375, -4.02166748046875, -3.8177490234375, -3.61383056640625, -3.409912109375, -3.20599365234375, -3.0020751953125, -2.79815673828125, -2.59423828125, -2.39031982421875, -2.1864013671875, -1.98248291015625, -1.778564453125, -1.57464599609375, -1.3707275390625, -1.16680908203125, -0.962890625, -0.75897216796875, -0.5550537109375, -0.35113525390625, -0.147216796875, 0.05670166015625, 0.2606201171875, 0.46453857421875, 0.66845703125, 0.87237548828125, 1.0762939453125, 1.28021240234375, 1.484130859375, 1.68804931640625, 1.8919677734375, 2.09588623046875, 2.2998046875, 2.50372314453125, 2.7076416015625, 2.91156005859375, 3.115478515625, 3.31939697265625, 3.5233154296875, 3.72723388671875, 3.93115234375, 4.13507080078125, 4.3389892578125, 4.54290771484375, 4.746826171875, 4.95074462890625, 5.1546630859375, 5.35858154296875, 5.5625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 9.0, 8.0, 16.0, 30.0, 50.0, 127.0, 327.0, 246.0, 107.0, 34.0, 18.0, 11.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.8515625, -7.67645263671875, -7.5013427734375, -7.32623291015625, -7.151123046875, -6.97601318359375, -6.8009033203125, -6.62579345703125, -6.45068359375, -6.27557373046875, -6.1004638671875, -5.92535400390625, -5.750244140625, -5.57513427734375, -5.4000244140625, -5.22491455078125, -5.0498046875, -4.87469482421875, -4.6995849609375, -4.52447509765625, -4.349365234375, -4.17425537109375, -3.9991455078125, -3.82403564453125, -3.64892578125, -3.47381591796875, -3.2987060546875, -3.12359619140625, -2.948486328125, -2.77337646484375, -2.5982666015625, -2.42315673828125, -2.248046875, -2.07293701171875, -1.8978271484375, -1.72271728515625, -1.547607421875, -1.37249755859375, -1.1973876953125, -1.02227783203125, -0.84716796875, -0.67205810546875, -0.4969482421875, -0.32183837890625, -0.146728515625, 0.02838134765625, 0.2034912109375, 0.37860107421875, 0.5537109375, 0.72882080078125, 0.9039306640625, 1.07904052734375, 1.254150390625, 1.42926025390625, 1.6043701171875, 1.77947998046875, 1.95458984375, 2.12969970703125, 2.3048095703125, 2.47991943359375, 2.655029296875, 2.83013916015625, 3.0052490234375, 3.18035888671875, 3.35546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 13.0, 22.0, 121.0, 231.0, 295.0, 189.0, 71.0, 27.0, 12.0, 4.0, 3.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.39697265625, -26.69879913330078, -26.000627517700195, -25.302453994750977, -24.604280471801758, -23.906108856201172, -23.207935333251953, -22.509761810302734, -21.811588287353516, -21.113414764404297, -20.41524314880371, -19.717069625854492, -19.018896102905273, -18.320724487304688, -17.62255096435547, -16.92437744140625, -16.226205825805664, -15.528033256530762, -14.829859733581543, -14.13168716430664, -13.433513641357422, -12.73534107208252, -12.037168502807617, -11.338994979858398, -10.640822410583496, -9.942649841308594, -9.244476318359375, -8.546303749084473, -7.848130702972412, -7.149957656860352, -6.451785087585449, -5.753612041473389, -5.055438995361328, -4.357265949249268, -3.659093141555786, -2.9609203338623047, -2.262747287750244, -1.5645742416381836, -0.8664016723632812, -0.1682286262512207, 0.5299444198608398, 1.2281173467636108, 1.9262902736663818, 2.6244630813598633, 3.322636127471924, 4.020809173583984, 4.718981742858887, 5.417154788970947, 6.115327835083008, 6.813500881195068, 7.511673927307129, 8.209846496582031, 8.90802001953125, 9.606192588806152, 10.304365158081055, 11.002538681030273, 11.700711250305176, 12.398883819580078, 13.097057342529297, 13.7952299118042, 14.493402481079102, 15.19157600402832, 15.889748573303223, 16.587921142578125, 17.286094665527344]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 19.0, 26.0, 34.0, 53.0, 73.0, 114.0, 94.0, 112.0, 124.0, 88.0, 86.0, 53.0, 30.0, 32.0, 17.0, 2.0, 5.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.823339462280273, -27.137771606445312, -26.45220184326172, -25.766632080078125, -25.081064224243164, -24.395496368408203, -23.70992660522461, -23.024356842041016, -22.338788986206055, -21.653221130371094, -20.9676513671875, -20.282081604003906, -19.596513748168945, -18.910945892333984, -18.22537612915039, -17.539806365966797, -16.854238510131836, -16.168670654296875, -15.483100891113281, -14.797532081604004, -14.111963272094727, -13.42639446258545, -12.740825653076172, -12.055256843566895, -11.369688034057617, -10.68411922454834, -9.998550415039062, -9.312981605529785, -8.627412796020508, -7.9418439865112305, -7.256275177001953, -6.570706367492676, -5.885139465332031, -5.199570655822754, -4.514001846313477, -3.828433036804199, -3.142864227294922, -2.4572954177856445, -1.7717266082763672, -1.0861577987670898, -0.4005889892578125, 0.28497982025146484, 0.9705486297607422, 1.6561174392700195, 2.341686248779297, 3.027255058288574, 3.7128238677978516, 4.398392677307129, 5.083961486816406, 5.769530296325684, 6.455099105834961, 7.140667915344238, 7.826236724853516, 8.511805534362793, 9.19737434387207, 9.882943153381348, 10.568511962890625, 11.254080772399902, 11.93964958190918, 12.625218391418457, 13.310787200927734, 13.996356010437012, 14.681924819946289, 15.367493629455566, 16.053062438964844]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 2.0, 5.0, 8.0, 8.0, 8.0, 4.0, 9.0, 8.0, 13.0, 21.0, 18.0, 21.0, 53.0, 51.0, 73.0, 134.0, 281.0, 560.0, 1184.0, 3561.0, 25892.0, 4085823.0, 67532.0, 5597.0, 1677.0, 763.0, 382.0, 216.0, 129.0, 89.0, 55.0, 45.0, 21.0, 15.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.7890625, -11.52496337890625, -11.2608642578125, -10.99676513671875, -10.732666015625, -10.46856689453125, -10.2044677734375, -9.94036865234375, -9.67626953125, -9.41217041015625, -9.1480712890625, -8.88397216796875, -8.619873046875, -8.35577392578125, -8.0916748046875, -7.82757568359375, -7.5634765625, -7.29937744140625, -7.0352783203125, -6.77117919921875, -6.507080078125, -6.24298095703125, -5.9788818359375, -5.71478271484375, -5.45068359375, -5.18658447265625, -4.9224853515625, -4.65838623046875, -4.394287109375, -4.13018798828125, -3.8660888671875, -3.60198974609375, -3.337890625, -3.07379150390625, -2.8096923828125, -2.54559326171875, -2.281494140625, -2.01739501953125, -1.7532958984375, -1.48919677734375, -1.22509765625, -0.96099853515625, -0.6968994140625, -0.43280029296875, -0.168701171875, 0.09539794921875, 0.3594970703125, 0.62359619140625, 0.8876953125, 1.15179443359375, 1.4158935546875, 1.67999267578125, 1.944091796875, 2.20819091796875, 2.4722900390625, 2.73638916015625, 3.00048828125, 3.26458740234375, 3.5286865234375, 3.79278564453125, 4.056884765625, 4.32098388671875, 4.5850830078125, 4.84918212890625, 5.11328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 8.0, 18.0, 27.0, 61.0, 176.0, 269.0, 253.0, 99.0, 35.0, 10.0, 12.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.87548828125, -0.8559226989746094, -0.8363571166992188, -0.8167915344238281, -0.7972259521484375, -0.7776603698730469, -0.7580947875976562, -0.7385292053222656, -0.718963623046875, -0.6993980407714844, -0.6798324584960938, -0.6602668762207031, -0.6407012939453125, -0.6211357116699219, -0.6015701293945312, -0.5820045471191406, -0.56243896484375, -0.5428733825683594, -0.5233078002929688, -0.5037422180175781, -0.4841766357421875, -0.4646110534667969, -0.44504547119140625, -0.4254798889160156, -0.405914306640625, -0.3863487243652344, -0.36678314208984375, -0.3472175598144531, -0.3276519775390625, -0.3080863952636719, -0.28852081298828125, -0.2689552307128906, -0.2493896484375, -0.22982406616210938, -0.21025848388671875, -0.19069290161132812, -0.1711273193359375, -0.15156173706054688, -0.13199615478515625, -0.11243057250976562, -0.092864990234375, -0.07329940795898438, -0.05373382568359375, -0.034168243408203125, -0.0146026611328125, 0.004962921142578125, 0.02452850341796875, 0.044094085693359375, 0.06365966796875, 0.08322525024414062, 0.10279083251953125, 0.12235641479492188, 0.1419219970703125, 0.16148757934570312, 0.18105316162109375, 0.20061874389648438, 0.220184326171875, 0.23974990844726562, 0.25931549072265625, 0.2788810729980469, 0.2984466552734375, 0.3180122375488281, 0.33757781982421875, 0.3571434020996094, 0.376708984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 6.0, 17.0, 21.0, 38.0, 83.0, 280.0, 1428.0, 23755.0, 4152840.0, 14265.0, 1150.0, 245.0, 76.0, 43.0, 16.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5703125, -10.1986083984375, -9.826904296875, -9.4552001953125, -9.08349609375, -8.7117919921875, -8.340087890625, -7.9683837890625, -7.5966796875, -7.2249755859375, -6.853271484375, -6.4815673828125, -6.10986328125, -5.7381591796875, -5.366455078125, -4.9947509765625, -4.623046875, -4.2513427734375, -3.879638671875, -3.5079345703125, -3.13623046875, -2.7645263671875, -2.392822265625, -2.0211181640625, -1.6494140625, -1.2777099609375, -0.906005859375, -0.5343017578125, -0.16259765625, 0.2091064453125, 0.580810546875, 0.9525146484375, 1.32421875, 1.6959228515625, 2.067626953125, 2.4393310546875, 2.81103515625, 3.1827392578125, 3.554443359375, 3.9261474609375, 4.2978515625, 4.6695556640625, 5.041259765625, 5.4129638671875, 5.78466796875, 6.1563720703125, 6.528076171875, 6.8997802734375, 7.271484375, 7.6431884765625, 8.014892578125, 8.3865966796875, 8.75830078125, 9.1300048828125, 9.501708984375, 9.8734130859375, 10.2451171875, 10.6168212890625, 10.988525390625, 11.3602294921875, 11.73193359375, 12.1036376953125, 12.475341796875, 12.8470458984375, 13.21875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 2.0, 7.0, 11.0, 27.0, 52.0, 109.0, 424.0, 2382.0, 696.0, 193.0, 73.0, 32.0, 15.0, 17.0, 12.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.9786148071289062, -0.9503936767578125, -0.9221725463867188, -0.893951416015625, -0.8657302856445312, -0.8375091552734375, -0.8092880249023438, -0.78106689453125, -0.7528457641601562, -0.7246246337890625, -0.6964035034179688, -0.668182373046875, -0.6399612426757812, -0.6117401123046875, -0.5835189819335938, -0.5552978515625, -0.5270767211914062, -0.4988555908203125, -0.47063446044921875, -0.442413330078125, -0.41419219970703125, -0.3859710693359375, -0.35774993896484375, -0.32952880859375, -0.30130767822265625, -0.2730865478515625, -0.24486541748046875, -0.216644287109375, -0.18842315673828125, -0.1602020263671875, -0.13198089599609375, -0.103759765625, -0.07553863525390625, -0.0473175048828125, -0.01909637451171875, 0.009124755859375, 0.03734588623046875, 0.0655670166015625, 0.09378814697265625, 0.12200927734375, 0.15023040771484375, 0.1784515380859375, 0.20667266845703125, 0.234893798828125, 0.26311492919921875, 0.2913360595703125, 0.31955718994140625, 0.3477783203125, 0.37599945068359375, 0.4042205810546875, 0.43244171142578125, 0.460662841796875, 0.48888397216796875, 0.5171051025390625, 0.5453262329101562, 0.57354736328125, 0.6017684936523438, 0.6299896240234375, 0.6582107543945312, 0.686431884765625, 0.7146530151367188, 0.7428741455078125, 0.7710952758789062, 0.79931640625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 10.0, 32.0, 89.0, 270.0, 349.0, 174.0, 50.0, 11.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.939841270446777, -5.771453857421875, -5.603066444396973, -5.4346795082092285, -5.266292095184326, -5.097904682159424, -4.92951774597168, -4.761130332946777, -4.592742919921875, -4.424355506896973, -4.25596809387207, -4.087581157684326, -3.919193744659424, -3.7508063316345215, -3.5824191570281982, -3.414031982421875, -3.2456445693969727, -3.0772571563720703, -2.908869981765747, -2.740482807159424, -2.5720953941345215, -2.403707981109619, -2.235320806503296, -2.0669336318969727, -1.8985462188720703, -1.7301589250564575, -1.5617716312408447, -1.393384337425232, -1.2249970436096191, -1.0566097497940063, -0.8882224559783936, -0.7198351621627808, -0.5514483451843262, -0.3830610513687134, -0.21467375755310059, -0.04628646373748779, 0.122100830078125, 0.2904881238937378, 0.4588754177093506, 0.6272627115249634, 0.7956500053405762, 0.964037299156189, 1.1324245929718018, 1.3008118867874146, 1.4691991806030273, 1.6375864744186401, 1.805973768234253, 1.9743610620498657, 2.1427483558654785, 2.311135768890381, 2.479522943496704, 2.6479101181030273, 2.8162975311279297, 2.984684944152832, 3.1530721187591553, 3.3214592933654785, 3.489846706390381, 3.658234119415283, 3.8266212940216064, 3.9950084686279297, 4.163395881652832, 4.331783294677734, 4.500170707702637, 4.668557643890381, 4.836945056915283]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 10.0, 28.0, 52.0, 115.0, 174.0, 227.0, 183.0, 129.0, 56.0, 13.0, 10.0, 8.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7335176467895508, -1.5246598720550537, -1.3158020973205566, -1.1069444417953491, -0.898086667060852, -0.689228892326355, -0.48037123680114746, -0.2715134620666504, -0.06265568733215332, 0.14620205760002136, 0.35505980253219604, 0.5639175176620483, 0.7727752923965454, 0.9816330671310425, 1.19049072265625, 1.399348497390747, 1.6082062721252441, 1.8170640468597412, 2.0259218215942383, 2.2347793579101562, 2.4436373710632324, 2.6524949073791504, 2.8613526821136475, 3.0702104568481445, 3.2790682315826416, 3.4879260063171387, 3.6967837810516357, 3.905641555786133, 4.114499092102051, 4.323357105255127, 4.532214641571045, 4.741072654724121, 4.949930191040039, 5.158787727355957, 5.367645740509033, 5.576503276824951, 5.785361289978027, 5.994218826293945, 6.203076362609863, 6.4119343757629395, 6.620792388916016, 6.829649925231934, 7.03850793838501, 7.247365474700928, 7.456223487854004, 7.665081024169922, 7.87393856048584, 8.082796096801758, 8.291654586791992, 8.50051212310791, 8.709369659423828, 8.918228149414062, 9.12708568572998, 9.335943222045898, 9.544800758361816, 9.753658294677734, 9.962515830993652, 10.17137336730957, 10.380230903625488, 10.589089393615723, 10.79794692993164, 11.006804466247559, 11.215662002563477, 11.424520492553711, 11.633378028869629]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 7.0, 2.0, 5.0, 4.0, 6.0, 6.0, 11.0, 16.0, 16.0, 18.0, 31.0, 38.0, 65.0, 79.0, 124.0, 191.0, 296.0, 500.0, 793.0, 1591.0, 3519.0, 10412.0, 51098.0, 534294.0, 392096.0, 38440.0, 8526.0, 2977.0, 1379.0, 742.0, 455.0, 279.0, 167.0, 104.0, 69.0, 49.0, 29.0, 32.0, 32.0, 23.0, 8.0, 6.0, 5.0, 6.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.5078125, -2.42926025390625, -2.3507080078125, -2.27215576171875, -2.193603515625, -2.11505126953125, -2.0364990234375, -1.95794677734375, -1.87939453125, -1.80084228515625, -1.7222900390625, -1.64373779296875, -1.565185546875, -1.48663330078125, -1.4080810546875, -1.32952880859375, -1.2509765625, -1.17242431640625, -1.0938720703125, -1.01531982421875, -0.936767578125, -0.85821533203125, -0.7796630859375, -0.70111083984375, -0.62255859375, -0.54400634765625, -0.4654541015625, -0.38690185546875, -0.308349609375, -0.22979736328125, -0.1512451171875, -0.07269287109375, 0.005859375, 0.08441162109375, 0.1629638671875, 0.24151611328125, 0.320068359375, 0.39862060546875, 0.4771728515625, 0.55572509765625, 0.63427734375, 0.71282958984375, 0.7913818359375, 0.86993408203125, 0.948486328125, 1.02703857421875, 1.1055908203125, 1.18414306640625, 1.2626953125, 1.34124755859375, 1.4197998046875, 1.49835205078125, 1.576904296875, 1.65545654296875, 1.7340087890625, 1.81256103515625, 1.89111328125, 1.96966552734375, 2.0482177734375, 2.12677001953125, 2.205322265625, 2.28387451171875, 2.3624267578125, 2.44097900390625, 2.51953125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 9.0, 7.0, 16.0, 28.0, 55.0, 100.0, 139.0, 179.0, 170.0, 113.0, 70.0, 30.0, 28.0, 12.0, 10.0, 2.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.320068359375, -0.3090095520019531, -0.29795074462890625, -0.2868919372558594, -0.2758331298828125, -0.2647743225097656, -0.25371551513671875, -0.24265670776367188, -0.231597900390625, -0.22053909301757812, -0.20948028564453125, -0.19842147827148438, -0.1873626708984375, -0.17630386352539062, -0.16524505615234375, -0.15418624877929688, -0.14312744140625, -0.13206863403320312, -0.12100982666015625, -0.10995101928710938, -0.0988922119140625, -0.08783340454101562, -0.07677459716796875, -0.06571578979492188, -0.054656982421875, -0.043598175048828125, -0.03253936767578125, -0.021480560302734375, -0.0104217529296875, 0.000637054443359375, 0.01169586181640625, 0.022754669189453125, 0.0338134765625, 0.044872283935546875, 0.05593109130859375, 0.06698989868164062, 0.0780487060546875, 0.08910751342773438, 0.10016632080078125, 0.11122512817382812, 0.122283935546875, 0.13334274291992188, 0.14440155029296875, 0.15546035766601562, 0.1665191650390625, 0.17757797241210938, 0.18863677978515625, 0.19969558715820312, 0.21075439453125, 0.22181320190429688, 0.23287200927734375, 0.24393081665039062, 0.2549896240234375, 0.2660484313964844, 0.27710723876953125, 0.2881660461425781, 0.299224853515625, 0.3102836608886719, 0.32134246826171875, 0.3324012756347656, 0.3434600830078125, 0.3545188903808594, 0.36557769775390625, 0.3766365051269531, 0.3876953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 5.0, 12.0, 11.0, 23.0, 23.0, 21.0, 36.0, 49.0, 87.0, 101.0, 161.0, 317.0, 525.0, 942.0, 2308.0, 7823.0, 40822.0, 265191.0, 561637.0, 137431.0, 22121.0, 5083.0, 1707.0, 830.0, 426.0, 265.0, 168.0, 110.0, 70.0, 66.0, 40.0, 38.0, 26.0, 15.0, 17.0, 9.0, 8.0, 6.0, 6.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.912109375, -1.846893310546875, -1.78167724609375, -1.716461181640625, -1.6512451171875, -1.586029052734375, -1.52081298828125, -1.455596923828125, -1.390380859375, -1.325164794921875, -1.25994873046875, -1.194732666015625, -1.1295166015625, -1.064300537109375, -0.99908447265625, -0.933868408203125, -0.86865234375, -0.803436279296875, -0.73822021484375, -0.673004150390625, -0.6077880859375, -0.542572021484375, -0.47735595703125, -0.412139892578125, -0.346923828125, -0.281707763671875, -0.21649169921875, -0.151275634765625, -0.0860595703125, -0.020843505859375, 0.04437255859375, 0.109588623046875, 0.1748046875, 0.240020751953125, 0.30523681640625, 0.370452880859375, 0.4356689453125, 0.500885009765625, 0.56610107421875, 0.631317138671875, 0.696533203125, 0.761749267578125, 0.82696533203125, 0.892181396484375, 0.9573974609375, 1.022613525390625, 1.08782958984375, 1.153045654296875, 1.21826171875, 1.283477783203125, 1.34869384765625, 1.413909912109375, 1.4791259765625, 1.544342041015625, 1.60955810546875, 1.674774169921875, 1.739990234375, 1.805206298828125, 1.87042236328125, 1.935638427734375, 2.0008544921875, 2.066070556640625, 2.13128662109375, 2.196502685546875, 2.26171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 5.0, 3.0, 8.0, 17.0, 19.0, 12.0, 13.0, 25.0, 15.0, 25.0, 25.0, 34.0, 38.0, 48.0, 39.0, 40.0, 45.0, 33.0, 47.0, 48.0, 39.0, 50.0, 47.0, 46.0, 36.0, 26.0, 39.0, 29.0, 16.0, 30.0, 14.0, 16.0, 16.0, 7.0, 9.0, 7.0, 4.0, 6.0, 4.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.056640625, -1.0231475830078125, -0.989654541015625, -0.9561614990234375, -0.92266845703125, -0.8891754150390625, -0.855682373046875, -0.8221893310546875, -0.7886962890625, -0.7552032470703125, -0.721710205078125, -0.6882171630859375, -0.65472412109375, -0.6212310791015625, -0.587738037109375, -0.5542449951171875, -0.520751953125, -0.4872589111328125, -0.453765869140625, -0.4202728271484375, -0.38677978515625, -0.3532867431640625, -0.319793701171875, -0.2863006591796875, -0.2528076171875, -0.2193145751953125, -0.185821533203125, -0.1523284912109375, -0.11883544921875, -0.0853424072265625, -0.051849365234375, -0.0183563232421875, 0.01513671875, 0.0486297607421875, 0.082122802734375, 0.1156158447265625, 0.14910888671875, 0.1826019287109375, 0.216094970703125, 0.2495880126953125, 0.2830810546875, 0.3165740966796875, 0.350067138671875, 0.3835601806640625, 0.41705322265625, 0.4505462646484375, 0.484039306640625, 0.5175323486328125, 0.551025390625, 0.5845184326171875, 0.618011474609375, 0.6515045166015625, 0.68499755859375, 0.7184906005859375, 0.751983642578125, 0.7854766845703125, 0.8189697265625, 0.8524627685546875, 0.885955810546875, 0.9194488525390625, 0.95294189453125, 0.9864349365234375, 1.019927978515625, 1.0534210205078125, 1.0869140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 2.0, 10.0, 12.0, 20.0, 16.0, 26.0, 39.0, 60.0, 97.0, 143.0, 259.0, 519.0, 986.0, 2334.0, 6189.0, 21529.0, 99424.0, 520360.0, 319345.0, 55766.0, 13636.0, 4284.0, 1664.0, 814.0, 370.0, 222.0, 137.0, 99.0, 53.0, 34.0, 27.0, 19.0, 11.0, 18.0, 3.0, 8.0, 3.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0270843505859375, -0.992645263671875, -0.9582061767578125, -0.92376708984375, -0.8893280029296875, -0.854888916015625, -0.8204498291015625, -0.7860107421875, -0.7515716552734375, -0.717132568359375, -0.6826934814453125, -0.64825439453125, -0.6138153076171875, -0.579376220703125, -0.5449371337890625, -0.510498046875, -0.4760589599609375, -0.441619873046875, -0.4071807861328125, -0.37274169921875, -0.3383026123046875, -0.303863525390625, -0.2694244384765625, -0.2349853515625, -0.2005462646484375, -0.166107177734375, -0.1316680908203125, -0.09722900390625, -0.0627899169921875, -0.028350830078125, 0.0060882568359375, 0.04052734375, 0.0749664306640625, 0.109405517578125, 0.1438446044921875, 0.17828369140625, 0.2127227783203125, 0.247161865234375, 0.2816009521484375, 0.3160400390625, 0.3504791259765625, 0.384918212890625, 0.4193572998046875, 0.45379638671875, 0.4882354736328125, 0.522674560546875, 0.5571136474609375, 0.591552734375, 0.6259918212890625, 0.660430908203125, 0.6948699951171875, 0.72930908203125, 0.7637481689453125, 0.798187255859375, 0.8326263427734375, 0.8670654296875, 0.9015045166015625, 0.935943603515625, 0.9703826904296875, 1.00482177734375, 1.0392608642578125, 1.073699951171875, 1.1081390380859375, 1.142578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 5.0, 8.0, 6.0, 9.0, 13.0, 17.0, 30.0, 20.0, 33.0, 42.0, 39.0, 55.0, 65.0, 82.0, 81.0, 63.0, 72.0, 62.0, 39.0, 49.0, 30.0, 23.0, 32.0, 14.0, 15.0, 11.0, 15.0, 12.0, 7.0, 7.0, 3.0, 6.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001093745231628418, -0.00010553840547800064, -0.00010170228779315948, -9.786617010831833e-05, -9.403005242347717e-05, -9.019393473863602e-05, -8.635781705379486e-05, -8.25216993689537e-05, -7.868558168411255e-05, -7.484946399927139e-05, -7.101334631443024e-05, -6.717722862958908e-05, -6.334111094474792e-05, -5.950499325990677e-05, -5.566887557506561e-05, -5.183275789022446e-05, -4.79966402053833e-05, -4.4160522520542145e-05, -4.032440483570099e-05, -3.648828715085983e-05, -3.265216946601868e-05, -2.881605178117752e-05, -2.4979934096336365e-05, -2.114381641149521e-05, -1.7307698726654053e-05, -1.3471581041812897e-05, -9.63546335697174e-06, -5.799345672130585e-06, -1.9632279872894287e-06, 1.8728896975517273e-06, 5.709007382392883e-06, 9.54512506723404e-06, 1.3381242752075195e-05, 1.721736043691635e-05, 2.1053478121757507e-05, 2.4889595806598663e-05, 2.872571349143982e-05, 3.2561831176280975e-05, 3.639794886112213e-05, 4.023406654596329e-05, 4.407018423080444e-05, 4.79063019156456e-05, 5.1742419600486755e-05, 5.557853728532791e-05, 5.941465497016907e-05, 6.325077265501022e-05, 6.708689033985138e-05, 7.092300802469254e-05, 7.475912570953369e-05, 7.859524339437485e-05, 8.2431361079216e-05, 8.626747876405716e-05, 9.010359644889832e-05, 9.393971413373947e-05, 9.777583181858063e-05, 0.00010161194950342178, 0.00010544806718826294, 0.0001092841848731041, 0.00011312030255794525, 0.00011695642024278641, 0.00012079253792762756, 0.00012462865561246872, 0.00012846477329730988, 0.00013230089098215103, 0.0001361370086669922]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 17.0, 18.0, 27.0, 39.0, 42.0, 81.0, 150.0, 234.0, 498.0, 1002.0, 2850.0, 11191.0, 66323.0, 587931.0, 330861.0, 36597.0, 6992.0, 2004.0, 794.0, 388.0, 188.0, 126.0, 74.0, 44.0, 23.0, 14.0, 8.0, 11.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.166015625, -1.11712646484375, -1.0682373046875, -1.01934814453125, -0.970458984375, -0.92156982421875, -0.8726806640625, -0.82379150390625, -0.77490234375, -0.72601318359375, -0.6771240234375, -0.62823486328125, -0.579345703125, -0.53045654296875, -0.4815673828125, -0.43267822265625, -0.3837890625, -0.33489990234375, -0.2860107421875, -0.23712158203125, -0.188232421875, -0.13934326171875, -0.0904541015625, -0.04156494140625, 0.00732421875, 0.05621337890625, 0.1051025390625, 0.15399169921875, 0.202880859375, 0.25177001953125, 0.3006591796875, 0.34954833984375, 0.3984375, 0.44732666015625, 0.4962158203125, 0.54510498046875, 0.593994140625, 0.64288330078125, 0.6917724609375, 0.74066162109375, 0.78955078125, 0.83843994140625, 0.8873291015625, 0.93621826171875, 0.985107421875, 1.03399658203125, 1.0828857421875, 1.13177490234375, 1.1806640625, 1.22955322265625, 1.2784423828125, 1.32733154296875, 1.376220703125, 1.42510986328125, 1.4739990234375, 1.52288818359375, 1.57177734375, 1.62066650390625, 1.6695556640625, 1.71844482421875, 1.767333984375, 1.81622314453125, 1.8651123046875, 1.91400146484375, 1.962890625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 2.0, 4.0, 6.0, 9.0, 15.0, 12.0, 15.0, 17.0, 25.0, 25.0, 44.0, 61.0, 69.0, 68.0, 90.0, 98.0, 82.0, 87.0, 61.0, 43.0, 43.0, 25.0, 29.0, 21.0, 14.0, 6.0, 6.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5087890625, -0.488006591796875, -0.46722412109375, -0.446441650390625, -0.4256591796875, -0.404876708984375, -0.38409423828125, -0.363311767578125, -0.342529296875, -0.321746826171875, -0.30096435546875, -0.280181884765625, -0.2593994140625, -0.238616943359375, -0.21783447265625, -0.197052001953125, -0.17626953125, -0.155487060546875, -0.13470458984375, -0.113922119140625, -0.0931396484375, -0.072357177734375, -0.05157470703125, -0.030792236328125, -0.010009765625, 0.010772705078125, 0.03155517578125, 0.052337646484375, 0.0731201171875, 0.093902587890625, 0.11468505859375, 0.135467529296875, 0.15625, 0.177032470703125, 0.19781494140625, 0.218597412109375, 0.2393798828125, 0.260162353515625, 0.28094482421875, 0.301727294921875, 0.322509765625, 0.343292236328125, 0.36407470703125, 0.384857177734375, 0.4056396484375, 0.426422119140625, 0.44720458984375, 0.467987060546875, 0.48876953125, 0.509552001953125, 0.53033447265625, 0.551116943359375, 0.5718994140625, 0.592681884765625, 0.61346435546875, 0.634246826171875, 0.655029296875, 0.675811767578125, 0.69659423828125, 0.717376708984375, 0.7381591796875, 0.758941650390625, 0.77972412109375, 0.800506591796875, 0.8212890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 9.0, 26.0, 116.0, 389.0, 349.0, 75.0, 23.0, 9.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.94568634033203, -44.026458740234375, -43.10723114013672, -42.18800354003906, -41.268775939941406, -40.34954833984375, -39.430320739746094, -38.51109313964844, -37.59186553955078, -36.672637939453125, -35.75341033935547, -34.83418273925781, -33.914955139160156, -32.9957275390625, -32.076499938964844, -31.15727424621582, -30.238048553466797, -29.31882095336914, -28.399593353271484, -27.480365753173828, -26.561138153076172, -25.641910552978516, -24.72268295288086, -23.803457260131836, -22.884227752685547, -21.96500015258789, -21.045772552490234, -20.126544952392578, -19.207317352294922, -18.288089752197266, -17.36886215209961, -16.449636459350586, -15.53040885925293, -14.611181259155273, -13.691953659057617, -12.772726058959961, -11.853499412536621, -10.934271812438965, -10.015044212341309, -9.095817565917969, -8.176589965820312, -7.257362365722656, -6.338135242462158, -5.418907642364502, -4.499680519104004, -3.5804529190063477, -2.6612253189086914, -1.7419981956481934, -0.8227701187133789, 0.09645730257034302, 1.015684723854065, 1.9349122047424316, 2.854139566421509, 3.773366928100586, 4.692594528198242, 5.61182165145874, 6.5310492515563965, 7.450276851654053, 8.36950397491455, 9.288731575012207, 10.207959175109863, 11.127185821533203, 12.04641342163086, 12.965641021728516, 13.884868621826172]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 10.0, 11.0, 7.0, 6.0, 19.0, 25.0, 36.0, 20.0, 36.0, 38.0, 41.0, 45.0, 65.0, 67.0, 49.0, 73.0, 51.0, 56.0, 52.0, 47.0, 50.0, 32.0, 34.0, 37.0, 19.0, 19.0, 15.0, 8.0, 10.0, 11.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.135098457336426, -7.786456108093262, -7.4378132820129395, -7.089170932769775, -6.740528106689453, -6.391885757446289, -6.043243408203125, -5.694601058959961, -5.345958232879639, -4.997315883636475, -4.648673057556152, -4.300030708312988, -3.951388120651245, -3.602745532989502, -3.254103183746338, -2.9054605960845947, -2.5568180084228516, -2.2081754207611084, -1.8595329523086548, -1.5108904838562012, -1.162247896194458, -0.8136053085327148, -0.4649629592895508, -0.11632037162780762, 0.23232221603393555, 0.5809647440910339, 0.9296072721481323, 1.278249740600586, 1.626892328262329, 1.9755349159240723, 2.3241772651672363, 2.6728198528289795, 3.0214614868164062, 3.3701040744781494, 3.7187466621398926, 4.067389011383057, 4.416031837463379, 4.764674186706543, 5.113316535949707, 5.461958885192871, 5.810601711273193, 6.159244060516357, 6.50788688659668, 6.856529235839844, 7.205171585083008, 7.55381441116333, 7.902456760406494, 8.251099586486816, 8.59974193572998, 8.948384284973145, 9.297026634216309, 9.645669937133789, 9.994312286376953, 10.342954635620117, 10.691596984863281, 11.040239334106445, 11.38888168334961, 11.737524032592773, 12.086166381835938, 12.434808731079102, 12.783452033996582, 13.132094383239746, 13.48073673248291, 13.829379081726074, 14.178022384643555]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 15.0, 18.0, 30.0, 40.0, 78.0, 175.0, 470.0, 2148.0, 78441.0, 4104954.0, 6215.0, 943.0, 356.0, 151.0, 93.0, 62.0, 38.0, 14.0, 10.0, 7.0, 4.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.0625, -11.6630859375, -11.263671875, -10.8642578125, -10.46484375, -10.0654296875, -9.666015625, -9.2666015625, -8.8671875, -8.4677734375, -8.068359375, -7.6689453125, -7.26953125, -6.8701171875, -6.470703125, -6.0712890625, -5.671875, -5.2724609375, -4.873046875, -4.4736328125, -4.07421875, -3.6748046875, -3.275390625, -2.8759765625, -2.4765625, -2.0771484375, -1.677734375, -1.2783203125, -0.87890625, -0.4794921875, -0.080078125, 0.3193359375, 0.71875, 1.1181640625, 1.517578125, 1.9169921875, 2.31640625, 2.7158203125, 3.115234375, 3.5146484375, 3.9140625, 4.3134765625, 4.712890625, 5.1123046875, 5.51171875, 5.9111328125, 6.310546875, 6.7099609375, 7.109375, 7.5087890625, 7.908203125, 8.3076171875, 8.70703125, 9.1064453125, 9.505859375, 9.9052734375, 10.3046875, 10.7041015625, 11.103515625, 11.5029296875, 11.90234375, 12.3017578125, 12.701171875, 13.1005859375, 13.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 4.0, 10.0, 19.0, 16.0, 25.0, 48.0, 82.0, 95.0, 120.0, 134.0, 121.0, 96.0, 73.0, 58.0, 33.0, 22.0, 15.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.399169921875, -0.3857460021972656, -0.37232208251953125, -0.3588981628417969, -0.3454742431640625, -0.3320503234863281, -0.31862640380859375, -0.3052024841308594, -0.291778564453125, -0.2783546447753906, -0.26493072509765625, -0.2515068054199219, -0.2380828857421875, -0.22465896606445312, -0.21123504638671875, -0.19781112670898438, -0.18438720703125, -0.17096328735351562, -0.15753936767578125, -0.14411544799804688, -0.1306915283203125, -0.11726760864257812, -0.10384368896484375, -0.09041976928710938, -0.076995849609375, -0.06357192993164062, -0.05014801025390625, -0.036724090576171875, -0.0233001708984375, -0.009876251220703125, 0.00354766845703125, 0.016971588134765625, 0.0303955078125, 0.043819427490234375, 0.05724334716796875, 0.07066726684570312, 0.0840911865234375, 0.09751510620117188, 0.11093902587890625, 0.12436294555664062, 0.137786865234375, 0.15121078491210938, 0.16463470458984375, 0.17805862426757812, 0.1914825439453125, 0.20490646362304688, 0.21833038330078125, 0.23175430297851562, 0.24517822265625, 0.2586021423339844, 0.27202606201171875, 0.2854499816894531, 0.2988739013671875, 0.3122978210449219, 0.32572174072265625, 0.3391456604003906, 0.352569580078125, 0.3659934997558594, 0.37941741943359375, 0.3928413391113281, 0.4062652587890625, 0.4196891784667969, 0.43311309814453125, 0.4465370178222656, 0.4599609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 13.0, 12.0, 17.0, 27.0, 33.0, 33.0, 58.0, 76.0, 100.0, 159.0, 244.0, 454.0, 797.0, 1526.0, 3236.0, 8938.0, 29670.0, 156473.0, 3162542.0, 728063.0, 73797.0, 17285.0, 5738.0, 2325.0, 1095.0, 594.0, 329.0, 224.0, 145.0, 82.0, 51.0, 38.0, 27.0, 13.0, 19.0, 9.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0], "bins": [-1.9052734375, -1.8488922119140625, -1.792510986328125, -1.7361297607421875, -1.67974853515625, -1.6233673095703125, -1.566986083984375, -1.5106048583984375, -1.4542236328125, -1.3978424072265625, -1.341461181640625, -1.2850799560546875, -1.22869873046875, -1.1723175048828125, -1.115936279296875, -1.0595550537109375, -1.003173828125, -0.9467926025390625, -0.890411376953125, -0.8340301513671875, -0.77764892578125, -0.7212677001953125, -0.664886474609375, -0.6085052490234375, -0.5521240234375, -0.4957427978515625, -0.439361572265625, -0.3829803466796875, -0.32659912109375, -0.2702178955078125, -0.213836669921875, -0.1574554443359375, -0.10107421875, -0.0446929931640625, 0.011688232421875, 0.0680694580078125, 0.12445068359375, 0.1808319091796875, 0.237213134765625, 0.2935943603515625, 0.3499755859375, 0.4063568115234375, 0.462738037109375, 0.5191192626953125, 0.57550048828125, 0.6318817138671875, 0.688262939453125, 0.7446441650390625, 0.801025390625, 0.8574066162109375, 0.913787841796875, 0.9701690673828125, 1.02655029296875, 1.0829315185546875, 1.139312744140625, 1.1956939697265625, 1.2520751953125, 1.3084564208984375, 1.364837646484375, 1.4212188720703125, 1.47760009765625, 1.5339813232421875, 1.590362548828125, 1.6467437744140625, 1.703125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 10.0, 10.0, 14.0, 18.0, 24.0, 47.0, 63.0, 98.0, 187.0, 406.0, 1614.0, 841.0, 330.0, 158.0, 72.0, 52.0, 41.0, 23.0, 23.0, 12.0, 4.0, 9.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5942420959472656, -0.5771560668945312, -0.5600700378417969, -0.5429840087890625, -0.5258979797363281, -0.5088119506835938, -0.4917259216308594, -0.474639892578125, -0.4575538635253906, -0.44046783447265625, -0.4233818054199219, -0.4062957763671875, -0.3892097473144531, -0.37212371826171875, -0.3550376892089844, -0.33795166015625, -0.3208656311035156, -0.30377960205078125, -0.2866935729980469, -0.2696075439453125, -0.2525215148925781, -0.23543548583984375, -0.21834945678710938, -0.201263427734375, -0.18417739868164062, -0.16709136962890625, -0.15000534057617188, -0.1329193115234375, -0.11583328247070312, -0.09874725341796875, -0.08166122436523438, -0.0645751953125, -0.047489166259765625, -0.03040313720703125, -0.013317108154296875, 0.0037689208984375, 0.020854949951171875, 0.03794097900390625, 0.055027008056640625, 0.072113037109375, 0.08919906616210938, 0.10628509521484375, 0.12337112426757812, 0.1404571533203125, 0.15754318237304688, 0.17462921142578125, 0.19171524047851562, 0.20880126953125, 0.22588729858398438, 0.24297332763671875, 0.2600593566894531, 0.2771453857421875, 0.2942314147949219, 0.31131744384765625, 0.3284034729003906, 0.345489501953125, 0.3625755310058594, 0.37966156005859375, 0.3967475891113281, 0.4138336181640625, 0.4309196472167969, 0.44800567626953125, 0.4650917053222656, 0.482177734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 15.0, 53.0, 139.0, 278.0, 287.0, 161.0, 42.0, 12.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.475436210632324, -6.31697940826416, -6.158522129058838, -6.000065326690674, -5.84160852432251, -5.6831512451171875, -5.524694442749023, -5.366237640380859, -5.207780361175537, -5.049323558807373, -4.890866279602051, -4.732409477233887, -4.573952674865723, -4.4154953956604, -4.257038593292236, -4.098581314086914, -3.940124750137329, -3.781667709350586, -3.623210906982422, -3.4647538661956787, -3.3062968254089355, -3.1478400230407715, -2.9893829822540283, -2.830925941467285, -2.672469139099121, -2.514012098312378, -2.355555295944214, -2.1970982551574707, -2.0386412143707275, -1.880184292793274, -1.7217273712158203, -1.5632703304290771, -1.404813289642334, -1.2463563680648804, -1.0878993272781372, -0.9294424057006836, -0.7709854245185852, -0.6125284433364868, -0.4540715217590332, -0.29561448097229004, -0.13715755939483643, 0.02129940688610077, 0.17975637316703796, 0.33821332454681396, 0.49667030572891235, 0.6551272869110107, 0.8135842084884644, 0.9720412492752075, 1.1304981708526611, 1.2889550924301147, 1.447412133216858, 1.6058690547943115, 1.7643260955810547, 1.9227830171585083, 2.081239938735962, 2.239696979522705, 2.398153781890869, 2.5566108226776123, 2.7150676250457764, 2.8735246658325195, 3.0319817066192627, 3.190438747406006, 3.34889554977417, 3.507352590560913, 3.6658096313476562]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 10.0, 16.0, 17.0, 25.0, 35.0, 31.0, 45.0, 38.0, 40.0, 66.0, 55.0, 52.0, 61.0, 49.0, 66.0, 60.0, 48.0, 56.0, 40.0, 44.0, 36.0, 27.0, 12.0, 17.0, 14.0, 10.0, 12.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.499537944793701, -2.430980682373047, -2.3624234199523926, -2.2938661575317383, -2.225308895111084, -2.1567516326904297, -2.0881943702697754, -2.019637107849121, -1.9510798454284668, -1.8825225830078125, -1.8139653205871582, -1.745408058166504, -1.6768507957458496, -1.6082935333251953, -1.539736270904541, -1.4711790084838867, -1.4026216268539429, -1.3340643644332886, -1.2655071020126343, -1.19694983959198, -1.1283925771713257, -1.0598353147506714, -0.9912779927253723, -0.922720730304718, -0.8541634678840637, -0.7856062054634094, -0.7170489430427551, -0.648491621017456, -0.5799343585968018, -0.5113770961761475, -0.44281983375549316, -0.37426257133483887, -0.305705189704895, -0.23714792728424072, -0.16859064996242523, -0.10003337264060974, -0.031476110219955444, 0.03708115220069885, 0.10563844442367554, 0.17419570684432983, 0.24275296926498413, 0.3113102316856384, 0.3798674941062927, 0.4484247863292694, 0.5169820785522461, 0.5855393409729004, 0.6540966033935547, 0.722653865814209, 0.7912111282348633, 0.8597683906555176, 0.9283256530761719, 0.9968829154968262, 1.0654401779174805, 1.1339974403381348, 1.202554702758789, 1.2711119651794434, 1.3396692276000977, 1.408226490020752, 1.4767837524414062, 1.5453410148620605, 1.6138982772827148, 1.6824555397033691, 1.7510128021240234, 1.8195700645446777, 1.8881274461746216]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 2.0, 9.0, 5.0, 4.0, 17.0, 20.0, 29.0, 39.0, 43.0, 91.0, 180.0, 246.0, 443.0, 830.0, 1595.0, 3502.0, 10636.0, 68426.0, 559055.0, 354436.0, 35784.0, 7289.0, 2838.0, 1346.0, 706.0, 359.0, 235.0, 114.0, 81.0, 37.0, 38.0, 24.0, 29.0, 11.0, 11.0, 7.0, 4.0, 4.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0], "bins": [-2.345703125, -2.272064208984375, -2.19842529296875, -2.124786376953125, -2.0511474609375, -1.977508544921875, -1.90386962890625, -1.830230712890625, -1.756591796875, -1.682952880859375, -1.60931396484375, -1.535675048828125, -1.4620361328125, -1.388397216796875, -1.31475830078125, -1.241119384765625, -1.16748046875, -1.093841552734375, -1.02020263671875, -0.946563720703125, -0.8729248046875, -0.799285888671875, -0.72564697265625, -0.652008056640625, -0.578369140625, -0.504730224609375, -0.43109130859375, -0.357452392578125, -0.2838134765625, -0.210174560546875, -0.13653564453125, -0.062896728515625, 0.0107421875, 0.084381103515625, 0.15802001953125, 0.231658935546875, 0.3052978515625, 0.378936767578125, 0.45257568359375, 0.526214599609375, 0.599853515625, 0.673492431640625, 0.74713134765625, 0.820770263671875, 0.8944091796875, 0.968048095703125, 1.04168701171875, 1.115325927734375, 1.18896484375, 1.262603759765625, 1.33624267578125, 1.409881591796875, 1.4835205078125, 1.557159423828125, 1.63079833984375, 1.704437255859375, 1.778076171875, 1.851715087890625, 1.92535400390625, 1.998992919921875, 2.0726318359375, 2.146270751953125, 2.21990966796875, 2.293548583984375, 2.3671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 8.0, 8.0, 10.0, 13.0, 33.0, 47.0, 74.0, 84.0, 109.0, 147.0, 107.0, 105.0, 91.0, 59.0, 30.0, 32.0, 10.0, 9.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.358642578125, -0.34581756591796875, -0.3329925537109375, -0.32016754150390625, -0.307342529296875, -0.29451751708984375, -0.2816925048828125, -0.26886749267578125, -0.25604248046875, -0.24321746826171875, -0.2303924560546875, -0.21756744384765625, -0.204742431640625, -0.19191741943359375, -0.1790924072265625, -0.16626739501953125, -0.1534423828125, -0.14061737060546875, -0.1277923583984375, -0.11496734619140625, -0.102142333984375, -0.08931732177734375, -0.0764923095703125, -0.06366729736328125, -0.05084228515625, -0.03801727294921875, -0.0251922607421875, -0.01236724853515625, 0.000457763671875, 0.01328277587890625, 0.0261077880859375, 0.03893280029296875, 0.0517578125, 0.06458282470703125, 0.0774078369140625, 0.09023284912109375, 0.103057861328125, 0.11588287353515625, 0.1287078857421875, 0.14153289794921875, 0.15435791015625, 0.16718292236328125, 0.1800079345703125, 0.19283294677734375, 0.205657958984375, 0.21848297119140625, 0.2313079833984375, 0.24413299560546875, 0.2569580078125, 0.26978302001953125, 0.2826080322265625, 0.29543304443359375, 0.308258056640625, 0.32108306884765625, 0.3339080810546875, 0.34673309326171875, 0.35955810546875, 0.37238311767578125, 0.3852081298828125, 0.39803314208984375, 0.410858154296875, 0.42368316650390625, 0.4365081787109375, 0.44933319091796875, 0.462158203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 6.0, 4.0, 10.0, 9.0, 9.0, 16.0, 15.0, 23.0, 32.0, 59.0, 90.0, 103.0, 167.0, 238.0, 357.0, 590.0, 1035.0, 2226.0, 6594.0, 27942.0, 145500.0, 475004.0, 304688.0, 63314.0, 13048.0, 3795.0, 1431.0, 790.0, 502.0, 317.0, 170.0, 138.0, 81.0, 75.0, 43.0, 34.0, 27.0, 12.0, 15.0, 13.0, 13.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4912109375, -1.437469482421875, -1.38372802734375, -1.329986572265625, -1.2762451171875, -1.222503662109375, -1.16876220703125, -1.115020751953125, -1.061279296875, -1.007537841796875, -0.95379638671875, -0.900054931640625, -0.8463134765625, -0.792572021484375, -0.73883056640625, -0.685089111328125, -0.63134765625, -0.577606201171875, -0.52386474609375, -0.470123291015625, -0.4163818359375, -0.362640380859375, -0.30889892578125, -0.255157470703125, -0.201416015625, -0.147674560546875, -0.09393310546875, -0.040191650390625, 0.0135498046875, 0.067291259765625, 0.12103271484375, 0.174774169921875, 0.228515625, 0.282257080078125, 0.33599853515625, 0.389739990234375, 0.4434814453125, 0.497222900390625, 0.55096435546875, 0.604705810546875, 0.658447265625, 0.712188720703125, 0.76593017578125, 0.819671630859375, 0.8734130859375, 0.927154541015625, 0.98089599609375, 1.034637451171875, 1.08837890625, 1.142120361328125, 1.19586181640625, 1.249603271484375, 1.3033447265625, 1.357086181640625, 1.41082763671875, 1.464569091796875, 1.518310546875, 1.572052001953125, 1.62579345703125, 1.679534912109375, 1.7332763671875, 1.787017822265625, 1.84075927734375, 1.894500732421875, 1.9482421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 10.0, 8.0, 10.0, 8.0, 13.0, 14.0, 26.0, 16.0, 29.0, 15.0, 27.0, 25.0, 29.0, 38.0, 33.0, 33.0, 33.0, 35.0, 41.0, 41.0, 42.0, 46.0, 48.0, 41.0, 35.0, 24.0, 31.0, 31.0, 38.0, 28.0, 22.0, 22.0, 17.0, 23.0, 15.0, 12.0, 9.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.109375, -1.0706634521484375, -1.031951904296875, -0.9932403564453125, -0.95452880859375, -0.9158172607421875, -0.877105712890625, -0.8383941650390625, -0.7996826171875, -0.7609710693359375, -0.722259521484375, -0.6835479736328125, -0.64483642578125, -0.6061248779296875, -0.567413330078125, -0.5287017822265625, -0.489990234375, -0.4512786865234375, -0.412567138671875, -0.3738555908203125, -0.33514404296875, -0.2964324951171875, -0.257720947265625, -0.2190093994140625, -0.1802978515625, -0.1415863037109375, -0.102874755859375, -0.0641632080078125, -0.02545166015625, 0.0132598876953125, 0.051971435546875, 0.0906829833984375, 0.12939453125, 0.1681060791015625, 0.206817626953125, 0.2455291748046875, 0.28424072265625, 0.3229522705078125, 0.361663818359375, 0.4003753662109375, 0.4390869140625, 0.4777984619140625, 0.516510009765625, 0.5552215576171875, 0.59393310546875, 0.6326446533203125, 0.671356201171875, 0.7100677490234375, 0.748779296875, 0.7874908447265625, 0.826202392578125, 0.8649139404296875, 0.90362548828125, 0.9423370361328125, 0.981048583984375, 1.0197601318359375, 1.0584716796875, 1.0971832275390625, 1.135894775390625, 1.1746063232421875, 1.21331787109375, 1.2520294189453125, 1.290740966796875, 1.3294525146484375, 1.3681640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 6.0, 11.0, 14.0, 32.0, 72.0, 153.0, 391.0, 1272.0, 6235.0, 57561.0, 646589.0, 307678.0, 23818.0, 3397.0, 793.0, 306.0, 114.0, 63.0, 19.0, 11.0, 5.0, 6.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3212890625, -1.2769775390625, -1.232666015625, -1.1883544921875, -1.14404296875, -1.0997314453125, -1.055419921875, -1.0111083984375, -0.966796875, -0.9224853515625, -0.878173828125, -0.8338623046875, -0.78955078125, -0.7452392578125, -0.700927734375, -0.6566162109375, -0.6123046875, -0.5679931640625, -0.523681640625, -0.4793701171875, -0.43505859375, -0.3907470703125, -0.346435546875, -0.3021240234375, -0.2578125, -0.2135009765625, -0.169189453125, -0.1248779296875, -0.08056640625, -0.0362548828125, 0.008056640625, 0.0523681640625, 0.0966796875, 0.1409912109375, 0.185302734375, 0.2296142578125, 0.27392578125, 0.3182373046875, 0.362548828125, 0.4068603515625, 0.451171875, 0.4954833984375, 0.539794921875, 0.5841064453125, 0.62841796875, 0.6727294921875, 0.717041015625, 0.7613525390625, 0.8056640625, 0.8499755859375, 0.894287109375, 0.9385986328125, 0.98291015625, 1.0272216796875, 1.071533203125, 1.1158447265625, 1.16015625, 1.2044677734375, 1.248779296875, 1.2930908203125, 1.33740234375, 1.3817138671875, 1.426025390625, 1.4703369140625, 1.5146484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 8.0, 10.0, 11.0, 14.0, 15.0, 21.0, 16.0, 31.0, 31.0, 40.0, 45.0, 58.0, 64.0, 85.0, 70.0, 83.0, 78.0, 57.0, 37.0, 40.0, 32.0, 25.0, 26.0, 14.0, 12.0, 13.0, 15.0, 5.0, 9.0, 4.0, 1.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010877847671508789, -0.00010539684444665909, -0.00010201521217823029, -9.863357990980148e-05, -9.525194764137268e-05, -9.187031537294388e-05, -8.848868310451508e-05, -8.510705083608627e-05, -8.172541856765747e-05, -7.834378629922867e-05, -7.496215403079987e-05, -7.158052176237106e-05, -6.819888949394226e-05, -6.481725722551346e-05, -6.143562495708466e-05, -5.805399268865585e-05, -5.467236042022705e-05, -5.129072815179825e-05, -4.7909095883369446e-05, -4.452746361494064e-05, -4.114583134651184e-05, -3.776419907808304e-05, -3.4382566809654236e-05, -3.100093454122543e-05, -2.761930227279663e-05, -2.423767000436783e-05, -2.0856037735939026e-05, -1.7474405467510223e-05, -1.4092773199081421e-05, -1.0711140930652618e-05, -7.329508662223816e-06, -3.9478763937950134e-06, -5.662441253662109e-07, 2.8153881430625916e-06, 6.197020411491394e-06, 9.578652679920197e-06, 1.2960284948348999e-05, 1.63419172167778e-05, 1.9723549485206604e-05, 2.3105181753635406e-05, 2.648681402206421e-05, 2.986844629049301e-05, 3.3250078558921814e-05, 3.6631710827350616e-05, 4.001334309577942e-05, 4.339497536420822e-05, 4.6776607632637024e-05, 5.0158239901065826e-05, 5.353987216949463e-05, 5.692150443792343e-05, 6.0303136706352234e-05, 6.368476897478104e-05, 6.706640124320984e-05, 7.044803351163864e-05, 7.382966578006744e-05, 7.721129804849625e-05, 8.059293031692505e-05, 8.397456258535385e-05, 8.735619485378265e-05, 9.073782712221146e-05, 9.411945939064026e-05, 9.750109165906906e-05, 0.00010088272392749786, 0.00010426435619592667, 0.00010764598846435547]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 6.0, 12.0, 17.0, 31.0, 47.0, 87.0, 133.0, 234.0, 487.0, 1013.0, 2645.0, 11112.0, 72111.0, 572010.0, 335501.0, 42253.0, 7159.0, 1972.0, 795.0, 416.0, 218.0, 104.0, 75.0, 45.0, 25.0, 20.0, 15.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1181640625, -1.0765380859375, -1.034912109375, -0.9932861328125, -0.95166015625, -0.9100341796875, -0.868408203125, -0.8267822265625, -0.78515625, -0.7435302734375, -0.701904296875, -0.6602783203125, -0.61865234375, -0.5770263671875, -0.535400390625, -0.4937744140625, -0.4521484375, -0.4105224609375, -0.368896484375, -0.3272705078125, -0.28564453125, -0.2440185546875, -0.202392578125, -0.1607666015625, -0.119140625, -0.0775146484375, -0.035888671875, 0.0057373046875, 0.04736328125, 0.0889892578125, 0.130615234375, 0.1722412109375, 0.2138671875, 0.2554931640625, 0.297119140625, 0.3387451171875, 0.38037109375, 0.4219970703125, 0.463623046875, 0.5052490234375, 0.546875, 0.5885009765625, 0.630126953125, 0.6717529296875, 0.71337890625, 0.7550048828125, 0.796630859375, 0.8382568359375, 0.8798828125, 0.9215087890625, 0.963134765625, 1.0047607421875, 1.04638671875, 1.0880126953125, 1.129638671875, 1.1712646484375, 1.212890625, 1.2545166015625, 1.296142578125, 1.3377685546875, 1.37939453125, 1.4210205078125, 1.462646484375, 1.5042724609375, 1.5458984375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 8.0, 7.0, 8.0, 10.0, 15.0, 20.0, 18.0, 19.0, 31.0, 37.0, 59.0, 65.0, 80.0, 79.0, 103.0, 86.0, 73.0, 52.0, 47.0, 32.0, 37.0, 33.0, 14.0, 14.0, 14.0, 8.0, 9.0, 4.0, 4.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66357421875, -0.64080810546875, -0.6180419921875, -0.59527587890625, -0.572509765625, -0.54974365234375, -0.5269775390625, -0.50421142578125, -0.4814453125, -0.45867919921875, -0.4359130859375, -0.41314697265625, -0.390380859375, -0.36761474609375, -0.3448486328125, -0.32208251953125, -0.29931640625, -0.27655029296875, -0.2537841796875, -0.23101806640625, -0.208251953125, -0.18548583984375, -0.1627197265625, -0.13995361328125, -0.1171875, -0.09442138671875, -0.0716552734375, -0.04888916015625, -0.026123046875, -0.00335693359375, 0.0194091796875, 0.04217529296875, 0.06494140625, 0.08770751953125, 0.1104736328125, 0.13323974609375, 0.156005859375, 0.17877197265625, 0.2015380859375, 0.22430419921875, 0.2470703125, 0.26983642578125, 0.2926025390625, 0.31536865234375, 0.338134765625, 0.36090087890625, 0.3836669921875, 0.40643310546875, 0.42919921875, 0.45196533203125, 0.4747314453125, 0.49749755859375, 0.520263671875, 0.54302978515625, 0.5657958984375, 0.58856201171875, 0.611328125, 0.63409423828125, 0.6568603515625, 0.67962646484375, 0.702392578125, 0.72515869140625, 0.7479248046875, 0.77069091796875, 0.79345703125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 10.0, 22.0, 30.0, 68.0, 132.0, 197.0, 202.0, 162.0, 81.0, 51.0, 15.0, 16.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.13979434967041, -10.71440601348877, -10.289018630981445, -9.863630294799805, -9.438241958618164, -9.012853622436523, -8.587465286254883, -8.162077903747559, -7.736689567565918, -7.311301231384277, -6.885913372039795, -6.4605255126953125, -6.035137176513672, -5.609748840332031, -5.184360980987549, -4.758973121643066, -4.333584785461426, -3.9081966876983643, -3.4828085899353027, -3.057420492172241, -2.6320323944091797, -2.206644296646118, -1.7812561988830566, -1.3558681011199951, -0.9304800033569336, -0.5050919055938721, -0.07970380783081055, 0.345684289932251, 0.7710723876953125, 1.196460485458374, 1.6218485832214355, 2.047236680984497, 2.472623825073242, 2.8980119228363037, 3.3234000205993652, 3.7487881183624268, 4.174176216125488, 4.599564552307129, 5.024952411651611, 5.450340270996094, 5.875728607177734, 6.301116943359375, 6.726504802703857, 7.15189266204834, 7.5772809982299805, 8.002669334411621, 8.428056716918945, 8.853445053100586, 9.278833389282227, 9.704221725463867, 10.129610061645508, 10.554997444152832, 10.980385780334473, 11.405774116516113, 11.831161499023438, 12.256549835205078, 12.681938171386719, 13.10732650756836, 13.53271484375, 13.958102226257324, 14.383490562438965, 14.808878898620605, 15.23426628112793, 15.65965461730957, 16.08504295349121]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 11.0, 11.0, 14.0, 20.0, 17.0, 27.0, 26.0, 27.0, 26.0, 45.0, 27.0, 39.0, 45.0, 48.0, 41.0, 56.0, 43.0, 51.0, 37.0, 46.0, 28.0, 49.0, 37.0, 34.0, 30.0, 22.0, 26.0, 21.0, 11.0, 14.0, 10.0, 12.0, 9.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.41882038116455, -10.11875057220459, -9.818679809570312, -9.518610000610352, -9.21854019165039, -8.918469429016113, -8.618399620056152, -8.318328857421875, -8.018259048461914, -7.718188762664795, -7.418118476867676, -7.118048667907715, -6.817978382110596, -6.517908096313477, -6.217838287353516, -5.9177680015563965, -5.617697715759277, -5.317627429962158, -5.017557144165039, -4.717487335205078, -4.417417049407959, -4.11734676361084, -3.8172767162323, -3.5172066688537598, -3.2171363830566406, -2.9170660972595215, -2.6169960498809814, -2.3169260025024414, -2.0168557167053223, -1.7167855501174927, -1.416715383529663, -1.116645336151123, -0.8165760040283203, -0.5165058374404907, -0.21643567085266113, 0.08363449573516846, 0.38370466232299805, 0.6837748289108276, 0.9838449954986572, 1.2839150428771973, 1.5839853286743164, 1.884055495262146, 2.1841256618499756, 2.4841957092285156, 2.7842659950256348, 3.084336280822754, 3.384406328201294, 3.684476375579834, 3.984546661376953, 4.284616947174072, 4.584687232971191, 4.884757041931152, 5.1848273277282715, 5.484897613525391, 5.784967422485352, 6.085037708282471, 6.38510799407959, 6.685178279876709, 6.985248565673828, 7.285318374633789, 7.585388660430908, 7.885458946228027, 8.185528755187988, 8.485599517822266, 8.785669326782227]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 7.0, 2.0, 5.0, 5.0, 14.0, 18.0, 19.0, 51.0, 78.0, 121.0, 253.0, 437.0, 983.0, 3004.0, 17880.0, 522525.0, 3609526.0, 31306.0, 4765.0, 1558.0, 692.0, 371.0, 214.0, 154.0, 95.0, 49.0, 33.0, 32.0, 16.0, 14.0, 9.0, 8.0, 9.0, 4.0, 2.0, 2.0, 4.0, 6.0, 4.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.689453125, -2.58648681640625, -2.4835205078125, -2.38055419921875, -2.277587890625, -2.17462158203125, -2.0716552734375, -1.96868896484375, -1.86572265625, -1.76275634765625, -1.6597900390625, -1.55682373046875, -1.453857421875, -1.35089111328125, -1.2479248046875, -1.14495849609375, -1.0419921875, -0.93902587890625, -0.8360595703125, -0.73309326171875, -0.630126953125, -0.52716064453125, -0.4241943359375, -0.32122802734375, -0.21826171875, -0.11529541015625, -0.0123291015625, 0.09063720703125, 0.193603515625, 0.29656982421875, 0.3995361328125, 0.50250244140625, 0.60546875, 0.70843505859375, 0.8114013671875, 0.91436767578125, 1.017333984375, 1.12030029296875, 1.2232666015625, 1.32623291015625, 1.42919921875, 1.53216552734375, 1.6351318359375, 1.73809814453125, 1.841064453125, 1.94403076171875, 2.0469970703125, 2.14996337890625, 2.2529296875, 2.35589599609375, 2.4588623046875, 2.56182861328125, 2.664794921875, 2.76776123046875, 2.8707275390625, 2.97369384765625, 3.07666015625, 3.17962646484375, 3.2825927734375, 3.38555908203125, 3.488525390625, 3.59149169921875, 3.6944580078125, 3.79742431640625, 3.900390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 4.0, 9.0, 15.0, 25.0, 22.0, 41.0, 47.0, 81.0, 81.0, 93.0, 100.0, 84.0, 91.0, 50.0, 72.0, 50.0, 37.0, 24.0, 22.0, 14.0, 13.0, 11.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374755859375, -0.3609275817871094, -0.34709930419921875, -0.3332710266113281, -0.3194427490234375, -0.3056144714355469, -0.29178619384765625, -0.2779579162597656, -0.264129638671875, -0.2503013610839844, -0.23647308349609375, -0.22264480590820312, -0.2088165283203125, -0.19498825073242188, -0.18115997314453125, -0.16733169555664062, -0.15350341796875, -0.13967514038085938, -0.12584686279296875, -0.11201858520507812, -0.0981903076171875, -0.08436203002929688, -0.07053375244140625, -0.056705474853515625, -0.042877197265625, -0.029048919677734375, -0.01522064208984375, -0.001392364501953125, 0.0124359130859375, 0.026264190673828125, 0.04009246826171875, 0.053920745849609375, 0.0677490234375, 0.08157730102539062, 0.09540557861328125, 0.10923385620117188, 0.1230621337890625, 0.13689041137695312, 0.15071868896484375, 0.16454696655273438, 0.178375244140625, 0.19220352172851562, 0.20603179931640625, 0.21986007690429688, 0.2336883544921875, 0.24751663208007812, 0.26134490966796875, 0.2751731872558594, 0.28900146484375, 0.3028297424316406, 0.31665802001953125, 0.3304862976074219, 0.3443145751953125, 0.3581428527832031, 0.37197113037109375, 0.3857994079589844, 0.399627685546875, 0.4134559631347656, 0.42728424072265625, 0.4411125183105469, 0.4549407958984375, 0.4687690734863281, 0.48259735107421875, 0.4964256286621094, 0.51025390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 6.0, 9.0, 11.0, 22.0, 37.0, 78.0, 181.0, 454.0, 1409.0, 7241.0, 146934.0, 3985713.0, 46760.0, 3974.0, 865.0, 276.0, 119.0, 76.0, 47.0, 29.0, 18.0, 14.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.78472900390625, -2.6749267578125, -2.56512451171875, -2.455322265625, -2.34552001953125, -2.2357177734375, -2.12591552734375, -2.01611328125, -1.90631103515625, -1.7965087890625, -1.68670654296875, -1.576904296875, -1.46710205078125, -1.3572998046875, -1.24749755859375, -1.1376953125, -1.02789306640625, -0.9180908203125, -0.80828857421875, -0.698486328125, -0.58868408203125, -0.4788818359375, -0.36907958984375, -0.25927734375, -0.14947509765625, -0.0396728515625, 0.07012939453125, 0.179931640625, 0.28973388671875, 0.3995361328125, 0.50933837890625, 0.619140625, 0.72894287109375, 0.8387451171875, 0.94854736328125, 1.058349609375, 1.16815185546875, 1.2779541015625, 1.38775634765625, 1.49755859375, 1.60736083984375, 1.7171630859375, 1.82696533203125, 1.936767578125, 2.04656982421875, 2.1563720703125, 2.26617431640625, 2.3759765625, 2.48577880859375, 2.5955810546875, 2.70538330078125, 2.815185546875, 2.92498779296875, 3.0347900390625, 3.14459228515625, 3.25439453125, 3.36419677734375, 3.4739990234375, 3.58380126953125, 3.693603515625, 3.80340576171875, 3.9132080078125, 4.02301025390625, 4.1328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 4.0, 2.0, 6.0, 4.0, 16.0, 31.0, 51.0, 105.0, 252.0, 704.0, 2048.0, 484.0, 171.0, 91.0, 43.0, 25.0, 11.0, 4.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70361328125, -0.6811904907226562, -0.6587677001953125, -0.6363449096679688, -0.613922119140625, -0.5914993286132812, -0.5690765380859375, -0.5466537475585938, -0.52423095703125, -0.5018081665039062, -0.4793853759765625, -0.45696258544921875, -0.434539794921875, -0.41211700439453125, -0.3896942138671875, -0.36727142333984375, -0.3448486328125, -0.32242584228515625, -0.3000030517578125, -0.27758026123046875, -0.255157470703125, -0.23273468017578125, -0.2103118896484375, -0.18788909912109375, -0.16546630859375, -0.14304351806640625, -0.1206207275390625, -0.09819793701171875, -0.075775146484375, -0.05335235595703125, -0.0309295654296875, -0.00850677490234375, 0.013916015625, 0.03633880615234375, 0.0587615966796875, 0.08118438720703125, 0.103607177734375, 0.12602996826171875, 0.1484527587890625, 0.17087554931640625, 0.19329833984375, 0.21572113037109375, 0.2381439208984375, 0.26056671142578125, 0.282989501953125, 0.30541229248046875, 0.3278350830078125, 0.35025787353515625, 0.3726806640625, 0.39510345458984375, 0.4175262451171875, 0.43994903564453125, 0.462371826171875, 0.48479461669921875, 0.5072174072265625, 0.5296401977539062, 0.55206298828125, 0.5744857788085938, 0.5969085693359375, 0.6193313598632812, 0.641754150390625, 0.6641769409179688, 0.6865997314453125, 0.7090225219726562, 0.7314453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 18.0, 86.0, 197.0, 345.0, 221.0, 85.0, 29.0, 15.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.779697418212891, -7.62592077255249, -7.47214412689209, -7.3183674812316895, -7.164590835571289, -7.010814189910889, -6.857037544250488, -6.70326042175293, -6.5494842529296875, -6.395707607269287, -6.241930961608887, -6.088154315948486, -5.934377670288086, -5.7806010246276855, -5.626824378967285, -5.473047256469727, -5.319270610809326, -5.165493965148926, -5.011717319488525, -4.857940673828125, -4.704164028167725, -4.550387382507324, -4.396610736846924, -4.242834091186523, -4.089056968688965, -3.9352803230285645, -3.781503677368164, -3.6277270317077637, -3.4739503860473633, -3.320173740386963, -3.1663968563079834, -3.012620210647583, -2.85884428024292, -2.7050676345825195, -2.551290988922119, -2.3975143432617188, -2.2437376976013184, -2.089961051940918, -1.9361841678619385, -1.782407522201538, -1.6286308765411377, -1.4748542308807373, -1.321077585220337, -1.167300820350647, -1.0135241746902466, -0.8597475290298462, -0.705970823764801, -0.5521941184997559, -0.39841747283935547, -0.2446407973766327, -0.09086412191390991, 0.06291255354881287, 0.21668922901153564, 0.37046587467193604, 0.5242425799369812, 0.6780192852020264, 0.8317959308624268, 0.9855725765228271, 1.1393492221832275, 1.2931259870529175, 1.4469026327133179, 1.6006792783737183, 1.7544560432434082, 1.9082326889038086, 2.062009334564209]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 8.0, 9.0, 10.0, 15.0, 15.0, 27.0, 31.0, 26.0, 43.0, 36.0, 44.0, 50.0, 48.0, 56.0, 53.0, 46.0, 60.0, 55.0, 49.0, 45.0, 38.0, 35.0, 32.0, 31.0, 24.0, 28.0, 21.0, 12.0, 19.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.700307846069336, -1.6449215412139893, -1.5895352363586426, -1.5341488122940063, -1.4787625074386597, -1.423376202583313, -1.3679898977279663, -1.31260347366333, -1.2572171688079834, -1.2018308639526367, -1.14644455909729, -1.0910581350326538, -1.0356718301773071, -0.9802855253219604, -0.9248992204666138, -0.8695128560066223, -0.8141265511512756, -0.758740246295929, -0.7033538818359375, -0.6479675769805908, -0.5925812125205994, -0.5371949076652527, -0.4818085730075836, -0.42642223834991455, -0.3710359036922455, -0.3156495690345764, -0.26026323437690735, -0.20487691462039948, -0.1494905799627304, -0.09410426020622253, -0.03871792554855347, 0.0166684091091156, 0.07205474376678467, 0.12744107842445374, 0.1828274130821228, 0.23821373283863068, 0.29360008239746094, 0.3489863872528076, 0.4043727219104767, 0.45975905656814575, 0.5151454210281372, 0.5705317258834839, 0.6259180903434753, 0.681304395198822, 0.7366907596588135, 0.7920770645141602, 0.8474633693695068, 0.9028497338294983, 0.958236038684845, 1.0136224031448364, 1.069008708000183, 1.1243950128555298, 1.1797813177108765, 1.2351677417755127, 1.2905540466308594, 1.345940351486206, 1.4013266563415527, 1.4567129611968994, 1.512099266052246, 1.5674856901168823, 1.622871994972229, 1.6782582998275757, 1.7336446046829224, 1.7890310287475586, 1.8444173336029053]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 7.0, 3.0, 6.0, 13.0, 19.0, 24.0, 37.0, 54.0, 75.0, 127.0, 138.0, 210.0, 339.0, 477.0, 815.0, 1433.0, 2823.0, 7027.0, 22552.0, 86461.0, 306339.0, 413616.0, 149433.0, 37450.0, 10632.0, 3896.0, 1851.0, 959.0, 549.0, 373.0, 251.0, 191.0, 92.0, 72.0, 70.0, 48.0, 23.0, 24.0, 16.0, 11.0, 10.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1953125, -1.1581878662109375, -1.121063232421875, -1.0839385986328125, -1.04681396484375, -1.0096893310546875, -0.972564697265625, -0.9354400634765625, -0.8983154296875, -0.8611907958984375, -0.824066162109375, -0.7869415283203125, -0.74981689453125, -0.7126922607421875, -0.675567626953125, -0.6384429931640625, -0.601318359375, -0.5641937255859375, -0.527069091796875, -0.4899444580078125, -0.45281982421875, -0.4156951904296875, -0.378570556640625, -0.3414459228515625, -0.3043212890625, -0.2671966552734375, -0.230072021484375, -0.1929473876953125, -0.15582275390625, -0.1186981201171875, -0.081573486328125, -0.0444488525390625, -0.00732421875, 0.0298004150390625, 0.066925048828125, 0.1040496826171875, 0.14117431640625, 0.1782989501953125, 0.215423583984375, 0.2525482177734375, 0.2896728515625, 0.3267974853515625, 0.363922119140625, 0.4010467529296875, 0.43817138671875, 0.4752960205078125, 0.512420654296875, 0.5495452880859375, 0.586669921875, 0.6237945556640625, 0.660919189453125, 0.6980438232421875, 0.73516845703125, 0.7722930908203125, 0.809417724609375, 0.8465423583984375, 0.8836669921875, 0.9207916259765625, 0.957916259765625, 0.9950408935546875, 1.03216552734375, 1.0692901611328125, 1.106414794921875, 1.1435394287109375, 1.1806640625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 10.0, 14.0, 22.0, 20.0, 31.0, 65.0, 59.0, 92.0, 95.0, 87.0, 98.0, 91.0, 73.0, 52.0, 61.0, 49.0, 22.0, 19.0, 13.0, 10.0, 8.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424560546875, -0.4100151062011719, -0.39546966552734375, -0.3809242248535156, -0.3663787841796875, -0.3518333435058594, -0.33728790283203125, -0.3227424621582031, -0.308197021484375, -0.2936515808105469, -0.27910614013671875, -0.2645606994628906, -0.2500152587890625, -0.23546981811523438, -0.22092437744140625, -0.20637893676757812, -0.19183349609375, -0.17728805541992188, -0.16274261474609375, -0.14819717407226562, -0.1336517333984375, -0.11910629272460938, -0.10456085205078125, -0.09001541137695312, -0.075469970703125, -0.060924530029296875, -0.04637908935546875, -0.031833648681640625, -0.0172882080078125, -0.002742767333984375, 0.01180267333984375, 0.026348114013671875, 0.0408935546875, 0.055438995361328125, 0.06998443603515625, 0.08452987670898438, 0.0990753173828125, 0.11362075805664062, 0.12816619873046875, 0.14271163940429688, 0.157257080078125, 0.17180252075195312, 0.18634796142578125, 0.20089340209960938, 0.2154388427734375, 0.22998428344726562, 0.24452972412109375, 0.2590751647949219, 0.27362060546875, 0.2881660461425781, 0.30271148681640625, 0.3172569274902344, 0.3318023681640625, 0.3463478088378906, 0.36089324951171875, 0.3754386901855469, 0.389984130859375, 0.4045295715332031, 0.41907501220703125, 0.4336204528808594, 0.4481658935546875, 0.4627113342285156, 0.47725677490234375, 0.4918022155761719, 0.50634765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 12.0, 13.0, 7.0, 22.0, 26.0, 38.0, 54.0, 65.0, 105.0, 125.0, 229.0, 362.0, 710.0, 1523.0, 3973.0, 14377.0, 69943.0, 342175.0, 460460.0, 121593.0, 23028.0, 5572.0, 1997.0, 879.0, 441.0, 280.0, 169.0, 105.0, 60.0, 63.0, 42.0, 25.0, 26.0, 13.0, 10.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.3165283203125, -1.269775390625, -1.2230224609375, -1.17626953125, -1.1295166015625, -1.082763671875, -1.0360107421875, -0.9892578125, -0.9425048828125, -0.895751953125, -0.8489990234375, -0.80224609375, -0.7554931640625, -0.708740234375, -0.6619873046875, -0.615234375, -0.5684814453125, -0.521728515625, -0.4749755859375, -0.42822265625, -0.3814697265625, -0.334716796875, -0.2879638671875, -0.2412109375, -0.1944580078125, -0.147705078125, -0.1009521484375, -0.05419921875, -0.0074462890625, 0.039306640625, 0.0860595703125, 0.1328125, 0.1795654296875, 0.226318359375, 0.2730712890625, 0.31982421875, 0.3665771484375, 0.413330078125, 0.4600830078125, 0.5068359375, 0.5535888671875, 0.600341796875, 0.6470947265625, 0.69384765625, 0.7406005859375, 0.787353515625, 0.8341064453125, 0.880859375, 0.9276123046875, 0.974365234375, 1.0211181640625, 1.06787109375, 1.1146240234375, 1.161376953125, 1.2081298828125, 1.2548828125, 1.3016357421875, 1.348388671875, 1.3951416015625, 1.44189453125, 1.4886474609375, 1.535400390625, 1.5821533203125, 1.62890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 8.0, 8.0, 9.0, 3.0, 17.0, 12.0, 12.0, 28.0, 23.0, 20.0, 37.0, 36.0, 28.0, 37.0, 48.0, 41.0, 48.0, 47.0, 52.0, 50.0, 46.0, 49.0, 36.0, 43.0, 38.0, 29.0, 25.0, 26.0, 26.0, 21.0, 21.0, 17.0, 12.0, 12.0, 9.0, 6.0, 3.0, 3.0, 1.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.529296875, -1.4828948974609375, -1.436492919921875, -1.3900909423828125, -1.34368896484375, -1.2972869873046875, -1.250885009765625, -1.2044830322265625, -1.1580810546875, -1.1116790771484375, -1.065277099609375, -1.0188751220703125, -0.97247314453125, -0.9260711669921875, -0.879669189453125, -0.8332672119140625, -0.786865234375, -0.7404632568359375, -0.694061279296875, -0.6476593017578125, -0.60125732421875, -0.5548553466796875, -0.508453369140625, -0.4620513916015625, -0.4156494140625, -0.3692474365234375, -0.322845458984375, -0.2764434814453125, -0.23004150390625, -0.1836395263671875, -0.137237548828125, -0.0908355712890625, -0.04443359375, 0.0019683837890625, 0.048370361328125, 0.0947723388671875, 0.14117431640625, 0.1875762939453125, 0.233978271484375, 0.2803802490234375, 0.3267822265625, 0.3731842041015625, 0.419586181640625, 0.4659881591796875, 0.51239013671875, 0.5587921142578125, 0.605194091796875, 0.6515960693359375, 0.697998046875, 0.7444000244140625, 0.790802001953125, 0.8372039794921875, 0.88360595703125, 0.9300079345703125, 0.976409912109375, 1.0228118896484375, 1.0692138671875, 1.1156158447265625, 1.162017822265625, 1.2084197998046875, 1.25482177734375, 1.3012237548828125, 1.347625732421875, 1.3940277099609375, 1.4404296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 5.0, 4.0, 8.0, 4.0, 9.0, 20.0, 18.0, 23.0, 28.0, 45.0, 62.0, 79.0, 136.0, 213.0, 338.0, 590.0, 1106.0, 2426.0, 5616.0, 14585.0, 42935.0, 135933.0, 357334.0, 317354.0, 112358.0, 35503.0, 12258.0, 4818.0, 2195.0, 1031.0, 561.0, 334.0, 181.0, 134.0, 77.0, 52.0, 38.0, 41.0, 24.0, 28.0, 9.0, 9.0, 6.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.353759765625, -0.3436279296875, -0.33349609375, -0.3233642578125, -0.313232421875, -0.3031005859375, -0.29296875, -0.2828369140625, -0.272705078125, -0.2625732421875, -0.25244140625, -0.2423095703125, -0.232177734375, -0.2220458984375, -0.2119140625, -0.2017822265625, -0.191650390625, -0.1815185546875, -0.17138671875, -0.1612548828125, -0.151123046875, -0.1409912109375, -0.130859375, -0.1207275390625, -0.110595703125, -0.1004638671875, -0.09033203125, -0.0802001953125, -0.070068359375, -0.0599365234375, -0.0498046875, -0.0396728515625, -0.029541015625, -0.0194091796875, -0.00927734375, 0.0008544921875, 0.010986328125, 0.0211181640625, 0.03125, 0.0413818359375, 0.051513671875, 0.0616455078125, 0.07177734375, 0.0819091796875, 0.092041015625, 0.1021728515625, 0.1123046875, 0.1224365234375, 0.132568359375, 0.1427001953125, 0.15283203125, 0.1629638671875, 0.173095703125, 0.1832275390625, 0.193359375, 0.2034912109375, 0.213623046875, 0.2237548828125, 0.23388671875, 0.2440185546875, 0.254150390625, 0.2642822265625, 0.2744140625, 0.2845458984375, 0.294677734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 11.0, 10.0, 9.0, 2.0, 10.0, 12.0, 16.0, 18.0, 44.0, 31.0, 53.0, 51.0, 58.0, 80.0, 93.0, 111.0, 84.0, 59.0, 52.0, 31.0, 25.0, 24.0, 22.0, 9.0, 19.0, 11.0, 10.0, 6.0, 2.0, 12.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011277198791503906, -0.0001093326136469841, -0.00010589323937892914, -0.00010245386511087418, -9.901449084281921e-05, -9.557511657476425e-05, -9.213574230670929e-05, -8.869636803865433e-05, -8.525699377059937e-05, -8.18176195025444e-05, -7.837824523448944e-05, -7.493887096643448e-05, -7.149949669837952e-05, -6.806012243032455e-05, -6.462074816226959e-05, -6.118137389421463e-05, -5.774199962615967e-05, -5.4302625358104706e-05, -5.0863251090049744e-05, -4.742387682199478e-05, -4.398450255393982e-05, -4.054512828588486e-05, -3.7105754017829895e-05, -3.366637974977493e-05, -3.022700548171997e-05, -2.678763121366501e-05, -2.3348256945610046e-05, -1.9908882677555084e-05, -1.6469508409500122e-05, -1.303013414144516e-05, -9.590759873390198e-06, -6.151385605335236e-06, -2.7120113372802734e-06, 7.273629307746887e-07, 4.166737198829651e-06, 7.606111466884613e-06, 1.1045485734939575e-05, 1.4484860002994537e-05, 1.79242342710495e-05, 2.136360853910446e-05, 2.4802982807159424e-05, 2.8242357075214386e-05, 3.168173134326935e-05, 3.512110561132431e-05, 3.856047987937927e-05, 4.1999854147434235e-05, 4.54392284154892e-05, 4.887860268354416e-05, 5.231797695159912e-05, 5.575735121965408e-05, 5.9196725487709045e-05, 6.263609975576401e-05, 6.607547402381897e-05, 6.951484829187393e-05, 7.29542225599289e-05, 7.639359682798386e-05, 7.983297109603882e-05, 8.327234536409378e-05, 8.671171963214874e-05, 9.01510939002037e-05, 9.359046816825867e-05, 9.702984243631363e-05, 0.00010046921670436859, 0.00010390859097242355, 0.00010734796524047852]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 8.0, 9.0, 14.0, 16.0, 19.0, 37.0, 44.0, 92.0, 133.0, 190.0, 294.0, 541.0, 922.0, 1942.0, 4295.0, 11643.0, 34689.0, 120349.0, 388763.0, 339290.0, 98463.0, 29403.0, 9953.0, 3750.0, 1612.0, 844.0, 459.0, 280.0, 167.0, 102.0, 66.0, 57.0, 39.0, 21.0, 11.0, 10.0, 9.0, 4.0, 2.0, 3.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.401123046875, -0.38855743408203125, -0.3759918212890625, -0.36342620849609375, -0.350860595703125, -0.33829498291015625, -0.3257293701171875, -0.31316375732421875, -0.30059814453125, -0.28803253173828125, -0.2754669189453125, -0.26290130615234375, -0.250335693359375, -0.23777008056640625, -0.2252044677734375, -0.21263885498046875, -0.2000732421875, -0.18750762939453125, -0.1749420166015625, -0.16237640380859375, -0.149810791015625, -0.13724517822265625, -0.1246795654296875, -0.11211395263671875, -0.09954833984375, -0.08698272705078125, -0.0744171142578125, -0.06185150146484375, -0.049285888671875, -0.03672027587890625, -0.0241546630859375, -0.01158905029296875, 0.0009765625, 0.01354217529296875, 0.0261077880859375, 0.03867340087890625, 0.051239013671875, 0.06380462646484375, 0.0763702392578125, 0.08893585205078125, 0.10150146484375, 0.11406707763671875, 0.1266326904296875, 0.13919830322265625, 0.151763916015625, 0.16432952880859375, 0.1768951416015625, 0.18946075439453125, 0.2020263671875, 0.21459197998046875, 0.2271575927734375, 0.23972320556640625, 0.252288818359375, 0.26485443115234375, 0.2774200439453125, 0.28998565673828125, 0.30255126953125, 0.31511688232421875, 0.3276824951171875, 0.34024810791015625, 0.352813720703125, 0.36537933349609375, 0.3779449462890625, 0.39051055908203125, 0.403076171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 5.0, 4.0, 5.0, 7.0, 13.0, 12.0, 20.0, 12.0, 31.0, 27.0, 37.0, 45.0, 53.0, 60.0, 62.0, 70.0, 74.0, 69.0, 63.0, 57.0, 51.0, 48.0, 31.0, 29.0, 25.0, 27.0, 15.0, 7.0, 10.0, 3.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.450927734375, -0.4389152526855469, -0.42690277099609375, -0.4148902893066406, -0.4028778076171875, -0.3908653259277344, -0.37885284423828125, -0.3668403625488281, -0.354827880859375, -0.3428153991699219, -0.33080291748046875, -0.3187904357910156, -0.3067779541015625, -0.2947654724121094, -0.28275299072265625, -0.2707405090332031, -0.25872802734375, -0.24671554565429688, -0.23470306396484375, -0.22269058227539062, -0.2106781005859375, -0.19866561889648438, -0.18665313720703125, -0.17464065551757812, -0.162628173828125, -0.15061569213867188, -0.13860321044921875, -0.12659072875976562, -0.1145782470703125, -0.10256576538085938, -0.09055328369140625, -0.07854080200195312, -0.0665283203125, -0.054515838623046875, -0.04250335693359375, -0.030490875244140625, -0.0184783935546875, -0.006465911865234375, 0.00554656982421875, 0.017559051513671875, 0.029571533203125, 0.041584014892578125, 0.05359649658203125, 0.06560897827148438, 0.0776214599609375, 0.08963394165039062, 0.10164642333984375, 0.11365890502929688, 0.12567138671875, 0.13768386840820312, 0.14969635009765625, 0.16170883178710938, 0.1737213134765625, 0.18573379516601562, 0.19774627685546875, 0.20975875854492188, 0.221771240234375, 0.23378372192382812, 0.24579620361328125, 0.2578086853027344, 0.2698211669921875, 0.2818336486816406, 0.29384613037109375, 0.3058586120605469, 0.31787109375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 9.0, 14.0, 17.0, 21.0, 49.0, 55.0, 79.0, 145.0, 140.0, 137.0, 110.0, 67.0, 57.0, 33.0, 19.0, 13.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.278322219848633, -5.046104431152344, -4.8138861656188965, -4.581668376922607, -4.34945011138916, -4.117232322692871, -3.885014295578003, -3.6527962684631348, -3.4205784797668457, -3.1883604526519775, -2.9561424255371094, -2.7239246368408203, -2.491706609725952, -2.259488582611084, -2.027270555496216, -1.7950526475906372, -1.5628345012664795, -1.3306164741516113, -1.0983985662460327, -0.8661805391311646, -0.6339625716209412, -0.4017446041107178, -0.1695265769958496, 0.062691330909729, 0.29490935802459717, 0.5271273255348206, 0.759345293045044, 0.9915633201599121, 1.2237813472747803, 1.4559992551803589, 1.688217282295227, 1.9204351902008057, 2.152653217315674, 2.384871244430542, 2.61708927154541, 2.849307060241699, 3.0815250873565674, 3.3137431144714355, 3.5459611415863037, 3.778179168701172, 4.010396957397461, 4.24261474609375, 4.474833011627197, 4.707050800323486, 4.939269065856934, 5.171486854553223, 5.403704643249512, 5.635922908782959, 5.868141174316406, 6.100358963012695, 6.332577228546143, 6.564795017242432, 6.797013282775879, 7.029231071472168, 7.261448860168457, 7.493667125701904, 7.725884914398193, 7.958102703094482, 8.19032096862793, 8.422538757324219, 8.654756546020508, 8.886974334716797, 9.119193077087402, 9.351410865783691, 9.58362865447998]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 8.0, 3.0, 5.0, 4.0, 14.0, 6.0, 10.0, 12.0, 17.0, 13.0, 19.0, 22.0, 20.0, 37.0, 38.0, 33.0, 33.0, 46.0, 42.0, 42.0, 49.0, 45.0, 40.0, 37.0, 47.0, 35.0, 34.0, 31.0, 27.0, 32.0, 32.0, 21.0, 17.0, 24.0, 27.0, 9.0, 10.0, 11.0, 13.0, 6.0, 6.0, 9.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-7.593559265136719, -7.337581157684326, -7.081603527069092, -6.825625419616699, -6.569647789001465, -6.313669681549072, -6.05769157409668, -5.801713943481445, -5.545735836029053, -5.28975772857666, -5.033780097961426, -4.777801990509033, -4.521823883056641, -4.265846252441406, -4.009868144989014, -3.7538902759552, -3.4979124069213867, -3.2419345378875732, -2.9859566688537598, -2.729978561401367, -2.4740006923675537, -2.2180228233337402, -1.9620448350906372, -1.7060668468475342, -1.4500889778137207, -1.1941111087799072, -0.9381331205368042, -0.682155191898346, -0.4261772632598877, -0.17019939422607422, 0.08577859401702881, 0.34175658226013184, 0.5977344512939453, 0.8537123799324036, 1.1096903085708618, 1.3656682968139648, 1.6216461658477783, 1.8776240348815918, 2.1336021423339844, 2.389580011367798, 2.6455578804016113, 2.901535749435425, 3.1575136184692383, 3.413491725921631, 3.6694695949554443, 3.925447463989258, 4.18142557144165, 4.437403678894043, 4.693381309509277, 4.94935941696167, 5.205337047576904, 5.461315155029297, 5.717292785644531, 5.973270893096924, 6.229249000549316, 6.485226631164551, 6.741204738616943, 6.997182846069336, 7.25316047668457, 7.509138584136963, 7.7651166915893555, 8.02109432220459, 8.277071952819824, 8.533050537109375, 8.78902816772461]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 3.0, 14.0, 20.0, 29.0, 52.0, 126.0, 247.0, 625.0, 1614.0, 5104.0, 23482.0, 375191.0, 3725988.0, 48704.0, 8552.0, 2459.0, 958.0, 486.0, 210.0, 128.0, 74.0, 59.0, 32.0, 33.0, 20.0, 22.0, 6.0, 7.0, 12.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4677734375, -1.4070892333984375, -1.346405029296875, -1.2857208251953125, -1.22503662109375, -1.1643524169921875, -1.103668212890625, -1.0429840087890625, -0.9822998046875, -0.9216156005859375, -0.860931396484375, -0.8002471923828125, -0.73956298828125, -0.6788787841796875, -0.618194580078125, -0.5575103759765625, -0.496826171875, -0.4361419677734375, -0.375457763671875, -0.3147735595703125, -0.25408935546875, -0.1934051513671875, -0.132720947265625, -0.0720367431640625, -0.0113525390625, 0.0493316650390625, 0.110015869140625, 0.1707000732421875, 0.23138427734375, 0.2920684814453125, 0.352752685546875, 0.4134368896484375, 0.47412109375, 0.5348052978515625, 0.595489501953125, 0.6561737060546875, 0.71685791015625, 0.7775421142578125, 0.838226318359375, 0.8989105224609375, 0.9595947265625, 1.0202789306640625, 1.080963134765625, 1.1416473388671875, 1.20233154296875, 1.2630157470703125, 1.323699951171875, 1.3843841552734375, 1.445068359375, 1.5057525634765625, 1.566436767578125, 1.6271209716796875, 1.68780517578125, 1.7484893798828125, 1.809173583984375, 1.8698577880859375, 1.9305419921875, 1.9912261962890625, 2.051910400390625, 2.1125946044921875, 2.17327880859375, 2.2339630126953125, 2.294647216796875, 2.3553314208984375, 2.416015625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 8.0, 10.0, 15.0, 14.0, 31.0, 36.0, 45.0, 54.0, 69.0, 85.0, 73.0, 72.0, 67.0, 76.0, 69.0, 52.0, 54.0, 44.0, 35.0, 28.0, 11.0, 10.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364990234375, -0.3514747619628906, -0.33795928955078125, -0.3244438171386719, -0.3109283447265625, -0.2974128723144531, -0.28389739990234375, -0.2703819274902344, -0.256866455078125, -0.24335098266601562, -0.22983551025390625, -0.21632003784179688, -0.2028045654296875, -0.18928909301757812, -0.17577362060546875, -0.16225814819335938, -0.14874267578125, -0.13522720336914062, -0.12171173095703125, -0.10819625854492188, -0.0946807861328125, -0.08116531372070312, -0.06764984130859375, -0.054134368896484375, -0.040618896484375, -0.027103424072265625, -0.01358795166015625, -7.2479248046875e-05, 0.0134429931640625, 0.026958465576171875, 0.04047393798828125, 0.053989410400390625, 0.0675048828125, 0.08102035522460938, 0.09453582763671875, 0.10805130004882812, 0.1215667724609375, 0.13508224487304688, 0.14859771728515625, 0.16211318969726562, 0.175628662109375, 0.18914413452148438, 0.20265960693359375, 0.21617507934570312, 0.2296905517578125, 0.24320602416992188, 0.25672149658203125, 0.2702369689941406, 0.28375244140625, 0.2972679138183594, 0.31078338623046875, 0.3242988586425781, 0.3378143310546875, 0.3513298034667969, 0.36484527587890625, 0.3783607482910156, 0.391876220703125, 0.4053916931152344, 0.41890716552734375, 0.4324226379394531, 0.4459381103515625, 0.4594535827636719, 0.47296905517578125, 0.4864845275878906, 0.5]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 11.0, 11.0, 22.0, 27.0, 37.0, 60.0, 79.0, 138.0, 329.0, 759.0, 2665.0, 18681.0, 2381457.0, 1767728.0, 18163.0, 2505.0, 722.0, 305.0, 161.0, 113.0, 83.0, 57.0, 48.0, 37.0, 20.0, 20.0, 9.0, 9.0, 7.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.132781982421875, -2.05657958984375, -1.980377197265625, -1.9041748046875, -1.827972412109375, -1.75177001953125, -1.675567626953125, -1.599365234375, -1.523162841796875, -1.44696044921875, -1.370758056640625, -1.2945556640625, -1.218353271484375, -1.14215087890625, -1.065948486328125, -0.98974609375, -0.913543701171875, -0.83734130859375, -0.761138916015625, -0.6849365234375, -0.608734130859375, -0.53253173828125, -0.456329345703125, -0.380126953125, -0.303924560546875, -0.22772216796875, -0.151519775390625, -0.0753173828125, 0.000885009765625, 0.07708740234375, 0.153289794921875, 0.2294921875, 0.305694580078125, 0.38189697265625, 0.458099365234375, 0.5343017578125, 0.610504150390625, 0.68670654296875, 0.762908935546875, 0.839111328125, 0.915313720703125, 0.99151611328125, 1.067718505859375, 1.1439208984375, 1.220123291015625, 1.29632568359375, 1.372528076171875, 1.44873046875, 1.524932861328125, 1.60113525390625, 1.677337646484375, 1.7535400390625, 1.829742431640625, 1.90594482421875, 1.982147216796875, 2.058349609375, 2.134552001953125, 2.21075439453125, 2.286956787109375, 2.3631591796875, 2.439361572265625, 2.51556396484375, 2.591766357421875, 2.66796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 8.0, 7.0, 15.0, 26.0, 44.0, 105.0, 235.0, 1103.0, 1923.0, 359.0, 114.0, 60.0, 25.0, 11.0, 19.0, 3.0, 5.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4365234375, -0.41680908203125, -0.3970947265625, -0.37738037109375, -0.357666015625, -0.33795166015625, -0.3182373046875, -0.29852294921875, -0.27880859375, -0.25909423828125, -0.2393798828125, -0.21966552734375, -0.199951171875, -0.18023681640625, -0.1605224609375, -0.14080810546875, -0.12109375, -0.10137939453125, -0.0816650390625, -0.06195068359375, -0.042236328125, -0.02252197265625, -0.0028076171875, 0.01690673828125, 0.03662109375, 0.05633544921875, 0.0760498046875, 0.09576416015625, 0.115478515625, 0.13519287109375, 0.1549072265625, 0.17462158203125, 0.1943359375, 0.21405029296875, 0.2337646484375, 0.25347900390625, 0.273193359375, 0.29290771484375, 0.3126220703125, 0.33233642578125, 0.35205078125, 0.37176513671875, 0.3914794921875, 0.41119384765625, 0.430908203125, 0.45062255859375, 0.4703369140625, 0.49005126953125, 0.509765625, 0.52947998046875, 0.5491943359375, 0.56890869140625, 0.588623046875, 0.60833740234375, 0.6280517578125, 0.64776611328125, 0.66748046875, 0.68719482421875, 0.7069091796875, 0.72662353515625, 0.746337890625, 0.76605224609375, 0.7857666015625, 0.80548095703125, 0.8251953125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 35.0, 226.0, 474.0, 198.0, 55.0, 11.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.512691497802734, -9.320574760437012, -9.128458023071289, -8.936341285705566, -8.744224548339844, -8.552106857299805, -8.359990119934082, -8.16787338256836, -7.975756645202637, -7.783639907836914, -7.591523170471191, -7.3994059562683105, -7.207289218902588, -7.015172481536865, -6.823055267333984, -6.630938529968262, -6.438821792602539, -6.246705055236816, -6.054588317871094, -5.862471103668213, -5.67035436630249, -5.478237628936768, -5.286120414733887, -5.094003677368164, -4.901886940002441, -4.709770202636719, -4.517653465270996, -4.325536251068115, -4.133419513702393, -3.94130277633667, -3.749185800552368, -3.5570688247680664, -3.3649516105651855, -3.172834873199463, -2.980717897415161, -2.7886009216308594, -2.5964841842651367, -2.404367446899414, -2.2122504711151123, -2.0201334953308105, -1.828016757965088, -1.6358999013900757, -1.4437830448150635, -1.2516661882400513, -1.059549331665039, -0.8674324750900269, -0.6753156185150146, -0.48319876194000244, -0.29108190536499023, -0.09896504878997803, 0.09315180778503418, 0.2852686643600464, 0.4773855209350586, 0.6695023775100708, 0.861619234085083, 1.0537360906600952, 1.2458529472351074, 1.4379698038101196, 1.6300866603851318, 1.822203516960144, 2.0143203735351562, 2.206437110900879, 2.3985540866851807, 2.5906710624694824, 2.782787799835205]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 13.0, 13.0, 23.0, 37.0, 38.0, 66.0, 72.0, 67.0, 70.0, 95.0, 95.0, 71.0, 83.0, 52.0, 52.0, 38.0, 33.0, 24.0, 20.0, 14.0, 8.0, 5.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.841303586959839, -2.7718827724456787, -2.7024621963500977, -2.6330413818359375, -2.5636205673217773, -2.494199752807617, -2.424779176712036, -2.355358362197876, -2.285937786102295, -2.2165169715881348, -2.1470963954925537, -2.0776755809783936, -2.0082547664642334, -1.9388340711593628, -1.8694133758544922, -1.799992561340332, -1.7305717468261719, -1.6611510515213013, -1.5917302370071411, -1.5223095417022705, -1.4528887271881104, -1.3834680318832397, -1.3140473365783691, -1.244626522064209, -1.1752058267593384, -1.1057851314544678, -1.0363643169403076, -0.966943621635437, -0.8975228667259216, -0.8281021118164062, -0.7586814165115356, -0.6892606616020203, -0.6198396682739258, -0.5504189133644104, -0.4809981882572174, -0.4115774631500244, -0.34215670824050903, -0.27273595333099365, -0.20331522822380066, -0.13389450311660767, -0.06447374820709229, 0.004946991801261902, 0.07436773180961609, 0.14378847181797028, 0.21320921182632446, 0.28262996673583984, 0.35205069184303284, 0.42147141695022583, 0.4908921718597412, 0.5603129267692566, 0.629733681678772, 0.6991543769836426, 0.768575131893158, 0.8379958868026733, 0.907416582107544, 0.9768373370170593, 1.0462580919265747, 1.1156787872314453, 1.1850996017456055, 1.254520297050476, 1.3239409923553467, 1.3933618068695068, 1.4627825021743774, 1.532203197479248, 1.6016240119934082]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 9.0, 7.0, 10.0, 13.0, 15.0, 23.0, 35.0, 44.0, 67.0, 106.0, 156.0, 235.0, 360.0, 671.0, 1223.0, 2461.0, 6073.0, 17403.0, 59519.0, 224701.0, 430862.0, 218191.0, 58269.0, 16772.0, 5854.0, 2467.0, 1237.0, 647.0, 367.0, 229.0, 151.0, 95.0, 79.0, 60.0, 41.0, 33.0, 23.0, 17.0, 7.0, 7.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0380859375, -1.0028839111328125, -0.967681884765625, -0.9324798583984375, -0.89727783203125, -0.8620758056640625, -0.826873779296875, -0.7916717529296875, -0.7564697265625, -0.7212677001953125, -0.686065673828125, -0.6508636474609375, -0.61566162109375, -0.5804595947265625, -0.545257568359375, -0.5100555419921875, -0.474853515625, -0.4396514892578125, -0.404449462890625, -0.3692474365234375, -0.33404541015625, -0.2988433837890625, -0.263641357421875, -0.2284393310546875, -0.1932373046875, -0.1580352783203125, -0.122833251953125, -0.0876312255859375, -0.05242919921875, -0.0172271728515625, 0.017974853515625, 0.0531768798828125, 0.08837890625, 0.1235809326171875, 0.158782958984375, 0.1939849853515625, 0.22918701171875, 0.2643890380859375, 0.299591064453125, 0.3347930908203125, 0.3699951171875, 0.4051971435546875, 0.440399169921875, 0.4756011962890625, 0.51080322265625, 0.5460052490234375, 0.581207275390625, 0.6164093017578125, 0.651611328125, 0.6868133544921875, 0.722015380859375, 0.7572174072265625, 0.79241943359375, 0.8276214599609375, 0.862823486328125, 0.8980255126953125, 0.9332275390625, 0.9684295654296875, 1.003631591796875, 1.0388336181640625, 1.07403564453125, 1.1092376708984375, 1.144439697265625, 1.1796417236328125, 1.21484375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 12.0, 10.0, 20.0, 23.0, 34.0, 39.0, 47.0, 63.0, 78.0, 80.0, 71.0, 76.0, 79.0, 71.0, 65.0, 46.0, 42.0, 46.0, 24.0, 22.0, 15.0, 7.0, 3.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359130859375, -0.3454856872558594, -0.33184051513671875, -0.3181953430175781, -0.3045501708984375, -0.2909049987792969, -0.27725982666015625, -0.2636146545410156, -0.249969482421875, -0.23632431030273438, -0.22267913818359375, -0.20903396606445312, -0.1953887939453125, -0.18174362182617188, -0.16809844970703125, -0.15445327758789062, -0.14080810546875, -0.12716293334960938, -0.11351776123046875, -0.09987258911132812, -0.0862274169921875, -0.07258224487304688, -0.05893707275390625, -0.045291900634765625, -0.031646728515625, -0.018001556396484375, -0.00435638427734375, 0.009288787841796875, 0.0229339599609375, 0.036579132080078125, 0.05022430419921875, 0.06386947631835938, 0.0775146484375, 0.09115982055664062, 0.10480499267578125, 0.11845016479492188, 0.1320953369140625, 0.14574050903320312, 0.15938568115234375, 0.17303085327148438, 0.186676025390625, 0.20032119750976562, 0.21396636962890625, 0.22761154174804688, 0.2412567138671875, 0.2549018859863281, 0.26854705810546875, 0.2821922302246094, 0.29583740234375, 0.3094825744628906, 0.32312774658203125, 0.3367729187011719, 0.3504180908203125, 0.3640632629394531, 0.37770843505859375, 0.3913536071777344, 0.404998779296875, 0.4186439514160156, 0.43228912353515625, 0.4459342956542969, 0.4595794677734375, 0.4732246398925781, 0.48686981201171875, 0.5005149841308594, 0.51416015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 6.0, 5.0, 18.0, 22.0, 27.0, 43.0, 55.0, 65.0, 81.0, 135.0, 214.0, 343.0, 530.0, 862.0, 1969.0, 5549.0, 24717.0, 140310.0, 480072.0, 313968.0, 61391.0, 11668.0, 3248.0, 1282.0, 744.0, 406.0, 292.0, 160.0, 110.0, 83.0, 57.0, 27.0, 35.0, 22.0, 9.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.59765625, -1.55419921875, -1.5107421875, -1.46728515625, -1.423828125, -1.38037109375, -1.3369140625, -1.29345703125, -1.25, -1.20654296875, -1.1630859375, -1.11962890625, -1.076171875, -1.03271484375, -0.9892578125, -0.94580078125, -0.90234375, -0.85888671875, -0.8154296875, -0.77197265625, -0.728515625, -0.68505859375, -0.6416015625, -0.59814453125, -0.5546875, -0.51123046875, -0.4677734375, -0.42431640625, -0.380859375, -0.33740234375, -0.2939453125, -0.25048828125, -0.20703125, -0.16357421875, -0.1201171875, -0.07666015625, -0.033203125, 0.01025390625, 0.0537109375, 0.09716796875, 0.140625, 0.18408203125, 0.2275390625, 0.27099609375, 0.314453125, 0.35791015625, 0.4013671875, 0.44482421875, 0.48828125, 0.53173828125, 0.5751953125, 0.61865234375, 0.662109375, 0.70556640625, 0.7490234375, 0.79248046875, 0.8359375, 0.87939453125, 0.9228515625, 0.96630859375, 1.009765625, 1.05322265625, 1.0966796875, 1.14013671875, 1.18359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 8.0, 9.0, 11.0, 14.0, 16.0, 15.0, 25.0, 27.0, 17.0, 34.0, 33.0, 25.0, 28.0, 33.0, 48.0, 45.0, 53.0, 50.0, 48.0, 53.0, 59.0, 39.0, 35.0, 34.0, 40.0, 37.0, 31.0, 25.0, 28.0, 27.0, 15.0, 12.0, 7.0, 5.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.7275390625, -1.680419921875, -1.63330078125, -1.586181640625, -1.5390625, -1.491943359375, -1.44482421875, -1.397705078125, -1.3505859375, -1.303466796875, -1.25634765625, -1.209228515625, -1.162109375, -1.114990234375, -1.06787109375, -1.020751953125, -0.9736328125, -0.926513671875, -0.87939453125, -0.832275390625, -0.78515625, -0.738037109375, -0.69091796875, -0.643798828125, -0.5966796875, -0.549560546875, -0.50244140625, -0.455322265625, -0.408203125, -0.361083984375, -0.31396484375, -0.266845703125, -0.2197265625, -0.172607421875, -0.12548828125, -0.078369140625, -0.03125, 0.015869140625, 0.06298828125, 0.110107421875, 0.1572265625, 0.204345703125, 0.25146484375, 0.298583984375, 0.345703125, 0.392822265625, 0.43994140625, 0.487060546875, 0.5341796875, 0.581298828125, 0.62841796875, 0.675537109375, 0.72265625, 0.769775390625, 0.81689453125, 0.864013671875, 0.9111328125, 0.958251953125, 1.00537109375, 1.052490234375, 1.099609375, 1.146728515625, 1.19384765625, 1.240966796875, 1.2880859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 11.0, 15.0, 23.0, 32.0, 61.0, 127.0, 269.0, 646.0, 2106.0, 9831.0, 87287.0, 639286.0, 277227.0, 25778.0, 3965.0, 1086.0, 410.0, 185.0, 83.0, 44.0, 33.0, 17.0, 13.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.541015625, -0.5234146118164062, -0.5058135986328125, -0.48821258544921875, -0.470611572265625, -0.45301055908203125, -0.4354095458984375, -0.41780853271484375, -0.40020751953125, -0.38260650634765625, -0.3650054931640625, -0.34740447998046875, -0.329803466796875, -0.31220245361328125, -0.2946014404296875, -0.27700042724609375, -0.2593994140625, -0.24179840087890625, -0.2241973876953125, -0.20659637451171875, -0.188995361328125, -0.17139434814453125, -0.1537933349609375, -0.13619232177734375, -0.11859130859375, -0.10099029541015625, -0.0833892822265625, -0.06578826904296875, -0.048187255859375, -0.03058624267578125, -0.0129852294921875, 0.00461578369140625, 0.022216796875, 0.03981781005859375, 0.0574188232421875, 0.07501983642578125, 0.092620849609375, 0.11022186279296875, 0.1278228759765625, 0.14542388916015625, 0.16302490234375, 0.18062591552734375, 0.1982269287109375, 0.21582794189453125, 0.233428955078125, 0.25102996826171875, 0.2686309814453125, 0.28623199462890625, 0.3038330078125, 0.32143402099609375, 0.3390350341796875, 0.35663604736328125, 0.374237060546875, 0.39183807373046875, 0.4094390869140625, 0.42704010009765625, 0.44464111328125, 0.46224212646484375, 0.4798431396484375, 0.49744415283203125, 0.515045166015625, 0.5326461791992188, 0.5502471923828125, 0.5678482055664062, 0.58544921875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 4.0, 9.0, 5.0, 14.0, 12.0, 22.0, 17.0, 28.0, 47.0, 47.0, 55.0, 92.0, 130.0, 132.0, 95.0, 73.0, 38.0, 36.0, 33.0, 30.0, 17.0, 13.0, 11.0, 12.0, 4.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013113021850585938, -0.00012675300240516663, -0.00012237578630447388, -0.00011799857020378113, -0.00011362135410308838, -0.00010924413800239563, -0.00010486692190170288, -0.00010048970580101013, -9.611248970031738e-05, -9.173527359962463e-05, -8.735805749893188e-05, -8.298084139823914e-05, -7.860362529754639e-05, -7.422640919685364e-05, -6.984919309616089e-05, -6.547197699546814e-05, -6.109476089477539e-05, -5.671754479408264e-05, -5.234032869338989e-05, -4.7963112592697144e-05, -4.3585896492004395e-05, -3.9208680391311646e-05, -3.4831464290618896e-05, -3.0454248189926147e-05, -2.60770320892334e-05, -2.169981598854065e-05, -1.73225998878479e-05, -1.2945383787155151e-05, -8.568167686462402e-06, -4.190951585769653e-06, 1.862645149230957e-07, 4.563480615615845e-06, 8.940696716308594e-06, 1.3317912817001343e-05, 1.7695128917694092e-05, 2.207234501838684e-05, 2.644956111907959e-05, 3.082677721977234e-05, 3.520399332046509e-05, 3.958120942115784e-05, 4.3958425521850586e-05, 4.8335641622543335e-05, 5.2712857723236084e-05, 5.709007382392883e-05, 6.146728992462158e-05, 6.584450602531433e-05, 7.022172212600708e-05, 7.459893822669983e-05, 7.897615432739258e-05, 8.335337042808533e-05, 8.773058652877808e-05, 9.210780262947083e-05, 9.648501873016357e-05, 0.00010086223483085632, 0.00010523945093154907, 0.00010961666703224182, 0.00011399388313293457, 0.00011837109923362732, 0.00012274831533432007, 0.00012712553143501282, 0.00013150274753570557, 0.00013587996363639832, 0.00014025717973709106, 0.0001446343958377838, 0.00014901161193847656]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 9.0, 9.0, 7.0, 16.0, 11.0, 16.0, 40.0, 57.0, 75.0, 142.0, 212.0, 422.0, 690.0, 1438.0, 3279.0, 10415.0, 43977.0, 241638.0, 546171.0, 156894.0, 30248.0, 7590.0, 2623.0, 1127.0, 607.0, 303.0, 193.0, 117.0, 74.0, 48.0, 33.0, 12.0, 19.0, 15.0, 9.0, 7.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38330078125, -0.3706817626953125, -0.358062744140625, -0.3454437255859375, -0.33282470703125, -0.3202056884765625, -0.307586669921875, -0.2949676513671875, -0.2823486328125, -0.2697296142578125, -0.257110595703125, -0.2444915771484375, -0.23187255859375, -0.2192535400390625, -0.206634521484375, -0.1940155029296875, -0.181396484375, -0.1687774658203125, -0.156158447265625, -0.1435394287109375, -0.13092041015625, -0.1183013916015625, -0.105682373046875, -0.0930633544921875, -0.0804443359375, -0.0678253173828125, -0.055206298828125, -0.0425872802734375, -0.02996826171875, -0.0173492431640625, -0.004730224609375, 0.0078887939453125, 0.0205078125, 0.0331268310546875, 0.045745849609375, 0.0583648681640625, 0.07098388671875, 0.0836029052734375, 0.096221923828125, 0.1088409423828125, 0.1214599609375, 0.1340789794921875, 0.146697998046875, 0.1593170166015625, 0.17193603515625, 0.1845550537109375, 0.197174072265625, 0.2097930908203125, 0.222412109375, 0.2350311279296875, 0.247650146484375, 0.2602691650390625, 0.27288818359375, 0.2855072021484375, 0.298126220703125, 0.3107452392578125, 0.3233642578125, 0.3359832763671875, 0.348602294921875, 0.3612213134765625, 0.37384033203125, 0.3864593505859375, 0.399078369140625, 0.4116973876953125, 0.42431640625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 5.0, 13.0, 23.0, 25.0, 28.0, 46.0, 56.0, 69.0, 68.0, 86.0, 82.0, 92.0, 86.0, 76.0, 64.0, 45.0, 31.0, 21.0, 23.0, 14.0, 9.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.3222084045410156, -0.30970001220703125, -0.2971916198730469, -0.2846832275390625, -0.2721748352050781, -0.25966644287109375, -0.24715805053710938, -0.234649658203125, -0.22214126586914062, -0.20963287353515625, -0.19712448120117188, -0.1846160888671875, -0.17210769653320312, -0.15959930419921875, -0.14709091186523438, -0.13458251953125, -0.12207412719726562, -0.10956573486328125, -0.09705734252929688, -0.0845489501953125, -0.07204055786132812, -0.05953216552734375, -0.047023773193359375, -0.034515380859375, -0.022006988525390625, -0.00949859619140625, 0.003009796142578125, 0.0155181884765625, 0.028026580810546875, 0.04053497314453125, 0.053043365478515625, 0.0655517578125, 0.07806015014648438, 0.09056854248046875, 0.10307693481445312, 0.1155853271484375, 0.12809371948242188, 0.14060211181640625, 0.15311050415039062, 0.165618896484375, 0.17812728881835938, 0.19063568115234375, 0.20314407348632812, 0.2156524658203125, 0.22816085815429688, 0.24066925048828125, 0.2531776428222656, 0.26568603515625, 0.2781944274902344, 0.29070281982421875, 0.3032112121582031, 0.3157196044921875, 0.3282279968261719, 0.34073638916015625, 0.3532447814941406, 0.365753173828125, 0.3782615661621094, 0.39076995849609375, 0.4032783508300781, 0.4157867431640625, 0.4282951354980469, 0.44080352783203125, 0.4533119201660156, 0.4658203125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 11.0, 46.0, 139.0, 325.0, 294.0, 133.0, 39.0, 12.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.213546276092529, -6.659966945648193, -6.106387615203857, -5.552807807922363, -4.999228477478027, -4.445649147033691, -3.8920698165893555, -3.3384904861450195, -2.7849111557006836, -2.2313318252563477, -1.6777523756027222, -1.1241729259490967, -0.5705935955047607, -0.017014265060424805, 0.5365653038024902, 1.0901446342468262, 1.643723964691162, 2.197303295135498, 2.750882625579834, 3.304462194442749, 3.858041524887085, 4.41162109375, 4.965200424194336, 5.518779754638672, 6.072359085083008, 6.625938415527344, 7.17951774597168, 7.733097076416016, 8.286676406860352, 8.840255737304688, 9.393835067749023, 9.94741439819336, 10.500995635986328, 11.054574966430664, 11.608154296875, 12.161733627319336, 12.715312957763672, 13.268892288208008, 13.822471618652344, 14.37605094909668, 14.929630279541016, 15.483209609985352, 16.036788940429688, 16.590368270874023, 17.14394760131836, 17.697526931762695, 18.25110626220703, 18.804685592651367, 19.358264923095703, 19.91184425354004, 20.465423583984375, 21.01900291442871, 21.572582244873047, 22.126161575317383, 22.67974090576172, 23.233320236206055, 23.786901473999023, 24.34048080444336, 24.894060134887695, 25.44763946533203, 26.001218795776367, 26.554798126220703, 27.10837745666504, 27.661956787109375, 28.21553611755371]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 1.0, 6.0, 11.0, 8.0, 16.0, 14.0, 21.0, 19.0, 33.0, 38.0, 39.0, 60.0, 41.0, 43.0, 54.0, 59.0, 58.0, 64.0, 42.0, 64.0, 50.0, 51.0, 39.0, 26.0, 29.0, 23.0, 29.0, 6.0, 16.0, 13.0, 1.0, 5.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.093514442443848, -8.785726547241211, -8.477937698364258, -8.170149803161621, -7.862361907958984, -7.5545735359191895, -7.2467851638793945, -6.938997268676758, -6.631208896636963, -6.323420524597168, -6.015632629394531, -5.707844257354736, -5.400055885314941, -5.092267990112305, -4.78447961807251, -4.476691246032715, -4.168903350830078, -3.8611152172088623, -3.5533270835876465, -3.2455387115478516, -2.9377505779266357, -2.62996244430542, -2.322174072265625, -2.014385938644409, -1.7065978050231934, -1.3988096714019775, -1.0910214185714722, -0.7832332253456116, -0.475445032119751, -0.16765689849853516, 0.14013135433197021, 0.4479196071624756, 0.755706787109375, 1.0634949207305908, 1.3712831735610962, 1.6790714263916016, 1.9868595600128174, 2.294647693634033, 2.602436065673828, 2.910224199295044, 3.2180123329162598, 3.5258004665374756, 3.8335886001586914, 4.141376972198486, 4.449165344238281, 4.756953239440918, 5.064741611480713, 5.372529983520508, 5.6803178787231445, 5.9881062507629395, 6.295894145965576, 6.603682518005371, 6.911470413208008, 7.219258785247803, 7.527047157287598, 7.834835052490234, 8.142623901367188, 8.450411796569824, 8.758200645446777, 9.065988540649414, 9.37377643585205, 9.681564331054688, 9.98935317993164, 10.297141075134277, 10.604928970336914]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 12.0, 21.0, 24.0, 44.0, 55.0, 97.0, 160.0, 246.0, 492.0, 945.0, 2138.0, 6045.0, 24222.0, 210962.0, 3770284.0, 148504.0, 19677.0, 5401.0, 2247.0, 1092.0, 545.0, 313.0, 222.0, 131.0, 99.0, 72.0, 63.0, 37.0, 15.0, 24.0, 12.0, 11.0, 8.0, 10.0, 11.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3251953125, -1.2731170654296875, -1.221038818359375, -1.1689605712890625, -1.11688232421875, -1.0648040771484375, -1.012725830078125, -0.9606475830078125, -0.9085693359375, -0.8564910888671875, -0.804412841796875, -0.7523345947265625, -0.70025634765625, -0.6481781005859375, -0.596099853515625, -0.5440216064453125, -0.491943359375, -0.4398651123046875, -0.387786865234375, -0.3357086181640625, -0.28363037109375, -0.2315521240234375, -0.179473876953125, -0.1273956298828125, -0.0753173828125, -0.0232391357421875, 0.028839111328125, 0.0809173583984375, 0.13299560546875, 0.1850738525390625, 0.237152099609375, 0.2892303466796875, 0.34130859375, 0.3933868408203125, 0.445465087890625, 0.4975433349609375, 0.54962158203125, 0.6016998291015625, 0.653778076171875, 0.7058563232421875, 0.7579345703125, 0.8100128173828125, 0.862091064453125, 0.9141693115234375, 0.96624755859375, 1.0183258056640625, 1.070404052734375, 1.1224822998046875, 1.174560546875, 1.2266387939453125, 1.278717041015625, 1.3307952880859375, 1.38287353515625, 1.4349517822265625, 1.487030029296875, 1.5391082763671875, 1.5911865234375, 1.6432647705078125, 1.695343017578125, 1.7474212646484375, 1.79949951171875, 1.8515777587890625, 1.903656005859375, 1.9557342529296875, 2.0078125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 5.0, 5.0, 3.0, 17.0, 11.0, 16.0, 18.0, 28.0, 32.0, 48.0, 35.0, 68.0, 79.0, 61.0, 66.0, 90.0, 70.0, 70.0, 47.0, 52.0, 47.0, 36.0, 21.0, 25.0, 12.0, 4.0, 12.0, 6.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.350341796875, -0.3368797302246094, -0.32341766357421875, -0.3099555969238281, -0.2964935302734375, -0.2830314636230469, -0.26956939697265625, -0.2561073303222656, -0.242645263671875, -0.22918319702148438, -0.21572113037109375, -0.20225906372070312, -0.1887969970703125, -0.17533493041992188, -0.16187286376953125, -0.14841079711914062, -0.13494873046875, -0.12148666381835938, -0.10802459716796875, -0.09456253051757812, -0.0811004638671875, -0.06763839721679688, -0.05417633056640625, -0.040714263916015625, -0.027252197265625, -0.013790130615234375, -0.00032806396484375, 0.013134002685546875, 0.0265960693359375, 0.040058135986328125, 0.05352020263671875, 0.06698226928710938, 0.0804443359375, 0.09390640258789062, 0.10736846923828125, 0.12083053588867188, 0.1342926025390625, 0.14775466918945312, 0.16121673583984375, 0.17467880249023438, 0.188140869140625, 0.20160293579101562, 0.21506500244140625, 0.22852706909179688, 0.2419891357421875, 0.2554512023925781, 0.26891326904296875, 0.2823753356933594, 0.29583740234375, 0.3092994689941406, 0.32276153564453125, 0.3362236022949219, 0.3496856689453125, 0.3631477355957031, 0.37660980224609375, 0.3900718688964844, 0.403533935546875, 0.4169960021972656, 0.43045806884765625, 0.4439201354980469, 0.4573822021484375, 0.4708442687988281, 0.48430633544921875, 0.4977684020996094, 0.51123046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 14.0, 20.0, 29.0, 44.0, 61.0, 83.0, 144.0, 241.0, 358.0, 585.0, 1096.0, 1983.0, 4673.0, 14561.0, 89630.0, 3165541.0, 849492.0, 47032.0, 10171.0, 3874.0, 1859.0, 1085.0, 672.0, 380.0, 212.0, 114.0, 105.0, 66.0, 44.0, 30.0, 16.0, 21.0, 5.0, 5.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5048828125, -1.460418701171875, -1.41595458984375, -1.371490478515625, -1.3270263671875, -1.282562255859375, -1.23809814453125, -1.193634033203125, -1.149169921875, -1.104705810546875, -1.06024169921875, -1.015777587890625, -0.9713134765625, -0.926849365234375, -0.88238525390625, -0.837921142578125, -0.79345703125, -0.748992919921875, -0.70452880859375, -0.660064697265625, -0.6156005859375, -0.571136474609375, -0.52667236328125, -0.482208251953125, -0.437744140625, -0.393280029296875, -0.34881591796875, -0.304351806640625, -0.2598876953125, -0.215423583984375, -0.17095947265625, -0.126495361328125, -0.08203125, -0.037567138671875, 0.00689697265625, 0.051361083984375, 0.0958251953125, 0.140289306640625, 0.18475341796875, 0.229217529296875, 0.273681640625, 0.318145751953125, 0.36260986328125, 0.407073974609375, 0.4515380859375, 0.496002197265625, 0.54046630859375, 0.584930419921875, 0.62939453125, 0.673858642578125, 0.71832275390625, 0.762786865234375, 0.8072509765625, 0.851715087890625, 0.89617919921875, 0.940643310546875, 0.985107421875, 1.029571533203125, 1.07403564453125, 1.118499755859375, 1.1629638671875, 1.207427978515625, 1.25189208984375, 1.296356201171875, 1.3408203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 6.0, 9.0, 17.0, 30.0, 38.0, 78.0, 122.0, 336.0, 1121.0, 1453.0, 393.0, 210.0, 91.0, 63.0, 33.0, 18.0, 15.0, 5.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7724609375, -0.7504425048828125, -0.728424072265625, -0.7064056396484375, -0.68438720703125, -0.6623687744140625, -0.640350341796875, -0.6183319091796875, -0.5963134765625, -0.5742950439453125, -0.552276611328125, -0.5302581787109375, -0.50823974609375, -0.4862213134765625, -0.464202880859375, -0.4421844482421875, -0.420166015625, -0.3981475830078125, -0.376129150390625, -0.3541107177734375, -0.33209228515625, -0.3100738525390625, -0.288055419921875, -0.2660369873046875, -0.2440185546875, -0.2220001220703125, -0.199981689453125, -0.1779632568359375, -0.15594482421875, -0.1339263916015625, -0.111907958984375, -0.0898895263671875, -0.06787109375, -0.0458526611328125, -0.023834228515625, -0.0018157958984375, 0.02020263671875, 0.0422210693359375, 0.064239501953125, 0.0862579345703125, 0.1082763671875, 0.1302947998046875, 0.152313232421875, 0.1743316650390625, 0.19635009765625, 0.2183685302734375, 0.240386962890625, 0.2624053955078125, 0.284423828125, 0.3064422607421875, 0.328460693359375, 0.3504791259765625, 0.37249755859375, 0.3945159912109375, 0.416534423828125, 0.4385528564453125, 0.4605712890625, 0.4825897216796875, 0.504608154296875, 0.5266265869140625, 0.54864501953125, 0.5706634521484375, 0.592681884765625, 0.6147003173828125, 0.63671875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 19.0, 31.0, 48.0, 149.0, 216.0, 244.0, 152.0, 61.0, 41.0, 11.0, 11.0, 5.0, 2.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4701778888702393, -2.3156943321228027, -2.161210775375366, -2.0067272186279297, -1.8522435426712036, -1.697759985923767, -1.543276309967041, -1.3887927532196045, -1.234309196472168, -1.0798256397247314, -0.9253420233726501, -0.7708584070205688, -0.6163748502731323, -0.4618912935256958, -0.3074076771736145, -0.1529240608215332, 0.0015594959259033203, 0.15604308247566223, 0.31052666902542114, 0.46501025557518005, 0.619493842124939, 0.7739773988723755, 0.9284610152244568, 1.082944631576538, 1.2374281883239746, 1.3919117450714111, 1.5463953018188477, 1.7008789777755737, 1.8553625345230103, 2.0098462104797363, 2.164329767227173, 2.3188133239746094, 2.473296642303467, 2.6277801990509033, 2.78226375579834, 2.9367473125457764, 3.091230869293213, 3.2457146644592285, 3.400198221206665, 3.5546817779541016, 3.709165334701538, 3.8636488914489746, 4.01813268661499, 4.172616004943848, 4.327099800109863, 4.481583118438721, 4.636066913604736, 4.790550231933594, 4.945034027099609, 5.099517822265625, 5.254001140594482, 5.408484935760498, 5.5629682540893555, 5.717452049255371, 5.8719353675842285, 6.026419162750244, 6.180902481079102, 6.335386276245117, 6.489869594573975, 6.64435338973999, 6.798836708068848, 6.953320503234863, 7.107803821563721, 7.262287616729736, 7.416771411895752]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 7.0, 9.0, 23.0, 27.0, 27.0, 43.0, 60.0, 59.0, 56.0, 73.0, 76.0, 61.0, 75.0, 74.0, 70.0, 47.0, 46.0, 35.0, 32.0, 31.0, 17.0, 12.0, 16.0, 8.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6953272819519043, -2.60137677192688, -2.5074260234832764, -2.413475513458252, -2.3195250034332275, -2.225574493408203, -2.1316237449645996, -2.037673234939575, -1.9437227249145508, -1.8497720956802368, -1.7558215856552124, -1.6618709564208984, -1.567920446395874, -1.47396981716156, -1.380019187927246, -1.2860686779022217, -1.1921180486679077, -1.0981674194335938, -1.0042169094085693, -0.9102662801742554, -0.816315770149231, -0.722365140914917, -0.6284145712852478, -0.5344640016555786, -0.4405134320259094, -0.34656286239624023, -0.25261229276657104, -0.15866169333457947, -0.06471112370491028, 0.02923944592475891, 0.12319004535675049, 0.21714061498641968, 0.31109118461608887, 0.40504175424575806, 0.49899232387542725, 0.5929429531097412, 0.6868934631347656, 0.7808440923690796, 0.8747946619987488, 0.968745231628418, 1.0626957416534424, 1.1566463708877563, 1.2505968809127808, 1.3445475101470947, 1.4384980201721191, 1.532448649406433, 1.626399278640747, 1.7203497886657715, 1.8143004179000854, 1.9082510471343994, 2.002201557159424, 2.0961520671844482, 2.1901028156280518, 2.284053325653076, 2.3780038356781006, 2.471954345703125, 2.5659050941467285, 2.659855604171753, 2.7538063526153564, 2.847756862640381, 2.9417073726654053, 3.0356578826904297, 3.129608631134033, 3.2235591411590576, 3.317509651184082]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 13.0, 15.0, 13.0, 12.0, 23.0, 32.0, 44.0, 53.0, 113.0, 147.0, 178.0, 314.0, 522.0, 793.0, 1436.0, 2612.0, 5542.0, 14639.0, 48439.0, 177677.0, 426768.0, 259362.0, 73403.0, 21365.0, 7410.0, 3335.0, 1606.0, 955.0, 575.0, 380.0, 244.0, 140.0, 118.0, 84.0, 64.0, 31.0, 22.0, 18.0, 14.0, 10.0, 8.0, 7.0, 2.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0], "bins": [-1.3291015625, -1.2907562255859375, -1.252410888671875, -1.2140655517578125, -1.17572021484375, -1.1373748779296875, -1.099029541015625, -1.0606842041015625, -1.0223388671875, -0.9839935302734375, -0.945648193359375, -0.9073028564453125, -0.86895751953125, -0.8306121826171875, -0.792266845703125, -0.7539215087890625, -0.715576171875, -0.6772308349609375, -0.638885498046875, -0.6005401611328125, -0.56219482421875, -0.5238494873046875, -0.485504150390625, -0.4471588134765625, -0.4088134765625, -0.3704681396484375, -0.332122802734375, -0.2937774658203125, -0.25543212890625, -0.2170867919921875, -0.178741455078125, -0.1403961181640625, -0.10205078125, -0.0637054443359375, -0.025360107421875, 0.0129852294921875, 0.05133056640625, 0.0896759033203125, 0.128021240234375, 0.1663665771484375, 0.2047119140625, 0.2430572509765625, 0.281402587890625, 0.3197479248046875, 0.35809326171875, 0.3964385986328125, 0.434783935546875, 0.4731292724609375, 0.511474609375, 0.5498199462890625, 0.588165283203125, 0.6265106201171875, 0.66485595703125, 0.7032012939453125, 0.741546630859375, 0.7798919677734375, 0.8182373046875, 0.8565826416015625, 0.894927978515625, 0.9332733154296875, 0.97161865234375, 1.0099639892578125, 1.048309326171875, 1.0866546630859375, 1.125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 4.0, 5.0, 13.0, 14.0, 16.0, 20.0, 21.0, 35.0, 38.0, 61.0, 65.0, 67.0, 79.0, 81.0, 82.0, 64.0, 67.0, 58.0, 46.0, 44.0, 33.0, 25.0, 17.0, 11.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3759765625, -0.36196136474609375, -0.3479461669921875, -0.33393096923828125, -0.319915771484375, -0.30590057373046875, -0.2918853759765625, -0.27787017822265625, -0.26385498046875, -0.24983978271484375, -0.2358245849609375, -0.22180938720703125, -0.207794189453125, -0.19377899169921875, -0.1797637939453125, -0.16574859619140625, -0.1517333984375, -0.13771820068359375, -0.1237030029296875, -0.10968780517578125, -0.095672607421875, -0.08165740966796875, -0.0676422119140625, -0.05362701416015625, -0.03961181640625, -0.02559661865234375, -0.0115814208984375, 0.00243377685546875, 0.016448974609375, 0.03046417236328125, 0.0444793701171875, 0.05849456787109375, 0.072509765625, 0.08652496337890625, 0.1005401611328125, 0.11455535888671875, 0.128570556640625, 0.14258575439453125, 0.1566009521484375, 0.17061614990234375, 0.18463134765625, 0.19864654541015625, 0.2126617431640625, 0.22667694091796875, 0.240692138671875, 0.25470733642578125, 0.2687225341796875, 0.28273773193359375, 0.2967529296875, 0.31076812744140625, 0.3247833251953125, 0.33879852294921875, 0.352813720703125, 0.36682891845703125, 0.3808441162109375, 0.39485931396484375, 0.40887451171875, 0.42288970947265625, 0.4369049072265625, 0.45092010498046875, 0.464935302734375, 0.47895050048828125, 0.4929656982421875, 0.5069808959960938, 0.52099609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 5.0, 3.0, 9.0, 11.0, 10.0, 15.0, 25.0, 27.0, 30.0, 46.0, 84.0, 105.0, 156.0, 225.0, 383.0, 659.0, 1262.0, 3087.0, 8431.0, 28549.0, 103784.0, 303665.0, 374612.0, 158732.0, 44222.0, 12630.0, 4076.0, 1615.0, 757.0, 449.0, 262.0, 168.0, 124.0, 90.0, 62.0, 47.0, 36.0, 34.0, 16.0, 16.0, 12.0, 8.0, 6.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.009765625, -0.9763031005859375, -0.942840576171875, -0.9093780517578125, -0.87591552734375, -0.8424530029296875, -0.808990478515625, -0.7755279541015625, -0.7420654296875, -0.7086029052734375, -0.675140380859375, -0.6416778564453125, -0.60821533203125, -0.5747528076171875, -0.541290283203125, -0.5078277587890625, -0.474365234375, -0.4409027099609375, -0.407440185546875, -0.3739776611328125, -0.34051513671875, -0.3070526123046875, -0.273590087890625, -0.2401275634765625, -0.2066650390625, -0.1732025146484375, -0.139739990234375, -0.1062774658203125, -0.07281494140625, -0.0393524169921875, -0.005889892578125, 0.0275726318359375, 0.06103515625, 0.0944976806640625, 0.127960205078125, 0.1614227294921875, 0.19488525390625, 0.2283477783203125, 0.261810302734375, 0.2952728271484375, 0.3287353515625, 0.3621978759765625, 0.395660400390625, 0.4291229248046875, 0.46258544921875, 0.4960479736328125, 0.529510498046875, 0.5629730224609375, 0.596435546875, 0.6298980712890625, 0.663360595703125, 0.6968231201171875, 0.73028564453125, 0.7637481689453125, 0.797210693359375, 0.8306732177734375, 0.8641357421875, 0.8975982666015625, 0.931060791015625, 0.9645233154296875, 0.99798583984375, 1.0314483642578125, 1.064910888671875, 1.0983734130859375, 1.1318359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 8.0, 6.0, 6.0, 8.0, 16.0, 23.0, 23.0, 22.0, 30.0, 26.0, 40.0, 61.0, 31.0, 56.0, 55.0, 61.0, 63.0, 56.0, 48.0, 48.0, 38.0, 38.0, 39.0, 32.0, 28.0, 14.0, 27.0, 17.0, 21.0, 12.0, 11.0, 12.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5830078125, -1.530517578125, -1.47802734375, -1.425537109375, -1.373046875, -1.320556640625, -1.26806640625, -1.215576171875, -1.1630859375, -1.110595703125, -1.05810546875, -1.005615234375, -0.953125, -0.900634765625, -0.84814453125, -0.795654296875, -0.7431640625, -0.690673828125, -0.63818359375, -0.585693359375, -0.533203125, -0.480712890625, -0.42822265625, -0.375732421875, -0.3232421875, -0.270751953125, -0.21826171875, -0.165771484375, -0.11328125, -0.060791015625, -0.00830078125, 0.044189453125, 0.0966796875, 0.149169921875, 0.20166015625, 0.254150390625, 0.306640625, 0.359130859375, 0.41162109375, 0.464111328125, 0.5166015625, 0.569091796875, 0.62158203125, 0.674072265625, 0.7265625, 0.779052734375, 0.83154296875, 0.884033203125, 0.9365234375, 0.989013671875, 1.04150390625, 1.093994140625, 1.146484375, 1.198974609375, 1.25146484375, 1.303955078125, 1.3564453125, 1.408935546875, 1.46142578125, 1.513916015625, 1.56640625, 1.618896484375, 1.67138671875, 1.723876953125, 1.7763671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 7.0, 10.0, 11.0, 16.0, 29.0, 46.0, 66.0, 128.0, 247.0, 736.0, 2495.0, 15205.0, 267663.0, 718292.0, 37031.0, 4702.0, 1127.0, 340.0, 177.0, 76.0, 45.0, 29.0, 17.0, 14.0, 7.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.8043975830078125, -0.774810791015625, -0.7452239990234375, -0.71563720703125, -0.6860504150390625, -0.656463623046875, -0.6268768310546875, -0.5972900390625, -0.5677032470703125, -0.538116455078125, -0.5085296630859375, -0.47894287109375, -0.4493560791015625, -0.419769287109375, -0.3901824951171875, -0.360595703125, -0.3310089111328125, -0.301422119140625, -0.2718353271484375, -0.24224853515625, -0.2126617431640625, -0.183074951171875, -0.1534881591796875, -0.1239013671875, -0.0943145751953125, -0.064727783203125, -0.0351409912109375, -0.00555419921875, 0.0240325927734375, 0.053619384765625, 0.0832061767578125, 0.11279296875, 0.1423797607421875, 0.171966552734375, 0.2015533447265625, 0.23114013671875, 0.2607269287109375, 0.290313720703125, 0.3199005126953125, 0.3494873046875, 0.3790740966796875, 0.408660888671875, 0.4382476806640625, 0.46783447265625, 0.4974212646484375, 0.527008056640625, 0.5565948486328125, 0.586181640625, 0.6157684326171875, 0.645355224609375, 0.6749420166015625, 0.70452880859375, 0.7341156005859375, 0.763702392578125, 0.7932891845703125, 0.8228759765625, 0.8524627685546875, 0.882049560546875, 0.9116363525390625, 0.94122314453125, 0.9708099365234375, 1.000396728515625, 1.0299835205078125, 1.0595703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 6.0, 6.0, 2.0, 10.0, 7.0, 18.0, 22.0, 25.0, 31.0, 37.0, 57.0, 74.0, 109.0, 143.0, 117.0, 99.0, 60.0, 47.0, 36.0, 20.0, 18.0, 15.0, 10.0, 5.0, 7.0, 7.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00010329484939575195, -9.942706674337387e-05, -9.555928409099579e-05, -9.16915014386177e-05, -8.782371878623962e-05, -8.395593613386154e-05, -8.008815348148346e-05, -7.622037082910538e-05, -7.23525881767273e-05, -6.848480552434921e-05, -6.461702287197113e-05, -6.074924021959305e-05, -5.6881457567214966e-05, -5.3013674914836884e-05, -4.91458922624588e-05, -4.527810961008072e-05, -4.141032695770264e-05, -3.7542544305324554e-05, -3.367476165294647e-05, -2.980697900056839e-05, -2.5939196348190308e-05, -2.2071413695812225e-05, -1.8203631043434143e-05, -1.433584839105606e-05, -1.0468065738677979e-05, -6.600283086299896e-06, -2.732500433921814e-06, 1.1352822184562683e-06, 5.003064870834351e-06, 8.870847523212433e-06, 1.2738630175590515e-05, 1.6606412827968597e-05, 2.047419548034668e-05, 2.4341978132724762e-05, 2.8209760785102844e-05, 3.2077543437480927e-05, 3.594532608985901e-05, 3.981310874223709e-05, 4.368089139461517e-05, 4.7548674046993256e-05, 5.141645669937134e-05, 5.528423935174942e-05, 5.91520220041275e-05, 6.301980465650558e-05, 6.688758730888367e-05, 7.075536996126175e-05, 7.462315261363983e-05, 7.849093526601791e-05, 8.2358717918396e-05, 8.622650057077408e-05, 9.009428322315216e-05, 9.396206587553024e-05, 9.782984852790833e-05, 0.00010169763118028641, 0.00010556541383266449, 0.00010943319648504257, 0.00011330097913742065, 0.00011716876178979874, 0.00012103654444217682, 0.0001249043270945549, 0.00012877210974693298, 0.00013263989239931107, 0.00013650767505168915, 0.00014037545770406723, 0.0001442432403564453]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 0.0, 5.0, 9.0, 7.0, 8.0, 25.0, 31.0, 51.0, 70.0, 93.0, 186.0, 369.0, 838.0, 2074.0, 6469.0, 35305.0, 533126.0, 431419.0, 29234.0, 5699.0, 1892.0, 812.0, 324.0, 192.0, 122.0, 73.0, 31.0, 28.0, 11.0, 9.0, 8.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71533203125, -0.6906280517578125, -0.665924072265625, -0.6412200927734375, -0.61651611328125, -0.5918121337890625, -0.567108154296875, -0.5424041748046875, -0.5177001953125, -0.4929962158203125, -0.468292236328125, -0.4435882568359375, -0.41888427734375, -0.3941802978515625, -0.369476318359375, -0.3447723388671875, -0.320068359375, -0.2953643798828125, -0.270660400390625, -0.2459564208984375, -0.22125244140625, -0.1965484619140625, -0.171844482421875, -0.1471405029296875, -0.1224365234375, -0.0977325439453125, -0.073028564453125, -0.0483245849609375, -0.02362060546875, 0.0010833740234375, 0.025787353515625, 0.0504913330078125, 0.0751953125, 0.0998992919921875, 0.124603271484375, 0.1493072509765625, 0.17401123046875, 0.1987152099609375, 0.223419189453125, 0.2481231689453125, 0.2728271484375, 0.2975311279296875, 0.322235107421875, 0.3469390869140625, 0.37164306640625, 0.3963470458984375, 0.421051025390625, 0.4457550048828125, 0.470458984375, 0.4951629638671875, 0.519866943359375, 0.5445709228515625, 0.56927490234375, 0.5939788818359375, 0.618682861328125, 0.6433868408203125, 0.6680908203125, 0.6927947998046875, 0.717498779296875, 0.7422027587890625, 0.76690673828125, 0.7916107177734375, 0.816314697265625, 0.8410186767578125, 0.86572265625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 8.0, 19.0, 39.0, 59.0, 95.0, 154.0, 177.0, 181.0, 88.0, 76.0, 41.0, 20.0, 10.0, 11.0, 4.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89697265625, -0.871795654296875, -0.84661865234375, -0.821441650390625, -0.7962646484375, -0.771087646484375, -0.74591064453125, -0.720733642578125, -0.695556640625, -0.670379638671875, -0.64520263671875, -0.620025634765625, -0.5948486328125, -0.569671630859375, -0.54449462890625, -0.519317626953125, -0.494140625, -0.468963623046875, -0.44378662109375, -0.418609619140625, -0.3934326171875, -0.368255615234375, -0.34307861328125, -0.317901611328125, -0.292724609375, -0.267547607421875, -0.24237060546875, -0.217193603515625, -0.1920166015625, -0.166839599609375, -0.14166259765625, -0.116485595703125, -0.09130859375, -0.066131591796875, -0.04095458984375, -0.015777587890625, 0.0093994140625, 0.034576416015625, 0.05975341796875, 0.084930419921875, 0.110107421875, 0.135284423828125, 0.16046142578125, 0.185638427734375, 0.2108154296875, 0.235992431640625, 0.26116943359375, 0.286346435546875, 0.3115234375, 0.336700439453125, 0.36187744140625, 0.387054443359375, 0.4122314453125, 0.437408447265625, 0.46258544921875, 0.487762451171875, 0.512939453125, 0.538116455078125, 0.56329345703125, 0.588470458984375, 0.6136474609375, 0.638824462890625, 0.66400146484375, 0.689178466796875, 0.71435546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 14.0, 17.0, 21.0, 33.0, 64.0, 119.0, 155.0, 162.0, 148.0, 111.0, 69.0, 33.0, 25.0, 13.0, 4.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.415001392364502, -6.130497932434082, -5.845994472503662, -5.561491012573242, -5.276987075805664, -4.992484092712402, -4.707980155944824, -4.423476696014404, -4.138973236083984, -3.8544697761535645, -3.5699663162231445, -3.2854626178741455, -3.0009591579437256, -2.7164556980133057, -2.4319519996643066, -2.1474485397338867, -1.8629450798034668, -1.5784416198730469, -1.2939380407333374, -1.009434461593628, -0.724931001663208, -0.4404275417327881, -0.1559239625930786, 0.12857961654663086, 0.4130830764770508, 0.6975865960121155, 0.9820901155471802, 1.2665936946868896, 1.5510971546173096, 1.8356006145477295, 2.1201043128967285, 2.4046077728271484, 2.68911075592041, 2.97361421585083, 3.25811767578125, 3.542621374130249, 3.827124834060669, 4.111628532409668, 4.396131992340088, 4.680635452270508, 4.965138912200928, 5.249642372131348, 5.534145832061768, 5.8186492919921875, 6.103153228759766, 6.387656211853027, 6.6721601486206055, 6.956663608551025, 7.241167068481445, 7.525670528411865, 7.810173988342285, 8.094677925109863, 8.379180908203125, 8.663684844970703, 8.948187828063965, 9.232691764831543, 9.517194747924805, 9.801698684692383, 10.086201667785645, 10.370705604553223, 10.655208587646484, 10.939712524414062, 11.224215507507324, 11.508719444274902, 11.79322338104248]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 11.0, 10.0, 7.0, 8.0, 10.0, 18.0, 19.0, 16.0, 25.0, 22.0, 28.0, 35.0, 39.0, 42.0, 37.0, 47.0, 43.0, 42.0, 48.0, 48.0, 52.0, 48.0, 51.0, 36.0, 33.0, 33.0, 30.0, 20.0, 20.0, 18.0, 25.0, 23.0, 10.0, 5.0, 13.0, 10.0, 3.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.0203375816345215, -6.75600528717041, -6.491673469543457, -6.227341175079346, -5.963009357452393, -5.698677062988281, -5.434345245361328, -5.170012950897217, -4.9056806564331055, -4.641348361968994, -4.377016544342041, -4.11268424987793, -3.8483524322509766, -3.5840201377868652, -3.319688081741333, -3.055356025695801, -2.7910242080688477, -2.5266921520233154, -2.262360095977783, -1.9980279207229614, -1.7336958646774292, -1.469363808631897, -1.2050316333770752, -0.940699577331543, -0.6763675212860107, -0.41203543543815613, -0.1477033495903015, 0.11662876605987549, 0.3809608221054077, 0.6452928781509399, 0.9096250534057617, 1.173957109451294, 1.438288688659668, 1.7026207447052002, 1.9669528007507324, 2.2312850952148438, 2.495616912841797, 2.759949207305908, 3.0242812633514404, 3.2886133193969727, 3.552945375442505, 3.817277431488037, 4.081609725952148, 4.345941543579102, 4.610273838043213, 4.874605655670166, 5.138937950134277, 5.4032697677612305, 5.667602062225342, 5.931934356689453, 6.196266174316406, 6.460598468780518, 6.724930286407471, 6.989262580871582, 7.253594398498535, 7.5179266929626465, 7.782258987426758, 8.046590805053711, 8.31092357635498, 8.575255393981934, 8.839587211608887, 9.10391902923584, 9.36825180053711, 9.632583618164062, 9.896915435791016]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 9.0, 17.0, 17.0, 18.0, 31.0, 33.0, 43.0, 66.0, 140.0, 212.0, 342.0, 750.0, 1750.0, 4979.0, 18685.0, 134458.0, 3876131.0, 129335.0, 18198.0, 5058.0, 1844.0, 801.0, 461.0, 276.0, 168.0, 135.0, 74.0, 52.0, 47.0, 35.0, 24.0, 14.0, 15.0, 15.0, 8.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.36328125, -1.3170623779296875, -1.270843505859375, -1.2246246337890625, -1.17840576171875, -1.1321868896484375, -1.085968017578125, -1.0397491455078125, -0.9935302734375, -0.9473114013671875, -0.901092529296875, -0.8548736572265625, -0.80865478515625, -0.7624359130859375, -0.716217041015625, -0.6699981689453125, -0.623779296875, -0.5775604248046875, -0.531341552734375, -0.4851226806640625, -0.43890380859375, -0.3926849365234375, -0.346466064453125, -0.3002471923828125, -0.2540283203125, -0.2078094482421875, -0.161590576171875, -0.1153717041015625, -0.06915283203125, -0.0229339599609375, 0.023284912109375, 0.0695037841796875, 0.11572265625, 0.1619415283203125, 0.208160400390625, 0.2543792724609375, 0.30059814453125, 0.3468170166015625, 0.393035888671875, 0.4392547607421875, 0.4854736328125, 0.5316925048828125, 0.577911376953125, 0.6241302490234375, 0.67034912109375, 0.7165679931640625, 0.762786865234375, 0.8090057373046875, 0.855224609375, 0.9014434814453125, 0.947662353515625, 0.9938812255859375, 1.04010009765625, 1.0863189697265625, 1.132537841796875, 1.1787567138671875, 1.2249755859375, 1.2711944580078125, 1.317413330078125, 1.3636322021484375, 1.40985107421875, 1.4560699462890625, 1.502288818359375, 1.5485076904296875, 1.5947265625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 12.0, 10.0, 12.0, 21.0, 15.0, 28.0, 35.0, 35.0, 59.0, 48.0, 77.0, 66.0, 90.0, 77.0, 57.0, 45.0, 52.0, 61.0, 38.0, 42.0, 23.0, 19.0, 17.0, 12.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.347900390625, -0.3340034484863281, -0.32010650634765625, -0.3062095642089844, -0.2923126220703125, -0.2784156799316406, -0.26451873779296875, -0.2506217956542969, -0.236724853515625, -0.22282791137695312, -0.20893096923828125, -0.19503402709960938, -0.1811370849609375, -0.16724014282226562, -0.15334320068359375, -0.13944625854492188, -0.12554931640625, -0.11165237426757812, -0.09775543212890625, -0.08385848999023438, -0.0699615478515625, -0.056064605712890625, -0.04216766357421875, -0.028270721435546875, -0.014373779296875, -0.000476837158203125, 0.01342010498046875, 0.027317047119140625, 0.0412139892578125, 0.055110931396484375, 0.06900787353515625, 0.08290481567382812, 0.0968017578125, 0.11069869995117188, 0.12459564208984375, 0.13849258422851562, 0.1523895263671875, 0.16628646850585938, 0.18018341064453125, 0.19408035278320312, 0.207977294921875, 0.22187423706054688, 0.23577117919921875, 0.24966812133789062, 0.2635650634765625, 0.2774620056152344, 0.29135894775390625, 0.3052558898925781, 0.31915283203125, 0.3330497741699219, 0.34694671630859375, 0.3608436584472656, 0.3747406005859375, 0.3886375427246094, 0.40253448486328125, 0.4164314270019531, 0.430328369140625, 0.4442253112792969, 0.45812225341796875, 0.4720191955566406, 0.4859161376953125, 0.4998130798339844, 0.5137100219726562, 0.5276069641113281, 0.54150390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 2.0, 13.0, 3.0, 19.0, 24.0, 45.0, 64.0, 106.0, 161.0, 345.0, 733.0, 1891.0, 5974.0, 24055.0, 171662.0, 3668422.0, 278203.0, 31624.0, 7225.0, 2112.0, 806.0, 357.0, 148.0, 105.0, 50.0, 43.0, 30.0, 19.0, 15.0, 9.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3896484375, -1.3526763916015625, -1.315704345703125, -1.2787322998046875, -1.24176025390625, -1.2047882080078125, -1.167816162109375, -1.1308441162109375, -1.0938720703125, -1.0569000244140625, -1.019927978515625, -0.9829559326171875, -0.94598388671875, -0.9090118408203125, -0.872039794921875, -0.8350677490234375, -0.798095703125, -0.7611236572265625, -0.724151611328125, -0.6871795654296875, -0.65020751953125, -0.6132354736328125, -0.576263427734375, -0.5392913818359375, -0.5023193359375, -0.4653472900390625, -0.428375244140625, -0.3914031982421875, -0.35443115234375, -0.3174591064453125, -0.280487060546875, -0.2435150146484375, -0.20654296875, -0.1695709228515625, -0.132598876953125, -0.0956268310546875, -0.05865478515625, -0.0216827392578125, 0.015289306640625, 0.0522613525390625, 0.0892333984375, 0.1262054443359375, 0.163177490234375, 0.2001495361328125, 0.23712158203125, 0.2740936279296875, 0.311065673828125, 0.3480377197265625, 0.385009765625, 0.4219818115234375, 0.458953857421875, 0.4959259033203125, 0.53289794921875, 0.5698699951171875, 0.606842041015625, 0.6438140869140625, 0.6807861328125, 0.7177581787109375, 0.754730224609375, 0.7917022705078125, 0.82867431640625, 0.8656463623046875, 0.902618408203125, 0.9395904541015625, 0.9765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 0.0, 8.0, 8.0, 8.0, 20.0, 20.0, 42.0, 69.0, 141.0, 283.0, 1161.0, 1646.0, 357.0, 138.0, 67.0, 39.0, 24.0, 16.0, 9.0, 9.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66357421875, -0.6461524963378906, -0.6287307739257812, -0.6113090515136719, -0.5938873291015625, -0.5764656066894531, -0.5590438842773438, -0.5416221618652344, -0.524200439453125, -0.5067787170410156, -0.48935699462890625, -0.4719352722167969, -0.4545135498046875, -0.4370918273925781, -0.41967010498046875, -0.4022483825683594, -0.38482666015625, -0.3674049377441406, -0.34998321533203125, -0.3325614929199219, -0.3151397705078125, -0.2977180480957031, -0.28029632568359375, -0.2628746032714844, -0.245452880859375, -0.22803115844726562, -0.21060943603515625, -0.19318771362304688, -0.1757659912109375, -0.15834426879882812, -0.14092254638671875, -0.12350082397460938, -0.1060791015625, -0.08865737915039062, -0.07123565673828125, -0.053813934326171875, -0.0363922119140625, -0.018970489501953125, -0.00154876708984375, 0.015872955322265625, 0.033294677734375, 0.050716400146484375, 0.06813812255859375, 0.08555984497070312, 0.1029815673828125, 0.12040328979492188, 0.13782501220703125, 0.15524673461914062, 0.17266845703125, 0.19009017944335938, 0.20751190185546875, 0.22493362426757812, 0.2423553466796875, 0.2597770690917969, 0.27719879150390625, 0.2946205139160156, 0.312042236328125, 0.3294639587402344, 0.34688568115234375, 0.3643074035644531, 0.3817291259765625, 0.3991508483886719, 0.41657257080078125, 0.4339942932128906, 0.451416015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 47.0, 219.0, 528.0, 190.0, 21.0, 6.0, 0.0, 0.0, 2.0], "bins": [-15.284835815429688, -15.018941879272461, -14.75304889678955, -14.487154960632324, -14.221261024475098, -13.955368041992188, -13.689474105834961, -13.423580169677734, -13.157687187194824, -12.891793251037598, -12.625900268554688, -12.360006332397461, -12.094112396240234, -11.828219413757324, -11.562325477600098, -11.296431541442871, -11.030538558959961, -10.764644622802734, -10.498751640319824, -10.232857704162598, -9.966963768005371, -9.701070785522461, -9.435176849365234, -9.169282913208008, -8.903388977050781, -8.637495040893555, -8.371602058410645, -8.105708122253418, -7.83981466293335, -7.573921203613281, -7.308027267456055, -7.042133808135986, -6.776240825653076, -6.510347366333008, -6.244453430175781, -5.978559970855713, -5.7126665115356445, -5.446772575378418, -5.18087911605835, -4.914985656738281, -4.649091720581055, -4.383198261260986, -4.11730432510376, -3.8514108657836914, -3.585517406463623, -3.3196237087249756, -3.053730010986328, -2.7878365516662598, -2.5219430923461914, -2.256049394607544, -1.9901559352874756, -1.7242622375488281, -1.4583686590194702, -1.1924750804901123, -0.9265813827514648, -0.6606878042221069, -0.394794225692749, -0.12890061736106873, 0.13699299097061157, 0.40288662910461426, 0.6687802076339722, 0.9346737861633301, 1.2005674839019775, 1.4664610624313354, 1.7323546409606934]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 12.0, 12.0, 14.0, 13.0, 26.0, 23.0, 30.0, 32.0, 33.0, 27.0, 60.0, 38.0, 37.0, 51.0, 48.0, 59.0, 63.0, 45.0, 50.0, 48.0, 38.0, 34.0, 38.0, 29.0, 16.0, 26.0, 13.0, 11.0, 12.0, 10.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.3984137773513794, -1.3566186428070068, -1.3148235082626343, -1.2730283737182617, -1.2312331199645996, -1.189437985420227, -1.1476428508758545, -1.105847716331482, -1.0640525817871094, -1.0222574472427368, -0.9804623126983643, -0.9386671185493469, -0.8968719840049744, -0.8550768494606018, -0.8132816553115845, -0.7714865207672119, -0.7296913862228394, -0.6878962516784668, -0.6461011171340942, -0.6043059229850769, -0.5625107884407043, -0.5207156538963318, -0.47892048954963684, -0.4371253252029419, -0.39533019065856934, -0.3535350561141968, -0.31173989176750183, -0.2699447274208069, -0.22814959287643433, -0.18635444343090057, -0.14455929398536682, -0.10276412963867188, -0.06096911430358887, -0.019173964858055115, 0.022621184587478638, 0.06441633403301239, 0.10621148347854614, 0.1480066329240799, 0.18980178236961365, 0.2315969467163086, 0.27339208126068115, 0.3151872158050537, 0.35698238015174866, 0.3987775444984436, 0.44057267904281616, 0.4823678135871887, 0.524163007736206, 0.5659581422805786, 0.6077532768249512, 0.6495484113693237, 0.6913435459136963, 0.7331387400627136, 0.7749338746070862, 0.8167290091514587, 0.8585242033004761, 0.9003193378448486, 0.9421144723892212, 0.9839096069335938, 1.0257047414779663, 1.0674998760223389, 1.109295129776001, 1.1510902643203735, 1.192885398864746, 1.2346805334091187, 1.2764756679534912]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 12.0, 10.0, 23.0, 16.0, 25.0, 45.0, 53.0, 106.0, 133.0, 176.0, 265.0, 413.0, 653.0, 1073.0, 1956.0, 3928.0, 8954.0, 23836.0, 69683.0, 208728.0, 377571.0, 228307.0, 77346.0, 25965.0, 10082.0, 4110.0, 2023.0, 1142.0, 692.0, 411.0, 274.0, 170.0, 113.0, 85.0, 55.0, 38.0, 24.0, 14.0, 14.0, 8.0, 9.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.9595489501953125, -0.925933837890625, -0.8923187255859375, -0.85870361328125, -0.8250885009765625, -0.791473388671875, -0.7578582763671875, -0.7242431640625, -0.6906280517578125, -0.657012939453125, -0.6233978271484375, -0.58978271484375, -0.5561676025390625, -0.522552490234375, -0.4889373779296875, -0.455322265625, -0.4217071533203125, -0.388092041015625, -0.3544769287109375, -0.32086181640625, -0.2872467041015625, -0.253631591796875, -0.2200164794921875, -0.1864013671875, -0.1527862548828125, -0.119171142578125, -0.0855560302734375, -0.05194091796875, -0.0183258056640625, 0.015289306640625, 0.0489044189453125, 0.08251953125, 0.1161346435546875, 0.149749755859375, 0.1833648681640625, 0.21697998046875, 0.2505950927734375, 0.284210205078125, 0.3178253173828125, 0.3514404296875, 0.3850555419921875, 0.418670654296875, 0.4522857666015625, 0.48590087890625, 0.5195159912109375, 0.553131103515625, 0.5867462158203125, 0.620361328125, 0.6539764404296875, 0.687591552734375, 0.7212066650390625, 0.75482177734375, 0.7884368896484375, 0.822052001953125, 0.8556671142578125, 0.8892822265625, 0.9228973388671875, 0.956512451171875, 0.9901275634765625, 1.02374267578125, 1.0573577880859375, 1.090972900390625, 1.1245880126953125, 1.158203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 12.0, 13.0, 15.0, 24.0, 21.0, 25.0, 45.0, 47.0, 55.0, 77.0, 75.0, 84.0, 78.0, 58.0, 49.0, 54.0, 54.0, 51.0, 32.0, 29.0, 29.0, 12.0, 17.0, 8.0, 5.0, 1.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.34515380859375, -0.3309326171875, -0.31671142578125, -0.302490234375, -0.28826904296875, -0.2740478515625, -0.25982666015625, -0.24560546875, -0.23138427734375, -0.2171630859375, -0.20294189453125, -0.188720703125, -0.17449951171875, -0.1602783203125, -0.14605712890625, -0.1318359375, -0.11761474609375, -0.1033935546875, -0.08917236328125, -0.074951171875, -0.06072998046875, -0.0465087890625, -0.03228759765625, -0.01806640625, -0.00384521484375, 0.0103759765625, 0.02459716796875, 0.038818359375, 0.05303955078125, 0.0672607421875, 0.08148193359375, 0.095703125, 0.10992431640625, 0.1241455078125, 0.13836669921875, 0.152587890625, 0.16680908203125, 0.1810302734375, 0.19525146484375, 0.20947265625, 0.22369384765625, 0.2379150390625, 0.25213623046875, 0.266357421875, 0.28057861328125, 0.2947998046875, 0.30902099609375, 0.3232421875, 0.33746337890625, 0.3516845703125, 0.36590576171875, 0.380126953125, 0.39434814453125, 0.4085693359375, 0.42279052734375, 0.43701171875, 0.45123291015625, 0.4654541015625, 0.47967529296875, 0.493896484375, 0.50811767578125, 0.5223388671875, 0.53656005859375, 0.55078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 9.0, 10.0, 9.0, 19.0, 34.0, 26.0, 36.0, 55.0, 73.0, 105.0, 140.0, 171.0, 222.0, 327.0, 511.0, 810.0, 1449.0, 3503.0, 9864.0, 31181.0, 102400.0, 277113.0, 360150.0, 176226.0, 55645.0, 17252.0, 5776.0, 2216.0, 1081.0, 657.0, 409.0, 259.0, 204.0, 138.0, 119.0, 77.0, 76.0, 56.0, 37.0, 24.0, 18.0, 15.0, 13.0, 10.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8662109375, -0.8365936279296875, -0.806976318359375, -0.7773590087890625, -0.74774169921875, -0.7181243896484375, -0.688507080078125, -0.6588897705078125, -0.6292724609375, -0.5996551513671875, -0.570037841796875, -0.5404205322265625, -0.51080322265625, -0.4811859130859375, -0.451568603515625, -0.4219512939453125, -0.392333984375, -0.3627166748046875, -0.333099365234375, -0.3034820556640625, -0.27386474609375, -0.2442474365234375, -0.214630126953125, -0.1850128173828125, -0.1553955078125, -0.1257781982421875, -0.096160888671875, -0.0665435791015625, -0.03692626953125, -0.0073089599609375, 0.022308349609375, 0.0519256591796875, 0.08154296875, 0.1111602783203125, 0.140777587890625, 0.1703948974609375, 0.20001220703125, 0.2296295166015625, 0.259246826171875, 0.2888641357421875, 0.3184814453125, 0.3480987548828125, 0.377716064453125, 0.4073333740234375, 0.43695068359375, 0.4665679931640625, 0.496185302734375, 0.5258026123046875, 0.555419921875, 0.5850372314453125, 0.614654541015625, 0.6442718505859375, 0.67388916015625, 0.7035064697265625, 0.733123779296875, 0.7627410888671875, 0.7923583984375, 0.8219757080078125, 0.851593017578125, 0.8812103271484375, 0.91082763671875, 0.9404449462890625, 0.970062255859375, 0.9996795654296875, 1.029296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 5.0, 4.0, 13.0, 13.0, 16.0, 13.0, 18.0, 31.0, 27.0, 32.0, 22.0, 37.0, 45.0, 41.0, 45.0, 40.0, 49.0, 48.0, 47.0, 45.0, 43.0, 42.0, 31.0, 42.0, 35.0, 33.0, 22.0, 23.0, 17.0, 21.0, 16.0, 17.0, 16.0, 7.0, 9.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5751953125, -1.5287628173828125, -1.482330322265625, -1.4358978271484375, -1.38946533203125, -1.3430328369140625, -1.296600341796875, -1.2501678466796875, -1.2037353515625, -1.1573028564453125, -1.110870361328125, -1.0644378662109375, -1.01800537109375, -0.9715728759765625, -0.925140380859375, -0.8787078857421875, -0.832275390625, -0.7858428955078125, -0.739410400390625, -0.6929779052734375, -0.64654541015625, -0.6001129150390625, -0.553680419921875, -0.5072479248046875, -0.4608154296875, -0.4143829345703125, -0.367950439453125, -0.3215179443359375, -0.27508544921875, -0.2286529541015625, -0.182220458984375, -0.1357879638671875, -0.08935546875, -0.0429229736328125, 0.003509521484375, 0.0499420166015625, 0.09637451171875, 0.1428070068359375, 0.189239501953125, 0.2356719970703125, 0.2821044921875, 0.3285369873046875, 0.374969482421875, 0.4214019775390625, 0.46783447265625, 0.5142669677734375, 0.560699462890625, 0.6071319580078125, 0.653564453125, 0.6999969482421875, 0.746429443359375, 0.7928619384765625, 0.83929443359375, 0.8857269287109375, 0.932159423828125, 0.9785919189453125, 1.0250244140625, 1.0714569091796875, 1.117889404296875, 1.1643218994140625, 1.21075439453125, 1.2571868896484375, 1.303619384765625, 1.3500518798828125, 1.396484375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 0.0, 6.0, 13.0, 15.0, 15.0, 20.0, 39.0, 64.0, 141.0, 234.0, 581.0, 1440.0, 4336.0, 16742.0, 101798.0, 609424.0, 267163.0, 34956.0, 7667.0, 2294.0, 886.0, 359.0, 160.0, 78.0, 39.0, 27.0, 18.0, 8.0, 9.0, 12.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61328125, -0.5956192016601562, -0.5779571533203125, -0.5602951049804688, -0.542633056640625, -0.5249710083007812, -0.5073089599609375, -0.48964691162109375, -0.47198486328125, -0.45432281494140625, -0.4366607666015625, -0.41899871826171875, -0.401336669921875, -0.38367462158203125, -0.3660125732421875, -0.34835052490234375, -0.3306884765625, -0.31302642822265625, -0.2953643798828125, -0.27770233154296875, -0.260040283203125, -0.24237823486328125, -0.2247161865234375, -0.20705413818359375, -0.18939208984375, -0.17173004150390625, -0.1540679931640625, -0.13640594482421875, -0.118743896484375, -0.10108184814453125, -0.0834197998046875, -0.06575775146484375, -0.048095703125, -0.03043365478515625, -0.0127716064453125, 0.00489044189453125, 0.022552490234375, 0.04021453857421875, 0.0578765869140625, 0.07553863525390625, 0.09320068359375, 0.11086273193359375, 0.1285247802734375, 0.14618682861328125, 0.163848876953125, 0.18151092529296875, 0.1991729736328125, 0.21683502197265625, 0.2344970703125, 0.25215911865234375, 0.2698211669921875, 0.28748321533203125, 0.305145263671875, 0.32280731201171875, 0.3404693603515625, 0.35813140869140625, 0.37579345703125, 0.39345550537109375, 0.4111175537109375, 0.42877960205078125, 0.446441650390625, 0.46410369873046875, 0.4817657470703125, 0.49942779541015625, 0.51708984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 10.0, 1.0, 8.0, 7.0, 11.0, 6.0, 11.0, 11.0, 17.0, 24.0, 21.0, 34.0, 32.0, 30.0, 42.0, 59.0, 70.0, 80.0, 94.0, 73.0, 64.0, 55.0, 37.0, 43.0, 36.0, 26.0, 9.0, 16.0, 17.0, 9.0, 11.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00010138750076293945, -9.849760681390762e-05, -9.56077128648758e-05, -9.271781891584396e-05, -8.982792496681213e-05, -8.69380310177803e-05, -8.404813706874847e-05, -8.115824311971664e-05, -7.826834917068481e-05, -7.537845522165298e-05, -7.248856127262115e-05, -6.959866732358932e-05, -6.67087733745575e-05, -6.381887942552567e-05, -6.0928985476493835e-05, -5.8039091527462006e-05, -5.5149197578430176e-05, -5.2259303629398346e-05, -4.9369409680366516e-05, -4.6479515731334686e-05, -4.3589621782302856e-05, -4.0699727833271027e-05, -3.78098338842392e-05, -3.491993993520737e-05, -3.203004598617554e-05, -2.9140152037143707e-05, -2.6250258088111877e-05, -2.3360364139080048e-05, -2.0470470190048218e-05, -1.7580576241016388e-05, -1.4690682291984558e-05, -1.1800788342952728e-05, -8.910894393920898e-06, -6.021000444889069e-06, -3.1311064958572388e-06, -2.4121254682540894e-07, 2.648681402206421e-06, 5.538575351238251e-06, 8.42846930027008e-06, 1.131836324930191e-05, 1.420825719833374e-05, 1.709815114736557e-05, 1.99880450963974e-05, 2.287793904542923e-05, 2.576783299446106e-05, 2.865772694349289e-05, 3.154762089252472e-05, 3.443751484155655e-05, 3.732740879058838e-05, 4.021730273962021e-05, 4.310719668865204e-05, 4.599709063768387e-05, 4.88869845867157e-05, 5.177687853574753e-05, 5.466677248477936e-05, 5.755666643381119e-05, 6.044656038284302e-05, 6.333645433187485e-05, 6.622634828090668e-05, 6.911624222993851e-05, 7.200613617897034e-05, 7.489603012800217e-05, 7.7785924077034e-05, 8.067581802606583e-05, 8.356571197509766e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 7.0, 13.0, 10.0, 17.0, 33.0, 50.0, 56.0, 101.0, 151.0, 286.0, 438.0, 961.0, 2116.0, 5955.0, 22456.0, 131762.0, 652285.0, 190456.0, 29073.0, 7428.0, 2452.0, 1111.0, 546.0, 305.0, 173.0, 108.0, 55.0, 46.0, 30.0, 14.0, 19.0, 7.0, 5.0, 8.0, 5.0, 1.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.446533203125, -0.4290809631347656, -0.41162872314453125, -0.3941764831542969, -0.3767242431640625, -0.3592720031738281, -0.34181976318359375, -0.3243675231933594, -0.306915283203125, -0.2894630432128906, -0.27201080322265625, -0.2545585632324219, -0.2371063232421875, -0.21965408325195312, -0.20220184326171875, -0.18474960327148438, -0.16729736328125, -0.14984512329101562, -0.13239288330078125, -0.11494064331054688, -0.0974884033203125, -0.08003616333007812, -0.06258392333984375, -0.045131683349609375, -0.027679443359375, -0.010227203369140625, 0.00722503662109375, 0.024677276611328125, 0.0421295166015625, 0.059581756591796875, 0.07703399658203125, 0.09448623657226562, 0.1119384765625, 0.12939071655273438, 0.14684295654296875, 0.16429519653320312, 0.1817474365234375, 0.19919967651367188, 0.21665191650390625, 0.23410415649414062, 0.251556396484375, 0.2690086364746094, 0.28646087646484375, 0.3039131164550781, 0.3213653564453125, 0.3388175964355469, 0.35626983642578125, 0.3737220764160156, 0.39117431640625, 0.4086265563964844, 0.42607879638671875, 0.4435310363769531, 0.4609832763671875, 0.4784355163574219, 0.49588775634765625, 0.5133399963378906, 0.530792236328125, 0.5482444763183594, 0.5656967163085938, 0.5831489562988281, 0.6006011962890625, 0.6180534362792969, 0.6355056762695312, 0.6529579162597656, 0.67041015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 2.0, 5.0, 7.0, 9.0, 5.0, 23.0, 19.0, 24.0, 46.0, 71.0, 108.0, 118.0, 120.0, 122.0, 103.0, 62.0, 48.0, 28.0, 19.0, 14.0, 12.0, 9.0, 10.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.77734375, -0.7581253051757812, -0.7389068603515625, -0.7196884155273438, -0.700469970703125, -0.6812515258789062, -0.6620330810546875, -0.6428146362304688, -0.62359619140625, -0.6043777465820312, -0.5851593017578125, -0.5659408569335938, -0.546722412109375, -0.5275039672851562, -0.5082855224609375, -0.48906707763671875, -0.4698486328125, -0.45063018798828125, -0.4314117431640625, -0.41219329833984375, -0.392974853515625, -0.37375640869140625, -0.3545379638671875, -0.33531951904296875, -0.31610107421875, -0.29688262939453125, -0.2776641845703125, -0.25844573974609375, -0.239227294921875, -0.22000885009765625, -0.2007904052734375, -0.18157196044921875, -0.162353515625, -0.14313507080078125, -0.1239166259765625, -0.10469818115234375, -0.085479736328125, -0.06626129150390625, -0.0470428466796875, -0.02782440185546875, -0.00860595703125, 0.01061248779296875, 0.0298309326171875, 0.04904937744140625, 0.068267822265625, 0.08748626708984375, 0.1067047119140625, 0.12592315673828125, 0.1451416015625, 0.16436004638671875, 0.1835784912109375, 0.20279693603515625, 0.222015380859375, 0.24123382568359375, 0.2604522705078125, 0.27967071533203125, 0.29888916015625, 0.31810760498046875, 0.3373260498046875, 0.35654449462890625, 0.375762939453125, 0.39498138427734375, 0.4141998291015625, 0.43341827392578125, 0.45263671875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 12.0, 25.0, 45.0, 104.0, 157.0, 166.0, 184.0, 122.0, 78.0, 45.0, 29.0, 12.0, 8.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.880414962768555, -9.541049003601074, -9.201683044433594, -8.862316131591797, -8.522950172424316, -8.183584213256836, -7.8442182540893555, -7.504852294921875, -7.1654863357543945, -6.826120376586914, -6.486753940582275, -6.147387981414795, -5.8080220222473145, -5.468655586242676, -5.129289627075195, -4.789923667907715, -4.450557231903076, -4.111191272735596, -3.771825075149536, -3.4324588775634766, -3.093092918395996, -2.7537267208099365, -2.414360523223877, -2.0749945640563965, -1.735628366470337, -1.396262288093567, -1.0568962097167969, -0.7175300121307373, -0.3781639337539673, -0.038797855377197266, 0.3005683422088623, 0.6399343013763428, 0.9793004989624023, 1.3186665773391724, 1.6580326557159424, 1.997398853302002, 2.3367648124694824, 2.676131010055542, 3.0154972076416016, 3.354863166809082, 3.6942293643951416, 4.033595561981201, 4.372961521148682, 4.71232795715332, 5.051693916320801, 5.391059875488281, 5.730425834655762, 6.069791793823242, 6.409158229827881, 6.748524188995361, 7.087890625, 7.4272565841674805, 7.766622543334961, 8.105988502502441, 8.445354461669922, 8.784721374511719, 9.1240873336792, 9.46345329284668, 9.80281925201416, 10.14218521118164, 10.481552124023438, 10.820918083190918, 11.160284042358398, 11.499650001525879, 11.83901596069336]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 7.0, 9.0, 10.0, 12.0, 12.0, 12.0, 25.0, 15.0, 22.0, 15.0, 33.0, 32.0, 41.0, 36.0, 48.0, 36.0, 48.0, 40.0, 47.0, 53.0, 47.0, 43.0, 30.0, 48.0, 38.0, 25.0, 40.0, 22.0, 33.0, 18.0, 12.0, 17.0, 11.0, 11.0, 15.0, 10.0, 12.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.525279998779297, -9.243924140930176, -8.962568283081055, -8.681211471557617, -8.399855613708496, -8.118499755859375, -7.837143898010254, -7.555788040161133, -7.2744317054748535, -6.993075847625732, -6.711719512939453, -6.430363655090332, -6.149007797241211, -5.867651462554932, -5.5862956047058105, -5.304939270019531, -5.02358341217041, -4.742227554321289, -4.46087121963501, -4.179515361785889, -3.8981592655181885, -3.6168031692504883, -3.335447311401367, -3.054091215133667, -2.772735118865967, -2.4913790225982666, -2.2100229263305664, -1.9286670684814453, -1.6473109722137451, -1.365954875946045, -1.0845988988876343, -0.8032429218292236, -0.5218868255615234, -0.24053078889846802, 0.0408252477645874, 0.3221812844276428, 0.6035373210906982, 0.8848934173583984, 1.166249394416809, 1.4476053714752197, 1.72896146774292, 2.01031756401062, 2.2916736602783203, 2.5730295181274414, 2.8543856143951416, 3.135741710662842, 3.417097568511963, 3.698453664779663, 3.9798097610473633, 4.261165618896484, 4.542521953582764, 4.823877811431885, 5.105234146118164, 5.386590003967285, 5.667945861816406, 5.949301719665527, 6.230658054351807, 6.512013912200928, 6.793370246887207, 7.074726104736328, 7.356081962585449, 7.6374382972717285, 7.91879415512085, 8.200150489807129, 8.48150634765625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 9.0, 13.0, 22.0, 30.0, 38.0, 52.0, 91.0, 153.0, 319.0, 658.0, 1456.0, 4473.0, 20962.0, 259428.0, 3827416.0, 64192.0, 9831.0, 2658.0, 1049.0, 570.0, 326.0, 168.0, 117.0, 76.0, 43.0, 38.0, 28.0, 17.0, 6.0, 13.0, 4.0, 6.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.4889068603515625, -1.439727783203125, -1.3905487060546875, -1.34136962890625, -1.2921905517578125, -1.243011474609375, -1.1938323974609375, -1.1446533203125, -1.0954742431640625, -1.046295166015625, -0.9971160888671875, -0.94793701171875, -0.8987579345703125, -0.849578857421875, -0.8003997802734375, -0.751220703125, -0.7020416259765625, -0.652862548828125, -0.6036834716796875, -0.55450439453125, -0.5053253173828125, -0.456146240234375, -0.4069671630859375, -0.3577880859375, -0.3086090087890625, -0.259429931640625, -0.2102508544921875, -0.16107177734375, -0.1118927001953125, -0.062713623046875, -0.0135345458984375, 0.03564453125, 0.0848236083984375, 0.134002685546875, 0.1831817626953125, 0.23236083984375, 0.2815399169921875, 0.330718994140625, 0.3798980712890625, 0.4290771484375, 0.4782562255859375, 0.527435302734375, 0.5766143798828125, 0.62579345703125, 0.6749725341796875, 0.724151611328125, 0.7733306884765625, 0.822509765625, 0.8716888427734375, 0.920867919921875, 0.9700469970703125, 1.01922607421875, 1.0684051513671875, 1.117584228515625, 1.1667633056640625, 1.2159423828125, 1.2651214599609375, 1.314300537109375, 1.3634796142578125, 1.41265869140625, 1.4618377685546875, 1.511016845703125, 1.5601959228515625, 1.609375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 13.0, 15.0, 18.0, 22.0, 33.0, 35.0, 44.0, 64.0, 55.0, 70.0, 76.0, 77.0, 68.0, 56.0, 57.0, 66.0, 44.0, 45.0, 33.0, 25.0, 25.0, 12.0, 11.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45556640625, -0.43914794921875, -0.4227294921875, -0.40631103515625, -0.389892578125, -0.37347412109375, -0.3570556640625, -0.34063720703125, -0.32421875, -0.30780029296875, -0.2913818359375, -0.27496337890625, -0.258544921875, -0.24212646484375, -0.2257080078125, -0.20928955078125, -0.19287109375, -0.17645263671875, -0.1600341796875, -0.14361572265625, -0.127197265625, -0.11077880859375, -0.0943603515625, -0.07794189453125, -0.0615234375, -0.04510498046875, -0.0286865234375, -0.01226806640625, 0.004150390625, 0.02056884765625, 0.0369873046875, 0.05340576171875, 0.06982421875, 0.08624267578125, 0.1026611328125, 0.11907958984375, 0.135498046875, 0.15191650390625, 0.1683349609375, 0.18475341796875, 0.201171875, 0.21759033203125, 0.2340087890625, 0.25042724609375, 0.266845703125, 0.28326416015625, 0.2996826171875, 0.31610107421875, 0.33251953125, 0.34893798828125, 0.3653564453125, 0.38177490234375, 0.398193359375, 0.41461181640625, 0.4310302734375, 0.44744873046875, 0.4638671875, 0.48028564453125, 0.4967041015625, 0.51312255859375, 0.529541015625, 0.54595947265625, 0.5623779296875, 0.57879638671875, 0.59521484375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 14.0, 20.0, 28.0, 38.0, 59.0, 81.0, 193.0, 499.0, 1854.0, 8813.0, 88956.0, 3895505.0, 181483.0, 13207.0, 2440.0, 594.0, 236.0, 103.0, 55.0, 35.0, 21.0, 16.0, 13.0, 9.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16796875, -2.1145782470703125, -2.061187744140625, -2.0077972412109375, -1.95440673828125, -1.9010162353515625, -1.847625732421875, -1.7942352294921875, -1.7408447265625, -1.6874542236328125, -1.634063720703125, -1.5806732177734375, -1.52728271484375, -1.4738922119140625, -1.420501708984375, -1.3671112060546875, -1.313720703125, -1.2603302001953125, -1.206939697265625, -1.1535491943359375, -1.10015869140625, -1.0467681884765625, -0.993377685546875, -0.9399871826171875, -0.8865966796875, -0.8332061767578125, -0.779815673828125, -0.7264251708984375, -0.67303466796875, -0.6196441650390625, -0.566253662109375, -0.5128631591796875, -0.45947265625, -0.4060821533203125, -0.352691650390625, -0.2993011474609375, -0.24591064453125, -0.1925201416015625, -0.139129638671875, -0.0857391357421875, -0.0323486328125, 0.0210418701171875, 0.074432373046875, 0.1278228759765625, 0.18121337890625, 0.2346038818359375, 0.287994384765625, 0.3413848876953125, 0.394775390625, 0.4481658935546875, 0.501556396484375, 0.5549468994140625, 0.60833740234375, 0.6617279052734375, 0.715118408203125, 0.7685089111328125, 0.8218994140625, 0.8752899169921875, 0.928680419921875, 0.9820709228515625, 1.03546142578125, 1.0888519287109375, 1.142242431640625, 1.1956329345703125, 1.2490234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 5.0, 7.0, 12.0, 9.0, 20.0, 38.0, 84.0, 152.0, 415.0, 2134.0, 816.0, 181.0, 81.0, 43.0, 35.0, 16.0, 8.0, 4.0, 6.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-1.1396484375, -1.1162376403808594, -1.0928268432617188, -1.0694160461425781, -1.0460052490234375, -1.0225944519042969, -0.9991836547851562, -0.9757728576660156, -0.952362060546875, -0.9289512634277344, -0.9055404663085938, -0.8821296691894531, -0.8587188720703125, -0.8353080749511719, -0.8118972778320312, -0.7884864807128906, -0.76507568359375, -0.7416648864746094, -0.7182540893554688, -0.6948432922363281, -0.6714324951171875, -0.6480216979980469, -0.6246109008789062, -0.6012001037597656, -0.577789306640625, -0.5543785095214844, -0.5309677124023438, -0.5075569152832031, -0.4841461181640625, -0.4607353210449219, -0.43732452392578125, -0.4139137268066406, -0.3905029296875, -0.3670921325683594, -0.34368133544921875, -0.3202705383300781, -0.2968597412109375, -0.2734489440917969, -0.25003814697265625, -0.22662734985351562, -0.203216552734375, -0.17980575561523438, -0.15639495849609375, -0.13298416137695312, -0.1095733642578125, -0.08616256713867188, -0.06275177001953125, -0.039340972900390625, -0.01593017578125, 0.007480621337890625, 0.03089141845703125, 0.054302215576171875, 0.0777130126953125, 0.10112380981445312, 0.12453460693359375, 0.14794540405273438, 0.171356201171875, 0.19476699829101562, 0.21817779541015625, 0.24158859252929688, 0.2649993896484375, 0.2884101867675781, 0.31182098388671875, 0.3352317810058594, 0.358642578125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 19.0, 37.0, 95.0, 158.0, 202.0, 187.0, 154.0, 83.0, 35.0, 17.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4339399337768555, -5.320358753204346, -5.206777572631836, -5.093196868896484, -4.979615688323975, -4.866034507751465, -4.752453327178955, -4.638872146606445, -4.5252909660339355, -4.411709785461426, -4.298128604888916, -4.184547424316406, -4.070966720581055, -3.957385540008545, -3.843804359436035, -3.7302231788635254, -3.616642475128174, -3.503061294555664, -3.3894803524017334, -3.2758991718292236, -3.162317991256714, -3.048737049102783, -2.9351558685302734, -2.8215746879577637, -2.707993507385254, -2.594412326812744, -2.4808313846588135, -2.3672502040863037, -2.253669023513794, -2.1400880813598633, -2.0265069007873535, -1.9129258394241333, -1.799344778060913, -1.6857637166976929, -1.572182536125183, -1.458601474761963, -1.3450204133987427, -1.2314393520355225, -1.1178581714630127, -1.0042771100997925, -0.8906959891319275, -0.7771148681640625, -0.6635338068008423, -0.5499526858329773, -0.4363715946674347, -0.3227905035018921, -0.2092093825340271, -0.09562832117080688, 0.017952799797058105, 0.1315338909626007, 0.2451149970293045, 0.3586961030960083, 0.4722771942615509, 0.5858582854270935, 0.6994394063949585, 0.8130204677581787, 0.9266015887260437, 1.0401827096939087, 1.153763771057129, 1.2673449516296387, 1.3809260129928589, 1.494507074356079, 1.6080882549285889, 1.7216691970825195, 1.8352503776550293]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 4.0, 13.0, 13.0, 12.0, 19.0, 18.0, 30.0, 27.0, 36.0, 39.0, 41.0, 37.0, 45.0, 51.0, 65.0, 74.0, 49.0, 56.0, 45.0, 49.0, 44.0, 46.0, 34.0, 29.0, 31.0, 26.0, 13.0, 15.0, 10.0, 9.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.0898728370666504, -2.0325448513031006, -1.9752166271209717, -1.9178885221481323, -1.860560417175293, -1.8032324314117432, -1.7459043264389038, -1.6885762214660645, -1.631248116493225, -1.5739200115203857, -1.5165919065475464, -1.459263801574707, -1.4019358158111572, -1.3446075916290283, -1.2872796058654785, -1.2299515008926392, -1.1726233959197998, -1.1152952909469604, -1.057967185974121, -1.0006390810012817, -0.9433110356330872, -0.8859829306602478, -0.8286548852920532, -0.7713267803192139, -0.7139986753463745, -0.6566705703735352, -0.5993424654006958, -0.5420144200325012, -0.48468631505966187, -0.4273582100868225, -0.37003013491630554, -0.3127020597457886, -0.25537383556365967, -0.1980457454919815, -0.14071765542030334, -0.08338956534862518, -0.02606147527694702, 0.031266629695892334, 0.0885947048664093, 0.14592278003692627, 0.20325088500976562, 0.260578989982605, 0.31790706515312195, 0.3752351403236389, 0.43256324529647827, 0.4898913502693176, 0.5472193956375122, 0.6045475006103516, 0.6618756055831909, 0.7192037105560303, 0.7765318155288696, 0.8338598608970642, 0.8911879658699036, 0.9485160708427429, 1.0058441162109375, 1.0631722211837769, 1.1205003261566162, 1.1778284311294556, 1.235156536102295, 1.2924846410751343, 1.3498127460479736, 1.4071407318115234, 1.4644688367843628, 1.5217969417572021, 1.5791250467300415]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 10.0, 12.0, 10.0, 19.0, 32.0, 34.0, 39.0, 80.0, 89.0, 131.0, 177.0, 359.0, 504.0, 915.0, 1557.0, 3059.0, 6288.0, 15210.0, 42742.0, 140938.0, 397730.0, 297618.0, 90605.0, 28995.0, 10843.0, 4761.0, 2344.0, 1316.0, 745.0, 468.0, 287.0, 188.0, 126.0, 74.0, 64.0, 46.0, 27.0, 24.0, 26.0, 11.0, 7.0, 8.0, 7.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.05859375, -1.0242462158203125, -0.989898681640625, -0.9555511474609375, -0.92120361328125, -0.8868560791015625, -0.852508544921875, -0.8181610107421875, -0.7838134765625, -0.7494659423828125, -0.715118408203125, -0.6807708740234375, -0.64642333984375, -0.6120758056640625, -0.577728271484375, -0.5433807373046875, -0.509033203125, -0.4746856689453125, -0.440338134765625, -0.4059906005859375, -0.37164306640625, -0.3372955322265625, -0.302947998046875, -0.2686004638671875, -0.2342529296875, -0.1999053955078125, -0.165557861328125, -0.1312103271484375, -0.09686279296875, -0.0625152587890625, -0.028167724609375, 0.0061798095703125, 0.04052734375, 0.0748748779296875, 0.109222412109375, 0.1435699462890625, 0.17791748046875, 0.2122650146484375, 0.246612548828125, 0.2809600830078125, 0.3153076171875, 0.3496551513671875, 0.384002685546875, 0.4183502197265625, 0.45269775390625, 0.4870452880859375, 0.521392822265625, 0.5557403564453125, 0.590087890625, 0.6244354248046875, 0.658782958984375, 0.6931304931640625, 0.72747802734375, 0.7618255615234375, 0.796173095703125, 0.8305206298828125, 0.8648681640625, 0.8992156982421875, 0.933563232421875, 0.9679107666015625, 1.00225830078125, 1.0366058349609375, 1.070953369140625, 1.1053009033203125, 1.1396484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 9.0, 10.0, 11.0, 24.0, 28.0, 17.0, 41.0, 52.0, 46.0, 62.0, 65.0, 86.0, 68.0, 62.0, 63.0, 61.0, 47.0, 50.0, 42.0, 33.0, 28.0, 27.0, 16.0, 13.0, 10.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4013671875, -0.38585662841796875, -0.3703460693359375, -0.35483551025390625, -0.339324951171875, -0.32381439208984375, -0.3083038330078125, -0.29279327392578125, -0.27728271484375, -0.26177215576171875, -0.2462615966796875, -0.23075103759765625, -0.215240478515625, -0.19972991943359375, -0.1842193603515625, -0.16870880126953125, -0.1531982421875, -0.13768768310546875, -0.1221771240234375, -0.10666656494140625, -0.091156005859375, -0.07564544677734375, -0.0601348876953125, -0.04462432861328125, -0.02911376953125, -0.01360321044921875, 0.0019073486328125, 0.01741790771484375, 0.032928466796875, 0.04843902587890625, 0.0639495849609375, 0.07946014404296875, 0.094970703125, 0.11048126220703125, 0.1259918212890625, 0.14150238037109375, 0.157012939453125, 0.17252349853515625, 0.1880340576171875, 0.20354461669921875, 0.21905517578125, 0.23456573486328125, 0.2500762939453125, 0.26558685302734375, 0.281097412109375, 0.29660797119140625, 0.3121185302734375, 0.32762908935546875, 0.3431396484375, 0.35865020751953125, 0.3741607666015625, 0.38967132568359375, 0.405181884765625, 0.42069244384765625, 0.4362030029296875, 0.45171356201171875, 0.46722412109375, 0.48273468017578125, 0.4982452392578125, 0.5137557983398438, 0.529266357421875, 0.5447769165039062, 0.5602874755859375, 0.5757980346679688, 0.59130859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 12.0, 12.0, 17.0, 23.0, 26.0, 39.0, 52.0, 75.0, 120.0, 132.0, 183.0, 304.0, 481.0, 913.0, 2148.0, 7029.0, 27918.0, 145855.0, 525149.0, 269253.0, 51300.0, 11305.0, 3232.0, 1227.0, 573.0, 333.0, 238.0, 157.0, 114.0, 73.0, 63.0, 38.0, 28.0, 27.0, 20.0, 10.0, 18.0, 12.0, 11.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2548828125, -1.212615966796875, -1.17034912109375, -1.128082275390625, -1.0858154296875, -1.043548583984375, -1.00128173828125, -0.959014892578125, -0.916748046875, -0.874481201171875, -0.83221435546875, -0.789947509765625, -0.7476806640625, -0.705413818359375, -0.66314697265625, -0.620880126953125, -0.57861328125, -0.536346435546875, -0.49407958984375, -0.451812744140625, -0.4095458984375, -0.367279052734375, -0.32501220703125, -0.282745361328125, -0.240478515625, -0.198211669921875, -0.15594482421875, -0.113677978515625, -0.0714111328125, -0.029144287109375, 0.01312255859375, 0.055389404296875, 0.09765625, 0.139923095703125, 0.18218994140625, 0.224456787109375, 0.2667236328125, 0.308990478515625, 0.35125732421875, 0.393524169921875, 0.435791015625, 0.478057861328125, 0.52032470703125, 0.562591552734375, 0.6048583984375, 0.647125244140625, 0.68939208984375, 0.731658935546875, 0.77392578125, 0.816192626953125, 0.85845947265625, 0.900726318359375, 0.9429931640625, 0.985260009765625, 1.02752685546875, 1.069793701171875, 1.112060546875, 1.154327392578125, 1.19659423828125, 1.238861083984375, 1.2811279296875, 1.323394775390625, 1.36566162109375, 1.407928466796875, 1.4501953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 11.0, 11.0, 18.0, 26.0, 28.0, 27.0, 35.0, 35.0, 32.0, 39.0, 34.0, 52.0, 44.0, 44.0, 46.0, 56.0, 60.0, 44.0, 37.0, 55.0, 28.0, 38.0, 28.0, 23.0, 17.0, 18.0, 20.0, 16.0, 11.0, 11.0, 8.0, 2.0, 7.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.6572265625, -1.6082305908203125, -1.559234619140625, -1.5102386474609375, -1.46124267578125, -1.4122467041015625, -1.363250732421875, -1.3142547607421875, -1.2652587890625, -1.2162628173828125, -1.167266845703125, -1.1182708740234375, -1.06927490234375, -1.0202789306640625, -0.971282958984375, -0.9222869873046875, -0.873291015625, -0.8242950439453125, -0.775299072265625, -0.7263031005859375, -0.67730712890625, -0.6283111572265625, -0.579315185546875, -0.5303192138671875, -0.4813232421875, -0.4323272705078125, -0.383331298828125, -0.3343353271484375, -0.28533935546875, -0.2363433837890625, -0.187347412109375, -0.1383514404296875, -0.08935546875, -0.0403594970703125, 0.008636474609375, 0.0576324462890625, 0.10662841796875, 0.1556243896484375, 0.204620361328125, 0.2536163330078125, 0.3026123046875, 0.3516082763671875, 0.400604248046875, 0.4496002197265625, 0.49859619140625, 0.5475921630859375, 0.596588134765625, 0.6455841064453125, 0.694580078125, 0.7435760498046875, 0.792572021484375, 0.8415679931640625, 0.89056396484375, 0.9395599365234375, 0.988555908203125, 1.0375518798828125, 1.0865478515625, 1.1355438232421875, 1.184539794921875, 1.2335357666015625, 1.28253173828125, 1.3315277099609375, 1.380523681640625, 1.4295196533203125, 1.478515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 3.0, 6.0, 27.0, 50.0, 119.0, 305.0, 1217.0, 10682.0, 545062.0, 479402.0, 10014.0, 1159.0, 287.0, 94.0, 61.0, 23.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08984375, -1.05224609375, -1.0146484375, -0.97705078125, -0.939453125, -0.90185546875, -0.8642578125, -0.82666015625, -0.7890625, -0.75146484375, -0.7138671875, -0.67626953125, -0.638671875, -0.60107421875, -0.5634765625, -0.52587890625, -0.48828125, -0.45068359375, -0.4130859375, -0.37548828125, -0.337890625, -0.30029296875, -0.2626953125, -0.22509765625, -0.1875, -0.14990234375, -0.1123046875, -0.07470703125, -0.037109375, 0.00048828125, 0.0380859375, 0.07568359375, 0.11328125, 0.15087890625, 0.1884765625, 0.22607421875, 0.263671875, 0.30126953125, 0.3388671875, 0.37646484375, 0.4140625, 0.45166015625, 0.4892578125, 0.52685546875, 0.564453125, 0.60205078125, 0.6396484375, 0.67724609375, 0.71484375, 0.75244140625, 0.7900390625, 0.82763671875, 0.865234375, 0.90283203125, 0.9404296875, 0.97802734375, 1.015625, 1.05322265625, 1.0908203125, 1.12841796875, 1.166015625, 1.20361328125, 1.2412109375, 1.27880859375, 1.31640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 2.0, 5.0, 3.0, 9.0, 5.0, 13.0, 15.0, 17.0, 22.0, 30.0, 35.0, 63.0, 119.0, 165.0, 165.0, 114.0, 53.0, 32.0, 26.0, 14.0, 21.0, 17.0, 3.0, 14.0, 7.0, 6.0, 6.0, 4.0, 6.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00015461444854736328, -0.00015030894428491592, -0.00014600344002246857, -0.0001416979357600212, -0.00013739243149757385, -0.0001330869272351265, -0.00012878142297267914, -0.00012447591871023178, -0.00012017041444778442, -0.00011586491018533707, -0.00011155940592288971, -0.00010725390166044235, -0.000102948397397995, -9.864289313554764e-05, -9.433738887310028e-05, -9.003188461065292e-05, -8.572638034820557e-05, -8.142087608575821e-05, -7.711537182331085e-05, -7.28098675608635e-05, -6.850436329841614e-05, -6.419885903596878e-05, -5.989335477352142e-05, -5.5587850511074066e-05, -5.128234624862671e-05, -4.697684198617935e-05, -4.2671337723731995e-05, -3.836583346128464e-05, -3.406032919883728e-05, -2.9754824936389923e-05, -2.5449320673942566e-05, -2.114381641149521e-05, -1.683831214904785e-05, -1.2532807886600494e-05, -8.227303624153137e-06, -3.92179936170578e-06, 3.8370490074157715e-07, 4.689209163188934e-06, 8.994713425636292e-06, 1.3300217688083649e-05, 1.7605721950531006e-05, 2.1911226212978363e-05, 2.621673047542572e-05, 3.052223473787308e-05, 3.4827739000320435e-05, 3.913324326276779e-05, 4.343874752521515e-05, 4.7744251787662506e-05, 5.204975605010986e-05, 5.635526031255722e-05, 6.066076457500458e-05, 6.496626883745193e-05, 6.927177309989929e-05, 7.357727736234665e-05, 7.7882781624794e-05, 8.218828588724136e-05, 8.649379014968872e-05, 9.079929441213608e-05, 9.510479867458344e-05, 9.941030293703079e-05, 0.00010371580719947815, 0.0001080213114619255, 0.00011232681572437286, 0.00011663231998682022, 0.00012093782424926758]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 17.0, 25.0, 42.0, 96.0, 226.0, 497.0, 1570.0, 13746.0, 612900.0, 406066.0, 11137.0, 1410.0, 384.0, 226.0, 107.0, 47.0, 26.0, 9.0, 6.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16015625, -1.1259918212890625, -1.091827392578125, -1.0576629638671875, -1.02349853515625, -0.9893341064453125, -0.955169677734375, -0.9210052490234375, -0.8868408203125, -0.8526763916015625, -0.818511962890625, -0.7843475341796875, -0.75018310546875, -0.7160186767578125, -0.681854248046875, -0.6476898193359375, -0.613525390625, -0.5793609619140625, -0.545196533203125, -0.5110321044921875, -0.47686767578125, -0.4427032470703125, -0.408538818359375, -0.3743743896484375, -0.3402099609375, -0.3060455322265625, -0.271881103515625, -0.2377166748046875, -0.20355224609375, -0.1693878173828125, -0.135223388671875, -0.1010589599609375, -0.06689453125, -0.0327301025390625, 0.001434326171875, 0.0355987548828125, 0.06976318359375, 0.1039276123046875, 0.138092041015625, 0.1722564697265625, 0.2064208984375, 0.2405853271484375, 0.274749755859375, 0.3089141845703125, 0.34307861328125, 0.3772430419921875, 0.411407470703125, 0.4455718994140625, 0.479736328125, 0.5139007568359375, 0.548065185546875, 0.5822296142578125, 0.61639404296875, 0.6505584716796875, 0.684722900390625, 0.7188873291015625, 0.7530517578125, 0.7872161865234375, 0.821380615234375, 0.8555450439453125, 0.88970947265625, 0.9238739013671875, 0.958038330078125, 0.9922027587890625, 1.0263671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 5.0, 11.0, 13.0, 28.0, 35.0, 65.0, 144.0, 206.0, 224.0, 102.0, 58.0, 35.0, 27.0, 13.0, 8.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78173828125, -0.7564315795898438, -0.7311248779296875, -0.7058181762695312, -0.680511474609375, -0.6552047729492188, -0.6298980712890625, -0.6045913696289062, -0.57928466796875, -0.5539779663085938, -0.5286712646484375, -0.5033645629882812, -0.478057861328125, -0.45275115966796875, -0.4274444580078125, -0.40213775634765625, -0.3768310546875, -0.35152435302734375, -0.3262176513671875, -0.30091094970703125, -0.275604248046875, -0.25029754638671875, -0.2249908447265625, -0.19968414306640625, -0.17437744140625, -0.14907073974609375, -0.1237640380859375, -0.09845733642578125, -0.073150634765625, -0.04784393310546875, -0.0225372314453125, 0.00276947021484375, 0.028076171875, 0.05338287353515625, 0.0786895751953125, 0.10399627685546875, 0.129302978515625, 0.15460968017578125, 0.1799163818359375, 0.20522308349609375, 0.23052978515625, 0.25583648681640625, 0.2811431884765625, 0.30644989013671875, 0.331756591796875, 0.35706329345703125, 0.3823699951171875, 0.40767669677734375, 0.4329833984375, 0.45829010009765625, 0.4835968017578125, 0.5089035034179688, 0.534210205078125, 0.5595169067382812, 0.5848236083984375, 0.6101303100585938, 0.63543701171875, 0.6607437133789062, 0.6860504150390625, 0.7113571166992188, 0.736663818359375, 0.7619705200195312, 0.7872772216796875, 0.8125839233398438, 0.837890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 28.0, 51.0, 101.0, 193.0, 260.0, 179.0, 90.0, 44.0, 20.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.21891212463379, -19.80767250061035, -19.39643096923828, -18.985191345214844, -18.573951721191406, -18.16271209716797, -17.7514705657959, -17.34023094177246, -16.92898941040039, -16.517749786376953, -16.106508255004883, -15.695268630981445, -15.284029006958008, -14.872788429260254, -14.4615478515625, -14.050308227539062, -13.639068603515625, -13.227828025817871, -12.816588401794434, -12.40534782409668, -11.994108200073242, -11.582867622375488, -11.171627044677734, -10.760387420654297, -10.349146842956543, -9.937906265258789, -9.526666641235352, -9.115426063537598, -8.704185485839844, -8.292945861816406, -7.881705284118652, -7.470465183258057, -7.059225082397461, -6.647984981536865, -6.2367448806762695, -5.825504302978516, -5.41426420211792, -5.003024101257324, -4.59178352355957, -4.180543422698975, -3.769303321838379, -3.358063220977783, -2.9468228816986084, -2.5355825424194336, -2.124342441558838, -1.7131023406982422, -1.3018620014190674, -0.8906216621398926, -0.4793815612792969, -0.06814134120941162, 0.34309887886047363, 0.7543390989303589, 1.1655793190002441, 1.5768194198608398, 1.9880597591400146, 2.3993000984191895, 2.810540199279785, 3.221780300140381, 3.6330206394195557, 4.0442609786987305, 4.455501079559326, 4.866741180419922, 5.277981758117676, 5.6892218589782715, 6.100461959838867]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 8.0, 9.0, 5.0, 5.0, 7.0, 11.0, 12.0, 10.0, 6.0, 17.0, 19.0, 20.0, 25.0, 27.0, 28.0, 27.0, 36.0, 41.0, 31.0, 39.0, 42.0, 41.0, 42.0, 32.0, 41.0, 37.0, 42.0, 32.0, 31.0, 24.0, 28.0, 22.0, 21.0, 30.0, 12.0, 16.0, 23.0, 18.0, 14.0, 15.0, 13.0, 8.0, 12.0, 5.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.463913917541504, -6.257000923156738, -6.050088405609131, -5.843175411224365, -5.6362624168396, -5.429349899291992, -5.222436904907227, -5.015523910522461, -4.808610916137695, -4.60169792175293, -4.394785404205322, -4.187872409820557, -3.980959415435791, -3.7740466594696045, -3.567133903503418, -3.3602209091186523, -3.153308391571045, -2.9463956356048584, -2.7394826412200928, -2.5325698852539062, -2.3256568908691406, -2.118744134902954, -1.9118313789367676, -1.7049185037612915, -1.4980056285858154, -1.2910927534103394, -1.0841798782348633, -0.8772671222686768, -0.6703542470932007, -0.4634413719177246, -0.2565286159515381, -0.04961574077606201, 0.15729713439941406, 0.36420997977256775, 0.5711228251457214, 0.7780356407165527, 0.9849485158920288, 1.1918613910675049, 1.3987741470336914, 1.6056870222091675, 1.8125998973846436, 2.01951265335083, 2.2264256477355957, 2.4333384037017822, 2.6402511596679688, 2.8471641540527344, 3.054076910018921, 3.2609896659851074, 3.467902660369873, 3.6748154163360596, 3.881728410720825, 4.088641166687012, 4.295554161071777, 4.502467155456543, 4.70937967300415, 4.916292667388916, 5.123205184936523, 5.330118179321289, 5.5370306968688965, 5.743943691253662, 5.950856685638428, 6.157769203186035, 6.364682197570801, 6.571595191955566, 6.778508186340332]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 13.0, 19.0, 32.0, 41.0, 74.0, 120.0, 195.0, 389.0, 720.0, 1627.0, 4261.0, 14055.0, 77017.0, 3817186.0, 241222.0, 25853.0, 6783.0, 2285.0, 1054.0, 531.0, 291.0, 179.0, 110.0, 58.0, 47.0, 26.0, 27.0, 15.0, 18.0, 4.0, 7.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3564453125, -1.3107757568359375, -1.265106201171875, -1.2194366455078125, -1.17376708984375, -1.1280975341796875, -1.082427978515625, -1.0367584228515625, -0.9910888671875, -0.9454193115234375, -0.899749755859375, -0.8540802001953125, -0.80841064453125, -0.7627410888671875, -0.717071533203125, -0.6714019775390625, -0.625732421875, -0.5800628662109375, -0.534393310546875, -0.4887237548828125, -0.44305419921875, -0.3973846435546875, -0.351715087890625, -0.3060455322265625, -0.2603759765625, -0.2147064208984375, -0.169036865234375, -0.1233673095703125, -0.07769775390625, -0.0320281982421875, 0.013641357421875, 0.0593109130859375, 0.10498046875, 0.1506500244140625, 0.196319580078125, 0.2419891357421875, 0.28765869140625, 0.3333282470703125, 0.378997802734375, 0.4246673583984375, 0.4703369140625, 0.5160064697265625, 0.561676025390625, 0.6073455810546875, 0.65301513671875, 0.6986846923828125, 0.744354248046875, 0.7900238037109375, 0.835693359375, 0.8813629150390625, 0.927032470703125, 0.9727020263671875, 1.01837158203125, 1.0640411376953125, 1.109710693359375, 1.1553802490234375, 1.2010498046875, 1.2467193603515625, 1.292388916015625, 1.3380584716796875, 1.38372802734375, 1.4293975830078125, 1.475067138671875, 1.5207366943359375, 1.56640625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 5.0, 12.0, 18.0, 25.0, 34.0, 43.0, 36.0, 51.0, 52.0, 76.0, 76.0, 58.0, 70.0, 66.0, 62.0, 60.0, 45.0, 44.0, 33.0, 30.0, 19.0, 16.0, 18.0, 13.0, 7.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4990234375, -0.4818572998046875, -0.464691162109375, -0.4475250244140625, -0.43035888671875, -0.4131927490234375, -0.396026611328125, -0.3788604736328125, -0.3616943359375, -0.3445281982421875, -0.327362060546875, -0.3101959228515625, -0.29302978515625, -0.2758636474609375, -0.258697509765625, -0.2415313720703125, -0.224365234375, -0.2071990966796875, -0.190032958984375, -0.1728668212890625, -0.15570068359375, -0.1385345458984375, -0.121368408203125, -0.1042022705078125, -0.0870361328125, -0.0698699951171875, -0.052703857421875, -0.0355377197265625, -0.01837158203125, -0.0012054443359375, 0.015960693359375, 0.0331268310546875, 0.05029296875, 0.0674591064453125, 0.084625244140625, 0.1017913818359375, 0.11895751953125, 0.1361236572265625, 0.153289794921875, 0.1704559326171875, 0.1876220703125, 0.2047882080078125, 0.221954345703125, 0.2391204833984375, 0.25628662109375, 0.2734527587890625, 0.290618896484375, 0.3077850341796875, 0.324951171875, 0.3421173095703125, 0.359283447265625, 0.3764495849609375, 0.39361572265625, 0.4107818603515625, 0.427947998046875, 0.4451141357421875, 0.4622802734375, 0.4794464111328125, 0.496612548828125, 0.5137786865234375, 0.53094482421875, 0.5481109619140625, 0.565277099609375, 0.5824432373046875, 0.599609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 4.0, 11.0, 11.0, 11.0, 20.0, 16.0, 29.0, 59.0, 84.0, 94.0, 170.0, 231.0, 491.0, 938.0, 2303.0, 7470.0, 35336.0, 1043350.0, 3045111.0, 45488.0, 8320.0, 2593.0, 937.0, 412.0, 267.0, 106.0, 110.0, 67.0, 53.0, 37.0, 45.0, 30.0, 16.0, 16.0, 13.0, 8.0, 3.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3779296875, -1.3335723876953125, -1.289215087890625, -1.2448577880859375, -1.20050048828125, -1.1561431884765625, -1.111785888671875, -1.0674285888671875, -1.0230712890625, -0.9787139892578125, -0.934356689453125, -0.8899993896484375, -0.84564208984375, -0.8012847900390625, -0.756927490234375, -0.7125701904296875, -0.668212890625, -0.6238555908203125, -0.579498291015625, -0.5351409912109375, -0.49078369140625, -0.4464263916015625, -0.402069091796875, -0.3577117919921875, -0.3133544921875, -0.2689971923828125, -0.224639892578125, -0.1802825927734375, -0.13592529296875, -0.0915679931640625, -0.047210693359375, -0.0028533935546875, 0.04150390625, 0.0858612060546875, 0.130218505859375, 0.1745758056640625, 0.21893310546875, 0.2632904052734375, 0.307647705078125, 0.3520050048828125, 0.3963623046875, 0.4407196044921875, 0.485076904296875, 0.5294342041015625, 0.57379150390625, 0.6181488037109375, 0.662506103515625, 0.7068634033203125, 0.751220703125, 0.7955780029296875, 0.839935302734375, 0.8842926025390625, 0.92864990234375, 0.9730072021484375, 1.017364501953125, 1.0617218017578125, 1.1060791015625, 1.1504364013671875, 1.194793701171875, 1.2391510009765625, 1.28350830078125, 1.3278656005859375, 1.372222900390625, 1.4165802001953125, 1.4609375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 9.0, 13.0, 12.0, 16.0, 24.0, 49.0, 97.0, 272.0, 1719.0, 1424.0, 246.0, 83.0, 46.0, 28.0, 8.0, 8.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5135955810546875, -0.493011474609375, -0.4724273681640625, -0.45184326171875, -0.4312591552734375, -0.410675048828125, -0.3900909423828125, -0.3695068359375, -0.3489227294921875, -0.328338623046875, -0.3077545166015625, -0.28717041015625, -0.2665863037109375, -0.246002197265625, -0.2254180908203125, -0.204833984375, -0.1842498779296875, -0.163665771484375, -0.1430816650390625, -0.12249755859375, -0.1019134521484375, -0.081329345703125, -0.0607452392578125, -0.0401611328125, -0.0195770263671875, 0.001007080078125, 0.0215911865234375, 0.04217529296875, 0.0627593994140625, 0.083343505859375, 0.1039276123046875, 0.12451171875, 0.1450958251953125, 0.165679931640625, 0.1862640380859375, 0.20684814453125, 0.2274322509765625, 0.248016357421875, 0.2686004638671875, 0.2891845703125, 0.3097686767578125, 0.330352783203125, 0.3509368896484375, 0.37152099609375, 0.3921051025390625, 0.412689208984375, 0.4332733154296875, 0.453857421875, 0.4744415283203125, 0.495025634765625, 0.5156097412109375, 0.53619384765625, 0.5567779541015625, 0.577362060546875, 0.5979461669921875, 0.6185302734375, 0.6391143798828125, 0.659698486328125, 0.6802825927734375, 0.70086669921875, 0.7214508056640625, 0.742034912109375, 0.7626190185546875, 0.783203125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 12.0, 22.0, 71.0, 242.0, 389.0, 212.0, 47.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.738100051879883, -7.563866138458252, -7.389632701873779, -7.215398788452148, -7.041165351867676, -6.866931438446045, -6.692697525024414, -6.518464088439941, -6.344230651855469, -6.169996738433838, -5.995763301849365, -5.821529388427734, -5.647295951843262, -5.473062038421631, -5.298828125, -5.124594688415527, -4.9503607749938965, -4.776126861572266, -4.601893424987793, -4.427659511566162, -4.2534260749816895, -4.079192161560059, -3.904958486557007, -3.730724811553955, -3.5564911365509033, -3.3822574615478516, -3.2080237865448, -3.033790111541748, -2.859556198120117, -2.6853227615356445, -2.5110888481140137, -2.336855173110962, -2.1626217365264893, -1.9883880615234375, -1.8141543865203857, -1.6399205923080444, -1.4656869173049927, -1.291453242301941, -1.1172194480895996, -0.9429857730865479, -0.7687520980834961, -0.5945184230804443, -0.4202846884727478, -0.24605095386505127, -0.07181727886199951, 0.10241639614105225, 0.27665019035339355, 0.4508838653564453, 0.6251175403594971, 0.7993512153625488, 0.9735849499702454, 1.147818684577942, 1.3220523595809937, 1.4962860345840454, 1.6705198287963867, 1.8447535037994385, 2.0189871788024902, 2.193220853805542, 2.3674545288085938, 2.5416884422302246, 2.7159218788146973, 2.890155792236328, 3.06438946723938, 3.2386231422424316, 3.4128568172454834]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 7.0, 10.0, 9.0, 15.0, 22.0, 30.0, 28.0, 48.0, 34.0, 50.0, 56.0, 69.0, 73.0, 68.0, 69.0, 67.0, 59.0, 56.0, 51.0, 47.0, 33.0, 31.0, 16.0, 11.0, 19.0, 9.0, 2.0, 6.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6605596542358398, -1.6041394472122192, -1.5477192401885986, -1.4912991523742676, -1.434878945350647, -1.3784587383270264, -1.3220386505126953, -1.2656184434890747, -1.209198236465454, -1.1527780294418335, -1.096357822418213, -1.0399377346038818, -0.9835175275802612, -0.9270973205566406, -0.8706771731376648, -0.814257025718689, -0.7578368186950684, -0.7014166116714478, -0.6449964642524719, -0.5885763168334961, -0.5321561098098755, -0.47573593258857727, -0.41931575536727905, -0.36289557814598083, -0.3064754009246826, -0.2500552237033844, -0.19363504648208618, -0.13721486926078796, -0.08079469203948975, -0.02437451481819153, 0.03204566240310669, 0.08846583962440491, 0.14488613605499268, 0.2013063132762909, 0.2577264904975891, 0.31414666771888733, 0.37056684494018555, 0.42698702216148376, 0.483407199382782, 0.5398273468017578, 0.5962475538253784, 0.652667760848999, 0.7090879082679749, 0.7655080556869507, 0.8219282627105713, 0.8783484697341919, 0.9347686171531677, 0.9911887645721436, 1.0476089715957642, 1.1040291786193848, 1.1604492664337158, 1.2168694734573364, 1.273289680480957, 1.3297098875045776, 1.3861300945281982, 1.4425501823425293, 1.49897038936615, 1.5553905963897705, 1.6118106842041016, 1.6682308912277222, 1.7246510982513428, 1.7810713052749634, 1.837491512298584, 1.893911600112915, 1.9503318071365356]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 10.0, 17.0, 26.0, 32.0, 66.0, 99.0, 140.0, 254.0, 457.0, 843.0, 1679.0, 3838.0, 10872.0, 41984.0, 191048.0, 503330.0, 223636.0, 49253.0, 12763.0, 4233.0, 1873.0, 884.0, 498.0, 242.0, 150.0, 121.0, 63.0, 38.0, 27.0, 23.0, 7.0, 9.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.3857421875, -1.341827392578125, -1.29791259765625, -1.253997802734375, -1.2100830078125, -1.166168212890625, -1.12225341796875, -1.078338623046875, -1.034423828125, -0.990509033203125, -0.94659423828125, -0.902679443359375, -0.8587646484375, -0.814849853515625, -0.77093505859375, -0.727020263671875, -0.68310546875, -0.639190673828125, -0.59527587890625, -0.551361083984375, -0.5074462890625, -0.463531494140625, -0.41961669921875, -0.375701904296875, -0.331787109375, -0.287872314453125, -0.24395751953125, -0.200042724609375, -0.1561279296875, -0.112213134765625, -0.06829833984375, -0.024383544921875, 0.01953125, 0.063446044921875, 0.10736083984375, 0.151275634765625, 0.1951904296875, 0.239105224609375, 0.28302001953125, 0.326934814453125, 0.370849609375, 0.414764404296875, 0.45867919921875, 0.502593994140625, 0.5465087890625, 0.590423583984375, 0.63433837890625, 0.678253173828125, 0.72216796875, 0.766082763671875, 0.80999755859375, 0.853912353515625, 0.8978271484375, 0.941741943359375, 0.98565673828125, 1.029571533203125, 1.073486328125, 1.117401123046875, 1.16131591796875, 1.205230712890625, 1.2491455078125, 1.293060302734375, 1.33697509765625, 1.380889892578125, 1.4248046875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 12.0, 22.0, 17.0, 23.0, 39.0, 41.0, 39.0, 53.0, 60.0, 76.0, 57.0, 72.0, 65.0, 75.0, 54.0, 63.0, 35.0, 35.0, 35.0, 28.0, 23.0, 16.0, 18.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.479736328125, -0.4630241394042969, -0.44631195068359375, -0.4295997619628906, -0.4128875732421875, -0.3961753845214844, -0.37946319580078125, -0.3627510070800781, -0.346038818359375, -0.3293266296386719, -0.31261444091796875, -0.2959022521972656, -0.2791900634765625, -0.2624778747558594, -0.24576568603515625, -0.22905349731445312, -0.21234130859375, -0.19562911987304688, -0.17891693115234375, -0.16220474243164062, -0.1454925537109375, -0.12878036499023438, -0.11206817626953125, -0.09535598754882812, -0.078643798828125, -0.061931610107421875, -0.04521942138671875, -0.028507232666015625, -0.0117950439453125, 0.004917144775390625, 0.02162933349609375, 0.038341522216796875, 0.0550537109375, 0.07176589965820312, 0.08847808837890625, 0.10519027709960938, 0.1219024658203125, 0.13861465454101562, 0.15532684326171875, 0.17203903198242188, 0.188751220703125, 0.20546340942382812, 0.22217559814453125, 0.23888778686523438, 0.2555999755859375, 0.2723121643066406, 0.28902435302734375, 0.3057365417480469, 0.32244873046875, 0.3391609191894531, 0.35587310791015625, 0.3725852966308594, 0.3892974853515625, 0.4060096740722656, 0.42272186279296875, 0.4394340515136719, 0.456146240234375, 0.4728584289550781, 0.48957061767578125, 0.5062828063964844, 0.5229949951171875, 0.5397071838378906, 0.5564193725585938, 0.5731315612792969, 0.58984375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 10.0, 8.0, 3.0, 9.0, 13.0, 17.0, 25.0, 43.0, 52.0, 60.0, 104.0, 156.0, 304.0, 657.0, 1606.0, 5354.0, 21926.0, 114841.0, 503438.0, 321211.0, 60810.0, 12303.0, 3321.0, 1109.0, 484.0, 240.0, 153.0, 93.0, 53.0, 35.0, 31.0, 15.0, 21.0, 14.0, 8.0, 9.0, 3.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5009765625, -1.455230712890625, -1.40948486328125, -1.363739013671875, -1.3179931640625, -1.272247314453125, -1.22650146484375, -1.180755615234375, -1.135009765625, -1.089263916015625, -1.04351806640625, -0.997772216796875, -0.9520263671875, -0.906280517578125, -0.86053466796875, -0.814788818359375, -0.76904296875, -0.723297119140625, -0.67755126953125, -0.631805419921875, -0.5860595703125, -0.540313720703125, -0.49456787109375, -0.448822021484375, -0.403076171875, -0.357330322265625, -0.31158447265625, -0.265838623046875, -0.2200927734375, -0.174346923828125, -0.12860107421875, -0.082855224609375, -0.037109375, 0.008636474609375, 0.05438232421875, 0.100128173828125, 0.1458740234375, 0.191619873046875, 0.23736572265625, 0.283111572265625, 0.328857421875, 0.374603271484375, 0.42034912109375, 0.466094970703125, 0.5118408203125, 0.557586669921875, 0.60333251953125, 0.649078369140625, 0.69482421875, 0.740570068359375, 0.78631591796875, 0.832061767578125, 0.8778076171875, 0.923553466796875, 0.96929931640625, 1.015045166015625, 1.060791015625, 1.106536865234375, 1.15228271484375, 1.198028564453125, 1.2437744140625, 1.289520263671875, 1.33526611328125, 1.381011962890625, 1.4267578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 6.0, 14.0, 11.0, 17.0, 18.0, 23.0, 29.0, 36.0, 32.0, 48.0, 29.0, 58.0, 52.0, 49.0, 68.0, 49.0, 59.0, 61.0, 50.0, 44.0, 48.0, 32.0, 27.0, 19.0, 23.0, 14.0, 14.0, 11.0, 16.0, 8.0, 3.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4710235595703125, -1.413726806640625, -1.3564300537109375, -1.29913330078125, -1.2418365478515625, -1.184539794921875, -1.1272430419921875, -1.0699462890625, -1.0126495361328125, -0.955352783203125, -0.8980560302734375, -0.84075927734375, -0.7834625244140625, -0.726165771484375, -0.6688690185546875, -0.611572265625, -0.5542755126953125, -0.496978759765625, -0.4396820068359375, -0.38238525390625, -0.3250885009765625, -0.267791748046875, -0.2104949951171875, -0.1531982421875, -0.0959014892578125, -0.038604736328125, 0.0186920166015625, 0.07598876953125, 0.1332855224609375, 0.190582275390625, 0.2478790283203125, 0.30517578125, 0.3624725341796875, 0.419769287109375, 0.4770660400390625, 0.53436279296875, 0.5916595458984375, 0.648956298828125, 0.7062530517578125, 0.7635498046875, 0.8208465576171875, 0.878143310546875, 0.9354400634765625, 0.99273681640625, 1.0500335693359375, 1.107330322265625, 1.1646270751953125, 1.221923828125, 1.2792205810546875, 1.336517333984375, 1.3938140869140625, 1.45111083984375, 1.5084075927734375, 1.565704345703125, 1.6230010986328125, 1.6802978515625, 1.7375946044921875, 1.794891357421875, 1.8521881103515625, 1.90948486328125, 1.9667816162109375, 2.024078369140625, 2.0813751220703125, 2.138671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 7.0, 11.0, 12.0, 29.0, 51.0, 111.0, 225.0, 568.0, 2028.0, 12640.0, 199741.0, 782589.0, 44187.0, 4603.0, 1078.0, 379.0, 134.0, 70.0, 37.0, 22.0, 14.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7978515625, -0.7738571166992188, -0.7498626708984375, -0.7258682250976562, -0.701873779296875, -0.6778793334960938, -0.6538848876953125, -0.6298904418945312, -0.60589599609375, -0.5819015502929688, -0.5579071044921875, -0.5339126586914062, -0.509918212890625, -0.48592376708984375, -0.4619293212890625, -0.43793487548828125, -0.4139404296875, -0.38994598388671875, -0.3659515380859375, -0.34195709228515625, -0.317962646484375, -0.29396820068359375, -0.2699737548828125, -0.24597930908203125, -0.22198486328125, -0.19799041748046875, -0.1739959716796875, -0.15000152587890625, -0.126007080078125, -0.10201263427734375, -0.0780181884765625, -0.05402374267578125, -0.030029296875, -0.00603485107421875, 0.0179595947265625, 0.04195404052734375, 0.065948486328125, 0.08994293212890625, 0.1139373779296875, 0.13793182373046875, 0.16192626953125, 0.18592071533203125, 0.2099151611328125, 0.23390960693359375, 0.257904052734375, 0.28189849853515625, 0.3058929443359375, 0.32988739013671875, 0.3538818359375, 0.37787628173828125, 0.4018707275390625, 0.42586517333984375, 0.449859619140625, 0.47385406494140625, 0.4978485107421875, 0.5218429565429688, 0.54583740234375, 0.5698318481445312, 0.5938262939453125, 0.6178207397460938, 0.641815185546875, 0.6658096313476562, 0.6898040771484375, 0.7137985229492188, 0.73779296875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 3.0, 5.0, 6.0, 5.0, 8.0, 14.0, 14.0, 18.0, 27.0, 30.0, 40.0, 54.0, 132.0, 181.0, 180.0, 103.0, 41.0, 32.0, 17.0, 15.0, 19.0, 9.0, 7.0, 8.0, 7.0, 3.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011748075485229492, -0.00011311005800962448, -0.00010873936116695404, -0.0001043686643242836, -9.999796748161316e-05, -9.562727063894272e-05, -9.125657379627228e-05, -8.688587695360184e-05, -8.25151801109314e-05, -7.814448326826096e-05, -7.377378642559052e-05, -6.940308958292007e-05, -6.503239274024963e-05, -6.066169589757919e-05, -5.629099905490875e-05, -5.192030221223831e-05, -4.754960536956787e-05, -4.317890852689743e-05, -3.880821168422699e-05, -3.443751484155655e-05, -3.006681799888611e-05, -2.5696121156215668e-05, -2.1325424313545227e-05, -1.6954727470874786e-05, -1.2584030628204346e-05, -8.213333785533905e-06, -3.842636942863464e-06, 5.280598998069763e-07, 4.898756742477417e-06, 9.269453585147858e-06, 1.3640150427818298e-05, 1.801084727048874e-05, 2.238154411315918e-05, 2.675224095582962e-05, 3.112293779850006e-05, 3.54936346411705e-05, 3.986433148384094e-05, 4.423502832651138e-05, 4.8605725169181824e-05, 5.2976422011852264e-05, 5.7347118854522705e-05, 6.171781569719315e-05, 6.608851253986359e-05, 7.045920938253403e-05, 7.482990622520447e-05, 7.920060306787491e-05, 8.357129991054535e-05, 8.794199675321579e-05, 9.231269359588623e-05, 9.668339043855667e-05, 0.00010105408728122711, 0.00010542478412389755, 0.00010979548096656799, 0.00011416617780923843, 0.00011853687465190887, 0.00012290757149457932, 0.00012727826833724976, 0.0001316489651799202, 0.00013601966202259064, 0.00014039035886526108, 0.00014476105570793152, 0.00014913175255060196, 0.0001535024493932724, 0.00015787314623594284, 0.00016224384307861328]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 8.0, 20.0, 14.0, 31.0, 38.0, 93.0, 163.0, 296.0, 681.0, 1970.0, 9312.0, 80817.0, 800500.0, 137193.0, 13294.0, 2580.0, 814.0, 335.0, 171.0, 78.0, 67.0, 35.0, 12.0, 11.0, 10.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.67333984375, -0.6538772583007812, -0.6344146728515625, -0.6149520874023438, -0.595489501953125, -0.5760269165039062, -0.5565643310546875, -0.5371017456054688, -0.51763916015625, -0.49817657470703125, -0.4787139892578125, -0.45925140380859375, -0.439788818359375, -0.42032623291015625, -0.4008636474609375, -0.38140106201171875, -0.3619384765625, -0.34247589111328125, -0.3230133056640625, -0.30355072021484375, -0.284088134765625, -0.26462554931640625, -0.2451629638671875, -0.22570037841796875, -0.20623779296875, -0.18677520751953125, -0.1673126220703125, -0.14785003662109375, -0.128387451171875, -0.10892486572265625, -0.0894622802734375, -0.06999969482421875, -0.050537109375, -0.03107452392578125, -0.0116119384765625, 0.00785064697265625, 0.027313232421875, 0.04677581787109375, 0.0662384033203125, 0.08570098876953125, 0.10516357421875, 0.12462615966796875, 0.1440887451171875, 0.16355133056640625, 0.183013916015625, 0.20247650146484375, 0.2219390869140625, 0.24140167236328125, 0.2608642578125, 0.28032684326171875, 0.2997894287109375, 0.31925201416015625, 0.338714599609375, 0.35817718505859375, 0.3776397705078125, 0.39710235595703125, 0.41656494140625, 0.43602752685546875, 0.4554901123046875, 0.47495269775390625, 0.494415283203125, 0.5138778686523438, 0.5333404541015625, 0.5528030395507812, 0.572265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 7.0, 11.0, 7.0, 28.0, 23.0, 24.0, 33.0, 55.0, 65.0, 80.0, 109.0, 117.0, 113.0, 81.0, 65.0, 49.0, 31.0, 23.0, 20.0, 8.0, 17.0, 11.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53857421875, -0.5251426696777344, -0.5117111206054688, -0.4982795715332031, -0.4848480224609375, -0.4714164733886719, -0.45798492431640625, -0.4445533752441406, -0.431121826171875, -0.4176902770996094, -0.40425872802734375, -0.3908271789550781, -0.3773956298828125, -0.3639640808105469, -0.35053253173828125, -0.3371009826660156, -0.32366943359375, -0.3102378845214844, -0.29680633544921875, -0.2833747863769531, -0.2699432373046875, -0.2565116882324219, -0.24308013916015625, -0.22964859008789062, -0.216217041015625, -0.20278549194335938, -0.18935394287109375, -0.17592239379882812, -0.1624908447265625, -0.14905929565429688, -0.13562774658203125, -0.12219619750976562, -0.1087646484375, -0.09533309936523438, -0.08190155029296875, -0.06847000122070312, -0.0550384521484375, -0.041606903076171875, -0.02817535400390625, -0.014743804931640625, -0.001312255859375, 0.012119293212890625, 0.02555084228515625, 0.038982391357421875, 0.0524139404296875, 0.06584548950195312, 0.07927703857421875, 0.09270858764648438, 0.10614013671875, 0.11957168579101562, 0.13300323486328125, 0.14643478393554688, 0.1598663330078125, 0.17329788208007812, 0.18672943115234375, 0.20016098022460938, 0.213592529296875, 0.22702407836914062, 0.24045562744140625, 0.2538871765136719, 0.2673187255859375, 0.2807502746582031, 0.29418182373046875, 0.3076133728027344, 0.321044921875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 26.0, 74.0, 137.0, 241.0, 252.0, 152.0, 75.0, 24.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.99754524230957, -16.537954330444336, -16.0783634185791, -15.618773460388184, -15.159183502197266, -14.699592590332031, -14.240002632141113, -13.780411720275879, -13.320821762084961, -12.861230850219727, -12.401640892028809, -11.942049980163574, -11.482460021972656, -11.022869110107422, -10.563279151916504, -10.10368824005127, -9.644098281860352, -9.184507369995117, -8.7249174118042, -8.265326499938965, -7.805736541748047, -7.3461456298828125, -6.8865556716918945, -6.42696475982666, -5.967373847961426, -5.50778341293335, -5.048192977905273, -4.588602542877197, -4.129012107849121, -3.669421434402466, -3.2098309993743896, -2.7502405643463135, -2.2906503677368164, -1.8310599327087402, -1.371469497680664, -0.9118789434432983, -0.45228850841522217, 0.007302045822143555, 0.4668924808502197, 0.9264829158782959, 1.386073350906372, 1.8456637859344482, 2.3052542209625244, 2.7648448944091797, 3.224435329437256, 3.684025764465332, 4.143616199493408, 4.603206634521484, 5.0627970695495605, 5.522387504577637, 5.981977939605713, 6.441568374633789, 6.901158809661865, 7.360749244689941, 7.820340156555176, 8.279930114746094, 8.739521026611328, 9.199111938476562, 9.65870189666748, 10.118292808532715, 10.577882766723633, 11.037473678588867, 11.497063636779785, 11.95665454864502, 12.416244506835938]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 10.0, 9.0, 12.0, 10.0, 13.0, 19.0, 10.0, 20.0, 25.0, 35.0, 24.0, 21.0, 25.0, 36.0, 37.0, 32.0, 39.0, 36.0, 41.0, 34.0, 38.0, 34.0, 38.0, 41.0, 31.0, 31.0, 36.0, 21.0, 27.0, 26.0, 19.0, 28.0, 25.0, 18.0, 14.0, 18.0, 8.0, 8.0, 12.0, 6.0, 5.0, 3.0, 7.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.13810920715332, -5.950170040130615, -5.76223087310791, -5.574291706085205, -5.3863525390625, -5.198413372039795, -5.01047420501709, -4.822534561157227, -4.63459587097168, -4.446656703948975, -4.2587175369262695, -4.0707783699035645, -3.8828392028808594, -3.6949000358581543, -3.50696063041687, -3.319021463394165, -3.131082057952881, -2.943142890930176, -2.7552037239074707, -2.5672645568847656, -2.3793253898620605, -2.1913862228393555, -2.0034468173980713, -1.8155076503753662, -1.6275684833526611, -1.439629316329956, -1.251690149307251, -1.0637508630752563, -0.8758116960525513, -0.6878725290298462, -0.49993324279785156, -0.3119940757751465, -0.12405538558959961, 0.06388381123542786, 0.2518230080604553, 0.4397622346878052, 0.6277014017105103, 0.8156405687332153, 1.00357985496521, 1.191519021987915, 1.3794581890106201, 1.5673973560333252, 1.7553365230560303, 1.943275809288025, 2.1312150955200195, 2.3191542625427246, 2.5070934295654297, 2.6950325965881348, 2.88297176361084, 3.070910930633545, 3.25885009765625, 3.446789264678955, 3.63472843170166, 3.8226675987243652, 4.01060676574707, 4.198546409606934, 4.3864850997924805, 4.5744242668151855, 4.762363433837891, 4.950302600860596, 5.138241767883301, 5.326180934906006, 5.514120101928711, 5.702059745788574, 5.889998912811279]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 8.0, 11.0, 28.0, 20.0, 30.0, 51.0, 112.0, 163.0, 280.0, 556.0, 1017.0, 2360.0, 6112.0, 23466.0, 277240.0, 3808701.0, 56666.0, 10691.0, 3505.0, 1492.0, 754.0, 373.0, 215.0, 123.0, 95.0, 63.0, 39.0, 21.0, 12.0, 19.0, 12.0, 13.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.09375, -2.024505615234375, -1.95526123046875, -1.886016845703125, -1.8167724609375, -1.747528076171875, -1.67828369140625, -1.609039306640625, -1.539794921875, -1.470550537109375, -1.40130615234375, -1.332061767578125, -1.2628173828125, -1.193572998046875, -1.12432861328125, -1.055084228515625, -0.98583984375, -0.916595458984375, -0.84735107421875, -0.778106689453125, -0.7088623046875, -0.639617919921875, -0.57037353515625, -0.501129150390625, -0.431884765625, -0.362640380859375, -0.29339599609375, -0.224151611328125, -0.1549072265625, -0.085662841796875, -0.01641845703125, 0.052825927734375, 0.1220703125, 0.191314697265625, 0.26055908203125, 0.329803466796875, 0.3990478515625, 0.468292236328125, 0.53753662109375, 0.606781005859375, 0.676025390625, 0.745269775390625, 0.81451416015625, 0.883758544921875, 0.9530029296875, 1.022247314453125, 1.09149169921875, 1.160736083984375, 1.22998046875, 1.299224853515625, 1.36846923828125, 1.437713623046875, 1.5069580078125, 1.576202392578125, 1.64544677734375, 1.714691162109375, 1.783935546875, 1.853179931640625, 1.92242431640625, 1.991668701171875, 2.0609130859375, 2.130157470703125, 2.19940185546875, 2.268646240234375, 2.337890625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 14.0, 21.0, 18.0, 27.0, 33.0, 45.0, 50.0, 50.0, 63.0, 60.0, 82.0, 57.0, 68.0, 63.0, 67.0, 49.0, 34.0, 44.0, 36.0, 21.0, 20.0, 19.0, 12.0, 9.0, 8.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50439453125, -0.486663818359375, -0.46893310546875, -0.451202392578125, -0.4334716796875, -0.415740966796875, -0.39801025390625, -0.380279541015625, -0.362548828125, -0.344818115234375, -0.32708740234375, -0.309356689453125, -0.2916259765625, -0.273895263671875, -0.25616455078125, -0.238433837890625, -0.220703125, -0.202972412109375, -0.18524169921875, -0.167510986328125, -0.1497802734375, -0.132049560546875, -0.11431884765625, -0.096588134765625, -0.078857421875, -0.061126708984375, -0.04339599609375, -0.025665283203125, -0.0079345703125, 0.009796142578125, 0.02752685546875, 0.045257568359375, 0.06298828125, 0.080718994140625, 0.09844970703125, 0.116180419921875, 0.1339111328125, 0.151641845703125, 0.16937255859375, 0.187103271484375, 0.204833984375, 0.222564697265625, 0.24029541015625, 0.258026123046875, 0.2757568359375, 0.293487548828125, 0.31121826171875, 0.328948974609375, 0.3466796875, 0.364410400390625, 0.38214111328125, 0.399871826171875, 0.4176025390625, 0.435333251953125, 0.45306396484375, 0.470794677734375, 0.488525390625, 0.506256103515625, 0.52398681640625, 0.541717529296875, 0.5594482421875, 0.577178955078125, 0.59490966796875, 0.612640380859375, 0.63037109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 12.0, 6.0, 15.0, 17.0, 25.0, 21.0, 29.0, 48.0, 62.0, 73.0, 124.0, 197.0, 315.0, 568.0, 1184.0, 2861.0, 7975.0, 31418.0, 336051.0, 3696737.0, 91796.0, 16124.0, 4799.0, 1834.0, 828.0, 393.0, 218.0, 117.0, 88.0, 67.0, 60.0, 40.0, 38.0, 31.0, 25.0, 11.0, 8.0, 11.0, 16.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0], "bins": [-1.68359375, -1.6344757080078125, -1.585357666015625, -1.5362396240234375, -1.48712158203125, -1.4380035400390625, -1.388885498046875, -1.3397674560546875, -1.2906494140625, -1.2415313720703125, -1.192413330078125, -1.1432952880859375, -1.09417724609375, -1.0450592041015625, -0.995941162109375, -0.9468231201171875, -0.897705078125, -0.8485870361328125, -0.799468994140625, -0.7503509521484375, -0.70123291015625, -0.6521148681640625, -0.602996826171875, -0.5538787841796875, -0.5047607421875, -0.4556427001953125, -0.406524658203125, -0.3574066162109375, -0.30828857421875, -0.2591705322265625, -0.210052490234375, -0.1609344482421875, -0.11181640625, -0.0626983642578125, -0.013580322265625, 0.0355377197265625, 0.08465576171875, 0.1337738037109375, 0.182891845703125, 0.2320098876953125, 0.2811279296875, 0.3302459716796875, 0.379364013671875, 0.4284820556640625, 0.47760009765625, 0.5267181396484375, 0.575836181640625, 0.6249542236328125, 0.674072265625, 0.7231903076171875, 0.772308349609375, 0.8214263916015625, 0.87054443359375, 0.9196624755859375, 0.968780517578125, 1.0178985595703125, 1.0670166015625, 1.1161346435546875, 1.165252685546875, 1.2143707275390625, 1.26348876953125, 1.3126068115234375, 1.361724853515625, 1.4108428955078125, 1.4599609375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 18.0, 31.0, 53.0, 110.0, 473.0, 2730.0, 411.0, 101.0, 52.0, 29.0, 17.0, 8.0, 10.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.748046875, -0.7197723388671875, -0.691497802734375, -0.6632232666015625, -0.63494873046875, -0.6066741943359375, -0.578399658203125, -0.5501251220703125, -0.5218505859375, -0.4935760498046875, -0.465301513671875, -0.4370269775390625, -0.40875244140625, -0.3804779052734375, -0.352203369140625, -0.3239288330078125, -0.295654296875, -0.2673797607421875, -0.239105224609375, -0.2108306884765625, -0.18255615234375, -0.1542816162109375, -0.126007080078125, -0.0977325439453125, -0.0694580078125, -0.0411834716796875, -0.012908935546875, 0.0153656005859375, 0.04364013671875, 0.0719146728515625, 0.100189208984375, 0.1284637451171875, 0.15673828125, 0.1850128173828125, 0.213287353515625, 0.2415618896484375, 0.26983642578125, 0.2981109619140625, 0.326385498046875, 0.3546600341796875, 0.3829345703125, 0.4112091064453125, 0.439483642578125, 0.4677581787109375, 0.49603271484375, 0.5243072509765625, 0.552581787109375, 0.5808563232421875, 0.609130859375, 0.6374053955078125, 0.665679931640625, 0.6939544677734375, 0.72222900390625, 0.7505035400390625, 0.778778076171875, 0.8070526123046875, 0.8353271484375, 0.8636016845703125, 0.891876220703125, 0.9201507568359375, 0.94842529296875, 0.9766998291015625, 1.004974365234375, 1.0332489013671875, 1.0615234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 11.0, 9.0, 46.0, 145.0, 268.0, 290.0, 150.0, 59.0, 9.0, 8.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.002898216247559, -6.840642929077148, -6.6783881187438965, -6.5161333084106445, -6.353878021240234, -6.191622734069824, -6.029367923736572, -5.86711311340332, -5.70485782623291, -5.5426025390625, -5.380347728729248, -5.218092918395996, -5.055837631225586, -4.893582344055176, -4.731327533721924, -4.569072723388672, -4.406817436218262, -4.244562149047852, -4.0823073387146, -3.9200522899627686, -3.7577972412109375, -3.5955421924591064, -3.4332871437072754, -3.2710320949554443, -3.1087770462036133, -2.9465219974517822, -2.784266948699951, -2.62201189994812, -2.459756851196289, -2.297501802444458, -2.135246753692627, -1.972991704940796, -1.8107361793518066, -1.6484811305999756, -1.4862260818481445, -1.3239710330963135, -1.1617159843444824, -0.9994609355926514, -0.8372058868408203, -0.6749508380889893, -0.5126957893371582, -0.35044074058532715, -0.1881856918334961, -0.02593064308166504, 0.13632440567016602, 0.29857945442199707, 0.4608345031738281, 0.6230895519256592, 0.7853446006774902, 0.9475996494293213, 1.1098546981811523, 1.2721097469329834, 1.4343647956848145, 1.5966198444366455, 1.7588748931884766, 1.9211299419403076, 2.0833849906921387, 2.2456400394439697, 2.407895088195801, 2.570150136947632, 2.732405185699463, 2.894660234451294, 3.056915283203125, 3.219170331954956, 3.381425380706787]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 9.0, 10.0, 15.0, 21.0, 33.0, 47.0, 48.0, 72.0, 78.0, 79.0, 89.0, 81.0, 72.0, 77.0, 62.0, 61.0, 41.0, 23.0, 24.0, 19.0, 14.0, 9.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1502106189727783, -3.062445640563965, -2.9746809005737305, -2.886915922164917, -2.7991509437561035, -2.711386203765869, -2.6236212253570557, -2.535856246948242, -2.448091506958008, -2.3603265285491943, -2.27256178855896, -2.1847968101501465, -2.097031831741333, -2.0092668533325195, -1.9215021133422852, -1.8337371349334717, -1.7459721565246582, -1.6582072973251343, -1.5704423189163208, -1.4826774597167969, -1.3949124813079834, -1.3071476221084595, -1.2193827629089355, -1.131617784500122, -1.0438529253005981, -0.9560880064964294, -0.8683230876922607, -0.7805582284927368, -0.6927933096885681, -0.6050283908843994, -0.5172635316848755, -0.4294986128807068, -0.341733455657959, -0.2539685368537903, -0.16620364785194397, -0.07843875885009766, 0.009326159954071045, 0.09709107875823975, 0.18485593795776367, 0.2726208567619324, 0.3603857755661011, 0.4481506943702698, 0.5359156131744385, 0.6236804723739624, 0.7114453911781311, 0.7992103099822998, 0.8869751691818237, 0.9747400879859924, 1.0625050067901611, 1.150269865989685, 1.2380348443984985, 1.3257997035980225, 1.413564682006836, 1.5013295412063599, 1.5890944004058838, 1.6768593788146973, 1.7646242380142212, 1.8523890972137451, 1.9401540756225586, 2.027918815612793, 2.1156837940216064, 2.20344877243042, 2.2912135124206543, 2.3789784908294678, 2.4667434692382812]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 8.0, 7.0, 18.0, 24.0, 28.0, 51.0, 66.0, 85.0, 106.0, 188.0, 223.0, 452.0, 682.0, 1226.0, 2236.0, 4733.0, 10249.0, 27343.0, 81861.0, 239960.0, 387111.0, 190729.0, 62586.0, 21231.0, 8499.0, 3976.0, 1995.0, 1055.0, 648.0, 390.0, 242.0, 153.0, 91.0, 76.0, 67.0, 43.0, 19.0, 26.0, 16.0, 10.0, 9.0, 9.0, 4.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.4296875, -1.3881072998046875, -1.346527099609375, -1.3049468994140625, -1.26336669921875, -1.2217864990234375, -1.180206298828125, -1.1386260986328125, -1.0970458984375, -1.0554656982421875, -1.013885498046875, -0.9723052978515625, -0.93072509765625, -0.8891448974609375, -0.847564697265625, -0.8059844970703125, -0.764404296875, -0.7228240966796875, -0.681243896484375, -0.6396636962890625, -0.59808349609375, -0.5565032958984375, -0.514923095703125, -0.4733428955078125, -0.4317626953125, -0.3901824951171875, -0.348602294921875, -0.3070220947265625, -0.26544189453125, -0.2238616943359375, -0.182281494140625, -0.1407012939453125, -0.09912109375, -0.0575408935546875, -0.015960693359375, 0.0256195068359375, 0.06719970703125, 0.1087799072265625, 0.150360107421875, 0.1919403076171875, 0.2335205078125, 0.2751007080078125, 0.316680908203125, 0.3582611083984375, 0.39984130859375, 0.4414215087890625, 0.483001708984375, 0.5245819091796875, 0.566162109375, 0.6077423095703125, 0.649322509765625, 0.6909027099609375, 0.73248291015625, 0.7740631103515625, 0.815643310546875, 0.8572235107421875, 0.8988037109375, 0.9403839111328125, 0.981964111328125, 1.0235443115234375, 1.06512451171875, 1.1067047119140625, 1.148284912109375, 1.1898651123046875, 1.2314453125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 13.0, 20.0, 28.0, 34.0, 32.0, 36.0, 52.0, 53.0, 69.0, 60.0, 57.0, 86.0, 63.0, 56.0, 62.0, 49.0, 51.0, 31.0, 30.0, 22.0, 20.0, 18.0, 11.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5068359375, -0.4894866943359375, -0.472137451171875, -0.4547882080078125, -0.43743896484375, -0.4200897216796875, -0.402740478515625, -0.3853912353515625, -0.3680419921875, -0.3506927490234375, -0.333343505859375, -0.3159942626953125, -0.29864501953125, -0.2812957763671875, -0.263946533203125, -0.2465972900390625, -0.229248046875, -0.2118988037109375, -0.194549560546875, -0.1772003173828125, -0.15985107421875, -0.1425018310546875, -0.125152587890625, -0.1078033447265625, -0.0904541015625, -0.0731048583984375, -0.055755615234375, -0.0384063720703125, -0.02105712890625, -0.0037078857421875, 0.013641357421875, 0.0309906005859375, 0.04833984375, 0.0656890869140625, 0.083038330078125, 0.1003875732421875, 0.11773681640625, 0.1350860595703125, 0.152435302734375, 0.1697845458984375, 0.1871337890625, 0.2044830322265625, 0.221832275390625, 0.2391815185546875, 0.25653076171875, 0.2738800048828125, 0.291229248046875, 0.3085784912109375, 0.325927734375, 0.3432769775390625, 0.360626220703125, 0.3779754638671875, 0.39532470703125, 0.4126739501953125, 0.430023193359375, 0.4473724365234375, 0.4647216796875, 0.4820709228515625, 0.499420166015625, 0.5167694091796875, 0.53411865234375, 0.5514678955078125, 0.568817138671875, 0.5861663818359375, 0.603515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 9.0, 12.0, 21.0, 15.0, 30.0, 45.0, 65.0, 96.0, 149.0, 292.0, 450.0, 884.0, 2106.0, 6118.0, 25567.0, 151170.0, 586680.0, 225661.0, 36249.0, 7993.0, 2525.0, 1060.0, 561.0, 297.0, 181.0, 103.0, 60.0, 40.0, 40.0, 26.0, 10.0, 15.0, 4.0, 9.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73046875, -1.66998291015625, -1.6094970703125, -1.54901123046875, -1.488525390625, -1.42803955078125, -1.3675537109375, -1.30706787109375, -1.24658203125, -1.18609619140625, -1.1256103515625, -1.06512451171875, -1.004638671875, -0.94415283203125, -0.8836669921875, -0.82318115234375, -0.7626953125, -0.70220947265625, -0.6417236328125, -0.58123779296875, -0.520751953125, -0.46026611328125, -0.3997802734375, -0.33929443359375, -0.27880859375, -0.21832275390625, -0.1578369140625, -0.09735107421875, -0.036865234375, 0.02362060546875, 0.0841064453125, 0.14459228515625, 0.205078125, 0.26556396484375, 0.3260498046875, 0.38653564453125, 0.447021484375, 0.50750732421875, 0.5679931640625, 0.62847900390625, 0.68896484375, 0.74945068359375, 0.8099365234375, 0.87042236328125, 0.930908203125, 0.99139404296875, 1.0518798828125, 1.11236572265625, 1.1728515625, 1.23333740234375, 1.2938232421875, 1.35430908203125, 1.414794921875, 1.47528076171875, 1.5357666015625, 1.59625244140625, 1.65673828125, 1.71722412109375, 1.7777099609375, 1.83819580078125, 1.898681640625, 1.95916748046875, 2.0196533203125, 2.08013916015625, 2.140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 9.0, 15.0, 12.0, 22.0, 27.0, 33.0, 34.0, 36.0, 48.0, 35.0, 68.0, 75.0, 59.0, 69.0, 73.0, 60.0, 48.0, 37.0, 46.0, 41.0, 23.0, 27.0, 20.0, 12.0, 12.0, 11.0, 8.0, 2.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.88671875, -2.805511474609375, -2.72430419921875, -2.643096923828125, -2.5618896484375, -2.480682373046875, -2.39947509765625, -2.318267822265625, -2.237060546875, -2.155853271484375, -2.07464599609375, -1.993438720703125, -1.9122314453125, -1.831024169921875, -1.74981689453125, -1.668609619140625, -1.58740234375, -1.506195068359375, -1.42498779296875, -1.343780517578125, -1.2625732421875, -1.181365966796875, -1.10015869140625, -1.018951416015625, -0.937744140625, -0.856536865234375, -0.77532958984375, -0.694122314453125, -0.6129150390625, -0.531707763671875, -0.45050048828125, -0.369293212890625, -0.2880859375, -0.206878662109375, -0.12567138671875, -0.044464111328125, 0.0367431640625, 0.117950439453125, 0.19915771484375, 0.280364990234375, 0.361572265625, 0.442779541015625, 0.52398681640625, 0.605194091796875, 0.6864013671875, 0.767608642578125, 0.84881591796875, 0.930023193359375, 1.01123046875, 1.092437744140625, 1.17364501953125, 1.254852294921875, 1.3360595703125, 1.417266845703125, 1.49847412109375, 1.579681396484375, 1.660888671875, 1.742095947265625, 1.82330322265625, 1.904510498046875, 1.9857177734375, 2.066925048828125, 2.14813232421875, 2.229339599609375, 2.310546875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 10.0, 4.0, 17.0, 18.0, 26.0, 34.0, 59.0, 90.0, 136.0, 228.0, 421.0, 720.0, 1484.0, 3708.0, 13822.0, 101838.0, 794963.0, 109448.0, 14242.0, 3834.0, 1562.0, 778.0, 413.0, 236.0, 139.0, 104.0, 52.0, 38.0, 23.0, 20.0, 23.0, 13.0, 10.0, 7.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.04296875, -1.0087890625, -0.974609375, -0.9404296875, -0.90625, -0.8720703125, -0.837890625, -0.8037109375, -0.76953125, -0.7353515625, -0.701171875, -0.6669921875, -0.6328125, -0.5986328125, -0.564453125, -0.5302734375, -0.49609375, -0.4619140625, -0.427734375, -0.3935546875, -0.359375, -0.3251953125, -0.291015625, -0.2568359375, -0.22265625, -0.1884765625, -0.154296875, -0.1201171875, -0.0859375, -0.0517578125, -0.017578125, 0.0166015625, 0.05078125, 0.0849609375, 0.119140625, 0.1533203125, 0.1875, 0.2216796875, 0.255859375, 0.2900390625, 0.32421875, 0.3583984375, 0.392578125, 0.4267578125, 0.4609375, 0.4951171875, 0.529296875, 0.5634765625, 0.59765625, 0.6318359375, 0.666015625, 0.7001953125, 0.734375, 0.7685546875, 0.802734375, 0.8369140625, 0.87109375, 0.9052734375, 0.939453125, 0.9736328125, 1.0078125, 1.0419921875, 1.076171875, 1.1103515625, 1.14453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 6.0, 7.0, 5.0, 6.0, 14.0, 10.0, 19.0, 26.0, 31.0, 50.0, 53.0, 60.0, 136.0, 188.0, 109.0, 80.0, 46.0, 39.0, 27.0, 21.0, 18.0, 22.0, 11.0, 12.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00023317337036132812, -0.0002269502729177475, -0.00022072717547416687, -0.00021450407803058624, -0.00020828098058700562, -0.000202057883143425, -0.00019583478569984436, -0.00018961168825626373, -0.0001833885908126831, -0.00017716549336910248, -0.00017094239592552185, -0.00016471929848194122, -0.0001584962010383606, -0.00015227310359477997, -0.00014605000615119934, -0.0001398269087076187, -0.00013360381126403809, -0.00012738071382045746, -0.00012115761637687683, -0.0001149345189332962, -0.00010871142148971558, -0.00010248832404613495, -9.626522660255432e-05, -9.00421291589737e-05, -8.381903171539307e-05, -7.759593427181244e-05, -7.137283682823181e-05, -6.514973938465118e-05, -5.892664194107056e-05, -5.270354449748993e-05, -4.64804470539093e-05, -4.0257349610328674e-05, -3.403425216674805e-05, -2.781115472316742e-05, -2.1588057279586792e-05, -1.5364959836006165e-05, -9.141862392425537e-06, -2.9187649488449097e-06, 3.3043324947357178e-06, 9.527429938316345e-06, 1.5750527381896973e-05, 2.19736248254776e-05, 2.8196722269058228e-05, 3.4419819712638855e-05, 4.064291715621948e-05, 4.686601459980011e-05, 5.308911204338074e-05, 5.9312209486961365e-05, 6.553530693054199e-05, 7.175840437412262e-05, 7.798150181770325e-05, 8.420459926128387e-05, 9.04276967048645e-05, 9.665079414844513e-05, 0.00010287389159202576, 0.00010909698903560638, 0.00011532008647918701, 0.00012154318392276764, 0.00012776628136634827, 0.0001339893788099289, 0.00014021247625350952, 0.00014643557369709015, 0.00015265867114067078, 0.0001588817685842514, 0.00016510486602783203]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 1.0, 7.0, 19.0, 14.0, 29.0, 61.0, 106.0, 218.0, 536.0, 1367.0, 5340.0, 49487.0, 833183.0, 144696.0, 10071.0, 2114.0, 713.0, 295.0, 124.0, 76.0, 43.0, 19.0, 10.0, 6.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.012939453125, -0.96826171875, -0.923583984375, -0.87890625, -0.834228515625, -0.78955078125, -0.744873046875, -0.7001953125, -0.655517578125, -0.61083984375, -0.566162109375, -0.521484375, -0.476806640625, -0.43212890625, -0.387451171875, -0.3427734375, -0.298095703125, -0.25341796875, -0.208740234375, -0.1640625, -0.119384765625, -0.07470703125, -0.030029296875, 0.0146484375, 0.059326171875, 0.10400390625, 0.148681640625, 0.193359375, 0.238037109375, 0.28271484375, 0.327392578125, 0.3720703125, 0.416748046875, 0.46142578125, 0.506103515625, 0.55078125, 0.595458984375, 0.64013671875, 0.684814453125, 0.7294921875, 0.774169921875, 0.81884765625, 0.863525390625, 0.908203125, 0.952880859375, 0.99755859375, 1.042236328125, 1.0869140625, 1.131591796875, 1.17626953125, 1.220947265625, 1.265625, 1.310302734375, 1.35498046875, 1.399658203125, 1.4443359375, 1.489013671875, 1.53369140625, 1.578369140625, 1.623046875, 1.667724609375, 1.71240234375, 1.757080078125, 1.8017578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 4.0, 6.0, 14.0, 14.0, 33.0, 43.0, 92.0, 127.0, 191.0, 174.0, 105.0, 69.0, 34.0, 27.0, 8.0, 8.0, 14.0, 5.0, 3.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.148529052734375, -1.10858154296875, -1.068634033203125, -1.0286865234375, -0.988739013671875, -0.94879150390625, -0.908843994140625, -0.868896484375, -0.828948974609375, -0.78900146484375, -0.749053955078125, -0.7091064453125, -0.669158935546875, -0.62921142578125, -0.589263916015625, -0.54931640625, -0.509368896484375, -0.46942138671875, -0.429473876953125, -0.3895263671875, -0.349578857421875, -0.30963134765625, -0.269683837890625, -0.229736328125, -0.189788818359375, -0.14984130859375, -0.109893798828125, -0.0699462890625, -0.029998779296875, 0.00994873046875, 0.049896240234375, 0.08984375, 0.129791259765625, 0.16973876953125, 0.209686279296875, 0.2496337890625, 0.289581298828125, 0.32952880859375, 0.369476318359375, 0.409423828125, 0.449371337890625, 0.48931884765625, 0.529266357421875, 0.5692138671875, 0.609161376953125, 0.64910888671875, 0.689056396484375, 0.72900390625, 0.768951416015625, 0.80889892578125, 0.848846435546875, 0.8887939453125, 0.928741455078125, 0.96868896484375, 1.008636474609375, 1.048583984375, 1.088531494140625, 1.12847900390625, 1.168426513671875, 1.2083740234375, 1.248321533203125, 1.28826904296875, 1.328216552734375, 1.3681640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 2.0, 17.0, 44.0, 84.0, 129.0, 202.0, 172.0, 144.0, 100.0, 52.0, 32.0, 11.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.7243709564209, -21.122425079345703, -20.520479202270508, -19.91853141784668, -19.316585540771484, -18.71463966369629, -18.112693786621094, -17.5107479095459, -16.908802032470703, -16.306856155395508, -15.704909324645996, -15.1029634475708, -14.501016616821289, -13.899070739746094, -13.297124862670898, -12.695178985595703, -12.093231201171875, -11.49128532409668, -10.889338493347168, -10.287392616271973, -9.685445785522461, -9.083499908447266, -8.48155403137207, -7.879607677459717, -7.277661323547363, -6.67571496963501, -6.073768615722656, -5.471822738647461, -4.869876384735107, -4.267930030822754, -3.6659839153289795, -3.064037799835205, -2.4620914459228516, -1.8601452112197876, -1.2581989765167236, -0.6562527418136597, -0.0543065071105957, 0.5476398468017578, 1.1495859622955322, 1.7515320777893066, 2.35347843170166, 2.9554247856140137, 3.557370901107788, 4.1593170166015625, 4.761263370513916, 5.3632097244262695, 5.965155601501465, 6.567101955413818, 7.169048309326172, 7.770994663238525, 8.372941017150879, 8.974886894226074, 9.576833724975586, 10.178779602050781, 10.780725479125977, 11.382671356201172, 11.984618186950684, 12.586564064025879, 13.18851089477539, 13.790456771850586, 14.392402648925781, 14.994349479675293, 15.596295356750488, 16.1982421875, 16.800188064575195]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 4.0, 7.0, 11.0, 3.0, 12.0, 9.0, 12.0, 14.0, 16.0, 26.0, 19.0, 31.0, 25.0, 27.0, 32.0, 36.0, 37.0, 41.0, 49.0, 40.0, 34.0, 50.0, 44.0, 39.0, 30.0, 48.0, 43.0, 40.0, 42.0, 22.0, 24.0, 21.0, 29.0, 20.0, 6.0, 8.0, 13.0, 6.0, 9.0, 7.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.322471618652344, -10.965357780456543, -10.608244895935059, -10.251131057739258, -9.894017219543457, -9.536903381347656, -9.179790496826172, -8.822676658630371, -8.46556282043457, -8.10844898223877, -7.751335620880127, -7.394222259521484, -7.037108421325684, -6.679995059967041, -6.322881698608398, -5.965767860412598, -5.608654499053955, -5.2515411376953125, -4.894427299499512, -4.537313938140869, -4.180200099945068, -3.823086738586426, -3.465973138809204, -3.1088595390319824, -2.7517459392547607, -2.394632339477539, -2.0375187397003174, -1.6804052591323853, -1.3232916593551636, -0.9661780595779419, -0.6090645790100098, -0.2519509792327881, 0.1051626205444336, 0.4622761905193329, 0.8193897604942322, 1.176503300666809, 1.5336169004440308, 1.8907305002212524, 2.2478439807891846, 2.6049575805664062, 2.962071180343628, 3.3191847801208496, 3.6762983798980713, 4.033411979675293, 4.3905253410339355, 4.747639179229736, 5.104752540588379, 5.46186637878418, 5.818979740142822, 6.176093101501465, 6.533206939697266, 6.890320301055908, 7.247434139251709, 7.604547500610352, 7.961661338806152, 8.318775177001953, 8.675888061523438, 9.033001899719238, 9.390114784240723, 9.747228622436523, 10.104342460632324, 10.461456298828125, 10.81856918334961, 11.17568302154541, 11.532796859741211]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 7.0, 8.0, 9.0, 23.0, 29.0, 48.0, 47.0, 75.0, 135.0, 266.0, 568.0, 1424.0, 4033.0, 17013.0, 187899.0, 3883523.0, 82783.0, 11043.0, 3053.0, 1140.0, 449.0, 266.0, 142.0, 90.0, 66.0, 35.0, 26.0, 21.0, 24.0, 7.0, 11.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.181640625, -2.10736083984375, -2.0330810546875, -1.95880126953125, -1.884521484375, -1.81024169921875, -1.7359619140625, -1.66168212890625, -1.58740234375, -1.51312255859375, -1.4388427734375, -1.36456298828125, -1.290283203125, -1.21600341796875, -1.1417236328125, -1.06744384765625, -0.9931640625, -0.91888427734375, -0.8446044921875, -0.77032470703125, -0.696044921875, -0.62176513671875, -0.5474853515625, -0.47320556640625, -0.39892578125, -0.32464599609375, -0.2503662109375, -0.17608642578125, -0.101806640625, -0.02752685546875, 0.0467529296875, 0.12103271484375, 0.1953125, 0.26959228515625, 0.3438720703125, 0.41815185546875, 0.492431640625, 0.56671142578125, 0.6409912109375, 0.71527099609375, 0.78955078125, 0.86383056640625, 0.9381103515625, 1.01239013671875, 1.086669921875, 1.16094970703125, 1.2352294921875, 1.30950927734375, 1.3837890625, 1.45806884765625, 1.5323486328125, 1.60662841796875, 1.680908203125, 1.75518798828125, 1.8294677734375, 1.90374755859375, 1.97802734375, 2.05230712890625, 2.1265869140625, 2.20086669921875, 2.275146484375, 2.34942626953125, 2.4237060546875, 2.49798583984375, 2.572265625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 4.0, 10.0, 17.0, 23.0, 24.0, 19.0, 42.0, 36.0, 39.0, 37.0, 67.0, 66.0, 68.0, 65.0, 60.0, 54.0, 58.0, 51.0, 50.0, 47.0, 35.0, 30.0, 29.0, 14.0, 12.0, 9.0, 14.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.569549560546875, -0.54974365234375, -0.529937744140625, -0.5101318359375, -0.490325927734375, -0.47052001953125, -0.450714111328125, -0.430908203125, -0.411102294921875, -0.39129638671875, -0.371490478515625, -0.3516845703125, -0.331878662109375, -0.31207275390625, -0.292266845703125, -0.2724609375, -0.252655029296875, -0.23284912109375, -0.213043212890625, -0.1932373046875, -0.173431396484375, -0.15362548828125, -0.133819580078125, -0.114013671875, -0.094207763671875, -0.07440185546875, -0.054595947265625, -0.0347900390625, -0.014984130859375, 0.00482177734375, 0.024627685546875, 0.04443359375, 0.064239501953125, 0.08404541015625, 0.103851318359375, 0.1236572265625, 0.143463134765625, 0.16326904296875, 0.183074951171875, 0.202880859375, 0.222686767578125, 0.24249267578125, 0.262298583984375, 0.2821044921875, 0.301910400390625, 0.32171630859375, 0.341522216796875, 0.361328125, 0.381134033203125, 0.40093994140625, 0.420745849609375, 0.4405517578125, 0.460357666015625, 0.48016357421875, 0.499969482421875, 0.519775390625, 0.539581298828125, 0.55938720703125, 0.579193115234375, 0.5989990234375, 0.618804931640625, 0.63861083984375, 0.658416748046875, 0.67822265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 9.0, 4.0, 20.0, 22.0, 29.0, 50.0, 61.0, 103.0, 148.0, 181.0, 290.0, 477.0, 737.0, 1589.0, 4164.0, 13649.0, 71377.0, 2238991.0, 1772971.0, 68225.0, 13474.0, 4005.0, 1610.0, 732.0, 453.0, 281.0, 203.0, 127.0, 88.0, 50.0, 55.0, 35.0, 26.0, 16.0, 18.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.419921875, -1.3725738525390625, -1.325225830078125, -1.2778778076171875, -1.23052978515625, -1.1831817626953125, -1.135833740234375, -1.0884857177734375, -1.0411376953125, -0.9937896728515625, -0.946441650390625, -0.8990936279296875, -0.85174560546875, -0.8043975830078125, -0.757049560546875, -0.7097015380859375, -0.662353515625, -0.6150054931640625, -0.567657470703125, -0.5203094482421875, -0.47296142578125, -0.4256134033203125, -0.378265380859375, -0.3309173583984375, -0.2835693359375, -0.2362213134765625, -0.188873291015625, -0.1415252685546875, -0.09417724609375, -0.0468292236328125, 0.000518798828125, 0.0478668212890625, 0.09521484375, 0.1425628662109375, 0.189910888671875, 0.2372589111328125, 0.28460693359375, 0.3319549560546875, 0.379302978515625, 0.4266510009765625, 0.4739990234375, 0.5213470458984375, 0.568695068359375, 0.6160430908203125, 0.66339111328125, 0.7107391357421875, 0.758087158203125, 0.8054351806640625, 0.852783203125, 0.9001312255859375, 0.947479248046875, 0.9948272705078125, 1.04217529296875, 1.0895233154296875, 1.136871337890625, 1.1842193603515625, 1.2315673828125, 1.2789154052734375, 1.326263427734375, 1.3736114501953125, 1.42095947265625, 1.4683074951171875, 1.515655517578125, 1.5630035400390625, 1.6103515625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 10.0, 10.0, 24.0, 67.0, 137.0, 545.0, 2481.0, 512.0, 146.0, 63.0, 31.0, 17.0, 7.0, 4.0, 9.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3662109375, -1.3253936767578125, -1.284576416015625, -1.2437591552734375, -1.20294189453125, -1.1621246337890625, -1.121307373046875, -1.0804901123046875, -1.0396728515625, -0.9988555908203125, -0.958038330078125, -0.9172210693359375, -0.87640380859375, -0.8355865478515625, -0.794769287109375, -0.7539520263671875, -0.713134765625, -0.6723175048828125, -0.631500244140625, -0.5906829833984375, -0.54986572265625, -0.5090484619140625, -0.468231201171875, -0.4274139404296875, -0.3865966796875, -0.3457794189453125, -0.304962158203125, -0.2641448974609375, -0.22332763671875, -0.1825103759765625, -0.141693115234375, -0.1008758544921875, -0.06005859375, -0.0192413330078125, 0.021575927734375, 0.0623931884765625, 0.10321044921875, 0.1440277099609375, 0.184844970703125, 0.2256622314453125, 0.2664794921875, 0.3072967529296875, 0.348114013671875, 0.3889312744140625, 0.42974853515625, 0.4705657958984375, 0.511383056640625, 0.5522003173828125, 0.593017578125, 0.6338348388671875, 0.674652099609375, 0.7154693603515625, 0.75628662109375, 0.7971038818359375, 0.837921142578125, 0.8787384033203125, 0.9195556640625, 0.9603729248046875, 1.001190185546875, 1.0420074462890625, 1.08282470703125, 1.1236419677734375, 1.164459228515625, 1.2052764892578125, 1.24609375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 37.0, 86.0, 252.0, 345.0, 185.0, 61.0, 23.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4050207138061523, -2.1402840614318848, -1.8755474090576172, -1.6108107566833496, -1.346074104309082, -1.0813374519348145, -0.8166007995605469, -0.5518641471862793, -0.2871274948120117, -0.02239084243774414, 0.24234580993652344, 0.507082462310791, 0.7718191146850586, 1.0365557670593262, 1.3012924194335938, 1.5660290718078613, 1.830765724182129, 2.0955023765563965, 2.360239028930664, 2.6249756813049316, 2.889712333679199, 3.154448986053467, 3.4191856384277344, 3.683922290802002, 3.9486589431762695, 4.213395595550537, 4.478132247924805, 4.742868900299072, 5.00760555267334, 5.272342205047607, 5.537078857421875, 5.801815509796143, 6.066553115844727, 6.331289768218994, 6.596026420593262, 6.860763072967529, 7.125499725341797, 7.3902363777160645, 7.654973030090332, 7.9197096824646, 8.184446334838867, 8.449182510375977, 8.713919639587402, 8.978656768798828, 9.243392944335938, 9.508129119873047, 9.772866249084473, 10.037603378295898, 10.302339553833008, 10.567075729370117, 10.831812858581543, 11.096549987792969, 11.361286163330078, 11.626022338867188, 11.890759468078613, 12.155496597290039, 12.420232772827148, 12.684968948364258, 12.949706077575684, 13.21444320678711, 13.479179382324219, 13.743915557861328, 14.008652687072754, 14.27338981628418, 14.538125991821289]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 13.0, 15.0, 13.0, 18.0, 24.0, 31.0, 39.0, 39.0, 42.0, 51.0, 52.0, 53.0, 61.0, 60.0, 64.0, 70.0, 66.0, 36.0, 48.0, 37.0, 39.0, 32.0, 27.0, 22.0, 16.0, 8.0, 9.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6382036209106445, -2.542146921157837, -2.4460902214050293, -2.3500335216522217, -2.253976821899414, -2.1579201221466064, -2.061863422393799, -1.9658067226409912, -1.8697500228881836, -1.773693323135376, -1.6776366233825684, -1.5815799236297607, -1.4855232238769531, -1.3894665241241455, -1.293409824371338, -1.1973531246185303, -1.101296305656433, -1.0052396059036255, -0.9091829061508179, -0.8131262063980103, -0.7170695066452026, -0.621012806892395, -0.5249560475349426, -0.428899347782135, -0.3328426480293274, -0.23678594827651978, -0.14072923362255096, -0.04467251896858215, 0.051384180784225464, 0.14744088053703308, 0.24349761009216309, 0.3395543098449707, 0.4356110095977783, 0.5316677093505859, 0.6277244091033936, 0.7237811088562012, 0.8198378086090088, 0.9158945083618164, 1.011951208114624, 1.1080079078674316, 1.2040646076202393, 1.3001213073730469, 1.3961780071258545, 1.492234706878662, 1.5882914066314697, 1.6843481063842773, 1.780404806137085, 1.8764615058898926, 1.9725183248519897, 2.068575143814087, 2.1646318435668945, 2.260688543319702, 2.3567452430725098, 2.4528019428253174, 2.548858642578125, 2.6449153423309326, 2.7409720420837402, 2.837028741836548, 2.9330854415893555, 3.029142141342163, 3.1251988410949707, 3.2212555408477783, 3.317312240600586, 3.4133689403533936, 3.509425640106201]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 7.0, 7.0, 10.0, 14.0, 17.0, 31.0, 29.0, 65.0, 88.0, 143.0, 221.0, 328.0, 538.0, 987.0, 1808.0, 3524.0, 7512.0, 18998.0, 52313.0, 148402.0, 310873.0, 294023.0, 131616.0, 45920.0, 16931.0, 6924.0, 3159.0, 1652.0, 927.0, 535.0, 308.0, 216.0, 139.0, 87.0, 69.0, 34.0, 19.0, 21.0, 15.0, 10.0, 8.0, 6.0, 5.0, 9.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.4951171875, -1.4510650634765625, -1.407012939453125, -1.3629608154296875, -1.31890869140625, -1.2748565673828125, -1.230804443359375, -1.1867523193359375, -1.1427001953125, -1.0986480712890625, -1.054595947265625, -1.0105438232421875, -0.96649169921875, -0.9224395751953125, -0.878387451171875, -0.8343353271484375, -0.790283203125, -0.7462310791015625, -0.702178955078125, -0.6581268310546875, -0.61407470703125, -0.5700225830078125, -0.525970458984375, -0.4819183349609375, -0.4378662109375, -0.3938140869140625, -0.349761962890625, -0.3057098388671875, -0.26165771484375, -0.2176055908203125, -0.173553466796875, -0.1295013427734375, -0.08544921875, -0.0413970947265625, 0.002655029296875, 0.0467071533203125, 0.09075927734375, 0.1348114013671875, 0.178863525390625, 0.2229156494140625, 0.2669677734375, 0.3110198974609375, 0.355072021484375, 0.3991241455078125, 0.44317626953125, 0.4872283935546875, 0.531280517578125, 0.5753326416015625, 0.619384765625, 0.6634368896484375, 0.707489013671875, 0.7515411376953125, 0.79559326171875, 0.8396453857421875, 0.883697509765625, 0.9277496337890625, 0.9718017578125, 1.0158538818359375, 1.059906005859375, 1.1039581298828125, 1.14801025390625, 1.1920623779296875, 1.236114501953125, 1.2801666259765625, 1.32421875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 11.0, 7.0, 15.0, 22.0, 20.0, 22.0, 18.0, 37.0, 35.0, 53.0, 51.0, 50.0, 60.0, 69.0, 64.0, 54.0, 59.0, 62.0, 46.0, 37.0, 51.0, 29.0, 34.0, 19.0, 22.0, 8.0, 12.0, 8.0, 5.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5407028198242188, -0.5223236083984375, -0.5039443969726562, -0.485565185546875, -0.46718597412109375, -0.4488067626953125, -0.43042755126953125, -0.41204833984375, -0.39366912841796875, -0.3752899169921875, -0.35691070556640625, -0.338531494140625, -0.32015228271484375, -0.3017730712890625, -0.28339385986328125, -0.2650146484375, -0.24663543701171875, -0.2282562255859375, -0.20987701416015625, -0.191497802734375, -0.17311859130859375, -0.1547393798828125, -0.13636016845703125, -0.11798095703125, -0.09960174560546875, -0.0812225341796875, -0.06284332275390625, -0.044464111328125, -0.02608489990234375, -0.0077056884765625, 0.01067352294921875, 0.029052734375, 0.04743194580078125, 0.0658111572265625, 0.08419036865234375, 0.102569580078125, 0.12094879150390625, 0.1393280029296875, 0.15770721435546875, 0.17608642578125, 0.19446563720703125, 0.2128448486328125, 0.23122406005859375, 0.249603271484375, 0.26798248291015625, 0.2863616943359375, 0.30474090576171875, 0.3231201171875, 0.34149932861328125, 0.3598785400390625, 0.37825775146484375, 0.396636962890625, 0.41501617431640625, 0.4333953857421875, 0.45177459716796875, 0.47015380859375, 0.48853302001953125, 0.5069122314453125, 0.5252914428710938, 0.543670654296875, 0.5620498657226562, 0.5804290771484375, 0.5988082885742188, 0.6171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 12.0, 16.0, 21.0, 28.0, 29.0, 56.0, 84.0, 137.0, 196.0, 303.0, 586.0, 1233.0, 3182.0, 11754.0, 65663.0, 418752.0, 453693.0, 73673.0, 12895.0, 3369.0, 1285.0, 640.0, 344.0, 210.0, 148.0, 80.0, 46.0, 43.0, 24.0, 18.0, 12.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.861663818359375, -2.77996826171875, -2.698272705078125, -2.6165771484375, -2.534881591796875, -2.45318603515625, -2.371490478515625, -2.289794921875, -2.208099365234375, -2.12640380859375, -2.044708251953125, -1.9630126953125, -1.881317138671875, -1.79962158203125, -1.717926025390625, -1.63623046875, -1.554534912109375, -1.47283935546875, -1.391143798828125, -1.3094482421875, -1.227752685546875, -1.14605712890625, -1.064361572265625, -0.982666015625, -0.900970458984375, -0.81927490234375, -0.737579345703125, -0.6558837890625, -0.574188232421875, -0.49249267578125, -0.410797119140625, -0.3291015625, -0.247406005859375, -0.16571044921875, -0.084014892578125, -0.0023193359375, 0.079376220703125, 0.16107177734375, 0.242767333984375, 0.324462890625, 0.406158447265625, 0.48785400390625, 0.569549560546875, 0.6512451171875, 0.732940673828125, 0.81463623046875, 0.896331787109375, 0.97802734375, 1.059722900390625, 1.14141845703125, 1.223114013671875, 1.3048095703125, 1.386505126953125, 1.46820068359375, 1.549896240234375, 1.631591796875, 1.713287353515625, 1.79498291015625, 1.876678466796875, 1.9583740234375, 2.040069580078125, 2.12176513671875, 2.203460693359375, 2.28515625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 9.0, 9.0, 11.0, 15.0, 24.0, 35.0, 27.0, 41.0, 37.0, 48.0, 52.0, 57.0, 56.0, 50.0, 46.0, 50.0, 60.0, 47.0, 53.0, 30.0, 39.0, 38.0, 31.0, 17.0, 29.0, 16.0, 14.0, 14.0, 8.0, 8.0, 8.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.5689697265625, -2.466064453125, -2.3631591796875, -2.26025390625, -2.1573486328125, -2.054443359375, -1.9515380859375, -1.8486328125, -1.7457275390625, -1.642822265625, -1.5399169921875, -1.43701171875, -1.3341064453125, -1.231201171875, -1.1282958984375, -1.025390625, -0.9224853515625, -0.819580078125, -0.7166748046875, -0.61376953125, -0.5108642578125, -0.407958984375, -0.3050537109375, -0.2021484375, -0.0992431640625, 0.003662109375, 0.1065673828125, 0.20947265625, 0.3123779296875, 0.415283203125, 0.5181884765625, 0.62109375, 0.7239990234375, 0.826904296875, 0.9298095703125, 1.03271484375, 1.1356201171875, 1.238525390625, 1.3414306640625, 1.4443359375, 1.5472412109375, 1.650146484375, 1.7530517578125, 1.85595703125, 1.9588623046875, 2.061767578125, 2.1646728515625, 2.267578125, 2.3704833984375, 2.473388671875, 2.5762939453125, 2.67919921875, 2.7821044921875, 2.885009765625, 2.9879150390625, 3.0908203125, 3.1937255859375, 3.296630859375, 3.3995361328125, 3.50244140625, 3.6053466796875, 3.708251953125, 3.8111572265625, 3.9140625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 6.0, 3.0, 6.0, 13.0, 16.0, 25.0, 19.0, 34.0, 49.0, 90.0, 159.0, 316.0, 717.0, 2094.0, 8894.0, 86749.0, 751073.0, 179172.0, 14493.0, 2856.0, 918.0, 364.0, 196.0, 91.0, 60.0, 33.0, 37.0, 24.0, 10.0, 10.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5439453125, -1.4980316162109375, -1.452117919921875, -1.4062042236328125, -1.36029052734375, -1.3143768310546875, -1.268463134765625, -1.2225494384765625, -1.1766357421875, -1.1307220458984375, -1.084808349609375, -1.0388946533203125, -0.99298095703125, -0.9470672607421875, -0.901153564453125, -0.8552398681640625, -0.809326171875, -0.7634124755859375, -0.717498779296875, -0.6715850830078125, -0.62567138671875, -0.5797576904296875, -0.533843994140625, -0.4879302978515625, -0.4420166015625, -0.3961029052734375, -0.350189208984375, -0.3042755126953125, -0.25836181640625, -0.2124481201171875, -0.166534423828125, -0.1206207275390625, -0.07470703125, -0.0287933349609375, 0.017120361328125, 0.0630340576171875, 0.10894775390625, 0.1548614501953125, 0.200775146484375, 0.2466888427734375, 0.2926025390625, 0.3385162353515625, 0.384429931640625, 0.4303436279296875, 0.47625732421875, 0.5221710205078125, 0.568084716796875, 0.6139984130859375, 0.659912109375, 0.7058258056640625, 0.751739501953125, 0.7976531982421875, 0.84356689453125, 0.8894805908203125, 0.935394287109375, 0.9813079833984375, 1.0272216796875, 1.0731353759765625, 1.119049072265625, 1.1649627685546875, 1.21087646484375, 1.2567901611328125, 1.302703857421875, 1.3486175537109375, 1.39453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 21.0, 31.0, 37.0, 32.0, 55.0, 70.0, 77.0, 93.0, 87.0, 87.0, 106.0, 73.0, 50.0, 50.0, 37.0, 21.0, 9.0, 14.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001678466796875, -0.00016132742166519165, -0.0001548081636428833, -0.00014828890562057495, -0.0001417696475982666, -0.00013525038957595825, -0.0001287311315536499, -0.00012221187353134155, -0.0001156926155090332, -0.00010917335748672485, -0.0001026540994644165, -9.613484144210815e-05, -8.96155834197998e-05, -8.309632539749146e-05, -7.65770673751831e-05, -7.005780935287476e-05, -6.35385513305664e-05, -5.701929330825806e-05, -5.050003528594971e-05, -4.398077726364136e-05, -3.746151924133301e-05, -3.094226121902466e-05, -2.442300319671631e-05, -1.790374517440796e-05, -1.138448715209961e-05, -4.86522912979126e-06, 1.6540288925170898e-06, 8.17328691482544e-06, 1.4692544937133789e-05, 2.121180295944214e-05, 2.7731060981750488e-05, 3.425031900405884e-05, 4.076957702636719e-05, 4.728883504867554e-05, 5.380809307098389e-05, 6.0327351093292236e-05, 6.684660911560059e-05, 7.336586713790894e-05, 7.988512516021729e-05, 8.640438318252563e-05, 9.292364120483398e-05, 9.944289922714233e-05, 0.00010596215724945068, 0.00011248141527175903, 0.00011900067329406738, 0.00012551993131637573, 0.00013203918933868408, 0.00013855844736099243, 0.00014507770538330078, 0.00015159696340560913, 0.00015811622142791748, 0.00016463547945022583, 0.00017115473747253418, 0.00017767399549484253, 0.00018419325351715088, 0.00019071251153945923, 0.00019723176956176758, 0.00020375102758407593, 0.00021027028560638428, 0.00021678954362869263, 0.00022330880165100098, 0.00022982805967330933, 0.00023634731769561768, 0.00024286657571792603, 0.0002493858337402344]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 10.0, 11.0, 15.0, 21.0, 26.0, 34.0, 44.0, 70.0, 80.0, 155.0, 196.0, 250.0, 421.0, 670.0, 1145.0, 2144.0, 5080.0, 13992.0, 47643.0, 172045.0, 432623.0, 260102.0, 76432.0, 21414.0, 7096.0, 3017.0, 1422.0, 816.0, 501.0, 328.0, 211.0, 157.0, 100.0, 69.0, 50.0, 31.0, 34.0, 23.0, 15.0, 17.0, 10.0, 8.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 6.0], "bins": [-0.68896484375, -0.6685104370117188, -0.6480560302734375, -0.6276016235351562, -0.607147216796875, -0.5866928100585938, -0.5662384033203125, -0.5457839965820312, -0.52532958984375, -0.5048751831054688, -0.4844207763671875, -0.46396636962890625, -0.443511962890625, -0.42305755615234375, -0.4026031494140625, -0.38214874267578125, -0.3616943359375, -0.34123992919921875, -0.3207855224609375, -0.30033111572265625, -0.279876708984375, -0.25942230224609375, -0.2389678955078125, -0.21851348876953125, -0.19805908203125, -0.17760467529296875, -0.1571502685546875, -0.13669586181640625, -0.116241455078125, -0.09578704833984375, -0.0753326416015625, -0.05487823486328125, -0.034423828125, -0.01396942138671875, 0.0064849853515625, 0.02693939208984375, 0.047393798828125, 0.06784820556640625, 0.0883026123046875, 0.10875701904296875, 0.12921142578125, 0.14966583251953125, 0.1701202392578125, 0.19057464599609375, 0.211029052734375, 0.23148345947265625, 0.2519378662109375, 0.27239227294921875, 0.2928466796875, 0.31330108642578125, 0.3337554931640625, 0.35420989990234375, 0.374664306640625, 0.39511871337890625, 0.4155731201171875, 0.43602752685546875, 0.45648193359375, 0.47693634033203125, 0.4973907470703125, 0.5178451538085938, 0.538299560546875, 0.5587539672851562, 0.5792083740234375, 0.5996627807617188, 0.6201171875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 8.0, 6.0, 15.0, 15.0, 14.0, 34.0, 34.0, 50.0, 74.0, 61.0, 105.0, 111.0, 98.0, 77.0, 78.0, 66.0, 40.0, 25.0, 16.0, 17.0, 15.0, 10.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.0988922119140625, -1.062042236328125, -1.0251922607421875, -0.98834228515625, -0.9514923095703125, -0.914642333984375, -0.8777923583984375, -0.8409423828125, -0.8040924072265625, -0.767242431640625, -0.7303924560546875, -0.69354248046875, -0.6566925048828125, -0.619842529296875, -0.5829925537109375, -0.546142578125, -0.5092926025390625, -0.472442626953125, -0.4355926513671875, -0.39874267578125, -0.3618927001953125, -0.325042724609375, -0.2881927490234375, -0.2513427734375, -0.2144927978515625, -0.177642822265625, -0.1407928466796875, -0.10394287109375, -0.0670928955078125, -0.030242919921875, 0.0066070556640625, 0.04345703125, 0.0803070068359375, 0.117156982421875, 0.1540069580078125, 0.19085693359375, 0.2277069091796875, 0.264556884765625, 0.3014068603515625, 0.3382568359375, 0.3751068115234375, 0.411956787109375, 0.4488067626953125, 0.48565673828125, 0.5225067138671875, 0.559356689453125, 0.5962066650390625, 0.633056640625, 0.6699066162109375, 0.706756591796875, 0.7436065673828125, 0.78045654296875, 0.8173065185546875, 0.854156494140625, 0.8910064697265625, 0.9278564453125, 0.9647064208984375, 1.001556396484375, 1.0384063720703125, 1.07525634765625, 1.1121063232421875, 1.148956298828125, 1.1858062744140625, 1.22265625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 10.0, 12.0, 31.0, 61.0, 109.0, 168.0, 195.0, 178.0, 100.0, 56.0, 42.0, 18.0, 18.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.303489685058594, -33.625221252441406, -32.94694900512695, -32.268680572509766, -31.590410232543945, -30.912139892578125, -30.233871459960938, -29.555601119995117, -28.877330780029297, -28.199060440063477, -27.520790100097656, -26.84252166748047, -26.16425132751465, -25.485980987548828, -24.80771255493164, -24.12944221496582, -23.451171875, -22.77290153503418, -22.09463119506836, -21.416362762451172, -20.73809242248535, -20.05982208251953, -19.381553649902344, -18.703283309936523, -18.025012969970703, -17.346742630004883, -16.668472290039062, -15.990203857421875, -15.311933517456055, -14.633663177490234, -13.95539379119873, -13.277124404907227, -12.598852157592773, -11.920581817626953, -11.24231243133545, -10.564043045043945, -9.885772705078125, -9.207502365112305, -8.5292329788208, -7.850963115692139, -7.172693252563477, -6.4944233894348145, -5.816153526306152, -5.13788366317749, -4.459613800048828, -3.781343936920166, -3.103074073791504, -2.424804210662842, -1.7465343475341797, -1.0682644844055176, -0.38999462127685547, 0.28827524185180664, 0.9665451049804688, 1.6448149681091309, 2.323084831237793, 3.001354694366455, 3.679624557495117, 4.357894420623779, 5.036164283752441, 5.7144341468811035, 6.392704010009766, 7.070973873138428, 7.74924373626709, 8.427513122558594, 9.105783462524414]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 10.0, 5.0, 10.0, 11.0, 17.0, 21.0, 15.0, 14.0, 30.0, 45.0, 25.0, 42.0, 41.0, 56.0, 43.0, 49.0, 63.0, 41.0, 44.0, 50.0, 49.0, 42.0, 29.0, 41.0, 22.0, 28.0, 20.0, 28.0, 21.0, 8.0, 17.0, 17.0, 6.0, 5.0, 4.0, 9.0, 5.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.063925743103027, -13.568740844726562, -13.073555946350098, -12.578371047973633, -12.083186149597168, -11.588001251220703, -11.092815399169922, -10.597631454467773, -10.102445602416992, -9.607260704040527, -9.112075805664062, -8.616890907287598, -8.121706008911133, -7.626521110534668, -7.131335735321045, -6.63615083694458, -6.140966415405273, -5.645781517028809, -5.150596618652344, -4.655411720275879, -4.160226821899414, -3.66504168510437, -3.169856548309326, -2.6746716499328613, -2.1794867515563965, -1.6843018531799316, -1.1891168355941772, -0.6939318180084229, -0.198746919631958, 0.29643797874450684, 0.7916231155395508, 1.2868080139160156, 1.781991958618164, 2.277176856994629, 2.7723617553710938, 3.2675468921661377, 3.7627317905426025, 4.257916450500488, 4.753101825714111, 5.248286724090576, 5.743471622467041, 6.238656520843506, 6.733841419219971, 7.229026794433594, 7.724211692810059, 8.219396591186523, 8.714581489562988, 9.209766387939453, 9.704951286315918, 10.200136184692383, 10.695321083068848, 11.190505981445312, 11.685690879821777, 12.180875778198242, 12.676061630249023, 13.171245574951172, 13.666431427001953, 14.161616325378418, 14.656801223754883, 15.151986122131348, 15.647171020507812, 16.142356872558594, 16.637540817260742, 17.132726669311523, 17.627910614013672]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 11.0, 27.0, 51.0, 116.0, 304.0, 1221.0, 10391.0, 3887924.0, 285730.0, 6902.0, 1074.0, 340.0, 109.0, 46.0, 21.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.802490234375, -3.65576171875, -3.509033203125, -3.3623046875, -3.215576171875, -3.06884765625, -2.922119140625, -2.775390625, -2.628662109375, -2.48193359375, -2.335205078125, -2.1884765625, -2.041748046875, -1.89501953125, -1.748291015625, -1.6015625, -1.454833984375, -1.30810546875, -1.161376953125, -1.0146484375, -0.867919921875, -0.72119140625, -0.574462890625, -0.427734375, -0.281005859375, -0.13427734375, 0.012451171875, 0.1591796875, 0.305908203125, 0.45263671875, 0.599365234375, 0.74609375, 0.892822265625, 1.03955078125, 1.186279296875, 1.3330078125, 1.479736328125, 1.62646484375, 1.773193359375, 1.919921875, 2.066650390625, 2.21337890625, 2.360107421875, 2.5068359375, 2.653564453125, 2.80029296875, 2.947021484375, 3.09375, 3.240478515625, 3.38720703125, 3.533935546875, 3.6806640625, 3.827392578125, 3.97412109375, 4.120849609375, 4.267578125, 4.414306640625, 4.56103515625, 4.707763671875, 4.8544921875, 5.001220703125, 5.14794921875, 5.294677734375, 5.44140625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 10.0, 3.0, 11.0, 9.0, 16.0, 20.0, 12.0, 31.0, 33.0, 35.0, 38.0, 32.0, 52.0, 59.0, 58.0, 61.0, 50.0, 66.0, 58.0, 45.0, 37.0, 48.0, 41.0, 30.0, 29.0, 15.0, 20.0, 15.0, 16.0, 7.0, 11.0, 10.0, 6.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6015625, -0.5797042846679688, -0.5578460693359375, -0.5359878540039062, -0.514129638671875, -0.49227142333984375, -0.4704132080078125, -0.44855499267578125, -0.42669677734375, -0.40483856201171875, -0.3829803466796875, -0.36112213134765625, -0.339263916015625, -0.31740570068359375, -0.2955474853515625, -0.27368927001953125, -0.2518310546875, -0.22997283935546875, -0.2081146240234375, -0.18625640869140625, -0.164398193359375, -0.14253997802734375, -0.1206817626953125, -0.09882354736328125, -0.07696533203125, -0.05510711669921875, -0.0332489013671875, -0.01139068603515625, 0.010467529296875, 0.03232574462890625, 0.0541839599609375, 0.07604217529296875, 0.097900390625, 0.11975860595703125, 0.1416168212890625, 0.16347503662109375, 0.185333251953125, 0.20719146728515625, 0.2290496826171875, 0.25090789794921875, 0.27276611328125, 0.29462432861328125, 0.3164825439453125, 0.33834075927734375, 0.360198974609375, 0.38205718994140625, 0.4039154052734375, 0.42577362060546875, 0.4476318359375, 0.46949005126953125, 0.4913482666015625, 0.5132064819335938, 0.535064697265625, 0.5569229125976562, 0.5787811279296875, 0.6006393432617188, 0.62249755859375, 0.6443557739257812, 0.6662139892578125, 0.6880722045898438, 0.709930419921875, 0.7317886352539062, 0.7536468505859375, 0.7755050659179688, 0.79736328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 6.0, 4.0, 3.0, 6.0, 14.0, 18.0, 15.0, 22.0, 34.0, 38.0, 49.0, 90.0, 156.0, 229.0, 389.0, 652.0, 1190.0, 2116.0, 4568.0, 10439.0, 31061.0, 149984.0, 3717427.0, 214040.0, 38697.0, 12473.0, 5169.0, 2377.0, 1218.0, 671.0, 401.0, 247.0, 144.0, 75.0, 62.0, 63.0, 32.0, 27.0, 29.0, 7.0, 10.0, 9.0, 9.0, 4.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.099609375, -1.064788818359375, -1.02996826171875, -0.995147705078125, -0.9603271484375, -0.925506591796875, -0.89068603515625, -0.855865478515625, -0.821044921875, -0.786224365234375, -0.75140380859375, -0.716583251953125, -0.6817626953125, -0.646942138671875, -0.61212158203125, -0.577301025390625, -0.54248046875, -0.507659912109375, -0.47283935546875, -0.438018798828125, -0.4031982421875, -0.368377685546875, -0.33355712890625, -0.298736572265625, -0.263916015625, -0.229095458984375, -0.19427490234375, -0.159454345703125, -0.1246337890625, -0.089813232421875, -0.05499267578125, -0.020172119140625, 0.0146484375, 0.049468994140625, 0.08428955078125, 0.119110107421875, 0.1539306640625, 0.188751220703125, 0.22357177734375, 0.258392333984375, 0.293212890625, 0.328033447265625, 0.36285400390625, 0.397674560546875, 0.4324951171875, 0.467315673828125, 0.50213623046875, 0.536956787109375, 0.57177734375, 0.606597900390625, 0.64141845703125, 0.676239013671875, 0.7110595703125, 0.745880126953125, 0.78070068359375, 0.815521240234375, 0.850341796875, 0.885162353515625, 0.91998291015625, 0.954803466796875, 0.9896240234375, 1.024444580078125, 1.05926513671875, 1.094085693359375, 1.12890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 6.0, 10.0, 16.0, 13.0, 33.0, 56.0, 92.0, 233.0, 2839.0, 442.0, 140.0, 63.0, 49.0, 22.0, 13.0, 14.0, 8.0, 6.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.39599609375, -0.3860187530517578, -0.3760414123535156, -0.36606407165527344, -0.35608673095703125, -0.34610939025878906, -0.3361320495605469, -0.3261547088623047, -0.3161773681640625, -0.3062000274658203, -0.2962226867675781, -0.28624534606933594, -0.27626800537109375, -0.26629066467285156, -0.2563133239746094, -0.2463359832763672, -0.236358642578125, -0.2263813018798828, -0.21640396118164062, -0.20642662048339844, -0.19644927978515625, -0.18647193908691406, -0.17649459838867188, -0.1665172576904297, -0.1565399169921875, -0.1465625762939453, -0.13658523559570312, -0.12660789489746094, -0.11663055419921875, -0.10665321350097656, -0.09667587280273438, -0.08669853210449219, -0.07672119140625, -0.06674385070800781, -0.056766510009765625, -0.04678916931152344, -0.03681182861328125, -0.026834487915039062, -0.016857147216796875, -0.0068798065185546875, 0.0030975341796875, 0.013074874877929688, 0.023052215576171875, 0.03302955627441406, 0.04300689697265625, 0.05298423767089844, 0.06296157836914062, 0.07293891906738281, 0.082916259765625, 0.09289360046386719, 0.10287094116210938, 0.11284828186035156, 0.12282562255859375, 0.13280296325683594, 0.14278030395507812, 0.1527576446533203, 0.1627349853515625, 0.1727123260498047, 0.18268966674804688, 0.19266700744628906, 0.20264434814453125, 0.21262168884277344, 0.22259902954101562, 0.2325763702392578, 0.2425537109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 7.0, 11.0, 21.0, 35.0, 47.0, 65.0, 63.0, 92.0, 116.0, 108.0, 113.0, 109.0, 66.0, 56.0, 33.0, 19.0, 14.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3547124862670898, -1.3212316036224365, -1.2877506017684937, -1.2542697191238403, -1.220788836479187, -1.1873078346252441, -1.1538269519805908, -1.1203460693359375, -1.0868651866912842, -1.0533843040466309, -1.019903302192688, -0.9864224195480347, -0.9529415369033813, -0.9194605946540833, -0.8859796524047852, -0.8524987697601318, -0.819017767906189, -0.7855368256568909, -0.7520559430122375, -0.7185750007629395, -0.6850941181182861, -0.651613175868988, -0.6181322336196899, -0.5846513509750366, -0.5511704087257385, -0.5176894664764404, -0.4842085838317871, -0.450727641582489, -0.4172467291355133, -0.3837658166885376, -0.3502848744392395, -0.3168039619922638, -0.28332293033599854, -0.24984201788902283, -0.21636109054088593, -0.18288016319274902, -0.14939925074577332, -0.11591833829879761, -0.0824374109506607, -0.048956483602523804, -0.015475571155548096, 0.01800534874200821, 0.051486268639564514, 0.08496718853712082, 0.11844810843467712, 0.15192902088165283, 0.18540994822978973, 0.21889087557792664, 0.25237178802490234, 0.28585270047187805, 0.31933361291885376, 0.35281455516815186, 0.38629546761512756, 0.41977638006210327, 0.45325732231140137, 0.4867382347583771, 0.5202191472053528, 0.5537000894546509, 0.5871809720993042, 0.6206619143486023, 0.6541428565979004, 0.6876237392425537, 0.7211046814918518, 0.7545856237411499, 0.7880665063858032]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 8.0, 6.0, 10.0, 13.0, 9.0, 20.0, 24.0, 24.0, 25.0, 30.0, 28.0, 34.0, 33.0, 26.0, 37.0, 32.0, 48.0, 41.0, 42.0, 47.0, 45.0, 37.0, 30.0, 34.0, 42.0, 27.0, 30.0, 38.0, 29.0, 22.0, 20.0, 17.0, 16.0, 11.0, 8.0, 10.0, 7.0, 4.0, 6.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5871879458427429, -0.5681593418121338, -0.5491307377815247, -0.5301021337509155, -0.5110734701156616, -0.4920448958873749, -0.47301626205444336, -0.45398765802383423, -0.4349590539932251, -0.41593044996261597, -0.39690184593200684, -0.3778732120990753, -0.3588446080684662, -0.33981600403785706, -0.32078737020492554, -0.3017587661743164, -0.2827301621437073, -0.26370155811309814, -0.24467293918132782, -0.2256443202495575, -0.20661571621894836, -0.18758711218833923, -0.1685584932565689, -0.14952987432479858, -0.13050127029418945, -0.11147265881299973, -0.09244404733181, -0.07341543585062027, -0.05438682436943054, -0.035358212888240814, -0.016329601407051086, 0.0026990175247192383, 0.021727681159973145, 0.04075629264116287, 0.0597849041223526, 0.07881351560354233, 0.09784212708473206, 0.11687073856592178, 0.1358993500471115, 0.15492796897888184, 0.17395657300949097, 0.1929851770401001, 0.21201379597187042, 0.23104241490364075, 0.2500710189342499, 0.269099622964859, 0.2881282567977905, 0.30715686082839966, 0.3261854648590088, 0.3452140688896179, 0.36424267292022705, 0.38327130675315857, 0.4022999107837677, 0.42132851481437683, 0.44035714864730835, 0.4593857526779175, 0.4784143567085266, 0.49744296073913574, 0.5164715647697449, 0.535500168800354, 0.5545288324356079, 0.573557436466217, 0.5925860404968262, 0.6116146445274353, 0.6306432485580444]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 11.0, 8.0, 11.0, 16.0, 21.0, 31.0, 59.0, 90.0, 155.0, 284.0, 590.0, 1332.0, 3314.0, 9357.0, 31222.0, 121646.0, 384058.0, 352217.0, 102946.0, 27223.0, 8413.0, 3053.0, 1212.0, 585.0, 304.0, 141.0, 84.0, 60.0, 35.0, 19.0, 14.0, 8.0, 8.0, 8.0, 6.0, 3.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.64453125, -1.58349609375, -1.5224609375, -1.46142578125, -1.400390625, -1.33935546875, -1.2783203125, -1.21728515625, -1.15625, -1.09521484375, -1.0341796875, -0.97314453125, -0.912109375, -0.85107421875, -0.7900390625, -0.72900390625, -0.66796875, -0.60693359375, -0.5458984375, -0.48486328125, -0.423828125, -0.36279296875, -0.3017578125, -0.24072265625, -0.1796875, -0.11865234375, -0.0576171875, 0.00341796875, 0.064453125, 0.12548828125, 0.1865234375, 0.24755859375, 0.30859375, 0.36962890625, 0.4306640625, 0.49169921875, 0.552734375, 0.61376953125, 0.6748046875, 0.73583984375, 0.796875, 0.85791015625, 0.9189453125, 0.97998046875, 1.041015625, 1.10205078125, 1.1630859375, 1.22412109375, 1.28515625, 1.34619140625, 1.4072265625, 1.46826171875, 1.529296875, 1.59033203125, 1.6513671875, 1.71240234375, 1.7734375, 1.83447265625, 1.8955078125, 1.95654296875, 2.017578125, 2.07861328125, 2.1396484375, 2.20068359375, 2.26171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 6.0, 1.0, 11.0, 16.0, 12.0, 20.0, 27.0, 26.0, 28.0, 44.0, 32.0, 42.0, 53.0, 57.0, 60.0, 64.0, 58.0, 46.0, 39.0, 47.0, 53.0, 37.0, 26.0, 37.0, 25.0, 25.0, 20.0, 14.0, 9.0, 11.0, 10.0, 7.0, 8.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5712890625, -0.55023193359375, -0.5291748046875, -0.50811767578125, -0.487060546875, -0.46600341796875, -0.4449462890625, -0.42388916015625, -0.40283203125, -0.38177490234375, -0.3607177734375, -0.33966064453125, -0.318603515625, -0.29754638671875, -0.2764892578125, -0.25543212890625, -0.234375, -0.21331787109375, -0.1922607421875, -0.17120361328125, -0.150146484375, -0.12908935546875, -0.1080322265625, -0.08697509765625, -0.06591796875, -0.04486083984375, -0.0238037109375, -0.00274658203125, 0.018310546875, 0.03936767578125, 0.0604248046875, 0.08148193359375, 0.1025390625, 0.12359619140625, 0.1446533203125, 0.16571044921875, 0.186767578125, 0.20782470703125, 0.2288818359375, 0.24993896484375, 0.27099609375, 0.29205322265625, 0.3131103515625, 0.33416748046875, 0.355224609375, 0.37628173828125, 0.3973388671875, 0.41839599609375, 0.439453125, 0.46051025390625, 0.4815673828125, 0.50262451171875, 0.523681640625, 0.54473876953125, 0.5657958984375, 0.58685302734375, 0.60791015625, 0.62896728515625, 0.6500244140625, 0.67108154296875, 0.692138671875, 0.71319580078125, 0.7342529296875, 0.75531005859375, 0.7763671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 10.0, 13.0, 10.0, 13.0, 25.0, 53.0, 98.0, 159.0, 345.0, 881.0, 2905.0, 16944.0, 287711.0, 693301.0, 38975.0, 4891.0, 1250.0, 475.0, 207.0, 110.0, 70.0, 33.0, 21.0, 17.0, 11.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0234375, -4.880615234375, -4.73779296875, -4.594970703125, -4.4521484375, -4.309326171875, -4.16650390625, -4.023681640625, -3.880859375, -3.738037109375, -3.59521484375, -3.452392578125, -3.3095703125, -3.166748046875, -3.02392578125, -2.881103515625, -2.73828125, -2.595458984375, -2.45263671875, -2.309814453125, -2.1669921875, -2.024169921875, -1.88134765625, -1.738525390625, -1.595703125, -1.452880859375, -1.31005859375, -1.167236328125, -1.0244140625, -0.881591796875, -0.73876953125, -0.595947265625, -0.453125, -0.310302734375, -0.16748046875, -0.024658203125, 0.1181640625, 0.260986328125, 0.40380859375, 0.546630859375, 0.689453125, 0.832275390625, 0.97509765625, 1.117919921875, 1.2607421875, 1.403564453125, 1.54638671875, 1.689208984375, 1.83203125, 1.974853515625, 2.11767578125, 2.260498046875, 2.4033203125, 2.546142578125, 2.68896484375, 2.831787109375, 2.974609375, 3.117431640625, 3.26025390625, 3.403076171875, 3.5458984375, 3.688720703125, 3.83154296875, 3.974365234375, 4.1171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 4.0, 12.0, 13.0, 18.0, 20.0, 22.0, 40.0, 40.0, 42.0, 53.0, 54.0, 67.0, 56.0, 64.0, 67.0, 70.0, 54.0, 55.0, 59.0, 38.0, 30.0, 25.0, 21.0, 15.0, 15.0, 9.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.234375, -5.0791015625, -4.923828125, -4.7685546875, -4.61328125, -4.4580078125, -4.302734375, -4.1474609375, -3.9921875, -3.8369140625, -3.681640625, -3.5263671875, -3.37109375, -3.2158203125, -3.060546875, -2.9052734375, -2.75, -2.5947265625, -2.439453125, -2.2841796875, -2.12890625, -1.9736328125, -1.818359375, -1.6630859375, -1.5078125, -1.3525390625, -1.197265625, -1.0419921875, -0.88671875, -0.7314453125, -0.576171875, -0.4208984375, -0.265625, -0.1103515625, 0.044921875, 0.2001953125, 0.35546875, 0.5107421875, 0.666015625, 0.8212890625, 0.9765625, 1.1318359375, 1.287109375, 1.4423828125, 1.59765625, 1.7529296875, 1.908203125, 2.0634765625, 2.21875, 2.3740234375, 2.529296875, 2.6845703125, 2.83984375, 2.9951171875, 3.150390625, 3.3056640625, 3.4609375, 3.6162109375, 3.771484375, 3.9267578125, 4.08203125, 4.2373046875, 4.392578125, 4.5478515625, 4.703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 5.0, 18.0, 17.0, 27.0, 30.0, 59.0, 80.0, 107.0, 185.0, 340.0, 843.0, 3086.0, 24693.0, 847089.0, 161587.0, 7682.0, 1486.0, 544.0, 215.0, 146.0, 91.0, 73.0, 31.0, 30.0, 31.0, 20.0, 13.0, 5.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.267578125, -3.187408447265625, -3.10723876953125, -3.027069091796875, -2.9468994140625, -2.866729736328125, -2.78656005859375, -2.706390380859375, -2.626220703125, -2.546051025390625, -2.46588134765625, -2.385711669921875, -2.3055419921875, -2.225372314453125, -2.14520263671875, -2.065032958984375, -1.98486328125, -1.904693603515625, -1.82452392578125, -1.744354248046875, -1.6641845703125, -1.584014892578125, -1.50384521484375, -1.423675537109375, -1.343505859375, -1.263336181640625, -1.18316650390625, -1.102996826171875, -1.0228271484375, -0.942657470703125, -0.86248779296875, -0.782318115234375, -0.7021484375, -0.621978759765625, -0.54180908203125, -0.461639404296875, -0.3814697265625, -0.301300048828125, -0.22113037109375, -0.140960693359375, -0.060791015625, 0.019378662109375, 0.09954833984375, 0.179718017578125, 0.2598876953125, 0.340057373046875, 0.42022705078125, 0.500396728515625, 0.58056640625, 0.660736083984375, 0.74090576171875, 0.821075439453125, 0.9012451171875, 0.981414794921875, 1.06158447265625, 1.141754150390625, 1.221923828125, 1.302093505859375, 1.38226318359375, 1.462432861328125, 1.5426025390625, 1.622772216796875, 1.70294189453125, 1.783111572265625, 1.86328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 10.0, 8.0, 33.0, 49.0, 107.0, 148.0, 208.0, 154.0, 144.0, 62.0, 44.0, 18.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022399425506591797, -0.00021062977612018585, -0.00019726529717445374, -0.00018390081822872162, -0.0001705363392829895, -0.00015717186033725739, -0.00014380738139152527, -0.00013044290244579315, -0.00011707842350006104, -0.00010371394455432892, -9.03494656085968e-05, -7.698498666286469e-05, -6.362050771713257e-05, -5.025602877140045e-05, -3.6891549825668335e-05, -2.3527070879936218e-05, -1.0162591934204102e-05, 3.201887011528015e-06, 1.6566365957260132e-05, 2.993084490299225e-05, 4.3295323848724365e-05, 5.665980279445648e-05, 7.00242817401886e-05, 8.338876068592072e-05, 9.675323963165283e-05, 0.00011011771857738495, 0.00012348219752311707, 0.00013684667646884918, 0.0001502111554145813, 0.00016357563436031342, 0.00017694011330604553, 0.00019030459225177765, 0.00020366907119750977, 0.00021703355014324188, 0.000230398029088974, 0.00024376250803470612, 0.00025712698698043823, 0.00027049146592617035, 0.00028385594487190247, 0.0002972204238176346, 0.0003105849027633667, 0.0003239493817090988, 0.00033731386065483093, 0.00035067833960056305, 0.00036404281854629517, 0.0003774072974920273, 0.0003907717764377594, 0.0004041362553834915, 0.00041750073432922363, 0.00043086521327495575, 0.00044422969222068787, 0.00045759417116642, 0.0004709586501121521, 0.0004843231290578842, 0.0004976876080036163, 0.0005110520869493484, 0.0005244165658950806, 0.0005377810448408127, 0.0005511455237865448, 0.0005645100027322769, 0.000577874481678009, 0.0005912389606237411, 0.0006046034395694733, 0.0006179679185152054, 0.0006313323974609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 10.0, 12.0, 25.0, 44.0, 53.0, 88.0, 171.0, 348.0, 785.0, 2093.0, 8164.0, 77232.0, 835688.0, 109796.0, 10135.0, 2280.0, 805.0, 388.0, 177.0, 98.0, 48.0, 39.0, 12.0, 17.0, 14.0, 7.0, 4.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.513671875, -1.460662841796875, -1.40765380859375, -1.354644775390625, -1.3016357421875, -1.248626708984375, -1.19561767578125, -1.142608642578125, -1.089599609375, -1.036590576171875, -0.98358154296875, -0.930572509765625, -0.8775634765625, -0.824554443359375, -0.77154541015625, -0.718536376953125, -0.66552734375, -0.612518310546875, -0.55950927734375, -0.506500244140625, -0.4534912109375, -0.400482177734375, -0.34747314453125, -0.294464111328125, -0.241455078125, -0.188446044921875, -0.13543701171875, -0.082427978515625, -0.0294189453125, 0.023590087890625, 0.07659912109375, 0.129608154296875, 0.1826171875, 0.235626220703125, 0.28863525390625, 0.341644287109375, 0.3946533203125, 0.447662353515625, 0.50067138671875, 0.553680419921875, 0.606689453125, 0.659698486328125, 0.71270751953125, 0.765716552734375, 0.8187255859375, 0.871734619140625, 0.92474365234375, 0.977752685546875, 1.03076171875, 1.083770751953125, 1.13677978515625, 1.189788818359375, 1.2427978515625, 1.295806884765625, 1.34881591796875, 1.401824951171875, 1.454833984375, 1.507843017578125, 1.56085205078125, 1.613861083984375, 1.6668701171875, 1.719879150390625, 1.77288818359375, 1.825897216796875, 1.87890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 8.0, 4.0, 1.0, 5.0, 9.0, 6.0, 13.0, 31.0, 50.0, 58.0, 113.0, 154.0, 169.0, 142.0, 85.0, 49.0, 31.0, 22.0, 17.0, 7.0, 6.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.908203125, -2.8321990966796875, -2.756195068359375, -2.6801910400390625, -2.60418701171875, -2.5281829833984375, -2.452178955078125, -2.3761749267578125, -2.3001708984375, -2.2241668701171875, -2.148162841796875, -2.0721588134765625, -1.99615478515625, -1.9201507568359375, -1.844146728515625, -1.7681427001953125, -1.692138671875, -1.6161346435546875, -1.540130615234375, -1.4641265869140625, -1.38812255859375, -1.3121185302734375, -1.236114501953125, -1.1601104736328125, -1.0841064453125, -1.0081024169921875, -0.932098388671875, -0.8560943603515625, -0.78009033203125, -0.7040863037109375, -0.628082275390625, -0.5520782470703125, -0.47607421875, -0.4000701904296875, -0.324066162109375, -0.2480621337890625, -0.17205810546875, -0.0960540771484375, -0.020050048828125, 0.0559539794921875, 0.1319580078125, 0.2079620361328125, 0.283966064453125, 0.3599700927734375, 0.43597412109375, 0.5119781494140625, 0.587982177734375, 0.6639862060546875, 0.739990234375, 0.8159942626953125, 0.891998291015625, 0.9680023193359375, 1.04400634765625, 1.1200103759765625, 1.196014404296875, 1.2720184326171875, 1.3480224609375, 1.4240264892578125, 1.500030517578125, 1.5760345458984375, 1.65203857421875, 1.7280426025390625, 1.804046630859375, 1.8800506591796875, 1.9560546875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 9.0, 17.0, 15.0, 25.0, 63.0, 96.0, 125.0, 142.0, 132.0, 120.0, 82.0, 62.0, 50.0, 21.0, 13.0, 10.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.31902027130127, -11.608627319335938, -10.898234367370605, -10.187841415405273, -9.477447509765625, -8.767054557800293, -8.056661605834961, -7.346268177032471, -6.635875225067139, -5.925482273101807, -5.215088844299316, -4.504695892333984, -3.7943027019500732, -3.083909511566162, -2.37351655960083, -1.6631231307983398, -0.9527301788330078, -0.24233704805374146, 0.4680560827255249, 1.1784491539001465, 1.8888423442840576, 2.5992355346679688, 3.309628486633301, 4.020021915435791, 4.730414867401123, 5.440807819366455, 6.151201248168945, 6.861594200134277, 7.571987152099609, 8.282381057739258, 8.992773056030273, 9.703166961669922, 10.41356086730957, 11.123953819274902, 11.834346771240234, 12.544740676879883, 13.255133628845215, 13.965526580810547, 14.675919532775879, 15.386312484741211, 16.09670639038086, 16.807100296020508, 17.517492294311523, 18.227886199951172, 18.938278198242188, 19.648672103881836, 20.359066009521484, 21.0694580078125, 21.779850006103516, 22.490243911743164, 23.20063591003418, 23.911029815673828, 24.621421813964844, 25.331815719604492, 26.04220962524414, 26.752601623535156, 27.462995529174805, 28.173389434814453, 28.88378143310547, 29.594175338745117, 30.304567337036133, 31.01496124267578, 31.725353240966797, 32.43574905395508, 33.146141052246094]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 7.0, 5.0, 7.0, 13.0, 23.0, 23.0, 21.0, 35.0, 40.0, 39.0, 36.0, 59.0, 49.0, 63.0, 64.0, 63.0, 56.0, 48.0, 50.0, 43.0, 33.0, 21.0, 41.0, 23.0, 23.0, 17.0, 20.0, 14.0, 12.0, 12.0, 7.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.74024200439453, -16.0953369140625, -15.450429916381836, -14.805524826049805, -14.160618782043457, -13.51571273803711, -12.870807647705078, -12.22590160369873, -11.580995559692383, -10.936089515686035, -10.291183471679688, -9.646278381347656, -9.001372337341309, -8.356466293334961, -7.7115607261657715, -7.066655158996582, -6.421749114990234, -5.776843070983887, -5.131937503814697, -4.487031936645508, -3.84212589263916, -3.1972200870513916, -2.552314281463623, -1.9074087142944336, -1.262502670288086, -0.6175968647003174, 0.027308940887451172, 0.6722147464752197, 1.3171205520629883, 1.9620263576507568, 2.6069321632385254, 3.251837730407715, 3.8967437744140625, 4.54164981842041, 5.1865553855896, 5.831460952758789, 6.476366996765137, 7.121273040771484, 7.766178607940674, 8.411084175109863, 9.055990219116211, 9.700896263122559, 10.345802307128906, 10.990707397460938, 11.635613441467285, 12.280519485473633, 12.925424575805664, 13.570330619812012, 14.21523666381836, 14.860142707824707, 15.505048751831055, 16.149953842163086, 16.79486083984375, 17.43976593017578, 18.084671020507812, 18.729576110839844, 19.374483108520508, 20.01938819885254, 20.664295196533203, 21.309200286865234, 21.954105377197266, 22.59901237487793, 23.24391746520996, 23.888824462890625, 24.533729553222656]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 11.0, 11.0, 21.0, 62.0, 54.0, 147.0, 271.0, 741.0, 2167.0, 9657.0, 120222.0, 4011509.0, 40932.0, 5631.0, 1630.0, 620.0, 274.0, 119.0, 73.0, 33.0, 31.0, 16.0, 14.0, 5.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-3.447265625, -3.321136474609375, -3.19500732421875, -3.068878173828125, -2.9427490234375, -2.816619873046875, -2.69049072265625, -2.564361572265625, -2.438232421875, -2.312103271484375, -2.18597412109375, -2.059844970703125, -1.9337158203125, -1.807586669921875, -1.68145751953125, -1.555328369140625, -1.42919921875, -1.303070068359375, -1.17694091796875, -1.050811767578125, -0.9246826171875, -0.798553466796875, -0.67242431640625, -0.546295166015625, -0.420166015625, -0.294036865234375, -0.16790771484375, -0.041778564453125, 0.0843505859375, 0.210479736328125, 0.33660888671875, 0.462738037109375, 0.5888671875, 0.714996337890625, 0.84112548828125, 0.967254638671875, 1.0933837890625, 1.219512939453125, 1.34564208984375, 1.471771240234375, 1.597900390625, 1.724029541015625, 1.85015869140625, 1.976287841796875, 2.1024169921875, 2.228546142578125, 2.35467529296875, 2.480804443359375, 2.60693359375, 2.733062744140625, 2.85919189453125, 2.985321044921875, 3.1114501953125, 3.237579345703125, 3.36370849609375, 3.489837646484375, 3.615966796875, 3.742095947265625, 3.86822509765625, 3.994354248046875, 4.1204833984375, 4.246612548828125, 4.37274169921875, 4.498870849609375, 4.625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 9.0, 9.0, 9.0, 17.0, 15.0, 23.0, 30.0, 40.0, 61.0, 47.0, 61.0, 67.0, 73.0, 90.0, 73.0, 74.0, 64.0, 48.0, 34.0, 30.0, 16.0, 20.0, 18.0, 16.0, 14.0, 12.0, 6.0, 8.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7412109375, -0.7108917236328125, -0.680572509765625, -0.6502532958984375, -0.61993408203125, -0.5896148681640625, -0.559295654296875, -0.5289764404296875, -0.4986572265625, -0.4683380126953125, -0.438018798828125, -0.4076995849609375, -0.37738037109375, -0.3470611572265625, -0.316741943359375, -0.2864227294921875, -0.256103515625, -0.2257843017578125, -0.195465087890625, -0.1651458740234375, -0.13482666015625, -0.1045074462890625, -0.074188232421875, -0.0438690185546875, -0.0135498046875, 0.0167694091796875, 0.047088623046875, 0.0774078369140625, 0.10772705078125, 0.1380462646484375, 0.168365478515625, 0.1986846923828125, 0.22900390625, 0.2593231201171875, 0.289642333984375, 0.3199615478515625, 0.35028076171875, 0.3805999755859375, 0.410919189453125, 0.4412384033203125, 0.4715576171875, 0.5018768310546875, 0.532196044921875, 0.5625152587890625, 0.59283447265625, 0.6231536865234375, 0.653472900390625, 0.6837921142578125, 0.714111328125, 0.7444305419921875, 0.774749755859375, 0.8050689697265625, 0.83538818359375, 0.8657073974609375, 0.896026611328125, 0.9263458251953125, 0.9566650390625, 0.9869842529296875, 1.017303466796875, 1.0476226806640625, 1.07794189453125, 1.1082611083984375, 1.138580322265625, 1.1688995361328125, 1.19921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 11.0, 13.0, 9.0, 23.0, 27.0, 40.0, 63.0, 97.0, 132.0, 191.0, 283.0, 458.0, 869.0, 1724.0, 3699.0, 9043.0, 27059.0, 113640.0, 3339001.0, 594277.0, 71212.0, 19043.0, 7133.0, 2920.0, 1388.0, 703.0, 405.0, 250.0, 187.0, 110.0, 85.0, 46.0, 37.0, 32.0, 20.0, 10.0, 14.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.294921875, -1.2467041015625, -1.198486328125, -1.1502685546875, -1.10205078125, -1.0538330078125, -1.005615234375, -0.9573974609375, -0.9091796875, -0.8609619140625, -0.812744140625, -0.7645263671875, -0.71630859375, -0.6680908203125, -0.619873046875, -0.5716552734375, -0.5234375, -0.4752197265625, -0.427001953125, -0.3787841796875, -0.33056640625, -0.2823486328125, -0.234130859375, -0.1859130859375, -0.1376953125, -0.0894775390625, -0.041259765625, 0.0069580078125, 0.05517578125, 0.1033935546875, 0.151611328125, 0.1998291015625, 0.248046875, 0.2962646484375, 0.344482421875, 0.3927001953125, 0.44091796875, 0.4891357421875, 0.537353515625, 0.5855712890625, 0.6337890625, 0.6820068359375, 0.730224609375, 0.7784423828125, 0.82666015625, 0.8748779296875, 0.923095703125, 0.9713134765625, 1.01953125, 1.0677490234375, 1.115966796875, 1.1641845703125, 1.21240234375, 1.2606201171875, 1.308837890625, 1.3570556640625, 1.4052734375, 1.4534912109375, 1.501708984375, 1.5499267578125, 1.59814453125, 1.6463623046875, 1.694580078125, 1.7427978515625, 1.791015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 10.0, 16.0, 21.0, 27.0, 51.0, 75.0, 158.0, 419.0, 2604.0, 338.0, 135.0, 92.0, 47.0, 27.0, 11.0, 15.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.408203125, -0.39084625244140625, -0.3734893798828125, -0.35613250732421875, -0.338775634765625, -0.32141876220703125, -0.3040618896484375, -0.28670501708984375, -0.26934814453125, -0.25199127197265625, -0.2346343994140625, -0.21727752685546875, -0.199920654296875, -0.18256378173828125, -0.1652069091796875, -0.14785003662109375, -0.1304931640625, -0.11313629150390625, -0.0957794189453125, -0.07842254638671875, -0.061065673828125, -0.04370880126953125, -0.0263519287109375, -0.00899505615234375, 0.00836181640625, 0.02571868896484375, 0.0430755615234375, 0.06043243408203125, 0.077789306640625, 0.09514617919921875, 0.1125030517578125, 0.12985992431640625, 0.147216796875, 0.16457366943359375, 0.1819305419921875, 0.19928741455078125, 0.216644287109375, 0.23400115966796875, 0.2513580322265625, 0.26871490478515625, 0.28607177734375, 0.30342864990234375, 0.3207855224609375, 0.33814239501953125, 0.355499267578125, 0.37285614013671875, 0.3902130126953125, 0.40756988525390625, 0.4249267578125, 0.44228363037109375, 0.4596405029296875, 0.47699737548828125, 0.494354248046875, 0.5117111206054688, 0.5290679931640625, 0.5464248657226562, 0.56378173828125, 0.5811386108398438, 0.5984954833984375, 0.6158523559570312, 0.633209228515625, 0.6505661010742188, 0.6679229736328125, 0.6852798461914062, 0.70263671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 11.0, 11.0, 18.0, 32.0, 31.0, 46.0, 66.0, 88.0, 78.0, 101.0, 99.0, 111.0, 84.0, 56.0, 46.0, 44.0, 26.0, 20.0, 16.0, 4.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.191689968109131, -2.1373183727264404, -2.08294677734375, -2.0285751819610596, -1.9742035865783691, -1.9198319911956787, -1.8654603958129883, -1.8110888004302979, -1.7567172050476074, -1.702345609664917, -1.6479740142822266, -1.5936024188995361, -1.5392308235168457, -1.4848592281341553, -1.4304876327514648, -1.3761160373687744, -1.321744441986084, -1.2673728466033936, -1.2130012512207031, -1.1586296558380127, -1.1042580604553223, -1.0498864650726318, -0.9955148696899414, -0.941143274307251, -0.8867716789245605, -0.8324000835418701, -0.7780284881591797, -0.7236568927764893, -0.6692852973937988, -0.6149137020111084, -0.560542106628418, -0.5061705112457275, -0.4517989158630371, -0.3974273204803467, -0.34305572509765625, -0.2886841297149658, -0.2343125343322754, -0.17994093894958496, -0.12556934356689453, -0.0711977481842041, -0.016826152801513672, 0.03754544258117676, 0.09191703796386719, 0.14628863334655762, 0.20066022872924805, 0.2550318241119385, 0.3094034194946289, 0.36377501487731934, 0.41814661026000977, 0.4725182056427002, 0.5268898010253906, 0.581261396408081, 0.6356329917907715, 0.6900045871734619, 0.7443761825561523, 0.7987477779388428, 0.8531193733215332, 0.9074909687042236, 0.9618625640869141, 1.0162341594696045, 1.070605754852295, 1.1249773502349854, 1.1793489456176758, 1.2337205410003662, 1.2880921363830566]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 10.0, 12.0, 20.0, 14.0, 23.0, 22.0, 17.0, 19.0, 29.0, 26.0, 24.0, 30.0, 28.0, 40.0, 44.0, 29.0, 43.0, 32.0, 38.0, 34.0, 40.0, 30.0, 35.0, 36.0, 36.0, 21.0, 17.0, 31.0, 22.0, 29.0, 19.0, 27.0, 18.0, 14.0, 12.0, 18.0, 14.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.184389352798462, -1.148285150527954, -1.1121809482574463, -1.076076865196228, -1.0399726629257202, -1.0038684606552124, -0.9677642583847046, -0.9316601157188416, -0.8955559730529785, -0.8594517707824707, -0.8233476281166077, -0.7872434258460999, -0.7511392831802368, -0.715035080909729, -0.6789308786392212, -0.6428267359733582, -0.6067225337028503, -0.5706183314323425, -0.5345141887664795, -0.4984099864959717, -0.46230584383010864, -0.42620164155960083, -0.3900974690914154, -0.35399329662323, -0.31788912415504456, -0.28178495168685913, -0.2456807792186737, -0.2095765918493271, -0.17347241938114166, -0.13736824691295624, -0.10126405954360962, -0.0651598870754242, -0.02905571460723877, 0.007048461586236954, 0.04315263777971268, 0.0792568176984787, 0.11536099016666412, 0.15146516263484955, 0.18756935000419617, 0.2236735224723816, 0.259777694940567, 0.29588186740875244, 0.33198603987693787, 0.3680902123451233, 0.4041944146156311, 0.44029855728149414, 0.47640275955200195, 0.5125069618225098, 0.5486111044883728, 0.5847153067588806, 0.6208194494247437, 0.6569236516952515, 0.6930277943611145, 0.7291319966316223, 0.7652361392974854, 0.8013403415679932, 0.837444543838501, 0.8735487461090088, 0.9096528887748718, 0.9457570910453796, 0.9818612337112427, 1.0179654359817505, 1.0540696382522583, 1.0901737213134766, 1.1262779235839844]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 11.0, 28.0, 48.0, 73.0, 122.0, 226.0, 478.0, 1053.0, 2784.0, 8359.0, 30260.0, 138597.0, 456850.0, 313692.0, 70541.0, 16807.0, 5185.0, 1830.0, 760.0, 404.0, 163.0, 109.0, 71.0, 28.0, 15.0, 14.0, 10.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.23828125, -2.180572509765625, -2.12286376953125, -2.065155029296875, -2.0074462890625, -1.949737548828125, -1.89202880859375, -1.834320068359375, -1.776611328125, -1.718902587890625, -1.66119384765625, -1.603485107421875, -1.5457763671875, -1.488067626953125, -1.43035888671875, -1.372650146484375, -1.31494140625, -1.257232666015625, -1.19952392578125, -1.141815185546875, -1.0841064453125, -1.026397705078125, -0.96868896484375, -0.910980224609375, -0.853271484375, -0.795562744140625, -0.73785400390625, -0.680145263671875, -0.6224365234375, -0.564727783203125, -0.50701904296875, -0.449310302734375, -0.3916015625, -0.333892822265625, -0.27618408203125, -0.218475341796875, -0.1607666015625, -0.103057861328125, -0.04534912109375, 0.012359619140625, 0.070068359375, 0.127777099609375, 0.18548583984375, 0.243194580078125, 0.3009033203125, 0.358612060546875, 0.41632080078125, 0.474029541015625, 0.53173828125, 0.589447021484375, 0.64715576171875, 0.704864501953125, 0.7625732421875, 0.820281982421875, 0.87799072265625, 0.935699462890625, 0.993408203125, 1.051116943359375, 1.10882568359375, 1.166534423828125, 1.2242431640625, 1.281951904296875, 1.33966064453125, 1.397369384765625, 1.455078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 9.0, 11.0, 13.0, 9.0, 11.0, 19.0, 21.0, 26.0, 37.0, 37.0, 49.0, 53.0, 65.0, 80.0, 71.0, 83.0, 66.0, 57.0, 53.0, 42.0, 37.0, 30.0, 20.0, 17.0, 15.0, 16.0, 16.0, 7.0, 6.0, 7.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.71826171875, -0.6904983520507812, -0.6627349853515625, -0.6349716186523438, -0.607208251953125, -0.5794448852539062, -0.5516815185546875, -0.5239181518554688, -0.49615478515625, -0.46839141845703125, -0.4406280517578125, -0.41286468505859375, -0.385101318359375, -0.35733795166015625, -0.3295745849609375, -0.30181121826171875, -0.2740478515625, -0.24628448486328125, -0.2185211181640625, -0.19075775146484375, -0.162994384765625, -0.13523101806640625, -0.1074676513671875, -0.07970428466796875, -0.05194091796875, -0.02417755126953125, 0.0035858154296875, 0.03134918212890625, 0.059112548828125, 0.08687591552734375, 0.1146392822265625, 0.14240264892578125, 0.170166015625, 0.19792938232421875, 0.2256927490234375, 0.25345611572265625, 0.281219482421875, 0.30898284912109375, 0.3367462158203125, 0.36450958251953125, 0.39227294921875, 0.42003631591796875, 0.4477996826171875, 0.47556304931640625, 0.503326416015625, 0.5310897827148438, 0.5588531494140625, 0.5866165161132812, 0.6143798828125, 0.6421432495117188, 0.6699066162109375, 0.6976699829101562, 0.725433349609375, 0.7531967163085938, 0.7809600830078125, 0.8087234497070312, 0.83648681640625, 0.8642501831054688, 0.8920135498046875, 0.9197769165039062, 0.947540283203125, 0.9753036499023438, 1.0030670166015625, 1.0308303833007812, 1.05859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 8.0, 4.0, 6.0, 10.0, 13.0, 12.0, 22.0, 27.0, 59.0, 85.0, 133.0, 265.0, 460.0, 1157.0, 4107.0, 30976.0, 621916.0, 365674.0, 18553.0, 3050.0, 983.0, 421.0, 235.0, 127.0, 81.0, 51.0, 30.0, 30.0, 18.0, 11.0, 3.0, 7.0, 5.0, 6.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.83984375, -2.72100830078125, -2.6021728515625, -2.48333740234375, -2.364501953125, -2.24566650390625, -2.1268310546875, -2.00799560546875, -1.88916015625, -1.77032470703125, -1.6514892578125, -1.53265380859375, -1.413818359375, -1.29498291015625, -1.1761474609375, -1.05731201171875, -0.9384765625, -0.81964111328125, -0.7008056640625, -0.58197021484375, -0.463134765625, -0.34429931640625, -0.2254638671875, -0.10662841796875, 0.01220703125, 0.13104248046875, 0.2498779296875, 0.36871337890625, 0.487548828125, 0.60638427734375, 0.7252197265625, 0.84405517578125, 0.962890625, 1.08172607421875, 1.2005615234375, 1.31939697265625, 1.438232421875, 1.55706787109375, 1.6759033203125, 1.79473876953125, 1.91357421875, 2.03240966796875, 2.1512451171875, 2.27008056640625, 2.388916015625, 2.50775146484375, 2.6265869140625, 2.74542236328125, 2.8642578125, 2.98309326171875, 3.1019287109375, 3.22076416015625, 3.339599609375, 3.45843505859375, 3.5772705078125, 3.69610595703125, 3.81494140625, 3.93377685546875, 4.0526123046875, 4.17144775390625, 4.290283203125, 4.40911865234375, 4.5279541015625, 4.64678955078125, 4.765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 3.0, 10.0, 11.0, 19.0, 17.0, 16.0, 27.0, 21.0, 33.0, 32.0, 40.0, 49.0, 42.0, 51.0, 53.0, 51.0, 60.0, 45.0, 51.0, 43.0, 44.0, 39.0, 52.0, 26.0, 37.0, 21.0, 22.0, 22.0, 5.0, 5.0, 7.0, 4.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.384765625, -3.266082763671875, -3.14739990234375, -3.028717041015625, -2.9100341796875, -2.791351318359375, -2.67266845703125, -2.553985595703125, -2.435302734375, -2.316619873046875, -2.19793701171875, -2.079254150390625, -1.9605712890625, -1.841888427734375, -1.72320556640625, -1.604522705078125, -1.48583984375, -1.367156982421875, -1.24847412109375, -1.129791259765625, -1.0111083984375, -0.892425537109375, -0.77374267578125, -0.655059814453125, -0.536376953125, -0.417694091796875, -0.29901123046875, -0.180328369140625, -0.0616455078125, 0.057037353515625, 0.17572021484375, 0.294403076171875, 0.4130859375, 0.531768798828125, 0.65045166015625, 0.769134521484375, 0.8878173828125, 1.006500244140625, 1.12518310546875, 1.243865966796875, 1.362548828125, 1.481231689453125, 1.59991455078125, 1.718597412109375, 1.8372802734375, 1.955963134765625, 2.07464599609375, 2.193328857421875, 2.31201171875, 2.430694580078125, 2.54937744140625, 2.668060302734375, 2.7867431640625, 2.905426025390625, 3.02410888671875, 3.142791748046875, 3.261474609375, 3.380157470703125, 3.49884033203125, 3.617523193359375, 3.7362060546875, 3.854888916015625, 3.97357177734375, 4.092254638671875, 4.2109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 16.0, 23.0, 37.0, 94.0, 156.0, 358.0, 1084.0, 9250.0, 976302.0, 58167.0, 2073.0, 507.0, 219.0, 96.0, 64.0, 28.0, 15.0, 16.0, 15.0, 7.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.80279541015625, -4.6602783203125, -4.51776123046875, -4.375244140625, -4.23272705078125, -4.0902099609375, -3.94769287109375, -3.80517578125, -3.66265869140625, -3.5201416015625, -3.37762451171875, -3.235107421875, -3.09259033203125, -2.9500732421875, -2.80755615234375, -2.6650390625, -2.52252197265625, -2.3800048828125, -2.23748779296875, -2.094970703125, -1.95245361328125, -1.8099365234375, -1.66741943359375, -1.52490234375, -1.38238525390625, -1.2398681640625, -1.09735107421875, -0.954833984375, -0.81231689453125, -0.6697998046875, -0.52728271484375, -0.384765625, -0.24224853515625, -0.0997314453125, 0.04278564453125, 0.185302734375, 0.32781982421875, 0.4703369140625, 0.61285400390625, 0.75537109375, 0.89788818359375, 1.0404052734375, 1.18292236328125, 1.325439453125, 1.46795654296875, 1.6104736328125, 1.75299072265625, 1.8955078125, 2.03802490234375, 2.1805419921875, 2.32305908203125, 2.465576171875, 2.60809326171875, 2.7506103515625, 2.89312744140625, 3.03564453125, 3.17816162109375, 3.3206787109375, 3.46319580078125, 3.605712890625, 3.74822998046875, 3.8907470703125, 4.03326416015625, 4.17578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 8.0, 10.0, 23.0, 35.0, 50.0, 59.0, 87.0, 109.0, 114.0, 115.0, 115.0, 82.0, 69.0, 46.0, 29.0, 22.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002582073211669922, -0.00025011226534843445, -0.0002420172095298767, -0.00023392215371131897, -0.00022582709789276123, -0.0002177320420742035, -0.00020963698625564575, -0.000201541930437088, -0.00019344687461853027, -0.00018535181879997253, -0.0001772567629814148, -0.00016916170716285706, -0.00016106665134429932, -0.00015297159552574158, -0.00014487653970718384, -0.0001367814838886261, -0.00012868642807006836, -0.00012059137225151062, -0.00011249631643295288, -0.00010440126061439514, -9.63062047958374e-05, -8.821114897727966e-05, -8.011609315872192e-05, -7.202103734016418e-05, -6.392598152160645e-05, -5.5830925703048706e-05, -4.773586988449097e-05, -3.964081406593323e-05, -3.154575824737549e-05, -2.345070242881775e-05, -1.535564661026001e-05, -7.2605907917022705e-06, 8.344650268554688e-07, 8.929520845413208e-06, 1.7024576663970947e-05, 2.5119632482528687e-05, 3.3214688301086426e-05, 4.1309744119644165e-05, 4.9404799938201904e-05, 5.7499855756759644e-05, 6.559491157531738e-05, 7.368996739387512e-05, 8.178502321243286e-05, 8.98800790309906e-05, 9.797513484954834e-05, 0.00010607019066810608, 0.00011416524648666382, 0.00012226030230522156, 0.0001303553581237793, 0.00013845041394233704, 0.00014654546976089478, 0.00015464052557945251, 0.00016273558139801025, 0.000170830637216568, 0.00017892569303512573, 0.00018702074885368347, 0.0001951158046722412, 0.00020321086049079895, 0.0002113059163093567, 0.00021940097212791443, 0.00022749602794647217, 0.0002355910837650299, 0.00024368613958358765, 0.0002517811954021454, 0.0002598762512207031]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 16.0, 22.0, 27.0, 43.0, 79.0, 160.0, 431.0, 1364.0, 7473.0, 239796.0, 778040.0, 17811.0, 2147.0, 639.0, 245.0, 100.0, 57.0, 33.0, 17.0, 14.0, 16.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.939453125, -1.855743408203125, -1.77203369140625, -1.688323974609375, -1.6046142578125, -1.520904541015625, -1.43719482421875, -1.353485107421875, -1.269775390625, -1.186065673828125, -1.10235595703125, -1.018646240234375, -0.9349365234375, -0.851226806640625, -0.76751708984375, -0.683807373046875, -0.60009765625, -0.516387939453125, -0.43267822265625, -0.348968505859375, -0.2652587890625, -0.181549072265625, -0.09783935546875, -0.014129638671875, 0.069580078125, 0.153289794921875, 0.23699951171875, 0.320709228515625, 0.4044189453125, 0.488128662109375, 0.57183837890625, 0.655548095703125, 0.7392578125, 0.822967529296875, 0.90667724609375, 0.990386962890625, 1.0740966796875, 1.157806396484375, 1.24151611328125, 1.325225830078125, 1.408935546875, 1.492645263671875, 1.57635498046875, 1.660064697265625, 1.7437744140625, 1.827484130859375, 1.91119384765625, 1.994903564453125, 2.07861328125, 2.162322998046875, 2.24603271484375, 2.329742431640625, 2.4134521484375, 2.497161865234375, 2.58087158203125, 2.664581298828125, 2.748291015625, 2.832000732421875, 2.91571044921875, 2.999420166015625, 3.0831298828125, 3.166839599609375, 3.25054931640625, 3.334259033203125, 3.41796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 21.0, 21.0, 27.0, 52.0, 91.0, 116.0, 135.0, 119.0, 121.0, 80.0, 68.0, 40.0, 36.0, 17.0, 11.0, 10.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.21484375, -2.1539306640625, -2.093017578125, -2.0321044921875, -1.97119140625, -1.9102783203125, -1.849365234375, -1.7884521484375, -1.7275390625, -1.6666259765625, -1.605712890625, -1.5447998046875, -1.48388671875, -1.4229736328125, -1.362060546875, -1.3011474609375, -1.240234375, -1.1793212890625, -1.118408203125, -1.0574951171875, -0.99658203125, -0.9356689453125, -0.874755859375, -0.8138427734375, -0.7529296875, -0.6920166015625, -0.631103515625, -0.5701904296875, -0.50927734375, -0.4483642578125, -0.387451171875, -0.3265380859375, -0.265625, -0.2047119140625, -0.143798828125, -0.0828857421875, -0.02197265625, 0.0389404296875, 0.099853515625, 0.1607666015625, 0.2216796875, 0.2825927734375, 0.343505859375, 0.4044189453125, 0.46533203125, 0.5262451171875, 0.587158203125, 0.6480712890625, 0.708984375, 0.7698974609375, 0.830810546875, 0.8917236328125, 0.95263671875, 1.0135498046875, 1.074462890625, 1.1353759765625, 1.1962890625, 1.2572021484375, 1.318115234375, 1.3790283203125, 1.43994140625, 1.5008544921875, 1.561767578125, 1.6226806640625, 1.68359375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 11.0, 26.0, 81.0, 184.0, 336.0, 246.0, 76.0, 32.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.57486724853516, -68.17388153076172, -66.77290344238281, -65.37191772460938, -63.97093200683594, -62.5699462890625, -61.16896438598633, -59.767982482910156, -58.36699676513672, -56.96601104736328, -55.56502914428711, -54.16404724121094, -52.7630615234375, -51.36207580566406, -49.96109390258789, -48.56011199951172, -47.15912628173828, -45.758140563964844, -44.35715866088867, -42.9561767578125, -41.55519104003906, -40.154205322265625, -38.75322341918945, -37.35224151611328, -35.951255798339844, -34.550270080566406, -33.149288177490234, -31.74830436706543, -30.347320556640625, -28.94633674621582, -27.545352935791016, -26.14436912536621, -24.74338150024414, -23.342397689819336, -21.94141387939453, -20.540430068969727, -19.139446258544922, -17.738462448120117, -16.337478637695312, -14.936494827270508, -13.535511016845703, -12.134527206420898, -10.733543395996094, -9.332559585571289, -7.931575775146484, -6.53059196472168, -5.129608154296875, -3.7286243438720703, -2.3276405334472656, -0.9266567230224609, 0.47432708740234375, 1.8753108978271484, 3.276294708251953, 4.677278518676758, 6.0782623291015625, 7.479246139526367, 8.880229949951172, 10.281213760375977, 11.682197570800781, 13.083181381225586, 14.48416519165039, 15.885149002075195, 17.2861328125, 18.687116622924805, 20.08810043334961]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 6.0, 12.0, 8.0, 22.0, 14.0, 14.0, 18.0, 11.0, 23.0, 19.0, 24.0, 36.0, 28.0, 41.0, 45.0, 42.0, 46.0, 43.0, 53.0, 36.0, 40.0, 48.0, 41.0, 31.0, 30.0, 42.0, 33.0, 22.0, 37.0, 17.0, 23.0, 11.0, 16.0, 12.0, 9.0, 7.0, 6.0, 2.0, 3.0, 6.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.174919128417969, -12.74792766571045, -12.32093620300293, -11.89394474029541, -11.46695327758789, -11.039961814880371, -10.612970352172852, -10.185977935791016, -9.758987426757812, -9.331995964050293, -8.905004501342773, -8.478013038635254, -8.051021575927734, -7.624030113220215, -7.197038173675537, -6.770046710968018, -6.34305477142334, -5.91606330871582, -5.489071846008301, -5.062080383300781, -4.635088920593262, -4.208097457885742, -3.7811055183410645, -3.354114055633545, -2.9271225929260254, -2.500131130218506, -2.0731396675109863, -1.6461479663848877, -1.2191565036773682, -0.7921650409698486, -0.36517333984375, 0.06181812286376953, 0.48880958557128906, 0.9158011078834534, 1.3427926301956177, 1.7697842121124268, 2.1967756748199463, 2.623767137527466, 3.0507588386535645, 3.477750301361084, 3.9047417640686035, 4.331733226776123, 4.758724689483643, 5.18571662902832, 5.61270809173584, 6.039699554443359, 6.466691017150879, 6.893682479858398, 7.320673942565918, 7.7476654052734375, 8.174656867980957, 8.601648330688477, 9.028639793395996, 9.455631256103516, 9.882623672485352, 10.309614181518555, 10.73660659790039, 11.16359806060791, 11.59058952331543, 12.01758098602295, 12.444572448730469, 12.871563911437988, 13.298555374145508, 13.725547790527344, 14.152538299560547]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 10.0, 8.0, 10.0, 19.0, 16.0, 32.0, 46.0, 75.0, 121.0, 228.0, 462.0, 1063.0, 2846.0, 10705.0, 87338.0, 4035205.0, 44249.0, 7542.0, 2323.0, 878.0, 456.0, 245.0, 153.0, 99.0, 53.0, 35.0, 22.0, 9.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.119140625, -3.005218505859375, -2.89129638671875, -2.777374267578125, -2.6634521484375, -2.549530029296875, -2.43560791015625, -2.321685791015625, -2.207763671875, -2.093841552734375, -1.97991943359375, -1.865997314453125, -1.7520751953125, -1.638153076171875, -1.52423095703125, -1.410308837890625, -1.29638671875, -1.182464599609375, -1.06854248046875, -0.954620361328125, -0.8406982421875, -0.726776123046875, -0.61285400390625, -0.498931884765625, -0.385009765625, -0.271087646484375, -0.15716552734375, -0.043243408203125, 0.0706787109375, 0.184600830078125, 0.29852294921875, 0.412445068359375, 0.5263671875, 0.640289306640625, 0.75421142578125, 0.868133544921875, 0.9820556640625, 1.095977783203125, 1.20989990234375, 1.323822021484375, 1.437744140625, 1.551666259765625, 1.66558837890625, 1.779510498046875, 1.8934326171875, 2.007354736328125, 2.12127685546875, 2.235198974609375, 2.34912109375, 2.463043212890625, 2.57696533203125, 2.690887451171875, 2.8048095703125, 2.918731689453125, 3.03265380859375, 3.146575927734375, 3.260498046875, 3.374420166015625, 3.48834228515625, 3.602264404296875, 3.7161865234375, 3.830108642578125, 3.94403076171875, 4.057952880859375, 4.171875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 4.0, 6.0, 7.0, 14.0, 11.0, 13.0, 25.0, 24.0, 34.0, 41.0, 44.0, 46.0, 55.0, 76.0, 76.0, 71.0, 77.0, 56.0, 51.0, 41.0, 41.0, 35.0, 27.0, 29.0, 12.0, 14.0, 10.0, 9.0, 12.0, 8.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6845703125, -0.656524658203125, -0.62847900390625, -0.600433349609375, -0.5723876953125, -0.544342041015625, -0.51629638671875, -0.488250732421875, -0.460205078125, -0.432159423828125, -0.40411376953125, -0.376068115234375, -0.3480224609375, -0.319976806640625, -0.29193115234375, -0.263885498046875, -0.23583984375, -0.207794189453125, -0.17974853515625, -0.151702880859375, -0.1236572265625, -0.095611572265625, -0.06756591796875, -0.039520263671875, -0.011474609375, 0.016571044921875, 0.04461669921875, 0.072662353515625, 0.1007080078125, 0.128753662109375, 0.15679931640625, 0.184844970703125, 0.212890625, 0.240936279296875, 0.26898193359375, 0.297027587890625, 0.3250732421875, 0.353118896484375, 0.38116455078125, 0.409210205078125, 0.437255859375, 0.465301513671875, 0.49334716796875, 0.521392822265625, 0.5494384765625, 0.577484130859375, 0.60552978515625, 0.633575439453125, 0.66162109375, 0.689666748046875, 0.71771240234375, 0.745758056640625, 0.7738037109375, 0.801849365234375, 0.82989501953125, 0.857940673828125, 0.885986328125, 0.914031982421875, 0.94207763671875, 0.970123291015625, 0.9981689453125, 1.026214599609375, 1.05426025390625, 1.082305908203125, 1.1103515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 10.0, 8.0, 16.0, 20.0, 36.0, 44.0, 76.0, 108.0, 180.0, 358.0, 754.0, 1825.0, 4613.0, 16000.0, 94176.0, 3894474.0, 151225.0, 20670.0, 5807.0, 2108.0, 853.0, 381.0, 224.0, 115.0, 77.0, 49.0, 24.0, 20.0, 7.0, 9.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.499481201171875, -2.42279052734375, -2.346099853515625, -2.2694091796875, -2.192718505859375, -2.11602783203125, -2.039337158203125, -1.962646484375, -1.885955810546875, -1.80926513671875, -1.732574462890625, -1.6558837890625, -1.579193115234375, -1.50250244140625, -1.425811767578125, -1.34912109375, -1.272430419921875, -1.19573974609375, -1.119049072265625, -1.0423583984375, -0.965667724609375, -0.88897705078125, -0.812286376953125, -0.735595703125, -0.658905029296875, -0.58221435546875, -0.505523681640625, -0.4288330078125, -0.352142333984375, -0.27545166015625, -0.198760986328125, -0.1220703125, -0.045379638671875, 0.03131103515625, 0.108001708984375, 0.1846923828125, 0.261383056640625, 0.33807373046875, 0.414764404296875, 0.491455078125, 0.568145751953125, 0.64483642578125, 0.721527099609375, 0.7982177734375, 0.874908447265625, 0.95159912109375, 1.028289794921875, 1.10498046875, 1.181671142578125, 1.25836181640625, 1.335052490234375, 1.4117431640625, 1.488433837890625, 1.56512451171875, 1.641815185546875, 1.718505859375, 1.795196533203125, 1.87188720703125, 1.948577880859375, 2.0252685546875, 2.101959228515625, 2.17864990234375, 2.255340576171875, 2.33203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 17.0, 13.0, 21.0, 23.0, 48.0, 110.0, 379.0, 3021.0, 239.0, 91.0, 42.0, 30.0, 13.0, 11.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.93701171875, -0.9153556823730469, -0.8936996459960938, -0.8720436096191406, -0.8503875732421875, -0.8287315368652344, -0.8070755004882812, -0.7854194641113281, -0.763763427734375, -0.7421073913574219, -0.7204513549804688, -0.6987953186035156, -0.6771392822265625, -0.6554832458496094, -0.6338272094726562, -0.6121711730957031, -0.59051513671875, -0.5688591003417969, -0.5472030639648438, -0.5255470275878906, -0.5038909912109375, -0.4822349548339844, -0.46057891845703125, -0.4389228820800781, -0.417266845703125, -0.3956108093261719, -0.37395477294921875, -0.3522987365722656, -0.3306427001953125, -0.3089866638183594, -0.28733062744140625, -0.2656745910644531, -0.2440185546875, -0.22236251831054688, -0.20070648193359375, -0.17905044555664062, -0.1573944091796875, -0.13573837280273438, -0.11408233642578125, -0.09242630004882812, -0.070770263671875, -0.049114227294921875, -0.02745819091796875, -0.005802154541015625, 0.0158538818359375, 0.037509918212890625, 0.05916595458984375, 0.08082199096679688, 0.10247802734375, 0.12413406372070312, 0.14579010009765625, 0.16744613647460938, 0.1891021728515625, 0.21075820922851562, 0.23241424560546875, 0.2540702819824219, 0.275726318359375, 0.2973823547363281, 0.31903839111328125, 0.3406944274902344, 0.3623504638671875, 0.3840065002441406, 0.40566253662109375, 0.4273185729980469, 0.448974609375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 15.0, 32.0, 40.0, 77.0, 136.0, 119.0, 134.0, 129.0, 106.0, 77.0, 48.0, 29.0, 14.0, 8.0, 12.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2608141899108887, -2.183840274810791, -2.1068663597106934, -2.029892683029175, -1.9529187679290771, -1.8759448528289795, -1.7989709377288818, -1.7219970226287842, -1.645023226737976, -1.5680493116378784, -1.4910755157470703, -1.4141016006469727, -1.337127685546875, -1.260153889656067, -1.1831799745559692, -1.1062061786651611, -1.0292322635650635, -0.9522584080696106, -0.8752845525741577, -0.7983106374740601, -0.7213367819786072, -0.6443629264831543, -0.5673890113830566, -0.49041515588760376, -0.4134413003921509, -0.336467444896698, -0.25949355959892273, -0.18251968920230865, -0.10554581880569458, -0.0285719633102417, 0.04840192198753357, 0.12537580728530884, 0.20234966278076172, 0.2793235182762146, 0.35629740357398987, 0.43327128887176514, 0.510245144367218, 0.5872189998626709, 0.6641929149627686, 0.7411667704582214, 0.8181406259536743, 0.8951144814491272, 0.9720883369445801, 1.0490622520446777, 1.1260361671447754, 1.2030099630355835, 1.2799838781356812, 1.3569576740264893, 1.433931589126587, 1.5109055042266846, 1.5878793001174927, 1.6648532152175903, 1.7418270111083984, 1.818800926208496, 1.8957748413085938, 1.9727487564086914, 2.049722671508789, 2.1266965866088867, 2.2036705017089844, 2.280644178390503, 2.3576180934906006, 2.4345920085906982, 2.511565923690796, 2.5885398387908936, 2.665513515472412]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 16.0, 17.0, 18.0, 16.0, 21.0, 30.0, 34.0, 39.0, 45.0, 75.0, 50.0, 58.0, 55.0, 65.0, 56.0, 52.0, 58.0, 38.0, 35.0, 44.0, 35.0, 26.0, 27.0, 22.0, 14.0, 21.0, 7.0, 5.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0105741024017334, -1.9584375619888306, -1.9063009023666382, -1.8541643619537354, -1.802027702331543, -1.7498911619186401, -1.6977545022964478, -1.645617961883545, -1.5934813022613525, -1.5413447618484497, -1.4892081022262573, -1.4370715618133545, -1.384934902191162, -1.3327983617782593, -1.280661702156067, -1.228525161743164, -1.1763885021209717, -1.1242519617080688, -1.0721153020858765, -1.0199787616729736, -0.9678421020507812, -0.9157055616378784, -0.863568902015686, -0.8114323616027832, -0.7592958211898804, -0.7071592211723328, -0.6550226211547852, -0.6028860211372375, -0.5507494211196899, -0.4986128509044647, -0.4464762508869171, -0.3943396508693695, -0.3422030210494995, -0.2900664210319519, -0.2379298210144043, -0.18579323589801788, -0.13365663588047028, -0.08152005076408386, -0.029383450746536255, 0.022753149271011353, 0.07488974928855896, 0.12702634930610657, 0.17916294932365417, 0.2312995344400406, 0.283436119556427, 0.3355727195739746, 0.3877093195915222, 0.4398459196090698, 0.49198251962661743, 0.544119119644165, 0.5962557196617126, 0.6483923196792603, 0.7005289196968079, 0.7526655197143555, 0.8048020601272583, 0.8569387197494507, 0.9090752601623535, 0.9612118601799011, 1.0133484601974487, 1.0654850006103516, 1.117621660232544, 1.1697582006454468, 1.2218948602676392, 1.274031400680542, 1.3261680603027344]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 4.0, 6.0, 9.0, 14.0, 41.0, 46.0, 97.0, 187.0, 257.0, 601.0, 1382.0, 3835.0, 12938.0, 61692.0, 375168.0, 480561.0, 87245.0, 16772.0, 4559.0, 1672.0, 726.0, 333.0, 179.0, 84.0, 54.0, 27.0, 26.0, 20.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5673828125, -1.5023345947265625, -1.437286376953125, -1.3722381591796875, -1.30718994140625, -1.2421417236328125, -1.177093505859375, -1.1120452880859375, -1.0469970703125, -0.9819488525390625, -0.916900634765625, -0.8518524169921875, -0.78680419921875, -0.7217559814453125, -0.656707763671875, -0.5916595458984375, -0.526611328125, -0.4615631103515625, -0.396514892578125, -0.3314666748046875, -0.26641845703125, -0.2013702392578125, -0.136322021484375, -0.0712738037109375, -0.0062255859375, 0.0588226318359375, 0.123870849609375, 0.1889190673828125, 0.25396728515625, 0.3190155029296875, 0.384063720703125, 0.4491119384765625, 0.51416015625, 0.5792083740234375, 0.644256591796875, 0.7093048095703125, 0.77435302734375, 0.8394012451171875, 0.904449462890625, 0.9694976806640625, 1.0345458984375, 1.0995941162109375, 1.164642333984375, 1.2296905517578125, 1.29473876953125, 1.3597869873046875, 1.424835205078125, 1.4898834228515625, 1.554931640625, 1.6199798583984375, 1.685028076171875, 1.7500762939453125, 1.81512451171875, 1.8801727294921875, 1.945220947265625, 2.0102691650390625, 2.0753173828125, 2.1403656005859375, 2.205413818359375, 2.2704620361328125, 2.33551025390625, 2.4005584716796875, 2.465606689453125, 2.5306549072265625, 2.595703125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 14.0, 3.0, 14.0, 10.0, 15.0, 21.0, 36.0, 37.0, 38.0, 48.0, 55.0, 56.0, 84.0, 68.0, 71.0, 66.0, 54.0, 49.0, 51.0, 33.0, 34.0, 21.0, 18.0, 23.0, 16.0, 12.0, 14.0, 11.0, 4.0, 1.0, 4.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71923828125, -0.6906051635742188, -0.6619720458984375, -0.6333389282226562, -0.604705810546875, -0.5760726928710938, -0.5474395751953125, -0.5188064575195312, -0.49017333984375, -0.46154022216796875, -0.4329071044921875, -0.40427398681640625, -0.375640869140625, -0.34700775146484375, -0.3183746337890625, -0.28974151611328125, -0.2611083984375, -0.23247528076171875, -0.2038421630859375, -0.17520904541015625, -0.146575927734375, -0.11794281005859375, -0.0893096923828125, -0.06067657470703125, -0.03204345703125, -0.00341033935546875, 0.0252227783203125, 0.05385589599609375, 0.082489013671875, 0.11112213134765625, 0.1397552490234375, 0.16838836669921875, 0.197021484375, 0.22565460205078125, 0.2542877197265625, 0.28292083740234375, 0.311553955078125, 0.34018707275390625, 0.3688201904296875, 0.39745330810546875, 0.42608642578125, 0.45471954345703125, 0.4833526611328125, 0.5119857788085938, 0.540618896484375, 0.5692520141601562, 0.5978851318359375, 0.6265182495117188, 0.6551513671875, 0.6837844848632812, 0.7124176025390625, 0.7410507202148438, 0.769683837890625, 0.7983169555664062, 0.8269500732421875, 0.8555831909179688, 0.88421630859375, 0.9128494262695312, 0.9414825439453125, 0.9701156616210938, 0.998748779296875, 1.0273818969726562, 1.0560150146484375, 1.0846481323242188, 1.11328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 8.0, 4.0, 10.0, 15.0, 21.0, 21.0, 30.0, 47.0, 68.0, 117.0, 172.0, 247.0, 454.0, 839.0, 1549.0, 4559.0, 27186.0, 383456.0, 577957.0, 41518.0, 5956.0, 1962.0, 927.0, 542.0, 325.0, 176.0, 117.0, 78.0, 55.0, 32.0, 26.0, 16.0, 17.0, 5.0, 10.0, 5.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.60546875, -2.52166748046875, -2.4378662109375, -2.35406494140625, -2.270263671875, -2.18646240234375, -2.1026611328125, -2.01885986328125, -1.93505859375, -1.85125732421875, -1.7674560546875, -1.68365478515625, -1.599853515625, -1.51605224609375, -1.4322509765625, -1.34844970703125, -1.2646484375, -1.18084716796875, -1.0970458984375, -1.01324462890625, -0.929443359375, -0.84564208984375, -0.7618408203125, -0.67803955078125, -0.59423828125, -0.51043701171875, -0.4266357421875, -0.34283447265625, -0.259033203125, -0.17523193359375, -0.0914306640625, -0.00762939453125, 0.076171875, 0.15997314453125, 0.2437744140625, 0.32757568359375, 0.411376953125, 0.49517822265625, 0.5789794921875, 0.66278076171875, 0.74658203125, 0.83038330078125, 0.9141845703125, 0.99798583984375, 1.081787109375, 1.16558837890625, 1.2493896484375, 1.33319091796875, 1.4169921875, 1.50079345703125, 1.5845947265625, 1.66839599609375, 1.752197265625, 1.83599853515625, 1.9197998046875, 2.00360107421875, 2.08740234375, 2.17120361328125, 2.2550048828125, 2.33880615234375, 2.422607421875, 2.50640869140625, 2.5902099609375, 2.67401123046875, 2.7578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 11.0, 7.0, 22.0, 20.0, 24.0, 31.0, 30.0, 42.0, 45.0, 66.0, 60.0, 78.0, 70.0, 72.0, 64.0, 60.0, 56.0, 47.0, 45.0, 31.0, 24.0, 12.0, 20.0, 16.0, 16.0, 5.0, 4.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.01171875, -4.85626220703125, -4.7008056640625, -4.54534912109375, -4.389892578125, -4.23443603515625, -4.0789794921875, -3.92352294921875, -3.76806640625, -3.61260986328125, -3.4571533203125, -3.30169677734375, -3.146240234375, -2.99078369140625, -2.8353271484375, -2.67987060546875, -2.5244140625, -2.36895751953125, -2.2135009765625, -2.05804443359375, -1.902587890625, -1.74713134765625, -1.5916748046875, -1.43621826171875, -1.28076171875, -1.12530517578125, -0.9698486328125, -0.81439208984375, -0.658935546875, -0.50347900390625, -0.3480224609375, -0.19256591796875, -0.037109375, 0.11834716796875, 0.2738037109375, 0.42926025390625, 0.584716796875, 0.74017333984375, 0.8956298828125, 1.05108642578125, 1.20654296875, 1.36199951171875, 1.5174560546875, 1.67291259765625, 1.828369140625, 1.98382568359375, 2.1392822265625, 2.29473876953125, 2.4501953125, 2.60565185546875, 2.7611083984375, 2.91656494140625, 3.072021484375, 3.22747802734375, 3.3829345703125, 3.53839111328125, 3.69384765625, 3.84930419921875, 4.0047607421875, 4.16021728515625, 4.315673828125, 4.47113037109375, 4.6265869140625, 4.78204345703125, 4.9375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 3.0, 2.0, 6.0, 6.0, 15.0, 22.0, 12.0, 38.0, 31.0, 55.0, 91.0, 137.0, 259.0, 470.0, 1224.0, 4365.0, 59260.0, 910872.0, 64724.0, 4506.0, 1258.0, 475.0, 257.0, 162.0, 87.0, 61.0, 40.0, 36.0, 18.0, 11.0, 6.0, 9.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9609375, -1.89666748046875, -1.8323974609375, -1.76812744140625, -1.703857421875, -1.63958740234375, -1.5753173828125, -1.51104736328125, -1.44677734375, -1.38250732421875, -1.3182373046875, -1.25396728515625, -1.189697265625, -1.12542724609375, -1.0611572265625, -0.99688720703125, -0.9326171875, -0.86834716796875, -0.8040771484375, -0.73980712890625, -0.675537109375, -0.61126708984375, -0.5469970703125, -0.48272705078125, -0.41845703125, -0.35418701171875, -0.2899169921875, -0.22564697265625, -0.161376953125, -0.09710693359375, -0.0328369140625, 0.03143310546875, 0.095703125, 0.15997314453125, 0.2242431640625, 0.28851318359375, 0.352783203125, 0.41705322265625, 0.4813232421875, 0.54559326171875, 0.60986328125, 0.67413330078125, 0.7384033203125, 0.80267333984375, 0.866943359375, 0.93121337890625, 0.9954833984375, 1.05975341796875, 1.1240234375, 1.18829345703125, 1.2525634765625, 1.31683349609375, 1.381103515625, 1.44537353515625, 1.5096435546875, 1.57391357421875, 1.63818359375, 1.70245361328125, 1.7667236328125, 1.83099365234375, 1.895263671875, 1.95953369140625, 2.0238037109375, 2.08807373046875, 2.15234375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 11.0, 9.0, 9.0, 19.0, 26.0, 31.0, 36.0, 43.0, 52.0, 76.0, 84.0, 127.0, 89.0, 82.0, 70.0, 47.0, 41.0, 42.0, 24.0, 20.0, 20.0, 10.0, 6.0, 5.0, 7.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001537799835205078, -0.00014876574277877808, -0.00014375150203704834, -0.0001387372612953186, -0.00013372302055358887, -0.00012870877981185913, -0.0001236945390701294, -0.00011868029832839966, -0.00011366605758666992, -0.00010865181684494019, -0.00010363757610321045, -9.862333536148071e-05, -9.360909461975098e-05, -8.859485387802124e-05, -8.35806131362915e-05, -7.856637239456177e-05, -7.355213165283203e-05, -6.85378909111023e-05, -6.352365016937256e-05, -5.850940942764282e-05, -5.3495168685913086e-05, -4.848092794418335e-05, -4.346668720245361e-05, -3.845244646072388e-05, -3.343820571899414e-05, -2.8423964977264404e-05, -2.3409724235534668e-05, -1.839548349380493e-05, -1.3381242752075195e-05, -8.367002010345459e-06, -3.3527612686157227e-06, 1.6614794731140137e-06, 6.67572021484375e-06, 1.1689960956573486e-05, 1.6704201698303223e-05, 2.171844244003296e-05, 2.6732683181762695e-05, 3.174692392349243e-05, 3.676116466522217e-05, 4.1775405406951904e-05, 4.678964614868164e-05, 5.180388689041138e-05, 5.681812763214111e-05, 6.183236837387085e-05, 6.684660911560059e-05, 7.186084985733032e-05, 7.687509059906006e-05, 8.18893313407898e-05, 8.690357208251953e-05, 9.191781282424927e-05, 9.6932053565979e-05, 0.00010194629430770874, 0.00010696053504943848, 0.00011197477579116821, 0.00011698901653289795, 0.00012200325727462769, 0.00012701749801635742, 0.00013203173875808716, 0.0001370459794998169, 0.00014206022024154663, 0.00014707446098327637, 0.0001520887017250061, 0.00015710294246673584, 0.00016211718320846558, 0.0001671314239501953]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 9.0, 13.0, 37.0, 31.0, 47.0, 75.0, 164.0, 329.0, 774.0, 2461.0, 14865.0, 497998.0, 512880.0, 14923.0, 2439.0, 767.0, 325.0, 160.0, 86.0, 62.0, 30.0, 22.0, 9.0, 7.0, 10.0, 9.0, 1.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4267578125, -1.3647308349609375, -1.302703857421875, -1.2406768798828125, -1.17864990234375, -1.1166229248046875, -1.054595947265625, -0.9925689697265625, -0.9305419921875, -0.8685150146484375, -0.806488037109375, -0.7444610595703125, -0.68243408203125, -0.6204071044921875, -0.558380126953125, -0.4963531494140625, -0.434326171875, -0.3722991943359375, -0.310272216796875, -0.2482452392578125, -0.18621826171875, -0.1241912841796875, -0.062164306640625, -0.0001373291015625, 0.0618896484375, 0.1239166259765625, 0.185943603515625, 0.2479705810546875, 0.30999755859375, 0.3720245361328125, 0.434051513671875, 0.4960784912109375, 0.55810546875, 0.6201324462890625, 0.682159423828125, 0.7441864013671875, 0.80621337890625, 0.8682403564453125, 0.930267333984375, 0.9922943115234375, 1.0543212890625, 1.1163482666015625, 1.178375244140625, 1.2404022216796875, 1.30242919921875, 1.3644561767578125, 1.426483154296875, 1.4885101318359375, 1.550537109375, 1.6125640869140625, 1.674591064453125, 1.7366180419921875, 1.79864501953125, 1.8606719970703125, 1.922698974609375, 1.9847259521484375, 2.0467529296875, 2.1087799072265625, 2.170806884765625, 2.2328338623046875, 2.29486083984375, 2.3568878173828125, 2.418914794921875, 2.4809417724609375, 2.54296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 5.0, 8.0, 9.0, 18.0, 12.0, 31.0, 26.0, 43.0, 40.0, 69.0, 67.0, 87.0, 82.0, 86.0, 71.0, 82.0, 50.0, 46.0, 33.0, 34.0, 20.0, 18.0, 10.0, 8.0, 9.0, 10.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.45703125, -1.414154052734375, -1.37127685546875, -1.328399658203125, -1.2855224609375, -1.242645263671875, -1.19976806640625, -1.156890869140625, -1.114013671875, -1.071136474609375, -1.02825927734375, -0.985382080078125, -0.9425048828125, -0.899627685546875, -0.85675048828125, -0.813873291015625, -0.77099609375, -0.728118896484375, -0.68524169921875, -0.642364501953125, -0.5994873046875, -0.556610107421875, -0.51373291015625, -0.470855712890625, -0.427978515625, -0.385101318359375, -0.34222412109375, -0.299346923828125, -0.2564697265625, -0.213592529296875, -0.17071533203125, -0.127838134765625, -0.0849609375, -0.042083740234375, 0.00079345703125, 0.043670654296875, 0.0865478515625, 0.129425048828125, 0.17230224609375, 0.215179443359375, 0.258056640625, 0.300933837890625, 0.34381103515625, 0.386688232421875, 0.4295654296875, 0.472442626953125, 0.51531982421875, 0.558197021484375, 0.60107421875, 0.643951416015625, 0.68682861328125, 0.729705810546875, 0.7725830078125, 0.815460205078125, 0.85833740234375, 0.901214599609375, 0.944091796875, 0.986968994140625, 1.02984619140625, 1.072723388671875, 1.1156005859375, 1.158477783203125, 1.20135498046875, 1.244232177734375, 1.287109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 8.0, 7.0, 11.0, 25.0, 46.0, 72.0, 118.0, 165.0, 184.0, 151.0, 92.0, 67.0, 28.0, 16.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.17974090576172, -19.559104919433594, -18.93846893310547, -18.317834854125977, -17.69719886779785, -17.076562881469727, -16.4559268951416, -15.835291862487793, -15.214656829833984, -14.59402084350586, -13.97338581085205, -13.352749824523926, -12.732114791870117, -12.111478805541992, -11.490842819213867, -10.870207786560059, -10.249571800231934, -9.628935813903809, -9.00830078125, -8.387664794921875, -7.767029762268066, -7.146393775939941, -6.525758266448975, -5.905122756958008, -5.284487247467041, -4.663851737976074, -4.043216228485107, -3.4225804805755615, -2.8019449710845947, -2.181309461593628, -1.560673713684082, -0.9400382041931152, -0.31940269470214844, 0.30123287439346313, 0.9218684434890747, 1.542504072189331, 2.163139581680298, 2.7837750911712646, 3.4044108390808105, 4.025046348571777, 4.645681858062744, 5.266317367553711, 5.886952877044678, 6.5075883865356445, 7.1282243728637695, 7.748859405517578, 8.369495391845703, 8.990131378173828, 9.610766410827637, 10.231402397155762, 10.85203742980957, 11.472673416137695, 12.093308448791504, 12.713944435119629, 13.334579467773438, 13.955215454101562, 14.575851440429688, 15.196487426757812, 15.817122459411621, 16.43775749206543, 17.058393478393555, 17.67902946472168, 18.299665451049805, 18.920299530029297, 19.540935516357422]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 6.0, 3.0, 8.0, 8.0, 17.0, 11.0, 19.0, 17.0, 26.0, 45.0, 46.0, 41.0, 68.0, 52.0, 55.0, 62.0, 73.0, 52.0, 52.0, 52.0, 53.0, 43.0, 35.0, 32.0, 26.0, 28.0, 15.0, 14.0, 13.0, 9.0, 8.0, 10.0, 9.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.626644134521484, -17.07843017578125, -16.530216217041016, -15.982003211975098, -15.43379020690918, -14.885576248168945, -14.337362289428711, -13.789148330688477, -13.240935325622559, -12.692721366882324, -12.144508361816406, -11.596294403076172, -11.048080444335938, -10.49986743927002, -9.951653480529785, -9.403440475463867, -8.855226516723633, -8.307012557983398, -7.7587995529174805, -7.210585594177246, -6.66237211227417, -6.114158630371094, -5.565944671630859, -5.017731189727783, -4.469517707824707, -3.921304225921631, -3.3730905055999756, -2.8248767852783203, -2.276663303375244, -1.728449821472168, -1.1802361011505127, -0.6320223808288574, -0.08380889892578125, 0.4644047021865845, 1.0126183032989502, 1.560831904411316, 2.1090455055236816, 2.657258987426758, 3.205472707748413, 3.7536864280700684, 4.3018999099731445, 4.850113391876221, 5.398326873779297, 5.946540832519531, 6.494754314422607, 7.042967796325684, 7.591181755065918, 8.139394760131836, 8.68760871887207, 9.235822677612305, 9.784035682678223, 10.332249641418457, 10.880462646484375, 11.42867660522461, 11.976890563964844, 12.525104522705078, 13.073317527770996, 13.62153148651123, 14.169744491577148, 14.717958450317383, 15.266172409057617, 15.814385414123535, 16.362598419189453, 16.910812377929688, 17.459026336669922]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 13.0, 18.0, 41.0, 78.0, 90.0, 177.0, 357.0, 733.0, 1906.0, 6719.0, 39895.0, 3628608.0, 481650.0, 26058.0, 4904.0, 1632.0, 636.0, 319.0, 185.0, 96.0, 42.0, 43.0, 14.0, 19.0, 6.0, 9.0, 8.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.693359375, -2.611480712890625, -2.52960205078125, -2.447723388671875, -2.3658447265625, -2.283966064453125, -2.20208740234375, -2.120208740234375, -2.038330078125, -1.956451416015625, -1.87457275390625, -1.792694091796875, -1.7108154296875, -1.628936767578125, -1.54705810546875, -1.465179443359375, -1.38330078125, -1.301422119140625, -1.21954345703125, -1.137664794921875, -1.0557861328125, -0.973907470703125, -0.89202880859375, -0.810150146484375, -0.728271484375, -0.646392822265625, -0.56451416015625, -0.482635498046875, -0.4007568359375, -0.318878173828125, -0.23699951171875, -0.155120849609375, -0.0732421875, 0.008636474609375, 0.09051513671875, 0.172393798828125, 0.2542724609375, 0.336151123046875, 0.41802978515625, 0.499908447265625, 0.581787109375, 0.663665771484375, 0.74554443359375, 0.827423095703125, 0.9093017578125, 0.991180419921875, 1.07305908203125, 1.154937744140625, 1.23681640625, 1.318695068359375, 1.40057373046875, 1.482452392578125, 1.5643310546875, 1.646209716796875, 1.72808837890625, 1.809967041015625, 1.891845703125, 1.973724365234375, 2.05560302734375, 2.137481689453125, 2.2193603515625, 2.301239013671875, 2.38311767578125, 2.464996337890625, 2.546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 13.0, 17.0, 19.0, 35.0, 35.0, 30.0, 47.0, 60.0, 71.0, 68.0, 80.0, 88.0, 66.0, 60.0, 45.0, 55.0, 57.0, 34.0, 29.0, 20.0, 20.0, 9.0, 5.0, 8.0, 7.0, 5.0, 1.0, 6.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.162109375, -1.1309432983398438, -1.0997772216796875, -1.0686111450195312, -1.037445068359375, -1.0062789916992188, -0.9751129150390625, -0.9439468383789062, -0.91278076171875, -0.8816146850585938, -0.8504486083984375, -0.8192825317382812, -0.788116455078125, -0.7569503784179688, -0.7257843017578125, -0.6946182250976562, -0.6634521484375, -0.6322860717773438, -0.6011199951171875, -0.5699539184570312, -0.538787841796875, -0.5076217651367188, -0.4764556884765625, -0.44528961181640625, -0.41412353515625, -0.38295745849609375, -0.3517913818359375, -0.32062530517578125, -0.289459228515625, -0.25829315185546875, -0.2271270751953125, -0.19596099853515625, -0.164794921875, -0.13362884521484375, -0.1024627685546875, -0.07129669189453125, -0.040130615234375, -0.00896453857421875, 0.0222015380859375, 0.05336761474609375, 0.08453369140625, 0.11569976806640625, 0.1468658447265625, 0.17803192138671875, 0.209197998046875, 0.24036407470703125, 0.2715301513671875, 0.30269622802734375, 0.3338623046875, 0.36502838134765625, 0.3961944580078125, 0.42736053466796875, 0.458526611328125, 0.48969268798828125, 0.5208587646484375, 0.5520248413085938, 0.58319091796875, 0.6143569946289062, 0.6455230712890625, 0.6766891479492188, 0.707855224609375, 0.7390213012695312, 0.7701873779296875, 0.8013534545898438, 0.83251953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 7.0, 13.0, 19.0, 21.0, 27.0, 39.0, 42.0, 81.0, 99.0, 192.0, 259.0, 361.0, 628.0, 965.0, 1924.0, 3756.0, 8708.0, 23567.0, 85879.0, 666038.0, 3189817.0, 152685.0, 36145.0, 12225.0, 5062.0, 2294.0, 1289.0, 747.0, 463.0, 292.0, 192.0, 151.0, 78.0, 50.0, 50.0, 34.0, 25.0, 15.0, 11.0, 4.0, 4.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.2177734375, -1.1821441650390625, -1.146514892578125, -1.1108856201171875, -1.07525634765625, -1.0396270751953125, -1.003997802734375, -0.9683685302734375, -0.9327392578125, -0.8971099853515625, -0.861480712890625, -0.8258514404296875, -0.79022216796875, -0.7545928955078125, -0.718963623046875, -0.6833343505859375, -0.647705078125, -0.6120758056640625, -0.576446533203125, -0.5408172607421875, -0.50518798828125, -0.4695587158203125, -0.433929443359375, -0.3983001708984375, -0.3626708984375, -0.3270416259765625, -0.291412353515625, -0.2557830810546875, -0.22015380859375, -0.1845245361328125, -0.148895263671875, -0.1132659912109375, -0.07763671875, -0.0420074462890625, -0.006378173828125, 0.0292510986328125, 0.06488037109375, 0.1005096435546875, 0.136138916015625, 0.1717681884765625, 0.2073974609375, 0.2430267333984375, 0.278656005859375, 0.3142852783203125, 0.34991455078125, 0.3855438232421875, 0.421173095703125, 0.4568023681640625, 0.492431640625, 0.5280609130859375, 0.563690185546875, 0.5993194580078125, 0.63494873046875, 0.6705780029296875, 0.706207275390625, 0.7418365478515625, 0.7774658203125, 0.8130950927734375, 0.848724365234375, 0.8843536376953125, 0.91998291015625, 0.9556121826171875, 0.991241455078125, 1.0268707275390625, 1.0625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 17.0, 31.0, 70.0, 123.0, 273.0, 2337.0, 800.0, 206.0, 89.0, 46.0, 29.0, 18.0, 9.0, 12.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.314453125, -1.2805938720703125, -1.246734619140625, -1.2128753662109375, -1.17901611328125, -1.1451568603515625, -1.111297607421875, -1.0774383544921875, -1.0435791015625, -1.0097198486328125, -0.975860595703125, -0.9420013427734375, -0.90814208984375, -0.8742828369140625, -0.840423583984375, -0.8065643310546875, -0.772705078125, -0.7388458251953125, -0.704986572265625, -0.6711273193359375, -0.63726806640625, -0.6034088134765625, -0.569549560546875, -0.5356903076171875, -0.5018310546875, -0.4679718017578125, -0.434112548828125, -0.4002532958984375, -0.36639404296875, -0.3325347900390625, -0.298675537109375, -0.2648162841796875, -0.23095703125, -0.1970977783203125, -0.163238525390625, -0.1293792724609375, -0.09552001953125, -0.0616607666015625, -0.027801513671875, 0.0060577392578125, 0.0399169921875, 0.0737762451171875, 0.107635498046875, 0.1414947509765625, 0.17535400390625, 0.2092132568359375, 0.243072509765625, 0.2769317626953125, 0.310791015625, 0.3446502685546875, 0.378509521484375, 0.4123687744140625, 0.44622802734375, 0.4800872802734375, 0.513946533203125, 0.5478057861328125, 0.5816650390625, 0.6155242919921875, 0.649383544921875, 0.6832427978515625, 0.71710205078125, 0.7509613037109375, 0.784820556640625, 0.8186798095703125, 0.8525390625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 13.0, 14.0, 24.0, 35.0, 42.0, 56.0, 79.0, 80.0, 104.0, 107.0, 112.0, 89.0, 71.0, 50.0, 33.0, 23.0, 20.0, 11.0, 6.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671140670776367, -2.5839414596557617, -2.4967422485351562, -2.40954327583313, -2.3223440647125244, -2.235144853591919, -2.1479458808898926, -2.060746669769287, -1.9735474586486816, -1.8863482475280762, -1.7991491556167603, -1.7119500637054443, -1.6247508525848389, -1.5375516414642334, -1.4503525495529175, -1.3631534576416016, -1.275954246520996, -1.1887550354003906, -1.1015559434890747, -1.0143568515777588, -0.9271576404571533, -0.8399584889411926, -0.7527593374252319, -0.6655601859092712, -0.5783610343933105, -0.49116188287734985, -0.40396273136138916, -0.31676357984542847, -0.22956442832946777, -0.14236527681350708, -0.05516612529754639, 0.03203302621841431, 0.119232177734375, 0.2064313292503357, 0.2936304807662964, 0.3808296322822571, 0.4680287837982178, 0.5552279353141785, 0.6424270868301392, 0.7296262383460999, 0.8168253898620605, 0.9040245413780212, 0.9912236928939819, 1.0784227848052979, 1.1656219959259033, 1.2528212070465088, 1.3400202989578247, 1.4272193908691406, 1.514418601989746, 1.6016178131103516, 1.6888169050216675, 1.7760159969329834, 1.8632152080535889, 1.9504144191741943, 2.0376133918762207, 2.124812602996826, 2.2120118141174316, 2.299211025238037, 2.3864102363586426, 2.473609209060669, 2.5608084201812744, 2.64800763130188, 2.7352066040039062, 2.8224058151245117, 2.909605026245117]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 5.0, 9.0, 7.0, 7.0, 21.0, 10.0, 16.0, 21.0, 19.0, 28.0, 22.0, 36.0, 32.0, 45.0, 30.0, 40.0, 53.0, 59.0, 48.0, 53.0, 56.0, 50.0, 51.0, 38.0, 33.0, 31.0, 32.0, 21.0, 23.0, 25.0, 19.0, 16.0, 11.0, 12.0, 11.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9932039976119995, -1.91867196559906, -1.844139814376831, -1.7696077823638916, -1.6950757503509521, -1.6205437183380127, -1.5460115671157837, -1.4714795351028442, -1.3969473838806152, -1.3224153518676758, -1.2478832006454468, -1.1733511686325073, -1.0988191366195679, -1.0242869853973389, -0.9497549533843994, -0.87522292137146, -0.8006908893585205, -0.7261587977409363, -0.6516267657279968, -0.5770946741104126, -0.5025626420974731, -0.4280305504798889, -0.3534984588623047, -0.27896642684936523, -0.204434335231781, -0.12990227341651917, -0.05537019670009613, 0.019161880016326904, 0.09369394183158875, 0.16822600364685059, 0.24275809526443481, 0.31729012727737427, 0.39182209968566895, 0.4663541615009308, 0.5408862233161926, 0.6154183149337769, 0.6899503469467163, 0.7644824385643005, 0.8390145301818848, 0.9135465621948242, 0.9880786538124084, 1.0626107454299927, 1.1371427774429321, 1.2116749286651611, 1.2862069606781006, 1.36073899269104, 1.4352710247039795, 1.509803056716919, 1.584335207939148, 1.6588672399520874, 1.7333993911743164, 1.8079314231872559, 1.8824634552001953, 1.9569954872131348, 2.031527519226074, 2.1060595512390137, 2.1805918216705322, 2.2551238536834717, 2.329655885696411, 2.4041881561279297, 2.478720188140869, 2.5532522201538086, 2.627784252166748, 2.7023162841796875, 2.776848316192627]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0, 8.0, 17.0, 24.0, 50.0, 101.0, 246.0, 720.0, 2891.0, 18930.0, 255012.0, 696962.0, 64829.0, 6741.0, 1355.0, 383.0, 145.0, 51.0, 28.0, 16.0, 14.0, 11.0, 7.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.287109375, -3.1851806640625, -3.083251953125, -2.9813232421875, -2.87939453125, -2.7774658203125, -2.675537109375, -2.5736083984375, -2.4716796875, -2.3697509765625, -2.267822265625, -2.1658935546875, -2.06396484375, -1.9620361328125, -1.860107421875, -1.7581787109375, -1.65625, -1.5543212890625, -1.452392578125, -1.3504638671875, -1.24853515625, -1.1466064453125, -1.044677734375, -0.9427490234375, -0.8408203125, -0.7388916015625, -0.636962890625, -0.5350341796875, -0.43310546875, -0.3311767578125, -0.229248046875, -0.1273193359375, -0.025390625, 0.0765380859375, 0.178466796875, 0.2803955078125, 0.38232421875, 0.4842529296875, 0.586181640625, 0.6881103515625, 0.7900390625, 0.8919677734375, 0.993896484375, 1.0958251953125, 1.19775390625, 1.2996826171875, 1.401611328125, 1.5035400390625, 1.60546875, 1.7073974609375, 1.809326171875, 1.9112548828125, 2.01318359375, 2.1151123046875, 2.217041015625, 2.3189697265625, 2.4208984375, 2.5228271484375, 2.624755859375, 2.7266845703125, 2.82861328125, 2.9305419921875, 3.032470703125, 3.1343994140625, 3.236328125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 7.0, 7.0, 6.0, 7.0, 19.0, 28.0, 33.0, 45.0, 48.0, 38.0, 54.0, 58.0, 73.0, 70.0, 58.0, 75.0, 57.0, 52.0, 48.0, 42.0, 35.0, 40.0, 24.0, 17.0, 16.0, 12.0, 9.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.92041015625, -0.8918914794921875, -0.863372802734375, -0.8348541259765625, -0.80633544921875, -0.7778167724609375, -0.749298095703125, -0.7207794189453125, -0.6922607421875, -0.6637420654296875, -0.635223388671875, -0.6067047119140625, -0.57818603515625, -0.5496673583984375, -0.521148681640625, -0.4926300048828125, -0.464111328125, -0.4355926513671875, -0.407073974609375, -0.3785552978515625, -0.35003662109375, -0.3215179443359375, -0.292999267578125, -0.2644805908203125, -0.2359619140625, -0.2074432373046875, -0.178924560546875, -0.1504058837890625, -0.12188720703125, -0.0933685302734375, -0.064849853515625, -0.0363311767578125, -0.0078125, 0.0207061767578125, 0.049224853515625, 0.0777435302734375, 0.10626220703125, 0.1347808837890625, 0.163299560546875, 0.1918182373046875, 0.2203369140625, 0.2488555908203125, 0.277374267578125, 0.3058929443359375, 0.33441162109375, 0.3629302978515625, 0.391448974609375, 0.4199676513671875, 0.448486328125, 0.4770050048828125, 0.505523681640625, 0.5340423583984375, 0.56256103515625, 0.5910797119140625, 0.619598388671875, 0.6481170654296875, 0.6766357421875, 0.7051544189453125, 0.733673095703125, 0.7621917724609375, 0.79071044921875, 0.8192291259765625, 0.847747802734375, 0.8762664794921875, 0.90478515625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 7.0, 16.0, 13.0, 27.0, 40.0, 50.0, 88.0, 131.0, 230.0, 452.0, 974.0, 2630.0, 13541.0, 275833.0, 716108.0, 31532.0, 4236.0, 1251.0, 603.0, 296.0, 168.0, 91.0, 71.0, 50.0, 25.0, 21.0, 13.0, 10.0, 9.0, 5.0, 2.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.57257080078125, -2.4615478515625, -2.35052490234375, -2.239501953125, -2.12847900390625, -2.0174560546875, -1.90643310546875, -1.79541015625, -1.68438720703125, -1.5733642578125, -1.46234130859375, -1.351318359375, -1.24029541015625, -1.1292724609375, -1.01824951171875, -0.9072265625, -0.79620361328125, -0.6851806640625, -0.57415771484375, -0.463134765625, -0.35211181640625, -0.2410888671875, -0.13006591796875, -0.01904296875, 0.09197998046875, 0.2030029296875, 0.31402587890625, 0.425048828125, 0.53607177734375, 0.6470947265625, 0.75811767578125, 0.869140625, 0.98016357421875, 1.0911865234375, 1.20220947265625, 1.313232421875, 1.42425537109375, 1.5352783203125, 1.64630126953125, 1.75732421875, 1.86834716796875, 1.9793701171875, 2.09039306640625, 2.201416015625, 2.31243896484375, 2.4234619140625, 2.53448486328125, 2.6455078125, 2.75653076171875, 2.8675537109375, 2.97857666015625, 3.089599609375, 3.20062255859375, 3.3116455078125, 3.42266845703125, 3.53369140625, 3.64471435546875, 3.7557373046875, 3.86676025390625, 3.977783203125, 4.08880615234375, 4.1998291015625, 4.31085205078125, 4.421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 1.0, 13.0, 7.0, 12.0, 15.0, 13.0, 28.0, 29.0, 36.0, 39.0, 51.0, 44.0, 60.0, 70.0, 59.0, 68.0, 61.0, 55.0, 49.0, 62.0, 39.0, 32.0, 33.0, 25.0, 23.0, 11.0, 10.0, 13.0, 5.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.49609375, -4.377288818359375, -4.25848388671875, -4.139678955078125, -4.0208740234375, -3.902069091796875, -3.78326416015625, -3.664459228515625, -3.545654296875, -3.426849365234375, -3.30804443359375, -3.189239501953125, -3.0704345703125, -2.951629638671875, -2.83282470703125, -2.714019775390625, -2.59521484375, -2.476409912109375, -2.35760498046875, -2.238800048828125, -2.1199951171875, -2.001190185546875, -1.88238525390625, -1.763580322265625, -1.644775390625, -1.525970458984375, -1.40716552734375, -1.288360595703125, -1.1695556640625, -1.050750732421875, -0.93194580078125, -0.813140869140625, -0.6943359375, -0.575531005859375, -0.45672607421875, -0.337921142578125, -0.2191162109375, -0.100311279296875, 0.01849365234375, 0.137298583984375, 0.256103515625, 0.374908447265625, 0.49371337890625, 0.612518310546875, 0.7313232421875, 0.850128173828125, 0.96893310546875, 1.087738037109375, 1.20654296875, 1.325347900390625, 1.44415283203125, 1.562957763671875, 1.6817626953125, 1.800567626953125, 1.91937255859375, 2.038177490234375, 2.156982421875, 2.275787353515625, 2.39459228515625, 2.513397216796875, 2.6322021484375, 2.751007080078125, 2.86981201171875, 2.988616943359375, 3.107421875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 2.0, 2.0, 10.0, 3.0, 9.0, 12.0, 10.0, 28.0, 32.0, 36.0, 79.0, 83.0, 154.0, 226.0, 504.0, 967.0, 2486.0, 9242.0, 59873.0, 575861.0, 351703.0, 36842.0, 6590.0, 1892.0, 805.0, 410.0, 257.0, 138.0, 83.0, 62.0, 49.0, 23.0, 19.0, 19.0, 13.0, 9.0, 6.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7529296875, -0.7259292602539062, -0.6989288330078125, -0.6719284057617188, -0.644927978515625, -0.6179275512695312, -0.5909271240234375, -0.5639266967773438, -0.53692626953125, -0.5099258422851562, -0.4829254150390625, -0.45592498779296875, -0.428924560546875, -0.40192413330078125, -0.3749237060546875, -0.34792327880859375, -0.3209228515625, -0.29392242431640625, -0.2669219970703125, -0.23992156982421875, -0.212921142578125, -0.18592071533203125, -0.1589202880859375, -0.13191986083984375, -0.10491943359375, -0.07791900634765625, -0.0509185791015625, -0.02391815185546875, 0.003082275390625, 0.03008270263671875, 0.0570831298828125, 0.08408355712890625, 0.111083984375, 0.13808441162109375, 0.1650848388671875, 0.19208526611328125, 0.219085693359375, 0.24608612060546875, 0.2730865478515625, 0.30008697509765625, 0.32708740234375, 0.35408782958984375, 0.3810882568359375, 0.40808868408203125, 0.435089111328125, 0.46208953857421875, 0.4890899658203125, 0.5160903930664062, 0.5430908203125, 0.5700912475585938, 0.5970916748046875, 0.6240921020507812, 0.651092529296875, 0.6780929565429688, 0.7050933837890625, 0.7320938110351562, 0.75909423828125, 0.7860946655273438, 0.8130950927734375, 0.8400955200195312, 0.867095947265625, 0.8940963745117188, 0.9210968017578125, 0.9480972290039062, 0.97509765625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 8.0, 2.0, 7.0, 7.0, 9.0, 11.0, 18.0, 14.0, 19.0, 23.0, 32.0, 39.0, 49.0, 47.0, 55.0, 77.0, 88.0, 97.0, 76.0, 70.0, 38.0, 44.0, 31.0, 23.0, 27.0, 16.0, 22.0, 16.0, 12.0, 4.0, 7.0, 4.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013637542724609375, -0.00013183988630771637, -0.000127304345369339, -0.0001227688044309616, -0.00011823326349258423, -0.00011369772255420685, -0.00010916218161582947, -0.00010462664067745209, -0.00010009109973907471, -9.555555880069733e-05, -9.102001786231995e-05, -8.648447692394257e-05, -8.194893598556519e-05, -7.74133950471878e-05, -7.287785410881042e-05, -6.834231317043304e-05, -6.380677223205566e-05, -5.9271231293678284e-05, -5.47356903553009e-05, -5.020014941692352e-05, -4.566460847854614e-05, -4.112906754016876e-05, -3.659352660179138e-05, -3.2057985663414e-05, -2.752244472503662e-05, -2.298690378665924e-05, -1.845136284828186e-05, -1.391582190990448e-05, -9.3802809715271e-06, -4.844740033149719e-06, -3.0919909477233887e-07, 4.2263418436050415e-06, 8.761882781982422e-06, 1.3297423720359802e-05, 1.7832964658737183e-05, 2.2368505597114563e-05, 2.6904046535491943e-05, 3.1439587473869324e-05, 3.5975128412246704e-05, 4.0510669350624084e-05, 4.5046210289001465e-05, 4.9581751227378845e-05, 5.4117292165756226e-05, 5.8652833104133606e-05, 6.318837404251099e-05, 6.772391498088837e-05, 7.225945591926575e-05, 7.679499685764313e-05, 8.133053779602051e-05, 8.586607873439789e-05, 9.040161967277527e-05, 9.493716061115265e-05, 9.947270154953003e-05, 0.00010400824248790741, 0.00010854378342628479, 0.00011307932436466217, 0.00011761486530303955, 0.00012215040624141693, 0.0001266859471797943, 0.0001312214881181717, 0.00013575702905654907, 0.00014029256999492645, 0.00014482811093330383, 0.0001493636518716812, 0.0001538991928100586]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 12.0, 26.0, 31.0, 29.0, 46.0, 62.0, 120.0, 163.0, 262.0, 410.0, 860.0, 1822.0, 5048.0, 19368.0, 145344.0, 711028.0, 136665.0, 18604.0, 4813.0, 1774.0, 816.0, 475.0, 265.0, 158.0, 101.0, 63.0, 45.0, 28.0, 27.0, 15.0, 7.0, 13.0, 4.0, 8.0, 5.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.86279296875, -0.8362350463867188, -0.8096771240234375, -0.7831192016601562, -0.756561279296875, -0.7300033569335938, -0.7034454345703125, -0.6768875122070312, -0.65032958984375, -0.6237716674804688, -0.5972137451171875, -0.5706558227539062, -0.544097900390625, -0.5175399780273438, -0.4909820556640625, -0.46442413330078125, -0.4378662109375, -0.41130828857421875, -0.3847503662109375, -0.35819244384765625, -0.331634521484375, -0.30507659912109375, -0.2785186767578125, -0.25196075439453125, -0.22540283203125, -0.19884490966796875, -0.1722869873046875, -0.14572906494140625, -0.119171142578125, -0.09261322021484375, -0.0660552978515625, -0.03949737548828125, -0.012939453125, 0.01361846923828125, 0.0401763916015625, 0.06673431396484375, 0.093292236328125, 0.11985015869140625, 0.1464080810546875, 0.17296600341796875, 0.19952392578125, 0.22608184814453125, 0.2526397705078125, 0.27919769287109375, 0.305755615234375, 0.33231353759765625, 0.3588714599609375, 0.38542938232421875, 0.4119873046875, 0.43854522705078125, 0.4651031494140625, 0.49166107177734375, 0.518218994140625, 0.5447769165039062, 0.5713348388671875, 0.5978927612304688, 0.62445068359375, 0.6510086059570312, 0.6775665283203125, 0.7041244506835938, 0.730682373046875, 0.7572402954101562, 0.7837982177734375, 0.8103561401367188, 0.8369140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 7.0, 5.0, 5.0, 3.0, 7.0, 11.0, 11.0, 19.0, 20.0, 27.0, 29.0, 44.0, 55.0, 66.0, 67.0, 85.0, 78.0, 70.0, 85.0, 56.0, 53.0, 45.0, 43.0, 14.0, 16.0, 16.0, 18.0, 13.0, 7.0, 4.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.6647872924804688, -0.6420745849609375, -0.6193618774414062, -0.596649169921875, -0.5739364624023438, -0.5512237548828125, -0.5285110473632812, -0.50579833984375, -0.48308563232421875, -0.4603729248046875, -0.43766021728515625, -0.414947509765625, -0.39223480224609375, -0.3695220947265625, -0.34680938720703125, -0.3240966796875, -0.30138397216796875, -0.2786712646484375, -0.25595855712890625, -0.233245849609375, -0.21053314208984375, -0.1878204345703125, -0.16510772705078125, -0.14239501953125, -0.11968231201171875, -0.0969696044921875, -0.07425689697265625, -0.051544189453125, -0.02883148193359375, -0.0061187744140625, 0.01659393310546875, 0.039306640625, 0.06201934814453125, 0.0847320556640625, 0.10744476318359375, 0.130157470703125, 0.15287017822265625, 0.1755828857421875, 0.19829559326171875, 0.22100830078125, 0.24372100830078125, 0.2664337158203125, 0.28914642333984375, 0.311859130859375, 0.33457183837890625, 0.3572845458984375, 0.37999725341796875, 0.4027099609375, 0.42542266845703125, 0.4481353759765625, 0.47084808349609375, 0.493560791015625, 0.5162734985351562, 0.5389862060546875, 0.5616989135742188, 0.58441162109375, 0.6071243286132812, 0.6298370361328125, 0.6525497436523438, 0.675262451171875, 0.6979751586914062, 0.7206878662109375, 0.7434005737304688, 0.76611328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 12.0, 23.0, 71.0, 139.0, 251.0, 239.0, 156.0, 53.0, 26.0, 11.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.802682876586914, -24.9943904876709, -24.186098098754883, -23.377805709838867, -22.569515228271484, -21.76122283935547, -20.952930450439453, -20.144638061523438, -19.336345672607422, -18.528053283691406, -17.71976089477539, -16.911468505859375, -16.10317611694336, -15.29488468170166, -14.486593246459961, -13.678300857543945, -12.87000846862793, -12.061716079711914, -11.253423690795898, -10.4451322555542, -9.636839866638184, -8.828547477722168, -8.020256042480469, -7.211963653564453, -6.4036712646484375, -5.595378875732422, -4.7870869636535645, -3.978794813156128, -3.1705026626586914, -2.362210273742676, -1.5539183616638184, -0.7456264495849609, 0.06266403198242188, 0.8709561824798584, 1.679248332977295, 2.4875404834747314, 3.295832633972168, 4.104125022888184, 4.912416934967041, 5.720708847045898, 6.529001235961914, 7.33729362487793, 8.145586013793945, 8.953877449035645, 9.76216983795166, 10.570462226867676, 11.378753662109375, 12.18704605102539, 12.995338439941406, 13.803630828857422, 14.611923217773438, 15.420214653015137, 16.22850799560547, 17.036800384521484, 17.845090866088867, 18.653383255004883, 19.4616756439209, 20.269968032836914, 21.07826042175293, 21.886552810668945, 22.694843292236328, 23.503135681152344, 24.31142807006836, 25.119720458984375, 25.92801284790039]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 9.0, 12.0, 7.0, 12.0, 12.0, 15.0, 19.0, 18.0, 29.0, 39.0, 27.0, 43.0, 34.0, 52.0, 56.0, 54.0, 49.0, 62.0, 44.0, 49.0, 46.0, 26.0, 29.0, 35.0, 39.0, 30.0, 23.0, 22.0, 19.0, 16.0, 10.0, 17.0, 5.0, 8.0, 3.0, 7.0, 4.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.991949081420898, -12.59127140045166, -12.190594673156738, -11.7899169921875, -11.389240264892578, -10.98856258392334, -10.587885856628418, -10.18720817565918, -9.786531448364258, -9.38585376739502, -8.985177040100098, -8.58449935913086, -8.183822631835938, -7.783144950866699, -7.382468223571777, -6.981790542602539, -6.581113338470459, -6.180436134338379, -5.779758930206299, -5.379081726074219, -4.978404521942139, -4.577727317810059, -4.17704963684082, -3.7763726711273193, -3.3756954669952393, -2.975018262863159, -2.574341058731079, -2.17366361618042, -1.7729865312576294, -1.3723092079162598, -0.9716320037841797, -0.5709547996520996, -0.17027759552001953, 0.23039963841438293, 0.6310768723487854, 1.0317541360855103, 1.4324313402175903, 1.83310866355896, 2.23378586769104, 2.63446307182312, 3.0351402759552, 3.4358174800872803, 3.8364946842193604, 4.2371721267700195, 4.6378493309021, 5.03852653503418, 5.43920373916626, 5.83988094329834, 6.24055814743042, 6.6412353515625, 7.04191255569458, 7.44258975982666, 7.84326696395874, 8.24394416809082, 8.644621849060059, 9.04529857635498, 9.445976257324219, 9.846653938293457, 10.247330665588379, 10.648008346557617, 11.048685073852539, 11.449362754821777, 11.8500394821167, 12.250717163085938, 12.65139389038086]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 6.0, 6.0, 9.0, 18.0, 18.0, 20.0, 30.0, 55.0, 89.0, 149.0, 272.0, 772.0, 2601.0, 12945.0, 176297.0, 3749503.0, 232105.0, 14762.0, 2873.0, 922.0, 344.0, 162.0, 100.0, 69.0, 50.0, 26.0, 12.0, 12.0, 12.0, 8.0, 11.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.244140625, -2.184356689453125, -2.12457275390625, -2.064788818359375, -2.0050048828125, -1.945220947265625, -1.88543701171875, -1.825653076171875, -1.765869140625, -1.706085205078125, -1.64630126953125, -1.586517333984375, -1.5267333984375, -1.466949462890625, -1.40716552734375, -1.347381591796875, -1.28759765625, -1.227813720703125, -1.16802978515625, -1.108245849609375, -1.0484619140625, -0.988677978515625, -0.92889404296875, -0.869110107421875, -0.809326171875, -0.749542236328125, -0.68975830078125, -0.629974365234375, -0.5701904296875, -0.510406494140625, -0.45062255859375, -0.390838623046875, -0.3310546875, -0.271270751953125, -0.21148681640625, -0.151702880859375, -0.0919189453125, -0.032135009765625, 0.02764892578125, 0.087432861328125, 0.147216796875, 0.207000732421875, 0.26678466796875, 0.326568603515625, 0.3863525390625, 0.446136474609375, 0.50592041015625, 0.565704345703125, 0.62548828125, 0.685272216796875, 0.74505615234375, 0.804840087890625, 0.8646240234375, 0.924407958984375, 0.98419189453125, 1.043975830078125, 1.103759765625, 1.163543701171875, 1.22332763671875, 1.283111572265625, 1.3428955078125, 1.402679443359375, 1.46246337890625, 1.522247314453125, 1.58203125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 0.0, 4.0, 5.0, 11.0, 17.0, 7.0, 14.0, 28.0, 30.0, 35.0, 40.0, 47.0, 59.0, 44.0, 69.0, 60.0, 83.0, 64.0, 66.0, 63.0, 54.0, 41.0, 30.0, 35.0, 26.0, 23.0, 11.0, 8.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5533599853515625, -0.528594970703125, -0.5038299560546875, -0.47906494140625, -0.4542999267578125, -0.429534912109375, -0.4047698974609375, -0.3800048828125, -0.3552398681640625, -0.330474853515625, -0.3057098388671875, -0.28094482421875, -0.2561798095703125, -0.231414794921875, -0.2066497802734375, -0.181884765625, -0.1571197509765625, -0.132354736328125, -0.1075897216796875, -0.08282470703125, -0.0580596923828125, -0.033294677734375, -0.0085296630859375, 0.0162353515625, 0.0410003662109375, 0.065765380859375, 0.0905303955078125, 0.11529541015625, 0.1400604248046875, 0.164825439453125, 0.1895904541015625, 0.21435546875, 0.2391204833984375, 0.263885498046875, 0.2886505126953125, 0.31341552734375, 0.3381805419921875, 0.362945556640625, 0.3877105712890625, 0.4124755859375, 0.4372406005859375, 0.462005615234375, 0.4867706298828125, 0.51153564453125, 0.5363006591796875, 0.561065673828125, 0.5858306884765625, 0.610595703125, 0.6353607177734375, 0.660125732421875, 0.6848907470703125, 0.70965576171875, 0.7344207763671875, 0.759185791015625, 0.7839508056640625, 0.8087158203125, 0.8334808349609375, 0.858245849609375, 0.8830108642578125, 0.90777587890625, 0.9325408935546875, 0.957305908203125, 0.9820709228515625, 1.0068359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 6.0, 10.0, 8.0, 15.0, 26.0, 51.0, 105.0, 188.0, 595.0, 2249.0, 10996.0, 109187.0, 3522560.0, 517742.0, 24528.0, 4222.0, 1082.0, 365.0, 141.0, 60.0, 46.0, 35.0, 13.0, 9.0, 4.0, 8.0, 6.0, 4.0, 1.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6103515625, -1.55615234375, -1.501953125, -1.44775390625, -1.3935546875, -1.33935546875, -1.28515625, -1.23095703125, -1.1767578125, -1.12255859375, -1.068359375, -1.01416015625, -0.9599609375, -0.90576171875, -0.8515625, -0.79736328125, -0.7431640625, -0.68896484375, -0.634765625, -0.58056640625, -0.5263671875, -0.47216796875, -0.41796875, -0.36376953125, -0.3095703125, -0.25537109375, -0.201171875, -0.14697265625, -0.0927734375, -0.03857421875, 0.015625, 0.06982421875, 0.1240234375, 0.17822265625, 0.232421875, 0.28662109375, 0.3408203125, 0.39501953125, 0.44921875, 0.50341796875, 0.5576171875, 0.61181640625, 0.666015625, 0.72021484375, 0.7744140625, 0.82861328125, 0.8828125, 0.93701171875, 0.9912109375, 1.04541015625, 1.099609375, 1.15380859375, 1.2080078125, 1.26220703125, 1.31640625, 1.37060546875, 1.4248046875, 1.47900390625, 1.533203125, 1.58740234375, 1.6416015625, 1.69580078125, 1.75, 1.80419921875, 1.8583984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 10.0, 9.0, 10.0, 10.0, 23.0, 31.0, 36.0, 68.0, 104.0, 147.0, 264.0, 487.0, 693.0, 753.0, 543.0, 342.0, 208.0, 114.0, 84.0, 49.0, 24.0, 19.0, 13.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.212890625, -1.17413330078125, -1.1353759765625, -1.09661865234375, -1.057861328125, -1.01910400390625, -0.9803466796875, -0.94158935546875, -0.90283203125, -0.86407470703125, -0.8253173828125, -0.78656005859375, -0.747802734375, -0.70904541015625, -0.6702880859375, -0.63153076171875, -0.5927734375, -0.55401611328125, -0.5152587890625, -0.47650146484375, -0.437744140625, -0.39898681640625, -0.3602294921875, -0.32147216796875, -0.28271484375, -0.24395751953125, -0.2052001953125, -0.16644287109375, -0.127685546875, -0.08892822265625, -0.0501708984375, -0.01141357421875, 0.02734375, 0.06610107421875, 0.1048583984375, 0.14361572265625, 0.182373046875, 0.22113037109375, 0.2598876953125, 0.29864501953125, 0.33740234375, 0.37615966796875, 0.4149169921875, 0.45367431640625, 0.492431640625, 0.53118896484375, 0.5699462890625, 0.60870361328125, 0.6474609375, 0.68621826171875, 0.7249755859375, 0.76373291015625, 0.802490234375, 0.84124755859375, 0.8800048828125, 0.91876220703125, 0.95751953125, 0.99627685546875, 1.0350341796875, 1.07379150390625, 1.112548828125, 1.15130615234375, 1.1900634765625, 1.22882080078125, 1.267578125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 6.0, 3.0, 14.0, 13.0, 28.0, 39.0, 76.0, 123.0, 155.0, 155.0, 146.0, 88.0, 75.0, 36.0, 13.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.030561447143555, -7.705508708953857, -7.380456447601318, -7.055403709411621, -6.730350971221924, -6.405298233032227, -6.0802459716796875, -5.75519323348999, -5.430140495300293, -5.105087757110596, -4.780035495758057, -4.454982757568359, -4.129930019378662, -3.804877519607544, -3.479825019836426, -3.1547722816467285, -2.8297200202941895, -2.5046675205230713, -2.179614782333374, -1.8545622825622559, -1.5295096635818481, -1.2044570446014404, -0.8794045448303223, -0.554351806640625, -0.22929930686950684, 0.09575328230857849, 0.4208058714866638, 0.7458584308624268, 1.0709110498428345, 1.3959636688232422, 1.7210161685943604, 2.0460689067840576, 2.371121406555176, 2.696173906326294, 3.021226644515991, 3.3462791442871094, 3.6713318824768066, 3.996384382247925, 4.321436882019043, 4.64648962020874, 4.9715423583984375, 5.296595096588135, 5.621647357940674, 5.946700096130371, 6.271752834320068, 6.596805572509766, 6.921857833862305, 7.246910572052002, 7.571962833404541, 7.897015571594238, 8.222067832946777, 8.547121047973633, 8.872173309326172, 9.197225570678711, 9.52227783203125, 9.847331047058105, 10.172383308410645, 10.497435569763184, 10.822488784790039, 11.147541046142578, 11.472593307495117, 11.797646522521973, 12.122698783874512, 12.447751998901367, 12.772804260253906]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 7.0, 7.0, 10.0, 10.0, 14.0, 24.0, 30.0, 29.0, 36.0, 39.0, 34.0, 39.0, 47.0, 39.0, 48.0, 34.0, 57.0, 49.0, 42.0, 48.0, 44.0, 47.0, 38.0, 35.0, 32.0, 28.0, 31.0, 19.0, 17.0, 9.0, 8.0, 16.0, 6.0, 12.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.963579177856445, -5.777353286743164, -5.591127395629883, -5.40490198135376, -5.2186760902404785, -5.032450199127197, -4.846224784851074, -4.659998893737793, -4.473773002624512, -4.2875471115112305, -4.101321220397949, -3.915095806121826, -3.728869915008545, -3.5426440238952637, -3.3564183712005615, -3.1701927185058594, -2.983966827392578, -2.797740936279297, -2.6115152835845947, -2.4252896308898926, -2.2390637397766113, -2.05283784866333, -1.866612195968628, -1.6803864240646362, -1.4941606521606445, -1.3079348802566528, -1.1217091083526611, -0.9354833364486694, -0.7492575645446777, -0.563031792640686, -0.37680602073669434, -0.19058024883270264, -0.0043544769287109375, 0.18187129497528076, 0.36809706687927246, 0.5543228387832642, 0.7405486106872559, 0.9267743825912476, 1.1130001544952393, 1.299225926399231, 1.4854516983032227, 1.6716774702072144, 1.857903242111206, 2.044128894805908, 2.2303547859191895, 2.4165806770324707, 2.602806329727173, 2.789031982421875, 2.9752578735351562, 3.1614837646484375, 3.3477094173431396, 3.533935070037842, 3.720160961151123, 3.9063868522644043, 4.092612266540527, 4.278838157653809, 4.46506404876709, 4.651289939880371, 4.837515830993652, 5.023741245269775, 5.209967136383057, 5.396193027496338, 5.582418441772461, 5.768644332885742, 5.954870223999023]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 12.0, 13.0, 25.0, 40.0, 57.0, 89.0, 171.0, 251.0, 379.0, 689.0, 1296.0, 2466.0, 5339.0, 11991.0, 30341.0, 87042.0, 289242.0, 407079.0, 136791.0, 44197.0, 16870.0, 6960.0, 3301.0, 1642.0, 906.0, 544.0, 281.0, 178.0, 120.0, 63.0, 55.0, 30.0, 29.0, 18.0, 13.0, 8.0, 7.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1025390625, -1.0693206787109375, -1.036102294921875, -1.0028839111328125, -0.96966552734375, -0.9364471435546875, -0.903228759765625, -0.8700103759765625, -0.8367919921875, -0.8035736083984375, -0.770355224609375, -0.7371368408203125, -0.70391845703125, -0.6707000732421875, -0.637481689453125, -0.6042633056640625, -0.571044921875, -0.5378265380859375, -0.504608154296875, -0.4713897705078125, -0.43817138671875, -0.4049530029296875, -0.371734619140625, -0.3385162353515625, -0.3052978515625, -0.2720794677734375, -0.238861083984375, -0.2056427001953125, -0.17242431640625, -0.1392059326171875, -0.105987548828125, -0.0727691650390625, -0.03955078125, -0.0063323974609375, 0.026885986328125, 0.0601043701171875, 0.09332275390625, 0.1265411376953125, 0.159759521484375, 0.1929779052734375, 0.2261962890625, 0.2594146728515625, 0.292633056640625, 0.3258514404296875, 0.35906982421875, 0.3922882080078125, 0.425506591796875, 0.4587249755859375, 0.491943359375, 0.5251617431640625, 0.558380126953125, 0.5915985107421875, 0.62481689453125, 0.6580352783203125, 0.691253662109375, 0.7244720458984375, 0.7576904296875, 0.7909088134765625, 0.824127197265625, 0.8573455810546875, 0.89056396484375, 0.9237823486328125, 0.957000732421875, 0.9902191162109375, 1.0234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 11.0, 17.0, 18.0, 25.0, 20.0, 27.0, 37.0, 49.0, 55.0, 49.0, 71.0, 58.0, 61.0, 72.0, 60.0, 55.0, 47.0, 66.0, 35.0, 36.0, 29.0, 18.0, 18.0, 7.0, 10.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5498046875, -0.5266265869140625, -0.503448486328125, -0.4802703857421875, -0.45709228515625, -0.4339141845703125, -0.410736083984375, -0.3875579833984375, -0.3643798828125, -0.3412017822265625, -0.318023681640625, -0.2948455810546875, -0.27166748046875, -0.2484893798828125, -0.225311279296875, -0.2021331787109375, -0.178955078125, -0.1557769775390625, -0.132598876953125, -0.1094207763671875, -0.08624267578125, -0.0630645751953125, -0.039886474609375, -0.0167083740234375, 0.0064697265625, 0.0296478271484375, 0.052825927734375, 0.0760040283203125, 0.09918212890625, 0.1223602294921875, 0.145538330078125, 0.1687164306640625, 0.19189453125, 0.2150726318359375, 0.238250732421875, 0.2614288330078125, 0.28460693359375, 0.3077850341796875, 0.330963134765625, 0.3541412353515625, 0.3773193359375, 0.4004974365234375, 0.423675537109375, 0.4468536376953125, 0.47003173828125, 0.4932098388671875, 0.516387939453125, 0.5395660400390625, 0.562744140625, 0.5859222412109375, 0.609100341796875, 0.6322784423828125, 0.65545654296875, 0.6786346435546875, 0.701812744140625, 0.7249908447265625, 0.7481689453125, 0.7713470458984375, 0.794525146484375, 0.8177032470703125, 0.84088134765625, 0.8640594482421875, 0.887237548828125, 0.9104156494140625, 0.93359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 9.0, 14.0, 23.0, 17.0, 30.0, 64.0, 107.0, 173.0, 333.0, 654.0, 1708.0, 8173.0, 198077.0, 815841.0, 18721.0, 2752.0, 933.0, 404.0, 215.0, 102.0, 69.0, 35.0, 27.0, 16.0, 15.0, 10.0, 8.0, 4.0, 7.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.39453125, -3.2781982421875, -3.161865234375, -3.0455322265625, -2.92919921875, -2.8128662109375, -2.696533203125, -2.5802001953125, -2.4638671875, -2.3475341796875, -2.231201171875, -2.1148681640625, -1.99853515625, -1.8822021484375, -1.765869140625, -1.6495361328125, -1.533203125, -1.4168701171875, -1.300537109375, -1.1842041015625, -1.06787109375, -0.9515380859375, -0.835205078125, -0.7188720703125, -0.6025390625, -0.4862060546875, -0.369873046875, -0.2535400390625, -0.13720703125, -0.0208740234375, 0.095458984375, 0.2117919921875, 0.328125, 0.4444580078125, 0.560791015625, 0.6771240234375, 0.79345703125, 0.9097900390625, 1.026123046875, 1.1424560546875, 1.2587890625, 1.3751220703125, 1.491455078125, 1.6077880859375, 1.72412109375, 1.8404541015625, 1.956787109375, 2.0731201171875, 2.189453125, 2.3057861328125, 2.422119140625, 2.5384521484375, 2.65478515625, 2.7711181640625, 2.887451171875, 3.0037841796875, 3.1201171875, 3.2364501953125, 3.352783203125, 3.4691162109375, 3.58544921875, 3.7017822265625, 3.818115234375, 3.9344482421875, 4.05078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 4.0, 13.0, 18.0, 33.0, 28.0, 36.0, 51.0, 62.0, 78.0, 75.0, 93.0, 82.0, 78.0, 65.0, 72.0, 58.0, 43.0, 20.0, 15.0, 16.0, 13.0, 4.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.85546875, -3.724365234375, -3.59326171875, -3.462158203125, -3.3310546875, -3.199951171875, -3.06884765625, -2.937744140625, -2.806640625, -2.675537109375, -2.54443359375, -2.413330078125, -2.2822265625, -2.151123046875, -2.02001953125, -1.888916015625, -1.7578125, -1.626708984375, -1.49560546875, -1.364501953125, -1.2333984375, -1.102294921875, -0.97119140625, -0.840087890625, -0.708984375, -0.577880859375, -0.44677734375, -0.315673828125, -0.1845703125, -0.053466796875, 0.07763671875, 0.208740234375, 0.33984375, 0.470947265625, 0.60205078125, 0.733154296875, 0.8642578125, 0.995361328125, 1.12646484375, 1.257568359375, 1.388671875, 1.519775390625, 1.65087890625, 1.781982421875, 1.9130859375, 2.044189453125, 2.17529296875, 2.306396484375, 2.4375, 2.568603515625, 2.69970703125, 2.830810546875, 2.9619140625, 3.093017578125, 3.22412109375, 3.355224609375, 3.486328125, 3.617431640625, 3.74853515625, 3.879638671875, 4.0107421875, 4.141845703125, 4.27294921875, 4.404052734375, 4.53515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 9.0, 7.0, 9.0, 11.0, 24.0, 22.0, 39.0, 39.0, 68.0, 114.0, 150.0, 350.0, 668.0, 1780.0, 8121.0, 73619.0, 855501.0, 94820.0, 9519.0, 2030.0, 708.0, 348.0, 186.0, 137.0, 72.0, 52.0, 34.0, 22.0, 22.0, 17.0, 6.0, 5.0, 9.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.265625, -1.2289886474609375, -1.192352294921875, -1.1557159423828125, -1.11907958984375, -1.0824432373046875, -1.045806884765625, -1.0091705322265625, -0.9725341796875, -0.9358978271484375, -0.899261474609375, -0.8626251220703125, -0.82598876953125, -0.7893524169921875, -0.752716064453125, -0.7160797119140625, -0.679443359375, -0.6428070068359375, -0.606170654296875, -0.5695343017578125, -0.53289794921875, -0.4962615966796875, -0.459625244140625, -0.4229888916015625, -0.3863525390625, -0.3497161865234375, -0.313079833984375, -0.2764434814453125, -0.23980712890625, -0.2031707763671875, -0.166534423828125, -0.1298980712890625, -0.09326171875, -0.0566253662109375, -0.019989013671875, 0.0166473388671875, 0.05328369140625, 0.0899200439453125, 0.126556396484375, 0.1631927490234375, 0.1998291015625, 0.2364654541015625, 0.273101806640625, 0.3097381591796875, 0.34637451171875, 0.3830108642578125, 0.419647216796875, 0.4562835693359375, 0.492919921875, 0.5295562744140625, 0.566192626953125, 0.6028289794921875, 0.63946533203125, 0.6761016845703125, 0.712738037109375, 0.7493743896484375, 0.7860107421875, 0.8226470947265625, 0.859283447265625, 0.8959197998046875, 0.93255615234375, 0.9691925048828125, 1.005828857421875, 1.0424652099609375, 1.0791015625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 2.0, 8.0, 8.0, 12.0, 15.0, 16.0, 20.0, 16.0, 23.0, 41.0, 43.0, 78.0, 102.0, 149.0, 107.0, 92.0, 48.0, 40.0, 27.0, 22.0, 18.0, 19.0, 21.0, 13.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014138221740722656, -0.00013662129640579224, -0.0001318603754043579, -0.00012709945440292358, -0.00012233853340148926, -0.00011757761240005493, -0.0001128166913986206, -0.00010805577039718628, -0.00010329484939575195, -9.853392839431763e-05, -9.37730073928833e-05, -8.901208639144897e-05, -8.425116539001465e-05, -7.949024438858032e-05, -7.4729323387146e-05, -6.996840238571167e-05, -6.520748138427734e-05, -6.044656038284302e-05, -5.568563938140869e-05, -5.0924718379974365e-05, -4.616379737854004e-05, -4.140287637710571e-05, -3.664195537567139e-05, -3.188103437423706e-05, -2.7120113372802734e-05, -2.2359192371368408e-05, -1.7598271369934082e-05, -1.2837350368499756e-05, -8.07642936706543e-06, -3.3155083656311035e-06, 1.4454126358032227e-06, 6.206333637237549e-06, 1.0967254638671875e-05, 1.57281756401062e-05, 2.0489096641540527e-05, 2.5250017642974854e-05, 3.001093864440918e-05, 3.4771859645843506e-05, 3.953278064727783e-05, 4.429370164871216e-05, 4.9054622650146484e-05, 5.381554365158081e-05, 5.857646465301514e-05, 6.333738565444946e-05, 6.809830665588379e-05, 7.285922765731812e-05, 7.762014865875244e-05, 8.238106966018677e-05, 8.71419906616211e-05, 9.190291166305542e-05, 9.666383266448975e-05, 0.00010142475366592407, 0.0001061856746673584, 0.00011094659566879272, 0.00011570751667022705, 0.00012046843767166138, 0.0001252293586730957, 0.00012999027967453003, 0.00013475120067596436, 0.00013951212167739868, 0.000144273042678833, 0.00014903396368026733, 0.00015379488468170166, 0.00015855580568313599, 0.0001633167266845703]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 6.0, 11.0, 17.0, 22.0, 45.0, 55.0, 76.0, 138.0, 196.0, 376.0, 683.0, 1432.0, 4080.0, 17572.0, 160266.0, 789975.0, 59295.0, 9289.0, 2714.0, 1016.0, 525.0, 278.0, 141.0, 105.0, 68.0, 45.0, 26.0, 23.0, 17.0, 10.0, 9.0, 6.0, 9.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99658203125, -0.9625778198242188, -0.9285736083984375, -0.8945693969726562, -0.860565185546875, -0.8265609741210938, -0.7925567626953125, -0.7585525512695312, -0.72454833984375, -0.6905441284179688, -0.6565399169921875, -0.6225357055664062, -0.588531494140625, -0.5545272827148438, -0.5205230712890625, -0.48651885986328125, -0.4525146484375, -0.41851043701171875, -0.3845062255859375, -0.35050201416015625, -0.316497802734375, -0.28249359130859375, -0.2484893798828125, -0.21448516845703125, -0.18048095703125, -0.14647674560546875, -0.1124725341796875, -0.07846832275390625, -0.044464111328125, -0.01045989990234375, 0.0235443115234375, 0.05754852294921875, 0.091552734375, 0.12555694580078125, 0.1595611572265625, 0.19356536865234375, 0.227569580078125, 0.26157379150390625, 0.2955780029296875, 0.32958221435546875, 0.36358642578125, 0.39759063720703125, 0.4315948486328125, 0.46559906005859375, 0.499603271484375, 0.5336074829101562, 0.5676116943359375, 0.6016159057617188, 0.6356201171875, 0.6696243286132812, 0.7036285400390625, 0.7376327514648438, 0.771636962890625, 0.8056411743164062, 0.8396453857421875, 0.8736495971679688, 0.90765380859375, 0.9416580200195312, 0.9756622314453125, 1.0096664428710938, 1.043670654296875, 1.0776748657226562, 1.1116790771484375, 1.1456832885742188, 1.1796875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 9.0, 12.0, 15.0, 15.0, 28.0, 27.0, 40.0, 58.0, 72.0, 84.0, 83.0, 93.0, 106.0, 95.0, 61.0, 44.0, 27.0, 22.0, 20.0, 14.0, 14.0, 12.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.91748046875, -0.8915252685546875, -0.865570068359375, -0.8396148681640625, -0.81365966796875, -0.7877044677734375, -0.761749267578125, -0.7357940673828125, -0.7098388671875, -0.6838836669921875, -0.657928466796875, -0.6319732666015625, -0.60601806640625, -0.5800628662109375, -0.554107666015625, -0.5281524658203125, -0.502197265625, -0.4762420654296875, -0.450286865234375, -0.4243316650390625, -0.39837646484375, -0.3724212646484375, -0.346466064453125, -0.3205108642578125, -0.2945556640625, -0.2686004638671875, -0.242645263671875, -0.2166900634765625, -0.19073486328125, -0.1647796630859375, -0.138824462890625, -0.1128692626953125, -0.0869140625, -0.0609588623046875, -0.035003662109375, -0.0090484619140625, 0.01690673828125, 0.0428619384765625, 0.068817138671875, 0.0947723388671875, 0.1207275390625, 0.1466827392578125, 0.172637939453125, 0.1985931396484375, 0.22454833984375, 0.2505035400390625, 0.276458740234375, 0.3024139404296875, 0.328369140625, 0.3543243408203125, 0.380279541015625, 0.4062347412109375, 0.43218994140625, 0.4581451416015625, 0.484100341796875, 0.5100555419921875, 0.5360107421875, 0.5619659423828125, 0.587921142578125, 0.6138763427734375, 0.63983154296875, 0.6657867431640625, 0.691741943359375, 0.7176971435546875, 0.74365234375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 7.0, 38.0, 181.0, 376.0, 276.0, 86.0, 15.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.243545532226562, -11.285758972167969, -10.327972412109375, -9.370185852050781, -8.412399291992188, -7.454613208770752, -6.496826648712158, -5.5390400886535645, -4.581253528594971, -3.623466968536377, -2.665680408477783, -1.7078940868377686, -0.7501075267791748, 0.20767879486083984, 1.1654653549194336, 2.1232519149780273, 3.081038475036621, 4.038825035095215, 4.996611595153809, 5.954398155212402, 6.912184715270996, 7.869970798492432, 8.827756881713867, 9.785543441772461, 10.743330001831055, 11.701116561889648, 12.658903121948242, 13.616689682006836, 14.57447624206543, 15.532262802124023, 16.490049362182617, 17.44783592224121, 18.405622482299805, 19.3634090423584, 20.321195602416992, 21.278982162475586, 22.23676872253418, 23.194555282592773, 24.152341842651367, 25.11012840270996, 26.067914962768555, 27.02570152282715, 27.983488082885742, 28.941274642944336, 29.89906120300293, 30.856847763061523, 31.814634323120117, 32.77241897583008, 33.73020553588867, 34.687992095947266, 35.64577865600586, 36.60356521606445, 37.56135177612305, 38.51913833618164, 39.476924896240234, 40.43471145629883, 41.39249801635742, 42.350284576416016, 43.30807113647461, 44.2658576965332, 45.2236442565918, 46.18143081665039, 47.139217376708984, 48.09700393676758, 49.05479049682617]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 10.0, 7.0, 11.0, 12.0, 21.0, 19.0, 26.0, 35.0, 41.0, 42.0, 55.0, 55.0, 69.0, 67.0, 67.0, 64.0, 58.0, 52.0, 50.0, 50.0, 38.0, 30.0, 33.0, 23.0, 11.0, 18.0, 9.0, 5.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.416694641113281, -9.057862281799316, -8.699029922485352, -8.340197563171387, -7.981365203857422, -7.622532844543457, -7.26370096206665, -6.9048686027526855, -6.546036243438721, -6.187203884124756, -5.828371524810791, -5.469539642333984, -5.1107072830200195, -4.751874923706055, -4.39304256439209, -4.034210205078125, -3.67537784576416, -3.3165454864501953, -2.9577131271362305, -2.5988810062408447, -2.24004864692688, -1.881216287612915, -1.5223841667175293, -1.1635518074035645, -0.8047194480895996, -0.44588714838027954, -0.08705484867095947, 0.2717773914337158, 0.6306097507476807, 0.9894421100616455, 1.3482742309570312, 1.707106590270996, 2.0659379959106445, 2.4247703552246094, 2.783602714538574, 3.14243483543396, 3.501267194747925, 3.8600995540618896, 4.218931674957275, 4.57776403427124, 4.936596393585205, 5.29542875289917, 5.654261112213135, 6.013092994689941, 6.371925354003906, 6.730757713317871, 7.089590072631836, 7.448422431945801, 7.807254791259766, 8.16608715057373, 8.524919509887695, 8.88375186920166, 9.242584228515625, 9.60141658782959, 9.960248947143555, 10.319080352783203, 10.677913665771484, 11.03674602508545, 11.395578384399414, 11.754410743713379, 12.113243103027344, 12.472075462341309, 12.830907821655273, 13.189739227294922, 13.548571586608887]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 16.0, 25.0, 48.0, 88.0, 197.0, 553.0, 763926.0, 3428339.0, 660.0, 192.0, 97.0, 60.0, 28.0, 14.0, 8.0, 3.0, 2.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0390625, -7.76220703125, -7.4853515625, -7.20849609375, -6.931640625, -6.65478515625, -6.3779296875, -6.10107421875, -5.82421875, -5.54736328125, -5.2705078125, -4.99365234375, -4.716796875, -4.43994140625, -4.1630859375, -3.88623046875, -3.609375, -3.33251953125, -3.0556640625, -2.77880859375, -2.501953125, -2.22509765625, -1.9482421875, -1.67138671875, -1.39453125, -1.11767578125, -0.8408203125, -0.56396484375, -0.287109375, -0.01025390625, 0.2666015625, 0.54345703125, 0.8203125, 1.09716796875, 1.3740234375, 1.65087890625, 1.927734375, 2.20458984375, 2.4814453125, 2.75830078125, 3.03515625, 3.31201171875, 3.5888671875, 3.86572265625, 4.142578125, 4.41943359375, 4.6962890625, 4.97314453125, 5.25, 5.52685546875, 5.8037109375, 6.08056640625, 6.357421875, 6.63427734375, 6.9111328125, 7.18798828125, 7.46484375, 7.74169921875, 8.0185546875, 8.29541015625, 8.572265625, 8.84912109375, 9.1259765625, 9.40283203125, 9.6796875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 11.0, 6.0, 16.0, 22.0, 28.0, 18.0, 29.0, 40.0, 55.0, 50.0, 49.0, 53.0, 71.0, 69.0, 69.0, 62.0, 71.0, 51.0, 43.0, 51.0, 33.0, 30.0, 18.0, 15.0, 9.0, 7.0, 4.0, 2.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5966796875, -0.5734176635742188, -0.5501556396484375, -0.5268936157226562, -0.503631591796875, -0.48036956787109375, -0.4571075439453125, -0.43384552001953125, -0.41058349609375, -0.38732147216796875, -0.3640594482421875, -0.34079742431640625, -0.317535400390625, -0.29427337646484375, -0.2710113525390625, -0.24774932861328125, -0.2244873046875, -0.20122528076171875, -0.1779632568359375, -0.15470123291015625, -0.131439208984375, -0.10817718505859375, -0.0849151611328125, -0.06165313720703125, -0.03839111328125, -0.01512908935546875, 0.0081329345703125, 0.03139495849609375, 0.054656982421875, 0.07791900634765625, 0.1011810302734375, 0.12444305419921875, 0.147705078125, 0.17096710205078125, 0.1942291259765625, 0.21749114990234375, 0.240753173828125, 0.26401519775390625, 0.2872772216796875, 0.31053924560546875, 0.33380126953125, 0.35706329345703125, 0.3803253173828125, 0.40358734130859375, 0.426849365234375, 0.45011138916015625, 0.4733734130859375, 0.49663543701171875, 0.5198974609375, 0.5431594848632812, 0.5664215087890625, 0.5896835327148438, 0.612945556640625, 0.6362075805664062, 0.6594696044921875, 0.6827316284179688, 0.70599365234375, 0.7292556762695312, 0.7525177001953125, 0.7757797241210938, 0.799041748046875, 0.8223037719726562, 0.8455657958984375, 0.8688278198242188, 0.89208984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 12.0, 8.0, 15.0, 32.0, 47.0, 117.0, 233.0, 552.0, 1401.0, 3878.0, 12210.0, 53508.0, 572896.0, 3115306.0, 376405.0, 42091.0, 10087.0, 3252.0, 1315.0, 500.0, 205.0, 106.0, 41.0, 21.0, 13.0, 9.0, 9.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83251953125, -0.8021621704101562, -0.7718048095703125, -0.7414474487304688, -0.711090087890625, -0.6807327270507812, -0.6503753662109375, -0.6200180053710938, -0.58966064453125, -0.5593032836914062, -0.5289459228515625, -0.49858856201171875, -0.468231201171875, -0.43787384033203125, -0.4075164794921875, -0.37715911865234375, -0.3468017578125, -0.31644439697265625, -0.2860870361328125, -0.25572967529296875, -0.225372314453125, -0.19501495361328125, -0.1646575927734375, -0.13430023193359375, -0.10394287109375, -0.07358551025390625, -0.0432281494140625, -0.01287078857421875, 0.017486572265625, 0.04784393310546875, 0.0782012939453125, 0.10855865478515625, 0.138916015625, 0.16927337646484375, 0.1996307373046875, 0.22998809814453125, 0.260345458984375, 0.29070281982421875, 0.3210601806640625, 0.35141754150390625, 0.38177490234375, 0.41213226318359375, 0.4424896240234375, 0.47284698486328125, 0.503204345703125, 0.5335617065429688, 0.5639190673828125, 0.5942764282226562, 0.6246337890625, 0.6549911499023438, 0.6853485107421875, 0.7157058715820312, 0.746063232421875, 0.7764205932617188, 0.8067779541015625, 0.8371353149414062, 0.86749267578125, 0.8978500366210938, 0.9282073974609375, 0.9585647583007812, 0.988922119140625, 1.0192794799804688, 1.0496368408203125, 1.0799942016601562, 1.1103515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 10.0, 11.0, 16.0, 17.0, 27.0, 36.0, 40.0, 105.0, 144.0, 222.0, 342.0, 543.0, 640.0, 596.0, 439.0, 278.0, 191.0, 138.0, 70.0, 48.0, 36.0, 29.0, 21.0, 10.0, 12.0, 7.0, 5.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8671875, -0.8389663696289062, -0.8107452392578125, -0.7825241088867188, -0.754302978515625, -0.7260818481445312, -0.6978607177734375, -0.6696395874023438, -0.64141845703125, -0.6131973266601562, -0.5849761962890625, -0.5567550659179688, -0.528533935546875, -0.5003128051757812, -0.4720916748046875, -0.44387054443359375, -0.4156494140625, -0.38742828369140625, -0.3592071533203125, -0.33098602294921875, -0.302764892578125, -0.27454376220703125, -0.2463226318359375, -0.21810150146484375, -0.18988037109375, -0.16165924072265625, -0.1334381103515625, -0.10521697998046875, -0.076995849609375, -0.04877471923828125, -0.0205535888671875, 0.00766754150390625, 0.035888671875, 0.06410980224609375, 0.0923309326171875, 0.12055206298828125, 0.148773193359375, 0.17699432373046875, 0.2052154541015625, 0.23343658447265625, 0.26165771484375, 0.28987884521484375, 0.3180999755859375, 0.34632110595703125, 0.374542236328125, 0.40276336669921875, 0.4309844970703125, 0.45920562744140625, 0.4874267578125, 0.5156478881835938, 0.5438690185546875, 0.5720901489257812, 0.600311279296875, 0.6285324096679688, 0.6567535400390625, 0.6849746704101562, 0.71319580078125, 0.7414169311523438, 0.7696380615234375, 0.7978591918945312, 0.826080322265625, 0.8543014526367188, 0.8825225830078125, 0.9107437133789062, 0.93896484375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 11.0, 13.0, 19.0, 78.0, 135.0, 212.0, 216.0, 154.0, 82.0, 36.0, 13.0, 10.0, 5.0, 5.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.778206825256348, -8.465622901916504, -8.153038024902344, -7.8404541015625, -7.527870178222656, -7.215285778045654, -6.902701377868652, -6.590117454528809, -6.277533054351807, -5.964948654174805, -5.652364730834961, -5.339780330657959, -5.027195930480957, -4.714612007141113, -4.402027606964111, -4.089443206787109, -3.7768592834472656, -3.4642751216888428, -3.15169095993042, -2.839106559753418, -2.526522397994995, -2.2139382362365723, -1.9013539552688599, -1.5887696743011475, -1.2761855125427246, -0.963601291179657, -0.6510170698165894, -0.33843284845352173, -0.0258486270904541, 0.28673553466796875, 0.5993198156356812, 0.9119040966033936, 1.2244873046875, 1.5370714664459229, 1.8496557474136353, 2.1622400283813477, 2.4748241901397705, 2.7874083518981934, 3.0999927520751953, 3.412576913833618, 3.725161075592041, 4.037745475769043, 4.350329399108887, 4.662913799285889, 4.975498199462891, 5.288082122802734, 5.600666522979736, 5.913250923156738, 6.225834846496582, 6.538419246673584, 6.851003170013428, 7.16358757019043, 7.476171493530273, 7.788755893707275, 8.101340293884277, 8.413924217224121, 8.726509094238281, 9.039093017578125, 9.351677894592285, 9.664261817932129, 9.976845741271973, 10.289430618286133, 10.602014541625977, 10.91459846496582, 11.227182388305664]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 7.0, 6.0, 6.0, 8.0, 13.0, 11.0, 16.0, 14.0, 20.0, 20.0, 24.0, 36.0, 22.0, 24.0, 41.0, 54.0, 54.0, 55.0, 43.0, 45.0, 41.0, 44.0, 47.0, 43.0, 39.0, 49.0, 41.0, 30.0, 28.0, 22.0, 23.0, 12.0, 13.0, 11.0, 10.0, 12.0, 3.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.838140487670898, -4.7023725509643555, -4.566605091094971, -4.430837154388428, -4.295069217681885, -4.1593017578125, -4.023533821105957, -3.887766122817993, -3.7519984245300293, -3.6162307262420654, -3.4804627895355225, -3.3446950912475586, -3.2089273929595947, -3.073159694671631, -2.937391757965088, -2.801624059677124, -2.665856122970581, -2.530088424682617, -2.394320487976074, -2.2585527896881104, -2.1227850914001465, -1.987017273902893, -1.8512494564056396, -1.7154817581176758, -1.5797139406204224, -1.443946123123169, -1.308178424835205, -1.1724106073379517, -1.0366427898406982, -0.9008750915527344, -0.765107274055481, -0.6293395161628723, -0.49357151985168457, -0.3578037619590759, -0.2220359742641449, -0.08626818656921387, 0.049499571323394775, 0.18526732921600342, 0.32103514671325684, 0.4568029046058655, 0.5925706624984741, 0.7283384203910828, 0.8641061782836914, 0.9998739957809448, 1.1356418132781982, 1.271409511566162, 1.4071773290634155, 1.542945146560669, 1.6787128448486328, 1.8144806623458862, 1.95024836063385, 2.0860161781311035, 2.2217838764190674, 2.3575515747070312, 2.493319511413574, 2.629087209701538, 2.764854907989502, 2.900622606277466, 3.036390542984009, 3.1721582412719727, 3.3079259395599365, 3.4436936378479004, 3.5794615745544434, 3.7152292728424072, 3.85099720954895]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 10.0, 11.0, 13.0, 18.0, 16.0, 24.0, 48.0, 62.0, 113.0, 145.0, 287.0, 462.0, 910.0, 1795.0, 3913.0, 9820.0, 27246.0, 92258.0, 384359.0, 388555.0, 92657.0, 27670.0, 9943.0, 4074.0, 1873.0, 999.0, 490.0, 285.0, 155.0, 107.0, 74.0, 46.0, 31.0, 22.0, 21.0, 7.0, 6.0, 8.0, 2.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.2158203125, -1.1820526123046875, -1.148284912109375, -1.1145172119140625, -1.08074951171875, -1.0469818115234375, -1.013214111328125, -0.9794464111328125, -0.9456787109375, -0.9119110107421875, -0.878143310546875, -0.8443756103515625, -0.81060791015625, -0.7768402099609375, -0.743072509765625, -0.7093048095703125, -0.675537109375, -0.6417694091796875, -0.608001708984375, -0.5742340087890625, -0.54046630859375, -0.5066986083984375, -0.472930908203125, -0.4391632080078125, -0.4053955078125, -0.3716278076171875, -0.337860107421875, -0.3040924072265625, -0.27032470703125, -0.2365570068359375, -0.202789306640625, -0.1690216064453125, -0.13525390625, -0.1014862060546875, -0.067718505859375, -0.0339508056640625, -0.00018310546875, 0.0335845947265625, 0.067352294921875, 0.1011199951171875, 0.1348876953125, 0.1686553955078125, 0.202423095703125, 0.2361907958984375, 0.26995849609375, 0.3037261962890625, 0.337493896484375, 0.3712615966796875, 0.405029296875, 0.4387969970703125, 0.472564697265625, 0.5063323974609375, 0.54010009765625, 0.5738677978515625, 0.607635498046875, 0.6414031982421875, 0.6751708984375, 0.7089385986328125, 0.742706298828125, 0.7764739990234375, 0.81024169921875, 0.8440093994140625, 0.877777099609375, 0.9115447998046875, 0.9453125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 6.0, 13.0, 14.0, 14.0, 26.0, 28.0, 38.0, 40.0, 44.0, 66.0, 49.0, 48.0, 76.0, 68.0, 75.0, 61.0, 52.0, 61.0, 37.0, 52.0, 29.0, 24.0, 22.0, 17.0, 10.0, 7.0, 6.0, 6.0, 1.0, 6.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.623046875, -0.5995025634765625, -0.575958251953125, -0.5524139404296875, -0.52886962890625, -0.5053253173828125, -0.481781005859375, -0.4582366943359375, -0.4346923828125, -0.4111480712890625, -0.387603759765625, -0.3640594482421875, -0.34051513671875, -0.3169708251953125, -0.293426513671875, -0.2698822021484375, -0.246337890625, -0.2227935791015625, -0.199249267578125, -0.1757049560546875, -0.15216064453125, -0.1286163330078125, -0.105072021484375, -0.0815277099609375, -0.0579833984375, -0.0344390869140625, -0.010894775390625, 0.0126495361328125, 0.03619384765625, 0.0597381591796875, 0.083282470703125, 0.1068267822265625, 0.13037109375, 0.1539154052734375, 0.177459716796875, 0.2010040283203125, 0.22454833984375, 0.2480926513671875, 0.271636962890625, 0.2951812744140625, 0.3187255859375, 0.3422698974609375, 0.365814208984375, 0.3893585205078125, 0.41290283203125, 0.4364471435546875, 0.459991455078125, 0.4835357666015625, 0.507080078125, 0.5306243896484375, 0.554168701171875, 0.5777130126953125, 0.60125732421875, 0.6248016357421875, 0.648345947265625, 0.6718902587890625, 0.6954345703125, 0.7189788818359375, 0.742523193359375, 0.7660675048828125, 0.78961181640625, 0.8131561279296875, 0.836700439453125, 0.8602447509765625, 0.8837890625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 7.0, 13.0, 14.0, 15.0, 22.0, 38.0, 77.0, 123.0, 261.0, 518.0, 1341.0, 4261.0, 25284.0, 388201.0, 588907.0, 31964.0, 4895.0, 1413.0, 579.0, 270.0, 127.0, 82.0, 43.0, 34.0, 22.0, 10.0, 12.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.84765625, -2.778289794921875, -2.70892333984375, -2.639556884765625, -2.5701904296875, -2.500823974609375, -2.43145751953125, -2.362091064453125, -2.292724609375, -2.223358154296875, -2.15399169921875, -2.084625244140625, -2.0152587890625, -1.945892333984375, -1.87652587890625, -1.807159423828125, -1.73779296875, -1.668426513671875, -1.59906005859375, -1.529693603515625, -1.4603271484375, -1.390960693359375, -1.32159423828125, -1.252227783203125, -1.182861328125, -1.113494873046875, -1.04412841796875, -0.974761962890625, -0.9053955078125, -0.836029052734375, -0.76666259765625, -0.697296142578125, -0.6279296875, -0.558563232421875, -0.48919677734375, -0.419830322265625, -0.3504638671875, -0.281097412109375, -0.21173095703125, -0.142364501953125, -0.072998046875, -0.003631591796875, 0.06573486328125, 0.135101318359375, 0.2044677734375, 0.273834228515625, 0.34320068359375, 0.412567138671875, 0.48193359375, 0.551300048828125, 0.62066650390625, 0.690032958984375, 0.7593994140625, 0.828765869140625, 0.89813232421875, 0.967498779296875, 1.036865234375, 1.106231689453125, 1.17559814453125, 1.244964599609375, 1.3143310546875, 1.383697509765625, 1.45306396484375, 1.522430419921875, 1.591796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 6.0, 7.0, 7.0, 8.0, 9.0, 10.0, 21.0, 33.0, 22.0, 37.0, 38.0, 53.0, 48.0, 35.0, 61.0, 64.0, 55.0, 59.0, 69.0, 51.0, 50.0, 39.0, 39.0, 42.0, 33.0, 18.0, 17.0, 16.0, 6.0, 10.0, 7.0, 13.0, 2.0, 5.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.548828125, -2.468353271484375, -2.38787841796875, -2.307403564453125, -2.2269287109375, -2.146453857421875, -2.06597900390625, -1.985504150390625, -1.905029296875, -1.824554443359375, -1.74407958984375, -1.663604736328125, -1.5831298828125, -1.502655029296875, -1.42218017578125, -1.341705322265625, -1.26123046875, -1.180755615234375, -1.10028076171875, -1.019805908203125, -0.9393310546875, -0.858856201171875, -0.77838134765625, -0.697906494140625, -0.617431640625, -0.536956787109375, -0.45648193359375, -0.376007080078125, -0.2955322265625, -0.215057373046875, -0.13458251953125, -0.054107666015625, 0.0263671875, 0.106842041015625, 0.18731689453125, 0.267791748046875, 0.3482666015625, 0.428741455078125, 0.50921630859375, 0.589691162109375, 0.670166015625, 0.750640869140625, 0.83111572265625, 0.911590576171875, 0.9920654296875, 1.072540283203125, 1.15301513671875, 1.233489990234375, 1.31396484375, 1.394439697265625, 1.47491455078125, 1.555389404296875, 1.6358642578125, 1.716339111328125, 1.79681396484375, 1.877288818359375, 1.957763671875, 2.038238525390625, 2.11871337890625, 2.199188232421875, 2.2796630859375, 2.360137939453125, 2.44061279296875, 2.521087646484375, 2.6015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 10.0, 14.0, 18.0, 19.0, 29.0, 81.0, 157.0, 547.0, 2144.0, 24141.0, 958815.0, 58102.0, 3363.0, 658.0, 228.0, 88.0, 49.0, 26.0, 19.0, 8.0, 10.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.4756011962890625, -1.413116455078125, -1.3506317138671875, -1.28814697265625, -1.2256622314453125, -1.163177490234375, -1.1006927490234375, -1.0382080078125, -0.9757232666015625, -0.913238525390625, -0.8507537841796875, -0.78826904296875, -0.7257843017578125, -0.663299560546875, -0.6008148193359375, -0.538330078125, -0.4758453369140625, -0.413360595703125, -0.3508758544921875, -0.28839111328125, -0.2259063720703125, -0.163421630859375, -0.1009368896484375, -0.0384521484375, 0.0240325927734375, 0.086517333984375, 0.1490020751953125, 0.21148681640625, 0.2739715576171875, 0.336456298828125, 0.3989410400390625, 0.46142578125, 0.5239105224609375, 0.586395263671875, 0.6488800048828125, 0.71136474609375, 0.7738494873046875, 0.836334228515625, 0.8988189697265625, 0.9613037109375, 1.0237884521484375, 1.086273193359375, 1.1487579345703125, 1.21124267578125, 1.2737274169921875, 1.336212158203125, 1.3986968994140625, 1.461181640625, 1.5236663818359375, 1.586151123046875, 1.6486358642578125, 1.71112060546875, 1.7736053466796875, 1.836090087890625, 1.8985748291015625, 1.9610595703125, 2.0235443115234375, 2.086029052734375, 2.1485137939453125, 2.21099853515625, 2.2734832763671875, 2.335968017578125, 2.3984527587890625, 2.4609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 8.0, 8.0, 6.0, 12.0, 11.0, 22.0, 23.0, 40.0, 53.0, 77.0, 138.0, 191.0, 158.0, 81.0, 54.0, 37.0, 20.0, 12.0, 9.0, 14.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001983642578125, -0.00019229575991630554, -0.00018622726202011108, -0.00018015876412391663, -0.00017409026622772217, -0.0001680217683315277, -0.00016195327043533325, -0.0001558847725391388, -0.00014981627464294434, -0.00014374777674674988, -0.00013767927885055542, -0.00013161078095436096, -0.0001255422830581665, -0.00011947378516197205, -0.00011340528726577759, -0.00010733678936958313, -0.00010126829147338867, -9.519979357719421e-05, -8.913129568099976e-05, -8.30627977848053e-05, -7.699429988861084e-05, -7.092580199241638e-05, -6.485730409622192e-05, -5.8788806200027466e-05, -5.272030830383301e-05, -4.665181040763855e-05, -4.058331251144409e-05, -3.4514814615249634e-05, -2.8446316719055176e-05, -2.2377818822860718e-05, -1.630932092666626e-05, -1.0240823030471802e-05, -4.172325134277344e-06, 1.8961727619171143e-06, 7.964670658111572e-06, 1.403316855430603e-05, 2.0101666450500488e-05, 2.6170164346694946e-05, 3.2238662242889404e-05, 3.830716013908386e-05, 4.437565803527832e-05, 5.044415593147278e-05, 5.6512653827667236e-05, 6.25811517238617e-05, 6.864964962005615e-05, 7.471814751625061e-05, 8.078664541244507e-05, 8.685514330863953e-05, 9.292364120483398e-05, 9.899213910102844e-05, 0.0001050606369972229, 0.00011112913489341736, 0.00011719763278961182, 0.00012326613068580627, 0.00012933462858200073, 0.0001354031264781952, 0.00014147162437438965, 0.0001475401222705841, 0.00015360862016677856, 0.00015967711806297302, 0.00016574561595916748, 0.00017181411385536194, 0.0001778826117515564, 0.00018395110964775085, 0.0001900196075439453]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 5.0, 14.0, 20.0, 29.0, 34.0, 56.0, 73.0, 111.0, 175.0, 290.0, 530.0, 982.0, 2148.0, 5205.0, 15022.0, 65623.0, 607457.0, 292066.0, 40490.0, 10683.0, 3877.0, 1715.0, 786.0, 404.0, 246.0, 147.0, 105.0, 68.0, 37.0, 47.0, 25.0, 21.0, 10.0, 6.0, 7.0, 12.0, 3.0, 3.0, 4.0, 5.0, 1.0, 2.0], "bins": [-0.8193359375, -0.798248291015625, -0.77716064453125, -0.756072998046875, -0.7349853515625, -0.713897705078125, -0.69281005859375, -0.671722412109375, -0.650634765625, -0.629547119140625, -0.60845947265625, -0.587371826171875, -0.5662841796875, -0.545196533203125, -0.52410888671875, -0.503021240234375, -0.48193359375, -0.460845947265625, -0.43975830078125, -0.418670654296875, -0.3975830078125, -0.376495361328125, -0.35540771484375, -0.334320068359375, -0.313232421875, -0.292144775390625, -0.27105712890625, -0.249969482421875, -0.2288818359375, -0.207794189453125, -0.18670654296875, -0.165618896484375, -0.14453125, -0.123443603515625, -0.10235595703125, -0.081268310546875, -0.0601806640625, -0.039093017578125, -0.01800537109375, 0.003082275390625, 0.024169921875, 0.045257568359375, 0.06634521484375, 0.087432861328125, 0.1085205078125, 0.129608154296875, 0.15069580078125, 0.171783447265625, 0.19287109375, 0.213958740234375, 0.23504638671875, 0.256134033203125, 0.2772216796875, 0.298309326171875, 0.31939697265625, 0.340484619140625, 0.361572265625, 0.382659912109375, 0.40374755859375, 0.424835205078125, 0.4459228515625, 0.467010498046875, 0.48809814453125, 0.509185791015625, 0.5302734375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 3.0, 8.0, 12.0, 11.0, 27.0, 26.0, 40.0, 58.0, 78.0, 104.0, 131.0, 108.0, 110.0, 69.0, 52.0, 48.0, 28.0, 28.0, 17.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7578125, -0.734100341796875, -0.71038818359375, -0.686676025390625, -0.6629638671875, -0.639251708984375, -0.61553955078125, -0.591827392578125, -0.568115234375, -0.544403076171875, -0.52069091796875, -0.496978759765625, -0.4732666015625, -0.449554443359375, -0.42584228515625, -0.402130126953125, -0.37841796875, -0.354705810546875, -0.33099365234375, -0.307281494140625, -0.2835693359375, -0.259857177734375, -0.23614501953125, -0.212432861328125, -0.188720703125, -0.165008544921875, -0.14129638671875, -0.117584228515625, -0.0938720703125, -0.070159912109375, -0.04644775390625, -0.022735595703125, 0.0009765625, 0.024688720703125, 0.04840087890625, 0.072113037109375, 0.0958251953125, 0.119537353515625, 0.14324951171875, 0.166961669921875, 0.190673828125, 0.214385986328125, 0.23809814453125, 0.261810302734375, 0.2855224609375, 0.309234619140625, 0.33294677734375, 0.356658935546875, 0.38037109375, 0.404083251953125, 0.42779541015625, 0.451507568359375, 0.4752197265625, 0.498931884765625, 0.52264404296875, 0.546356201171875, 0.570068359375, 0.593780517578125, 0.61749267578125, 0.641204833984375, 0.6649169921875, 0.688629150390625, 0.71234130859375, 0.736053466796875, 0.759765625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 9.0, 35.0, 113.0, 265.0, 307.0, 168.0, 53.0, 26.0, 7.0, 8.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.122325897216797, -19.498199462890625, -18.874074935913086, -18.249950408935547, -17.625823974609375, -17.001697540283203, -16.377573013305664, -15.753447532653809, -15.129322052001953, -14.505196571350098, -13.881071090698242, -13.256945610046387, -12.632820129394531, -12.008694648742676, -11.38456916809082, -10.760443687438965, -10.13631820678711, -9.512192726135254, -8.888067245483398, -8.263941764831543, -7.6398162841796875, -7.015690803527832, -6.391565322875977, -5.767439842224121, -5.143314361572266, -4.51918888092041, -3.8950634002685547, -3.270937919616699, -2.6468124389648438, -2.0226869583129883, -1.3985614776611328, -0.7744359970092773, -0.15030860900878906, 0.4738168716430664, 1.0979423522949219, 1.7220678329467773, 2.346193313598633, 2.9703187942504883, 3.5944442749023438, 4.218569755554199, 4.842695236206055, 5.46682071685791, 6.090946197509766, 6.715071678161621, 7.339197158813477, 7.963322639465332, 8.587448120117188, 9.211573600769043, 9.835699081420898, 10.459824562072754, 11.08395004272461, 11.708075523376465, 12.33220100402832, 12.956326484680176, 13.580451965332031, 14.204577445983887, 14.828702926635742, 15.452828407287598, 16.076953887939453, 16.701080322265625, 17.325204849243164, 17.949329376220703, 18.573455810546875, 19.197582244873047, 19.821706771850586]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 2.0, 8.0, 15.0, 17.0, 15.0, 10.0, 20.0, 31.0, 25.0, 30.0, 34.0, 40.0, 40.0, 45.0, 78.0, 68.0, 65.0, 61.0, 50.0, 55.0, 46.0, 37.0, 35.0, 32.0, 29.0, 30.0, 22.0, 17.0, 9.0, 11.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.19511890411377, -10.891559600830078, -10.588000297546387, -10.284440040588379, -9.980880737304688, -9.677321434020996, -9.373762130737305, -9.070202827453613, -8.766643524169922, -8.46308422088623, -8.159524917602539, -7.8559651374816895, -7.55240535736084, -7.248846054077148, -6.945286750793457, -6.641727447509766, -6.338167190551758, -6.034607887268066, -5.731048107147217, -5.427488803863525, -5.123929023742676, -4.820369720458984, -4.516810417175293, -4.213251113891602, -3.909691333770752, -3.6061317920684814, -3.302572250366211, -2.9990129470825195, -2.695453405380249, -2.3918938636779785, -2.088334560394287, -1.7847750186920166, -1.4812145233154297, -1.1776549816131592, -0.8740955591201782, -0.5705360770225525, -0.26697659492492676, 0.03658294677734375, 0.3401423692703247, 0.6437017917633057, 0.9472613334655762, 1.2508208751678467, 1.5543802976608276, 1.8579397201538086, 2.161499261856079, 2.4650588035583496, 2.768618106842041, 3.0721776485443115, 3.375737190246582, 3.6792967319488525, 3.982856273651123, 4.2864155769348145, 4.589975357055664, 4.8935346603393555, 5.197093963623047, 5.500653266906738, 5.804213047027588, 6.107772350311279, 6.411332130432129, 6.71489143371582, 7.018450736999512, 7.322010517120361, 7.625569820404053, 7.929129600524902, 8.232688903808594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 7.0, 10.0, 10.0, 20.0, 25.0, 66.0, 108.0, 211.0, 593.0, 2501.0, 17109.0, 349682.0, 3615868.0, 192703.0, 11830.0, 2252.0, 688.0, 274.0, 138.0, 74.0, 42.0, 22.0, 22.0, 13.0, 2.0, 4.0, 3.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4853515625, -1.44091796875, -1.396484375, -1.35205078125, -1.3076171875, -1.26318359375, -1.21875, -1.17431640625, -1.1298828125, -1.08544921875, -1.041015625, -0.99658203125, -0.9521484375, -0.90771484375, -0.86328125, -0.81884765625, -0.7744140625, -0.72998046875, -0.685546875, -0.64111328125, -0.5966796875, -0.55224609375, -0.5078125, -0.46337890625, -0.4189453125, -0.37451171875, -0.330078125, -0.28564453125, -0.2412109375, -0.19677734375, -0.15234375, -0.10791015625, -0.0634765625, -0.01904296875, 0.025390625, 0.06982421875, 0.1142578125, 0.15869140625, 0.203125, 0.24755859375, 0.2919921875, 0.33642578125, 0.380859375, 0.42529296875, 0.4697265625, 0.51416015625, 0.55859375, 0.60302734375, 0.6474609375, 0.69189453125, 0.736328125, 0.78076171875, 0.8251953125, 0.86962890625, 0.9140625, 0.95849609375, 1.0029296875, 1.04736328125, 1.091796875, 1.13623046875, 1.1806640625, 1.22509765625, 1.26953125, 1.31396484375, 1.3583984375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 17.0, 27.0, 36.0, 52.0, 69.0, 87.0, 101.0, 134.0, 119.0, 76.0, 89.0, 69.0, 50.0, 30.0, 15.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.24609375, -1.2102813720703125, -1.174468994140625, -1.1386566162109375, -1.10284423828125, -1.0670318603515625, -1.031219482421875, -0.9954071044921875, -0.9595947265625, -0.9237823486328125, -0.887969970703125, -0.8521575927734375, -0.81634521484375, -0.7805328369140625, -0.744720458984375, -0.7089080810546875, -0.673095703125, -0.6372833251953125, -0.601470947265625, -0.5656585693359375, -0.52984619140625, -0.4940338134765625, -0.458221435546875, -0.4224090576171875, -0.3865966796875, -0.3507843017578125, -0.314971923828125, -0.2791595458984375, -0.24334716796875, -0.2075347900390625, -0.171722412109375, -0.1359100341796875, -0.10009765625, -0.0642852783203125, -0.028472900390625, 0.0073394775390625, 0.04315185546875, 0.0789642333984375, 0.114776611328125, 0.1505889892578125, 0.1864013671875, 0.2222137451171875, 0.258026123046875, 0.2938385009765625, 0.32965087890625, 0.3654632568359375, 0.401275634765625, 0.4370880126953125, 0.472900390625, 0.5087127685546875, 0.544525146484375, 0.5803375244140625, 0.61614990234375, 0.6519622802734375, 0.687774658203125, 0.7235870361328125, 0.7593994140625, 0.7952117919921875, 0.831024169921875, 0.8668365478515625, 0.90264892578125, 0.9384613037109375, 0.974273681640625, 1.0100860595703125, 1.0458984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 1.0, 8.0, 9.0, 16.0, 14.0, 22.0, 22.0, 44.0, 64.0, 112.0, 162.0, 263.0, 441.0, 901.0, 1854.0, 4491.0, 11729.0, 37153.0, 161371.0, 1270098.0, 2302649.0, 317539.0, 58450.0, 16485.0, 5717.0, 2252.0, 1029.0, 520.0, 295.0, 187.0, 121.0, 76.0, 51.0, 37.0, 18.0, 24.0, 12.0, 14.0, 6.0, 2.0, 5.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.69580078125, -0.6734848022460938, -0.6511688232421875, -0.6288528442382812, -0.606536865234375, -0.5842208862304688, -0.5619049072265625, -0.5395889282226562, -0.51727294921875, -0.49495697021484375, -0.4726409912109375, -0.45032501220703125, -0.428009033203125, -0.40569305419921875, -0.3833770751953125, -0.36106109619140625, -0.3387451171875, -0.31642913818359375, -0.2941131591796875, -0.27179718017578125, -0.249481201171875, -0.22716522216796875, -0.2048492431640625, -0.18253326416015625, -0.16021728515625, -0.13790130615234375, -0.1155853271484375, -0.09326934814453125, -0.070953369140625, -0.04863739013671875, -0.0263214111328125, -0.00400543212890625, 0.018310546875, 0.04062652587890625, 0.0629425048828125, 0.08525848388671875, 0.107574462890625, 0.12989044189453125, 0.1522064208984375, 0.17452239990234375, 0.19683837890625, 0.21915435791015625, 0.2414703369140625, 0.26378631591796875, 0.286102294921875, 0.30841827392578125, 0.3307342529296875, 0.35305023193359375, 0.3753662109375, 0.39768218994140625, 0.4199981689453125, 0.44231414794921875, 0.464630126953125, 0.48694610595703125, 0.5092620849609375, 0.5315780639648438, 0.55389404296875, 0.5762100219726562, 0.5985260009765625, 0.6208419799804688, 0.643157958984375, 0.6654739379882812, 0.6877899169921875, 0.7101058959960938, 0.732421875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 7.0, 3.0, 6.0, 16.0, 12.0, 16.0, 28.0, 37.0, 73.0, 125.0, 220.0, 375.0, 660.0, 830.0, 665.0, 438.0, 241.0, 110.0, 91.0, 43.0, 25.0, 18.0, 13.0, 10.0, 10.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.162109375, -1.1199493408203125, -1.077789306640625, -1.0356292724609375, -0.99346923828125, -0.9513092041015625, -0.909149169921875, -0.8669891357421875, -0.8248291015625, -0.7826690673828125, -0.740509033203125, -0.6983489990234375, -0.65618896484375, -0.6140289306640625, -0.571868896484375, -0.5297088623046875, -0.487548828125, -0.4453887939453125, -0.403228759765625, -0.3610687255859375, -0.31890869140625, -0.2767486572265625, -0.234588623046875, -0.1924285888671875, -0.1502685546875, -0.1081085205078125, -0.065948486328125, -0.0237884521484375, 0.01837158203125, 0.0605316162109375, 0.102691650390625, 0.1448516845703125, 0.18701171875, 0.2291717529296875, 0.271331787109375, 0.3134918212890625, 0.35565185546875, 0.3978118896484375, 0.439971923828125, 0.4821319580078125, 0.5242919921875, 0.5664520263671875, 0.608612060546875, 0.6507720947265625, 0.69293212890625, 0.7350921630859375, 0.777252197265625, 0.8194122314453125, 0.861572265625, 0.9037322998046875, 0.945892333984375, 0.9880523681640625, 1.03021240234375, 1.0723724365234375, 1.114532470703125, 1.1566925048828125, 1.1988525390625, 1.2410125732421875, 1.283172607421875, 1.3253326416015625, 1.36749267578125, 1.4096527099609375, 1.451812744140625, 1.4939727783203125, 1.5361328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 5.0, 12.0, 14.0, 48.0, 111.0, 173.0, 193.0, 187.0, 124.0, 49.0, 40.0, 17.0, 15.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.897523880004883, -11.520047187805176, -11.142571449279785, -10.765094757080078, -10.387619018554688, -10.01014232635498, -9.63266658782959, -9.255189895629883, -8.877714157104492, -8.500237464904785, -8.122761726379395, -7.745285511016846, -7.367809295654297, -6.990333080291748, -6.612856864929199, -6.235380172729492, -5.857903957366943, -5.4804277420043945, -5.102951526641846, -4.725475311279297, -4.347999095916748, -3.970522880554199, -3.5930464267730713, -3.2155702114105225, -2.8380939960479736, -2.460617780685425, -2.083141565322876, -1.7056652307510376, -1.3281890153884888, -0.9507128000259399, -0.5732364654541016, -0.19576025009155273, 0.1817159652709961, 0.5591921806335449, 0.9366684556007385, 1.3141447305679321, 1.691620945930481, 2.0690970420837402, 2.446573495864868, 2.824049711227417, 3.201525926589966, 3.5790021419525146, 3.9564783573150635, 4.333954811096191, 4.71143102645874, 5.088907241821289, 5.466383457183838, 5.843859672546387, 6.2213358879089355, 6.598812103271484, 6.976288318634033, 7.353764533996582, 7.731240749359131, 8.10871696472168, 8.486193656921387, 8.863669395446777, 9.241146087646484, 9.618622779846191, 9.996098518371582, 10.373575210571289, 10.75105094909668, 11.128527641296387, 11.506003379821777, 11.883480072021484, 12.260955810546875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 9.0, 5.0, 9.0, 12.0, 14.0, 21.0, 28.0, 25.0, 44.0, 42.0, 49.0, 55.0, 64.0, 58.0, 59.0, 57.0, 74.0, 53.0, 53.0, 53.0, 42.0, 37.0, 31.0, 25.0, 22.0, 15.0, 14.0, 12.0, 6.0, 5.0, 8.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.308134078979492, -7.113401412963867, -6.918668746948242, -6.723936080932617, -6.529203414916992, -6.334471225738525, -6.1397385597229, -5.945005893707275, -5.75027322769165, -5.555540561676025, -5.3608078956604, -5.166075229644775, -4.971343040466309, -4.776610374450684, -4.581877708435059, -4.387145042419434, -4.192412376403809, -3.9976797103881836, -3.8029470443725586, -3.6082146167755127, -3.4134819507598877, -3.2187492847442627, -3.024016857147217, -2.829284191131592, -2.634551525115967, -2.439818859100342, -2.245086193084717, -2.050353765487671, -1.855621099472046, -1.660888433456421, -1.4661558866500854, -1.27142333984375, -1.0766911506652832, -0.881958544254303, -0.6872259378433228, -0.49249333143234253, -0.2977607250213623, -0.10302811861038208, 0.09170448780059814, 0.2864370346069336, 0.4811697006225586, 0.6759023070335388, 0.870634913444519, 1.0653674602508545, 1.2601001262664795, 1.4548327922821045, 1.64956533908844, 1.8442978858947754, 2.0390305519104004, 2.2337632179260254, 2.4284958839416504, 2.6232283115386963, 2.8179609775543213, 3.0126936435699463, 3.207426071166992, 3.402158737182617, 3.596891403198242, 3.791624069213867, 3.986356735229492, 4.181089401245117, 4.375822067260742, 4.570554256439209, 4.765286922454834, 4.960019588470459, 5.154752254486084]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 7.0, 6.0, 11.0, 23.0, 30.0, 36.0, 53.0, 67.0, 128.0, 222.0, 344.0, 654.0, 1281.0, 3064.0, 7895.0, 23138.0, 71758.0, 230785.0, 437353.0, 183832.0, 57357.0, 18815.0, 6586.0, 2567.0, 1172.0, 587.0, 337.0, 157.0, 93.0, 57.0, 45.0, 28.0, 20.0, 15.0, 10.0, 8.0, 3.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.15234375, -1.1206893920898438, -1.0890350341796875, -1.0573806762695312, -1.025726318359375, -0.9940719604492188, -0.9624176025390625, -0.9307632446289062, -0.89910888671875, -0.8674545288085938, -0.8358001708984375, -0.8041458129882812, -0.772491455078125, -0.7408370971679688, -0.7091827392578125, -0.6775283813476562, -0.6458740234375, -0.6142196655273438, -0.5825653076171875, -0.5509109497070312, -0.519256591796875, -0.48760223388671875, -0.4559478759765625, -0.42429351806640625, -0.39263916015625, -0.36098480224609375, -0.3293304443359375, -0.29767608642578125, -0.266021728515625, -0.23436737060546875, -0.2027130126953125, -0.17105865478515625, -0.139404296875, -0.10774993896484375, -0.0760955810546875, -0.04444122314453125, -0.012786865234375, 0.01886749267578125, 0.0505218505859375, 0.08217620849609375, 0.11383056640625, 0.14548492431640625, 0.1771392822265625, 0.20879364013671875, 0.240447998046875, 0.27210235595703125, 0.3037567138671875, 0.33541107177734375, 0.3670654296875, 0.39871978759765625, 0.4303741455078125, 0.46202850341796875, 0.493682861328125, 0.5253372192382812, 0.5569915771484375, 0.5886459350585938, 0.62030029296875, 0.6519546508789062, 0.6836090087890625, 0.7152633666992188, 0.746917724609375, 0.7785720825195312, 0.8102264404296875, 0.8418807983398438, 0.87353515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 7.0, 6.0, 4.0, 17.0, 19.0, 30.0, 46.0, 56.0, 72.0, 86.0, 111.0, 106.0, 98.0, 106.0, 75.0, 58.0, 36.0, 24.0, 19.0, 10.0, 9.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3193359375, -1.286773681640625, -1.25421142578125, -1.221649169921875, -1.1890869140625, -1.156524658203125, -1.12396240234375, -1.091400146484375, -1.058837890625, -1.026275634765625, -0.99371337890625, -0.961151123046875, -0.9285888671875, -0.896026611328125, -0.86346435546875, -0.830902099609375, -0.79833984375, -0.765777587890625, -0.73321533203125, -0.700653076171875, -0.6680908203125, -0.635528564453125, -0.60296630859375, -0.570404052734375, -0.537841796875, -0.505279541015625, -0.47271728515625, -0.440155029296875, -0.4075927734375, -0.375030517578125, -0.34246826171875, -0.309906005859375, -0.27734375, -0.244781494140625, -0.21221923828125, -0.179656982421875, -0.1470947265625, -0.114532470703125, -0.08197021484375, -0.049407958984375, -0.016845703125, 0.015716552734375, 0.04827880859375, 0.080841064453125, 0.1134033203125, 0.145965576171875, 0.17852783203125, 0.211090087890625, 0.24365234375, 0.276214599609375, 0.30877685546875, 0.341339111328125, 0.3739013671875, 0.406463623046875, 0.43902587890625, 0.471588134765625, 0.504150390625, 0.536712646484375, 0.56927490234375, 0.601837158203125, 0.6343994140625, 0.666961669921875, 0.69952392578125, 0.732086181640625, 0.7646484375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 9.0, 9.0, 9.0, 12.0, 16.0, 24.0, 32.0, 40.0, 72.0, 72.0, 142.0, 221.0, 346.0, 583.0, 1056.0, 2103.0, 4914.0, 16713.0, 110974.0, 753019.0, 129531.0, 18507.0, 5320.0, 2097.0, 1061.0, 611.0, 342.0, 243.0, 160.0, 102.0, 70.0, 48.0, 30.0, 23.0, 18.0, 10.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.99609375, -1.9365692138671875, -1.877044677734375, -1.8175201416015625, -1.75799560546875, -1.6984710693359375, -1.638946533203125, -1.5794219970703125, -1.5198974609375, -1.4603729248046875, -1.400848388671875, -1.3413238525390625, -1.28179931640625, -1.2222747802734375, -1.162750244140625, -1.1032257080078125, -1.043701171875, -0.9841766357421875, -0.924652099609375, -0.8651275634765625, -0.80560302734375, -0.7460784912109375, -0.686553955078125, -0.6270294189453125, -0.5675048828125, -0.5079803466796875, -0.448455810546875, -0.3889312744140625, -0.32940673828125, -0.2698822021484375, -0.210357666015625, -0.1508331298828125, -0.09130859375, -0.0317840576171875, 0.027740478515625, 0.0872650146484375, 0.14678955078125, 0.2063140869140625, 0.265838623046875, 0.3253631591796875, 0.3848876953125, 0.4444122314453125, 0.503936767578125, 0.5634613037109375, 0.62298583984375, 0.6825103759765625, 0.742034912109375, 0.8015594482421875, 0.861083984375, 0.9206085205078125, 0.980133056640625, 1.0396575927734375, 1.09918212890625, 1.1587066650390625, 1.218231201171875, 1.2777557373046875, 1.3372802734375, 1.3968048095703125, 1.456329345703125, 1.5158538818359375, 1.57537841796875, 1.6349029541015625, 1.694427490234375, 1.7539520263671875, 1.8134765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 7.0, 9.0, 19.0, 13.0, 15.0, 20.0, 24.0, 44.0, 39.0, 73.0, 72.0, 80.0, 81.0, 82.0, 76.0, 57.0, 59.0, 68.0, 45.0, 36.0, 17.0, 15.0, 9.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.0625, -3.9493408203125, -3.836181640625, -3.7230224609375, -3.60986328125, -3.4967041015625, -3.383544921875, -3.2703857421875, -3.1572265625, -3.0440673828125, -2.930908203125, -2.8177490234375, -2.70458984375, -2.5914306640625, -2.478271484375, -2.3651123046875, -2.251953125, -2.1387939453125, -2.025634765625, -1.9124755859375, -1.79931640625, -1.6861572265625, -1.572998046875, -1.4598388671875, -1.3466796875, -1.2335205078125, -1.120361328125, -1.0072021484375, -0.89404296875, -0.7808837890625, -0.667724609375, -0.5545654296875, -0.44140625, -0.3282470703125, -0.215087890625, -0.1019287109375, 0.01123046875, 0.1243896484375, 0.237548828125, 0.3507080078125, 0.4638671875, 0.5770263671875, 0.690185546875, 0.8033447265625, 0.91650390625, 1.0296630859375, 1.142822265625, 1.2559814453125, 1.369140625, 1.4822998046875, 1.595458984375, 1.7086181640625, 1.82177734375, 1.9349365234375, 2.048095703125, 2.1612548828125, 2.2744140625, 2.3875732421875, 2.500732421875, 2.6138916015625, 2.72705078125, 2.8402099609375, 2.953369140625, 3.0665283203125, 3.1796875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 13.0, 10.0, 15.0, 31.0, 31.0, 56.0, 88.0, 144.0, 209.0, 394.0, 741.0, 1606.0, 4475.0, 16301.0, 79543.0, 687864.0, 208850.0, 34688.0, 8330.0, 2772.0, 1089.0, 522.0, 299.0, 153.0, 90.0, 63.0, 51.0, 24.0, 22.0, 19.0, 12.0, 11.0, 7.0, 7.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.81982421875, -0.796234130859375, -0.77264404296875, -0.749053955078125, -0.7254638671875, -0.701873779296875, -0.67828369140625, -0.654693603515625, -0.631103515625, -0.607513427734375, -0.58392333984375, -0.560333251953125, -0.5367431640625, -0.513153076171875, -0.48956298828125, -0.465972900390625, -0.4423828125, -0.418792724609375, -0.39520263671875, -0.371612548828125, -0.3480224609375, -0.324432373046875, -0.30084228515625, -0.277252197265625, -0.253662109375, -0.230072021484375, -0.20648193359375, -0.182891845703125, -0.1593017578125, -0.135711669921875, -0.11212158203125, -0.088531494140625, -0.06494140625, -0.041351318359375, -0.01776123046875, 0.005828857421875, 0.0294189453125, 0.053009033203125, 0.07659912109375, 0.100189208984375, 0.123779296875, 0.147369384765625, 0.17095947265625, 0.194549560546875, 0.2181396484375, 0.241729736328125, 0.26531982421875, 0.288909912109375, 0.3125, 0.336090087890625, 0.35968017578125, 0.383270263671875, 0.4068603515625, 0.430450439453125, 0.45404052734375, 0.477630615234375, 0.501220703125, 0.524810791015625, 0.54840087890625, 0.571990966796875, 0.5955810546875, 0.619171142578125, 0.64276123046875, 0.666351318359375, 0.68994140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 7.0, 2.0, 9.0, 8.0, 8.0, 9.0, 12.0, 16.0, 16.0, 24.0, 29.0, 42.0, 52.0, 60.0, 107.0, 164.0, 127.0, 69.0, 49.0, 41.0, 29.0, 23.0, 21.0, 17.0, 9.0, 18.0, 8.0, 6.0, 5.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021076202392578125, -0.00020409375429153442, -0.0001974254846572876, -0.00019075721502304077, -0.00018408894538879395, -0.00017742067575454712, -0.0001707524061203003, -0.00016408413648605347, -0.00015741586685180664, -0.00015074759721755981, -0.000144079327583313, -0.00013741105794906616, -0.00013074278831481934, -0.0001240745186805725, -0.00011740624904632568, -0.00011073797941207886, -0.00010406970977783203, -9.74014401435852e-05, -9.073317050933838e-05, -8.406490087509155e-05, -7.739663124084473e-05, -7.07283616065979e-05, -6.406009197235107e-05, -5.739182233810425e-05, -5.072355270385742e-05, -4.4055283069610596e-05, -3.738701343536377e-05, -3.071874380111694e-05, -2.4050474166870117e-05, -1.738220453262329e-05, -1.0713934898376465e-05, -4.045665264129639e-06, 2.6226043701171875e-06, 9.290874004364014e-06, 1.595914363861084e-05, 2.2627413272857666e-05, 2.9295682907104492e-05, 3.596395254135132e-05, 4.2632222175598145e-05, 4.930049180984497e-05, 5.59687614440918e-05, 6.263703107833862e-05, 6.930530071258545e-05, 7.597357034683228e-05, 8.26418399810791e-05, 8.931010961532593e-05, 9.597837924957275e-05, 0.00010264664888381958, 0.0001093149185180664, 0.00011598318815231323, 0.00012265145778656006, 0.00012931972742080688, 0.0001359879970550537, 0.00014265626668930054, 0.00014932453632354736, 0.0001559928059577942, 0.00016266107559204102, 0.00016932934522628784, 0.00017599761486053467, 0.0001826658844947815, 0.00018933415412902832, 0.00019600242376327515, 0.00020267069339752197, 0.0002093389630317688, 0.00021600723266601562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 6.0, 7.0, 6.0, 9.0, 18.0, 25.0, 53.0, 48.0, 86.0, 107.0, 196.0, 350.0, 621.0, 1317.0, 2836.0, 7590.0, 24979.0, 128460.0, 735892.0, 110907.0, 22438.0, 7076.0, 2699.0, 1237.0, 647.0, 331.0, 191.0, 129.0, 103.0, 63.0, 34.0, 23.0, 24.0, 18.0, 11.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78662109375, -0.7631149291992188, -0.7396087646484375, -0.7161026000976562, -0.692596435546875, -0.6690902709960938, -0.6455841064453125, -0.6220779418945312, -0.59857177734375, -0.5750656127929688, -0.5515594482421875, -0.5280532836914062, -0.504547119140625, -0.48104095458984375, -0.4575347900390625, -0.43402862548828125, -0.4105224609375, -0.38701629638671875, -0.3635101318359375, -0.34000396728515625, -0.316497802734375, -0.29299163818359375, -0.2694854736328125, -0.24597930908203125, -0.22247314453125, -0.19896697998046875, -0.1754608154296875, -0.15195465087890625, -0.128448486328125, -0.10494232177734375, -0.0814361572265625, -0.05792999267578125, -0.034423828125, -0.01091766357421875, 0.0125885009765625, 0.03609466552734375, 0.059600830078125, 0.08310699462890625, 0.1066131591796875, 0.13011932373046875, 0.15362548828125, 0.17713165283203125, 0.2006378173828125, 0.22414398193359375, 0.247650146484375, 0.27115631103515625, 0.2946624755859375, 0.31816864013671875, 0.3416748046875, 0.36518096923828125, 0.3886871337890625, 0.41219329833984375, 0.435699462890625, 0.45920562744140625, 0.4827117919921875, 0.5062179565429688, 0.52972412109375, 0.5532302856445312, 0.5767364501953125, 0.6002426147460938, 0.623748779296875, 0.6472549438476562, 0.6707611083984375, 0.6942672729492188, 0.7177734375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 13.0, 9.0, 8.0, 13.0, 14.0, 19.0, 30.0, 43.0, 54.0, 51.0, 78.0, 134.0, 136.0, 89.0, 66.0, 50.0, 42.0, 35.0, 27.0, 14.0, 14.0, 14.0, 9.0, 6.0, 4.0, 2.0, 1.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8662109375, -0.8433609008789062, -0.8205108642578125, -0.7976608276367188, -0.774810791015625, -0.7519607543945312, -0.7291107177734375, -0.7062606811523438, -0.68341064453125, -0.6605606079101562, -0.6377105712890625, -0.6148605346679688, -0.592010498046875, -0.5691604614257812, -0.5463104248046875, -0.5234603881835938, -0.5006103515625, -0.47776031494140625, -0.4549102783203125, -0.43206024169921875, -0.409210205078125, -0.38636016845703125, -0.3635101318359375, -0.34066009521484375, -0.31781005859375, -0.29496002197265625, -0.2721099853515625, -0.24925994873046875, -0.226409912109375, -0.20355987548828125, -0.1807098388671875, -0.15785980224609375, -0.135009765625, -0.11215972900390625, -0.0893096923828125, -0.06645965576171875, -0.043609619140625, -0.02075958251953125, 0.0020904541015625, 0.02494049072265625, 0.04779052734375, 0.07064056396484375, 0.0934906005859375, 0.11634063720703125, 0.139190673828125, 0.16204071044921875, 0.1848907470703125, 0.20774078369140625, 0.2305908203125, 0.25344085693359375, 0.2762908935546875, 0.29914093017578125, 0.321990966796875, 0.34484100341796875, 0.3676910400390625, 0.39054107666015625, 0.41339111328125, 0.43624114990234375, 0.4590911865234375, 0.48194122314453125, 0.504791259765625, 0.5276412963867188, 0.5504913330078125, 0.5733413696289062, 0.59619140625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 27.0, 55.0, 108.0, 170.0, 260.0, 166.0, 90.0, 33.0, 25.0, 14.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.505977630615234, -12.052691459655762, -11.599405288696289, -11.146119117736816, -10.692832946777344, -10.239546775817871, -9.786260604858398, -9.33297348022461, -8.879688262939453, -8.42640209197998, -7.973115921020508, -7.519829750061035, -7.0665435791015625, -6.61325740814209, -6.159970760345459, -5.706684589385986, -5.2533979415893555, -4.800111770629883, -4.34682559967041, -3.8935391902923584, -3.4402530193328857, -2.986966848373413, -2.5336804389953613, -2.0803942680358887, -1.627108097076416, -1.1738219261169434, -0.7205356359481812, -0.26724934577941895, 0.1860368251800537, 0.6393229961395264, 1.0926094055175781, 1.5458955764770508, 1.9991817474365234, 2.452467918395996, 2.9057540893554688, 3.3590404987335205, 3.812326669692993, 4.265612602233887, 4.718899250030518, 5.17218542098999, 5.625471591949463, 6.0787577629089355, 6.532043933868408, 6.985330581665039, 7.438616752624512, 7.891902923583984, 8.345189094543457, 8.79847526550293, 9.251761436462402, 9.705047607421875, 10.158333778381348, 10.61161994934082, 11.064906120300293, 11.518192291259766, 11.971479415893555, 12.424764633178711, 12.8780517578125, 13.331337928771973, 13.784624099731445, 14.237910270690918, 14.69119644165039, 15.144482612609863, 15.597768783569336, 16.051055908203125, 16.50434112548828]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 8.0, 5.0, 7.0, 12.0, 14.0, 10.0, 18.0, 26.0, 29.0, 24.0, 38.0, 32.0, 50.0, 41.0, 47.0, 73.0, 61.0, 75.0, 67.0, 53.0, 41.0, 42.0, 34.0, 47.0, 27.0, 26.0, 24.0, 9.0, 12.0, 14.0, 19.0, 7.0, 7.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.104803085327148, -9.786523818969727, -9.468244552612305, -9.149964332580566, -8.831685066223145, -8.513405799865723, -8.1951265335083, -7.876846790313721, -7.558567047119141, -7.240287780761719, -6.922008037567139, -6.603728771209717, -6.285449028015137, -5.967169761657715, -5.648890495300293, -5.330610752105713, -5.012331485748291, -4.694052219390869, -4.375772476196289, -4.057493209838867, -3.739213466644287, -3.4209342002868652, -3.1026546955108643, -2.7843751907348633, -2.4660956859588623, -2.1478161811828613, -1.8295366764068604, -1.511257290840149, -1.192977786064148, -0.874698281288147, -0.5564188957214355, -0.23813939094543457, 0.0801401138305664, 0.398419588804245, 0.7166990637779236, 1.0349785089492798, 1.3532580137252808, 1.6715375185012817, 1.9898169040679932, 2.308096408843994, 2.626375913619995, 2.944655418395996, 3.262934923171997, 3.581214427947998, 3.89949369430542, 4.2177734375, 4.536052703857422, 4.854331970214844, 5.172611713409424, 5.490890979766846, 5.809170722961426, 6.127449989318848, 6.445729732513428, 6.76400899887085, 7.08228874206543, 7.400568008422852, 7.718847274780273, 8.037126541137695, 8.355405807495117, 8.673686027526855, 8.991965293884277, 9.3102445602417, 9.628523826599121, 9.94680404663086, 10.265083312988281]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 12.0, 25.0, 49.0, 83.0, 199.0, 584.0, 2472.0, 26521.0, 2713625.0, 1431524.0, 16223.0, 1989.0, 620.0, 192.0, 81.0, 44.0, 20.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.66015625, -2.5995941162109375, -2.539031982421875, -2.4784698486328125, -2.41790771484375, -2.3573455810546875, -2.296783447265625, -2.2362213134765625, -2.1756591796875, -2.1150970458984375, -2.054534912109375, -1.9939727783203125, -1.93341064453125, -1.8728485107421875, -1.812286376953125, -1.7517242431640625, -1.691162109375, -1.6305999755859375, -1.570037841796875, -1.5094757080078125, -1.44891357421875, -1.3883514404296875, -1.327789306640625, -1.2672271728515625, -1.2066650390625, -1.1461029052734375, -1.085540771484375, -1.0249786376953125, -0.96441650390625, -0.9038543701171875, -0.843292236328125, -0.7827301025390625, -0.72216796875, -0.6616058349609375, -0.601043701171875, -0.5404815673828125, -0.47991943359375, -0.4193572998046875, -0.358795166015625, -0.2982330322265625, -0.2376708984375, -0.1771087646484375, -0.116546630859375, -0.0559844970703125, 0.00457763671875, 0.0651397705078125, 0.125701904296875, 0.1862640380859375, 0.246826171875, 0.3073883056640625, 0.367950439453125, 0.4285125732421875, 0.48907470703125, 0.5496368408203125, 0.610198974609375, 0.6707611083984375, 0.7313232421875, 0.7918853759765625, 0.852447509765625, 0.9130096435546875, 0.97357177734375, 1.0341339111328125, 1.094696044921875, 1.1552581787109375, 1.2158203125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 5.0, 10.0, 14.0, 16.0, 18.0, 30.0, 33.0, 35.0, 47.0, 61.0, 77.0, 58.0, 67.0, 80.0, 68.0, 66.0, 58.0, 48.0, 46.0, 36.0, 27.0, 32.0, 17.0, 9.0, 13.0, 10.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69287109375, -0.6707077026367188, -0.6485443115234375, -0.6263809204101562, -0.604217529296875, -0.5820541381835938, -0.5598907470703125, -0.5377273559570312, -0.51556396484375, -0.49340057373046875, -0.4712371826171875, -0.44907379150390625, -0.426910400390625, -0.40474700927734375, -0.3825836181640625, -0.36042022705078125, -0.3382568359375, -0.31609344482421875, -0.2939300537109375, -0.27176666259765625, -0.249603271484375, -0.22743988037109375, -0.2052764892578125, -0.18311309814453125, -0.16094970703125, -0.13878631591796875, -0.1166229248046875, -0.09445953369140625, -0.072296142578125, -0.05013275146484375, -0.0279693603515625, -0.00580596923828125, 0.016357421875, 0.03852081298828125, 0.0606842041015625, 0.08284759521484375, 0.105010986328125, 0.12717437744140625, 0.1493377685546875, 0.17150115966796875, 0.19366455078125, 0.21582794189453125, 0.2379913330078125, 0.26015472412109375, 0.282318115234375, 0.30448150634765625, 0.3266448974609375, 0.34880828857421875, 0.3709716796875, 0.39313507080078125, 0.4152984619140625, 0.43746185302734375, 0.459625244140625, 0.48178863525390625, 0.5039520263671875, 0.5261154174804688, 0.54827880859375, 0.5704421997070312, 0.5926055908203125, 0.6147689819335938, 0.636932373046875, 0.6590957641601562, 0.6812591552734375, 0.7034225463867188, 0.7255859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 4.0, 4.0, 12.0, 12.0, 21.0, 27.0, 33.0, 77.0, 77.0, 151.0, 321.0, 591.0, 1446.0, 5241.0, 40266.0, 1324140.0, 2744297.0, 66244.0, 7599.0, 2011.0, 789.0, 379.0, 208.0, 133.0, 76.0, 48.0, 26.0, 19.0, 9.0, 14.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5048828125, -1.4580078125, -1.4111328125, -1.3642578125, -1.3173828125, -1.2705078125, -1.2236328125, -1.1767578125, -1.1298828125, -1.0830078125, -1.0361328125, -0.9892578125, -0.9423828125, -0.8955078125, -0.8486328125, -0.8017578125, -0.7548828125, -0.7080078125, -0.6611328125, -0.6142578125, -0.5673828125, -0.5205078125, -0.4736328125, -0.4267578125, -0.3798828125, -0.3330078125, -0.2861328125, -0.2392578125, -0.1923828125, -0.1455078125, -0.0986328125, -0.0517578125, -0.0048828125, 0.0419921875, 0.0888671875, 0.1357421875, 0.1826171875, 0.2294921875, 0.2763671875, 0.3232421875, 0.3701171875, 0.4169921875, 0.4638671875, 0.5107421875, 0.5576171875, 0.6044921875, 0.6513671875, 0.6982421875, 0.7451171875, 0.7919921875, 0.8388671875, 0.8857421875, 0.9326171875, 0.9794921875, 1.0263671875, 1.0732421875, 1.1201171875, 1.1669921875, 1.2138671875, 1.2607421875, 1.3076171875, 1.3544921875, 1.4013671875, 1.4482421875, 1.4951171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 19.0, 23.0, 34.0, 31.0, 65.0, 95.0, 151.0, 273.0, 517.0, 719.0, 763.0, 546.0, 353.0, 182.0, 125.0, 53.0, 51.0, 19.0, 18.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81103515625, -0.7706832885742188, -0.7303314208984375, -0.6899795532226562, -0.649627685546875, -0.6092758178710938, -0.5689239501953125, -0.5285720825195312, -0.48822021484375, -0.44786834716796875, -0.4075164794921875, -0.36716461181640625, -0.326812744140625, -0.28646087646484375, -0.2461090087890625, -0.20575714111328125, -0.1654052734375, -0.12505340576171875, -0.0847015380859375, -0.04434967041015625, -0.003997802734375, 0.03635406494140625, 0.0767059326171875, 0.11705780029296875, 0.15740966796875, 0.19776153564453125, 0.2381134033203125, 0.27846527099609375, 0.318817138671875, 0.35916900634765625, 0.3995208740234375, 0.43987274169921875, 0.480224609375, 0.5205764770507812, 0.5609283447265625, 0.6012802124023438, 0.641632080078125, 0.6819839477539062, 0.7223358154296875, 0.7626876831054688, 0.80303955078125, 0.8433914184570312, 0.8837432861328125, 0.9240951538085938, 0.964447021484375, 1.0047988891601562, 1.0451507568359375, 1.0855026245117188, 1.1258544921875, 1.1662063598632812, 1.2065582275390625, 1.2469100952148438, 1.287261962890625, 1.3276138305664062, 1.3679656982421875, 1.4083175659179688, 1.44866943359375, 1.4890213012695312, 1.5293731689453125, 1.5697250366210938, 1.610076904296875, 1.6504287719726562, 1.6907806396484375, 1.7311325073242188, 1.771484375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 7.0, 10.0, 21.0, 86.0, 224.0, 308.0, 211.0, 76.0, 29.0, 16.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.411293029785156, -15.835451126098633, -15.259610176086426, -14.683768272399902, -14.107927322387695, -13.532085418701172, -12.956243515014648, -12.380402565002441, -11.804561614990234, -11.228719711303711, -10.652878761291504, -10.07703685760498, -9.501195907592773, -8.92535400390625, -8.349512100219727, -7.7736711502075195, -7.197829246520996, -6.621987819671631, -6.046146392822266, -5.470304489135742, -4.894463539123535, -4.318621635437012, -3.7427802085876465, -3.1669387817382812, -2.591097354888916, -2.015255928039551, -1.439414381980896, -0.8635728359222412, -0.287731409072876, 0.28811001777648926, 0.8639516830444336, 1.4397931098937988, 2.015634536743164, 2.5914759635925293, 3.1673173904418945, 3.743159055709839, 4.319000244140625, 4.894842147827148, 5.470683574676514, 6.046525001525879, 6.622366428375244, 7.198207855224609, 7.774049282073975, 8.34989070892334, 8.925732612609863, 9.50157356262207, 10.077415466308594, 10.653257369995117, 11.229098320007324, 11.804940223693848, 12.380781173706055, 12.956623077392578, 13.532464027404785, 14.108305931091309, 14.684146881103516, 15.259988784790039, 15.835830688476562, 16.411672592163086, 16.98751449584961, 17.5633544921875, 18.139196395874023, 18.715038299560547, 19.29088020324707, 19.866722106933594, 20.442562103271484]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 10.0, 12.0, 16.0, 18.0, 21.0, 32.0, 36.0, 33.0, 41.0, 47.0, 65.0, 62.0, 64.0, 59.0, 65.0, 52.0, 58.0, 41.0, 50.0, 34.0, 32.0, 30.0, 29.0, 20.0, 17.0, 13.0, 9.0, 9.0, 4.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.251339912414551, -6.0603742599487305, -5.869408130645752, -5.678442001342773, -5.487476348876953, -5.296510696411133, -5.105544567108154, -4.914578437805176, -4.7236127853393555, -4.532647132873535, -4.341681003570557, -4.150714874267578, -3.959749221801758, -3.7687833309173584, -3.577817440032959, -3.3868515491485596, -3.19588565826416, -3.0049197673797607, -2.8139538764953613, -2.622987985610962, -2.4320220947265625, -2.241056203842163, -2.0500903129577637, -1.8591244220733643, -1.6681585311889648, -1.4771926403045654, -1.286226749420166, -1.0952608585357666, -0.9042949676513672, -0.7133290767669678, -0.5223631858825684, -0.33139729499816895, -0.14043092727661133, 0.050534963607788086, 0.2415008544921875, 0.4324667453765869, 0.6234326362609863, 0.8143985271453857, 1.0053644180297852, 1.1963303089141846, 1.387296199798584, 1.5782620906829834, 1.7692279815673828, 1.9601938724517822, 2.1511597633361816, 2.342125654220581, 2.5330915451049805, 2.72405743598938, 2.9150233268737793, 3.1059892177581787, 3.296955108642578, 3.4879209995269775, 3.678886890411377, 3.8698527812957764, 4.060818672180176, 4.251784324645996, 4.442750453948975, 4.633716583251953, 4.824682235717773, 5.015647888183594, 5.206614017486572, 5.397580146789551, 5.588545799255371, 5.779511451721191, 5.97047758102417]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 8.0, 8.0, 16.0, 14.0, 28.0, 44.0, 84.0, 120.0, 206.0, 463.0, 979.0, 2324.0, 6638.0, 21784.0, 89406.0, 434928.0, 385295.0, 76883.0, 19391.0, 5942.0, 2123.0, 889.0, 431.0, 233.0, 122.0, 78.0, 40.0, 21.0, 21.0, 13.0, 6.0, 9.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1640625, -1.1251983642578125, -1.086334228515625, -1.0474700927734375, -1.00860595703125, -0.9697418212890625, -0.930877685546875, -0.8920135498046875, -0.8531494140625, -0.8142852783203125, -0.775421142578125, -0.7365570068359375, -0.69769287109375, -0.6588287353515625, -0.619964599609375, -0.5811004638671875, -0.542236328125, -0.5033721923828125, -0.464508056640625, -0.4256439208984375, -0.38677978515625, -0.3479156494140625, -0.309051513671875, -0.2701873779296875, -0.2313232421875, -0.1924591064453125, -0.153594970703125, -0.1147308349609375, -0.07586669921875, -0.0370025634765625, 0.001861572265625, 0.0407257080078125, 0.07958984375, 0.1184539794921875, 0.157318115234375, 0.1961822509765625, 0.23504638671875, 0.2739105224609375, 0.312774658203125, 0.3516387939453125, 0.3905029296875, 0.4293670654296875, 0.468231201171875, 0.5070953369140625, 0.54595947265625, 0.5848236083984375, 0.623687744140625, 0.6625518798828125, 0.701416015625, 0.7402801513671875, 0.779144287109375, 0.8180084228515625, 0.85687255859375, 0.8957366943359375, 0.934600830078125, 0.9734649658203125, 1.0123291015625, 1.0511932373046875, 1.090057373046875, 1.1289215087890625, 1.16778564453125, 1.2066497802734375, 1.245513916015625, 1.2843780517578125, 1.3232421875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 5.0, 0.0, 5.0, 4.0, 6.0, 12.0, 14.0, 12.0, 17.0, 25.0, 30.0, 35.0, 30.0, 31.0, 37.0, 57.0, 40.0, 47.0, 56.0, 39.0, 56.0, 61.0, 53.0, 38.0, 36.0, 34.0, 44.0, 24.0, 25.0, 26.0, 15.0, 16.0, 13.0, 8.0, 7.0, 13.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.52099609375, -0.5050048828125, -0.489013671875, -0.4730224609375, -0.45703125, -0.4410400390625, -0.425048828125, -0.4090576171875, -0.39306640625, -0.3770751953125, -0.361083984375, -0.3450927734375, -0.3291015625, -0.3131103515625, -0.297119140625, -0.2811279296875, -0.26513671875, -0.2491455078125, -0.233154296875, -0.2171630859375, -0.201171875, -0.1851806640625, -0.169189453125, -0.1531982421875, -0.13720703125, -0.1212158203125, -0.105224609375, -0.0892333984375, -0.0732421875, -0.0572509765625, -0.041259765625, -0.0252685546875, -0.00927734375, 0.0067138671875, 0.022705078125, 0.0386962890625, 0.0546875, 0.0706787109375, 0.086669921875, 0.1026611328125, 0.11865234375, 0.1346435546875, 0.150634765625, 0.1666259765625, 0.1826171875, 0.1986083984375, 0.214599609375, 0.2305908203125, 0.24658203125, 0.2625732421875, 0.278564453125, 0.2945556640625, 0.310546875, 0.3265380859375, 0.342529296875, 0.3585205078125, 0.37451171875, 0.3905029296875, 0.406494140625, 0.4224853515625, 0.4384765625, 0.4544677734375, 0.470458984375, 0.4864501953125, 0.50244140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 16.0, 16.0, 21.0, 32.0, 53.0, 52.0, 75.0, 151.0, 262.0, 472.0, 920.0, 2093.0, 6362.0, 35939.0, 622743.0, 343104.0, 26906.0, 5468.0, 1874.0, 885.0, 448.0, 206.0, 147.0, 98.0, 53.0, 39.0, 38.0, 22.0, 15.0, 10.0, 9.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.7517852783203125, -1.684234619140625, -1.6166839599609375, -1.54913330078125, -1.4815826416015625, -1.414031982421875, -1.3464813232421875, -1.2789306640625, -1.2113800048828125, -1.143829345703125, -1.0762786865234375, -1.00872802734375, -0.9411773681640625, -0.873626708984375, -0.8060760498046875, -0.738525390625, -0.6709747314453125, -0.603424072265625, -0.5358734130859375, -0.46832275390625, -0.4007720947265625, -0.333221435546875, -0.2656707763671875, -0.1981201171875, -0.1305694580078125, -0.063018798828125, 0.0045318603515625, 0.07208251953125, 0.1396331787109375, 0.207183837890625, 0.2747344970703125, 0.34228515625, 0.4098358154296875, 0.477386474609375, 0.5449371337890625, 0.61248779296875, 0.6800384521484375, 0.747589111328125, 0.8151397705078125, 0.8826904296875, 0.9502410888671875, 1.017791748046875, 1.0853424072265625, 1.15289306640625, 1.2204437255859375, 1.287994384765625, 1.3555450439453125, 1.423095703125, 1.4906463623046875, 1.558197021484375, 1.6257476806640625, 1.69329833984375, 1.7608489990234375, 1.828399658203125, 1.8959503173828125, 1.9635009765625, 2.0310516357421875, 2.098602294921875, 2.1661529541015625, 2.23370361328125, 2.3012542724609375, 2.368804931640625, 2.4363555908203125, 2.50390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 2.0, 10.0, 6.0, 9.0, 16.0, 14.0, 15.0, 16.0, 16.0, 21.0, 29.0, 32.0, 23.0, 39.0, 42.0, 45.0, 43.0, 51.0, 47.0, 44.0, 43.0, 52.0, 48.0, 41.0, 36.0, 34.0, 30.0, 29.0, 30.0, 24.0, 17.0, 14.0, 23.0, 12.0, 9.0, 3.0, 6.0, 3.0, 1.0, 5.0, 4.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.0234375, -1.9607696533203125, -1.898101806640625, -1.8354339599609375, -1.77276611328125, -1.7100982666015625, -1.647430419921875, -1.5847625732421875, -1.5220947265625, -1.4594268798828125, -1.396759033203125, -1.3340911865234375, -1.27142333984375, -1.2087554931640625, -1.146087646484375, -1.0834197998046875, -1.020751953125, -0.9580841064453125, -0.895416259765625, -0.8327484130859375, -0.77008056640625, -0.7074127197265625, -0.644744873046875, -0.5820770263671875, -0.5194091796875, -0.4567413330078125, -0.394073486328125, -0.3314056396484375, -0.26873779296875, -0.2060699462890625, -0.143402099609375, -0.0807342529296875, -0.01806640625, 0.0446014404296875, 0.107269287109375, 0.1699371337890625, 0.23260498046875, 0.2952728271484375, 0.357940673828125, 0.4206085205078125, 0.4832763671875, 0.5459442138671875, 0.608612060546875, 0.6712799072265625, 0.73394775390625, 0.7966156005859375, 0.859283447265625, 0.9219512939453125, 0.984619140625, 1.0472869873046875, 1.109954833984375, 1.1726226806640625, 1.23529052734375, 1.2979583740234375, 1.360626220703125, 1.4232940673828125, 1.4859619140625, 1.5486297607421875, 1.611297607421875, 1.6739654541015625, 1.73663330078125, 1.7993011474609375, 1.861968994140625, 1.9246368408203125, 1.9873046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 3.0, 6.0, 8.0, 4.0, 8.0, 7.0, 14.0, 14.0, 18.0, 21.0, 29.0, 43.0, 72.0, 104.0, 149.0, 281.0, 550.0, 1118.0, 3038.0, 10015.0, 43070.0, 353647.0, 570082.0, 49100.0, 11333.0, 3299.0, 1226.0, 526.0, 272.0, 158.0, 102.0, 64.0, 42.0, 32.0, 25.0, 19.0, 11.0, 13.0, 6.0, 8.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.90625, -0.8803863525390625, -0.854522705078125, -0.8286590576171875, -0.80279541015625, -0.7769317626953125, -0.751068115234375, -0.7252044677734375, -0.6993408203125, -0.6734771728515625, -0.647613525390625, -0.6217498779296875, -0.59588623046875, -0.5700225830078125, -0.544158935546875, -0.5182952880859375, -0.492431640625, -0.4665679931640625, -0.440704345703125, -0.4148406982421875, -0.38897705078125, -0.3631134033203125, -0.337249755859375, -0.3113861083984375, -0.2855224609375, -0.2596588134765625, -0.233795166015625, -0.2079315185546875, -0.18206787109375, -0.1562042236328125, -0.130340576171875, -0.1044769287109375, -0.07861328125, -0.0527496337890625, -0.026885986328125, -0.0010223388671875, 0.02484130859375, 0.0507049560546875, 0.076568603515625, 0.1024322509765625, 0.1282958984375, 0.1541595458984375, 0.180023193359375, 0.2058868408203125, 0.23175048828125, 0.2576141357421875, 0.283477783203125, 0.3093414306640625, 0.335205078125, 0.3610687255859375, 0.386932373046875, 0.4127960205078125, 0.43865966796875, 0.4645233154296875, 0.490386962890625, 0.5162506103515625, 0.5421142578125, 0.5679779052734375, 0.593841552734375, 0.6197052001953125, 0.64556884765625, 0.6714324951171875, 0.697296142578125, 0.7231597900390625, 0.7490234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 7.0, 9.0, 10.0, 26.0, 26.0, 43.0, 74.0, 120.0, 181.0, 185.0, 98.0, 56.0, 33.0, 27.0, 16.0, 14.0, 12.0, 15.0, 10.0, 7.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021910667419433594, -0.00021095573902130127, -0.0002028048038482666, -0.00019465386867523193, -0.00018650293350219727, -0.0001783519983291626, -0.00017020106315612793, -0.00016205012798309326, -0.0001538991928100586, -0.00014574825763702393, -0.00013759732246398926, -0.0001294463872909546, -0.00012129545211791992, -0.00011314451694488525, -0.00010499358177185059, -9.684264659881592e-05, -8.869171142578125e-05, -8.054077625274658e-05, -7.238984107971191e-05, -6.423890590667725e-05, -5.608797073364258e-05, -4.793703556060791e-05, -3.978610038757324e-05, -3.1635165214538574e-05, -2.3484230041503906e-05, -1.5333294868469238e-05, -7.18235969543457e-06, 9.685754776000977e-07, 9.119510650634766e-06, 1.7270445823669434e-05, 2.54213809967041e-05, 3.357231616973877e-05, 4.172325134277344e-05, 4.9874186515808105e-05, 5.8025121688842773e-05, 6.617605686187744e-05, 7.432699203491211e-05, 8.247792720794678e-05, 9.062886238098145e-05, 9.877979755401611e-05, 0.00010693073272705078, 0.00011508166790008545, 0.00012323260307312012, 0.00013138353824615479, 0.00013953447341918945, 0.00014768540859222412, 0.0001558363437652588, 0.00016398727893829346, 0.00017213821411132812, 0.0001802891492843628, 0.00018844008445739746, 0.00019659101963043213, 0.0002047419548034668, 0.00021289288997650146, 0.00022104382514953613, 0.0002291947603225708, 0.00023734569549560547, 0.00024549663066864014, 0.0002536475658416748, 0.00026179850101470947, 0.00026994943618774414, 0.0002781003713607788, 0.0002862513065338135, 0.00029440224170684814, 0.0003025531768798828]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 18.0, 22.0, 29.0, 43.0, 77.0, 92.0, 152.0, 316.0, 570.0, 1258.0, 3085.0, 10395.0, 49117.0, 639700.0, 295895.0, 34906.0, 8001.0, 2532.0, 1102.0, 477.0, 300.0, 162.0, 97.0, 67.0, 39.0, 23.0, 18.0, 10.0, 9.0, 5.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.95947265625, -0.9327468872070312, -0.9060211181640625, -0.8792953491210938, -0.852569580078125, -0.8258438110351562, -0.7991180419921875, -0.7723922729492188, -0.74566650390625, -0.7189407348632812, -0.6922149658203125, -0.6654891967773438, -0.638763427734375, -0.6120376586914062, -0.5853118896484375, -0.5585861206054688, -0.5318603515625, -0.5051345825195312, -0.4784088134765625, -0.45168304443359375, -0.424957275390625, -0.39823150634765625, -0.3715057373046875, -0.34477996826171875, -0.31805419921875, -0.29132843017578125, -0.2646026611328125, -0.23787689208984375, -0.211151123046875, -0.18442535400390625, -0.1576995849609375, -0.13097381591796875, -0.104248046875, -0.07752227783203125, -0.0507965087890625, -0.02407073974609375, 0.002655029296875, 0.02938079833984375, 0.0561065673828125, 0.08283233642578125, 0.10955810546875, 0.13628387451171875, 0.1630096435546875, 0.18973541259765625, 0.216461181640625, 0.24318695068359375, 0.2699127197265625, 0.29663848876953125, 0.3233642578125, 0.35009002685546875, 0.3768157958984375, 0.40354156494140625, 0.430267333984375, 0.45699310302734375, 0.4837188720703125, 0.5104446411132812, 0.53717041015625, 0.5638961791992188, 0.5906219482421875, 0.6173477172851562, 0.644073486328125, 0.6707992553710938, 0.6975250244140625, 0.7242507934570312, 0.7509765625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 4.0, 1.0, 10.0, 8.0, 5.0, 6.0, 8.0, 15.0, 13.0, 23.0, 13.0, 29.0, 35.0, 34.0, 58.0, 55.0, 62.0, 74.0, 67.0, 93.0, 63.0, 61.0, 40.0, 35.0, 32.0, 24.0, 16.0, 13.0, 18.0, 9.0, 10.0, 7.0, 3.0, 8.0, 7.0, 7.0, 6.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.486572265625, -0.4714012145996094, -0.45623016357421875, -0.4410591125488281, -0.4258880615234375, -0.4107170104980469, -0.39554595947265625, -0.3803749084472656, -0.365203857421875, -0.3500328063964844, -0.33486175537109375, -0.3196907043457031, -0.3045196533203125, -0.2893486022949219, -0.27417755126953125, -0.2590065002441406, -0.24383544921875, -0.22866439819335938, -0.21349334716796875, -0.19832229614257812, -0.1831512451171875, -0.16798019409179688, -0.15280914306640625, -0.13763809204101562, -0.122467041015625, -0.10729598999023438, -0.09212493896484375, -0.07695388793945312, -0.0617828369140625, -0.046611785888671875, -0.03144073486328125, -0.016269683837890625, -0.0010986328125, 0.014072418212890625, 0.02924346923828125, 0.044414520263671875, 0.0595855712890625, 0.07475662231445312, 0.08992767333984375, 0.10509872436523438, 0.120269775390625, 0.13544082641601562, 0.15061187744140625, 0.16578292846679688, 0.1809539794921875, 0.19612503051757812, 0.21129608154296875, 0.22646713256835938, 0.24163818359375, 0.2568092346191406, 0.27198028564453125, 0.2871513366699219, 0.3023223876953125, 0.3174934387207031, 0.33266448974609375, 0.3478355407714844, 0.363006591796875, 0.3781776428222656, 0.39334869384765625, 0.4085197448730469, 0.4236907958984375, 0.4388618469238281, 0.45403289794921875, 0.4692039489746094, 0.484375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 9.0, 30.0, 77.0, 164.0, 345.0, 216.0, 89.0, 26.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.00396728515625, -19.39335060119629, -18.782733917236328, -18.172119140625, -17.56150245666504, -16.950885772705078, -16.340269088745117, -15.729652404785156, -15.119036674499512, -14.50841999053955, -13.897804260253906, -13.287187576293945, -12.676570892333984, -12.06595516204834, -11.455338478088379, -10.844722747802734, -10.234106063842773, -9.623489379882812, -9.012873649597168, -8.402256965637207, -7.791640758514404, -7.181024551391602, -6.570407867431641, -5.959791660308838, -5.349175453186035, -4.738559246063232, -4.12794303894043, -3.5173263549804688, -2.906710147857666, -2.2960939407348633, -1.6854774951934814, -1.0748610496520996, -0.4642448425292969, 0.1463714838027954, 0.7569878101348877, 1.36760413646698, 1.9782204627990723, 2.588836669921875, 3.199453115463257, 3.8100695610046387, 4.420685768127441, 5.031301975250244, 5.641918182373047, 6.252534866333008, 6.8631510734558105, 7.473767280578613, 8.084383964538574, 8.694999694824219, 9.30561637878418, 9.91623306274414, 10.526848793029785, 11.137465476989746, 11.74808120727539, 12.358697891235352, 12.969314575195312, 13.579931259155273, 14.190546989440918, 14.801163673400879, 15.411779403686523, 16.022396087646484, 16.633012771606445, 17.243629455566406, 17.854244232177734, 18.464860916137695, 19.075477600097656]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 9.0, 10.0, 7.0, 5.0, 19.0, 18.0, 14.0, 23.0, 16.0, 21.0, 31.0, 39.0, 37.0, 45.0, 39.0, 52.0, 75.0, 64.0, 65.0, 62.0, 42.0, 41.0, 27.0, 33.0, 22.0, 36.0, 18.0, 24.0, 13.0, 16.0, 14.0, 10.0, 8.0, 6.0, 7.0, 4.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.925919532775879, -8.65841007232666, -8.390901565551758, -8.123392105102539, -7.855883598327637, -7.588374614715576, -7.320865631103516, -7.053356170654297, -6.7858476638793945, -6.518338680267334, -6.250829696655273, -5.983320713043213, -5.715811729431152, -5.448302745819092, -5.180793762207031, -4.9132843017578125, -4.645775318145752, -4.378266334533691, -4.110757350921631, -3.8432483673095703, -3.5757393836975098, -3.308230400085449, -3.0407211780548096, -2.773212194442749, -2.5057032108306885, -2.238194227218628, -1.9706852436065674, -1.7031761407852173, -1.4356671571731567, -1.1681581735610962, -0.9006490707397461, -0.6331400871276855, -0.365631103515625, -0.09812209010124207, 0.16938692331314087, 0.4368959665298462, 0.7044049501419067, 0.9719139337539673, 1.2394230365753174, 1.506932020187378, 1.7744410037994385, 2.041949987411499, 2.3094589710235596, 2.576968193054199, 2.8444771766662598, 3.1119861602783203, 3.379495143890381, 3.6470041275024414, 3.914513111114502, 4.1820220947265625, 4.449531078338623, 4.717040061950684, 4.984549045562744, 5.252058029174805, 5.519567489624023, 5.787075996398926, 6.0545854568481445, 6.322094440460205, 6.589603424072266, 6.857112407684326, 7.124621391296387, 7.392130374908447, 7.659639358520508, 7.927148818969727, 8.194657325744629]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 9.0, 10.0, 17.0, 23.0, 21.0, 44.0, 85.0, 155.0, 288.0, 662.0, 1753.0, 6696.0, 50750.0, 1691167.0, 2359379.0, 69899.0, 9121.0, 2433.0, 939.0, 411.0, 166.0, 105.0, 58.0, 34.0, 19.0, 12.0, 8.0, 4.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.07025146484375, -1.0321044921875, -0.99395751953125, -0.955810546875, -0.91766357421875, -0.8795166015625, -0.84136962890625, -0.80322265625, -0.76507568359375, -0.7269287109375, -0.68878173828125, -0.650634765625, -0.61248779296875, -0.5743408203125, -0.53619384765625, -0.498046875, -0.45989990234375, -0.4217529296875, -0.38360595703125, -0.345458984375, -0.30731201171875, -0.2691650390625, -0.23101806640625, -0.19287109375, -0.15472412109375, -0.1165771484375, -0.07843017578125, -0.040283203125, -0.00213623046875, 0.0360107421875, 0.07415771484375, 0.1123046875, 0.15045166015625, 0.1885986328125, 0.22674560546875, 0.264892578125, 0.30303955078125, 0.3411865234375, 0.37933349609375, 0.41748046875, 0.45562744140625, 0.4937744140625, 0.53192138671875, 0.570068359375, 0.60821533203125, 0.6463623046875, 0.68450927734375, 0.72265625, 0.76080322265625, 0.7989501953125, 0.83709716796875, 0.875244140625, 0.91339111328125, 0.9515380859375, 0.98968505859375, 1.02783203125, 1.06597900390625, 1.1041259765625, 1.14227294921875, 1.180419921875, 1.21856689453125, 1.2567138671875, 1.29486083984375, 1.3330078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 2.0, 10.0, 8.0, 9.0, 16.0, 17.0, 38.0, 44.0, 44.0, 44.0, 68.0, 51.0, 70.0, 72.0, 63.0, 58.0, 65.0, 81.0, 63.0, 38.0, 36.0, 27.0, 14.0, 16.0, 10.0, 10.0, 6.0, 7.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8037109375, -0.7819976806640625, -0.760284423828125, -0.7385711669921875, -0.71685791015625, -0.6951446533203125, -0.673431396484375, -0.6517181396484375, -0.6300048828125, -0.6082916259765625, -0.586578369140625, -0.5648651123046875, -0.54315185546875, -0.5214385986328125, -0.499725341796875, -0.4780120849609375, -0.456298828125, -0.4345855712890625, -0.412872314453125, -0.3911590576171875, -0.36944580078125, -0.3477325439453125, -0.326019287109375, -0.3043060302734375, -0.2825927734375, -0.2608795166015625, -0.239166259765625, -0.2174530029296875, -0.19573974609375, -0.1740264892578125, -0.152313232421875, -0.1305999755859375, -0.10888671875, -0.0871734619140625, -0.065460205078125, -0.0437469482421875, -0.02203369140625, -0.0003204345703125, 0.021392822265625, 0.0431060791015625, 0.0648193359375, 0.0865325927734375, 0.108245849609375, 0.1299591064453125, 0.15167236328125, 0.1733856201171875, 0.195098876953125, 0.2168121337890625, 0.238525390625, 0.2602386474609375, 0.281951904296875, 0.3036651611328125, 0.32537841796875, 0.3470916748046875, 0.368804931640625, 0.3905181884765625, 0.4122314453125, 0.4339447021484375, 0.455657958984375, 0.4773712158203125, 0.49908447265625, 0.5207977294921875, 0.542510986328125, 0.5642242431640625, 0.5859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 7.0, 12.0, 14.0, 36.0, 54.0, 107.0, 218.0, 533.0, 1510.0, 6247.0, 137569.0, 3992921.0, 47989.0, 4771.0, 1284.0, 486.0, 227.0, 123.0, 59.0, 42.0, 28.0, 15.0, 9.0, 8.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.490936279296875, -2.41156005859375, -2.332183837890625, -2.2528076171875, -2.173431396484375, -2.09405517578125, -2.014678955078125, -1.935302734375, -1.855926513671875, -1.77655029296875, -1.697174072265625, -1.6177978515625, -1.538421630859375, -1.45904541015625, -1.379669189453125, -1.30029296875, -1.220916748046875, -1.14154052734375, -1.062164306640625, -0.9827880859375, -0.903411865234375, -0.82403564453125, -0.744659423828125, -0.665283203125, -0.585906982421875, -0.50653076171875, -0.427154541015625, -0.3477783203125, -0.268402099609375, -0.18902587890625, -0.109649658203125, -0.0302734375, 0.049102783203125, 0.12847900390625, 0.207855224609375, 0.2872314453125, 0.366607666015625, 0.44598388671875, 0.525360107421875, 0.604736328125, 0.684112548828125, 0.76348876953125, 0.842864990234375, 0.9222412109375, 1.001617431640625, 1.08099365234375, 1.160369873046875, 1.23974609375, 1.319122314453125, 1.39849853515625, 1.477874755859375, 1.5572509765625, 1.636627197265625, 1.71600341796875, 1.795379638671875, 1.874755859375, 1.954132080078125, 2.03350830078125, 2.112884521484375, 2.1922607421875, 2.271636962890625, 2.35101318359375, 2.430389404296875, 2.509765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 13.0, 10.0, 26.0, 41.0, 80.0, 231.0, 494.0, 1042.0, 1146.0, 558.0, 215.0, 109.0, 45.0, 30.0, 11.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.38946533203125, -1.3316650390625, -1.27386474609375, -1.216064453125, -1.15826416015625, -1.1004638671875, -1.04266357421875, -0.98486328125, -0.92706298828125, -0.8692626953125, -0.81146240234375, -0.753662109375, -0.69586181640625, -0.6380615234375, -0.58026123046875, -0.5224609375, -0.46466064453125, -0.4068603515625, -0.34906005859375, -0.291259765625, -0.23345947265625, -0.1756591796875, -0.11785888671875, -0.06005859375, -0.00225830078125, 0.0555419921875, 0.11334228515625, 0.171142578125, 0.22894287109375, 0.2867431640625, 0.34454345703125, 0.40234375, 0.46014404296875, 0.5179443359375, 0.57574462890625, 0.633544921875, 0.69134521484375, 0.7491455078125, 0.80694580078125, 0.86474609375, 0.92254638671875, 0.9803466796875, 1.03814697265625, 1.095947265625, 1.15374755859375, 1.2115478515625, 1.26934814453125, 1.3271484375, 1.38494873046875, 1.4427490234375, 1.50054931640625, 1.558349609375, 1.61614990234375, 1.6739501953125, 1.73175048828125, 1.78955078125, 1.84735107421875, 1.9051513671875, 1.96295166015625, 2.020751953125, 2.07855224609375, 2.1363525390625, 2.19415283203125, 2.251953125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 9.0, 22.0, 53.0, 103.0, 216.0, 262.0, 169.0, 76.0, 37.0, 15.0, 8.0, 5.0, 4.0, 2.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.450057983398438, -10.977423667907715, -10.504789352416992, -10.03215503692627, -9.559520721435547, -9.086886405944824, -8.614252090454102, -8.141616821289062, -7.668982982635498, -7.196348667144775, -6.723714351654053, -6.251079559326172, -5.778445243835449, -5.305810928344727, -4.833176612854004, -4.360542297363281, -3.8879079818725586, -3.415273666381836, -2.9426393508911133, -2.4700047969818115, -1.9973704814910889, -1.5247361660003662, -1.0521016120910645, -0.5794672966003418, -0.10683298110961914, 0.3658013939857483, 0.8384357690811157, 1.311070203781128, 1.7837045192718506, 2.2563388347625732, 2.728973388671875, 3.2016077041625977, 3.6742420196533203, 4.146876335144043, 4.619510650634766, 5.092144966125488, 5.564779281616211, 6.037413597106934, 6.5100483894348145, 6.982682704925537, 7.45531702041626, 7.927951335906982, 8.400586128234863, 8.873220443725586, 9.345854759216309, 9.818489074707031, 10.291123390197754, 10.763757705688477, 11.2363920211792, 11.709026336669922, 12.181660652160645, 12.654294967651367, 13.12692928314209, 13.599563598632812, 14.072198867797852, 14.544832229614258, 15.017467498779297, 15.49010181427002, 15.962736129760742, 16.43537139892578, 16.908004760742188, 17.380640029907227, 17.853273391723633, 18.325908660888672, 18.798542022705078]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 1.0, 5.0, 9.0, 8.0, 13.0, 25.0, 30.0, 40.0, 34.0, 62.0, 51.0, 61.0, 67.0, 76.0, 65.0, 63.0, 70.0, 53.0, 42.0, 39.0, 28.0, 35.0, 33.0, 18.0, 22.0, 10.0, 12.0, 13.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.846399784088135, -5.643702983856201, -5.441006183624268, -5.238309860229492, -5.035613059997559, -4.832916259765625, -4.630219459533691, -4.427522659301758, -4.224825859069824, -4.022129058837891, -3.819432497024536, -3.6167356967926025, -3.414039134979248, -3.2113423347473145, -3.008645534515381, -2.8059487342834473, -2.603252410888672, -2.4005556106567383, -2.197859048843384, -1.9951622486114502, -1.7924655675888062, -1.589768886566162, -1.3870720863342285, -1.1843754053115845, -0.9816787242889404, -0.7789820432662964, -0.5762853026390076, -0.37358856201171875, -0.1708918809890747, 0.031804800033569336, 0.23450160026550293, 0.437198281288147, 0.6398944854736328, 0.8425911664962769, 1.045287847518921, 1.2479846477508545, 1.4506813287734985, 1.6533780097961426, 1.8560748100280762, 2.0587716102600098, 2.2614681720733643, 2.464164972305298, 2.6668615341186523, 2.869558334350586, 3.0722551345825195, 3.274951696395874, 3.4776484966278076, 3.680345058441162, 3.8830418586730957, 4.085738658905029, 4.288435459136963, 4.491131782531738, 4.693828582763672, 4.8965253829956055, 5.099222183227539, 5.301918983459473, 5.504615783691406, 5.70731258392334, 5.910009384155273, 6.112706184387207, 6.315402507781982, 6.518099308013916, 6.72079610824585, 6.923492908477783, 7.126189231872559]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 15.0, 15.0, 17.0, 24.0, 53.0, 75.0, 127.0, 242.0, 462.0, 1115.0, 3170.0, 10568.0, 48196.0, 291555.0, 539523.0, 122051.0, 22428.0, 5600.0, 1827.0, 697.0, 311.0, 151.0, 108.0, 63.0, 33.0, 31.0, 24.0, 13.0, 9.0, 10.0, 7.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.943359375, -0.90875244140625, -0.8741455078125, -0.83953857421875, -0.804931640625, -0.77032470703125, -0.7357177734375, -0.70111083984375, -0.66650390625, -0.63189697265625, -0.5972900390625, -0.56268310546875, -0.528076171875, -0.49346923828125, -0.4588623046875, -0.42425537109375, -0.3896484375, -0.35504150390625, -0.3204345703125, -0.28582763671875, -0.251220703125, -0.21661376953125, -0.1820068359375, -0.14739990234375, -0.11279296875, -0.07818603515625, -0.0435791015625, -0.00897216796875, 0.025634765625, 0.06024169921875, 0.0948486328125, 0.12945556640625, 0.1640625, 0.19866943359375, 0.2332763671875, 0.26788330078125, 0.302490234375, 0.33709716796875, 0.3717041015625, 0.40631103515625, 0.44091796875, 0.47552490234375, 0.5101318359375, 0.54473876953125, 0.579345703125, 0.61395263671875, 0.6485595703125, 0.68316650390625, 0.7177734375, 0.75238037109375, 0.7869873046875, 0.82159423828125, 0.856201171875, 0.89080810546875, 0.9254150390625, 0.96002197265625, 0.99462890625, 1.02923583984375, 1.0638427734375, 1.09844970703125, 1.133056640625, 1.16766357421875, 1.2022705078125, 1.23687744140625, 1.271484375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 3.0, 7.0, 10.0, 16.0, 22.0, 30.0, 25.0, 34.0, 39.0, 46.0, 51.0, 48.0, 72.0, 55.0, 52.0, 73.0, 64.0, 54.0, 54.0, 55.0, 36.0, 28.0, 23.0, 17.0, 23.0, 16.0, 13.0, 9.0, 10.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.6799545288085938, -0.6602020263671875, -0.6404495239257812, -0.620697021484375, -0.6009445190429688, -0.5811920166015625, -0.5614395141601562, -0.54168701171875, -0.5219345092773438, -0.5021820068359375, -0.48242950439453125, -0.462677001953125, -0.44292449951171875, -0.4231719970703125, -0.40341949462890625, -0.3836669921875, -0.36391448974609375, -0.3441619873046875, -0.32440948486328125, -0.304656982421875, -0.28490447998046875, -0.2651519775390625, -0.24539947509765625, -0.22564697265625, -0.20589447021484375, -0.1861419677734375, -0.16638946533203125, -0.146636962890625, -0.12688446044921875, -0.1071319580078125, -0.08737945556640625, -0.067626953125, -0.04787445068359375, -0.0281219482421875, -0.00836944580078125, 0.011383056640625, 0.03113555908203125, 0.0508880615234375, 0.07064056396484375, 0.09039306640625, 0.11014556884765625, 0.1298980712890625, 0.14965057373046875, 0.169403076171875, 0.18915557861328125, 0.2089080810546875, 0.22866058349609375, 0.2484130859375, 0.26816558837890625, 0.2879180908203125, 0.30767059326171875, 0.327423095703125, 0.34717559814453125, 0.3669281005859375, 0.38668060302734375, 0.40643310546875, 0.42618560791015625, 0.4459381103515625, 0.46569061279296875, 0.485443115234375, 0.5051956176757812, 0.5249481201171875, 0.5447006225585938, 0.564453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 7.0, 19.0, 27.0, 31.0, 53.0, 93.0, 139.0, 323.0, 893.0, 3286.0, 18753.0, 228646.0, 734531.0, 52216.0, 6970.0, 1566.0, 516.0, 205.0, 93.0, 66.0, 37.0, 27.0, 18.0, 9.0, 6.0, 4.0, 3.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4716796875, -1.4195404052734375, -1.367401123046875, -1.3152618408203125, -1.26312255859375, -1.2109832763671875, -1.158843994140625, -1.1067047119140625, -1.0545654296875, -1.0024261474609375, -0.950286865234375, -0.8981475830078125, -0.84600830078125, -0.7938690185546875, -0.741729736328125, -0.6895904541015625, -0.637451171875, -0.5853118896484375, -0.533172607421875, -0.4810333251953125, -0.42889404296875, -0.3767547607421875, -0.324615478515625, -0.2724761962890625, -0.2203369140625, -0.1681976318359375, -0.116058349609375, -0.0639190673828125, -0.01177978515625, 0.0403594970703125, 0.092498779296875, 0.1446380615234375, 0.19677734375, 0.2489166259765625, 0.301055908203125, 0.3531951904296875, 0.40533447265625, 0.4574737548828125, 0.509613037109375, 0.5617523193359375, 0.6138916015625, 0.6660308837890625, 0.718170166015625, 0.7703094482421875, 0.82244873046875, 0.8745880126953125, 0.926727294921875, 0.9788665771484375, 1.031005859375, 1.0831451416015625, 1.135284423828125, 1.1874237060546875, 1.23956298828125, 1.2917022705078125, 1.343841552734375, 1.3959808349609375, 1.4481201171875, 1.5002593994140625, 1.552398681640625, 1.6045379638671875, 1.65667724609375, 1.7088165283203125, 1.760955810546875, 1.8130950927734375, 1.865234375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 7.0, 9.0, 8.0, 20.0, 15.0, 15.0, 24.0, 23.0, 27.0, 47.0, 46.0, 42.0, 41.0, 63.0, 63.0, 61.0, 60.0, 53.0, 43.0, 63.0, 48.0, 35.0, 29.0, 36.0, 16.0, 17.0, 13.0, 19.0, 11.0, 8.0, 3.0, 4.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.89453125, -1.82769775390625, -1.7608642578125, -1.69403076171875, -1.627197265625, -1.56036376953125, -1.4935302734375, -1.42669677734375, -1.35986328125, -1.29302978515625, -1.2261962890625, -1.15936279296875, -1.092529296875, -1.02569580078125, -0.9588623046875, -0.89202880859375, -0.8251953125, -0.75836181640625, -0.6915283203125, -0.62469482421875, -0.557861328125, -0.49102783203125, -0.4241943359375, -0.35736083984375, -0.29052734375, -0.22369384765625, -0.1568603515625, -0.09002685546875, -0.023193359375, 0.04364013671875, 0.1104736328125, 0.17730712890625, 0.244140625, 0.31097412109375, 0.3778076171875, 0.44464111328125, 0.511474609375, 0.57830810546875, 0.6451416015625, 0.71197509765625, 0.77880859375, 0.84564208984375, 0.9124755859375, 0.97930908203125, 1.046142578125, 1.11297607421875, 1.1798095703125, 1.24664306640625, 1.3134765625, 1.38031005859375, 1.4471435546875, 1.51397705078125, 1.580810546875, 1.64764404296875, 1.7144775390625, 1.78131103515625, 1.84814453125, 1.91497802734375, 1.9818115234375, 2.04864501953125, 2.115478515625, 2.18231201171875, 2.2491455078125, 2.31597900390625, 2.3828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 7.0, 2.0, 10.0, 13.0, 16.0, 24.0, 34.0, 58.0, 99.0, 185.0, 346.0, 822.0, 1826.0, 4606.0, 12396.0, 38758.0, 162021.0, 634580.0, 139577.0, 34765.0, 11139.0, 4116.0, 1711.0, 727.0, 339.0, 167.0, 82.0, 48.0, 17.0, 16.0, 13.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3466796875, -0.33449554443359375, -0.3223114013671875, -0.31012725830078125, -0.297943115234375, -0.28575897216796875, -0.2735748291015625, -0.26139068603515625, -0.24920654296875, -0.23702239990234375, -0.2248382568359375, -0.21265411376953125, -0.200469970703125, -0.18828582763671875, -0.1761016845703125, -0.16391754150390625, -0.1517333984375, -0.13954925537109375, -0.1273651123046875, -0.11518096923828125, -0.102996826171875, -0.09081268310546875, -0.0786285400390625, -0.06644439697265625, -0.05426025390625, -0.04207611083984375, -0.0298919677734375, -0.01770782470703125, -0.005523681640625, 0.00666046142578125, 0.0188446044921875, 0.03102874755859375, 0.043212890625, 0.05539703369140625, 0.0675811767578125, 0.07976531982421875, 0.091949462890625, 0.10413360595703125, 0.1163177490234375, 0.12850189208984375, 0.14068603515625, 0.15287017822265625, 0.1650543212890625, 0.17723846435546875, 0.189422607421875, 0.20160675048828125, 0.2137908935546875, 0.22597503662109375, 0.2381591796875, 0.25034332275390625, 0.2625274658203125, 0.27471160888671875, 0.286895751953125, 0.29907989501953125, 0.3112640380859375, 0.32344818115234375, 0.33563232421875, 0.34781646728515625, 0.3600006103515625, 0.37218475341796875, 0.384368896484375, 0.39655303955078125, 0.4087371826171875, 0.42092132568359375, 0.43310546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 9.0, 7.0, 17.0, 15.0, 17.0, 40.0, 32.0, 65.0, 73.0, 94.0, 117.0, 129.0, 101.0, 64.0, 49.0, 42.0, 27.0, 21.0, 11.0, 16.0, 7.0, 10.0, 7.0, 5.0, 5.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.918212890625e-05, -9.536370635032654e-05, -9.154528379440308e-05, -8.772686123847961e-05, -8.390843868255615e-05, -8.009001612663269e-05, -7.627159357070923e-05, -7.245317101478577e-05, -6.86347484588623e-05, -6.481632590293884e-05, -6.099790334701538e-05, -5.717948079109192e-05, -5.336105823516846e-05, -4.9542635679244995e-05, -4.572421312332153e-05, -4.190579056739807e-05, -3.808736801147461e-05, -3.426894545555115e-05, -3.0450522899627686e-05, -2.6632100343704224e-05, -2.2813677787780762e-05, -1.89952552318573e-05, -1.5176832675933838e-05, -1.1358410120010376e-05, -7.539987564086914e-06, -3.721565008163452e-06, 9.685754776000977e-08, 3.915280103683472e-06, 7.733702659606934e-06, 1.1552125215530396e-05, 1.5370547771453857e-05, 1.918897032737732e-05, 2.300739288330078e-05, 2.6825815439224243e-05, 3.0644237995147705e-05, 3.446266055107117e-05, 3.828108310699463e-05, 4.209950566291809e-05, 4.591792821884155e-05, 4.9736350774765015e-05, 5.3554773330688477e-05, 5.737319588661194e-05, 6.11916184425354e-05, 6.501004099845886e-05, 6.882846355438232e-05, 7.264688611030579e-05, 7.646530866622925e-05, 8.028373122215271e-05, 8.410215377807617e-05, 8.792057633399963e-05, 9.17389988899231e-05, 9.555742144584656e-05, 9.937584400177002e-05, 0.00010319426655769348, 0.00010701268911361694, 0.0001108311116695404, 0.00011464953422546387, 0.00011846795678138733, 0.0001222863793373108, 0.00012610480189323425, 0.00012992322444915771, 0.00013374164700508118, 0.00013756006956100464, 0.0001413784921169281, 0.00014519691467285156]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 5.0, 19.0, 22.0, 31.0, 68.0, 104.0, 247.0, 673.0, 2189.0, 8976.0, 46309.0, 517169.0, 415605.0, 45073.0, 8690.0, 2195.0, 684.0, 235.0, 118.0, 56.0, 30.0, 20.0, 9.0, 9.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4306640625, -0.41193389892578125, -0.3932037353515625, -0.37447357177734375, -0.355743408203125, -0.33701324462890625, -0.3182830810546875, -0.29955291748046875, -0.28082275390625, -0.26209259033203125, -0.2433624267578125, -0.22463226318359375, -0.205902099609375, -0.18717193603515625, -0.1684417724609375, -0.14971160888671875, -0.1309814453125, -0.11225128173828125, -0.0935211181640625, -0.07479095458984375, -0.056060791015625, -0.03733062744140625, -0.0186004638671875, 0.00012969970703125, 0.01885986328125, 0.03759002685546875, 0.0563201904296875, 0.07505035400390625, 0.093780517578125, 0.11251068115234375, 0.1312408447265625, 0.14997100830078125, 0.168701171875, 0.18743133544921875, 0.2061614990234375, 0.22489166259765625, 0.243621826171875, 0.26235198974609375, 0.2810821533203125, 0.29981231689453125, 0.31854248046875, 0.33727264404296875, 0.3560028076171875, 0.37473297119140625, 0.393463134765625, 0.41219329833984375, 0.4309234619140625, 0.44965362548828125, 0.4683837890625, 0.48711395263671875, 0.5058441162109375, 0.5245742797851562, 0.543304443359375, 0.5620346069335938, 0.5807647705078125, 0.5994949340820312, 0.61822509765625, 0.6369552612304688, 0.6556854248046875, 0.6744155883789062, 0.693145751953125, 0.7118759155273438, 0.7306060791015625, 0.7493362426757812, 0.76806640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 2.0, 3.0, 9.0, 6.0, 12.0, 12.0, 11.0, 17.0, 38.0, 45.0, 53.0, 67.0, 64.0, 83.0, 96.0, 88.0, 87.0, 66.0, 70.0, 41.0, 27.0, 17.0, 15.0, 15.0, 9.0, 12.0, 7.0, 5.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3662109375, -0.352508544921875, -0.33880615234375, -0.325103759765625, -0.3114013671875, -0.297698974609375, -0.28399658203125, -0.270294189453125, -0.256591796875, -0.242889404296875, -0.22918701171875, -0.215484619140625, -0.2017822265625, -0.188079833984375, -0.17437744140625, -0.160675048828125, -0.14697265625, -0.133270263671875, -0.11956787109375, -0.105865478515625, -0.0921630859375, -0.078460693359375, -0.06475830078125, -0.051055908203125, -0.037353515625, -0.023651123046875, -0.00994873046875, 0.003753662109375, 0.0174560546875, 0.031158447265625, 0.04486083984375, 0.058563232421875, 0.072265625, 0.085968017578125, 0.09967041015625, 0.113372802734375, 0.1270751953125, 0.140777587890625, 0.15447998046875, 0.168182373046875, 0.181884765625, 0.195587158203125, 0.20928955078125, 0.222991943359375, 0.2366943359375, 0.250396728515625, 0.26409912109375, 0.277801513671875, 0.29150390625, 0.305206298828125, 0.31890869140625, 0.332611083984375, 0.3463134765625, 0.360015869140625, 0.37371826171875, 0.387420654296875, 0.401123046875, 0.414825439453125, 0.42852783203125, 0.442230224609375, 0.4559326171875, 0.469635009765625, 0.48333740234375, 0.497039794921875, 0.5107421875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 11.0, 6.0, 9.0, 15.0, 41.0, 96.0, 156.0, 323.0, 179.0, 88.0, 47.0, 10.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.746142387390137, -11.349281311035156, -10.95241928100586, -10.555558204650879, -10.158697128295898, -9.761836051940918, -9.364974021911621, -8.96811294555664, -8.57125186920166, -8.17439079284668, -7.777529239654541, -7.380667686462402, -6.983806610107422, -6.586945056915283, -6.1900835037231445, -5.793222427368164, -5.396360874176025, -4.999499320983887, -4.602638244628906, -4.205776691436768, -3.808915615081787, -3.4120540618896484, -3.015192747116089, -2.6183314323425293, -2.2214701175689697, -1.8246088027954102, -1.4277474880218506, -1.0308860540390015, -0.6340247392654419, -0.23716342449188232, 0.1596980094909668, 0.5565593242645264, 0.9534206390380859, 1.3502819538116455, 1.747143268585205, 2.1440048217773438, 2.540865898132324, 2.937727451324463, 3.3345887660980225, 3.731450080871582, 4.1283111572265625, 4.525172710418701, 4.922033786773682, 5.31889533996582, 5.715756416320801, 6.1126179695129395, 6.509479522705078, 6.906340599060059, 7.303202152252197, 7.700063705444336, 8.096924781799316, 8.493785858154297, 8.890647888183594, 9.287508964538574, 9.684370040893555, 10.081232070922852, 10.478093147277832, 10.874954223632812, 11.27181625366211, 11.66867733001709, 12.06553840637207, 12.46239948272705, 12.859261512756348, 13.256122589111328, 13.652983665466309]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 12.0, 19.0, 23.0, 23.0, 27.0, 38.0, 42.0, 35.0, 59.0, 54.0, 80.0, 92.0, 99.0, 77.0, 39.0, 43.0, 50.0, 31.0, 31.0, 19.0, 12.0, 13.0, 17.0, 11.0, 9.0, 5.0, 3.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.235578536987305, -8.93403148651123, -8.632484436035156, -8.330938339233398, -8.029391288757324, -7.72784423828125, -7.426297664642334, -7.124751091003418, -6.823204040527344, -6.5216569900512695, -6.2201104164123535, -5.9185638427734375, -5.617016792297363, -5.315469741821289, -5.013923168182373, -4.712376594543457, -4.410829544067383, -4.109282493591309, -3.8077359199523926, -3.5061891078948975, -3.2046422958374023, -2.9030954837799072, -2.601548671722412, -2.300001859664917, -1.9984550476074219, -1.6969082355499268, -1.3953614234924316, -1.0938146114349365, -0.7922677993774414, -0.4907209873199463, -0.18917417526245117, 0.11237263679504395, 0.41391944885253906, 0.7154662609100342, 1.0170130729675293, 1.3185598850250244, 1.6201066970825195, 1.9216535091400146, 2.2232003211975098, 2.524747133255005, 2.8262939453125, 3.127840757369995, 3.4293875694274902, 3.7309343814849854, 4.0324811935424805, 4.334028244018555, 4.635574817657471, 4.937121391296387, 5.238668441772461, 5.540215492248535, 5.841762065887451, 6.143308639526367, 6.444855690002441, 6.746402740478516, 7.047949314117432, 7.349495887756348, 7.651042938232422, 7.952589988708496, 8.25413703918457, 8.555683135986328, 8.857230186462402, 9.158777236938477, 9.460323333740234, 9.761870384216309, 10.063417434692383]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 8.0, 3.0, 11.0, 10.0, 10.0, 20.0, 29.0, 42.0, 55.0, 82.0, 130.0, 195.0, 327.0, 594.0, 1100.0, 2353.0, 5651.0, 18161.0, 90712.0, 757779.0, 2688134.0, 540619.0, 65587.0, 13816.0, 4620.0, 1948.0, 936.0, 513.0, 241.0, 183.0, 119.0, 91.0, 53.0, 39.0, 28.0, 28.0, 21.0, 12.0, 4.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.77099609375, -0.7509307861328125, -0.730865478515625, -0.7108001708984375, -0.69073486328125, -0.6706695556640625, -0.650604248046875, -0.6305389404296875, -0.6104736328125, -0.5904083251953125, -0.570343017578125, -0.5502777099609375, -0.53021240234375, -0.5101470947265625, -0.490081787109375, -0.4700164794921875, -0.449951171875, -0.4298858642578125, -0.409820556640625, -0.3897552490234375, -0.36968994140625, -0.3496246337890625, -0.329559326171875, -0.3094940185546875, -0.2894287109375, -0.2693634033203125, -0.249298095703125, -0.2292327880859375, -0.20916748046875, -0.1891021728515625, -0.169036865234375, -0.1489715576171875, -0.12890625, -0.1088409423828125, -0.088775634765625, -0.0687103271484375, -0.04864501953125, -0.0285797119140625, -0.008514404296875, 0.0115509033203125, 0.0316162109375, 0.0516815185546875, 0.071746826171875, 0.0918121337890625, 0.11187744140625, 0.1319427490234375, 0.152008056640625, 0.1720733642578125, 0.192138671875, 0.2122039794921875, 0.232269287109375, 0.2523345947265625, 0.27239990234375, 0.2924652099609375, 0.312530517578125, 0.3325958251953125, 0.3526611328125, 0.3727264404296875, 0.392791748046875, 0.4128570556640625, 0.43292236328125, 0.4529876708984375, 0.473052978515625, 0.4931182861328125, 0.51318359375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 9.0, 9.0, 7.0, 8.0, 23.0, 17.0, 25.0, 20.0, 33.0, 34.0, 36.0, 44.0, 40.0, 50.0, 53.0, 59.0, 56.0, 49.0, 49.0, 45.0, 52.0, 52.0, 36.0, 33.0, 31.0, 14.0, 22.0, 29.0, 18.0, 12.0, 12.0, 4.0, 6.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.494384765625, -0.4777565002441406, -0.46112823486328125, -0.4444999694824219, -0.4278717041015625, -0.4112434387207031, -0.39461517333984375, -0.3779869079589844, -0.361358642578125, -0.3447303771972656, -0.32810211181640625, -0.3114738464355469, -0.2948455810546875, -0.2782173156738281, -0.26158905029296875, -0.24496078491210938, -0.22833251953125, -0.21170425415039062, -0.19507598876953125, -0.17844772338867188, -0.1618194580078125, -0.14519119262695312, -0.12856292724609375, -0.11193466186523438, -0.095306396484375, -0.07867813110351562, -0.06204986572265625, -0.045421600341796875, -0.0287933349609375, -0.012165069580078125, 0.00446319580078125, 0.021091461181640625, 0.0377197265625, 0.054347991943359375, 0.07097625732421875, 0.08760452270507812, 0.1042327880859375, 0.12086105346679688, 0.13748931884765625, 0.15411758422851562, 0.170745849609375, 0.18737411499023438, 0.20400238037109375, 0.22063064575195312, 0.2372589111328125, 0.2538871765136719, 0.27051544189453125, 0.2871437072753906, 0.30377197265625, 0.3204002380371094, 0.33702850341796875, 0.3536567687988281, 0.3702850341796875, 0.3869132995605469, 0.40354156494140625, 0.4201698303222656, 0.436798095703125, 0.4534263610839844, 0.47005462646484375, 0.4866828918457031, 0.5033111572265625, 0.5199394226074219, 0.5365676879882812, 0.5531959533691406, 0.56982421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 13.0, 24.0, 21.0, 46.0, 74.0, 151.0, 358.0, 978.0, 7861.0, 2050658.0, 2124119.0, 8257.0, 1032.0, 348.0, 142.0, 84.0, 39.0, 30.0, 20.0, 9.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.802734375, -2.720306396484375, -2.63787841796875, -2.555450439453125, -2.4730224609375, -2.390594482421875, -2.30816650390625, -2.225738525390625, -2.143310546875, -2.060882568359375, -1.97845458984375, -1.896026611328125, -1.8135986328125, -1.731170654296875, -1.64874267578125, -1.566314697265625, -1.48388671875, -1.401458740234375, -1.31903076171875, -1.236602783203125, -1.1541748046875, -1.071746826171875, -0.98931884765625, -0.906890869140625, -0.824462890625, -0.742034912109375, -0.65960693359375, -0.577178955078125, -0.4947509765625, -0.412322998046875, -0.32989501953125, -0.247467041015625, -0.1650390625, -0.082611083984375, -0.00018310546875, 0.082244873046875, 0.1646728515625, 0.247100830078125, 0.32952880859375, 0.411956787109375, 0.494384765625, 0.576812744140625, 0.65924072265625, 0.741668701171875, 0.8240966796875, 0.906524658203125, 0.98895263671875, 1.071380615234375, 1.15380859375, 1.236236572265625, 1.31866455078125, 1.401092529296875, 1.4835205078125, 1.565948486328125, 1.64837646484375, 1.730804443359375, 1.813232421875, 1.895660400390625, 1.97808837890625, 2.060516357421875, 2.1429443359375, 2.225372314453125, 2.30780029296875, 2.390228271484375, 2.47265625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 18.0, 12.0, 30.0, 46.0, 72.0, 142.0, 249.0, 440.0, 786.0, 869.0, 626.0, 341.0, 188.0, 92.0, 54.0, 28.0, 24.0, 16.0, 12.0, 2.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.876953125, -0.8407745361328125, -0.804595947265625, -0.7684173583984375, -0.73223876953125, -0.6960601806640625, -0.659881591796875, -0.6237030029296875, -0.5875244140625, -0.5513458251953125, -0.515167236328125, -0.4789886474609375, -0.44281005859375, -0.4066314697265625, -0.370452880859375, -0.3342742919921875, -0.298095703125, -0.2619171142578125, -0.225738525390625, -0.1895599365234375, -0.15338134765625, -0.1172027587890625, -0.081024169921875, -0.0448455810546875, -0.0086669921875, 0.0275115966796875, 0.063690185546875, 0.0998687744140625, 0.13604736328125, 0.1722259521484375, 0.208404541015625, 0.2445831298828125, 0.28076171875, 0.3169403076171875, 0.353118896484375, 0.3892974853515625, 0.42547607421875, 0.4616546630859375, 0.497833251953125, 0.5340118408203125, 0.5701904296875, 0.6063690185546875, 0.642547607421875, 0.6787261962890625, 0.71490478515625, 0.7510833740234375, 0.787261962890625, 0.8234405517578125, 0.859619140625, 0.8957977294921875, 0.931976318359375, 0.9681549072265625, 1.00433349609375, 1.0405120849609375, 1.076690673828125, 1.1128692626953125, 1.1490478515625, 1.1852264404296875, 1.221405029296875, 1.2575836181640625, 1.29376220703125, 1.3299407958984375, 1.366119384765625, 1.4022979736328125, 1.4384765625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 12.0, 92.0, 240.0, 367.0, 210.0, 54.0, 18.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.834590911865234, -29.217252731323242, -28.599916458129883, -27.98257827758789, -27.3652400970459, -26.747901916503906, -26.130565643310547, -25.513227462768555, -24.895889282226562, -24.27855110168457, -23.66121482849121, -23.04387664794922, -22.426538467407227, -21.809200286865234, -21.191864013671875, -20.574525833129883, -19.957189559936523, -19.33985137939453, -18.722515106201172, -18.10517692565918, -17.487838745117188, -16.870502471923828, -16.253164291381836, -15.635826110839844, -15.018488883972168, -14.401151657104492, -13.7838134765625, -13.166476249694824, -12.549139022827148, -11.931800842285156, -11.31446361541748, -10.697126388549805, -10.07978630065918, -9.462449073791504, -8.845110893249512, -8.227773666381836, -7.610435962677002, -6.993098258972168, -6.375761032104492, -5.758423328399658, -5.141085624694824, -4.52374792098999, -3.9064104557037354, -3.2890729904174805, -2.6717352867126465, -2.0543975830078125, -1.4370601177215576, -0.8197226524353027, -0.20238494873046875, 0.4149526357650757, 1.0322902202606201, 1.6496278047561646, 2.266965389251709, 2.884303092956543, 3.501640558242798, 4.118978023529053, 4.736315727233887, 5.353653430938721, 5.970991134643555, 6.5883283615112305, 7.2056660652160645, 7.823003768920898, 8.440340995788574, 9.05767822265625, 9.675016403198242]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 6.0, 5.0, 14.0, 12.0, 17.0, 21.0, 33.0, 31.0, 34.0, 50.0, 29.0, 57.0, 53.0, 62.0, 68.0, 73.0, 48.0, 57.0, 49.0, 46.0, 39.0, 37.0, 30.0, 27.0, 29.0, 14.0, 17.0, 6.0, 12.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.1877522468566895, -5.050219535827637, -4.912686824798584, -4.775153636932373, -4.63762092590332, -4.500088214874268, -4.362555503845215, -4.225022792816162, -4.087490081787109, -3.9499573707580566, -3.812424421310425, -3.674891710281372, -3.5373587608337402, -3.3998260498046875, -3.2622933387756348, -3.124760627746582, -2.987227439880371, -2.8496947288513184, -2.7121617794036865, -2.574629068374634, -2.437096118927002, -2.299563407897949, -2.1620306968688965, -2.0244979858398438, -1.886965036392212, -1.7494322061538696, -1.6118993759155273, -1.4743666648864746, -1.3368338346481323, -1.19930100440979, -1.0617682933807373, -0.924235463142395, -0.7867026329040527, -0.6491698026657104, -0.5116370320320129, -0.37410423159599304, -0.23657143115997314, -0.09903860092163086, 0.03849416971206665, 0.17602694034576416, 0.31355977058410645, 0.45109257102012634, 0.5886253714561462, 0.7261581420898438, 0.863690972328186, 1.0012238025665283, 1.138756513595581, 1.2762893438339233, 1.4138221740722656, 1.551355004310608, 1.6888878345489502, 1.826420545578003, 1.9639533758163452, 2.1014862060546875, 2.2390189170837402, 2.376551628112793, 2.514084577560425, 2.6516172885894775, 2.7891502380371094, 2.926682949066162, 3.064215660095215, 3.2017486095428467, 3.3392813205718994, 3.4768142700195312, 3.614346981048584]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 11.0, 6.0, 8.0, 11.0, 19.0, 42.0, 48.0, 93.0, 183.0, 299.0, 712.0, 1672.0, 4698.0, 15004.0, 61200.0, 300263.0, 499092.0, 125291.0, 27530.0, 7771.0, 2675.0, 965.0, 448.0, 209.0, 112.0, 75.0, 34.0, 28.0, 14.0, 15.0, 7.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95849609375, -0.9296493530273438, -0.9008026123046875, -0.8719558715820312, -0.843109130859375, -0.8142623901367188, -0.7854156494140625, -0.7565689086914062, -0.72772216796875, -0.6988754272460938, -0.6700286865234375, -0.6411819458007812, -0.612335205078125, -0.5834884643554688, -0.5546417236328125, -0.5257949829101562, -0.4969482421875, -0.46810150146484375, -0.4392547607421875, -0.41040802001953125, -0.381561279296875, -0.35271453857421875, -0.3238677978515625, -0.29502105712890625, -0.26617431640625, -0.23732757568359375, -0.2084808349609375, -0.17963409423828125, -0.150787353515625, -0.12194061279296875, -0.0930938720703125, -0.06424713134765625, -0.035400390625, -0.00655364990234375, 0.0222930908203125, 0.05113983154296875, 0.079986572265625, 0.10883331298828125, 0.1376800537109375, 0.16652679443359375, 0.19537353515625, 0.22422027587890625, 0.2530670166015625, 0.28191375732421875, 0.310760498046875, 0.33960723876953125, 0.3684539794921875, 0.39730072021484375, 0.4261474609375, 0.45499420166015625, 0.4838409423828125, 0.5126876831054688, 0.541534423828125, 0.5703811645507812, 0.5992279052734375, 0.6280746459960938, 0.65692138671875, 0.6857681274414062, 0.7146148681640625, 0.7434616088867188, 0.772308349609375, 0.8011550903320312, 0.8300018310546875, 0.8588485717773438, 0.8876953125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 11.0, 11.0, 15.0, 18.0, 16.0, 17.0, 18.0, 18.0, 26.0, 35.0, 37.0, 47.0, 38.0, 47.0, 40.0, 38.0, 52.0, 59.0, 53.0, 47.0, 46.0, 49.0, 42.0, 33.0, 34.0, 30.0, 11.0, 16.0, 16.0, 15.0, 12.0, 12.0, 12.0, 7.0, 5.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.481689453125, -0.4656715393066406, -0.44965362548828125, -0.4336357116699219, -0.4176177978515625, -0.4015998840332031, -0.38558197021484375, -0.3695640563964844, -0.353546142578125, -0.3375282287597656, -0.32151031494140625, -0.3054924011230469, -0.2894744873046875, -0.2734565734863281, -0.25743865966796875, -0.24142074584960938, -0.22540283203125, -0.20938491821289062, -0.19336700439453125, -0.17734909057617188, -0.1613311767578125, -0.14531326293945312, -0.12929534912109375, -0.11327743530273438, -0.097259521484375, -0.08124160766601562, -0.06522369384765625, -0.049205780029296875, -0.0331878662109375, -0.017169952392578125, -0.00115203857421875, 0.014865875244140625, 0.0308837890625, 0.046901702880859375, 0.06291961669921875, 0.07893753051757812, 0.0949554443359375, 0.11097335815429688, 0.12699127197265625, 0.14300918579101562, 0.159027099609375, 0.17504501342773438, 0.19106292724609375, 0.20708084106445312, 0.2230987548828125, 0.23911666870117188, 0.25513458251953125, 0.2711524963378906, 0.28717041015625, 0.3031883239746094, 0.31920623779296875, 0.3352241516113281, 0.3512420654296875, 0.3672599792480469, 0.38327789306640625, 0.3992958068847656, 0.415313720703125, 0.4313316345214844, 0.44734954833984375, 0.4633674621582031, 0.4793853759765625, 0.4954032897949219, 0.5114212036132812, 0.5274391174316406, 0.54345703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 7.0, 4.0, 16.0, 13.0, 26.0, 41.0, 47.0, 49.0, 82.0, 135.0, 198.0, 323.0, 594.0, 1378.0, 3917.0, 15690.0, 90632.0, 696751.0, 199231.0, 29194.0, 6355.0, 1972.0, 780.0, 414.0, 223.0, 143.0, 106.0, 70.0, 44.0, 40.0, 30.0, 13.0, 19.0, 9.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9304733276367188, -0.8956146240234375, -0.8607559204101562, -0.825897216796875, -0.7910385131835938, -0.7561798095703125, -0.7213211059570312, -0.68646240234375, -0.6516036987304688, -0.6167449951171875, -0.5818862915039062, -0.547027587890625, -0.5121688842773438, -0.4773101806640625, -0.44245147705078125, -0.4075927734375, -0.37273406982421875, -0.3378753662109375, -0.30301666259765625, -0.268157958984375, -0.23329925537109375, -0.1984405517578125, -0.16358184814453125, -0.12872314453125, -0.09386444091796875, -0.0590057373046875, -0.02414703369140625, 0.010711669921875, 0.04557037353515625, 0.0804290771484375, 0.11528778076171875, 0.150146484375, 0.18500518798828125, 0.2198638916015625, 0.25472259521484375, 0.289581298828125, 0.32444000244140625, 0.3592987060546875, 0.39415740966796875, 0.42901611328125, 0.46387481689453125, 0.4987335205078125, 0.5335922241210938, 0.568450927734375, 0.6033096313476562, 0.6381683349609375, 0.6730270385742188, 0.7078857421875, 0.7427444458007812, 0.7776031494140625, 0.8124618530273438, 0.847320556640625, 0.8821792602539062, 0.9170379638671875, 0.9518966674804688, 0.98675537109375, 1.0216140747070312, 1.0564727783203125, 1.0913314819335938, 1.126190185546875, 1.1610488891601562, 1.1959075927734375, 1.2307662963867188, 1.265625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 4.0, 5.0, 8.0, 10.0, 6.0, 17.0, 16.0, 25.0, 23.0, 34.0, 26.0, 38.0, 29.0, 47.0, 38.0, 41.0, 47.0, 35.0, 40.0, 69.0, 48.0, 40.0, 43.0, 47.0, 30.0, 36.0, 25.0, 28.0, 26.0, 17.0, 17.0, 15.0, 10.0, 10.0, 8.0, 9.0, 5.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6748046875, -1.6216278076171875, -1.568450927734375, -1.5152740478515625, -1.46209716796875, -1.4089202880859375, -1.355743408203125, -1.3025665283203125, -1.2493896484375, -1.1962127685546875, -1.143035888671875, -1.0898590087890625, -1.03668212890625, -0.9835052490234375, -0.930328369140625, -0.8771514892578125, -0.823974609375, -0.7707977294921875, -0.717620849609375, -0.6644439697265625, -0.61126708984375, -0.5580902099609375, -0.504913330078125, -0.4517364501953125, -0.3985595703125, -0.3453826904296875, -0.292205810546875, -0.2390289306640625, -0.18585205078125, -0.1326751708984375, -0.079498291015625, -0.0263214111328125, 0.02685546875, 0.0800323486328125, 0.133209228515625, 0.1863861083984375, 0.23956298828125, 0.2927398681640625, 0.345916748046875, 0.3990936279296875, 0.4522705078125, 0.5054473876953125, 0.558624267578125, 0.6118011474609375, 0.66497802734375, 0.7181549072265625, 0.771331787109375, 0.8245086669921875, 0.877685546875, 0.9308624267578125, 0.984039306640625, 1.0372161865234375, 1.09039306640625, 1.1435699462890625, 1.196746826171875, 1.2499237060546875, 1.3031005859375, 1.3562774658203125, 1.409454345703125, 1.4626312255859375, 1.51580810546875, 1.5689849853515625, 1.622161865234375, 1.6753387451171875, 1.728515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 7.0, 10.0, 11.0, 20.0, 26.0, 39.0, 51.0, 119.0, 164.0, 252.0, 416.0, 814.0, 1565.0, 3337.0, 7903.0, 21742.0, 74263.0, 609095.0, 248896.0, 51482.0, 16619.0, 6084.0, 2666.0, 1309.0, 678.0, 387.0, 203.0, 162.0, 95.0, 48.0, 29.0, 17.0, 15.0, 4.0, 13.0, 4.0, 9.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.327880859375, -0.31652069091796875, -0.3051605224609375, -0.29380035400390625, -0.282440185546875, -0.27108001708984375, -0.2597198486328125, -0.24835968017578125, -0.23699951171875, -0.22563934326171875, -0.2142791748046875, -0.20291900634765625, -0.191558837890625, -0.18019866943359375, -0.1688385009765625, -0.15747833251953125, -0.1461181640625, -0.13475799560546875, -0.1233978271484375, -0.11203765869140625, -0.100677490234375, -0.08931732177734375, -0.0779571533203125, -0.06659698486328125, -0.05523681640625, -0.04387664794921875, -0.0325164794921875, -0.02115631103515625, -0.009796142578125, 0.00156402587890625, 0.0129241943359375, 0.02428436279296875, 0.03564453125, 0.04700469970703125, 0.0583648681640625, 0.06972503662109375, 0.081085205078125, 0.09244537353515625, 0.1038055419921875, 0.11516571044921875, 0.12652587890625, 0.13788604736328125, 0.1492462158203125, 0.16060638427734375, 0.171966552734375, 0.18332672119140625, 0.1946868896484375, 0.20604705810546875, 0.2174072265625, 0.22876739501953125, 0.2401275634765625, 0.25148773193359375, 0.262847900390625, 0.27420806884765625, 0.2855682373046875, 0.29692840576171875, 0.30828857421875, 0.31964874267578125, 0.3310089111328125, 0.34236907958984375, 0.353729248046875, 0.36508941650390625, 0.3764495849609375, 0.38780975341796875, 0.399169921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 2.0, 4.0, 7.0, 6.0, 11.0, 10.0, 15.0, 22.0, 11.0, 7.0, 34.0, 47.0, 60.0, 102.0, 142.0, 127.0, 109.0, 68.0, 57.0, 42.0, 27.0, 29.0, 16.0, 11.0, 12.0, 4.0, 6.0, 6.0, 3.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012105703353881836, -0.00011742021888494492, -0.00011378340423107147, -0.00011014658957719803, -0.00010650977492332458, -0.00010287296026945114, -9.92361456155777e-05, -9.559933096170425e-05, -9.196251630783081e-05, -8.832570165395737e-05, -8.468888700008392e-05, -8.105207234621048e-05, -7.741525769233704e-05, -7.377844303846359e-05, -7.014162838459015e-05, -6.65048137307167e-05, -6.286799907684326e-05, -5.923118442296982e-05, -5.5594369769096375e-05, -5.195755511522293e-05, -4.832074046134949e-05, -4.4683925807476044e-05, -4.10471111536026e-05, -3.7410296499729156e-05, -3.377348184585571e-05, -3.013666719198227e-05, -2.6499852538108826e-05, -2.2863037884235382e-05, -1.922622323036194e-05, -1.5589408576488495e-05, -1.1952593922615051e-05, -8.315779268741608e-06, -4.678964614868164e-06, -1.0421499609947205e-06, 2.594664692878723e-06, 6.231479346752167e-06, 9.86829400062561e-06, 1.3505108654499054e-05, 1.7141923308372498e-05, 2.077873796224594e-05, 2.4415552616119385e-05, 2.805236726999283e-05, 3.168918192386627e-05, 3.5325996577739716e-05, 3.896281123161316e-05, 4.25996258854866e-05, 4.6236440539360046e-05, 4.987325519323349e-05, 5.3510069847106934e-05, 5.714688450098038e-05, 6.078369915485382e-05, 6.442051380872726e-05, 6.805732846260071e-05, 7.169414311647415e-05, 7.53309577703476e-05, 7.896777242422104e-05, 8.260458707809448e-05, 8.624140173196793e-05, 8.987821638584137e-05, 9.351503103971481e-05, 9.715184569358826e-05, 0.0001007886603474617, 0.00010442547500133514, 0.00010806228965520859, 0.00011169910430908203]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 9.0, 2.0, 3.0, 7.0, 16.0, 17.0, 28.0, 44.0, 63.0, 93.0, 137.0, 162.0, 290.0, 400.0, 661.0, 1179.0, 2177.0, 4978.0, 12429.0, 36542.0, 138287.0, 668626.0, 126390.0, 34238.0, 11728.0, 4782.0, 2217.0, 1158.0, 622.0, 403.0, 274.0, 193.0, 119.0, 74.0, 78.0, 37.0, 23.0, 21.0, 20.0, 7.0, 3.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.369140625, -0.3577728271484375, -0.346405029296875, -0.3350372314453125, -0.32366943359375, -0.3123016357421875, -0.300933837890625, -0.2895660400390625, -0.2781982421875, -0.2668304443359375, -0.255462646484375, -0.2440948486328125, -0.23272705078125, -0.2213592529296875, -0.209991455078125, -0.1986236572265625, -0.187255859375, -0.1758880615234375, -0.164520263671875, -0.1531524658203125, -0.14178466796875, -0.1304168701171875, -0.119049072265625, -0.1076812744140625, -0.0963134765625, -0.0849456787109375, -0.073577880859375, -0.0622100830078125, -0.05084228515625, -0.0394744873046875, -0.028106689453125, -0.0167388916015625, -0.00537109375, 0.0059967041015625, 0.017364501953125, 0.0287322998046875, 0.04010009765625, 0.0514678955078125, 0.062835693359375, 0.0742034912109375, 0.0855712890625, 0.0969390869140625, 0.108306884765625, 0.1196746826171875, 0.13104248046875, 0.1424102783203125, 0.153778076171875, 0.1651458740234375, 0.176513671875, 0.1878814697265625, 0.199249267578125, 0.2106170654296875, 0.22198486328125, 0.2333526611328125, 0.244720458984375, 0.2560882568359375, 0.2674560546875, 0.2788238525390625, 0.290191650390625, 0.3015594482421875, 0.31292724609375, 0.3242950439453125, 0.335662841796875, 0.3470306396484375, 0.3583984375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 8.0, 10.0, 8.0, 16.0, 15.0, 23.0, 32.0, 32.0, 65.0, 72.0, 92.0, 105.0, 116.0, 88.0, 78.0, 49.0, 40.0, 36.0, 26.0, 23.0, 14.0, 7.0, 10.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.56396484375, -0.55059814453125, -0.5372314453125, -0.52386474609375, -0.510498046875, -0.49713134765625, -0.4837646484375, -0.47039794921875, -0.45703125, -0.44366455078125, -0.4302978515625, -0.41693115234375, -0.403564453125, -0.39019775390625, -0.3768310546875, -0.36346435546875, -0.35009765625, -0.33673095703125, -0.3233642578125, -0.30999755859375, -0.296630859375, -0.28326416015625, -0.2698974609375, -0.25653076171875, -0.2431640625, -0.22979736328125, -0.2164306640625, -0.20306396484375, -0.189697265625, -0.17633056640625, -0.1629638671875, -0.14959716796875, -0.13623046875, -0.12286376953125, -0.1094970703125, -0.09613037109375, -0.082763671875, -0.06939697265625, -0.0560302734375, -0.04266357421875, -0.029296875, -0.01593017578125, -0.0025634765625, 0.01080322265625, 0.024169921875, 0.03753662109375, 0.0509033203125, 0.06427001953125, 0.07763671875, 0.09100341796875, 0.1043701171875, 0.11773681640625, 0.131103515625, 0.14447021484375, 0.1578369140625, 0.17120361328125, 0.1845703125, 0.19793701171875, 0.2113037109375, 0.22467041015625, 0.238037109375, 0.25140380859375, 0.2647705078125, 0.27813720703125, 0.29150390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 8.0, 7.0, 16.0, 28.0, 40.0, 79.0, 130.0, 231.0, 237.0, 103.0, 55.0, 28.0, 15.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.214534759521484, -8.908130645751953, -8.601727485656738, -8.295323371887207, -7.988920211791992, -7.682516574859619, -7.376112937927246, -7.069708824157715, -6.7633056640625, -6.456902027130127, -6.150498390197754, -5.844094753265381, -5.537691116333008, -5.231287479400635, -4.924883842468262, -4.6184797286987305, -4.312076091766357, -4.005672454833984, -3.6992688179016113, -3.3928651809692383, -3.0864615440368652, -2.780057907104492, -2.47365403175354, -2.167250394821167, -1.860846757888794, -1.554443120956421, -1.2480394840240479, -0.9416357278823853, -0.6352320909500122, -0.32882845401763916, -0.022424697875976562, 0.2839789390563965, 0.5903825759887695, 0.8967862129211426, 1.2031898498535156, 1.5095936059951782, 1.8159972429275513, 2.1224007606506348, 2.428804636001587, 2.73520827293396, 3.041611909866333, 3.348015546798706, 3.654419183731079, 3.9608230590820312, 4.267226696014404, 4.573630332946777, 4.88003396987915, 5.186437606811523, 5.4928412437438965, 5.7992448806762695, 6.105648517608643, 6.412052154541016, 6.718455791473389, 7.024859428405762, 7.331263542175293, 7.637666702270508, 7.944070816040039, 8.25047492980957, 8.556878089904785, 8.863282203674316, 9.169685363769531, 9.476089477539062, 9.782492637634277, 10.088896751403809, 10.395299911499023]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 9.0, 13.0, 20.0, 15.0, 22.0, 26.0, 27.0, 35.0, 30.0, 48.0, 54.0, 91.0, 108.0, 90.0, 65.0, 46.0, 31.0, 42.0, 37.0, 28.0, 27.0, 30.0, 23.0, 11.0, 11.0, 9.0, 10.0, 12.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.514820098876953, -8.262754440307617, -8.010689735412598, -7.758624076843262, -7.506558895111084, -7.254493713378906, -7.0024285316467285, -6.750363349914551, -6.498297691345215, -6.246232509613037, -5.994167327880859, -5.742101669311523, -5.490036487579346, -5.237971305847168, -4.98590612411499, -4.7338409423828125, -4.481775760650635, -4.229710578918457, -3.9776451587677, -3.7255799770355225, -3.4735145568847656, -3.221449375152588, -2.96938419342041, -2.7173190116882324, -2.4652535915374756, -2.213188409805298, -1.961122989654541, -1.7090578079223633, -1.456992506980896, -1.2049272060394287, -0.952862024307251, -0.7007967233657837, -0.4487318992614746, -0.1966666281223297, 0.055398643016815186, 0.3074638843536377, 0.559529185295105, 0.8115944862365723, 1.06365966796875, 1.3157249689102173, 1.5677902698516846, 1.8198555707931519, 2.071920871734619, 2.323986053466797, 2.5760512351989746, 2.8281166553497314, 3.080181837081909, 3.332247257232666, 3.5843124389648438, 3.8363776206970215, 4.088442802429199, 4.340508460998535, 4.592573642730713, 4.844638824462891, 5.096704006195068, 5.348769187927246, 5.600834846496582, 5.85290002822876, 6.1049652099609375, 6.357030868530273, 6.609096050262451, 6.861161231994629, 7.113226413726807, 7.365291595458984, 7.617356777191162]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 5.0, 9.0, 9.0, 17.0, 14.0, 23.0, 25.0, 42.0, 48.0, 50.0, 98.0, 124.0, 161.0, 250.0, 456.0, 874.0, 1997.0, 4695.0, 17079.0, 96448.0, 1001670.0, 2641142.0, 370416.0, 42861.0, 9632.0, 3181.0, 1266.0, 583.0, 339.0, 236.0, 144.0, 111.0, 77.0, 58.0, 36.0, 29.0, 16.0, 14.0, 10.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.779296875, -0.7551651000976562, -0.7310333251953125, -0.7069015502929688, -0.682769775390625, -0.6586380004882812, -0.6345062255859375, -0.6103744506835938, -0.58624267578125, -0.5621109008789062, -0.5379791259765625, -0.5138473510742188, -0.489715576171875, -0.46558380126953125, -0.4414520263671875, -0.41732025146484375, -0.3931884765625, -0.36905670166015625, -0.3449249267578125, -0.32079315185546875, -0.296661376953125, -0.27252960205078125, -0.2483978271484375, -0.22426605224609375, -0.20013427734375, -0.17600250244140625, -0.1518707275390625, -0.12773895263671875, -0.103607177734375, -0.07947540283203125, -0.0553436279296875, -0.03121185302734375, -0.007080078125, 0.01705169677734375, 0.0411834716796875, 0.06531524658203125, 0.089447021484375, 0.11357879638671875, 0.1377105712890625, 0.16184234619140625, 0.18597412109375, 0.21010589599609375, 0.2342376708984375, 0.25836944580078125, 0.282501220703125, 0.30663299560546875, 0.3307647705078125, 0.35489654541015625, 0.3790283203125, 0.40316009521484375, 0.4272918701171875, 0.45142364501953125, 0.475555419921875, 0.49968719482421875, 0.5238189697265625, 0.5479507446289062, 0.57208251953125, 0.5962142944335938, 0.6203460693359375, 0.6444778442382812, 0.668609619140625, 0.6927413940429688, 0.7168731689453125, 0.7410049438476562, 0.76513671875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 9.0, 3.0, 9.0, 4.0, 13.0, 17.0, 18.0, 28.0, 20.0, 21.0, 35.0, 34.0, 25.0, 51.0, 44.0, 45.0, 50.0, 55.0, 43.0, 60.0, 49.0, 61.0, 43.0, 43.0, 44.0, 28.0, 28.0, 19.0, 13.0, 23.0, 12.0, 8.0, 8.0, 14.0, 7.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46630859375, -0.4503173828125, -0.434326171875, -0.4183349609375, -0.40234375, -0.3863525390625, -0.370361328125, -0.3543701171875, -0.33837890625, -0.3223876953125, -0.306396484375, -0.2904052734375, -0.2744140625, -0.2584228515625, -0.242431640625, -0.2264404296875, -0.21044921875, -0.1944580078125, -0.178466796875, -0.1624755859375, -0.146484375, -0.1304931640625, -0.114501953125, -0.0985107421875, -0.08251953125, -0.0665283203125, -0.050537109375, -0.0345458984375, -0.0185546875, -0.0025634765625, 0.013427734375, 0.0294189453125, 0.04541015625, 0.0614013671875, 0.077392578125, 0.0933837890625, 0.109375, 0.1253662109375, 0.141357421875, 0.1573486328125, 0.17333984375, 0.1893310546875, 0.205322265625, 0.2213134765625, 0.2373046875, 0.2532958984375, 0.269287109375, 0.2852783203125, 0.30126953125, 0.3172607421875, 0.333251953125, 0.3492431640625, 0.365234375, 0.3812255859375, 0.397216796875, 0.4132080078125, 0.42919921875, 0.4451904296875, 0.461181640625, 0.4771728515625, 0.4931640625, 0.5091552734375, 0.525146484375, 0.5411376953125, 0.55712890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 2.0, 9.0, 4.0, 12.0, 15.0, 9.0, 18.0, 14.0, 12.0, 33.0, 43.0, 56.0, 54.0, 102.0, 164.0, 251.0, 568.0, 1527.0, 6926.0, 67723.0, 3607039.0, 487344.0, 17490.0, 2928.0, 889.0, 405.0, 187.0, 131.0, 70.0, 52.0, 47.0, 22.0, 37.0, 22.0, 12.0, 18.0, 16.0, 7.0, 4.0, 7.0, 4.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.853515625, -1.8001556396484375, -1.746795654296875, -1.6934356689453125, -1.64007568359375, -1.5867156982421875, -1.533355712890625, -1.4799957275390625, -1.4266357421875, -1.3732757568359375, -1.319915771484375, -1.2665557861328125, -1.21319580078125, -1.1598358154296875, -1.106475830078125, -1.0531158447265625, -0.999755859375, -0.9463958740234375, -0.893035888671875, -0.8396759033203125, -0.78631591796875, -0.7329559326171875, -0.679595947265625, -0.6262359619140625, -0.5728759765625, -0.5195159912109375, -0.466156005859375, -0.4127960205078125, -0.35943603515625, -0.3060760498046875, -0.252716064453125, -0.1993560791015625, -0.14599609375, -0.0926361083984375, -0.039276123046875, 0.0140838623046875, 0.06744384765625, 0.1208038330078125, 0.174163818359375, 0.2275238037109375, 0.2808837890625, 0.3342437744140625, 0.387603759765625, 0.4409637451171875, 0.49432373046875, 0.5476837158203125, 0.601043701171875, 0.6544036865234375, 0.707763671875, 0.7611236572265625, 0.814483642578125, 0.8678436279296875, 0.92120361328125, 0.9745635986328125, 1.027923583984375, 1.0812835693359375, 1.1346435546875, 1.1880035400390625, 1.241363525390625, 1.2947235107421875, 1.34808349609375, 1.4014434814453125, 1.454803466796875, 1.5081634521484375, 1.5615234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 3.0, 13.0, 13.0, 15.0, 30.0, 31.0, 52.0, 94.0, 167.0, 248.0, 419.0, 619.0, 681.0, 591.0, 384.0, 250.0, 170.0, 92.0, 55.0, 33.0, 30.0, 19.0, 16.0, 8.0, 12.0, 4.0, 5.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8212890625, -0.7889251708984375, -0.756561279296875, -0.7241973876953125, -0.69183349609375, -0.6594696044921875, -0.627105712890625, -0.5947418212890625, -0.5623779296875, -0.5300140380859375, -0.497650146484375, -0.4652862548828125, -0.43292236328125, -0.4005584716796875, -0.368194580078125, -0.3358306884765625, -0.303466796875, -0.2711029052734375, -0.238739013671875, -0.2063751220703125, -0.17401123046875, -0.1416473388671875, -0.109283447265625, -0.0769195556640625, -0.0445556640625, -0.0121917724609375, 0.020172119140625, 0.0525360107421875, 0.08489990234375, 0.1172637939453125, 0.149627685546875, 0.1819915771484375, 0.21435546875, 0.2467193603515625, 0.279083251953125, 0.3114471435546875, 0.34381103515625, 0.3761749267578125, 0.408538818359375, 0.4409027099609375, 0.4732666015625, 0.5056304931640625, 0.537994384765625, 0.5703582763671875, 0.60272216796875, 0.6350860595703125, 0.667449951171875, 0.6998138427734375, 0.732177734375, 0.7645416259765625, 0.796905517578125, 0.8292694091796875, 0.86163330078125, 0.8939971923828125, 0.926361083984375, 0.9587249755859375, 0.9910888671875, 1.0234527587890625, 1.055816650390625, 1.0881805419921875, 1.12054443359375, 1.1529083251953125, 1.185272216796875, 1.2176361083984375, 1.25]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 12.0, 14.0, 30.0, 81.0, 147.0, 238.0, 216.0, 110.0, 62.0, 35.0, 22.0, 14.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.840131759643555, -16.406930923461914, -15.973730087280273, -15.540529251098633, -15.107328414916992, -14.674127578735352, -14.240926742553711, -13.807726860046387, -13.374526023864746, -12.941325187683105, -12.508124351501465, -12.074923515319824, -11.641722679138184, -11.20852279663086, -10.775321960449219, -10.342121124267578, -9.908920288085938, -9.475719451904297, -9.042518615722656, -8.609317779541016, -8.176116943359375, -7.742916584014893, -7.309715747833252, -6.8765153884887695, -6.4433135986328125, -6.010112762451172, -5.576911926269531, -5.143711090087891, -4.710510730743408, -4.277309894561768, -3.844109058380127, -3.4109084606170654, -2.977707862854004, -2.5445070266723633, -2.1113064289093018, -1.6781055927276611, -1.24490487575531, -0.811704158782959, -0.37850332260131836, 0.054697275161743164, 0.4878981113433838, 0.9210988283157349, 1.354299545288086, 1.7875003814697266, 2.220701217651367, 2.6539018154144287, 3.0871026515960693, 3.520303249359131, 3.9535040855407715, 4.386704921722412, 4.819905757904053, 5.253106117248535, 5.686306953430176, 6.119507789611816, 6.552708625793457, 6.985909461975098, 7.419110298156738, 7.852311134338379, 8.28551197052002, 8.71871280670166, 9.1519136428833, 9.585113525390625, 10.018314361572266, 10.451515197753906, 10.884716033935547]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 8.0, 3.0, 7.0, 11.0, 9.0, 7.0, 4.0, 12.0, 8.0, 8.0, 23.0, 22.0, 22.0, 23.0, 39.0, 37.0, 47.0, 43.0, 40.0, 48.0, 55.0, 41.0, 44.0, 52.0, 47.0, 47.0, 60.0, 40.0, 30.0, 28.0, 26.0, 21.0, 12.0, 11.0, 17.0, 9.0, 7.0, 11.0, 10.0, 8.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9288976192474365, -3.7960968017578125, -3.6632959842681885, -3.5304951667785645, -3.3976941108703613, -3.2648935317993164, -3.1320924758911133, -2.9992916584014893, -2.8664908409118652, -2.733690023422241, -2.600889205932617, -2.468088388442993, -2.335287570953369, -2.202486515045166, -2.069685697555542, -1.936884880065918, -1.804084062576294, -1.67128324508667, -1.538482427597046, -1.4056814908981323, -1.2728806734085083, -1.1400798559188843, -1.0072789192199707, -0.8744781017303467, -0.7416772842407227, -0.6088764667510986, -0.47607558965682983, -0.3432747423648834, -0.210473895072937, -0.07767307758331299, 0.05512779951095581, 0.1879286766052246, 0.32072925567626953, 0.45353010296821594, 0.5863309502601624, 0.7191318273544312, 0.8519326448440552, 0.9847334623336792, 1.1175343990325928, 1.2503352165222168, 1.3831360340118408, 1.5159368515014648, 1.6487376689910889, 1.7815386056900024, 1.9143394231796265, 2.047140121459961, 2.179941177368164, 2.312741994857788, 2.445542812347412, 2.578343629837036, 2.71114444732666, 2.843945264816284, 2.976746082305908, 3.1095471382141113, 3.2423479557037354, 3.3751487731933594, 3.5079495906829834, 3.6407504081726074, 3.7735512256622314, 3.9063520431518555, 4.039153099060059, 4.1719536781311035, 4.304754734039307, 4.437555313110352, 4.570356369018555]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 2.0, 14.0, 17.0, 21.0, 26.0, 52.0, 79.0, 133.0, 262.0, 482.0, 1013.0, 2219.0, 5759.0, 16501.0, 55021.0, 219784.0, 500062.0, 178201.0, 45921.0, 14023.0, 5067.0, 2031.0, 905.0, 433.0, 215.0, 101.0, 78.0, 67.0, 19.0, 21.0, 8.0, 9.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.140625, -1.1124114990234375, -1.084197998046875, -1.0559844970703125, -1.02777099609375, -0.9995574951171875, -0.971343994140625, -0.9431304931640625, -0.9149169921875, -0.8867034912109375, -0.858489990234375, -0.8302764892578125, -0.80206298828125, -0.7738494873046875, -0.745635986328125, -0.7174224853515625, -0.689208984375, -0.6609954833984375, -0.632781982421875, -0.6045684814453125, -0.57635498046875, -0.5481414794921875, -0.519927978515625, -0.4917144775390625, -0.4635009765625, -0.4352874755859375, -0.407073974609375, -0.3788604736328125, -0.35064697265625, -0.3224334716796875, -0.294219970703125, -0.2660064697265625, -0.23779296875, -0.2095794677734375, -0.181365966796875, -0.1531524658203125, -0.12493896484375, -0.0967254638671875, -0.068511962890625, -0.0402984619140625, -0.0120849609375, 0.0161285400390625, 0.044342041015625, 0.0725555419921875, 0.10076904296875, 0.1289825439453125, 0.157196044921875, 0.1854095458984375, 0.213623046875, 0.2418365478515625, 0.270050048828125, 0.2982635498046875, 0.32647705078125, 0.3546905517578125, 0.382904052734375, 0.4111175537109375, 0.4393310546875, 0.4675445556640625, 0.495758056640625, 0.5239715576171875, 0.55218505859375, 0.5803985595703125, 0.608612060546875, 0.6368255615234375, 0.6650390625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 7.0, 4.0, 9.0, 11.0, 13.0, 11.0, 18.0, 24.0, 21.0, 40.0, 36.0, 33.0, 54.0, 51.0, 40.0, 52.0, 43.0, 51.0, 49.0, 49.0, 50.0, 37.0, 43.0, 41.0, 43.0, 26.0, 31.0, 19.0, 25.0, 16.0, 11.0, 5.0, 10.0, 12.0, 1.0, 5.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53515625, -0.5177001953125, -0.500244140625, -0.4827880859375, -0.46533203125, -0.4478759765625, -0.430419921875, -0.4129638671875, -0.3955078125, -0.3780517578125, -0.360595703125, -0.3431396484375, -0.32568359375, -0.3082275390625, -0.290771484375, -0.2733154296875, -0.255859375, -0.2384033203125, -0.220947265625, -0.2034912109375, -0.18603515625, -0.1685791015625, -0.151123046875, -0.1336669921875, -0.1162109375, -0.0987548828125, -0.081298828125, -0.0638427734375, -0.04638671875, -0.0289306640625, -0.011474609375, 0.0059814453125, 0.0234375, 0.0408935546875, 0.058349609375, 0.0758056640625, 0.09326171875, 0.1107177734375, 0.128173828125, 0.1456298828125, 0.1630859375, 0.1805419921875, 0.197998046875, 0.2154541015625, 0.23291015625, 0.2503662109375, 0.267822265625, 0.2852783203125, 0.302734375, 0.3201904296875, 0.337646484375, 0.3551025390625, 0.37255859375, 0.3900146484375, 0.407470703125, 0.4249267578125, 0.4423828125, 0.4598388671875, 0.477294921875, 0.4947509765625, 0.51220703125, 0.5296630859375, 0.547119140625, 0.5645751953125, 0.58203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 7.0, 18.0, 16.0, 31.0, 43.0, 41.0, 86.0, 88.0, 139.0, 205.0, 418.0, 693.0, 1501.0, 3946.0, 14618.0, 78245.0, 718292.0, 189735.0, 29236.0, 6653.0, 2240.0, 922.0, 489.0, 296.0, 171.0, 109.0, 99.0, 62.0, 26.0, 32.0, 16.0, 14.0, 13.0, 11.0, 8.0, 4.0, 9.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.166015625, -1.1292572021484375, -1.092498779296875, -1.0557403564453125, -1.01898193359375, -0.9822235107421875, -0.945465087890625, -0.9087066650390625, -0.8719482421875, -0.8351898193359375, -0.798431396484375, -0.7616729736328125, -0.72491455078125, -0.6881561279296875, -0.651397705078125, -0.6146392822265625, -0.577880859375, -0.5411224365234375, -0.504364013671875, -0.4676055908203125, -0.43084716796875, -0.3940887451171875, -0.357330322265625, -0.3205718994140625, -0.2838134765625, -0.2470550537109375, -0.210296630859375, -0.1735382080078125, -0.13677978515625, -0.1000213623046875, -0.063262939453125, -0.0265045166015625, 0.01025390625, 0.0470123291015625, 0.083770751953125, 0.1205291748046875, 0.15728759765625, 0.1940460205078125, 0.230804443359375, 0.2675628662109375, 0.3043212890625, 0.3410797119140625, 0.377838134765625, 0.4145965576171875, 0.45135498046875, 0.4881134033203125, 0.524871826171875, 0.5616302490234375, 0.598388671875, 0.6351470947265625, 0.671905517578125, 0.7086639404296875, 0.74542236328125, 0.7821807861328125, 0.818939208984375, 0.8556976318359375, 0.8924560546875, 0.9292144775390625, 0.965972900390625, 1.0027313232421875, 1.03948974609375, 1.0762481689453125, 1.113006591796875, 1.1497650146484375, 1.1865234375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 12.0, 5.0, 6.0, 11.0, 18.0, 14.0, 35.0, 36.0, 45.0, 40.0, 49.0, 62.0, 83.0, 63.0, 66.0, 77.0, 46.0, 74.0, 51.0, 39.0, 45.0, 20.0, 21.0, 14.0, 17.0, 9.0, 13.0, 10.0, 6.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.92578125, -2.84552001953125, -2.7652587890625, -2.68499755859375, -2.604736328125, -2.52447509765625, -2.4442138671875, -2.36395263671875, -2.28369140625, -2.20343017578125, -2.1231689453125, -2.04290771484375, -1.962646484375, -1.88238525390625, -1.8021240234375, -1.72186279296875, -1.6416015625, -1.56134033203125, -1.4810791015625, -1.40081787109375, -1.320556640625, -1.24029541015625, -1.1600341796875, -1.07977294921875, -0.99951171875, -0.91925048828125, -0.8389892578125, -0.75872802734375, -0.678466796875, -0.59820556640625, -0.5179443359375, -0.43768310546875, -0.357421875, -0.27716064453125, -0.1968994140625, -0.11663818359375, -0.036376953125, 0.04388427734375, 0.1241455078125, 0.20440673828125, 0.28466796875, 0.36492919921875, 0.4451904296875, 0.52545166015625, 0.605712890625, 0.68597412109375, 0.7662353515625, 0.84649658203125, 0.9267578125, 1.00701904296875, 1.0872802734375, 1.16754150390625, 1.247802734375, 1.32806396484375, 1.4083251953125, 1.48858642578125, 1.56884765625, 1.64910888671875, 1.7293701171875, 1.80963134765625, 1.889892578125, 1.97015380859375, 2.0504150390625, 2.13067626953125, 2.2109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 12.0, 9.0, 22.0, 31.0, 49.0, 73.0, 105.0, 193.0, 363.0, 718.0, 1726.0, 4165.0, 12918.0, 55637.0, 709773.0, 215931.0, 32677.0, 8674.0, 2968.0, 1221.0, 561.0, 298.0, 167.0, 104.0, 53.0, 35.0, 14.0, 17.0, 10.0, 12.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44189453125, -0.42601776123046875, -0.4101409912109375, -0.39426422119140625, -0.378387451171875, -0.36251068115234375, -0.3466339111328125, -0.33075714111328125, -0.31488037109375, -0.29900360107421875, -0.2831268310546875, -0.26725006103515625, -0.251373291015625, -0.23549652099609375, -0.2196197509765625, -0.20374298095703125, -0.1878662109375, -0.17198944091796875, -0.1561126708984375, -0.14023590087890625, -0.124359130859375, -0.10848236083984375, -0.0926055908203125, -0.07672882080078125, -0.06085205078125, -0.04497528076171875, -0.0290985107421875, -0.01322174072265625, 0.002655029296875, 0.01853179931640625, 0.0344085693359375, 0.05028533935546875, 0.066162109375, 0.08203887939453125, 0.0979156494140625, 0.11379241943359375, 0.129669189453125, 0.14554595947265625, 0.1614227294921875, 0.17729949951171875, 0.19317626953125, 0.20905303955078125, 0.2249298095703125, 0.24080657958984375, 0.256683349609375, 0.27256011962890625, 0.2884368896484375, 0.30431365966796875, 0.3201904296875, 0.33606719970703125, 0.3519439697265625, 0.36782073974609375, 0.383697509765625, 0.39957427978515625, 0.4154510498046875, 0.43132781982421875, 0.44720458984375, 0.46308135986328125, 0.4789581298828125, 0.49483489990234375, 0.510711669921875, 0.5265884399414062, 0.5424652099609375, 0.5583419799804688, 0.57421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 4.0, 5.0, 5.0, 9.0, 8.0, 15.0, 21.0, 11.0, 20.0, 35.0, 48.0, 76.0, 132.0, 152.0, 151.0, 84.0, 54.0, 38.0, 32.0, 21.0, 12.0, 4.0, 7.0, 12.0, 6.0, 5.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00013518333435058594, -0.00013026967644691467, -0.0001253560185432434, -0.00012044236063957214, -0.00011552870273590088, -0.00011061504483222961, -0.00010570138692855835, -0.00010078772902488708, -9.587407112121582e-05, -9.096041321754456e-05, -8.604675531387329e-05, -8.113309741020203e-05, -7.621943950653076e-05, -7.13057816028595e-05, -6.639212369918823e-05, -6.147846579551697e-05, -5.65648078918457e-05, -5.165114998817444e-05, -4.6737492084503174e-05, -4.182383418083191e-05, -3.6910176277160645e-05, -3.199651837348938e-05, -2.7082860469818115e-05, -2.216920256614685e-05, -1.7255544662475586e-05, -1.2341886758804321e-05, -7.428228855133057e-06, -2.514570951461792e-06, 2.3990869522094727e-06, 7.312744855880737e-06, 1.2226402759552002e-05, 1.7140060663223267e-05, 2.205371856689453e-05, 2.6967376470565796e-05, 3.188103437423706e-05, 3.6794692277908325e-05, 4.170835018157959e-05, 4.6622008085250854e-05, 5.153566598892212e-05, 5.6449323892593384e-05, 6.136298179626465e-05, 6.627663969993591e-05, 7.119029760360718e-05, 7.610395550727844e-05, 8.101761341094971e-05, 8.593127131462097e-05, 9.084492921829224e-05, 9.57585871219635e-05, 0.00010067224502563477, 0.00010558590292930603, 0.0001104995608329773, 0.00011541321873664856, 0.00012032687664031982, 0.0001252405345439911, 0.00013015419244766235, 0.00013506785035133362, 0.00013998150825500488, 0.00014489516615867615, 0.0001498088240623474, 0.00015472248196601868, 0.00015963613986968994, 0.0001645497977733612, 0.00016946345567703247, 0.00017437711358070374, 0.000179290771484375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 16.0, 24.0, 41.0, 51.0, 98.0, 186.0, 335.0, 708.0, 1705.0, 4915.0, 19365.0, 108244.0, 784902.0, 101452.0, 18518.0, 4832.0, 1684.0, 678.0, 330.0, 156.0, 115.0, 54.0, 40.0, 28.0, 13.0, 12.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6064453125, -0.5888595581054688, -0.5712738037109375, -0.5536880493164062, -0.536102294921875, -0.5185165405273438, -0.5009307861328125, -0.48334503173828125, -0.46575927734375, -0.44817352294921875, -0.4305877685546875, -0.41300201416015625, -0.395416259765625, -0.37783050537109375, -0.3602447509765625, -0.34265899658203125, -0.3250732421875, -0.30748748779296875, -0.2899017333984375, -0.27231597900390625, -0.254730224609375, -0.23714447021484375, -0.2195587158203125, -0.20197296142578125, -0.18438720703125, -0.16680145263671875, -0.1492156982421875, -0.13162994384765625, -0.114044189453125, -0.09645843505859375, -0.0788726806640625, -0.06128692626953125, -0.043701171875, -0.02611541748046875, -0.0085296630859375, 0.00905609130859375, 0.026641845703125, 0.04422760009765625, 0.0618133544921875, 0.07939910888671875, 0.09698486328125, 0.11457061767578125, 0.1321563720703125, 0.14974212646484375, 0.167327880859375, 0.18491363525390625, 0.2024993896484375, 0.22008514404296875, 0.2376708984375, 0.25525665283203125, 0.2728424072265625, 0.29042816162109375, 0.308013916015625, 0.32559967041015625, 0.3431854248046875, 0.36077117919921875, 0.37835693359375, 0.39594268798828125, 0.4135284423828125, 0.43111419677734375, 0.448699951171875, 0.46628570556640625, 0.4838714599609375, 0.5014572143554688, 0.51904296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 3.0, 9.0, 7.0, 9.0, 17.0, 17.0, 17.0, 25.0, 25.0, 31.0, 61.0, 73.0, 83.0, 114.0, 124.0, 85.0, 74.0, 37.0, 29.0, 29.0, 25.0, 26.0, 20.0, 10.0, 12.0, 8.0, 5.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3844947814941406, -0.37201690673828125, -0.3595390319824219, -0.3470611572265625, -0.3345832824707031, -0.32210540771484375, -0.3096275329589844, -0.297149658203125, -0.2846717834472656, -0.27219390869140625, -0.2597160339355469, -0.2472381591796875, -0.23476028442382812, -0.22228240966796875, -0.20980453491210938, -0.19732666015625, -0.18484878540039062, -0.17237091064453125, -0.15989303588867188, -0.1474151611328125, -0.13493728637695312, -0.12245941162109375, -0.10998153686523438, -0.097503662109375, -0.08502578735351562, -0.07254791259765625, -0.060070037841796875, -0.0475921630859375, -0.035114288330078125, -0.02263641357421875, -0.010158538818359375, 0.0023193359375, 0.014797210693359375, 0.02727508544921875, 0.039752960205078125, 0.0522308349609375, 0.06470870971679688, 0.07718658447265625, 0.08966445922851562, 0.102142333984375, 0.11462020874023438, 0.12709808349609375, 0.13957595825195312, 0.1520538330078125, 0.16453170776367188, 0.17700958251953125, 0.18948745727539062, 0.20196533203125, 0.21444320678710938, 0.22692108154296875, 0.23939895629882812, 0.2518768310546875, 0.2643547058105469, 0.27683258056640625, 0.2893104553222656, 0.301788330078125, 0.3142662048339844, 0.32674407958984375, 0.3392219543457031, 0.3516998291015625, 0.3641777038574219, 0.37665557861328125, 0.3891334533691406, 0.401611328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 19.0, 21.0, 55.0, 115.0, 341.0, 278.0, 97.0, 36.0, 14.0, 7.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.030405044555664, -14.528647422790527, -14.02688980102539, -13.525132179260254, -13.023374557495117, -12.52161693572998, -12.019859313964844, -11.518101692199707, -11.01634407043457, -10.514586448669434, -10.012828826904297, -9.51107120513916, -9.009313583374023, -8.507555961608887, -8.00579833984375, -7.504040718078613, -7.002283096313477, -6.50052547454834, -5.998767852783203, -5.497010231018066, -4.99525260925293, -4.493494987487793, -3.9917373657226562, -3.4899797439575195, -2.988222122192383, -2.486464500427246, -1.9847068786621094, -1.4829492568969727, -0.9811916351318359, -0.4794340133666992, 0.0223236083984375, 0.5240812301635742, 1.025838851928711, 1.5275964736938477, 2.0293540954589844, 2.531111717224121, 3.032869338989258, 3.5346269607543945, 4.036384582519531, 4.538142204284668, 5.039899826049805, 5.541657447814941, 6.043415069580078, 6.545172691345215, 7.046930313110352, 7.548687934875488, 8.050445556640625, 8.552203178405762, 9.053960800170898, 9.555718421936035, 10.057476043701172, 10.559233665466309, 11.060991287231445, 11.562748908996582, 12.064506530761719, 12.566264152526855, 13.068021774291992, 13.569779396057129, 14.071537017822266, 14.573294639587402, 15.075052261352539, 15.576809883117676, 16.078567504882812, 16.580326080322266, 17.082082748413086]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 3.0, 0.0, 8.0, 10.0, 12.0, 8.0, 9.0, 16.0, 16.0, 19.0, 26.0, 30.0, 23.0, 39.0, 25.0, 34.0, 64.0, 84.0, 92.0, 106.0, 63.0, 39.0, 36.0, 36.0, 25.0, 21.0, 22.0, 21.0, 23.0, 22.0, 12.0, 16.0, 7.0, 10.0, 7.0, 4.0, 4.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.074525833129883, -8.826263427734375, -8.578001976013184, -8.329739570617676, -8.081477165222168, -7.833215236663818, -7.5849528312683105, -7.336690902709961, -7.088428497314453, -6.8401665687561035, -6.591904163360596, -6.343642234802246, -6.095379829406738, -5.847117900848389, -5.598855495452881, -5.350593566894531, -5.102331161499023, -4.854069232940674, -4.605806827545166, -4.357544898986816, -4.109282493591309, -3.861020565032959, -3.612758159637451, -3.3644962310791016, -3.116234302520752, -2.8679721355438232, -2.6197099685668945, -2.371447801589966, -2.123185634613037, -1.874923586845398, -1.6266614198684692, -1.3783992528915405, -1.1301369667053223, -0.8818747997283936, -0.6336126327514648, -0.3853505253791809, -0.1370883584022522, 0.11117374897003174, 0.35943591594696045, 0.6076980829238892, 0.8559602499008179, 1.1042224168777466, 1.3524845838546753, 1.6007466316223145, 1.8490087985992432, 2.097270965576172, 2.3455331325531006, 2.5937952995300293, 2.842057466506958, 3.0903196334838867, 3.3385818004608154, 3.586843967437744, 3.835106134414673, 4.083368301391602, 4.331630229949951, 4.579892635345459, 4.828154563903809, 5.076416492462158, 5.324678897857666, 5.572940826416016, 5.821203231811523, 6.069465160369873, 6.317727565765381, 6.5659894943237305, 6.814251899719238]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 9.0, 7.0, 6.0, 21.0, 36.0, 63.0, 109.0, 164.0, 310.0, 693.0, 1539.0, 3948.0, 12174.0, 56736.0, 537901.0, 2726744.0, 760996.0, 71721.0, 13838.0, 4100.0, 1654.0, 697.0, 352.0, 184.0, 103.0, 71.0, 45.0, 16.0, 15.0, 8.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.42578125, -1.3845367431640625, -1.343292236328125, -1.3020477294921875, -1.26080322265625, -1.2195587158203125, -1.178314208984375, -1.1370697021484375, -1.0958251953125, -1.0545806884765625, -1.013336181640625, -0.9720916748046875, -0.93084716796875, -0.8896026611328125, -0.848358154296875, -0.8071136474609375, -0.765869140625, -0.7246246337890625, -0.683380126953125, -0.6421356201171875, -0.60089111328125, -0.5596466064453125, -0.518402099609375, -0.4771575927734375, -0.4359130859375, -0.3946685791015625, -0.353424072265625, -0.3121795654296875, -0.27093505859375, -0.2296905517578125, -0.188446044921875, -0.1472015380859375, -0.10595703125, -0.0647125244140625, -0.023468017578125, 0.0177764892578125, 0.05902099609375, 0.1002655029296875, 0.141510009765625, 0.1827545166015625, 0.2239990234375, 0.2652435302734375, 0.306488037109375, 0.3477325439453125, 0.38897705078125, 0.4302215576171875, 0.471466064453125, 0.5127105712890625, 0.553955078125, 0.5951995849609375, 0.636444091796875, 0.6776885986328125, 0.71893310546875, 0.7601776123046875, 0.801422119140625, 0.8426666259765625, 0.8839111328125, 0.9251556396484375, 0.966400146484375, 1.0076446533203125, 1.04888916015625, 1.0901336669921875, 1.131378173828125, 1.1726226806640625, 1.2138671875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 12.0, 16.0, 12.0, 21.0, 31.0, 31.0, 49.0, 50.0, 54.0, 70.0, 61.0, 48.0, 60.0, 69.0, 60.0, 62.0, 48.0, 45.0, 33.0, 31.0, 38.0, 18.0, 20.0, 15.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5205078125, -0.4998321533203125, -0.479156494140625, -0.4584808349609375, -0.43780517578125, -0.4171295166015625, -0.396453857421875, -0.3757781982421875, -0.3551025390625, -0.3344268798828125, -0.313751220703125, -0.2930755615234375, -0.27239990234375, -0.2517242431640625, -0.231048583984375, -0.2103729248046875, -0.189697265625, -0.1690216064453125, -0.148345947265625, -0.1276702880859375, -0.10699462890625, -0.0863189697265625, -0.065643310546875, -0.0449676513671875, -0.0242919921875, -0.0036163330078125, 0.017059326171875, 0.0377349853515625, 0.05841064453125, 0.0790863037109375, 0.099761962890625, 0.1204376220703125, 0.14111328125, 0.1617889404296875, 0.182464599609375, 0.2031402587890625, 0.22381591796875, 0.2444915771484375, 0.265167236328125, 0.2858428955078125, 0.3065185546875, 0.3271942138671875, 0.347869873046875, 0.3685455322265625, 0.38922119140625, 0.4098968505859375, 0.430572509765625, 0.4512481689453125, 0.471923828125, 0.4925994873046875, 0.513275146484375, 0.5339508056640625, 0.55462646484375, 0.5753021240234375, 0.595977783203125, 0.6166534423828125, 0.6373291015625, 0.6580047607421875, 0.678680419921875, 0.6993560791015625, 0.72003173828125, 0.7407073974609375, 0.761383056640625, 0.7820587158203125, 0.802734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 3.0, 12.0, 18.0, 34.0, 34.0, 79.0, 137.0, 297.0, 698.0, 1968.0, 12655.0, 3932137.0, 238527.0, 5377.0, 1299.0, 485.0, 228.0, 120.0, 60.0, 45.0, 19.0, 13.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0625, -4.88671875, -4.7109375, -4.53515625, -4.359375, -4.18359375, -4.0078125, -3.83203125, -3.65625, -3.48046875, -3.3046875, -3.12890625, -2.953125, -2.77734375, -2.6015625, -2.42578125, -2.25, -2.07421875, -1.8984375, -1.72265625, -1.546875, -1.37109375, -1.1953125, -1.01953125, -0.84375, -0.66796875, -0.4921875, -0.31640625, -0.140625, 0.03515625, 0.2109375, 0.38671875, 0.5625, 0.73828125, 0.9140625, 1.08984375, 1.265625, 1.44140625, 1.6171875, 1.79296875, 1.96875, 2.14453125, 2.3203125, 2.49609375, 2.671875, 2.84765625, 3.0234375, 3.19921875, 3.375, 3.55078125, 3.7265625, 3.90234375, 4.078125, 4.25390625, 4.4296875, 4.60546875, 4.78125, 4.95703125, 5.1328125, 5.30859375, 5.484375, 5.66015625, 5.8359375, 6.01171875, 6.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 16.0, 17.0, 28.0, 72.0, 121.0, 221.0, 456.0, 873.0, 980.0, 623.0, 319.0, 144.0, 85.0, 55.0, 24.0, 14.0, 8.0, 10.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.0, -3.90032958984375, -3.8006591796875, -3.70098876953125, -3.601318359375, -3.50164794921875, -3.4019775390625, -3.30230712890625, -3.20263671875, -3.10296630859375, -3.0032958984375, -2.90362548828125, -2.803955078125, -2.70428466796875, -2.6046142578125, -2.50494384765625, -2.4052734375, -2.30560302734375, -2.2059326171875, -2.10626220703125, -2.006591796875, -1.90692138671875, -1.8072509765625, -1.70758056640625, -1.60791015625, -1.50823974609375, -1.4085693359375, -1.30889892578125, -1.209228515625, -1.10955810546875, -1.0098876953125, -0.91021728515625, -0.810546875, -0.71087646484375, -0.6112060546875, -0.51153564453125, -0.411865234375, -0.31219482421875, -0.2125244140625, -0.11285400390625, -0.01318359375, 0.08648681640625, 0.1861572265625, 0.28582763671875, 0.385498046875, 0.48516845703125, 0.5848388671875, 0.68450927734375, 0.7841796875, 0.88385009765625, 0.9835205078125, 1.08319091796875, 1.182861328125, 1.28253173828125, 1.3822021484375, 1.48187255859375, 1.58154296875, 1.68121337890625, 1.7808837890625, 1.88055419921875, 1.980224609375, 2.07989501953125, 2.1795654296875, 2.27923583984375, 2.37890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 4.0, 10.0, 17.0, 24.0, 48.0, 84.0, 125.0, 166.0, 167.0, 115.0, 77.0, 34.0, 34.0, 18.0, 15.0, 10.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.069948196411133, -18.429033279418945, -17.788118362426758, -17.147201538085938, -16.50628662109375, -15.865371704101562, -15.224456787109375, -14.583541870117188, -13.942625999450684, -13.301711082458496, -12.660795211791992, -12.019880294799805, -11.378965377807617, -10.738049507141113, -10.097134590148926, -9.456218719482422, -8.815303802490234, -8.174388885498047, -7.533473014831543, -6.8925580978393555, -6.25164270401001, -5.610727310180664, -4.969812393188477, -4.328896999359131, -3.687981605529785, -3.0470662117004395, -2.406151056289673, -1.7652357816696167, -1.1243205070495605, -0.48340511322021484, 0.15751004219055176, 0.7984251976013184, 1.4393386840820312, 2.080254077911377, 2.7211692333221436, 3.36208438873291, 4.002999782562256, 4.643915176391602, 5.284830093383789, 5.925745487213135, 6.5666608810424805, 7.207576274871826, 7.848491668701172, 8.48940658569336, 9.130321502685547, 9.77123737335205, 10.412152290344238, 11.053068161010742, 11.69398307800293, 12.334897994995117, 12.975813865661621, 13.616728782653809, 14.257644653320312, 14.8985595703125, 15.539474487304688, 16.180389404296875, 16.821304321289062, 17.46221923828125, 18.103134155273438, 18.744050979614258, 19.384965896606445, 20.025880813598633, 20.66679573059082, 21.307710647583008, 21.948627471923828]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 6.0, 1.0, 6.0, 9.0, 4.0, 10.0, 17.0, 16.0, 21.0, 24.0, 35.0, 32.0, 50.0, 47.0, 45.0, 53.0, 50.0, 54.0, 80.0, 62.0, 58.0, 49.0, 48.0, 33.0, 31.0, 29.0, 30.0, 16.0, 19.0, 14.0, 15.0, 9.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.165694236755371, -12.798726081848145, -12.431757926940918, -12.064789772033691, -11.697822570800781, -11.330854415893555, -10.963886260986328, -10.596918106079102, -10.229949951171875, -9.862981796264648, -9.496013641357422, -9.129045486450195, -8.762077331542969, -8.395110130310059, -8.028141975402832, -7.6611738204956055, -7.294205665588379, -6.927237510681152, -6.560269355773926, -6.193301677703857, -5.826333522796631, -5.459365367889404, -5.092397689819336, -4.725429534912109, -4.358461380004883, -3.9914932250976562, -3.624525308609009, -3.2575573921203613, -2.8905892372131348, -2.523621082305908, -2.1566531658172607, -1.7896852493286133, -1.4227170944213867, -1.0557490587234497, -0.6887810230255127, -0.3218129873275757, 0.04515504837036133, 0.41212308406829834, 0.7790911197662354, 1.1460590362548828, 1.5130271911621094, 1.8799952268600464, 2.2469632625579834, 2.613931179046631, 2.9808993339538574, 3.347867488861084, 3.7148354053497314, 4.081803321838379, 4.4487714767456055, 4.815739631652832, 5.182707786560059, 5.549675464630127, 5.9166436195373535, 6.28361177444458, 6.650579452514648, 7.017547607421875, 7.384515762329102, 7.751483917236328, 8.118452072143555, 8.485420227050781, 8.852388381958008, 9.219355583190918, 9.586323738098145, 9.953291893005371, 10.320260047912598]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 9.0, 12.0, 21.0, 48.0, 52.0, 86.0, 152.0, 232.0, 419.0, 781.0, 1484.0, 3214.0, 7946.0, 23474.0, 95554.0, 581732.0, 258824.0, 50181.0, 14183.0, 5314.0, 2282.0, 1136.0, 567.0, 336.0, 194.0, 94.0, 91.0, 45.0, 27.0, 18.0, 12.0, 5.0, 8.0, 2.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.0166473388671875, -0.982513427734375, -0.9483795166015625, -0.91424560546875, -0.8801116943359375, -0.845977783203125, -0.8118438720703125, -0.7777099609375, -0.7435760498046875, -0.709442138671875, -0.6753082275390625, -0.64117431640625, -0.6070404052734375, -0.572906494140625, -0.5387725830078125, -0.504638671875, -0.4705047607421875, -0.436370849609375, -0.4022369384765625, -0.36810302734375, -0.3339691162109375, -0.299835205078125, -0.2657012939453125, -0.2315673828125, -0.1974334716796875, -0.163299560546875, -0.1291656494140625, -0.09503173828125, -0.0608978271484375, -0.026763916015625, 0.0073699951171875, 0.04150390625, 0.0756378173828125, 0.109771728515625, 0.1439056396484375, 0.17803955078125, 0.2121734619140625, 0.246307373046875, 0.2804412841796875, 0.3145751953125, 0.3487091064453125, 0.382843017578125, 0.4169769287109375, 0.45111083984375, 0.4852447509765625, 0.519378662109375, 0.5535125732421875, 0.587646484375, 0.6217803955078125, 0.655914306640625, 0.6900482177734375, 0.72418212890625, 0.7583160400390625, 0.792449951171875, 0.8265838623046875, 0.8607177734375, 0.8948516845703125, 0.928985595703125, 0.9631195068359375, 0.99725341796875, 1.0313873291015625, 1.065521240234375, 1.0996551513671875, 1.1337890625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 10.0, 7.0, 9.0, 7.0, 4.0, 11.0, 23.0, 17.0, 22.0, 16.0, 35.0, 28.0, 30.0, 27.0, 40.0, 52.0, 40.0, 44.0, 54.0, 38.0, 51.0, 42.0, 49.0, 41.0, 44.0, 39.0, 34.0, 37.0, 33.0, 22.0, 12.0, 15.0, 16.0, 9.0, 7.0, 5.0, 2.0, 13.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65234375, -0.631439208984375, -0.61053466796875, -0.589630126953125, -0.5687255859375, -0.547821044921875, -0.52691650390625, -0.506011962890625, -0.485107421875, -0.464202880859375, -0.44329833984375, -0.422393798828125, -0.4014892578125, -0.380584716796875, -0.35968017578125, -0.338775634765625, -0.31787109375, -0.296966552734375, -0.27606201171875, -0.255157470703125, -0.2342529296875, -0.213348388671875, -0.19244384765625, -0.171539306640625, -0.150634765625, -0.129730224609375, -0.10882568359375, -0.087921142578125, -0.0670166015625, -0.046112060546875, -0.02520751953125, -0.004302978515625, 0.0166015625, 0.037506103515625, 0.05841064453125, 0.079315185546875, 0.1002197265625, 0.121124267578125, 0.14202880859375, 0.162933349609375, 0.183837890625, 0.204742431640625, 0.22564697265625, 0.246551513671875, 0.2674560546875, 0.288360595703125, 0.30926513671875, 0.330169677734375, 0.35107421875, 0.371978759765625, 0.39288330078125, 0.413787841796875, 0.4346923828125, 0.455596923828125, 0.47650146484375, 0.497406005859375, 0.518310546875, 0.539215087890625, 0.56011962890625, 0.581024169921875, 0.6019287109375, 0.622833251953125, 0.64373779296875, 0.664642333984375, 0.685546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 15.0, 11.0, 20.0, 21.0, 29.0, 45.0, 57.0, 115.0, 185.0, 313.0, 554.0, 1388.0, 5695.0, 48909.0, 922499.0, 59140.0, 6485.0, 1522.0, 667.0, 305.0, 169.0, 132.0, 76.0, 53.0, 28.0, 30.0, 27.0, 9.0, 11.0, 7.0, 5.0, 2.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6123046875, -1.557708740234375, -1.50311279296875, -1.448516845703125, -1.3939208984375, -1.339324951171875, -1.28472900390625, -1.230133056640625, -1.175537109375, -1.120941162109375, -1.06634521484375, -1.011749267578125, -0.9571533203125, -0.902557373046875, -0.84796142578125, -0.793365478515625, -0.73876953125, -0.684173583984375, -0.62957763671875, -0.574981689453125, -0.5203857421875, -0.465789794921875, -0.41119384765625, -0.356597900390625, -0.302001953125, -0.247406005859375, -0.19281005859375, -0.138214111328125, -0.0836181640625, -0.029022216796875, 0.02557373046875, 0.080169677734375, 0.134765625, 0.189361572265625, 0.24395751953125, 0.298553466796875, 0.3531494140625, 0.407745361328125, 0.46234130859375, 0.516937255859375, 0.571533203125, 0.626129150390625, 0.68072509765625, 0.735321044921875, 0.7899169921875, 0.844512939453125, 0.89910888671875, 0.953704833984375, 1.00830078125, 1.062896728515625, 1.11749267578125, 1.172088623046875, 1.2266845703125, 1.281280517578125, 1.33587646484375, 1.390472412109375, 1.445068359375, 1.499664306640625, 1.55426025390625, 1.608856201171875, 1.6634521484375, 1.718048095703125, 1.77264404296875, 1.827239990234375, 1.8818359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 4.0, 4.0, 7.0, 4.0, 8.0, 6.0, 7.0, 9.0, 15.0, 16.0, 14.0, 25.0, 26.0, 20.0, 31.0, 49.0, 48.0, 50.0, 69.0, 61.0, 64.0, 70.0, 63.0, 36.0, 41.0, 23.0, 37.0, 29.0, 18.0, 19.0, 17.0, 14.0, 17.0, 13.0, 14.0, 7.0, 9.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.208984375, -2.1353759765625, -2.061767578125, -1.9881591796875, -1.91455078125, -1.8409423828125, -1.767333984375, -1.6937255859375, -1.6201171875, -1.5465087890625, -1.472900390625, -1.3992919921875, -1.32568359375, -1.2520751953125, -1.178466796875, -1.1048583984375, -1.03125, -0.9576416015625, -0.884033203125, -0.8104248046875, -0.73681640625, -0.6632080078125, -0.589599609375, -0.5159912109375, -0.4423828125, -0.3687744140625, -0.295166015625, -0.2215576171875, -0.14794921875, -0.0743408203125, -0.000732421875, 0.0728759765625, 0.146484375, 0.2200927734375, 0.293701171875, 0.3673095703125, 0.44091796875, 0.5145263671875, 0.588134765625, 0.6617431640625, 0.7353515625, 0.8089599609375, 0.882568359375, 0.9561767578125, 1.02978515625, 1.1033935546875, 1.177001953125, 1.2506103515625, 1.32421875, 1.3978271484375, 1.471435546875, 1.5450439453125, 1.61865234375, 1.6922607421875, 1.765869140625, 1.8394775390625, 1.9130859375, 1.9866943359375, 2.060302734375, 2.1339111328125, 2.20751953125, 2.2811279296875, 2.354736328125, 2.4283447265625, 2.501953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 16.0, 24.0, 20.0, 38.0, 59.0, 84.0, 158.0, 300.0, 467.0, 1162.0, 2940.0, 10822.0, 66730.0, 889161.0, 61216.0, 10280.0, 2859.0, 1116.0, 472.0, 250.0, 144.0, 85.0, 45.0, 37.0, 18.0, 16.0, 12.0, 7.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310302734375, -0.300445556640625, -0.29058837890625, -0.280731201171875, -0.2708740234375, -0.261016845703125, -0.25115966796875, -0.241302490234375, -0.2314453125, -0.221588134765625, -0.21173095703125, -0.201873779296875, -0.1920166015625, -0.182159423828125, -0.17230224609375, -0.162445068359375, -0.152587890625, -0.142730712890625, -0.13287353515625, -0.123016357421875, -0.1131591796875, -0.103302001953125, -0.09344482421875, -0.083587646484375, -0.07373046875, -0.063873291015625, -0.05401611328125, -0.044158935546875, -0.0343017578125, -0.024444580078125, -0.01458740234375, -0.004730224609375, 0.005126953125, 0.014984130859375, 0.02484130859375, 0.034698486328125, 0.0445556640625, 0.054412841796875, 0.06427001953125, 0.074127197265625, 0.083984375, 0.093841552734375, 0.10369873046875, 0.113555908203125, 0.1234130859375, 0.133270263671875, 0.14312744140625, 0.152984619140625, 0.162841796875, 0.172698974609375, 0.18255615234375, 0.192413330078125, 0.2022705078125, 0.212127685546875, 0.22198486328125, 0.231842041015625, 0.24169921875, 0.251556396484375, 0.26141357421875, 0.271270751953125, 0.2811279296875, 0.290985107421875, 0.30084228515625, 0.310699462890625, 0.320556640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 12.0, 11.0, 9.0, 14.0, 16.0, 34.0, 40.0, 64.0, 112.0, 141.0, 137.0, 114.0, 71.0, 67.0, 37.0, 22.0, 21.0, 20.0, 12.0, 9.0, 7.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00011909008026123047, -0.00011627189815044403, -0.00011345371603965759, -0.00011063553392887115, -0.00010781735181808472, -0.00010499916970729828, -0.00010218098759651184, -9.93628054857254e-05, -9.654462337493896e-05, -9.372644126415253e-05, -9.090825915336609e-05, -8.809007704257965e-05, -8.527189493179321e-05, -8.245371282100677e-05, -7.963553071022034e-05, -7.68173485994339e-05, -7.399916648864746e-05, -7.118098437786102e-05, -6.836280226707458e-05, -6.554462015628815e-05, -6.272643804550171e-05, -5.990825593471527e-05, -5.709007382392883e-05, -5.4271891713142395e-05, -5.145370960235596e-05, -4.863552749156952e-05, -4.581734538078308e-05, -4.299916326999664e-05, -4.0180981159210205e-05, -3.736279904842377e-05, -3.454461693763733e-05, -3.172643482685089e-05, -2.8908252716064453e-05, -2.6090070605278015e-05, -2.3271888494491577e-05, -2.045370638370514e-05, -1.76355242729187e-05, -1.4817342162132263e-05, -1.1999160051345825e-05, -9.180977940559387e-06, -6.362795829772949e-06, -3.5446137189865112e-06, -7.264316082000732e-07, 2.0917505025863647e-06, 4.909932613372803e-06, 7.72811472415924e-06, 1.0546296834945679e-05, 1.3364478945732117e-05, 1.6182661056518555e-05, 1.9000843167304993e-05, 2.181902527809143e-05, 2.463720738887787e-05, 2.7455389499664307e-05, 3.0273571610450745e-05, 3.309175372123718e-05, 3.590993583202362e-05, 3.872811794281006e-05, 4.1546300053596497e-05, 4.4364482164382935e-05, 4.718266427516937e-05, 5.000084638595581e-05, 5.281902849674225e-05, 5.5637210607528687e-05, 5.8455392718315125e-05, 6.127357482910156e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 10.0, 17.0, 19.0, 26.0, 61.0, 80.0, 150.0, 299.0, 664.0, 1591.0, 4651.0, 21023.0, 227536.0, 757839.0, 26038.0, 5358.0, 1734.0, 704.0, 336.0, 171.0, 103.0, 49.0, 26.0, 20.0, 17.0, 12.0, 4.0, 8.0, 6.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3330078125, -0.32070159912109375, -0.3083953857421875, -0.29608917236328125, -0.283782958984375, -0.27147674560546875, -0.2591705322265625, -0.24686431884765625, -0.23455810546875, -0.22225189208984375, -0.2099456787109375, -0.19763946533203125, -0.185333251953125, -0.17302703857421875, -0.1607208251953125, -0.14841461181640625, -0.1361083984375, -0.12380218505859375, -0.1114959716796875, -0.09918975830078125, -0.086883544921875, -0.07457733154296875, -0.0622711181640625, -0.04996490478515625, -0.03765869140625, -0.02535247802734375, -0.0130462646484375, -0.00074005126953125, 0.011566162109375, 0.02387237548828125, 0.0361785888671875, 0.04848480224609375, 0.060791015625, 0.07309722900390625, 0.0854034423828125, 0.09770965576171875, 0.110015869140625, 0.12232208251953125, 0.1346282958984375, 0.14693450927734375, 0.15924072265625, 0.17154693603515625, 0.1838531494140625, 0.19615936279296875, 0.208465576171875, 0.22077178955078125, 0.2330780029296875, 0.24538421630859375, 0.2576904296875, 0.26999664306640625, 0.2823028564453125, 0.29460906982421875, 0.306915283203125, 0.31922149658203125, 0.3315277099609375, 0.34383392333984375, 0.35614013671875, 0.36844635009765625, 0.3807525634765625, 0.39305877685546875, 0.405364990234375, 0.41767120361328125, 0.4299774169921875, 0.44228363037109375, 0.45458984375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 8.0, 4.0, 1.0, 5.0, 7.0, 7.0, 5.0, 8.0, 9.0, 13.0, 12.0, 24.0, 27.0, 32.0, 51.0, 103.0, 112.0, 120.0, 124.0, 100.0, 60.0, 53.0, 17.0, 13.0, 14.0, 10.0, 8.0, 10.0, 7.0, 8.0, 8.0, 6.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3564453125, -0.3455085754394531, -0.33457183837890625, -0.3236351013183594, -0.3126983642578125, -0.3017616271972656, -0.29082489013671875, -0.2798881530761719, -0.268951416015625, -0.2580146789550781, -0.24707794189453125, -0.23614120483398438, -0.2252044677734375, -0.21426773071289062, -0.20333099365234375, -0.19239425659179688, -0.18145751953125, -0.17052078247070312, -0.15958404541015625, -0.14864730834960938, -0.1377105712890625, -0.12677383422851562, -0.11583709716796875, -0.10490036010742188, -0.093963623046875, -0.08302688598632812, -0.07209014892578125, -0.061153411865234375, -0.0502166748046875, -0.039279937744140625, -0.02834320068359375, -0.017406463623046875, -0.0064697265625, 0.004467010498046875, 0.01540374755859375, 0.026340484619140625, 0.0372772216796875, 0.048213958740234375, 0.05915069580078125, 0.07008743286132812, 0.081024169921875, 0.09196090698242188, 0.10289764404296875, 0.11383438110351562, 0.1247711181640625, 0.13570785522460938, 0.14664459228515625, 0.15758132934570312, 0.16851806640625, 0.17945480346679688, 0.19039154052734375, 0.20132827758789062, 0.2122650146484375, 0.22320175170898438, 0.23413848876953125, 0.24507522583007812, 0.256011962890625, 0.2669486999511719, 0.27788543701171875, 0.2888221740722656, 0.2997589111328125, 0.3106956481933594, 0.32163238525390625, 0.3325691223144531, 0.343505859375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 9.0, 17.0, 32.0, 97.0, 534.0, 189.0, 61.0, 31.0, 11.0, 12.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.681668281555176, -8.128374099731445, -7.575079917907715, -7.021785736083984, -6.468491554260254, -5.915197372436523, -5.361903667449951, -4.808609485626221, -4.25531530380249, -3.7020211219787598, -3.1487269401550293, -2.595432996749878, -2.0421388149261475, -1.488844633102417, -0.9355506896972656, -0.38225650787353516, 0.1710376739501953, 0.724331796169281, 1.2776259183883667, 1.8309199810028076, 2.384214162826538, 2.9375083446502686, 3.49080228805542, 4.04409646987915, 4.597390651702881, 5.150684833526611, 5.703979015350342, 6.257272720336914, 6.8105669021606445, 7.363861083984375, 7.9171552658081055, 8.470449447631836, 9.023744583129883, 9.577038764953613, 10.130332946777344, 10.683627128601074, 11.236921310424805, 11.790215492248535, 12.343509674072266, 12.89680290222168, 13.450098037719727, 14.003392219543457, 14.556686401367188, 15.109980583190918, 15.663274765014648, 16.216567993164062, 16.76986312866211, 17.323156356811523, 17.876449584960938, 18.42974281311035, 18.9830379486084, 19.536331176757812, 20.08962631225586, 20.642919540405273, 21.19621467590332, 21.749507904052734, 22.30280303955078, 22.856096267700195, 23.409391403198242, 23.962684631347656, 24.515979766845703, 25.069272994995117, 25.622568130493164, 26.175861358642578, 26.729156494140625]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 10.0, 9.0, 8.0, 14.0, 12.0, 12.0, 20.0, 13.0, 23.0, 20.0, 30.0, 35.0, 99.0, 177.0, 178.0, 65.0, 42.0, 31.0, 26.0, 28.0, 21.0, 11.0, 18.0, 12.0, 17.0, 15.0, 11.0, 6.0, 0.0, 9.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.77259635925293, -7.521172046661377, -7.269747734069824, -7.0183234214782715, -6.766899108886719, -6.515474796295166, -6.264050483703613, -6.012625694274902, -5.761201858520508, -5.509777545928955, -5.258353233337402, -5.00692892074585, -4.755504608154297, -4.504080295562744, -4.252655982971191, -4.0012311935424805, -3.7498068809509277, -3.498382568359375, -3.2469582557678223, -2.9955339431762695, -2.744109630584717, -2.492685317993164, -2.2412607669830322, -1.9898364543914795, -1.7384121417999268, -1.486987829208374, -1.2355635166168213, -0.984139084815979, -0.7327147722244263, -0.48129045963287354, -0.22986602783203125, 0.021558284759521484, 0.2729825973510742, 0.524406909942627, 0.7758312821388245, 1.027255654335022, 1.2786799669265747, 1.5301042795181274, 1.7815287113189697, 2.0329530239105225, 2.284377336502075, 2.535801649093628, 2.7872259616851807, 3.0386505126953125, 3.2900748252868652, 3.541499137878418, 3.7929234504699707, 4.044347763061523, 4.295772075653076, 4.547196388244629, 4.798620700836182, 5.050045013427734, 5.301469326019287, 5.55289363861084, 5.804318428039551, 6.055742263793945, 6.307167053222656, 6.558591365814209, 6.810015678405762, 7.0614399909973145, 7.312864303588867, 7.56428861618042, 7.815712928771973, 8.067137718200684, 8.318561553955078]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 3.0, 4.0, 8.0, 8.0, 4.0, 8.0, 3.0, 14.0, 12.0, 14.0, 21.0, 12.0, 17.0, 21.0, 31.0, 40.0, 47.0, 79.0, 193.0, 127.0, 55.0, 45.0, 37.0, 24.0, 32.0, 26.0, 18.0, 22.0, 15.0, 8.0, 6.0, 7.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5934066772460938, -0.5720672607421875, -0.5507278442382812, -0.529388427734375, -0.5080490112304688, -0.4867095947265625, -0.46537017822265625, -0.44403076171875, -0.42269134521484375, -0.4013519287109375, -0.38001251220703125, -0.358673095703125, -0.33733367919921875, -0.3159942626953125, -0.29465484619140625, -0.2733154296875, -0.25197601318359375, -0.2306365966796875, -0.20929718017578125, -0.187957763671875, -0.16661834716796875, -0.1452789306640625, -0.12393951416015625, -0.10260009765625, -0.08126068115234375, -0.0599212646484375, -0.03858184814453125, -0.017242431640625, 0.00409698486328125, 0.0254364013671875, 0.04677581787109375, 0.068115234375, 0.08945465087890625, 0.1107940673828125, 0.13213348388671875, 0.153472900390625, 0.17481231689453125, 0.1961517333984375, 0.21749114990234375, 0.23883056640625, 0.26016998291015625, 0.2815093994140625, 0.30284881591796875, 0.324188232421875, 0.34552764892578125, 0.3668670654296875, 0.38820648193359375, 0.4095458984375, 0.43088531494140625, 0.4522247314453125, 0.47356414794921875, 0.494903564453125, 0.5162429809570312, 0.5375823974609375, 0.5589218139648438, 0.58026123046875, 0.6016006469726562, 0.6229400634765625, 0.6442794799804688, 0.665618896484375, 0.6869583129882812, 0.7082977294921875, 0.7296371459960938, 0.7509765625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 8.0, 8.0, 12.0, 9.0, 16.0, 22.0, 36.0, 31.0, 50.0, 72.0, 122.0, 185.0, 398.0, 901.0, 2661.0, 11848.0, 8323144.0, 41706.0, 4697.0, 1341.0, 565.0, 250.0, 161.0, 103.0, 73.0, 34.0, 25.0, 18.0, 11.0, 3.0, 6.0, 4.0, 6.0, 8.0, 6.0, 4.0, 6.0, 3.0, 7.0, 8.0, 7.0, 2.0, 0.0, 2.0], "bins": [-6.44931697845459, -6.273708343505859, -6.098099708557129, -5.92249059677124, -5.74688196182251, -5.571273326873779, -5.395664215087891, -5.22005558013916, -5.04444694519043, -4.868838310241699, -4.693229675292969, -4.51762056350708, -4.34201192855835, -4.166403293609619, -3.9907944202423096, -3.815185546875, -3.6395769119262695, -3.463968276977539, -3.2883594036102295, -3.11275053024292, -2.9371418952941895, -2.761533260345459, -2.5859243869781494, -2.41031551361084, -2.2347068786621094, -2.059098243713379, -1.8834893703460693, -1.7078806161880493, -1.5322718620300293, -1.3566631078720093, -1.1810543537139893, -1.0054455995559692, -0.829836368560791, -0.654227614402771, -0.478618860244751, -0.30301010608673096, -0.12740135192871094, 0.04820740222930908, 0.2238161563873291, 0.3994249105453491, 0.5750336647033691, 0.7506424188613892, 0.9262511730194092, 1.1018599271774292, 1.2774686813354492, 1.4530774354934692, 1.6286861896514893, 1.8042949438095093, 1.9799036979675293, 2.1555123329162598, 2.3311212062835693, 2.506730079650879, 2.6823387145996094, 2.85794734954834, 3.0335562229156494, 3.209165096282959, 3.3847737312316895, 3.56038236618042, 3.7359912395477295, 3.911600112915039, 4.0872087478637695, 4.2628173828125, 4.4384260177612305, 4.614035129547119, 4.78964376449585]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 5.0, 4.0, 3.0, 6.0, 6.0, 4.0, 6.0, 3.0, 8.0, 0.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.366756439208984, -10.04687213897705, -9.726988792419434, -9.4071044921875, -9.087221145629883, -8.76733684539795, -8.447452545166016, -8.127569198608398, -7.807684898376465, -7.4878010749816895, -7.167917251586914, -6.8480329513549805, -6.528149127960205, -6.20826530456543, -5.888381481170654, -5.568497657775879, -5.2486138343811035, -4.928730010986328, -4.608846187591553, -4.288962364196777, -3.9690780639648438, -3.6491942405700684, -3.329310417175293, -3.0094263553619385, -2.689542531967163, -2.3696587085723877, -2.049774646759033, -1.7298908233642578, -1.4100068807601929, -1.090122938156128, -0.7702391147613525, -0.45035505294799805, -0.13047122955322266, 0.1894126832485199, 0.5092965960502625, 0.8291804790496826, 1.1490644216537476, 1.4689483642578125, 1.788832187652588, 2.1087162494659424, 2.4286000728607178, 2.748483896255493, 3.0683679580688477, 3.388251781463623, 3.7081356048583984, 4.028019905090332, 4.347903251647949, 4.667787551879883, 4.987671375274658, 5.307555198669434, 5.627439022064209, 5.947322845458984, 6.267207145690918, 6.587090969085693, 6.906974792480469, 7.226859092712402, 7.5467424392700195, 7.866626262664795, 8.18651008605957, 8.506394386291504, 8.826277732849121, 9.146162033081055, 9.466045379638672, 9.785929679870605, 10.105813980102539]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 5.0, 11.0, 11.0, 14.0, 23.0, 17.0, 31.0, 29.0, 36.0, 44.0, 45.0, 53.0, 56.0, 57.0, 63.0, 59.0, 84.0, 57.0, 53.0, 52.0, 48.0, 33.0, 22.0, 14.0, 17.0, 14.0, 6.0, 3.0, 7.0, 11.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.3558692932128906, -0.34479522705078125, -0.3337211608886719, -0.3226470947265625, -0.3115730285644531, -0.30049896240234375, -0.2894248962402344, -0.278350830078125, -0.2672767639160156, -0.25620269775390625, -0.24512863159179688, -0.2340545654296875, -0.22298049926757812, -0.21190643310546875, -0.20083236694335938, -0.18975830078125, -0.17868423461914062, -0.16761016845703125, -0.15653610229492188, -0.1454620361328125, -0.13438796997070312, -0.12331390380859375, -0.11223983764648438, -0.101165771484375, -0.09009170532226562, -0.07901763916015625, -0.06794357299804688, -0.0568695068359375, -0.045795440673828125, -0.03472137451171875, -0.023647308349609375, -0.0125732421875, -0.001499176025390625, 0.00957489013671875, 0.020648956298828125, 0.0317230224609375, 0.042797088623046875, 0.05387115478515625, 0.06494522094726562, 0.076019287109375, 0.08709335327148438, 0.09816741943359375, 0.10924148559570312, 0.1203155517578125, 0.13138961791992188, 0.14246368408203125, 0.15353775024414062, 0.16461181640625, 0.17568588256835938, 0.18675994873046875, 0.19783401489257812, 0.2089080810546875, 0.21998214721679688, 0.23105621337890625, 0.24213027954101562, 0.253204345703125, 0.2642784118652344, 0.27535247802734375, 0.2864265441894531, 0.2975006103515625, 0.3085746765136719, 0.31964874267578125, 0.3307228088378906, 0.341796875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 8.0, 4.0, 7.0, 20.0, 20.0, 39.0, 64.0, 103.0, 158.0, 337.0, 688.0, 1560.0, 4041.0, 12415.0, 42066.0, 143867.0, 212125.0, 73827.0, 21600.0, 6872.0, 2323.0, 1062.0, 480.0, 249.0, 141.0, 72.0, 48.0, 27.0, 17.0, 8.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3125, -4.14154052734375, -3.9705810546875, -3.79962158203125, -3.628662109375, -3.45770263671875, -3.2867431640625, -3.11578369140625, -2.94482421875, -2.77386474609375, -2.6029052734375, -2.43194580078125, -2.260986328125, -2.09002685546875, -1.9190673828125, -1.74810791015625, -1.5771484375, -1.40618896484375, -1.2352294921875, -1.06427001953125, -0.893310546875, -0.72235107421875, -0.5513916015625, -0.38043212890625, -0.20947265625, -0.03851318359375, 0.1324462890625, 0.30340576171875, 0.474365234375, 0.64532470703125, 0.8162841796875, 0.98724365234375, 1.158203125, 1.32916259765625, 1.5001220703125, 1.67108154296875, 1.842041015625, 2.01300048828125, 2.1839599609375, 2.35491943359375, 2.52587890625, 2.69683837890625, 2.8677978515625, 3.03875732421875, 3.209716796875, 3.38067626953125, 3.5516357421875, 3.72259521484375, 3.8935546875, 4.06451416015625, 4.2354736328125, 4.40643310546875, 4.577392578125, 4.74835205078125, 4.9193115234375, 5.09027099609375, 5.26123046875, 5.43218994140625, 5.6031494140625, 5.77410888671875, 5.945068359375, 6.11602783203125, 6.2869873046875, 6.45794677734375, 6.62890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 6.0, 12.0, 6.0, 10.0, 14.0, 12.0, 17.0, 25.0, 29.0, 29.0, 47.0, 34.0, 43.0, 40.0, 38.0, 72.0, 54.0, 59.0, 52.0, 64.0, 47.0, 36.0, 42.0, 28.0, 32.0, 25.0, 19.0, 16.0, 12.0, 14.0, 13.0, 7.0, 9.0, 2.0, 8.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.640625, -0.6211013793945312, -0.6015777587890625, -0.5820541381835938, -0.562530517578125, -0.5430068969726562, -0.5234832763671875, -0.5039596557617188, -0.48443603515625, -0.46491241455078125, -0.4453887939453125, -0.42586517333984375, -0.406341552734375, -0.38681793212890625, -0.3672943115234375, -0.34777069091796875, -0.3282470703125, -0.30872344970703125, -0.2891998291015625, -0.26967620849609375, -0.250152587890625, -0.23062896728515625, -0.2111053466796875, -0.19158172607421875, -0.17205810546875, -0.15253448486328125, -0.1330108642578125, -0.11348724365234375, -0.093963623046875, -0.07444000244140625, -0.0549163818359375, -0.03539276123046875, -0.015869140625, 0.00365447998046875, 0.0231781005859375, 0.04270172119140625, 0.062225341796875, 0.08174896240234375, 0.1012725830078125, 0.12079620361328125, 0.14031982421875, 0.15984344482421875, 0.1793670654296875, 0.19889068603515625, 0.218414306640625, 0.23793792724609375, 0.2574615478515625, 0.27698516845703125, 0.2965087890625, 0.31603240966796875, 0.3355560302734375, 0.35507965087890625, 0.374603271484375, 0.39412689208984375, 0.4136505126953125, 0.43317413330078125, 0.45269775390625, 0.47222137451171875, 0.4917449951171875, 0.5112686157226562, 0.530792236328125, 0.5503158569335938, 0.5698394775390625, 0.5893630981445312, 0.60888671875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 8.0, 17.0, 39.0, 55.0, 118.0, 95.0, 66.0, 23.0, 8.0, 15.0, 11.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7005462646484375, -6.4761152267456055, -6.251684188842773, -6.027253150939941, -5.802822113037109, -5.578391075134277, -5.353960037231445, -5.129528999328613, -4.905097961425781, -4.680666923522949, -4.456235885620117, -4.231804847717285, -4.007373809814453, -3.782942771911621, -3.55851149559021, -3.334080457687378, -3.109649181365967, -2.8852181434631348, -2.6607871055603027, -2.4363560676574707, -2.2119250297546387, -1.987493872642517, -1.7630627155303955, -1.5386316776275635, -1.3142006397247314, -1.0897696018218994, -0.8653385043144226, -0.6409074068069458, -0.41647636890411377, -0.19204533100128174, 0.032385826110839844, 0.2568168640136719, 0.4812483787536621, 0.7056794166564941, 0.930110514163971, 1.1545416116714478, 1.3789726495742798, 1.6034036874771118, 1.8278348445892334, 2.0522658824920654, 2.2766969203948975, 2.5011279582977295, 2.7255589962005615, 2.9499902725219727, 3.1744213104248047, 3.3988523483276367, 3.6232833862304688, 3.847714424133301, 4.072145462036133, 4.296576499938965, 4.521007537841797, 4.745438575744629, 4.969869613647461, 5.194300651550293, 5.418731689453125, 5.643162727355957, 5.867593765258789, 6.092024803161621, 6.316455841064453, 6.540886878967285, 6.765317916870117, 6.989748954772949, 7.214179992675781, 7.438611030578613, 7.6630425453186035]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 8.0, 4.0, 2.0, 4.0, 4.0, 5.0, 13.0, 12.0, 16.0, 20.0, 54.0, 74.0, 60.0, 39.0, 45.0, 32.0, 23.0, 16.0, 4.0, 5.0, 3.0, 5.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-3.672778606414795, -3.5743768215179443, -3.4759747982025146, -3.377573013305664, -3.2791709899902344, -3.180769205093384, -3.082367420196533, -2.9839653968811035, -2.885563611984253, -2.7871618270874023, -2.6887598037719727, -2.590358018875122, -2.4919559955596924, -2.393554210662842, -2.295152187347412, -2.1967504024505615, -2.098348617553711, -1.9999467134475708, -1.9015448093414307, -1.80314302444458, -1.70474112033844, -1.6063392162322998, -1.5079373121261597, -1.4095354080200195, -1.3111333847045898, -1.2127314805984497, -1.1143295764923096, -1.015927791595459, -0.9175258874893188, -0.8191239833831787, -0.7207220792770386, -0.6223202347755432, -0.5239183902740479, -0.4255165159702301, -0.32711464166641235, -0.22871273756027222, -0.13031086325645447, -0.03190898895263672, 0.06649291515350342, 0.16489475965499878, 0.2632966637611389, 0.36169853806495667, 0.4601004123687744, 0.5585023164749146, 0.6569042205810547, 0.75530606508255, 0.8537079691886902, 0.9521098136901855, 1.0505117177963257, 1.1489136219024658, 1.247315526008606, 1.345717430114746, 1.4441192150115967, 1.5425211191177368, 1.640923023223877, 1.7393248081207275, 1.8377268314361572, 1.9361287355422974, 2.0345306396484375, 2.132932424545288, 2.2313344478607178, 2.3297362327575684, 2.428138256072998, 2.5265400409698486, 2.624941825866699]}, "eval/loss": 4.055415153503418, "eval/wer": 1.7872867909559698, "eval/runtime": 1259.0833, "eval/samples_per_second": 2.098, "eval/steps_per_second": 0.263} \ No newline at end of file